diff --git a/.actions/assistant.py b/.actions/assistant.py new file mode 100644 index 0000000..bd134e2 --- /dev/null +++ b/.actions/assistant.py @@ -0,0 +1,474 @@ +# Copyright The Lightning AI team. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. +import glob +import logging +import os +import pathlib +import re +import shutil +import tarfile +import tempfile +import urllib.request +from distutils.version import LooseVersion +from itertools import chain +from os.path import dirname, isfile +from pathlib import Path +from typing import Any, Dict, Iterable, Iterator, List, Optional, Sequence, Tuple, Union + +from pkg_resources import parse_requirements, Requirement, yield_lines + +REQUIREMENT_FILES = { + "pytorch": ( + "requirements/pytorch/base.txt", + "requirements/pytorch/extra.txt", + "requirements/pytorch/strategies.txt", + "requirements/pytorch/examples.txt", + ), + "app": ( + "requirements/app/base.txt", + "requirements/app/ui.txt", + "requirements/app/cloud.txt", + ), + "fabric": ( + "requirements/fabric/base.txt", + "requirements/fabric/strategies.txt", + ), + "data": ( + "requirements/data/data.txt", + "requirements/data/cloud.txt", + "requirements/data/examples.txt", + ), +} +REQUIREMENT_FILES_ALL = list(chain(*REQUIREMENT_FILES.values())) + +_PROJECT_ROOT = os.path.dirname(os.path.dirname(__file__)) + + +class _RequirementWithComment(Requirement): + strict_string = "# strict" + + def __init__(self, *args: Any, comment: str = "", pip_argument: Optional[str] = 
None, **kwargs: Any) -> None: + super().__init__(*args, **kwargs) + self.comment = comment + assert pip_argument is None or pip_argument # sanity check that it's not an empty str + self.pip_argument = pip_argument + self.strict = self.strict_string in comment.lower() + + def adjust(self, unfreeze: str) -> str: + """Remove version restrictions unless they are strict. + + >>> _RequirementWithComment("arrow<=1.2.2,>=1.2.0", comment="# anything").adjust("none") + 'arrow<=1.2.2,>=1.2.0' + >>> _RequirementWithComment("arrow<=1.2.2,>=1.2.0", comment="# strict").adjust("none") + 'arrow<=1.2.2,>=1.2.0 # strict' + >>> _RequirementWithComment("arrow<=1.2.2,>=1.2.0", comment="# my name").adjust("all") + 'arrow>=1.2.0' + >>> _RequirementWithComment("arrow>=1.2.0, <=1.2.2", comment="# strict").adjust("all") + 'arrow<=1.2.2,>=1.2.0 # strict' + >>> _RequirementWithComment("arrow").adjust("all") + 'arrow' + >>> _RequirementWithComment("arrow>=1.2.0, <=1.2.2", comment="# cool").adjust("major") + 'arrow<2.0,>=1.2.0' + >>> _RequirementWithComment("arrow>=1.2.0, <=1.2.2", comment="# strict").adjust("major") + 'arrow<=1.2.2,>=1.2.0 # strict' + >>> _RequirementWithComment("arrow>=1.2.0").adjust("major") + 'arrow>=1.2.0' + >>> _RequirementWithComment("arrow").adjust("major") + 'arrow' + """ + out = str(self) + if self.strict: + return f"{out} {self.strict_string}" + if unfreeze == "major": + for operator, version in self.specs: + if operator in ("<", "<="): + major = LooseVersion(version).version[0] + # replace upper bound with major version increased by one + return out.replace(f"{operator}{version}", f"<{major + 1}.0") + elif unfreeze == "all": + for operator, version in self.specs: + if operator in ("<", "<="): + # drop upper bound + return out.replace(f"{operator}{version},", "") + elif unfreeze != "none": + raise ValueError(f"Unexpected unfreeze: {unfreeze!r} value.") + return out + + +def _parse_requirements(strs: Union[str, Iterable[str]]) -> Iterator[_RequirementWithComment]: + 
"""Adapted from `pkg_resources.parse_requirements` to include comments. + + >>> txt = ['# ignored', '', 'this # is an', '--piparg', 'example', 'foo # strict', 'thing', '-r different/file.txt'] + >>> [r.adjust('none') for r in _parse_requirements(txt)] + ['this', 'example', 'foo # strict', 'thing'] + >>> txt = '\\n'.join(txt) + >>> [r.adjust('none') for r in _parse_requirements(txt)] + ['this', 'example', 'foo # strict', 'thing'] + """ + lines = yield_lines(strs) + pip_argument = None + for line in lines: + # Drop comments -- a hash without a space may be in a URL. + if " #" in line: + comment_pos = line.find(" #") + line, comment = line[:comment_pos], line[comment_pos:] + else: + comment = "" + # If there is a line continuation, drop it, and append the next line. + if line.endswith("\\"): + line = line[:-2].strip() + try: + line += next(lines) + except StopIteration: + return + # If there's a pip argument, save it + if line.startswith("--"): + pip_argument = line + continue + if line.startswith("-r "): + # linked requirement files are unsupported + continue + yield _RequirementWithComment(line, comment=comment, pip_argument=pip_argument) + pip_argument = None + + +def load_requirements(path_dir: str, file_name: str = "base.txt", unfreeze: str = "all") -> List[str]: + """Loading requirements from a file. + + >>> path_req = os.path.join(_PROJECT_ROOT, "requirements") + >>> load_requirements(path_req, "docs.txt", unfreeze="major") # doctest: +ELLIPSIS +NORMALIZE_WHITESPACE + ['sphinx<...] + """ + assert unfreeze in {"none", "major", "all"} + path = Path(path_dir) / file_name + if not path.exists(): + logging.warning(f"Folder {path_dir} does not have any base requirements.") + return [] + assert path.exists(), (path_dir, file_name, path) + text = path.read_text() + return [req.adjust(unfreeze) for req in _parse_requirements(text)] + + +def load_readme_description(path_dir: str, homepage: str, version: str) -> str: + """Load readme as decribtion. 
+ + >>> load_readme_description(_PROJECT_ROOT, "", "") # doctest: +ELLIPSIS +NORMALIZE_WHITESPACE + '...PyTorch Lightning is just organized PyTorch...' + """ + path_readme = os.path.join(path_dir, "README.md") + with open(path_readme, encoding="utf-8") as fo: + text = fo.read() + + # drop images from readme + text = text.replace( + "![PT to PL](docs/source-pytorch/_static/images/general/pl_quick_start_full_compressed.gif)", "" + ) + + # https://github.com/Lightning-AI/lightning/raw/master/docs/source/_static/images/lightning_module/pt_to_pl.png + github_source_url = os.path.join(homepage, "raw", version) + # replace relative repository path to absolute link to the release + # do not replace all "docs" as in the readme we refer to some other sources with particular path to docs + text = text.replace( + "docs/source-pytorch/_static/", f"{os.path.join(github_source_url, 'docs/source-app/_static/')}" + ) + + # readthedocs badge + text = text.replace("badge/?version=stable", f"badge/?version={version}") + text = text.replace("pytorch-lightning.readthedocs.io/en/stable/", f"pytorch-lightning.readthedocs.io/en/{version}") + # codecov badge + text = text.replace("/branch/master/graph/badge.svg", f"/release/{version}/graph/badge.svg") + # github actions badge + text = text.replace("badge.svg?branch=master&event=push", f"badge.svg?tag={version}") + # azure pipelines badge + text = text.replace("?branchName=master", f"?branchName=refs%2Ftags%2F{version}") + + skip_begin = r"" + skip_end = r"" + # todo: wrap content as commented description + text = re.sub(rf"{skip_begin}.+?{skip_end}", "", text, flags=re.IGNORECASE + re.DOTALL) + + # # https://github.com/Borda/pytorch-lightning/releases/download/1.1.0a6/codecov_badge.png + # github_release_url = os.path.join(homepage, "releases", "download", version) + # # download badge and replace url with local file + # text = _parse_for_badge(text, github_release_url) + return text + + +def distribute_version(src_folder: str, ver_file: str = 
"version.info") -> None: + """Copy the global version to all packages.""" + ls_ver = glob.glob(os.path.join(src_folder, "*", "__version__.py")) + ver_template = os.path.join(src_folder, ver_file) + for fpath in ls_ver: + fpath = os.path.join(os.path.dirname(fpath), ver_file) + print("Distributing the version to", fpath) + if os.path.isfile(fpath): + os.remove(fpath) + shutil.copy2(ver_template, fpath) + + +def _download_frontend(pkg_path: str): + """Downloads an archive file for a specific release of the Lightning frontend and extracts it to the correct + directory.""" + + try: + frontend_dir = pathlib.Path(pkg_path, "ui") + download_dir = tempfile.mkdtemp() + + shutil.rmtree(frontend_dir, ignore_errors=True) + # TODO: remove this once lightning-ui package is ready as a dependency + frontend_release_url = "https://storage.googleapis.com/grid-packages/lightning-ui/v0.0.0/build.tar.gz" + response = urllib.request.urlopen(frontend_release_url) + + file = tarfile.open(fileobj=response, mode="r|gz") + file.extractall(path=download_dir) + + shutil.move(os.path.join(download_dir, "build"), frontend_dir) + print("The Lightning UI has successfully been downloaded!") + + # If installing from source without internet connection, we don't want to break the installation + except Exception: + print("The Lightning UI downloading has failed!") + + +def _load_aggregate_requirements(req_dir: str = "requirements", freeze_requirements: bool = False) -> None: + """Load all base requirements from all particular packages and prune duplicates. 
+ + >>> _load_aggregate_requirements(os.path.join(_PROJECT_ROOT, "requirements")) + """ + requires = [ + load_requirements(d, unfreeze="none" if freeze_requirements else "major") + for d in glob.glob(os.path.join(req_dir, "*")) + # skip empty folder (git artifacts), and resolving Will's special issue + if os.path.isdir(d) and len(glob.glob(os.path.join(d, "*"))) > 0 and not os.path.basename(d).startswith("_") + ] + if not requires: + return + # TODO: add some smarter version aggregation per each package + requires = sorted(set(chain(*requires))) + with open(os.path.join(req_dir, "base.txt"), "w") as fp: + fp.writelines([ln + os.linesep for ln in requires] + [os.linesep]) + + +def _retrieve_files(directory: str, *ext: str) -> List[str]: + all_files = [] + for root, _, files in os.walk(directory): + for fname in files: + if not ext or any(os.path.split(fname)[1].lower().endswith(e) for e in ext): + all_files.append(os.path.join(root, fname)) + + return all_files + + +def _replace_imports(lines: List[str], mapping: List[Tuple[str, str]], lightning_by: str = "") -> List[str]: + """Replace imports of standalone package to lightning. + + >>> lns = [ + ... '"lightning_app"', + ... "lightning_app", + ... "lightning_app/", + ... "delete_cloud_lightning_apps", + ... "from lightning_app import", + ... "lightning_apps = []", + ... "lightning_app and pytorch_lightning are ours", + ... "def _lightning_app():", + ... ":class:`~lightning_app.core.flow.LightningFlow`", + ... "http://pytorch_lightning.ai", + ... "from lightning import __version__", + ... "@lightning.ai" + ... 
] + >>> mapping = [("lightning_app", "lightning.app"), ("pytorch_lightning", "lightning.pytorch")] + >>> _replace_imports(lns, mapping, lightning_by="lightning_fabric") # doctest: +NORMALIZE_WHITESPACE + ['"lightning.app"', \ + 'lightning.app', \ + 'lightning_app/', \ + 'delete_cloud_lightning_apps', \ + 'from lightning.app import', \ + 'lightning_apps = []', \ + 'lightning.app and lightning.pytorch are ours', \ + 'def _lightning_app():', \ + ':class:`~lightning.app.core.flow.LightningFlow`', \ + 'http://pytorch_lightning.ai', \ + 'from lightning_fabric import __version__', \ + '@lightning.ai'] + """ + out = lines[:] + for source_import, target_import in mapping: + for i, ln in enumerate(out): + out[i] = re.sub( + rf"([^_/@]|^){source_import}([^_\w/]|$)", + rf"\1{target_import}\2", + ln, + ) + if lightning_by: # in addition, replace base package + out[i] = out[i].replace("from lightning import ", f"from {lightning_by} import ") + out[i] = out[i].replace("import lightning ", f"import {lightning_by} ") + return out + + +def copy_replace_imports( + source_dir: str, + source_imports: Sequence[str], + target_imports: Sequence[str], + target_dir: Optional[str] = None, + lightning_by: str = "", +) -> None: + """Copy package content with import adjustments.""" + print(f"Replacing imports: {locals()}") + assert len(source_imports) == len(target_imports), ( + "source and target imports must have the same length, " + f"source: {len(source_imports)}, target: {len(target_imports)}" + ) + if target_dir is None: + target_dir = source_dir + + ls = _retrieve_files(source_dir) + for fp in ls: + fp_new = fp.replace(source_dir, target_dir) + _, ext = os.path.splitext(fp) + if ext in (".png", ".jpg", ".ico"): + os.makedirs(dirname(fp_new), exist_ok=True) + if not isfile(fp_new): + shutil.copy(fp, fp_new) + continue + if ext in (".pyc",): + continue + # Try to parse everything else + with open(fp, encoding="utf-8") as fo: + try: + lines = fo.readlines() + except UnicodeDecodeError: + # 
a binary file, skip + print(f"Skipped replacing imports for {fp}") + continue + lines = _replace_imports(lines, list(zip(source_imports, target_imports)), lightning_by=lightning_by) + os.makedirs(os.path.dirname(fp_new), exist_ok=True) + with open(fp_new, "w", encoding="utf-8") as fo: + fo.writelines(lines) + + +def create_mirror_package(source_dir: str, package_mapping: Dict[str, str]) -> None: + # replace imports and copy the code + mapping = package_mapping.copy() + mapping.pop("lightning", None) # pop this key to avoid replacing `lightning` to `lightning.lightning` + + mapping = {f"lightning.{sp}": sl for sp, sl in mapping.items()} + for pkg_from, pkg_to in mapping.items(): + copy_replace_imports( + source_dir=os.path.join(source_dir, pkg_from.replace(".", os.sep)), + # pytorch_lightning uses lightning_fabric, so we need to replace all imports for all directories + source_imports=mapping.keys(), + target_imports=mapping.values(), + target_dir=os.path.join(source_dir, pkg_to.replace(".", os.sep)), + lightning_by=pkg_from, + ) + + +class AssistantCLI: + @staticmethod + def requirements_prune_pkgs(packages: Sequence[str], req_files: Sequence[str] = REQUIREMENT_FILES_ALL) -> None: + """Remove some packages from given requirement files.""" + if isinstance(req_files, str): + req_files = [req_files] + for req in req_files: + AssistantCLI._prune_packages(req, packages) + + @staticmethod + def _prune_packages(req_file: str, packages: Sequence[str]) -> None: + """Remove some packages from given requirement files.""" + path = Path(req_file) + assert path.exists() + text = path.read_text() + lines = text.splitlines() + final = [] + for line in lines: + ln_ = line.strip() + if not ln_ or ln_.startswith("#"): + final.append(line) + continue + req = list(parse_requirements(ln_))[0] + if req.name not in packages: + final.append(line) + print(final) + path.write_text("\n".join(final) + "\n") + + @staticmethod + def _replace_min(fname: str) -> None: + with open(fname, 
encoding="utf-8") as fo: + req = fo.read().replace(">=", "==") + with open(fname, "w", encoding="utf-8") as fw: + fw.write(req) + + @staticmethod + def replace_oldest_ver(requirement_fnames: Sequence[str] = REQUIREMENT_FILES_ALL) -> None: + """Replace the min package version by fixed one.""" + for fname in requirement_fnames: + print(fname) + AssistantCLI._replace_min(fname) + + @staticmethod + def copy_replace_imports( + source_dir: str, + source_import: str, + target_import: str, + target_dir: Optional[str] = None, + lightning_by: str = "", + ) -> None: + """Copy package content with import adjustments.""" + source_imports = source_import.strip().split(",") + target_imports = target_import.strip().split(",") + copy_replace_imports( + source_dir, source_imports, target_imports, target_dir=target_dir, lightning_by=lightning_by + ) + + @staticmethod + def pull_docs_files( + gh_user_repo: str, + target_dir: str = "docs/source-pytorch/XXX", + checkout: str = "tags/1.0.0", + source_dir: str = "docs/source", + ) -> None: + """Pull docs pages from external source and append to local docs.""" + import zipfile + + zip_url = f"https://github.com/{gh_user_repo}/archive/refs/{checkout}.zip" + + with tempfile.TemporaryDirectory() as tmp: + zip_file = os.path.join(tmp, "repo.zip") + urllib.request.urlretrieve(zip_url, zip_file) + + with zipfile.ZipFile(zip_file, "r") as zip_ref: + zip_ref.extractall(tmp) + + zip_dirs = [d for d in glob.glob(os.path.join(tmp, "*")) if os.path.isdir(d)] + # check that the extracted archive has only repo folder + assert len(zip_dirs) == 1 + repo_dir = zip_dirs[0] + + ls_pages = glob.glob(os.path.join(repo_dir, source_dir, "*.rst")) + ls_pages += glob.glob(os.path.join(repo_dir, source_dir, "**", "*.rst")) + for rst in ls_pages: + rel_rst = rst.replace(os.path.join(repo_dir, source_dir) + os.path.sep, "") + rel_dir = os.path.dirname(rel_rst) + os.makedirs(os.path.join(_PROJECT_ROOT, target_dir, rel_dir), exist_ok=True) + new_rst = 
os.path.join(_PROJECT_ROOT, target_dir, rel_rst) + if os.path.isfile(new_rst): + logging.warning(f"Page {new_rst} already exists in the local tree so it will be skipped.") + continue + shutil.copy(rst, new_rst) + + +if __name__ == "__main__": + import jsonargparse + + jsonargparse.CLI(AssistantCLI, as_positional=False) diff --git a/.actions/pull_legacy_checkpoints.sh b/.actions/pull_legacy_checkpoints.sh new file mode 100644 index 0000000..b61647a --- /dev/null +++ b/.actions/pull_legacy_checkpoints.sh @@ -0,0 +1,11 @@ +#!/bin/bash + +# Run this script from the project root. +URL="https://pl-public-data.s3.amazonaws.com/legacy/checkpoints.zip" +mkdir -p tests/legacy +# wget is simpler but does not work on Windows +python -c "from urllib.request import urlretrieve; urlretrieve('$URL', 'tests/legacy/checkpoints.zip')" +ls -l tests/legacy/ + +unzip -o tests/legacy/checkpoints.zip -d tests/legacy/ +ls -l tests/legacy/checkpoints/ diff --git a/.actions/requirements.txt b/.actions/requirements.txt new file mode 100644 index 0000000..fdd6005 --- /dev/null +++ b/.actions/requirements.txt @@ -0,0 +1,2 @@ +jsonargparse>=4.16.0 +requests diff --git a/.github/workflows/deploy-gh-pages.yml b/.github/workflows/deploy-gh-pages.yml index 46998e5..879db68 100644 --- a/.github/workflows/deploy-gh-pages.yml +++ b/.github/workflows/deploy-gh-pages.yml @@ -1,47 +1,93 @@ -name: gh-pages deploy +name: Build Lightning Docs & Deploy to gh-pages on: push: branches: - master +defaults: + run: + shell: bash + +env: + FREEZE_REQUIREMENTS: "1" + TORCH_URL: "https://download.pytorch.org/whl/cpu/torch_stable.html" + PYPI_CACHE_DIR: "_pip-wheels" + jobs: - build: + make-html: runs-on: ubuntu-latest + container: + image: pytorchlightning/pytorch_lightning:docs + strategy: + fail-fast: false + matrix: + pkg-name: ["app", "fabric", "pytorch"] steps: - uses: actions/checkout@v3 + with: + submodules: true - - name: Set up Python 3.8 - uses: actions/setup-python@v3 + - name: pip wheels cache + uses: 
actions/cache/restore@v3 with: - python-version: '3.8' + path: ${{ env.PYPI_CACHE_DIR }} + key: pypi_wheels - - name: Upgrade pip - run: python3 -m pip install --upgrade pip + - name: Install package & dependencies + run: | + mkdir -p $PYPI_CACHE_DIR # in case cache was not hit + ls -lh $PYPI_CACHE_DIR + mkdir -p pypi_pkgs # in case template is not pulled + pip --version + pip install -U -r requirements.txt \ + -f pypi_pkgs/ -f $PYPI_CACHE_DIR -f ${TORCH_URL} + pip install -U -r requirements/${{ matrix.pkg-name }}/docs.txt \ + -f pypi_pkgs/ -f $PYPI_CACHE_DIR -f ${TORCH_URL} + pip list + shell: bash - - name: Get pip cache dir - id: pip-cache - run: echo "::set-output name=dir::$(pip cache dir)" + - name: Make Documentation + working-directory: ./docs/source-${{ matrix.pkg-name }} + run: make html --debug --jobs $(nproc) SPHINXOPTS="-W --keep-going" - - name: Cache dependencies - uses: actions/cache@v2 - with: - path: ${{ steps.pip-cache.outputs.dir }} - key: ${{ runner.os }}-pip-${{ hashFiles('**/requirements.txt') }} - restore-keys: | - ${{ runner.os }}-pip- + - name: Keep artifact + id: keep-artifact + run: python -c "print('DAYS=' + str(7 if '${{ github.event_name }}'.startswith('pull_request') else 0))" >> $GITHUB_OUTPUT - - name: Install dependencies - run: pip install -r requirements.txt + - name: Upload built docs + uses: actions/upload-artifact@v3 + with: + name: docs-${{ matrix.pkg-name }}-${{ github.sha }} + path: docs/build/html/ + retention-days: ${{ steps.keep-artifact.outputs.DAYS }} - - name: Build Sphinx documents - run: make docs + - name: Dump handy wheels + if: github.event_name == 'push' && github.ref == 'refs/heads/master' + continue-on-error: true + uses: ./.github/actions/pip-wheels + with: + wheel-dir: ${{ env.PYPI_CACHE_DIR }} + torch-url: ${{ env.TORCH_URL }} + cache-key: "pypi_wheels" + deploy-docs: + needs: [make-html] + runs-on: ubuntu-latest + strategy: + fail-fast: false + matrix: + pkg-name: ["app", "fabric", "pytorch"] + steps: + - 
uses: actions/download-artifact@v3 + with: + name: docs-${{ matrix.pkg-name }}-${{ github.sha }} + path: docs/build/html/ - name: Deploy to gh-pages branch uses: peaceiris/actions-gh-pages@v3 with: github_token: ${{ secrets.DEPLOY_TOKEN }} - publish_dir: ./build/html + publish_dir: ./docs/build/html cname: docs.pytorchlightning.kr enable_jekyll: false force_orphan: true diff --git a/.gitignore b/.gitignore index 923c2a1..c9307d0 100644 --- a/.gitignore +++ b/.gitignore @@ -2,23 +2,30 @@ .DS_Store run_configs/ model_weights/ -app/models/ pip-wheel-metadata/ lightning_logs/ .vscode/ -# Test-tube -test_tube_*/ - # Documentations -docs/source/api -docs/source/*.md -docs/source/generated -docs/source/*/generated -docs/source/notebooks -docs/source/_static/images/course_UvA-DL -docs/source/_static/images/lightning_examples +docs/venv*/ +docs/build*/ +docs/source-app/generated +docs/source-app/*/generated +docs/source-app/_static/fetched-s3-assets +docs/source-fabric/_static/fetched-s3-assets +docs/source-pytorch/api +docs/source-pytorch/*.md +docs/source-pytorch/generated +docs/source-pytorch/*/generated +docs/source-pytorch/notebooks +docs/source-pytorch/_static/images/course_UvA-DL +docs/source-pytorch/_static/images/lightning_examples +docs/source-pytorch/_static/fetched-s3-assets + +docs/source-fabric/*/generated +# C extensions +*.so # Byte-compiled / optimized / DLL files __pycache__/ *.py[cod] @@ -27,11 +34,6 @@ timit_data/ grid_generated* grid_ori* - - -# C extensions -*.so - # PyCharm .idea/ @@ -53,6 +55,18 @@ wheels/ *.egg-info/ .installed.cfg *.egg +src/*/version.info +src/lightning_app/* +src/lightning_fabric/* +src/pytorch_lightning/* +!src/*/__about__.py +!src/*/__main__.py +!src/*/__setup__.py +!src/*/__version__.py +!src/*/MANIFEST.in +!src/*/py.typed +!src/*/README.md +!src/*/shell-folder_code-lives-lightning.info # PyInstaller # Usually these files are written by a python script from a template @@ -113,6 +127,8 @@ celerybeat-schedule # dotenv .env 
+.env.staging +.env.local # virtualenv .venv @@ -134,13 +150,15 @@ ENV/ .mypy_cache/ # pytest .pytest_cache/ +# ruff +.ruff_cache/ # data .data/ Datasets/ mnist/ MNIST/ -legacy/checkpoints/ +tests/legacy/checkpoints/ *.gz *ubyte @@ -149,7 +167,6 @@ ml-runs/ mlruns/ *.zip *.ckpt -pytorch\ lightning test-reports/ wandb .forked/ @@ -163,3 +180,32 @@ cifar-10-batches-py # ctags tags .tags +src/lightning_app/ui/* +src/lightning/app/ui/* +*examples/template_react_ui* +hars* +artifacts/* +*docs/examples* + +# tutorials +our_model.tar +test.png +saved_models +data/ +!src/lightning/data/ +!examples/data/ +!tests/tests_pytorch/utilities/data/ +!requirements/data/ +.shared +.lightning +node_modules/ + +# examples +**/events.out.tfevents.* +examples/**/*.png + +# CI +.wheels/ + +# sourced notebooks from tutorials +_notebooks/.notebooks/ diff --git a/.gitmodules b/.gitmodules new file mode 100644 index 0000000..828dd19 --- /dev/null +++ b/.gitmodules @@ -0,0 +1,4 @@ +[submodule "_notebooks"] + path = _notebooks + url = https://github.com/PyTorchKorea/lightning-tutorials-kr.git + branch = publication diff --git a/.lightningignore b/.lightningignore new file mode 100644 index 0000000..4ce8d52 --- /dev/null +++ b/.lightningignore @@ -0,0 +1,16 @@ +_notebooks +.azure +.github +.ipynb_checkpoints +.pytest_cache +.shared +.storage +.venv +.vscode +.git +artifacts +Datasets +dist +docs +examples +tests diff --git a/Makefile b/Makefile index 2159c7f..c303c68 100644 --- a/Makefile +++ b/Makefile @@ -1,25 +1,38 @@ -# Minimal makefile for Sphinx documentation -# +.PHONY: test clean docs -# You can set these variables from the command line. 
-SPHINXOPTS = -SPHINXBUILD = sphinx-build -SOURCEDIR = source -BUILDDIR = build +# to imitate SLURM set only single node +export SLURM_LOCALID=0 +# assume you have installed need packages +export SPHINX_MOCK_REQUIREMENTS=1 +# install only Lightning Trainer packages +export PACKAGE_NAME=pytorch -# Put it first so that "make" without argument is like "make help". -help: - @$(SPHINXBUILD) -M help "$(SOURCEDIR)" "$(BUILDDIR)" $(SPHINXOPTS) $(O) - -.PHONY: help Makefile - -# Catch-all target: route all unknown targets to Sphinx using the new -# "make mode" option. $(O) is meant as a shortcut for $(SPHINXOPTS). -%: Makefile - @$(SPHINXBUILD) -M $@ "$(SOURCEDIR)" "$(BUILDDIR)" $(SPHINXOPTS) $(O) -v +clean: + # clean all temp runs + rm -rf $(shell find . -name "mlruns") + rm -rf $(shell find . -name "lightning_log") + rm -rf $(shell find . -name "lightning_logs") + rm -rf _ckpt_* + rm -rf .mypy_cache + rm -rf .pytest_cache + rm -rf ./docs/build + rm -rf ./docs/source-fabric/api/generated + rm -rf ./docs/source-pytorch/notebooks + rm -rf ./docs/source-pytorch/generated + rm -rf ./docs/source-pytorch/*/generated + rm -rf ./docs/source-pytorch/api + rm -rf ./docs/source-app/generated + rm -rf ./docs/source-app/*/generated + rm -rf build + rm -rf dist + rm -rf *.egg-info docs: - make html - echo "Build finished. The HTML pages are in $(BUILDDIR)/html." + git submodule update --init --recursive # get Notebook submodule + pip install -qq lightning # install (stable) Lightning from PyPI instead of src + pip install -qq -r requirements/app/base.txt + pip install -qq -r requirements/pytorch/docs.txt + cd docs/source-pytorch && $(MAKE) html --jobs $(nproc) && cd ../../ -.PHONY: all docs clean +update: + git submodule update --init --recursive --remote diff --git a/README.md b/README.md index 4979a18..70db3e5 100644 --- a/README.md +++ b/README.md @@ -1,79 +1,633 @@ -# PyTorch-Lightning Docs +
-We are using Sphinx with Napoleon extension. -Moreover, we set Google style to follow with type convention. +Lightning -- [Napoleon formatting with Google style](https://sphinxcontrib-napoleon.readthedocs.io/en/latest/example_google.html) -- [ReStructured Text (reST)](https://docs.pylonsproject.org/projects/docs-style-guide/) -- [Paragraph-level markup](https://www.sphinx-doc.org/en/master/usage/restructuredtext/basics.html#paragraphs) +
+
-See following short example of a sample function taking one position string and optional +**The Deep Learning framework to train, deploy, and ship AI products Lightning fast.** -```python -from typing import Optional +**NEW- Lightning 2.0 is featuring a clean and stable API!!** + +______________________________________________________________________ + +

+ Lightning.ai • + PyTorch Lightning • + Fabric • + Lightning Apps • + Docs • + Community • + Contribute • +

+ + + +[![PyPI - Python Version](https://img.shields.io/pypi/pyversions/pytorch-lightning)](https://pypi.org/project/pytorch-lightning/) +[![PyPI Status](https://badge.fury.io/py/pytorch-lightning.svg)](https://badge.fury.io/py/pytorch-lightning) +[![PyPI Status](https://pepy.tech/badge/pytorch-lightning)](https://pepy.tech/project/pytorch-lightning) +[![Conda](https://img.shields.io/conda/v/conda-forge/lightning?label=conda&color=success)](https://anaconda.org/conda-forge/lightning) +[![DockerHub](https://img.shields.io/docker/pulls/pytorchlightning/pytorch_lightning.svg)](https://hub.docker.com/r/pytorchlightning/pytorch_lightning) +[![codecov](https://codecov.io/gh/Lightning-AI/lightning/branch/master/graph/badge.svg?token=SmzX8mnKlA)](https://codecov.io/gh/Lightning-AI/lightning) + +[![Discord](https://img.shields.io/discord/1077906959069626439?style=plastic)](https://discord.gg/VptPCZkGNa) +![GitHub commit activity](https://img.shields.io/github/commit-activity/w/lightning-ai/lightning) +[![license](https://img.shields.io/badge/License-Apache%202.0-blue.svg)](https://github.com/Lightning-AI/lightning/blob/master/LICENSE) + + + +
+ +## Install Lightning + +Simple installation from PyPI + +```bash +pip install lightning +``` + -def my_func(param_a: int, param_b: Optional[float] = None) -> str: - """Sample function. +
+ Other installation options + - Args: - param_a: first parameter - param_b: second parameter +#### Install with optional dependencies - Return: - sum of both numbers +```bash +pip install lightning['extra'] +``` - Example:: +#### Conda - >>> my_func(1, 2) - 3 +```bash +conda install lightning -c conda-forge +``` - Note: - If you want to add something. - """ - p = param_b if param_b else 0 - return str(param_a + p) +#### Install stable version + +Install future release from the source + +```bash +pip install https://github.com/Lightning-AI/lightning/archive/refs/heads/release/stable.zip -U ``` -## Building Docs +#### Install bleeding-edge -When updating the docs, make sure to build them first locally and visually inspect the html files in your browser for -formatting errors. In certain cases, a missing blank line or a wrong indent can lead to a broken layout. -Run these commands +Install nightly from the source (no guarantees) ```bash -git submodule update --init --recursive -pip install -r requirements/docs.txt -make clean -cd docs -make html +pip install https://github.com/Lightning-AI/lightning/archive/refs/heads/master.zip -U ``` -and open `docs/build/html/index.html` in your browser. +or from testing PyPI + +```bash +pip install -U -i https://test.pypi.org/simple/ pytorch-lightning +``` + +
+ + +______________________________________________________________________ + +## Lightning has 3 core packages -When you send a PR the continuous integration will run tests and build the docs. You can access a preview of the html pages in the -_Artifacts_ tab in CircleCI when you click on the task named _build-Docs_ of _ci-tests_ at the bottom of the PR page. +[PyTorch Lightning: Train and deploy PyTorch at scale](#pytorch-lightning-train-and-deploy-pytorch-at-scale). +
+[Lightning Fabric: Expert control](#lightning-fabric-expert-control). +
+[Lightning Apps: Build AI products and ML workflows](#lightning-apps-build-ai-products-and-ml-workflows). -Notes (Optional): +Lightning gives you granular control over how much abstraction you want to add over PyTorch. -- You need to have LaTeX installed for rendering math equations. You can for example install TeXLive by doing one of the following: - - on Ubuntu (Linux) run `apt-get install texlive` or otherwise follow the instructions on the TeXLive website - - use the [RTD docker image](https://hub.docker.com/r/readthedocs/build) +
+ +
-## Developing docs +______________________________________________________________________ -When developing the docs, building docs can be VERY slow locally because of the notebook tutorials. -To speed this up, enable this flag in before building docs: +# PyTorch Lightning: Train and Deploy PyTorch at Scale + +PyTorch Lightning is just organized PyTorch - Lightning disentangles PyTorch code to decouple the science from the engineering. + +![PT to PL](docs/source-pytorch/_static/images/general/pl_quick_start_full_compressed.gif) + +______________________________________________________________________ + +### Hello simple model + +```python +# main.py +# ! pip install torchvision +import torch, torch.nn as nn, torch.utils.data as data, torchvision as tv, torch.nn.functional as F +import lightning as L + +# -------------------------------- +# Step 1: Define a LightningModule +# -------------------------------- +# A LightningModule (nn.Module subclass) defines a full *system* +# (ie: an LLM, diffusion model, autoencoder, or simple image classifier). + + +class LitAutoEncoder(L.LightningModule): + def __init__(self): + super().__init__() + self.encoder = nn.Sequential(nn.Linear(28 * 28, 128), nn.ReLU(), nn.Linear(128, 3)) + self.decoder = nn.Sequential(nn.Linear(3, 128), nn.ReLU(), nn.Linear(128, 28 * 28)) + + def forward(self, x): + # in lightning, forward defines the prediction/inference actions + embedding = self.encoder(x) + return embedding + + def training_step(self, batch, batch_idx): + # training_step defines the train loop. 
It is independent of forward + x, y = batch + x = x.view(x.size(0), -1) + z = self.encoder(x) + x_hat = self.decoder(z) + loss = F.mse_loss(x_hat, x) + self.log("train_loss", loss) + return loss + + def configure_optimizers(self): + optimizer = torch.optim.Adam(self.parameters(), lr=1e-3) + return optimizer + + +# ------------------- +# Step 2: Define data +# ------------------- +dataset = tv.datasets.MNIST(".", download=True, transform=tv.transforms.ToTensor()) +train, val = data.random_split(dataset, [55000, 5000]) + +# ------------------- +# Step 3: Train +# ------------------- +autoencoder = LitAutoEncoder() +trainer = L.Trainer() +trainer.fit(autoencoder, data.DataLoader(train), data.DataLoader(val)) +``` + +Run the model on your terminal ```bash -# builds notebooks which is slow -export PL_FAST_DOCS_DEV=0 +pip install torchvision +python main.py +``` + +______________________________________________________________________ + +## Advanced features + +Lightning has over [40+ advanced features](https://lightning.ai/docs/pytorch/stable/common/trainer.html#trainer-flags) designed for professional AI research at scale. + +Here are some examples: + +
+ +
+ +
+ Train on 1000s of GPUs without code changes + +```python +# 8 GPUs +# no code changes needed +trainer = Trainer(accelerator="gpu", devices=8) -# fast notebook build which is fast -export PL_FAST_DOCS_DEV=1 +# 256 GPUs +trainer = Trainer(accelerator="gpu", devices=8, num_nodes=32) ``` -## docs CSS/theme +
+ +
+ Train on other accelerators like TPUs without code changes + +```python +# no code changes needed +trainer = Trainer(accelerator="tpu", devices=8) +``` + +
+ +
+ 16-bit precision + +```python +# no code changes needed +trainer = Trainer(precision=16) +``` + +
+ +
+ Experiment managers + +```python +from lightning import loggers + +# tensorboard +trainer = Trainer(logger=loggers.TensorBoardLogger("logs/")) + +# weights and biases +trainer = Trainer(logger=loggers.WandbLogger()) + +# comet +trainer = Trainer(logger=loggers.CometLogger()) + +# mlflow +trainer = Trainer(logger=loggers.MLFlowLogger()) + +# neptune +trainer = Trainer(logger=loggers.NeptuneLogger()) + +# ... and dozens more +``` + +
+ +
+ +Early Stopping + +```python +es = EarlyStopping(monitor="val_loss") +trainer = Trainer(callbacks=[es]) +``` + +
+ +
+ Checkpointing + +```python +checkpointing = ModelCheckpoint(monitor="val_loss") +trainer = Trainer(callbacks=[checkpointing]) +``` + +
+ +
+ Export to torchscript (JIT) (production use) + +```python +# torchscript +autoencoder = LitAutoEncoder() +torch.jit.save(autoencoder.to_torchscript(), "model.pt") +``` + +
+ +
+ Export to ONNX (production use) + +```python +# onnx +with tempfile.NamedTemporaryFile(suffix=".onnx", delete=False) as tmpfile: + autoencoder = LitAutoEncoder() + input_sample = torch.randn((1, 28 * 28)) + autoencoder.to_onnx(tmpfile.name, input_sample, export_params=True) + os.path.isfile(tmpfile.name) +``` + +
+ +______________________________________________________________________ + +## Advantages over unstructured PyTorch + +- Models become hardware agnostic +- Code is clear to read because engineering code is abstracted away +- Easier to reproduce +- Make fewer mistakes because lightning handles the tricky engineering +- Keeps all the flexibility (LightningModules are still PyTorch modules), but removes a ton of boilerplate +- Lightning has dozens of integrations with popular machine learning tools. +- [Tested rigorously with every new PR](https://github.com/Lightning-AI/lightning/tree/master/tests). We test every combination of PyTorch and Python supported versions, every OS, multi GPUs and even TPUs. +- Minimal running speed overhead (about 300 ms per epoch compared with pure PyTorch). + +______________________________________________________________________ + +
+ Read the PyTorch Lightning docs +
+ +______________________________________________________________________ + +# Lightning Fabric: Expert control. + +Run on any device at any scale with expert-level control over PyTorch training loop and scaling strategy. You can even write your own Trainer. + +Fabric is designed for the most complex models like foundation model scaling, LLMs, diffusion, transformers, reinforcement learning, active learning. Of any size. + + + + + + + + + +
What to changeResulting Fabric Code (copy me!)
+ + +```diff ++ import lightning as L + import torch; import torchvision as tv + + dataset = tv.datasets.CIFAR10("data", download=True, + train=True, + transform=tv.transforms.ToTensor()) + ++ fabric = L.Fabric() ++ fabric.launch() + + model = tv.models.resnet18() + optimizer = torch.optim.SGD(model.parameters(), lr=0.001) +- device = "cuda" if torch.cuda.is_available() else "cpu" +- model.to(device) ++ model, optimizer = fabric.setup(model, optimizer) + + dataloader = torch.utils.data.DataLoader(dataset, batch_size=8) ++ dataloader = fabric.setup_dataloaders(dataloader) + + model.train() + num_epochs = 10 + for epoch in range(num_epochs): + for batch in dataloader: + inputs, labels = batch +- inputs, labels = inputs.to(device), labels.to(device) + optimizer.zero_grad() + outputs = model(inputs) + loss = torch.nn.functional.cross_entropy(outputs, labels) +- loss.backward() ++ fabric.backward(loss) + optimizer.step() + print(loss.data) +``` + + + + + +```Python +import lightning as L +import torch; import torchvision as tv + +dataset = tv.datasets.CIFAR10("data", download=True, + train=True, + transform=tv.transforms.ToTensor()) + +fabric = L.Fabric() +fabric.launch() + +model = tv.models.resnet18() +optimizer = torch.optim.SGD(model.parameters(), lr=0.001) +model, optimizer = fabric.setup(model, optimizer) + +dataloader = torch.utils.data.DataLoader(dataset, batch_size=8) +dataloader = fabric.setup_dataloaders(dataloader) + +model.train() +num_epochs = 10 +for epoch in range(num_epochs): + for batch in dataloader: + inputs, labels = batch + optimizer.zero_grad() + outputs = model(inputs) + loss = torch.nn.functional.cross_entropy(outputs, labels) + fabric.backward(loss) + optimizer.step() + print(loss.data) +``` + + +
+ +## Key features + +
+ Easily switch from running on CPU to GPU (Apple Silicon, CUDA, …), TPU, multi-GPU or even multi-node training + +```python +# Use your available hardware +# no code changes needed +fabric = Fabric() + +# Run on GPUs (CUDA or MPS) +fabric = Fabric(accelerator="gpu") + +# 8 GPUs +fabric = Fabric(accelerator="gpu", devices=8) + +# 256 GPUs, multi-node +fabric = Fabric(accelerator="gpu", devices=8, num_nodes=32) + +# Run on TPUs +fabric = Fabric(accelerator="tpu") +``` + +
+ +
+ Use state-of-the-art distributed training strategies (DDP, FSDP, DeepSpeed) and mixed precision out of the box + +```python +# Use state-of-the-art distributed training techniques +fabric = Fabric(strategy="ddp") +fabric = Fabric(strategy="deepspeed") +fabric = Fabric(strategy="fsdp") + +# Switch the precision +fabric = Fabric(precision="16-mixed") +fabric = Fabric(precision="64") +``` + +
+ +
+ All the device logic boilerplate is handled for you + +```diff + # no more of this! +- model.to(device) +- batch.to(device) +``` + +
+ +
+ Build your own custom Trainer using Fabric primitives for training checkpointing, logging, and more + +```python +import lightning as L + + +class MyCustomTrainer: + def __init__(self, accelerator="auto", strategy="auto", devices="auto", precision="32-true"): + self.fabric = L.Fabric(accelerator=accelerator, strategy=strategy, devices=devices, precision=precision) + + def fit(self, model, optimizer, dataloader, max_epochs): + self.fabric.launch() + + model, optimizer = self.fabric.setup(model, optimizer) + dataloader = self.fabric.setup_dataloaders(dataloader) + model.train() + + for epoch in range(max_epochs): + for batch in dataloader: + input, target = batch + optimizer.zero_grad() + output = model(input) + loss = loss_fn(output, target) + self.fabric.backward(loss) + optimizer.step() +``` + +You can find a more extensive example in our [examples](examples/fabric/build_your_own_trainer) + +
+ +______________________________________________________________________ + +
+ Read the Lightning Fabric docs +
+ +______________________________________________________________________ + +# Lightning Apps: Build AI products and ML workflows + +Lightning Apps remove the cloud infrastructure boilerplate so you can focus on solving the research or business problems. Lightning Apps can run on the Lightning Cloud, your own cluster or a private cloud. + +
+ +
+ +## Hello Lightning app world + +```python +# app.py +import lightning as L + + +class TrainComponent(L.LightningWork): + def run(self, x): + print(f"train a model on {x}") + + +class AnalyzeComponent(L.LightningWork): + def run(self, x): + print(f"analyze model on {x}") + + +class WorkflowOrchestrator(L.LightningFlow): + def __init__(self) -> None: + super().__init__() + self.train = TrainComponent(cloud_compute=L.CloudCompute("cpu")) + self.analyze = AnalyzeComponent(cloud_compute=L.CloudCompute("gpu")) + + def run(self): + self.train.run("CPU machine 1") + self.analyze.run("GPU machine 2") + + +app = L.LightningApp(WorkflowOrchestrator()) +``` + +Run on the cloud or locally + +```bash +# run on the cloud +lightning run app app.py --setup --cloud + +# run locally +lightning run app app.py +``` + +______________________________________________________________________ + +
+ Read the Lightning Apps docs +
+ +______________________________________________________________________ + +## Examples + +###### Self-supervised Learning + +- [CPC transforms](https://lightning-bolts.readthedocs.io/en/stable/transforms/self_supervised.html#cpc-transforms) +- [Moco v2 transforms](https://lightning-bolts.readthedocs.io/en/stable/transforms/self_supervised.html#moco-v2-transforms) +- [SimCLR transforms](https://lightning-bolts.readthedocs.io/en/stable/transforms/self_supervised.html#simclr-transforms) + +###### Convolutional Architectures + +- [GPT-2](https://lightning-bolts.readthedocs.io/en/stable/models/convolutional.html#gpt-2) +- [UNet](https://lightning-bolts.readthedocs.io/en/stable/models/convolutional.html#unet) + +###### Reinforcement Learning + +- [DQN Loss](https://lightning-bolts.readthedocs.io/en/stable/losses.html#dqn-loss) +- [Double DQN Loss](https://lightning-bolts.readthedocs.io/en/stable/losses.html#double-dqn-loss) +- [Per DQN Loss](https://lightning-bolts.readthedocs.io/en/stable/losses.html#per-dqn-loss) + +###### GANs + +- [Basic GAN](https://lightning-bolts.readthedocs.io/en/stable/models/gans.html#basic-gan) +- [DCGAN](https://lightning-bolts.readthedocs.io/en/stable/models/gans.html#dcgan) + +###### Classic ML + +- [Logistic Regression](https://lightning-bolts.readthedocs.io/en/stable/models/classic_ml.html#logistic-regression) +- [Linear Regression](https://lightning-bolts.readthedocs.io/en/stable/models/classic_ml.html#linear-regression) + +______________________________________________________________________ + +## Continuous Integration + +Lightning is rigorously tested across multiple CPUs, GPUs, TPUs, IPUs, and HPUs and against major Python and PyTorch versions. + +###### \*Codecov is > 90%+ but build delays may show less + +
+ Current build statuses + +
+ +| System / PyTorch ver. | 1.11 | 1.12 | 1.13 | 2.0 | +| :--------------------------------: | :---------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------: | :-----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------: | ------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------- | ---- | +| Linux py3.9 \[GPUs\] | - | [![Build Status]()](https://dev.azure.com/Lightning-AI/lightning/_build/latest?definitionId=24&branchName=master) | [![Build Status]()](https://dev.azure.com/Lightning-AI/lightning/_build/latest?definitionId=24&branchName=master) | Soon | +| Linux py3.9 \[TPUs\] | - | [![Test PyTorch - TPU](https://github.com/Lightning-AI/lightning/actions/workflows/tpu-tests.yml/badge.svg)](https://github.com/Lightning-AI/lightning/actions/workflows/tpu-tests.yml) | | Soon | +| Linux py3.8 \[IPUs\] | - | - | [![Build Status]()](https://dev.azure.com/Lightning-AI/lightning/_build/latest?definitionId=25&branchName=master) | Soon | +| Linux (multiple Python versions) | [![Test PyTorch](https://github.com/Lightning-AI/lightning/actions/workflows/ci-tests-pytorch.yml/badge.svg)](https://github.com/Lightning-AI/lightning/actions/workflows/ci-tests-pytorch.yml) | [![Test PyTorch](https://github.com/Lightning-AI/lightning/actions/workflows/ci-tests-pytorch.yml/badge.svg)](https://github.com/Lightning-AI/lightning/actions/workflows/ci-tests-pytorch.yml) | [![Test 
PyTorch](https://github.com/Lightning-AI/lightning/actions/workflows/ci-tests-pytorch.yml/badge.svg)](https://github.com/Lightning-AI/lightning/actions/workflows/ci-tests-pytorch.yml) | Soon | +| OSX (multiple Python versions) | [![Test PyTorch](https://github.com/Lightning-AI/lightning/actions/workflows/ci-tests-pytorch.yml/badge.svg)](https://github.com/Lightning-AI/lightning/actions/workflows/ci-tests-pytorch.yml) | [![Test PyTorch](https://github.com/Lightning-AI/lightning/actions/workflows/ci-tests-pytorch.yml/badge.svg)](https://github.com/Lightning-AI/lightning/actions/workflows/ci-tests-pytorch.yml) | [![Test PyTorch](https://github.com/Lightning-AI/lightning/actions/workflows/ci-tests-pytorch.yml/badge.svg)](https://github.com/Lightning-AI/lightning/actions/workflows/ci-tests-pytorch.yml) | Soon | +| Windows (multiple Python versions) | [![Test PyTorch](https://github.com/Lightning-AI/lightning/actions/workflows/ci-tests-pytorch.yml/badge.svg)](https://github.com/Lightning-AI/lightning/actions/workflows/ci-tests-pytorch.yml) | [![Test PyTorch](https://github.com/Lightning-AI/lightning/actions/workflows/ci-tests-pytorch.yml/badge.svg)](https://github.com/Lightning-AI/lightning/actions/workflows/ci-tests-pytorch.yml) | [![Test PyTorch](https://github.com/Lightning-AI/lightning/actions/workflows/ci-tests-pytorch.yml/badge.svg)](https://github.com/Lightning-AI/lightning/actions/workflows/ci-tests-pytorch.yml) | Soon | + +
+
+ +______________________________________________________________________ + +## Community + +The lightning community is maintained by + +- [10+ core contributors](https://lightning.ai/docs/pytorch/latest/community/governance.html) who are all a mix of professional engineers, Research Scientists, and Ph.D. students from top AI labs. +- 800+ community contributors. + +Want to help us build Lightning and reduce boilerplate for thousands of researchers? [Learn how to make your first contribution here](https://lightning.ai/docs/pytorch/stable/generated/CONTRIBUTING.html) + +Lightning is also part of the [PyTorch ecosystem](https://pytorch.org/ecosystem/) which requires projects to have solid testing, documentation and support. + +### Asking for help + +If you have any questions please: -To change the CSS theme of the docs, go [here](https://github.com/PyTorchLightning/lightning_sphinx_theme). -Apologies in advance... this is a bit complex to build and requires basic understanding of javascript/npm. +1. [Read the docs](https://lightning.ai/docs). +1. [Search through existing Discussions](https://github.com/Lightning-AI/lightning/discussions), or [add a new question](https://github.com/Lightning-AI/lightning/discussions/new) +1. [Join our discord](https://discord.com/invite/tfXFetEZxv). diff --git a/__about__.py b/__about__.py deleted file mode 100644 index 0a309f9..0000000 --- a/__about__.py +++ /dev/null @@ -1,38 +0,0 @@ -import time - -_this_year = time.strftime("%Y") -__version__ = "1.7.0dev" -__author__ = "William Falcon et al." -__author_email__ = "waf2107@columbia.edu" -__license__ = "Apache-2.0" -__copyright__ = f"Copyright (c) 2018-{_this_year}, {__author__}." 
-__homepage__ = "https://github.com/PyTorchLightning/pytorch-lightning" -__docs_url__ = "https://pytorch-lightning.readthedocs.io/en/stable/" -# this has to be simple string, see: https://github.com/pypa/twine/issues/522 -__docs__ = ( - "PyTorch Lightning is the lightweight PyTorch wrapper for ML researchers." - " Scale your models. Write less boilerplate." -) -__long_docs__ = """ -Lightning is a way to organize your PyTorch code to decouple the science code from the engineering. - It's more of a style-guide than a framework. - -In Lightning, you organize your code into 3 distinct categories: - -1. Research code (goes in the LightningModule). -2. Engineering code (you delete, and is handled by the Trainer). -3. Non-essential research code (logging, etc. this goes in Callbacks). - -Although your research/production project might start simple, once you add things like GPU AND TPU training, - 16-bit precision, etc, you end up spending more time engineering than researching. - Lightning automates AND rigorously tests those parts for you. - -Overall, Lightning guarantees rigorously tested, correct, modern best practices for the automated parts. 
- -Documentation -------------- -- https://pytorch-lightning.readthedocs.io/en/latest -- https://pytorch-lightning.readthedocs.io/en/stable -""" - -__all__ = ["__author__", "__author_email__", "__copyright__", "__docs__", "__homepage__", "__license__", "__version__"] diff --git a/_notebooks/.actions/README.md b/_notebooks/.actions/README.md new file mode 100644 index 0000000..7eb3226 --- /dev/null +++ b/_notebooks/.actions/README.md @@ -0,0 +1,11 @@ +scripts for generating notebooks + +**GHA here** + +- generate notebooks +- flow to ban any added notebook in PR (fail if changes in .notebooks) + +**PL side** + +- git submodule with these examples +- gha cron to update submodule head diff --git a/_notebooks/.actions/assistant.py b/_notebooks/.actions/assistant.py new file mode 100644 index 0000000..f489308 --- /dev/null +++ b/_notebooks/.actions/assistant.py @@ -0,0 +1,713 @@ +import base64 +import json +import os +import re +from datetime import datetime +from shutil import copyfile +from textwrap import wrap +from typing import Any, Dict, List, Optional, Sequence, Tuple +from warnings import warn + +import fire +import requests +import tqdm +import yaml +from pip._internal.operations import freeze +from wcmatch import glob + +_PATH_HERE = os.path.dirname(__file__) +_PATH_ROOT = os.path.dirname(_PATH_HERE) +PATH_REQ_DEFAULT = os.path.join(_PATH_ROOT, "_requirements", "default.txt") +PATH_SCRIPT_RENDER = os.path.join(_PATH_HERE, "_ipynb-render.sh") +PATH_SCRIPT_TEST = os.path.join(_PATH_HERE, "_ipynb-test.sh") +# https://askubuntu.com/questions/909918/how-to-show-unzip-progress +UNZIP_PROGRESS_BAR = ' | awk \'BEGIN {ORS=" "} {if(NR%10==0)print "."}\'' +REPO_NAME = "lightning-tutorials" +COLAB_REPO_LINK = "https://colab.research.google.com/github/PytorchLightning" +BRANCH_DEFAULT = "main" +BRANCH_PUBLISHED = "publication" +DIR_NOTEBOOKS = ".notebooks" +URL_PL_DOWNLOAD = f"https://github.com/Lightning-AI/{REPO_NAME}/raw/{BRANCH_DEFAULT}" +TEMPLATE_HEADER = f"""# %%%% 
[markdown] +# +# # %(title)s +# +# * **Author:** %(author)s +# * **License:** %(license)s +# * **Generated:** %(generated)s +# +# %(description)s +# +# --- +# Open in [![Open In Colab](https://colab.research.google.com/assets/colab-badge.png){{height="20px" width="117px"}}]({COLAB_REPO_LINK}/{REPO_NAME}/blob/{BRANCH_PUBLISHED}/{DIR_NOTEBOOKS}/%(local_ipynb)s) +# +# Give us a ⭐ [on Github](https://www.github.com/Lightning-AI/lightning/) +# | Check out [the documentation](https://pytorch-lightning.readthedocs.io/en/stable/) +# | Join us [on Slack](https://www.pytorchlightning.ai/community) + +""" +TEMPLATE_SETUP = """# %%%% [markdown] +# ## Setup +# This notebook requires some packages besides pytorch-lightning. + +# %%%% colab={} colab_type="code" id="LfrJLKPFyhsK" +# ! pip install --quiet %(requirements)s + +""" +TEMPLATE_FOOTER = """ +# %% [markdown] +# ## Congratulations - Time to Join the Community! +# +# Congratulations on completing this notebook tutorial! If you enjoyed this and would like to join the Lightning +# movement, you can do so in the following ways! +# +# ### Star [Lightning](https://github.com/Lightning-AI/lightning) on GitHub +# The easiest way to help our community is just by starring the GitHub repos! This helps raise awareness of the cool +# tools we're building. +# +# ### Join our [Slack](https://www.pytorchlightning.ai/community)! +# The best way to keep up to date on the latest advancements is to join our community! Make sure to introduce yourself +# and share your interests in `#general` channel +# +# +# ### Contributions ! +# The best way to contribute to our community is to become a code contributor! At any time you can go to +# [Lightning](https://github.com/Lightning-AI/lightning) or [Bolt](https://github.com/Lightning-AI/lightning-bolts) +# GitHub Issues page and filter for "good first issue". 
+# +# * [Lightning good first issue](https://github.com/Lightning-AI/lightning/issues?q=is%3Aopen+is%3Aissue+label%3A%22good+first+issue%22) +# * [Bolt good first issue](https://github.com/Lightning-AI/lightning-bolts/issues?q=is%3Aopen+is%3Aissue+label%3A%22good+first+issue%22) +# * You can also contribute your own notebooks with useful examples ! +# +# ### Great thanks from the entire Pytorch Lightning Team for your interest ! +# +# [![Pytorch Lightning](https://raw.githubusercontent.com/Lightning-AI/lightning/master/docs/source/_static/images/logo.png){height="60px" width="240px"}](https://pytorchlightning.ai) + +""" +TEMPLATE_CARD_ITEM = """ +.. customcarditem:: + :header: %(title)s + :card_description: %(short_description)s + :tags: %(tags)s +""" + + +def load_requirements(path_req: str = PATH_REQ_DEFAULT) -> list: + """Load the requirements from a file.""" + with open(path_req) as fp: + req = fp.readlines() + req = [r[: r.index("#")] if "#" in r else r for r in req] + req = [r.strip() for r in req] + req = [r for r in req if r] + return req + + +def get_running_cuda_version() -> str: + """Extract the version of actual CUDA for this runtime.""" + try: + import torch + + return torch.version.cuda or "" + except ImportError: + return "" + + +def get_running_torch_version(): + """Extract the version of actual PyTorch for this runtime.""" + try: + import torch + + ver = torch.__version__ + return ver[: ver.index("+")] if "+" in ver else ver + except ImportError: + return "" + + +_TORCH_VERSION = get_running_torch_version() +_CUDA_VERSION = get_running_cuda_version() +_RUNTIME_VERSIONS = dict( + TORCH_VERSION_FULL=_TORCH_VERSION, + TORCH_VERSION=_TORCH_VERSION[: _TORCH_VERSION.index("+")] if "+" in _TORCH_VERSION else _TORCH_VERSION, + TORCH_MAJOR_DOT_MINOR=".".join(_TORCH_VERSION.split(".")[:2]), + CUDA_VERSION=_CUDA_VERSION, + CUDA_MAJOR_MINOR=_CUDA_VERSION.replace(".", ""), + DEVICE=f"cu{_CUDA_VERSION.replace('.', '')}" if _CUDA_VERSION else "cpu", +) + + +class 
AssistantCLI: + """Collection of handy CLI commands.""" + + _LOCAL_ACCELERATOR = "cpu,gpu" if get_running_cuda_version() else "cpu" + DEVICE_ACCELERATOR = os.environ.get("ACCELERATOR", _LOCAL_ACCELERATOR).lower() + DATASETS_FOLDER = os.environ.get("PATH_DATASETS", "_datasets") + DRY_RUN = bool(int(os.environ.get("DRY_RUN", 0))) + _META_REQUIRED_FIELDS = ("title", "author", "license", "description") + _SKIP_DIRS = ( + ".actions", + ".azure", + ".datasets", + ".github", + "_docs", + "_TEMP", + "_requirements", + DIR_NOTEBOOKS, + ) + _META_FILE_REGEX = ".meta.{yaml,yml}" + _META_PIP_KEY = "pip__" + _META_ACCEL_DEFAULT = _LOCAL_ACCELERATOR.split(",") + + # Map directory names to tag names. Note that dashes will be replaced with spaces in rendered tags in the docs. + _DIR_TO_TAG = { + "course_UvA-DL": "UvA-DL-Course", + "lightning_examples": "Lightning-Examples", + "flash_tutorials": "Kaggle", + } + _BASH_SCRIPT_BASE = ("#!/bin/bash", "set -e", "") + _EXT_ARCHIVE_ZIP = (".zip",) + _EXT_ARCHIVE_TAR = (".tar", ".gz") + _EXT_ARCHIVE = _EXT_ARCHIVE_ZIP + _EXT_ARCHIVE_TAR + _AZURE_POOL = "lit-rtx-3090" + _AZURE_DOCKER = "pytorchlightning/pytorch_lightning:base-cuda-py3.9-torch1.12-cuda11.6.1" + + @staticmethod + def _find_meta(folder: str) -> str: + """Search for a meta file in given folder and return its path. + + Args: + folder: path to the folder with python script, meta and artefacts + """ + files = glob.glob(os.path.join(folder, AssistantCLI._META_FILE_REGEX), flags=glob.BRACE) + if len(files) == 1: + return files[0] + return "" + + @staticmethod + def _load_meta(folder: str, strict: bool = False) -> Optional[dict]: + """Loading meta-data for a particular notebook with given folder path. 
+ + Args: + folder: path to the folder with python script, meta and artefacts + strict: raise error if meta is missing required feilds + """ + fpath = AssistantCLI._find_meta(folder) + assert fpath, f"Missing meta file in folder: {folder}" + meta = yaml.safe_load(open(fpath)) + + if strict: + meta_miss = [fl for fl in AssistantCLI._META_REQUIRED_FIELDS if fl not in meta] + if meta_miss: + raise ValueError(f"Meta file '{fpath}' is missing the following fields: {meta_miss}") + return meta + + @staticmethod + def _valid_conf_folder(folder: str) -> Tuple[str, str]: + """Validate notebook folder if it has required meta file and optional thumb. + + Args: + folder: path to the folder with python script, meta and artefacts + """ + meta_files = [os.path.join(folder, f".meta.{ext}") for ext in ("yml", "yaml")] + meta_files = [pf for pf in meta_files if os.path.isfile(pf)] + if len(meta_files) != 1: + raise FileExistsError(f"found {len(meta_files)} meta (yaml|yml) files in folder: {folder}") + thumb_files = glob.glob(os.path.join(folder, ".thumb.*")) + thumb_names = list(map(os.path.basename, thumb_files)) + if len(thumb_files) > 1: + raise FileExistsError(f"Too many thumb files ({thumb_names}) found in folder: {folder}") + thumb = thumb_files[0] if thumb_files else "" + return meta_files[0], thumb + + @staticmethod + def _valid_folder(folder: str, ext: str) -> Tuple[str, str, str]: + """Validate notebook folder if it has required meta file, python script or ipython notebook (depending on + the stage) and optional thumb. 
+ + Args: + folder: path to the folder with python script, meta and artefacts + ext: extension determining the stage - ".py" for python script nad ".ipynb" for notebook + """ + files = glob.glob(os.path.join(folder, f"*{ext}")) + if len(files) != 1: + names = list(map(os.path.basename, files)) + raise FileNotFoundError(f"Missing required '{ext}' file in folder: {folder} among {names}") + meta_file, thumb_file = AssistantCLI._valid_conf_folder(folder) + return files[0], meta_file, thumb_file + + @staticmethod + def _valid_accelerator(folder: str) -> bool: + """Parse standard requirements from meta file. + + Args: + folder: path to the folder with python script, meta and artefacts + """ + meta = AssistantCLI._load_meta(folder) + meta_accels = [acc.lower() for acc in meta.get("accelerator", AssistantCLI._META_ACCEL_DEFAULT)] + device_accels = AssistantCLI.DEVICE_ACCELERATOR.lower().split(",") + return any(ac in meta_accels for ac in device_accels) + + @staticmethod + def _parse_requirements(folder: str) -> Tuple[str, str]: + """Parse standard requirements from meta file. + + Args: + folder: path to the folder with python script, meta and artefacts + """ + meta = AssistantCLI._load_meta(folder) + reqs = meta.get("requirements", []) + + meta_pip_args = { + k.replace(AssistantCLI._META_PIP_KEY, ""): v + for k, v in meta.items() + if k.startswith(AssistantCLI._META_PIP_KEY) + } + pip_args = ["--extra-index-url https://download.pytorch.org/whl/" + _RUNTIME_VERSIONS.get("DEVICE")] + for pip_key in meta_pip_args: + if not isinstance(meta_pip_args[pip_key], (list, tuple, set)): + meta_pip_args[pip_key] = [meta_pip_args[pip_key]] + for arg in meta_pip_args[pip_key]: + arg = arg % _RUNTIME_VERSIONS + pip_args.append(f"--{pip_key} {arg}") + + return " ".join([f'"{req}"' for req in reqs]), " ".join(pip_args) + + @staticmethod + def _bash_download_data(folder: str) -> List[str]: + """Generate sequence of commands for optional downloading dataset specified in the meta file. 
+ + Args: + folder: path to the folder with python script, meta and artefacts + """ + meta = AssistantCLI._load_meta(folder) + datasets = meta.get("datasets", {}) + data_kaggle = datasets.get("kaggle", []) + cmd = [f"python -m kaggle competitions download -c {name}" for name in data_kaggle] + files = [f"{name}.zip" for name in data_kaggle] + data_web = datasets.get("web", []) + cmd += [f"wget {web} --progress=bar:force:noscroll --tries=3" for web in data_web] + files += [os.path.basename(web) for web in data_web] + for fn in files: + name, ext = os.path.splitext(fn) + if ext not in AssistantCLI._EXT_ARCHIVE: + continue + if ext in AssistantCLI._EXT_ARCHIVE_ZIP: + cmd += [f"unzip -o {fn} -d {AssistantCLI.DATASETS_FOLDER}/{name} {UNZIP_PROGRESS_BAR}"] + else: + cmd += [f"tar -zxvf {fn} --overwrite"] + cmd += [f"rm {fn}"] + cmd += [f"tree -L 2 {AssistantCLI.DATASETS_FOLDER}"] + return cmd + + @staticmethod + def bash_render(folder: str, output_file: str = PATH_SCRIPT_RENDER) -> Optional[str]: + """Prepare bash script for running rendering of a particular notebook. + + Args: + folder: name/path to a folder with notebook files + output_file: if defined, stream the commands to the file + + Returns: + string with nash script content + """ + cmd = list(AssistantCLI._BASH_SCRIPT_BASE) + [f"# Rendering: {folder}"] + if not AssistantCLI.DRY_RUN: + cmd += AssistantCLI._bash_download_data(folder) + ipynb_file, meta_file, thumb_file = AssistantCLI._valid_folder(folder, ext=".ipynb") + pub_ipynb = os.path.join(DIR_NOTEBOOKS, f"{folder}.ipynb") + pub_meta = pub_ipynb.replace(".ipynb", ".yaml") + pub_dir = os.path.dirname(pub_ipynb) + thumb_ext = os.path.splitext(thumb_file)[-1] if thumb_file else "." 
+ pub_thumb = os.path.join(DIR_NOTEBOOKS, f"{folder}{thumb_ext}") if thumb_file else "" + cmd.append(f"mkdir -p {pub_dir}") + if AssistantCLI.DRY_RUN: + # dry run does not execute the notebooks just takes them as they are + cmd.append(f"cp {ipynb_file} {pub_ipynb}") + # copy and add meta config + cmd += [f"cp {meta_file} {pub_meta}", f"cat {pub_meta}", f"git add {pub_meta}"] + else: + pip_req, pip_args = AssistantCLI._parse_requirements(folder) + cmd += [f"pip install {pip_req} --quiet {pip_args}", "pip list"] + cmd.append(f"# available: {AssistantCLI.DEVICE_ACCELERATOR}\n") + if AssistantCLI._valid_accelerator(folder): + cmd.append(f"python -m papermill {ipynb_file} {pub_ipynb} --kernel python") + else: + warn("Invalid notebook's accelerator for this device. So no outputs will be generated.", RuntimeWarning) + cmd.append(f"cp {ipynb_file} {pub_ipynb}") + # Export the actual packages used in runtime + cmd.append(f"meta_file=$(python .actions/assistant.py update-env-details {folder})") + # copy and add to version the enriched meta config + cmd += ["echo $meta_file", "cat $meta_file", "git add $meta_file"] + # if thumb image is linked to the notebook, copy and version it too + if thumb_file: + cmd += [f"cp {thumb_file} {pub_thumb}", f"git add {pub_thumb}"] + # add the generated notebook to version + cmd.append(f"git add {pub_ipynb}") + if not output_file: + return os.linesep.join(cmd) + with open(output_file, "w") as fp: + fp.write(os.linesep.join(cmd)) + + @staticmethod + def bash_test(folder: str, output_file: str = PATH_SCRIPT_TEST) -> Optional[str]: + """Prepare bash script for running tests of a particular notebook. 
@staticmethod
def convert_ipynb(folder: str) -> None:
    """Add template header and footer to the python base script and pair it with a notebook.

    The ``.py`` script located in ``folder`` is rewritten in place: the header and setup
    templates rendered from the folder's meta config are prepended, the footer template
    is appended and image references are passed through ``_replace_images``. Afterwards
    ``jupytext`` is invoked on the script with the ``ipynb,py:percent`` formats.

    Args:
        folder: folder with python script
    """
    # local import: keeps this block self-contained without touching file-level imports
    import shlex

    fpath, _, _ = AssistantCLI._valid_folder(folder, ext=".py")
    with open(fpath) as fp:
        py_script = fp.readlines()

    meta = AssistantCLI._load_meta(folder, strict=True)
    meta.update(
        dict(local_ipynb=f"{folder}.ipynb"),
        generated=datetime.now().isoformat(),
    )
    # continue a multi-line description as comment lines in the rendered header
    meta["description"] = meta["description"].replace(os.linesep, f"{os.linesep}# ")

    header = TEMPLATE_HEADER % meta
    # `requirements` is optional in the meta config (``update_env_details`` treats it the same way);
    # sort the de-duplicated entries so the rendered setup does not depend on set iteration order
    requires = sorted(set(load_requirements() + meta.get("requirements", [])), key=str)
    setup = TEMPLATE_SETUP % dict(requirements=" ".join(f'"{req}"' for req in requires))
    py_script = [header + setup] + py_script + [TEMPLATE_FOOTER]

    py_script = AssistantCLI._replace_images(py_script, folder)

    with open(fpath, "w") as fp:
        fp.writelines(py_script)

    # quote the path so folders containing spaces or shell meta-characters are passed as one argument
    os.system(f'python -m jupytext --set-formats "ipynb,py:percent" {shlex.quote(fpath)}')
@staticmethod
def group_folders(
    fpath_gitdiff: str,
    fpath_change_folders: str = "changed-folders.txt",
    fpath_drop_folders: str = "dropped-folders.txt",
    fpath_actual_dirs: Sequence[str] = tuple(),
    strict: bool = True,
    root_path: str = "",
) -> None:
    """Parsing the raw git diff and group changes by folders.

    The parent folders of all changed files are collected, optionally extended by the folders
    which are not common to all listings in ``fpath_actual_dirs``, filtered by the skip list
    and then written to two files: folders which exist and have a meta file (changed) and
    folders which do not exist on disk anymore (dropped).

    Args:
        fpath_gitdiff: raw git changes

            Generate the git change list:
            > head=$(git rev-parse origin/main)
            > git diff --name-only $head --output=master-diff.txt

        fpath_change_folders: output file with changed folders
        fpath_drop_folders: output file with deleted folders
        fpath_actual_dirs: files listing all folders in a particular state, one folder per line
        strict: raise error if some folder outside skipped does not have valid meta file
        root_path: path to the root to be added for all local folder paths in files

    Raises:
        TypeError: if ``fpath_actual_dirs`` is given but is not a list or tuple of paths
        FileNotFoundError: if any of ``fpath_actual_dirs`` is not an existing file, or in ``strict``
            mode if an existing folder has no valid meta file in itself nor in any sub-folder

    Example:
        $ python assistant.py group-folders ../target-diff.txt \
            --fpath_actual_dirs "['../dirs-main.txt', '../dirs-publication.txt']"
    """
    with open(fpath_gitdiff) as fp:
        changed = [ln.strip() for ln in fp.readlines()]
    dirs = [os.path.dirname(ln) for ln in changed]
    # not empty paths
    dirs = [ln for ln in dirs if ln]

    if fpath_actual_dirs:
        # explicit checks instead of `assert` so they also run with `python -O`;
        # a tuple is accepted as well since it is the declared default
        if not isinstance(fpath_actual_dirs, (list, tuple)):
            raise TypeError(
                f"`fpath_actual_dirs` has to be a list of file paths, got {type(fpath_actual_dirs).__name__}"
            )
        missing = [p for p in fpath_actual_dirs if not os.path.isfile(p)]
        if missing:
            raise FileNotFoundError(f"Missing listing file(s): {missing}")
        dir_sets = []
        for fpath_listing in fpath_actual_dirs:
            # context manager so the listing files are closed deterministically
            with open(fpath_listing) as fp:
                # blank lines are not folders; keeping them would add an empty path to the diff below
                dir_sets.append({ln.strip() for ln in fp} - {""})
        # get only different
        dirs += list(set.union(*dir_sets) - set.intersection(*dir_sets))

    if root_path:
        dirs = [os.path.join(root_path, d) for d in dirs]
    # unique folders
    dirs = set(dirs)
    # drop folder with skip folder
    dirs = [pd for pd in dirs if not any(nd in AssistantCLI._SKIP_DIRS for nd in pd.split(os.path.sep))]
    # valid folder has meta
    dirs_exist = [d for d in dirs if os.path.isdir(d)]
    dirs_invalid = [d for d in dirs_exist if not AssistantCLI._find_meta(d)]
    if strict and dirs_invalid:
        msg = f"Following folders do not have valid `{AssistantCLI._META_FILE_REGEX}`"
        warn(f"{msg}: \n {os.linesep.join(dirs_invalid)}")
        # check if there is other valid folder in its tree
        dirs_invalid = [pd for pd in dirs_invalid if not AssistantCLI._is_ipynb_parent_dir(pd)]
        if dirs_invalid:
            raise FileNotFoundError(f"{msg} nor sub-folder: \n {os.linesep.join(dirs_invalid)}")

    dirs_change = [d for d in dirs_exist if AssistantCLI._find_meta(d)]
    with open(fpath_change_folders, "w") as fp:
        fp.write(os.linesep.join(sorted(dirs_change)))

    # folders referenced by the diff/listings which are not present on disk anymore
    dirs_drop = [d for d in dirs if not os.path.isdir(d)]
    with open(fpath_drop_folders, "w") as fp:
        fp.write(os.linesep.join(sorted(dirs_drop)))
@staticmethod
def copy_notebooks(
    path_root: str,
    docs_root: str = "_docs/source",
    path_docs_ipynb: str = "notebooks",
    path_docs_images: str = "_static/images",
    patterns: Sequence[str] = (".", "**"),
) -> None:
    """Copy all notebooks from a folder to doc folder.

    Each notebook found below ``<path_root>/<DIR_NOTEBOOKS>`` is loaded, extended with a card item
    cell built by ``_get_card_item_cell`` and written to the docs folder under the same relative
    path. If a thumbnail is resolved for the notebook, it is copied to the docs images folder.

    Args:
        path_root: source path to the project root in these tutorials
        docs_root: docs source directory
        path_docs_ipynb: destination path to the notebooks' location relative to ``docs_root``
        path_docs_images: destination path to the images' location relative to ``docs_root``
        patterns: patterns to use when glob-ing notebooks
    """
    ls_ipynb = []
    for sub in patterns:
        ls_ipynb += glob.glob(os.path.join(path_root, DIR_NOTEBOOKS, sub, "*.ipynb"))

    os.makedirs(os.path.join(docs_root, path_docs_ipynb), exist_ok=True)
    for path_ipynb in tqdm.tqdm(ls_ipynb):
        # path of the notebook relative to the notebooks folder
        path_parts = path_ipynb.split(os.path.sep)
        sub_ipynb = os.path.sep.join(path_parts[path_parts.index(DIR_NOTEBOOKS) + 1 :])
        new_ipynb = os.path.join(docs_root, path_docs_ipynb, sub_ipynb)
        os.makedirs(os.path.dirname(new_ipynb), exist_ok=True)

        # swap only the file extension; a plain `str.replace` would also rewrite
        # any ".ipynb" occurring in a directory name
        path_meta = os.path.splitext(path_ipynb)[0] + ".yaml"
        path_thumb = AssistantCLI._resolve_path_thumb(path_ipynb, path_meta)

        if path_thumb is not None:
            new_thumb = os.path.join(docs_root, path_docs_images, path_thumb)
            old_path_thumb = os.path.join(path_root, DIR_NOTEBOOKS, path_thumb)
            os.makedirs(os.path.dirname(new_thumb), exist_ok=True)
            copyfile(old_path_thumb, new_thumb)
            # from here on the thumbnail is referenced relative to the docs root
            path_thumb = os.path.join(path_docs_images, path_thumb)

        print(f"{path_ipynb} -> {new_ipynb}")

        with open(path_ipynb) as f:
            notebook = json.load(f)

        notebook["cells"].append(AssistantCLI._get_card_item_cell(path_ipynb, path_meta, path_thumb))

        with open(new_ipynb, "w") as f:
            json.dump(notebook, f)
@staticmethod
def list_dirs(folder: str = "", include_file_ext: str = "") -> str:
    """List entries found directly in ``folder`` and one directory level below it.

    Without ``include_file_ext`` only directories are reported. With an extension, the matching
    files are reported instead, with their leading path component and their extension removed.

    Args:
        folder: base folder used as the prefix of both glob patterns
        include_file_ext: file extension appended to the ``*`` glob pattern, e.g. ``".ipynb"``

    Returns:
        the sorted entries joined by ``os.linesep``
    """
    pattern = "*" + include_file_ext
    # `**` is used without `recursive=True`, so it matches a single directory level
    found = [
        *glob.glob(os.path.join(folder, pattern)),
        *glob.glob(os.path.join(folder, "**", pattern)),
    ]
    if not include_file_ext:
        return os.linesep.join(sorted(path for path in found if os.path.isdir(path)))

    # Take the notebook as a folder (notebooks are on the same level as the raw tutorial file mix)
    sep = os.path.sep
    names = []
    for path in found:
        without_base = sep.join(path.split(sep)[1:])  # drop the first path component
        names.append(os.path.splitext(without_base)[0])
    return os.linesep.join(sorted(names))
import os

import pytest
from assistant import AssistantCLI

# two levels up from this file, i.e. the parent of the directory holding this test module
_PATH_ROOT = os.path.dirname(os.path.dirname(__file__))
_PATH_TEMPLATES = os.path.join(_PATH_ROOT, "templates")
_PATH_DIR_SIMPLE = os.path.join(_PATH_TEMPLATES, "simple")
_PATH_DIR_TITANIC = os.path.join(_PATH_TEMPLATES, "titanic")


def _path_in_dir(fname: str, folder: str = _PATH_ROOT) -> str:
    """Join ``fname`` onto ``folder`` (``_PATH_ROOT`` by default)."""
    return os.path.join(folder, fname)


@pytest.mark.parametrize(
    "cmd,args",
    [
        ("list_dirs", []),
        ("list_dirs", [".", ".ipynb"]),
        ("bash_render", [_PATH_DIR_SIMPLE]),
        ("bash_test", [_PATH_DIR_SIMPLE]),
        # NOTE(review): passed positionally, the 2nd and 3rd values bind to `fpath_change_folders`
        # and `fpath_drop_folders`, i.e. they are used as output paths - confirm this is intended
        # and they were not meant to be given as `fpath_actual_dirs`
        ("group_folders", [_path_in_dir("master-diff.txt"), _path_in_dir("dirs-b1.txt"), _path_in_dir("dirs-b2.txt")]),
        ("convert_ipynb", [_PATH_DIR_SIMPLE]),
        ("copy_notebooks", [_PATH_ROOT]),
        ("update_env_details", [_PATH_DIR_SIMPLE]),
    ],
)
def test_assistant_commands(cmd: str, args: list):
    """Smoke test: each CLI command is looked up by name and has to run without raising."""
    # `getattr` is the public way for a lookup by name; no need to call the dunder directly
    getattr(AssistantCLI(), cmd)(*args)
== "1" ] ; then echo "Branch doesn't exist"; exit; fi + displayName: 'Git branch check' + + - bash: pip install -r .actions/requires.txt + displayName: 'Install dependencies' + - bash: | + current_branch=$(cut -d '/' -f3- <<< $(Build.SourceBranch)) + printf "$current_branch\n" + bash .actions/git-diff-sync.sh $current_branch $(PUB_BRANCH) + displayName: 'Compare changes & sync' + + - bash: | + notebooks=$(python .actions/assistant.py generate-matrix changed-folders.txt) + printf "Changed notebooks: $notebooks\n" + echo "##vso[task.setVariable variable=dirs;isOutput=true]$notebooks" + name: mtrx + displayName: 'Changed matrix' + + - bash: | + # remove notebooks which have moved + while IFS= read -r line; do + git rm .notebooks/$line.ipynb + git rm .notebooks/$line.yaml + done <<< $(cat dropped-folders.txt) + git status + git commit -m "prune: $(COMMIT_HASH)" + condition: gt(variables['dropped.folders'], 0) + displayName: 'Prune notebook' + + - bash: | + git status + git push https://$(PAT_GHOST)@github.com/Lightning-AI/tutorials.git $(PUB_BRANCH) + displayName: 'Finish push' + + - job: papermill + dependsOn: sync_pub + strategy: + # generated matrix with changed notebooks, include fields: "notebook", "agent-pool" and "docker-image" + matrix: $[ dependencies.sync_pub.outputs['mtrx.dirs'] ] + # Maximum number of jobs running in parallel, use 1 to run in sequence and reduce collisions + maxParallel: "1" + # how much time to give 'run always even if cancelled tasks' before stopping them + cancelTimeoutInMinutes: "2" + # how long to run the job before automatically cancelling + # When 0 is specified, the maximum limit is used: + # - For 360 minutes (6 hours) on Microsoft-hosted agents with a public project and public repository + # - For 60 minutes on Microsoft-hosted agents with a private project or private repository + timeoutInMinutes: "180" + + pool: "$(agent-pool)" + # this need to have installed docker in the base machine/image... 
+ container: + image: "$(docker-image)" + options: "--gpus=all --shm-size=32g -v /usr/bin/docker:/tmp/docker:ro" + + variables: + ACCELERATOR: CPU,GPU + PUB_BRANCH: publication + PATH_DATASETS: "$(Build.Repository.LocalPath)/.datasets" + COMMIT_MSG: $(echo "$(Build.SourceVersionMessage)" | head -n 1) + COMMIT_HASH: "$(Build.SourceVersion)" + DEVICES: $( python -c 'print("$(Agent.Name)".split("_")[-1])' ) + + condition: ne(dependencies.sync_pub.outputs['mtrx.dirs'], '') + + steps: + - bash: | + echo "##vso[task.setvariable variable=CUDA_VISIBLE_DEVICES]$(DEVICES)" + echo "##vso[task.setvariable variable=CONTAINER_ID]$(head -1 /proc/self/cgroup|cut -d/ -f3)" + displayName: 'Set environment variables' + + - bash: | + lspci | egrep 'VGA|3D' + whereis nvidia + nvidia-smi + echo $CUDA_VISIBLE_DEVICES + echo $CONTAINER_ID + python --version + pip list + displayName: 'Image info & NVIDIA' + + - script: | + /tmp/docker exec -t -u 0 $CONTAINER_ID \ + sh -c "apt-get update && DEBIAN_FRONTEND=noninteractive apt-get -o Dpkg::Options::="--force-confold" -y install sudo" + displayName: 'Install Sudo in container (thanks Microsoft!)' + + - bash: | + git config --global user.email "pipelines@azure.com" + git config --global user.name "Azure Pipelines" + printf "commit hash:\n $(COMMIT_HASH)\n" + printf "commit message:\n $(COMMIT_MSG)\n" + displayName: 'Set Git user' + - bash: | + set -e + git fetch --all + echo $(PUB_BRANCH) + git ls-remote --heads origin ${PUB_BRANCH} | grep ${PUB_BRANCH} >/dev/null + if [ "$?" 
== "1" ] ; then echo "Branch doesn't exist"; exit; fi + git checkout $(PUB_BRANCH) + git show-ref $(PUB_BRANCH) + git pull + displayName: 'Git check & switch branch' + + - bash: | + set -e + sudo apt-get update -q --fix-missing + sudo apt install -y tree ffmpeg + #pip install --upgrade pip + #pip --version + pip install -r requirements.txt -r _requirements/data.txt + pip list + displayName: 'Install dependencies' + + - bash: | + set -e + python -c "import torch ; mgpu = torch.cuda.device_count() ; assert mgpu > 0, f'GPU: {mgpu}'" + python -m papermill --version + displayName: 'Sanity check' + + - bash: python .actions/assistant.py convert-ipynb $(notebook) + displayName: 'Generate notebook' + + - bash: | + set -e + mkdir $(PATH_DATASETS) + python .actions/assistant.py bash-render $(notebook) + cat .actions/_ipynb-render.sh + bash .actions/_ipynb-render.sh + git status + git commit -m "publish [GPU]: $(notebook)" + env: + KAGGLE_USERNAME: $(KAGGLE_USERNAME) + KAGGLE_KEY: $(KAGGLE_KEY) + displayName: 'Render notebook' + + - bash: | + git status + git show-ref $(PUB_BRANCH) + git push https://$(PAT_GHOST)@github.com/Lightning-AI/tutorials.git $(PUB_BRANCH) + displayName: 'Finish push' diff --git a/_notebooks/.azure/ipynb-tests.yml b/_notebooks/.azure/ipynb-tests.yml new file mode 100644 index 0000000..f7c9d24 --- /dev/null +++ b/_notebooks/.azure/ipynb-tests.yml @@ -0,0 +1,106 @@ +trigger: none +pr: + branches: + include: [ main ] + autoCancel: "true" + drafts: "true" + +# Multi-job configuration +# - https://learn.microsoft.com/en-us/azure/devops/pipelines/process/phases?view=azure-devops&tabs=yaml#multi-job-configuration + +jobs: + + - job: check_diff + pool: + vmImage: 'Ubuntu-20.04' + steps: + - bash: | + pip install -r .actions/requires.txt + pip list + displayName: 'Install dependencies' + + - bash: | + head=$(git rev-parse origin/main) + printf "Head: $head\n" + git diff --name-only $head --output=target-diff.txt + python .actions/assistant.py group-folders 
--fpath_gitdiff=target-diff.txt + printf "Changed folders:\n" + cat changed-folders.txt + displayName: 'Process folders' + + - bash: | + notebooks=$(python .actions/assistant.py generate-matrix changed-folders.txt) + printf "Changed notebooks: $notebooks\n" + echo "##vso[task.setVariable variable=dirs;isOutput=true]$notebooks" + name: mtrx + displayName: 'Changed matrix' + + - job: nbval + dependsOn: check_diff + strategy: + matrix: $[ dependencies.check_diff.outputs['mtrx.dirs'] ] + # how long to run the job before automatically cancelling + timeoutInMinutes: "95" + # how much time to give 'run always even if cancelled tasks' before stopping them + cancelTimeoutInMinutes: "2" + + pool: "$(agent-pool)" + # this need to have installed docker in the base image... + container: + image: "$(docker-image)" + options: "--gpus=all --shm-size=32g -v /usr/bin/docker:/tmp/docker:ro" + + variables: + ACCELERATOR: CPU,GPU + PATH_DATASETS: "$(Build.Repository.LocalPath)/.datasets" + DEVICES: $( python -c 'print("$(Agent.Name)".split("_")[-1])' ) + + condition: ne(dependencies.check_diff.outputs['mtrx.dirs'], '') + + steps: + + - bash: | + echo "##vso[task.setvariable variable=CUDA_VISIBLE_DEVICES]$(DEVICES)" + echo "##vso[task.setvariable variable=CONTAINER_ID]$(head -1 /proc/self/cgroup|cut -d/ -f3)" + displayName: 'Set environment variables' + + - bash: | + lspci | egrep 'VGA|3D' + whereis nvidia + nvidia-smi + echo $CUDA_VISIBLE_DEVICES + echo $CONTAINER_ID + python --version + pip list | grep torch + displayName: 'Image info & NVIDIA' + + - script: | + /tmp/docker exec -t -u 0 $CONTAINER_ID \ + sh -c "apt-get update && DEBIAN_FRONTEND=noninteractive apt-get -o Dpkg::Options::="--force-confold" -y install sudo" + displayName: 'Install Sudo in container (thanks Microsoft!)' + + - bash: | + set -e + sudo apt-get update -q --fix-missing + sudo apt install -y tree ffmpeg + pip install -r requirements.txt -r _requirements/data.txt + pip list + displayName: 'Install dependencies' + 
+ - bash: | + python -c "import torch ; mgpu = torch.cuda.device_count() ; assert mgpu > 0, f'GPU: {mgpu}'" + displayName: 'Sanity check' + + - bash: python .actions/assistant.py convert-ipynb $(notebook) + displayName: 'Generate notebook' + + - bash: | + set -e + mkdir $(PATH_DATASETS) + python .actions/assistant.py bash-test $(notebook) + cat .actions/_ipynb-test.sh + bash .actions/_ipynb-test.sh + env: + KAGGLE_USERNAME: $(KAGGLE_USERNAME) + KAGGLE_KEY: $(KAGGLE_KEY) + displayName: 'PyTest notebook' diff --git a/_notebooks/.codecov.yml b/_notebooks/.codecov.yml new file mode 100644 index 0000000..7196116 --- /dev/null +++ b/_notebooks/.codecov.yml @@ -0,0 +1,52 @@ +# see https://docs.codecov.io/docs/codecov-yaml +# Validation check: +# $ curl --data-binary @.codecov.yml https://codecov.io/validate + + +# https://docs.codecov.io/docs/codecovyml-reference +codecov: + bot: "codecov-io" + strict_yaml_branch: "yaml-config" + require_ci_to_pass: yes + notify: + # after_n_builds: 2 + wait_for_ci: yes + +coverage: + precision: 0 # 2 = xx.xx%, 0 = xx% + round: nearest # how coverage is rounded: down/up/nearest + range: 40...100 # custom range of coverage colors from red -> yellow -> green + status: + # https://codecov.readme.io/v1.0/docs/commit-status + project: + default: + target: 95% # specify the target coverage for each commit status + threshold: 30% # allow this little decrease on project + # https://github.com/codecov/support/wiki/Filtering-Branches + # branches: master + if_ci_failed: error + # https://github.com/codecov/support/wiki/Patch-Status + patch: + default: + threshold: 50% # allow this much decrease on patch + changes: false + +# https://docs.codecov.com/docs/github-checks#disabling-github-checks-patch-annotations +github_checks: + annotations: false + +parsers: + gcov: + branch_detection: + conditional: true + loop: true + macro: false + method: false + javascript: + enable_partials: false + +comment: + layout: header, diff + require_changes: false + 
behavior: default # update if exists else create new + # branches: * diff --git a/_notebooks/.gitattributes b/_notebooks/.gitattributes new file mode 100644 index 0000000..180a922 --- /dev/null +++ b/_notebooks/.gitattributes @@ -0,0 +1 @@ +*.ipynb filter=lfs diff=lfs merge=lfs -text diff --git a/_notebooks/.github/CODEOWNERS b/_notebooks/.github/CODEOWNERS new file mode 100644 index 0000000..24a71a1 --- /dev/null +++ b/_notebooks/.github/CODEOWNERS @@ -0,0 +1,24 @@ +# This is a comment. +# Each line is a file pattern followed by one or more owners. + +# These owners will be the default owners for everything in +# the repo. Unless a later match takes precedence, +# @global-owner1 and @global-owner2 will be requested for +# review when someone opens a pull request. +* @borda @rohitgr7 @carmocca @kaushikb11 @SeanNaren @ethanwharris + +# CI/CD and configs +/.actions/ @borda @ethanwharris +/.azure-*/ @borda @ethanwharris +/.github/ @borda @ethanwharris +/_requirements/ @borda @ethanwharris +*.yml @borda @ethanwharris +requirements.txt @borda @ethanwharris + +# Docs +/_docs/ @borda @ethanwharris @rohitgr7 +/.github/*.md @borda @ethanwharris @rohitgr7 +/.github/ISSUE_TEMPLATE/ @borda @ethanwharris @rohitgr7 + +/.github/CODEOWNERS @borda +/README.md @borda diff --git a/_notebooks/.github/CONTRIBUTING.md b/_notebooks/.github/CONTRIBUTING.md new file mode 100644 index 0000000..b2510fc --- /dev/null +++ b/_notebooks/.github/CONTRIBUTING.md @@ -0,0 +1,81 @@ +# Contributing + +Welcome to the PyTorch Lightning community! We're building the most advanced research platform on the planet to implement the latest, best practices that the amazing PyTorch team rolls out! + +## Design Principles + +We encourage all sorts of contributions you're interested in adding! When writing Tutorials, please follow these principles. + +#### Simple Internal Code + +It's useful for users to look at the code and understand very quickly what's happening. +Many users won't be engineers. 
Thus we need to value clear, simple code over condensed ninja moves. +While that's super cool, this isn't the project for that :) + +#### Force User Decisions To Best Practices + +There are 1,000 ways to do something. However, eventually one popular solution becomes standard practice, and everyone follows. +We try to find the best way to solve a particular problem, and then force our users to use it for readability and simplicity. + +When something becomes a best practice, we add it to the framework. This is usually something like bits of code in utils or in the model file that everyone keeps adding over and over again across projects. When this happens, bring that code inside the trainer and add a flag for it. + +#### Gain User Trust + +As a researcher, you can't have any part of your code going wrong. So, make thorough tests to ensure that every implementation of a new trick or subtle change is correct. + +#### Interoperability + +PyTorch Lightning Tutorials is highly interoperable with PyTorch Lightning and PyTorch. + +______________________________________________________________________ + +## Contribution Types + +We are always looking for help to implement new features or fixing bugs. + +A lot of good work has already been done in project mechanics (\_requirements/base.txt, setup.py, pep8, badges, ci, etc...) so we're in a good state there thanks to all sooner contributors! + +### Bug Fixes: + +1. If you find a bug please submit a GitHub issue. Make sure the title explains the issue. +1. Try to fix it or recommend a solution. +1. Submit a PR! + +_**Note**, even if you do not find the solution, sending a PR with a test covering the issue is a valid contribution, and we can help you or finish it with you :\]_ + +### New Models: + +PyTorch Lightning Tutorials shows several research models for ready usage. Following are general guidelines for adding new models. + +1. Workflows which are standard baselines +1. 
Whose results are reproduced properly either by us or by authors. +1. Do not reinvent the wheel, natively support torchvision, torchtext, torchaudio models. +1. Use open source licensed models. + +Please raise an issue before adding a new tutorial. There are tons of models that keep coming. It is very difficult to support every piece. + +______________________________________________________________________ + +## Guidelines + +For this section, we refer you to the [parent PL guidelines](https://pytorch-lightning.readthedocs.io/en/stable/CONTRIBUTING.html) + +**Reminder** + +All added or edited code shall be the original work of the particular contributor. +If you use some third-party implementation, all such blocks/functions/modules shall be properly referenced and, if possible, also agreed to by the code's author. For example - `This code is inspired from http://...`. +In case you are adding new dependencies, make sure that they are compatible with the actual PyTorch Lightning license (each particular tutorial can have its own license). + +### Question & Answer + +1. **How can I help/contribute?** + + All help is extremely welcome - reporting bugs, fixing documentation, etc. To solve some issues you can start with label [good first issue](https://github.com/Lightning-AI/lightning-bolts/issues?q=is%3Aissue+is%3Aopen+label%3A%22good+first+issue%22) or choose something close to your domain with label. Before you start to implement anything, check that the issue description is clear and self-assign the task to you (if it is not possible, just comment that you take it, and we assign it to you...). + +1. **Is there a recommendation for branch names?** + + We do not rely on the name convention as long as you are working with your own fork. Anyway it would be nice to follow this convention `/_` where the types are: `bugfix`, `ipynb`, `docs`, ... + +1. 
**I have a model in other framework than PyTorch, how do I add it here?** + + Since PL Tutorials are aiming at Pytorch Lightning implementations we encourage staying with it. diff --git a/_notebooks/.github/ISSUE_TEMPLATE/bug_report.md b/_notebooks/.github/ISSUE_TEMPLATE/bug_report.md new file mode 100644 index 0000000..fd7a397 --- /dev/null +++ b/_notebooks/.github/ISSUE_TEMPLATE/bug_report.md @@ -0,0 +1,28 @@ +--- +name: Bug report +about: Create a report to help us improve +title: '' +labels: bug / fix, help wanted +assignees: '' +--- + +## 🐛 Bug + + + +### To Reproduce + +Steps to reproduce the behavior: + +1. Run '....' +1. See error + + + +### Expected behavior + + + +### Additional context + + diff --git a/_notebooks/.github/ISSUE_TEMPLATE/config.yml b/_notebooks/.github/ISSUE_TEMPLATE/config.yml new file mode 100644 index 0000000..c52bf19 --- /dev/null +++ b/_notebooks/.github/ISSUE_TEMPLATE/config.yml @@ -0,0 +1,8 @@ +blank_issues_enabled: false +contact_links: + - name: Ask a Question + url: https://github.com/Lightning-AI/tutorials/discussions/new + about: Ask and answer Lightning related questions + - name: 💬 Slack + url: https://app.slack.com/client/TR9DVT48M/CQXV8BRH9/thread/CQXV8BRH9-1591382895.254600 + about: Chat with our community diff --git a/_notebooks/.github/ISSUE_TEMPLATE/feature_request.md b/_notebooks/.github/ISSUE_TEMPLATE/feature_request.md new file mode 100644 index 0000000..11378b2 --- /dev/null +++ b/_notebooks/.github/ISSUE_TEMPLATE/feature_request.md @@ -0,0 +1,25 @@ +--- +name: Feature request +about: Suggest an idea for this project +title: '' +labels: enhancement +assignees: '' +--- + +## 🚀 Feature + +### Motivation + + + +### Pitch + + + +### Alternatives + + + +### Additional context + + diff --git a/_notebooks/.github/PULL_REQUEST_TEMPLATE.md b/_notebooks/.github/PULL_REQUEST_TEMPLATE.md new file mode 100644 index 0000000..429d86a --- /dev/null +++ b/_notebooks/.github/PULL_REQUEST_TEMPLATE.md @@ -0,0 +1,18 @@ +## Before 
submitting + +- [ ] Was this **discussed/approved** via a GitHub issue? (no need for typos and docs improvements) +- [ ] Did you make sure to **update the docs**? +- [ ] Did you write any new **necessary tests**? + +## What does this PR do? + +Fixes # (issue) + +## PR review + +Anyone in the community is free to review the PR once the tests have passed. +If we didn't discuss your PR in GitHub issues there's a high chance it will not be merged. + +## Did you have fun? + +Make sure you had fun coding 🙃 diff --git a/_notebooks/.github/dependabot.yml b/_notebooks/.github/dependabot.yml new file mode 100644 index 0000000..a01cfc7 --- /dev/null +++ b/_notebooks/.github/dependabot.yml @@ -0,0 +1,30 @@ +# https://docs.github.com/en/code-security/dependabot/dependabot-version-updates/configuration-options-for-the-dependabot.yml-file +version: 2 +updates: + # Enable version updates for python + - package-ecosystem: "pip" + # Look for requirement files in the `/_requirements` directory + directory: "/_requirements" + # Check for updates once a month + schedule: + interval: "monthly" + # Labels on pull requests for version updates only + labels: ["ci/cd"] + pull-request-branch-name: + # Separate sections of the branch name with a hyphen + separator: "-" + # Allow up to 5 open pull requests for pip dependencies + open-pull-requests-limit: 5 + reviewers: + - "Lightning-AI/teams/core-lightning" + + - package-ecosystem: "github-actions" + directory: "/" + schedule: + interval: "monthly" + labels: ["ci/cd"] + pull-request-branch-name: + separator: "-" + open-pull-requests-limit: 5 + reviewers: + - "Lightning-AI/core-lightning" diff --git a/_notebooks/.github/labeler.yml b/_notebooks/.github/labeler.yml new file mode 100644 index 0000000..621b7e0 --- /dev/null +++ b/_notebooks/.github/labeler.yml @@ -0,0 +1,7 @@ +documentation: + - _docs/**/* + +CI/CD: + - .actions/**/* + - .azure-*/**/* + - .github/**/* diff --git a/_notebooks/.github/mergify.yml b/_notebooks/.github/mergify.yml new file mode
100644 index 0000000..06f25ec --- /dev/null +++ b/_notebooks/.github/mergify.yml @@ -0,0 +1,32 @@ +pull_request_rules: + + - name: warn on conflicts + conditions: + - conflict + - -draft # filter-out GH draft PRs + - -label="has conflicts" + actions: + # comment: + # message: This pull request is now in conflict... :( + label: + add: [ "has conflicts" ] + + - name: resolved conflicts + conditions: + - -conflict + - label="has conflicts" + - -draft # filter-out GH draft PRs + - -merged # not merged yet + - -closed + actions: + label: + remove: [ "has conflicts" ] + + - name: add core reviewer + conditions: + # number of review approvals + - "#approved-reviews-by<2" + actions: + request_reviews: + users: + - Borda diff --git a/_notebooks/.github/stale.yml b/_notebooks/.github/stale.yml new file mode 100644 index 0000000..8dd7aca --- /dev/null +++ b/_notebooks/.github/stale.yml @@ -0,0 +1,26 @@ +# https://github.com/marketplace/stale + +# Number of days of inactivity before an issue becomes stale +daysUntilStale: 60 +# Number of days of inactivity before a stale issue is closed +daysUntilClose: 14 +# Issues with these labels will never be considered stale +exemptLabels: + - pinned + - security +# Label to use when marking an issue as stale +staleLabel: won't fix +# Comment to post when marking an issue as stale. Set to `false` to disable +markComment: > + This issue has been automatically marked as stale because it has not had + recent activity. It will be closed if no further activity occurs. Thank you + for your contributions. +# Comment to post when closing a stale issue. 
Set to `false` to disable +closeComment: false + +# Set to true to ignore issues in a project (defaults to false) +exemptProjects: true +# Set to true to ignore issues in a milestone (defaults to false) +exemptMilestones: true +# Set to true to ignore issues with an assignee (defaults to false) +exemptAssignees: true diff --git a/_notebooks/.github/workflows/ci_block-ipybn.yml b/_notebooks/.github/workflows/ci_block-ipybn.yml new file mode 100644 index 0000000..cde61ec --- /dev/null +++ b/_notebooks/.github/workflows/ci_block-ipybn.yml @@ -0,0 +1,13 @@ +name: Prevent adding/chnaging notebooks + +# see: https://help.github.com/en/actions/reference/events-that-trigger-workflows +on: # Trigger the workflow on PR to master + pull_request: + paths: + - ./**/*.ipynb + +jobs: + block-ipynb: + runs-on: ubuntu-latest + steps: + - run: exit 1 diff --git a/_notebooks/.github/workflows/ci_block-pub.yml b/_notebooks/.github/workflows/ci_block-pub.yml new file mode 100644 index 0000000..e0a2e81 --- /dev/null +++ b/_notebooks/.github/workflows/ci_block-pub.yml @@ -0,0 +1,12 @@ +name: Prevent modify publication + +# see: https://help.github.com/en/actions/reference/events-that-trigger-workflows +on: # Trigger the workflow on PR to master + pull_request: + branches: [publication] + +jobs: + block-ipynb: + runs-on: ubuntu-latest + steps: + - run: exit 1 diff --git a/_notebooks/.github/workflows/ci_checks.yml b/_notebooks/.github/workflows/ci_checks.yml new file mode 100644 index 0000000..99d3c0c --- /dev/null +++ b/_notebooks/.github/workflows/ci_checks.yml @@ -0,0 +1,18 @@ +name: General checks + +on: + push: + branches: + - "*" + - "**" + - "!publication" + pull_request: {} + +concurrency: + group: ${{ github.workflow }}-${{ github.ref }}-${{ github.head_ref }} + cancel-in-progress: ${{ ! 
(github.ref == 'refs/heads/master' || startsWith(github.ref, 'refs/heads/release/')) }} + +jobs: + + check-schema: + uses: Lightning-AI/utilities/.github/workflows/check-schema.yml@v0.7.1 diff --git a/_notebooks/.github/workflows/ci_docs.yml b/_notebooks/.github/workflows/ci_docs.yml new file mode 100644 index 0000000..7902d98 --- /dev/null +++ b/_notebooks/.github/workflows/ci_docs.yml @@ -0,0 +1,116 @@ +name: validate Docs + +on: # Trigger the workflow on push or pull request +# push: +# branches: [main] + pull_request: {} + schedule: + # At the end of every day + - cron: "0 0 * * *" + +concurrency: + group: ${{ github.workflow }}-${{ github.head_ref }} + cancel-in-progress: true + +jobs: + build-docs: + runs-on: ubuntu-latest + env: + PUB_BRANCH: publication + PATH_DATASETS: ${{ github.workspace }}/.datasets + timeout-minutes: 20 + steps: + - name: Checkout 🛎️ + uses: actions/checkout@v3 + with: + fetch-depth: 0 # fetch all history for all branches and tags + - uses: actions/setup-python@v4 + with: + python-version: 3.8 + + - name: Cache pip + uses: actions/cache@v3 + with: + path: ~/.cache/pip + key: pip-${{ hashFiles('requirements.txt') }}-${{ hashFiles('_requirements/docs.txt') }} + restore-keys: pip- + + - name: Install dependencies + run: | + sudo apt-get update --fix-missing + sudo apt-get install -y tree + # install Texlive, see https://linuxconfig.org/how-to-install-latex-on-ubuntu-20-04-focal-fossa-linux + sudo apt-get install -y cmake pandoc texlive-latex-extra dvipng texlive-pictures + pip --version + pip install -q -r requirements.txt -r _requirements/docs.txt + pip list + shell: bash + + - name: Process folders + run: | + mkdir -p ${PATH_DATASETS} + head=$(git rev-parse origin/"${{ github.base_ref }}") + git diff --name-only $head --output=master-diff.txt + python .actions/assistant.py group-folders master-diff.txt + printf "Changed folders:\n" + cat changed-folders.txt + shell: bash + + - name: ">> output" + id: changed + run: python -c "lines = 
open('changed-folders.txt').readlines(); print(f'::set-output name=nb_dirs::{len(lines)}')" + + - uses: oleksiyrudenko/gha-git-credentials@v2.1 + with: + token: '${{ secrets.GITHUB_TOKEN }}' + global: true + - name: Sync to pub + run: git merge -s resolve origin/$PUB_BRANCH + + - name: Generate notebooks + if: steps.changed.outputs.nb_dirs != 0 + run: | + while IFS= read -r line; do + python .actions/assistant.py convert-ipynb $line + python .actions/assistant.py bash-render $line + cat .actions/_ipynb-render.sh + bash .actions/_ipynb-render.sh + done <<< $(cat changed-folders.txt) + env: + DRY_RUN: 1 + shell: bash + + - name: Copy notebooks + if: steps.changed.outputs.nb_dirs != 0 + run: | + while IFS= read -r line; do + dir=$(dirname $line) + mkdir -p changed-notebooks/${dir} + cp .notebooks/${line}.ipynb changed-notebooks/${dir}/ + done <<< $(cat changed-folders.txt) + tree changed-notebooks + shell: bash + + - uses: actions/upload-artifact@v3 + if: steps.changed.outputs.nb_dirs != 0 + with: + name: notebooks-${{ github.sha }} + path: changed-notebooks/ + + - name: Make Documentation + working-directory: ./_docs + run: make html --debug SPHINXOPTS="-W --keep-going" + + - name: Check External Links (Optional) + working-directory: ./_docs + run: make --jobs $(nproc) linkcheck + # ToDO: comment on PR if any link failed + continue-on-error: true + + - name: Upload built docs + uses: actions/upload-artifact@v3 + with: + name: docs-html-${{ github.sha }} + path: _docs/build/html/ + # Use always() to always run this step to publish test results when there are test failures + if: success() diff --git a/_notebooks/.github/workflows/ci_test-acts.yml b/_notebooks/.github/workflows/ci_test-acts.yml new file mode 100644 index 0000000..7f1d99a --- /dev/null +++ b/_notebooks/.github/workflows/ci_test-acts.yml @@ -0,0 +1,84 @@ +name: CI internal + +# see: https://help.github.com/en/actions/reference/events-that-trigger-workflows +on: # Trigger the workflow on push or pull 
request, but only for the main branch + push: {} + pull_request: + branches: [main] + +defaults: + run: + shell: bash + +jobs: + pytest-internal: + + runs-on: ${{ matrix.os }} + strategy: + fail-fast: false + matrix: + os: [ubuntu-20.04 ] + python-version: ["3.8", "3.10"] + # Timeout: https://stackoverflow.com/a/59076067/4521646 + timeout-minutes: 15 + + steps: + - uses: actions/checkout@v3 + with: + fetch-depth: 0 # fetch all history for all branches and tags + - name: Set up Python ${{ matrix.python-version }} + uses: actions/setup-python@v4 + with: + python-version: ${{ matrix.python-version }} + + # Note: This uses an internal pip API and may not always work + # https://github.com/actions/cache/blob/master/examples.md#multiple-oss-in-a-workflow + - name: Get pip cache dir + id: pip-cache + run: echo "::set-output name=dir::$(pip cache dir)" + + - name: pip cache + uses: actions/cache@v3 + with: + path: ${{ steps.pip-cache.outputs.dir }} + key: ${{ runner.os }}-pip-py${{ matrix.python-version }}-${{ hashFiles('.actions/requires.txt') }}-${{ hashFiles('requirements/default.txt') }} + restore-keys: ${{ runner.os }}-pip-py${{ matrix.python-version }}- + + - name: Install requirements + run: | + pip --version + pip install -q -r .actions/requires.txt + pip install -q "pytest==6.*" coverage jupytext + # this is needed to be able to run package version parsing test + pip install -q matplotlib -r _requirements/default.txt --find-links https://download.pytorch.org/whl/cpu/torch_stable.html + + - name: Prepare dummy inputs + run: | + jupytext --set-formats ipynb,py:percent templates/simple/template.py + jupytext --set-formats ipynb,py:percent templates/titanic/tutorial.py + # mv templates/simple/template.ipynb templates/simple.ipynb + git diff --name-only HEAD~3 > master-diff.txt + python .actions/assistant.py list_dirs "" > dirs-b1.txt + python .actions/assistant.py list_dirs --include_file_ext=".ipynb" > dirs-b2.txt + + - name: Testing + run: | + coverage run -m pytest 
.actions -v + + - name: Statistics + if: success() + run: | + coverage report + coverage xml + + - name: Upload coverage to Codecov + uses: codecov/codecov-action@v3 + if: always() + # see: https://github.com/actions/toolkit/issues/399 + continue-on-error: true + with: + token: ${{ secrets.CODECOV_TOKEN }} + file: coverage.xml + flags: pytest,${{ runner.os }} + name: CLI-coverage + fail_ci_if_error: false diff --git a/_notebooks/.github/workflows/docs-deploy.yml b/_notebooks/.github/workflows/docs-deploy.yml new file mode 100644 index 0000000..d132912 --- /dev/null +++ b/_notebooks/.github/workflows/docs-deploy.yml @@ -0,0 +1,58 @@ +name: Deploy Docs +on: + push: + branches: [publication] + workflow_dispatch: {} + workflow_run: + workflows: ["Publish notebook"] + types: + - completed + +jobs: + # https://github.com/marketplace/actions/deploy-to-github-pages + build-docs-deploy: + runs-on: ubuntu-20.04 + env: + PATH_DATASETS: ${{ github.workspace }}/.datasets + steps: + - name: Checkout 🛎️ + uses: actions/checkout@v3 + with: + ref: publication + - uses: actions/setup-python@v4 + with: + python-version: 3.8 + + - name: Cache pip + uses: actions/cache@v3 + with: + path: ~/.cache/pip + key: ${{ runner.os }}-pip-${{ hashFiles('requirements.txt') }}-${{ hashFiles('_requirements/docs.txt') }} + restore-keys: ${{ runner.os }}-pip- + + - name: Install dependencies + run: | + mkdir -p ${PATH_DATASETS} + # install Texlive, see https://linuxconfig.org/how-to-install-latex-on-ubuntu-20-04-focal-fossa-linux + sudo apt-get update + sudo apt-get install -y cmake pandoc + sudo apt-get install -y texlive-latex-extra dvipng texlive-pictures + pip --version + pip install --quiet --requirement _requirements/docs.txt + pip list + shell: bash + + - name: Make Documentation + working-directory: ./_docs + run: make html --jobs $(nproc) + + - name: Deploy 🚀 + uses: JamesIves/github-pages-deploy-action@v4.4.1 + with: + token: ${{ secrets.GITHUB_TOKEN }} + branch: gh-pages # The branch the 
action should deploy to. + folder: _docs/build/html # The folder the action should deploy. + clean: true # Automatically remove deleted files from the deploy branch + target-folder: docs # If you'd like to push the contents of the deployment folder into a specific directory + single-commit: true # you'd prefer to have a single commit on the deployment branch instead of full history + if: success() diff --git a/_notebooks/.gitignore b/_notebooks/.gitignore new file mode 100644 index 0000000..df8737c --- /dev/null +++ b/_notebooks/.gitignore @@ -0,0 +1,137 @@ +# Byte-compiled / optimized / DLL files +__pycache__/ +*.py[cod] +*$py.class + +# C extensions +*.so + +# Distribution / packaging +.Python +build/ +develop-eggs/ +dist/ +downloads/ +eggs/ +.eggs/ +lib/ +lib64/ +parts/ +sdist/ +var/ +wheels/ +pip-wheel-metadata/ +share/python-wheels/ +*.egg-info/ +.installed.cfg +*.egg +MANIFEST + +# PyInstaller +# Usually these files are written by a python script from a template +# before PyInstaller builds the exe, so as to inject date/other infos into it. +*.manifest +*.spec + +# Installer logs +pip-log.txt +pip-delete-this-directory.txt + +# Unit test / coverage reports +htmlcov/ +.tox/ +.nox/ +.coverage +.coverage.* +.cache +nosetests.xml +coverage.xml +*.cover +*.py,cover +.hypothesis/ +.pytest_cache/ + +# Translations +*.mo +*.pot + +# Django stuff: +*.log +local_settings.py +db.sqlite3 +db.sqlite3-journal + +# Flask stuff: +instance/ +.webassets-cache + +# Scrapy stuff: +.scrapy + +# Sphinx documentation +_docs/_build/ + +# PyBuilder +target/ + +# Jupyter Notebook +.ipynb_checkpoints + +# IPython +profile_default/ +ipython_config.py + +# pyenv +.python-version + +# pipenv +# According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control. 
+# However, in case of collaboration, if having platform-specific dependencies or dependencies +# having no cross-platform support, pipenv may install dependencies that don't work, or not +# install all needed dependencies. +#Pipfile.lock + +# PEP 582; used by e.g. github.com/David-OConnor/pyflow +__pypackages__/ + +# Celery stuff +celerybeat-schedule +celerybeat.pid + +# SageMath parsed files +*.sage.py + +# Environments +.env +.venv +env/ +venv/ +ENV/ +env.bak/ +venv.bak/ + +# Spyder project settings +.spyderproject +.spyproject + +# Rope project settings +.ropeproject + +# mkdocs documentation +/site + +# mypy +.mypy_cache/ +.dmypy.json +dmypy.json + +# Pyre type checker +.pyre/ + +.idea/ + +# data artifacts +logs/ +lightning_logs/ +cifar-10-batches-py +*.tar.gz diff --git a/_notebooks/.jupytext.yml b/_notebooks/.jupytext.yml new file mode 100644 index 0000000..fa534dd --- /dev/null +++ b/_notebooks/.jupytext.yml @@ -0,0 +1,4 @@ +# todo: this seems to have no effect atm + +# Always pair ipynb notebooks to py:percent files +formats: ipynb,py:percent diff --git a/_notebooks/.pre-commit-config.yaml b/_notebooks/.pre-commit-config.yaml new file mode 100644 index 0000000..c65cb64 --- /dev/null +++ b/_notebooks/.pre-commit-config.yaml @@ -0,0 +1,66 @@ +default_language_version: + python: python3.8 + +ci: + autofix_prs: true + autoupdate_commit_msg: '[pre-commit.ci] pre-commit suggestions' + autoupdate_schedule: quarterly + # submodules: true + +repos: + - repo: https://github.com/pre-commit/pre-commit-hooks + rev: v4.4.0 + hooks: + - id: end-of-file-fixer + - id: trailing-whitespace + - id: check-case-conflict + - id: check-json + - id: check-yaml + - id: check-toml + - id: check-added-large-files + args: ['--maxkb=250', '--enforce-all'] + - id: check-docstring-first + - id: detect-private-key + + - repo: https://github.com/asottile/pyupgrade + rev: v3.3.1 + hooks: + - id: pyupgrade + args: [--py37-plus] + name: Upgrade code + + - repo: 
https://github.com/PyCQA/docformatter + rev: v1.5.1 + hooks: + - id: docformatter + args: [--in-place, --wrap-summaries=115, --wrap-descriptions=120] + + - repo: https://github.com/PyCQA/isort + rev: 5.12.0 + hooks: + - id: isort + + - repo: https://github.com/psf/black + rev: 22.12.0 + hooks: + - id: black + name: Format code + + - repo: https://github.com/asottile/yesqa + rev: v1.4.0 + hooks: + - id: yesqa + + - repo: https://github.com/executablebooks/mdformat + rev: 0.7.16 + hooks: + - id: mdformat + additional_dependencies: + - mdformat-gfm + - mdformat-black + - mdformat_frontmatter + + - repo: https://github.com/PyCQA/flake8 + rev: 6.0.0 + hooks: + - id: flake8 diff --git a/_notebooks/LICENSE b/_notebooks/LICENSE new file mode 100644 index 0000000..261eeb9 --- /dev/null +++ b/_notebooks/LICENSE @@ -0,0 +1,201 @@ + Apache License + Version 2.0, January 2004 + http://www.apache.org/licenses/ + + TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION + + 1. Definitions. + + "License" shall mean the terms and conditions for use, reproduction, + and distribution as defined by Sections 1 through 9 of this document. + + "Licensor" shall mean the copyright owner or entity authorized by + the copyright owner that is granting the License. + + "Legal Entity" shall mean the union of the acting entity and all + other entities that control, are controlled by, or are under common + control with that entity. For the purposes of this definition, + "control" means (i) the power, direct or indirect, to cause the + direction or management of such entity, whether by contract or + otherwise, or (ii) ownership of fifty percent (50%) or more of the + outstanding shares, or (iii) beneficial ownership of such entity. + + "You" (or "Your") shall mean an individual or Legal Entity + exercising permissions granted by this License. 
+ + "Source" form shall mean the preferred form for making modifications, + including but not limited to software source code, documentation + source, and configuration files. + + "Object" form shall mean any form resulting from mechanical + transformation or translation of a Source form, including but + not limited to compiled object code, generated documentation, + and conversions to other media types. + + "Work" shall mean the work of authorship, whether in Source or + Object form, made available under the License, as indicated by a + copyright notice that is included in or attached to the work + (an example is provided in the Appendix below). + + "Derivative Works" shall mean any work, whether in Source or Object + form, that is based on (or derived from) the Work and for which the + editorial revisions, annotations, elaborations, or other modifications + represent, as a whole, an original work of authorship. For the purposes + of this License, Derivative Works shall not include works that remain + separable from, or merely link (or bind by name) to the interfaces of, + the Work and Derivative Works thereof. + + "Contribution" shall mean any work of authorship, including + the original version of the Work and any modifications or additions + to that Work or Derivative Works thereof, that is intentionally + submitted to Licensor for inclusion in the Work by the copyright owner + or by an individual or Legal Entity authorized to submit on behalf of + the copyright owner. 
For the purposes of this definition, "submitted" + means any form of electronic, verbal, or written communication sent + to the Licensor or its representatives, including but not limited to + communication on electronic mailing lists, source code control systems, + and issue tracking systems that are managed by, or on behalf of, the + Licensor for the purpose of discussing and improving the Work, but + excluding communication that is conspicuously marked or otherwise + designated in writing by the copyright owner as "Not a Contribution." + + "Contributor" shall mean Licensor and any individual or Legal Entity + on behalf of whom a Contribution has been received by Licensor and + subsequently incorporated within the Work. + + 2. Grant of Copyright License. Subject to the terms and conditions of + this License, each Contributor hereby grants to You a perpetual, + worldwide, non-exclusive, no-charge, royalty-free, irrevocable + copyright license to reproduce, prepare Derivative Works of, + publicly display, publicly perform, sublicense, and distribute the + Work and such Derivative Works in Source or Object form. + + 3. Grant of Patent License. Subject to the terms and conditions of + this License, each Contributor hereby grants to You a perpetual, + worldwide, non-exclusive, no-charge, royalty-free, irrevocable + (except as stated in this section) patent license to make, have made, + use, offer to sell, sell, import, and otherwise transfer the Work, + where such license applies only to those patent claims licensable + by such Contributor that are necessarily infringed by their + Contribution(s) alone or by combination of their Contribution(s) + with the Work to which such Contribution(s) was submitted. 
If You + institute patent litigation against any entity (including a + cross-claim or counterclaim in a lawsuit) alleging that the Work + or a Contribution incorporated within the Work constitutes direct + or contributory patent infringement, then any patent licenses + granted to You under this License for that Work shall terminate + as of the date such litigation is filed. + + 4. Redistribution. You may reproduce and distribute copies of the + Work or Derivative Works thereof in any medium, with or without + modifications, and in Source or Object form, provided that You + meet the following conditions: + + (a) You must give any other recipients of the Work or + Derivative Works a copy of this License; and + + (b) You must cause any modified files to carry prominent notices + stating that You changed the files; and + + (c) You must retain, in the Source form of any Derivative Works + that You distribute, all copyright, patent, trademark, and + attribution notices from the Source form of the Work, + excluding those notices that do not pertain to any part of + the Derivative Works; and + + (d) If the Work includes a "NOTICE" text file as part of its + distribution, then any Derivative Works that You distribute must + include a readable copy of the attribution notices contained + within such NOTICE file, excluding those notices that do not + pertain to any part of the Derivative Works, in at least one + of the following places: within a NOTICE text file distributed + as part of the Derivative Works; within the Source form or + documentation, if provided along with the Derivative Works; or, + within a display generated by the Derivative Works, if and + wherever such third-party notices normally appear. The contents + of the NOTICE file are for informational purposes only and + do not modify the License. 
You may add Your own attribution + notices within Derivative Works that You distribute, alongside + or as an addendum to the NOTICE text from the Work, provided + that such additional attribution notices cannot be construed + as modifying the License. + + You may add Your own copyright statement to Your modifications and + may provide additional or different license terms and conditions + for use, reproduction, or distribution of Your modifications, or + for any such Derivative Works as a whole, provided Your use, + reproduction, and distribution of the Work otherwise complies with + the conditions stated in this License. + + 5. Submission of Contributions. Unless You explicitly state otherwise, + any Contribution intentionally submitted for inclusion in the Work + by You to the Licensor shall be under the terms and conditions of + this License, without any additional terms or conditions. + Notwithstanding the above, nothing herein shall supersede or modify + the terms of any separate license agreement you may have executed + with Licensor regarding such Contributions. + + 6. Trademarks. This License does not grant permission to use the trade + names, trademarks, service marks, or product names of the Licensor, + except as required for reasonable and customary use in describing the + origin of the Work and reproducing the content of the NOTICE file. + + 7. Disclaimer of Warranty. Unless required by applicable law or + agreed to in writing, Licensor provides the Work (and each + Contributor provides its Contributions) on an "AS IS" BASIS, + WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or + implied, including, without limitation, any warranties or conditions + of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A + PARTICULAR PURPOSE. You are solely responsible for determining the + appropriateness of using or redistributing the Work and assume any + risks associated with Your exercise of permissions under this License. + + 8. 
Limitation of Liability. In no event and under no legal theory, + whether in tort (including negligence), contract, or otherwise, + unless required by applicable law (such as deliberate and grossly + negligent acts) or agreed to in writing, shall any Contributor be + liable to You for damages, including any direct, indirect, special, + incidental, or consequential damages of any character arising as a + result of this License or out of the use or inability to use the + Work (including but not limited to damages for loss of goodwill, + work stoppage, computer failure or malfunction, or any and all + other commercial damages or losses), even if such Contributor + has been advised of the possibility of such damages. + + 9. Accepting Warranty or Additional Liability. While redistributing + the Work or Derivative Works thereof, You may choose to offer, + and charge a fee for, acceptance of support, warranty, indemnity, + or other liability obligations and/or rights consistent with this + License. However, in accepting such obligations, You may act only + on Your own behalf and on Your sole responsibility, not on behalf + of any other Contributor, and only if You agree to indemnify, + defend, and hold each Contributor harmless for any liability + incurred by, or claims asserted against, such Contributor by reason + of your accepting any such warranty or additional liability. + + END OF TERMS AND CONDITIONS + + APPENDIX: How to apply the Apache License to your work. + + To apply the Apache License to your work, attach the following + boilerplate notice, with the fields enclosed by brackets "[]" + replaced with your own identifying information. (Don't include + the brackets!) The text should be enclosed in the appropriate + comment syntax for the file format. We also recommend that a + file or class name and description of purpose be included on the + same "printed page" as the copyright notice for easier + identification within third-party archives. 
+ + Copyright [yyyy] [name of copyright owner] + + Licensed under the Apache License, Version 2.0 (the "License"); + you may not use this file except in compliance with the License. + You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + + Unless required by applicable law or agreed to in writing, software + distributed under the License is distributed on an "AS IS" BASIS, + WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + See the License for the specific language governing permissions and + limitations under the License. diff --git a/_notebooks/Makefile b/_notebooks/Makefile new file mode 100644 index 0000000..764c44a --- /dev/null +++ b/_notebooks/Makefile @@ -0,0 +1,39 @@ +.PHONY: ipynb clean docs + +# META := $(wildcard **/.meta.yml) +META := $(shell find -regex ".*/.meta.y[a]?ml") +IPYNB := $(META:%/.meta.yml=%.ipynb) +IPYNB := $(IPYNB:%/.meta.yaml=%.ipynb) +export PATH_DATASETS=$(PWD)/.datasets + +init: + @echo $(PATH_DATASETS) + mkdir -p $(PATH_DATASETS) + +ipynb: init ${IPYNB} +# @echo $< + +%.ipynb: %/.meta.y*ml + @echo $< + python .actions/assistant.py convert-ipynb $(shell dirname $<) + python .actions/assistant.py bash-render $(shell dirname $<) + bash .actions/_ipynb-render.sh + +docs: clean + pip install --quiet -r _requirements/docs.txt + python -m sphinx -b html -W --keep-going _docs/source _docs/build + +clean: + rm -rf ./.datasets + # clean all temp runs + rm -rf ./_docs/build + rm -rf ./_docs/source/notebooks + rm -rf ./_docs/source/api + rm -f ./dirs-*.txt + rm -f ./*-folders.txt + rm -f ./*/**/*.ipynb + rm -rf ./*/**/.ipynb_checkpoints + rm -rf ./*/**/venv + rm -rf ./*/**/logs + rm -rf ./*/**/lightning_logs + rm -f ./*/**/requirements.txt diff --git a/_notebooks/README.md b/_notebooks/README.md new file mode 100644 index 0000000..5d8baa4 --- /dev/null +++ b/_notebooks/README.md @@ -0,0 +1,99 @@ +# PytorchLightning Tutorials + +[![CI 
internal](https://github.com/Lightning-AI/tutorials/actions/workflows/ci_test-acts.yml/badge.svg?event=push)](https://github.com/Lightning-AI/tutorials/actions/workflows/ci_test-acts.yml) +[![Build Status](https://dev.azure.com/Lightning-AI/Tutorials/_apis/build/status/Lightning-AI.tutorials%20%5Bpublish%5D?branchName=main)](https://dev.azure.com/Lightning-AI/Tutorials/_build/latest?definitionId=29&branchName=main) +[![codecov](https://codecov.io/gh/Lightning-AI/tutorials/branch/main/graph/badge.svg?token=C6T3XOOR56)](https://codecov.io/gh/Lightning-AI/tutorials) +[![Deploy Docs](https://github.com/Lightning-AI/tutorials/actions/workflows/docs-deploy.yml/badge.svg)](https://github.com/Lightning-AI/tutorials/actions/workflows/docs-deploy.yml) +[![pre-commit.ci status](https://results.pre-commit.ci/badge/github/Lightning-AI/tutorials/main.svg)](https://results.pre-commit.ci/latest/github/Lightning-AI/tutorials/main) + +This is the Lightning Library - a collection of Lightning related notebooks which are pulled back to the main repo as a submodule and rendered inside the main documentation. +The key features/highlights: + +- we keep the repo **lightweight** - notebooks are stored in rich script format +- all scripts/notebooks are tested to be **fully executable** +- fully **reproducible** by saving runtime env. details + +For more details read our blogpost - [Best Practices for Publishing PyTorch Lightning Tutorial Notebooks](https://devblog.pytorchlightning.ai/publishing-lightning-tutorials-cbea3eaa4b2c) + +## Adding/Editing notebooks + +The main branch of this repo contains only python scripts with markdown extensions, and notebooks are generated in a special publication branch, so no raw notebooks are accepted as PRs.
+On the other hand we highly recommend creating a notebook and converting it to a script with [jupytext](https://jupytext.readthedocs.io/en/latest/) as + +```bash +jupytext --set-formats ipynb,py:percent my-notebook.ipynb +``` + +### Contribution structure + +The addition has to be formed as a new folder + +- the folder name is used for the future notebooks +- single python scripts with converted notebooks (name does not matter) +- metadata named `.meta.yaml` including following info: + ```yaml + title: Sample notebooks + author: [User](contact) + created: YYYY-MM-DD + updated: YYYY-MM-DD + license: CC BY-SA + # multi-line + description: | + This notebook will walk you through ... + requirements: + - package # with version if needed + # define supported - CPU|GPU|TPU + accelerator: + - CPU + ``` + +### Using datasets + +It is quite common to use some public or competition's dataset for your example. +We facilitate this via defining the data sources in the metafile. +There are two basic options, download a file from the web or pull a Kaggle dataset: + +```yaml +datasets: + web: + - https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz + kaggle: + - titanic +``` + +In both cases, the downloaded archive (Kaggle dataset is originally downloaded as zip file) is extracted to the default dataset folder under sub-folder with the same name as the downloaded file. +To get path to this dataset folder, please use environment variable `PATH_DATASETS`, so in your script use: + +```py +import os + +data_path = os.environ.get("PATH_DATASETS", "_datasets") +path_titanic = os.path.join(data_path, "titanic") +``` + +**Warning:** some Kaggle datasets can be quite large and the process is - downloading and extracting, which means that particular runner needs to have double free space. For this reason, the CPU runner is limited to 3GB datasets.
+ +### Suggestions + +- For inserting images into text cells use MarkDown formatting, so we can insert inline images to the notebooks directly and drop eventual dependency on internet connection -> generated notebooks could be better shared offline +- If your images need special sizes, use `![Cation](my-image.png){height="60px" width="240px"}` +- If your notebook is computational or any other resource (CPU/RAM) demanding use only GPU accelerator option in meta config + +### Known limitations + +- Nothing major at this moment + +## Meantime notes + +On the back side of publishing workflow you can find in principle these three steps + +```bash +# 1) convert script to notebooks +jupytext --set-formats ipynb,py:percent notebook.py + +# 2) testing the created notebook +pytest -v notebook.ipynb --nbval + +# 3) generating notebooks outputs +papermill in-notebook.ipynb out-notebook.ipynb +``` diff --git a/_notebooks/_docs/.build_docs.sh b/_notebooks/_docs/.build_docs.sh new file mode 100644 index 0000000..0419bd6 --- /dev/null +++ b/_notebooks/_docs/.build_docs.sh @@ -0,0 +1,2 @@ +make clean +make html --debug --jobs $(nproc) diff --git a/_notebooks/_docs/Makefile b/_notebooks/_docs/Makefile new file mode 100644 index 0000000..197a2c7 --- /dev/null +++ b/_notebooks/_docs/Makefile @@ -0,0 +1,19 @@ +# Minimal makefile for Sphinx documentation +# + +# You can set these variables from the command line. +SPHINXOPTS = -W +SPHINXBUILD = python $(shell which sphinx-build) +SOURCEDIR = source +BUILDDIR = build + +# Put it first so that "make" without argument is like "make help". +help: + @$(SPHINXBUILD) -M help "$(SOURCEDIR)" "$(BUILDDIR)" $(SPHINXOPTS) $(O) + +.PHONY: help Makefile + +# Catch-all target: route all unknown targets to Sphinx using the new +# "make mode" option. $(O) is meant as a shortcut for $(SPHINXOPTS). 
+%: Makefile + @$(SPHINXBUILD) -M $@ "$(SOURCEDIR)" "$(BUILDDIR)" $(SPHINXOPTS) $(O) diff --git a/make.bat b/_notebooks/_docs/make.bat similarity index 100% rename from make.bat rename to _notebooks/_docs/make.bat diff --git a/_notebooks/_docs/source/_static/images/icon.svg b/_notebooks/_docs/source/_static/images/icon.svg new file mode 100644 index 0000000..5ab3512 --- /dev/null +++ b/_notebooks/_docs/source/_static/images/icon.svg @@ -0,0 +1,62 @@ + + + + + + image/svg+xml + + + + + + + + + + diff --git a/_notebooks/_docs/source/_static/images/logo.png b/_notebooks/_docs/source/_static/images/logo.png new file mode 100644 index 0000000..a28606b Binary files /dev/null and b/_notebooks/_docs/source/_static/images/logo.png differ diff --git a/docs/_static/images/logo-lightning.svg b/_notebooks/_docs/source/_static/images/logo.svg old mode 100644 new mode 100755 similarity index 100% rename from docs/_static/images/logo-lightning.svg rename to _notebooks/_docs/source/_static/images/logo.svg diff --git a/_notebooks/_docs/source/_templates/theme_variables.jinja b/_notebooks/_docs/source/_templates/theme_variables.jinja new file mode 100644 index 0000000..95adb3e --- /dev/null +++ b/_notebooks/_docs/source/_templates/theme_variables.jinja @@ -0,0 +1,18 @@ +{%- set external_urls = { + 'github': 'https://github.com/Lightning-AI/lightning-sandbox', + 'github_issues': 'https://github.com/Lightning-AI/lightning-sandbox/issues', + 'contributing': 'https://github.com/Lightning-AI/lightning/blob/master/CONTRIBUTING.md', + 'governance': 'https://github.com/Lightning-AI/lightning/blob/master/governance.md', + 'docs': 'https://lightning-sandbox.rtfd.io/en/latest', + 'twitter': 'https://twitter.com/PyTorchLightnin', + 'discuss': 'https://pytorch-lightning.slack.com', + 'tutorials': 'https://pt-lightning-sandbox.readthedocs.io/en/latest/#tutorials', + 'previous_pytorch_versions': 'https://pt-lightning-sandbox.rtfd.io/en/latest/', + 'home': 
'https://pt-lightning-sandbox.rtfd.io/en/latest/', + 'get_started': 'https://pt-lightning-sandbox.readthedocs.io/en/latest/introduction_guide.html', + 'features': 'https://pt-lightning-sandbox.rtfd.io/en/latest/', + 'blog': 'https://www.pytorchlightning.ai/blog', + 'resources': 'https://pt-lightning-sandbox.readthedocs.io/en/latest/#community-examples', + 'support': 'https://pt-lightning-sandbox.rtfd.io/en/latest/', +} +-%} diff --git a/_notebooks/_docs/source/conf.py b/_notebooks/_docs/source/conf.py new file mode 100644 index 0000000..862e46e --- /dev/null +++ b/_notebooks/_docs/source/conf.py @@ -0,0 +1,231 @@ +# +# Configuration file for the Sphinx documentation builder. +# +# This file does only contain a selection of the most common options. For a +# full list see the documentation: +# http://www.sphinx-doc.org/en/master/config + +# -- Path setup -------------------------------------------------------------- + +# If extensions (or modules to document with autodoc) are in another directory, +# add these directories to sys.path here. If the directory is relative to the +# documentation root, use os.path.abspath to make it absolute, like shown here. +import os +import sys + +import pt_lightning_sphinx_theme + +_PATH_HERE = os.path.abspath(os.path.dirname(__file__)) +_PATH_ROOT = os.path.realpath(os.path.join(_PATH_HERE, "..", "..")) +sys.path.insert(0, os.path.abspath(_PATH_ROOT)) +sys.path.append(os.path.join(_PATH_ROOT, ".actions")) + +from assistant import AssistantCLI # noqa: E402 + +# -- Project information ----------------------------------------------------- + +# this name shall match the project name in Github as it is used for linking to code +project = "lightning-tutorials" +author = "PytorchLightning team" +copyright = f"Copyright (c) 2020-2021, {author}." 
+homepage = "https://www.pytorchlightning.ai" + +# # The short X.Y version +# version = about.__version__ +# # The full version, including alpha/beta/rc tags +# release = about.__version__ + +# Options for the linkcode extension +# ---------------------------------- +github_user = "PyTorchLightning" +github_repo = project + +# -- Project documents ------------------------------------------------------- + +AssistantCLI.copy_notebooks(_PATH_ROOT, _PATH_HERE) + +# with open(os.path.join(_PATH_HERE, 'ipynb_content.rst'), 'w') as fp: +# fp.write(os.linesep.join(ipynb_content)) + +# -- General configuration --------------------------------------------------- + +# If your documentation needs a minimal Sphinx version, state it here. + +needs_sphinx = "4.0" + +# Add any Sphinx extension module names here, as strings. They can be +# extensions coming with Sphinx (named 'sphinx.ext.*') or your custom +# ones. +extensions = [ + "sphinx.ext.intersphinx", + "sphinx.ext.todo", + "sphinx.ext.napoleon", + "sphinx.ext.imgmath", + "sphinx.ext.githubpages", + "nbsphinx", + "myst_parser", + "sphinx_paramlinks", + "pt_lightning_sphinx_theme.extensions.lightning", +] + +# Add any paths that contain templates here, relative to this directory. +templates_path = ["_templates"] + +# https://berkeley-stat159-f17.github.io/stat159-f17/lectures/14-sphinx..html#conf.py-(cont.) +# https://stackoverflow.com/questions/38526888/embed-ipython-notebook-in-sphinx-document +# I execute the notebooks manually in advance. If notebooks test the code, +# they should be run at build time. +nbsphinx_execute = "never" +nbsphinx_allow_errors = True +nbsphinx_requirejs_path = "" + +myst_update_mathjax = False + +# The suffix(es) of source filenames. +# You can specify multiple suffix as a list of string: +# +source_parsers = { + ".rst": "restructuredtext", + ".txt": "markdown", + ".md": "markdown", + ".ipynb": "nbsphinx", +} + +# The master toctree document. 
+master_doc = "index" + +# The language for content autogenerated by Sphinx. Refer to documentation +# for a list of supported languages. +# +# This is also used if you do content translation via gettext catalogs. +# Usually you set "language" from the command line for these cases. +language = "ko" + +# List of patterns, relative to source directory, that match files and +# directories to ignore when looking for source files. +# This pattern also affects html_static_path and html_extra_path. +exclude_patterns = [ + "PULL_REQUEST_TEMPLATE.md", + "_build", + "**.ipynb_checkpoints", +] + +# The name of the Pygments (syntax highlighting) style to use. +pygments_style = None + +# -- Options for HTML output ------------------------------------------------- + +# The theme to use for HTML and HTML Help pages. See the documentation for +# a list of builtin themes. +# +html_theme = "pt_lightning_sphinx_theme" +html_theme_path = [pt_lightning_sphinx_theme.get_html_theme_path()] + +# Theme options are theme-specific and customize the look and feel of a theme +# further. For a list of options available for each theme, see the +# documentation. + +html_theme_options = { + "pytorch_project": homepage, + "canonical_url": homepage, + "collapse_navigation": False, + "display_version": True, + "logo_only": False, +} + +html_favicon = "_static/images/icon.svg" + +# Add any paths that contain custom static files (such as style sheets) here, +# relative to this directory. They are copied after the builtin static files, +# so a file named "default.css" will overwrite the builtin "default.css". +html_static_path = ["_templates", "_static"] + +# Custom sidebar templates, must be a dictionary that maps document names +# to template names. +# +# The default sidebars (for documents that don't match any pattern) are +# defined by theme itself. Builtin themes are using these templates by +# default: ``['localtoc.html', 'relations.html', 'sourcelink.html', +# 'searchbox.html']``. 
+# +# html_sidebars = {} + +# -- Options for HTMLHelp output --------------------------------------------- + +# Output file base name for HTML help builder. +htmlhelp_basename = project + "-doc" + +# -- Options for LaTeX output ------------------------------------------------ + +latex_elements = { + # The paper size ('letterpaper' or 'a4paper'). + # 'papersize': 'letterpaper', + # The font size ('10pt', '11pt' or '12pt'). + # 'pointsize': '10pt', + # Additional stuff for the LaTeX preamble. + # 'preamble': '', + # Latex figure (float) alignment + "figure_align": "htbp", +} + +# Grouping the document tree into LaTeX files. List of tuples +# (source start file, target name, title, +# author, documentclass [howto, manual, or own class]). +latex_documents = [ + (master_doc, project + ".tex", project + " Documentation", author, "manual"), +] + +# -- Options for manual page output ------------------------------------------ + +# One entry per manual page. List of tuples +# (source start file, name, description, authors, manual section). +man_pages = [(master_doc, project, project + " Documentation", [author], 1)] + +# -- Options for linkcheck builder ---------------------------------------------- +# regex pattern 0: allow linking to a specific selection state in +# tensorboard.dev links while continuing to validate the base experiment link +linkcheck_anchors_ignore = ["scalars.*&runSelectionState.*"] + +# -- Options for Texinfo output ---------------------------------------------- + +# Grouping the document tree into Texinfo files. List of tuples +# (source start file, target name, title, author, +# dir menu entry, description, category) +texinfo_documents = [ + ( + master_doc, + project, + project + " Documentation", + author, + project, + "" "Miscellaneous", # about.__docs__, + ), +] + +# -- Options for Epub output ------------------------------------------------- + +# Bibliographic Dublin Core info. +epub_title = project + +# The unique identifier of the text. 
This can be an ISBN number
+ +.. toctree:: + :maxdepth: 1 + :name: start + :caption: Start here + :glob: + + notebooks/**/* + +.. raw:: html + +
+ +Indices and tables +================== + +* :ref:`genindex` +* :ref:`modindex` +* :ref:`search` diff --git a/_notebooks/_requirements/data.txt b/_notebooks/_requirements/data.txt new file mode 100644 index 0000000..08fe313 --- /dev/null +++ b/_notebooks/_requirements/data.txt @@ -0,0 +1,2 @@ +# fixed version to be able to call it as `python -m kaggle` +https://github.com/Borda/kaggle-api/archive/refs/heads/setup/python-m.zip diff --git a/_notebooks/_requirements/default.txt b/_notebooks/_requirements/default.txt new file mode 100644 index 0000000..42e7333 --- /dev/null +++ b/_notebooks/_requirements/default.txt @@ -0,0 +1,5 @@ +setuptools==67.4.0 +ipython[notebook]>=8.0.0, <8.12.0 +torch>=1.8.1, <1.14.0 +pytorch-lightning>=1.4, <2.0.0 +torchmetrics>=0.7, <0.12 diff --git a/_notebooks/_requirements/devel.txt b/_notebooks/_requirements/devel.txt new file mode 100644 index 0000000..e0ad0dc --- /dev/null +++ b/_notebooks/_requirements/devel.txt @@ -0,0 +1,6 @@ +virtualenv>=20.10 +jupytext>=1.10, <1.15 # converting +pytest>=6.0, <7.0 +# testing with own fork with extended cell timeout +https://github.com/Borda/nbval/archive/refs/heads/timeout-limit.zip +papermill>=2.3.4, <2.5.0 # render diff --git a/_notebooks/_requirements/docs.txt b/_notebooks/_requirements/docs.txt new file mode 100644 index 0000000..28b8790 --- /dev/null +++ b/_notebooks/_requirements/docs.txt @@ -0,0 +1,12 @@ +sphinx>=4.0, <5.0 +myst-parser>=0.15 +nbsphinx>=0.8 +pandoc>=1.0 +docutils>=0.16 +sphinx-paramlinks>=0.4.0 +ipython[notebook]>=8.0.0, <8.2.0 + +# https://github.com/Lightning-AI/lightning_sphinx_theme/archive/master.zip#egg=pt-lightning-sphinx-theme +https://github.com/PyTorchKorea/lightning_sphinx_theme/archive/master.zip#egg=pt-lightning-sphinx-theme + +-r ../.actions/requires.txt diff --git a/_notebooks/course_UvA-DL/01-introduction-to-pytorch/.meta.yml b/_notebooks/course_UvA-DL/01-introduction-to-pytorch/.meta.yml new file mode 100644 index 0000000..1e5b5b9 --- /dev/null +++ 
b/_notebooks/course_UvA-DL/01-introduction-to-pytorch/.meta.yml @@ -0,0 +1,15 @@ +title: "Tutorial 1: Introduction to PyTorch" +author: Phillip Lippe +created: 2021-08-27 +updated: 2023-03-14 +license: CC BY-SA +description: | + This tutorial will give a short introduction to PyTorch basics, and get you setup for writing your own neural networks. + This notebook is part of a lecture series on Deep Learning at the University of Amsterdam. + The full list of tutorials can be found at https://uvadlc-notebooks.rtfd.io. +requirements: + - matplotlib + - lightning>=2.0.0rc0 +accelerator: + - CPU + - GPU diff --git a/docs/_static/images/course_UvA-DL/01-introduction-to-pytorch.jpg b/_notebooks/course_UvA-DL/01-introduction-to-pytorch/.thumb.jpg similarity index 100% rename from docs/_static/images/course_UvA-DL/01-introduction-to-pytorch.jpg rename to _notebooks/course_UvA-DL/01-introduction-to-pytorch/.thumb.jpg diff --git a/_notebooks/course_UvA-DL/01-introduction-to-pytorch/Introduction_to_PyTorch.py b/_notebooks/course_UvA-DL/01-introduction-to-pytorch/Introduction_to_PyTorch.py new file mode 100644 index 0000000..c692d14 --- /dev/null +++ b/_notebooks/course_UvA-DL/01-introduction-to-pytorch/Introduction_to_PyTorch.py @@ -0,0 +1,990 @@ +# %% [markdown] +#
+# Welcome to our PyTorch tutorial for the Deep Learning course 2020 at the University of Amsterdam! +# The following notebook is meant to give a short introduction to PyTorch basics, and get you setup for writing your own neural networks. +# PyTorch is an open source machine learning framework that allows you to write your own neural networks and optimize them efficiently. +# However, PyTorch is not the only framework of its kind. +# Alternatives to PyTorch include [TensorFlow](https://www.tensorflow.org/), [JAX](https://github.com/google/jax) and [Caffe](http://caffe.berkeleyvision.org/). +# We choose to teach PyTorch at the University of Amsterdam because it is well established, has a huge developer community (originally developed by Facebook), is very flexible and especially used in research. +# Many current papers publish their code in PyTorch, and thus it is good to be familiar with PyTorch as well. +# Meanwhile, TensorFlow (developed by Google) is usually known for being a production-grade deep learning library. +# Still, if you know one machine learning framework in depth, it is very easy to learn another one because many of them use the same concepts and ideas. +# For instance, TensorFlow's version 2 was heavily inspired by the most popular features of PyTorch, making the frameworks even more similar. +# If you are already familiar with PyTorch and have created your own neural network projects, feel free to just skim this notebook. +# +# We are of course not the first ones to create a PyTorch tutorial. +# There are many great tutorials online, including the ["60-min blitz"](https://pytorch.org/tutorials/beginner/deep_learning_60min_blitz.html) on the official [PyTorch website](https://pytorch.org/tutorials/). +# Yet, we choose to create our own tutorial which is designed to give you the basics particularly necessary for the practicals, but still understand how PyTorch works under the hood. 
+# Over the next few weeks, we will also keep exploring new PyTorch features in the series of Jupyter notebook tutorials about deep learning. +# +# We will use a set of standard libraries that are often used in machine learning projects. +# If you are running this notebook on Google Colab, all libraries should be pre-installed. +# If you are running this notebook locally, make sure you have installed our `dl2020` environment ([link](https://github.com/uvadlc/uvadlc_practicals_2020/blob/master/environment.yml)) and have activated it. + +# %% +import time + +import matplotlib.pyplot as plt + +# %matplotlib inline +import matplotlib_inline.backend_inline +import numpy as np +import torch +import torch.nn as nn +import torch.utils.data as data +from matplotlib.colors import to_rgba +from torch import Tensor +from tqdm.notebook import tqdm # Progress bar + +matplotlib_inline.backend_inline.set_matplotlib_formats("svg", "pdf") # For export + +# %% [markdown] +# ## The Basics of PyTorch +# +# We will start with reviewing the very basic concepts of PyTorch. +# As a prerequisite, we recommend to be familiar with the `numpy` package as most machine learning frameworks are based on very similar concepts. +# If you are not familiar with numpy yet, don't worry: here is a [tutorial](https://numpy.org/devdocs/user/quickstart.html) to go through. +# +# So, let's start with importing PyTorch. +# The package is called `torch`, based on its original framework [Torch](http://torch.ch/). +# As a first step, we can check its version: + +# %% +print("Using torch", torch.__version__) + +# %% [markdown] +# At the time of writing this tutorial (mid of August 2021), the current stable version is 1.9. +# You should therefore see the output `Using torch 1.9.0`, eventually with some extension for the CUDA version on Colab. +# In case you use the `dl2020` environment, you should see `Using torch 1.6.0` since the environment was provided in October 2020. 
+# It is recommended to update the PyTorch version to the newest one. +# If you see a lower version number than 1.6, make sure you have installed the correct the environment, or ask one of your TAs. +# In case PyTorch 1.10 or newer will be published during the time of the course, don't worry. +# The interface between PyTorch versions doesn't change too much, and hence all code should also be runnable with newer versions. +# +# As in every machine learning framework, PyTorch provides functions that are stochastic like generating random numbers. +# However, a very good practice is to setup your code to be reproducible with the exact same random numbers. +# This is why we set a seed below. + +# %% +torch.manual_seed(42) # Setting the seed + +# %% [markdown] +# ### Tensors +# +# Tensors are the PyTorch equivalent to Numpy arrays, with the addition to also have support for GPU acceleration (more on that later). +# The name "tensor" is a generalization of concepts you already know. +# For instance, a vector is a 1-D tensor, and a matrix a 2-D tensor. +# When working with neural networks, we will use tensors of various shapes and number of dimensions. +# +# Most common functions you know from numpy can be used on tensors as well. +# Actually, since numpy arrays are so similar to tensors, we can convert most tensors to numpy arrays (and back) but we don't need it too often. +# +# #### Initialization +# +# Let's first start by looking at different ways of creating a tensor. +# There are many possible options, the most simple one is to call +# `Tensor` passing the desired shape as input argument: + +# %% +x = Tensor(2, 3, 4) +print(x) + +# %% [markdown] +# The function `torch.Tensor` allocates memory for the desired tensor, but reuses any values that have already been in the memory. 
+# To directly assign values to the tensor during initialization, there are many alternatives including: +# +# * `torch.zeros`: Creates a tensor filled with zeros +# * `torch.ones`: Creates a tensor filled with ones +# * `torch.rand`: Creates a tensor with random values uniformly sampled between 0 and 1 +# * `torch.randn`: Creates a tensor with random values sampled from a normal distribution with mean 0 and variance 1 +# * `torch.arange`: Creates a tensor containing the values $N,N+1,N+2,...,M$ +# * `torch.Tensor` (input list): Creates a tensor from the list elements you provide + +# %% +# Create a tensor from a (nested) list +x = Tensor([[1, 2], [3, 4]]) +print(x) + +# %% +# Create a tensor with random values between 0 and 1 with the shape [2, 3, 4] +x = torch.rand(2, 3, 4) +print(x) + +# %% [markdown] +# You can obtain the shape of a tensor in the same way as in numpy (`x.shape`), or using the `.size` method: + +# %% +shape = x.shape +print("Shape:", x.shape) + +size = x.size() +print("Size:", size) + +dim1, dim2, dim3 = x.size() +print("Size:", dim1, dim2, dim3) + +# %% [markdown] +# #### Tensor to Numpy, and Numpy to Tensor +# +# Tensors can be converted to numpy arrays, and numpy arrays back to tensors. +# To transform a numpy array into a tensor, we can use the function `torch.from_numpy`: + +# %% +np_arr = np.array([[1, 2], [3, 4]]) +tensor = torch.from_numpy(np_arr) + +print("Numpy array:", np_arr) +print("PyTorch tensor:", tensor) + +# %% [markdown] +# To transform a PyTorch tensor back to a numpy array, we can use the function `.numpy()` on tensors: + +# %% +tensor = torch.arange(4) +np_arr = tensor.numpy() + +print("PyTorch tensor:", tensor) +print("Numpy array:", np_arr) + +# %% [markdown] +# The conversion of tensors to numpy require the tensor to be on the CPU, and not the GPU (more on GPU support in a later section). +# In case you have a tensor on GPU, you need to call `.cpu()` on the tensor beforehand. 
+# Hence, you get a line like `np_arr = tensor.cpu().numpy()`. + +# %% [markdown] +# #### Operations +# +# Most operations that exist in numpy, also exist in PyTorch. +# A full list of operations can be found in the [PyTorch documentation](https://pytorch.org/docs/stable/tensors.html#), but we will review the most important ones here. +# +# The simplest operation is to add two tensors: + +# %% +x1 = torch.rand(2, 3) +x2 = torch.rand(2, 3) +y = x1 + x2 + +print("X1", x1) +print("X2", x2) +print("Y", y) + +# %% [markdown] +# Calling `x1 + x2` creates a new tensor containing the sum of the two inputs. +# However, we can also use in-place operations that are applied directly on the memory of a tensor. +# We therefore change the values of `x2` without the chance to re-accessing the values of `x2` before the operation. +# An example is shown below: + +# %% +x1 = torch.rand(2, 3) +x2 = torch.rand(2, 3) +print("X1 (before)", x1) +print("X2 (before)", x2) + +x2.add_(x1) +print("X1 (after)", x1) +print("X2 (after)", x2) + +# %% [markdown] +# In-place operations are usually marked with a underscore postfix (for example `torch.add_` instead of `torch.add`). +# +# Another common operation aims at changing the shape of a tensor. +# A tensor of size (2,3) can be re-organized to any other shape with the same number of elements (e.g. a tensor of size (6), or (3,2), ...). +# In PyTorch, this operation is called `view`: + +# %% +x = torch.arange(6) +print("X", x) + +# %% +x = x.view(2, 3) +print("X", x) + +# %% +x = x.permute(1, 0) # Swapping dimension 0 and 1 +print("X", x) + +# %% [markdown] +# Other commonly used operations include matrix multiplications, which are essential for neural networks. +# Quite often, we have an input vector $\mathbf{x}$, which is transformed using a learned weight matrix $\mathbf{W}$. 
+# There are multiple ways and functions to perform matrix multiplication, some of which we list below: +# +# * `torch.matmul`: Performs the matrix product over two tensors, where the specific behavior depends on the dimensions. +# If both inputs are matrices (2-dimensional tensors), it performs the standard matrix product. +# For higher dimensional inputs, the function supports broadcasting (for details see the [documentation](https://pytorch.org/docs/stable/generated/torch.matmul.html?highlight=matmul#torch.matmul)). +# Can also be written as `a @ b`, similar to numpy. +# * `torch.mm`: Performs the matrix product over two matrices, but doesn't support broadcasting (see [documentation](https://pytorch.org/docs/stable/generated/torch.mm.html?highlight=torch%20mm#torch.mm)) +# * `torch.bmm`: Performs the matrix product with a support batch dimension. +# If the first tensor $T$ is of shape ($b\times n\times m$), and the second tensor $R$ ($b\times m\times p$), the output $O$ is of shape ($b\times n\times p$), and has been calculated by performing $b$ matrix multiplications of the submatrices of $T$ and $R$: $O_i = T_i @ R_i$ +# * `torch.einsum`: Performs matrix multiplications and more (i.e. sums of products) using the Einstein summation convention. +# Explanation of the Einstein sum can be found in assignment 1. +# +# Usually, we use `torch.matmul` or `torch.bmm`. We can try a matrix multiplication with `torch.matmul` below. + +# %% +x = torch.arange(6) +x = x.view(2, 3) +print("X", x) + +# %% +W = torch.arange(9).view(3, 3) # We can also stack multiple operations in a single line +print("W", W) + +# %% +h = torch.matmul(x, W) # Verify the result by calculating it by hand too! +print("h", h) + +# %% [markdown] +# #### Indexing +# +# We often have the situation where we need to select a part of a tensor. 
+# Indexing works just like in numpy, so let's try it: + +# %% +x = torch.arange(12).view(3, 4) +print("X", x) + +# %% +print(x[:, 1]) # Second column + +# %% +print(x[0]) # First row + +# %% +print(x[:2, -1]) # First two rows, last column + +# %% +print(x[1:3, :]) # Middle two rows + +# %% [markdown] +# ### Dynamic Computation Graph and Backpropagation +# +# One of the main reasons for using PyTorch in Deep Learning projects is that we can automatically get **gradients/derivatives** of functions that we define. +# We will mainly use PyTorch for implementing neural networks, and they are just fancy functions. +# If we use weight matrices in our function that we want to learn, then those are called the **parameters** or simply the **weights**. +# +# If our neural network would output a single scalar value, we would talk about taking the **derivative**, but you will see that quite often we will have **multiple** output variables ("values"); in that case we talk about **gradients**. +# It's a more general term. +# +# Given an input $\mathbf{x}$, we define our function by **manipulating** that input, usually by matrix-multiplications with weight matrices and additions with so-called bias vectors. +# As we manipulate our input, we are automatically creating a **computational graph**. +# This graph shows how to arrive at our output from our input. +# PyTorch is a **define-by-run** framework; this means that we can just do our manipulations, and PyTorch will keep track of that graph for us. +# Thus, we create a dynamic computation graph along the way. +# +# So, to recap: the only thing we have to do is to compute the **output**, and then we can ask PyTorch to automatically get the **gradients**. +# +# > **Note: Why do we want gradients? +# ** Consider that we have defined a function, a neural net, that is supposed to compute a certain output $y$ for an input vector $\mathbf{x}$. 
+# We then define an **error measure** that tells us how wrong our network is; how bad it is in predicting output $y$ from input $\mathbf{x}$. +# Based on this error measure, we can use the gradients to **update** the weights $\mathbf{W}$ that were responsible for the output, so that the next time we present input $\mathbf{x}$ to our network, the output will be closer to what we want. +# +# The first thing we have to do is to specify which tensors require gradients. +# By default, when we create a tensor, it does not require gradients. + +# %% +x = torch.ones((3,)) +print(x.requires_grad) + +# %% [markdown] +# We can change this for an existing tensor using the function `requires_grad_()` (underscore indicating that this is a in-place operation). +# Alternatively, when creating a tensor, you can pass the argument +# `requires_grad=True` to most initializers we have seen above. + +# %% +x.requires_grad_(True) +print(x.requires_grad) + +# %% [markdown] +# In order to get familiar with the concept of a computation graph, we will create one for the following function: +# +# $$y = \frac{1}{|x|}\sum_i \left[(x_i + 2)^2 + 3\right]$$ +# +# You could imagine that $x$ are our parameters, and we want to optimize (either maximize or minimize) the output $y$. +# For this, we want to obtain the gradients $\partial y / \partial \mathbf{x}$. +# For our example, we'll use $\mathbf{x}=[0,1,2]$ as our input. + +# %% +x = torch.arange(3, dtype=torch.float32, requires_grad=True) # Only float tensors can have gradients +print("X", x) + +# %% [markdown] +# Now let's build the computation graph step by step. +# You can combine multiple operations in a single line, but we will +# separate them here to get a better understanding of how each operation +# is added to the computation graph. + +# %% +a = x + 2 +b = a**2 +c = b + 3 +y = c.mean() +print("Y", y) + +# %% [markdown] +# Using the statements above, we have created a computation graph that looks similar to the figure below: +# +#
+# +# We calculate $a$ based on the inputs $x$ and the constant $2$, $b$ is $a$ squared, and so on. +# The visualization is an abstraction of the dependencies between inputs and outputs of the operations we have applied. +# Each node of the computation graph has automatically defined a function for calculating the gradients with respect to its inputs, `grad_fn`. +# You can see this when we printed the output tensor $y$. +# This is why the computation graph is usually visualized in the reverse direction (arrows point from the result to the inputs). +# We can perform backpropagation on the computation graph by calling the +# function `backward()` on the last output, which effectively calculates +# the gradients for each tensor that has the property +# `requires_grad=True`: + +# %% +y.backward() + +# %% [markdown] +# `x.grad` will now contain the gradient $\partial y/ \partial \mathcal{x}$, and this gradient indicates how a change in $\mathbf{x}$ will affect output $y$ given the current input $\mathbf{x}=[0,1,2]$: + +# %% +print(x.grad) + +# %% [markdown] +# We can also verify these gradients by hand. +# We will calculate the gradients using the chain rule, in the same way as PyTorch did it: +# +# $$\frac{\partial y}{\partial x_i} = \frac{\partial y}{\partial c_i}\frac{\partial c_i}{\partial b_i}\frac{\partial b_i}{\partial a_i}\frac{\partial a_i}{\partial x_i}$$ +# +# Note that we have simplified this equation to index notation, and by using the fact that all operation besides the mean do not combine the elements in the tensor. +# The partial derivatives are: +# +# $$ +# \frac{\partial a_i}{\partial x_i} = 1,\hspace{1cm} +# \frac{\partial b_i}{\partial a_i} = 2\cdot a_i\hspace{1cm} +# \frac{\partial c_i}{\partial b_i} = 1\hspace{1cm} +# \frac{\partial y}{\partial c_i} = \frac{1}{3} +# $$ +# +# Hence, with the input being $\mathbf{x}=[0,1,2]$, our gradients are $\partial y/\partial \mathbf{x}=[4/3,2,8/3]$. +# The previous code cell should have printed the same result. 
+ +# %% [markdown] +# ### GPU support +# +# A crucial feature of PyTorch is the support of GPUs, short for Graphics Processing Unit. +# A GPU can perform many thousands of small operations in parallel, making it very well suitable for performing large matrix operations in neural networks. +# When comparing GPUs to CPUs, we can list the following main differences (credit: [Kevin Krewell, 2009](https://blogs.nvidia.com/blog/2009/12/16/whats-the-difference-between-a-cpu-and-a-gpu/)) +# +#
+# +# CPUs and GPUs have both different advantages and disadvantages, which is why many computers contain both components and use them for different tasks. +# In case you are not familiar with GPUs, you can read up more details in this [NVIDIA blog post](https://blogs.nvidia.com/blog/2009/12/16/whats-the-difference-between-a-cpu-and-a-gpu/) or [here](https://www.intel.com/content/www/us/en/products/docs/processors/what-is-a-gpu.html). +# +# GPUs can accelerate the training of your network up to a factor of $100$ which is essential for large neural networks. +# PyTorch implements a lot of functionality for supporting GPUs (mostly those of NVIDIA due to the libraries [CUDA](https://developer.nvidia.com/cuda-zone) and [cuDNN](https://developer.nvidia.com/cudnn)). +# First, let's check whether you have a GPU available: + +# %% +gpu_avail = torch.cuda.is_available() +print(f"Is the GPU available? {gpu_avail}") + +# %% [markdown] +# If you have a GPU on your computer but the command above returns False, make sure you have the correct CUDA-version installed. +# The `dl2020` environment comes with the CUDA-toolkit 10.1, which is selected for the Lisa supercomputer. +# Please change it if necessary (CUDA 10.2 is currently common). +# On Google Colab, make sure that you have selected a GPU in your runtime setup (in the menu, check under `Runtime -> Change runtime type`). +# +# By default, all tensors you create are stored on the CPU. +# We can push a tensor to the GPU by using the function `.to(...)`, or `.cuda()`. +# However, it is often a good practice to define a `device` object in your code which points to the GPU if you have one, and otherwise to the CPU. +# Then, you can write your code with respect to this device object, and it allows you to run the same code on both a CPU-only system, and one with a GPU. +# Let's try it below. 
+# We can specify the device as follows: + +# %% +device = torch.device("cuda") if torch.cuda.is_available() else torch.device("cpu") +print("Device", device) + +# %% [markdown] +# Now let's create a tensor and push it to the device: + +# %% +x = torch.zeros(2, 3) +x = x.to(device) +print("X", x) + +# %% [markdown] +# In case you have a GPU, you should now see the attribute `device='cuda:0'` being printed next to your tensor. +# The zero next to cuda indicates that this is the zero-th GPU device on your computer. +# PyTorch also supports multi-GPU systems, but this you will only need once you have very big networks to train (if interested, see the [PyTorch documentation](https://pytorch.org/docs/stable/distributed.html#distributed-basics)). +# We can also compare the runtime of a large matrix multiplication on the CPU with a operation on the GPU: + +# %% +x = torch.randn(5000, 5000) + +# CPU version +start_time = time.time() +_ = torch.matmul(x, x) +end_time = time.time() +print(f"CPU time: {(end_time - start_time):6.5f}s") + +# GPU version +if torch.cuda.is_available(): + x = x.to(device) + # CUDA is asynchronous, so we need to use different timing functions + start = torch.cuda.Event(enable_timing=True) + end = torch.cuda.Event(enable_timing=True) + start.record() + _ = torch.matmul(x, x) + end.record() + torch.cuda.synchronize() # Waits for everything to finish running on the GPU + print(f"GPU time: {0.001 * start.elapsed_time(end):6.5f}s") # Milliseconds to seconds + +# %% [markdown] +# Depending on the size of the operation and the CPU/GPU in your system, the speedup of this operation can be >50x. +# As `matmul` operations are very common in neural networks, we can already see the great benefit of training a NN on a GPU. +# The time estimate can be relatively noisy here because we haven't run it for multiple times. +# Feel free to extend this, but it also takes longer to run. 
+# +# When generating random numbers, the seed between CPU and GPU is not synchronized. +# Hence, we need to set the seed on the GPU separately to ensure a reproducible code. +# Note that due to different GPU architectures, running the same code on different GPUs does not guarantee the same random numbers. +# Still, we don't want that our code gives us a different output every time we run it on the exact same hardware. +# Hence, we also set the seed on the GPU: + +# %% +# GPU operations have a separate seed we also want to set +if torch.cuda.is_available(): + torch.cuda.manual_seed(42) + torch.cuda.manual_seed_all(42) + +# Additionally, some operations on a GPU are implemented stochastic for efficiency +# We want to ensure that all operations are deterministic on GPU (if used) for reproducibility +torch.backends.cudnn.deterministic = True +torch.backends.cudnn.benchmark = False + +# %% [markdown] +# ## Learning by example: Continuous XOR +#
+# +# If we want to build a neural network in PyTorch, we could specify all our parameters (weight matrices, bias vectors) using `Tensors` (with `requires_grad=True`), ask PyTorch to calculate the gradients and then adjust the parameters. +# But things can quickly get cumbersome if we have a lot of parameters. +# In PyTorch, there is a package called `torch.nn` that makes building neural networks more convenient. +# +# We will introduce the libraries and all additional parts you might need to train a neural network in PyTorch, using a simple example classifier on a simple yet well known example: XOR. +# Given two binary inputs $x_1$ and $x_2$, the label to predict is $1$ if either $x_1$ or $x_2$ is $1$ while the other is $0$, or the label is $0$ in all other cases. +# The example became famous by the fact that a single neuron, i.e. a linear classifier, cannot learn this simple function. +# Hence, we will learn how to build a small neural network that can learn this function. +# To make it a little bit more interesting, we move the XOR into continuous space and introduce some gaussian noise on the binary inputs. +# Our desired separation of an XOR dataset could look as follows: +# +#

# %% [markdown]
# ### The model
#
# The package `torch.nn` defines a series of useful classes like linear networks layers, activation functions, loss functions etc.
# A full list can be found [here](https://pytorch.org/docs/stable/nn.html).
# In case you need a certain network layer, check the documentation of the package first before writing the layer yourself as the package likely contains the code for it already.
# We import it below:

# %%
# %%

# %% [markdown]
# Additionally to `torch.nn`, there is also `torch.nn.functional`.
# It contains functions that are used in network layers.
# This is in contrast to `torch.nn` which defines them as `nn.Modules` (more on it below), and `torch.nn` actually uses a lot of functionalities from `torch.nn.functional`.
# Hence, the functional package is useful in many situations, and so we import it as well here.

# %% [markdown]
# #### nn.Module
#
# In PyTorch, a neural network is built up out of modules.
# Modules can contain other modules, and a neural network is considered to be a module itself as well.
# The basic template of a module is as follows:


# %%
class MyModule(nn.Module):
    """Bare-bones module template: set things up in ``__init__``, compute in ``forward``."""

    def __init__(self):
        super().__init__()
        # Some init for my module

    def forward(self, x):
        """Function for performing the calculation of the module (left empty in this template)."""
        return None


# %% [markdown]
# The forward function is where the computation of the module takes place, and is executed when you call the module (`nn = MyModule(); nn(x)`).
# In the init function, we usually create the parameters of the module, using `nn.Parameter`, or defining other modules that are used in the forward function.
# The backward calculation is done automatically, but could be overwritten as well if wanted.
#
# #### Simple classifier
# We can now make use of the pre-defined modules in the `torch.nn` package, and define our own small neural network.
+# We will use a minimal network with an input layer, one hidden layer with tanh as activation function, and an output layer. +# In other words, our network should look something like this: +# +#
#
# The input neurons are shown in blue, which represent the coordinates $x_1$ and $x_2$ of a data point.
# The hidden neurons including a tanh activation are shown in white, and the output neuron in red.
# In PyTorch, we can define this as follows:


# %%
class SimpleClassifier(nn.Module):
    """Small feed-forward network: linear layer -> tanh -> linear layer.

    The forward pass returns the raw outputs of the second linear layer;
    no sigmoid is applied inside the module.
    """

    def __init__(self, num_inputs, num_hidden, num_outputs):
        """
        Inputs:
            num_inputs - Number of input features
            num_hidden - Number of neurons in the hidden layer
            num_outputs - Number of output neurons
        """
        super().__init__()
        # Sub-modules the forward pass is composed of
        self.linear1 = nn.Linear(num_inputs, num_hidden)
        self.act_fn = nn.Tanh()
        self.linear2 = nn.Linear(num_hidden, num_outputs)

    def forward(self, x):
        """Run the input through both layers and return the prediction."""
        hidden = self.act_fn(self.linear1(x))
        return self.linear2(hidden)


# %% [markdown]
# For the examples in this notebook, we will use a tiny neural network with two input neurons and four hidden neurons.
# As we perform binary classification, we will use a single output neuron.
# Note that we do not apply a sigmoid on the output yet.
# This is because other functions, especially the loss, are more efficient and precise to calculate on the original outputs instead of the sigmoid output.
# We will discuss the detailed reason later.

# %%
model = SimpleClassifier(num_inputs=2, num_hidden=4, num_outputs=1)
# Printing a module shows all its submodules
print(model)

# %% [markdown]
# Printing the model lists all submodules it contains.
# The parameters of a module can be obtained by using its `parameters()` functions, or `named_parameters()` to get a name to each parameter object.
# For our small neural network, we have the following parameters:

# %%
for name, param in model.named_parameters():
    print(f"Parameter {name}, shape {param.shape}")

# %% [markdown]
# Each linear layer has a weight matrix of the shape `[output, input]`, and a bias of the shape `[output]`.
# The tanh activation function does not have any parameters.
+# Note that parameters are only registered for `nn.Module` objects that are direct object attributes, i.e. `self.a = ...`. +# If you define a list of modules, the parameters of those are not registered for the outer module and can cause some issues when you try to optimize your module. +# There are alternatives, like `nn.ModuleList`, `nn.ModuleDict` and `nn.Sequential`, that allow you to have different data structures of modules. +# We will use them in a few later tutorials and explain them there. + +# %% [markdown] +# ### The data +# +# PyTorch also provides a few functionalities to load the training and +# test data efficiently, summarized in the package `torch.utils.data`. + +# %% + +# %% [markdown] +# The data package defines two classes which are the standard interface for handling data in PyTorch: `data.Dataset`, and `data.DataLoader`. +# The dataset class provides a uniform interface to access the +# training/test data, while the data loader makes sure to efficiently load +# and stack the data points from the dataset into batches during training. + +# %% [markdown] +# #### The dataset class +# +# The dataset class summarizes the basic functionality of a dataset in a natural way. +# To define a dataset in PyTorch, we simply specify two functions: `__getitem__`, and `__len__`. +# The get-item function has to return the $i$-th data point in the dataset, while the len function returns the size of the dataset.
# For the XOR dataset, we can define the dataset class as follows:

# %%


class XORDataset(data.Dataset):
    """Randomly generated continuous XOR dataset.

    Each sample is a pair of binary coordinates perturbed by gaussian noise;
    its label is 1 if exactly one coordinate was 1 before the noise, else 0.
    """

    def __init__(self, size, std=0.1):
        """
        Inputs:
            size - Number of data points we want to generate
            std - Standard deviation of the noise (see generate_continuous_xor function)
        """
        super().__init__()
        self.size = size
        self.std = std
        self.generate_continuous_xor()

    def generate_continuous_xor(self):
        """Sample the points and labels and store them in ``self.data`` / ``self.label``."""
        # Two binary variables per data point, each either 0 or 1
        corners = torch.randint(low=0, high=2, size=(self.size, 2), dtype=torch.float32)
        # XOR label: 1 if exactly one of the two variables is 1, 0 if both are equal
        self.label = (corners.sum(dim=1) == 1).to(torch.long)
        # To make it slightly more challenging, a bit of gaussian noise is added to the points
        noise = self.std * torch.randn(corners.shape)
        self.data = corners + noise

    def __len__(self):
        # Number of data points. Alternatively self.data.shape[0], or self.label.shape[0]
        return self.size

    def __getitem__(self, idx):
        # The idx-th data point and its label, returned together as a tuple
        return self.data[idx], self.label[idx]


# %% [markdown]
# Let's try to create such a dataset and inspect it:

# %%
dataset = XORDataset(size=200)
print("Size of dataset:", len(dataset))
print("Data point 0:", dataset[0])

# %% [markdown]
# To better relate to the dataset, we visualize the samples below.


# %%
def visualize_samples(data, label):
    """Draw a scatter plot of 2D data points, one color per class (0 and 1).

    Tensors are moved to the CPU and converted to numpy arrays before plotting.
    """
    if isinstance(data, Tensor):
        data = data.cpu().numpy()
    if isinstance(label, Tensor):
        label = label.cpu().numpy()

    # Split the points by class before any plotting happens
    per_class = (
        (data[label == 0], "Class 0"),
        (data[label == 1], "Class 1"),
    )

    plt.figure(figsize=(4, 4))
    for points, class_name in per_class:
        plt.scatter(points[:, 0], points[:, 1], edgecolor="#333", label=class_name)
    plt.title("Dataset samples")
    plt.ylabel(r"$x_2$")
    plt.xlabel(r"$x_1$")
    plt.legend()


# %%
visualize_samples(dataset.data, dataset.label)
plt.show()

# %% [markdown]
# #### The data loader class
#
# The class `torch.utils.data.DataLoader` represents a Python iterable over a dataset with support for automatic batching, multi-process data loading and many more features.
# The data loader communicates with the dataset using the function `__getitem__`, and stacks its outputs as tensors over the first dimension to form a batch.
# In contrast to the dataset class, we usually don't have to define our own data loader class, but can just create an object of it with the dataset as input.
# Additionally, we can configure our data loader with the following input arguments (only a selection, see full list [here](https://pytorch.org/docs/stable/data.html#torch.utils.data.DataLoader)):
#
# * `batch_size`: Number of samples to stack per batch
# * `shuffle`: If True, the data is returned in a random order.
# This is important during training for introducing stochasticity.
# * `num_workers`: Number of subprocesses to use for data loading.
# The default, 0, means that the data will be loaded in the main process which can slow down training for datasets where loading a data point takes a considerable amount of time (e.g. large images).
# More workers are recommended for those, but can cause issues on Windows computers.
# For tiny datasets as ours, 0 workers are usually faster.
+# * `pin_memory`: If True, the data loader will copy Tensors into CUDA pinned memory before returning them. +# This can save some time for large data points on GPUs. +# Usually a good practice to use for a training set, but not necessarily for validation and test to save memory on the GPU. +# * `drop_last`: If True, the last batch is dropped in case it is smaller than the specified batch size. +# This occurs when the dataset size is not a multiple of the batch size. +# Only potentially helpful during training to keep a consistent batch size. +# +# Let's create a simple data loader below: + +# %% +data_loader = data.DataLoader(dataset, batch_size=8, shuffle=True) + +# %% +# next(iter(...)) catches the first batch of the data loader +# If shuffle is True, this will return a different batch every time we run this cell +# For iterating over the whole dataset, we can simple use "for batch in data_loader: ..." +data_inputs, data_labels = next(iter(data_loader)) + +# The shape of the outputs are [batch_size, d_1,...,d_N] where d_1,...,d_N are the +# dimensions of the data point returned from the dataset class +print("Data inputs", data_inputs.shape, "\n", data_inputs) +print("Data labels", data_labels.shape, "\n", data_labels) + +# %% [markdown] +# ### Optimization +# +# After defining the model and the dataset, it is time to prepare the optimization of the model. +# During training, we will perform the following steps: +# +# 1. Get a batch from the data loader +# 2. Obtain the predictions from the model for the batch +# 3. Calculate the loss based on the difference between predictions and labels +# 4. Backpropagation: calculate the gradients for every parameter with respect to the loss +# 5. Update the parameters of the model in the direction of the gradients +# +# We have seen how we can do step 1, 2 and 4 in PyTorch. Now, we will look at step 3 and 5. 
+ +# %% [markdown] +# #### Loss modules +# +# We can calculate the loss for a batch by simply performing a few tensor operations as those are automatically added to the computation graph. +# For instance, for binary classification, we can use Binary Cross Entropy (BCE) which is defined as follows: +# +# $$\mathcal{L}_{BCE} = -\sum_i \left[ y_i \log x_i + (1 - y_i) \log (1 - x_i) \right]$$ +# +# where $y$ are our labels, and $x$ our predictions, both in the range of $[0,1]$. +# However, PyTorch already provides a list of predefined loss functions which we can use (see [here](https://pytorch.org/docs/stable/nn.html#loss-functions) for a full list). +# For instance, for BCE, PyTorch has two modules: `nn.BCELoss()`, `nn.BCEWithLogitsLoss()`. +# While `nn.BCELoss` expects the inputs $x$ to be in the range $[0,1]$, i.e. the output of a sigmoid, `nn.BCEWithLogitsLoss` combines a sigmoid layer and the BCE loss in a single class. +# This version is numerically more stable than using a plain Sigmoid followed by a BCE loss because of the logarithms applied in the loss function. +# Hence, it is advised to use loss functions applied on "logits" where possible (remember to not apply a sigmoid on the output of the model in this case!). +# For our model defined above, we therefore use the module `nn.BCEWithLogitsLoss`. + +# %% +loss_module = nn.BCEWithLogitsLoss() + +# %% [markdown] +# #### Stochastic Gradient Descent +# +# For updating the parameters, PyTorch provides the package `torch.optim` that has most popular optimizers implemented. +# We will discuss the specific optimizers and their differences later in the course, but will for now use the simplest of them: `torch.optim.SGD`. +# Stochastic Gradient Descent updates parameters by multiplying the gradients with a small constant, called learning rate, and subtracting those from the parameters (hence minimizing the loss). +# Therefore, we slowly move towards the direction of minimizing the loss.
+# A good default value of the learning rate for a small network as ours is 0.1. + +# %% +# Input to the optimizer are the parameters of the model: model.parameters() +optimizer = torch.optim.SGD(model.parameters(), lr=0.1) + +# %% [markdown] +# The optimizer provides two useful functions: `optimizer.step()`, and `optimizer.zero_grad()`. +# The step function updates the parameters based on the gradients as explained above. +# The function `optimizer.zero_grad()` sets the gradients of all parameters to zero. +# While this function seems less relevant at first, it is a crucial pre-step before performing backpropagation. +# If we would call the `backward` function on the loss while the parameter gradients are non-zero from the previous batch, the new gradients would actually be added to the previous ones instead of overwriting them. +# This is done because a parameter might occur multiple times in a computation graph, and we need to sum the gradients in this case instead of replacing them. +# Hence, remember to call `optimizer.zero_grad()` before calculating the gradients of a batch. + +# %% [markdown] +# ### Training +# +# Finally, we are ready to train our model. +# As a first step, we create a slightly larger dataset and specify a data loader with a larger batch size. + +# %% +train_dataset = XORDataset(size=1000) +train_data_loader = data.DataLoader(train_dataset, batch_size=128, shuffle=True) + +# %% [markdown] +# Now, we can write a small training function. +# Remember our five steps: load a batch, obtain the predictions, calculate the loss, backpropagate, and update. +# Additionally, we have to push all data and model parameters to the device of our choice (GPU if available). +# For the tiny neural network we have, communicating the data to the GPU actually takes much more time than we could save from running the operation on GPU. +# For large networks, the communication time is significantly smaller than the actual runtime making a GPU crucial in these cases. 
# Still, to practice, we will push the data to GPU here.

# %%
# Push model to device. Has to be only done once
model.to(device)

# %% [markdown]
# In addition, we set our model to training mode.
# This is done by calling `model.train()`.
# There exist certain modules that need to perform a different forward
# step during training than during testing (e.g. BatchNorm and Dropout),
# and we can switch between them using `model.train()` and `model.eval()`.


# %%
def train_model(model, optimizer, data_loader, loss_module, num_epochs=100):
    """Train ``model`` in place for ``num_epochs`` passes over ``data_loader``.

    Inputs:
        model - Module to optimize; its output is squeezed along dim 1 before the loss
        optimizer - Optimizer that updates the parameters of ``model``
        data_loader - Iterable yielding (inputs, labels) batches
        loss_module - Callable computing the loss from predictions and float labels
        num_epochs - Number of passes over the data loader

    Every batch is moved to the module-level ``device`` before the forward pass.
    """
    # Switch the model to train mode
    model.train()

    for _ in tqdm(range(num_epochs)):
        for batch_inputs, batch_labels in data_loader:
            # Step 1: Move input data to device (only strictly necessary if we use GPU)
            batch_inputs, batch_labels = batch_inputs.to(device), batch_labels.to(device)

            # Step 2: Run the model; output is [Batch size, 1], but we want [Batch size]
            logits = model(batch_inputs).squeeze(dim=1)

            # Step 3: Calculate the loss
            loss = loss_module(logits, batch_labels.float())

            # Step 4: Backpropagation. Gradients are accumulated rather than
            # overwritten, so they are reset to zero right before the backward pass.
            optimizer.zero_grad()
            loss.backward()

            # Step 5: Update the parameters
            optimizer.step()


# %%
train_model(model, optimizer, train_data_loader, loss_module)

# %% [markdown]
# #### Saving a model
#
# After we finish training a model, we save the model to disk so that we can load the same weights at a later time.
# For this, we extract the so-called `state_dict` from the model which contains all learnable parameters.
+# For our simple model, the state dict contains the following entries: + +# %% +state_dict = model.state_dict() +print(state_dict) + +# %% [markdown] +# To save the state dictionary, we can use `torch.save`: + +# %% +# torch.save(object, filename). For the filename, any extension can be used +torch.save(state_dict, "our_model.tar") + +# %% [markdown] +# To load a model from a state dict, we use the function `torch.load` to +# load the state dict from the disk, and the module function +# `load_state_dict` to overwrite our parameters with the new values: + +# %% +# Load state dict from the disk (make sure it is the same name as above) +state_dict = torch.load("our_model.tar") + +# Create a new model and load the state +new_model = SimpleClassifier(num_inputs=2, num_hidden=4, num_outputs=1) +new_model.load_state_dict(state_dict) + +# Verify that the parameters are the same +print("Original model\n", model.state_dict()) +print("\nLoaded model\n", new_model.state_dict()) + +# %% [markdown] +# A detailed tutorial on saving and loading models in PyTorch can be found +# [here](https://pytorch.org/tutorials/beginner/saving_loading_models.html). + +# %% [markdown] +# ### Evaluation +# +# Once we have trained a model, it is time to evaluate it on a held-out test set. +# As our dataset consists of randomly generated data points, we need to +# first create a test set with a corresponding data loader. + +# %% +test_dataset = XORDataset(size=500) +# drop_last -> Don't drop the last batch although it is smaller than 128 +test_data_loader = data.DataLoader(test_dataset, batch_size=128, shuffle=False, drop_last=False) + +# %% [markdown] +# As metric, we will use accuracy which is calculated as follows: +# +# $$acc = \frac{\#\text{correct predictions}}{\#\text{all predictions}} = \frac{TP+TN}{TP+TN+FP+FN}$$ +# +# where TP are the true positives, TN true negatives, FP false positives, and FN the false negatives.
#
# When evaluating the model, we don't need to keep track of the computation graph as we don't intend to calculate the gradients.
# This reduces the required memory and speeds up the model.
# In PyTorch, we can deactivate the computation graph using `with torch.no_grad(): ...`.
# Remember to additionally set the model to eval mode.


# %%
def eval_model(model, data_loader):
    """Print the accuracy of ``model`` over all batches of ``data_loader``.

    A prediction counts as class 1 when the sigmoid of the model output is at
    least 0.5. Batches are moved to the module-level ``device`` first.
    """
    model.eval()  # Set model to eval mode
    # correct = TP+TN, total = TP+TN+FP+FN
    correct, total = 0.0, 0.0

    with torch.no_grad():  # Deactivate gradients for the following code
        for batch_inputs, batch_labels in data_loader:
            batch_inputs = batch_inputs.to(device)
            batch_labels = batch_labels.to(device)

            # Sigmoid maps the model outputs between 0 and 1, the threshold binarizes them
            probs = torch.sigmoid(model(batch_inputs).squeeze(dim=1))
            pred_labels = (probs >= 0.5).long()

            # Keep records of predictions for the accuracy metric
            correct += (pred_labels == batch_labels).sum()
            total += batch_labels.shape[0]

    acc = correct / total
    print(f"Accuracy of the model: {100.0*acc:4.2f}%")


# %%
eval_model(model, test_data_loader)

# %% [markdown]
# If we trained our model correctly, we should see a score close to 100% accuracy.
# However, this is only possible because of our simple task, and
# unfortunately, we usually don't get such high scores on test sets of
# more complex tasks.

# %% [markdown]
# #### Visualizing classification boundaries
#
# To visualize what our model has learned, we can perform a prediction for every data point in a range of $[-0.5, 1.5]$, and visualize the predicted class as in the sample figure at the beginning of this section.
# This shows where the model has created decision boundaries, and which points would be classified as $0$, and which as $1$.
# We therefore get a background image out of blue (class 0) and orange (class 1).
# The spots where the model is uncertain we will see a blurry overlap.
# The specific code is less relevant compared to the output figure which
# should hopefully show us a clear separation of classes:


# %%
@torch.no_grad()  # Decorator, same effect as "with torch.no_grad(): ..." over the whole function.
def visualize_classification(model, data, label):
    """Plot the samples on top of an image of the model's predictions.

    Inputs:
        model - Classifier called on a grid of 2D points; its output is passed
                through a sigmoid (presumably one logit per grid point)
        data - 2D data points, tensor or numpy array (columns 0 and 1 are plotted)
        label - Class labels (0 or 1) of the data points, tensor or numpy array

    Note that the model is moved to the module-level ``device`` as a side effect.
    """
    if isinstance(data, Tensor):
        data = data.cpu().numpy()
    if isinstance(label, Tensor):
        label = label.cpu().numpy()
    data_0 = data[label == 0]
    data_1 = data[label == 1]

    plt.figure(figsize=(4, 4))
    plt.scatter(data_0[:, 0], data_0[:, 1], edgecolor="#333", label="Class 0")
    plt.scatter(data_1[:, 0], data_1[:, 1], edgecolor="#333", label="Class 1")
    plt.title("Dataset samples")
    plt.ylabel(r"$x_2$")
    plt.xlabel(r"$x_1$")
    plt.legend()

    # Let's make use of a lot of operations we have learned above
    model.to(device)
    c0 = Tensor(to_rgba("C0")).to(device)
    c1 = Tensor(to_rgba("C1")).to(device)
    x1 = torch.arange(-0.5, 1.5, step=0.01, device=device)
    x2 = torch.arange(-0.5, 1.5, step=0.01, device=device)
    # Meshgrid function as in numpy. "xy" indexing is passed explicitly for two reasons:
    # leaving `indexing` out triggers a warning in recent PyTorch versions, and imshow
    # draws the first image dimension (rows) along the vertical axis. With "xy", rows
    # follow x2 and columns follow x1, matching the axes of the scatter plot above.
    xx1, xx2 = torch.meshgrid(x1, x2, indexing="xy")
    model_inputs = torch.stack([xx1, xx2], dim=-1)
    preds = model(model_inputs)
    preds = torch.sigmoid(preds)
    # Specifying "None" in a dimension creates a new one
    output_image = (1 - preds) * c0[None, None] + preds * c1[None, None]
    # Convert to numpy array. This only works for tensors on CPU, hence first push to CPU
    output_image = output_image.cpu().numpy()
    plt.imshow(output_image, origin="lower", extent=(-0.5, 1.5, -0.5, 1.5))
    plt.grid(False)


visualize_classification(model, dataset.data, dataset.label)
plt.show()

# %% [markdown]
# The decision boundaries might not look exactly as in the figure in the preamble of this section which can be caused by running it on CPU or a different GPU architecture.
# Nevertheless, the result on the accuracy metric should be approximately the same.
+ +# %% [markdown] +# ## Additional features we didn't get to discuss yet +# +# Finally, you are all set to start with your own PyTorch project! +# In summary, we have looked at how we can build neural networks in PyTorch, and train and test them on data. +# However, there is still much more to PyTorch we haven't discussed yet. +# In the upcoming series of Jupyter notebooks, we will discover more and more functionalities of PyTorch, so that you also get familiar with PyTorch concepts beyond the basics. +# If you are already interested in learning more of PyTorch, we recommend the official [tutorial website](https://pytorch.org/tutorials/) that contains many tutorials on various topics. +# Especially logging with Tensorboard ([tutorial +# here](https://pytorch.org/tutorials/intermediate/tensorboard_tutorial.html)) +# is a good practice that we will explore from Tutorial 5 on. diff --git a/_notebooks/course_UvA-DL/01-introduction-to-pytorch/comparison_CPU_GPU.png b/_notebooks/course_UvA-DL/01-introduction-to-pytorch/comparison_CPU_GPU.png new file mode 100644 index 0000000..b7d94f9 Binary files /dev/null and b/_notebooks/course_UvA-DL/01-introduction-to-pytorch/comparison_CPU_GPU.png differ diff --git a/_notebooks/course_UvA-DL/01-introduction-to-pytorch/continuous_xor.svg b/_notebooks/course_UvA-DL/01-introduction-to-pytorch/continuous_xor.svg new file mode 100644 index 0000000..12bfd7f --- /dev/null +++ b/_notebooks/course_UvA-DL/01-introduction-to-pytorch/continuous_xor.svg @@ -0,0 +1 @@ + diff --git a/_notebooks/course_UvA-DL/01-introduction-to-pytorch/pytorch_computation_graph.svg b/_notebooks/course_UvA-DL/01-introduction-to-pytorch/pytorch_computation_graph.svg new file mode 100644 index 0000000..912788a --- /dev/null +++ b/_notebooks/course_UvA-DL/01-introduction-to-pytorch/pytorch_computation_graph.svg @@ -0,0 +1 @@ +x2abc3y diff --git a/_notebooks/course_UvA-DL/01-introduction-to-pytorch/small_neural_network.svg
b/_notebooks/course_UvA-DL/01-introduction-to-pytorch/small_neural_network.svg new file mode 100644 index 0000000..4a55eac --- /dev/null +++ b/_notebooks/course_UvA-DL/01-introduction-to-pytorch/small_neural_network.svg @@ -0,0 +1 @@ +x1x2 diff --git a/_notebooks/course_UvA-DL/02-activation-functions/.meta.yml b/_notebooks/course_UvA-DL/02-activation-functions/.meta.yml new file mode 100644 index 0000000..8d6392a --- /dev/null +++ b/_notebooks/course_UvA-DL/02-activation-functions/.meta.yml @@ -0,0 +1,20 @@ +title: "Tutorial 2: Activation Functions" +author: Phillip Lippe +created: 2021-08-27 +updated: 2023-03-14 +license: CC BY-SA +description: | + In this tutorial, we will take a closer look at (popular) activation functions and investigate their effect on optimization properties in neural networks. + Activation functions are a crucial part of deep learning models as they add the non-linearity to neural networks. + There is a great variety of activation functions in the literature, and some are more beneficial than others. + The goal of this tutorial is to show the importance of choosing a good activation function (and how to do so), and what problems might occur if we don't. + This notebook is part of a lecture series on Deep Learning at the University of Amsterdam. + The full list of tutorials can be found at https://uvadlc-notebooks.rtfd.io. 
+requirements: + - torchvision + - matplotlib + - seaborn + - lightning>=2.0.0rc0 +accelerator: + - CPU + - GPU diff --git a/docs/_static/images/course_UvA-DL/02-activation-functions.jpg b/_notebooks/course_UvA-DL/02-activation-functions/.thumb.jpg similarity index 100% rename from docs/_static/images/course_UvA-DL/02-activation-functions.jpg rename to _notebooks/course_UvA-DL/02-activation-functions/.thumb.jpg diff --git a/_notebooks/course_UvA-DL/02-activation-functions/Activation_Functions.py b/_notebooks/course_UvA-DL/02-activation-functions/Activation_Functions.py new file mode 100644 index 0000000..1abd126 --- /dev/null +++ b/_notebooks/course_UvA-DL/02-activation-functions/Activation_Functions.py @@ -0,0 +1,800 @@ +# %% [markdown] +#
+# Before we start, we import our standard libraries and set up basic functions: + +# %% +import json +import math +import os +import urllib.request +import warnings +from urllib.error import HTTPError + +import matplotlib.pyplot as plt + +# %matplotlib inline +import matplotlib_inline.backend_inline +import numpy as np +import seaborn as sns +import torch +import torch.nn as nn +import torch.nn.functional as F +import torch.optim as optim +import torch.utils.data as data +import torchvision +from torchvision import transforms +from torchvision.datasets import FashionMNIST +from tqdm.notebook import tqdm + +matplotlib_inline.backend_inline.set_matplotlib_formats("svg", "pdf") # For export +sns.set() + +# %% [markdown] +# We will define a function to set a seed on all libraries we might interact with in this tutorial (here numpy and torch). +# This allows us to make our training reproducible. +# However, note that in contrast to the CPU, the same seed on different GPU architectures can give different results. +# All models here have been trained on an NVIDIA GTX1080Ti. +# +# Additionally, the following cell defines two paths: `DATASET_PATH` and `CHECKPOINT_PATH`. +# The dataset path is the directory where we will download datasets used in the notebooks. +# It is recommended to store all datasets from PyTorch in one joined directory to prevent duplicate downloads. +# The checkpoint path is the directory where we will store trained model weights and additional files. +# The needed files will be automatically downloaded. +# In case you are on Google Colab, it is recommended to change the +# directories to start from the current directory (i.e. remove `../` for +# both dataset and checkpoint path). + +# %% +# Path to the folder where the datasets are/should be downloaded (e.g. 
# MNIST)
DATASET_PATH = os.environ.get("PATH_DATASETS", "data/")
# Path to the folder where the pretrained models are saved
CHECKPOINT_PATH = os.environ.get("PATH_CHECKPOINT", "saved_models/Activation_Functions/")


def set_seed(seed):
    """Seed every random number generator used in this notebook.

    Args:
        seed: Integer seed passed to NumPy and PyTorch (CPU and, when available, CUDA).
    """
    torch.manual_seed(seed)
    np.random.seed(seed)
    if not torch.cuda.is_available():
        return
    # GPU operations have their own, separate seeds
    torch.cuda.manual_seed(seed)
    torch.cuda.manual_seed_all(seed)


set_seed(42)

# Some GPU operations are implemented stochastically for efficiency.
# For reproducibility, we force all operations to be deterministic on GPU (if used).
torch.backends.cudnn.deterministic = True
torch.backends.cudnn.benchmark = False

# Device that will be used throughout this notebook
device = torch.device("cuda:0") if torch.cuda.is_available() else torch.device("cpu")
print("Using device", device)

# %% [markdown]
# The following cell downloads all pretrained models we will use in this notebook.
# The files are stored on a separate [repository](https://github.com/phlippe/saved_models) to reduce the size of the notebook repository, especially for building the documentation on ReadTheDocs.
# In case the download below fails, you can download the models from a [Google Drive folder](https://drive.google.com/drive/folders/1sFpZUpDJVjiYEvIqISqfkFizfsTnPf4s?usp=sharing).
# Please let me (Phillip) know if an error occurs so it can be fixed for all students.
# %%
# Github URL where saved models are stored for this tutorial
base_url = "https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial3/"
# Files to download: one hyperparameter file (.config) and one weight file (.tar) per activation function
pretrained_files = [
    f"FashionMNIST_{act_name}.{extension}"
    for act_name in ("elu", "leakyrelu", "relu", "sigmoid", "swish", "tanh")
    for extension in ("config", "tar")
]
# Create checkpoint path if it doesn't exist yet
os.makedirs(CHECKPOINT_PATH, exist_ok=True)

# Download every file that is not yet present in the checkpoint directory
for file_name in pretrained_files:
    file_path = os.path.join(CHECKPOINT_PATH, file_name)
    if os.path.isfile(file_path):
        continue
    file_url = base_url + file_name
    print(f"Downloading {file_url}...")
    try:
        urllib.request.urlretrieve(file_url, file_path)
    except HTTPError as e:
        # Best effort: report the failure and continue with the remaining files
        print(
            "Something went wrong. Please try to download the file from the GDrive folder, or contact the author with the full output including the following error:\n",
            e,
        )

# %% [markdown]
# ## Common activation functions

# %% [markdown]
# As a first step, we will implement some common activation functions by ourselves.
# Of course, most of them can also be found in the `torch.nn` package (see the [documentation](https://pytorch.org/docs/stable/nn.html#non-linear-activations-weighted-sum-nonlinearity) for an overview).
# However, we'll write our own functions here for a better understanding and insights.
#
# For an easier time of comparing various activation functions, we start
# with defining a base class from which all our future modules will
# inherit:


# %%
class ActivationFunction(nn.Module):
    """Base class of all hand-written activation functions in this notebook.

    Attributes set in ``__init__``:
        name: The class name of the concrete activation function.
        config: Dictionary with the key ``"name"``; subclasses add their adjustable parameters to it.
    """

    def __init__(self):
        super().__init__()
        self.name = self.__class__.__name__
        self.config = {"name": self.name}


# %% [markdown]
# Every activation function will be an `nn.Module` so that we can integrate them nicely in a network.
# We will use the `config` dictionary to store adjustable parameters for some activation functions.
#
# Next, we implement two of the "oldest" activation functions that are still commonly used for various tasks: sigmoid and tanh.
# Both the sigmoid and tanh activation can be also found as PyTorch functions (`torch.sigmoid`, `torch.tanh`) or as modules (`nn.Sigmoid`, `nn.Tanh`).
# Here, we implement them by hand:

# %%
class Sigmoid(ActivationFunction):
    """Logistic sigmoid, computed as ``1 / (1 + exp(-x))``."""

    def forward(self, x):
        return 1 / (1 + torch.exp(-x))


class Tanh(ActivationFunction):
    """Hyperbolic tangent, computed as ``(exp(x) - exp(-x)) / (exp(x) + exp(-x))``."""

    # For |x| >= 20 the formula below already evaluates to exactly +-1 in float32 and float64,
    # so clamping the input there does not change any finite result.
    _SATURATION = 20.0

    def forward(self, x):
        # Without the clamp, exp(x) overflows to inf for large |x| and the quotient becomes inf / inf = NaN
        x = torch.clamp(x, min=-self._SATURATION, max=self._SATURATION)
        x_exp, neg_x_exp = torch.exp(x), torch.exp(-x)
        return (x_exp - neg_x_exp) / (x_exp + neg_x_exp)


# %% [markdown]
# Another popular activation function that has allowed the training of deeper networks, is the Rectified Linear Unit (ReLU).
# Despite its simplicity of being a piecewise linear function, ReLU has one major benefit compared to sigmoid and tanh: a strong, stable gradient for a large range of values.
# Based on this idea, a lot of variations of ReLU have been proposed, of which we will implement the following three: LeakyReLU, ELU, and Swish.
# LeakyReLU replaces the zero settings in the negative part with a smaller slope to allow gradients to flow also in this part of the input.
# Similarly, ELU replaces the negative part with an exponential decay.
# The third, most recently proposed activation function is Swish, which is actually the result of a large experiment with the purpose of finding the "optimal" activation function.
# Compared to the other activation functions, Swish is both smooth and non-monotonic (i.e. contains a change of sign in the gradient).
# This has been shown to prevent dead neurons as in standard ReLU activation, especially for deep networks.
# If interested, a more detailed discussion of the benefits of Swish can be found in [this paper](https://arxiv.org/abs/1710.05941) [1].
#
# Let's implement the four activation functions below:

# %%
class ReLU(ActivationFunction):
    """Keeps positive inputs and multiplies all other inputs by zero."""

    def forward(self, x):
        positive_mask = (x > 0).float()
        return x * positive_mask


class LeakyReLU(ActivationFunction):
    """Like ReLU, but scales non-positive inputs by the slope ``alpha`` stored in ``config``."""

    def __init__(self, alpha=0.1):
        super().__init__()
        self.config["alpha"] = alpha

    def forward(self, x):
        negative_part = self.config["alpha"] * x
        return torch.where(x > 0, x, negative_part)


class ELU(ActivationFunction):
    """Identity for positive inputs, ``exp(x) - 1`` otherwise."""

    def forward(self, x):
        negative_part = torch.exp(x) - 1
        return torch.where(x > 0, x, negative_part)


class Swish(ActivationFunction):
    """Computes ``x * sigmoid(x)``."""

    def forward(self, x):
        gate = torch.sigmoid(x)
        return x * gate


# %% [markdown]
# For later usage, we summarize all our activation functions in a dictionary mapping the name to the class object.
# In case you implement a new activation function by yourself, add it here to include it in future comparisons as well:

# %%
act_fn_by_name = {
    "sigmoid": Sigmoid,
    "tanh": Tanh,
    "relu": ReLU,
    "leakyrelu": LeakyReLU,
    "elu": ELU,
    "swish": Swish,
}

# %% [markdown]
# ### Visualizing activation functions
#
# To get an idea of what each activation function actually does, we will visualize them in the following.
# Next to the actual activation value, the gradient of the function is an important aspect as it is crucial for optimizing the neural network.
# PyTorch allows us to compute the gradients simply by calling the `backward` function:


# %%
def get_grads(act_fn, x):
    """Compute the gradients of an activation function at the given positions.

    Args:
        act_fn: An object of the class "ActivationFunction" with an implemented forward pass.
        x: 1D input tensor.
    Returns:
        A tensor with the same size of x containing the gradients of act_fn at x.
    """
    # Work on a copy that tracks gradients, so the caller's tensor stays untouched
    inputs = x.clone().requires_grad_()
    outputs = act_fn(inputs)
    # Summing the outputs sends a gradient of one back to each output element
    outputs.sum().backward()
    return inputs.grad


# %% [markdown]
# Now we can visualize all our activation functions including their gradients:


# %%
def vis_act_fn(act_fn, ax, x):
    """Plot an activation function and its gradient over the positions ``x`` on the axis ``ax``."""
    # Evaluate the function and its gradient
    values = act_fn(x)
    grads = get_grads(act_fn, x)
    # Move everything to CPU/NumPy for plotting
    x_np = x.cpu().numpy()
    values_np = values.cpu().numpy()
    grads_np = grads.cpu().numpy()
    # Plotting
    ax.plot(x_np, values_np, linewidth=2, label="ActFn")
    ax.plot(x_np, grads_np, linewidth=2, label="Gradient")
    ax.set_title(act_fn.name)
    ax.legend()
    ax.set_ylim(-1.5, x_np.max())


# Add activation functions if wanted
act_fns = [act_fn_class() for act_fn_class in act_fn_by_name.values()]
x = torch.linspace(-5, 5, 1000)  # Range on which we want to visualize the activation functions
# Plotting
cols = 2
rows = math.ceil(len(act_fns) / float(cols))
fig, ax = plt.subplots(rows, cols, figsize=(cols * 4, rows * 4))
for i, act_fn in enumerate(act_fns):
    grid_position = divmod(i, cols)  # (row, column) of the subplot
    vis_act_fn(act_fn, ax[grid_position], x)
fig.subplots_adjust(hspace=0.3)
plt.show()

# %% [markdown]
# ## Analysing the effect of activation functions
#
# %% [markdown]
# After implementing and visualizing the activation functions, we are aiming to gain insights into their effect.
# We do this by using a simple neural network trained on
# [FashionMNIST](https://github.com/zalandoresearch/fashion-mnist) and
# examine various aspects of the model, including the performance and
# gradient flow.

# %% [markdown]
# ### Setup

# %% [markdown]
# Firstly, let's set up a neural network.
# The chosen network views the images as 1D tensors and pushes them through a sequence of linear layers and a specified activation function.
# Feel free to experiment with other network architectures.


# %%
class BaseNetwork(nn.Module):
    """Fully connected classifier: linear layers with the given activation function in between."""

    def __init__(self, act_fn, input_size=784, num_classes=10, hidden_sizes=(512, 256, 256, 128)):
        """
        Args:
            act_fn: Object of the activation function that should be used as non-linearity in the network.
            input_size: Size of the input images in pixels
            num_classes: Number of classes we want to predict
            hidden_sizes: A sequence of integers specifying the hidden layer sizes in the NN
        """
        super().__init__()

        # Private copy: the list ends up in `self.config`, so it must not be shared with the
        # caller's object or with the default argument of other instances
        hidden_sizes = list(hidden_sizes)

        # Create the network based on the specified hidden sizes
        layers = []
        in_features = input_size
        for out_features in hidden_sizes:
            layers += [nn.Linear(in_features, out_features), act_fn]
            in_features = out_features
        layers.append(nn.Linear(in_features, num_classes))
        # nn.Sequential summarizes a list of modules into a single module, applying them in sequence
        self.layers = nn.Sequential(*layers)

        # We store all hyperparameters in a dictionary for saving and loading of the model
        self.config = {
            "act_fn": act_fn.config,
            "input_size": input_size,
            "num_classes": num_classes,
            "hidden_sizes": hidden_sizes,
        }

    def forward(self, x):
        """Flatten every sample of the batch ``x`` and return the output of the last linear layer."""
        x = x.view(x.size(0), -1)  # Reshape images to a flat vector
        out = self.layers(x)
        return out


# %% [markdown]
# We also add functions for loading and saving
# the model.
# The hyperparameters are stored in a configuration file (simple json file):


# %%
def _get_config_file(model_path, model_name):
    """Return the path of the file that stores the hyperparameters of ``model_name``."""
    config_name = model_name + ".config"
    return os.path.join(model_path, config_name)


def _get_model_file(model_path, model_name):
    """Return the path of the file that stores the network parameters of ``model_name``."""
    weights_name = model_name + ".tar"
    return os.path.join(model_path, weights_name)


def load_model(model_path, model_name, net=None):
    """Load a saved model from disk and return it.

    Args:
        model_path: Path of the checkpoint directory
        model_name: Name of the model (str)
        net: (Optional) If given, the state dict is loaded into this model. Otherwise, a new model is created.
    """
    config_file = _get_config_file(model_path, model_name)
    model_file = _get_model_file(model_path, model_name)
    assert os.path.isfile(
        config_file
    ), f'Could not find the config file "{config_file}". Are you sure this is the correct path and you have your model config stored here?'
    assert os.path.isfile(
        model_file
    ), f'Could not find the model file "{model_file}". Are you sure this is the correct path and you have your model stored here?'
    with open(config_file) as f:
        config_dict = json.load(f)
    if net is None:
        # Rebuild the network from the stored hyperparameters
        act_fn_config = config_dict.pop("act_fn")
        act_fn_class = act_fn_by_name[act_fn_config.pop("name").lower()]
        net = BaseNetwork(act_fn=act_fn_class(**act_fn_config), **config_dict)
    state_dict = torch.load(model_file, map_location=device)
    net.load_state_dict(state_dict)
    return net


def save_model(model, model_path, model_name):
    """Write the hyperparameters (json) and the state dict of a model to the checkpoint directory.

    Args:
        model: Network object to save parameters from
        model_path: Path of the checkpoint directory
        model_name: Name of the model (str)
    """
    config_dict = model.config
    os.makedirs(model_path, exist_ok=True)
    config_file = _get_config_file(model_path, model_name)
    model_file = _get_model_file(model_path, model_name)
    with open(config_file, "w") as f:
        json.dump(config_dict, f)
    torch.save(model.state_dict(), model_file)


# %% [markdown]
# We also set up the dataset we want to train it on, namely [FashionMNIST](https://github.com/zalandoresearch/fashion-mnist).
# FashionMNIST is a more complex version of MNIST and contains black-and-white images of clothes instead of digits.
# The 10 classes include trousers, coats, shoes, bags and more.
# To load this dataset, we will make use of yet another PyTorch package, namely `torchvision` ([documentation](https://pytorch.org/vision/stable/index.html)).
# The `torchvision` package consists of popular datasets, model architectures, and common image transformations for computer vision.
# We will use the package for many of the notebooks in this course to simplify our dataset handling.
#
# Let's load the dataset below, and visualize a few images to get an impression of the data.

# %%

# Transformations applied on each image => first make them a tensor, then normalize them in the range -1 to 1
transform = transforms.Compose(
    [
        transforms.ToTensor(),
        transforms.Normalize((0.5,), (0.5,)),
    ]
)

# Loading the training dataset. We need to split it into a training and validation part
train_dataset = FashionMNIST(root=DATASET_PATH, train=True, transform=transform, download=True)
train_set, val_set = torch.utils.data.random_split(train_dataset, [50000, 10000])

# Loading the test set
test_set = FashionMNIST(root=DATASET_PATH, train=False, transform=transform, download=True)

# %% [markdown]
# We define a set of data loaders that we can use for various purposes later.
# Note that for actually training a model, we will use different data loaders
# with a lower batch size.

# %%
# All three loaders use large batches and keep the last, incomplete batch; only the training loader shuffles
_loader_kwargs = {"batch_size": 1024, "drop_last": False}
train_loader = data.DataLoader(train_set, shuffle=True, **_loader_kwargs)
val_loader = data.DataLoader(val_set, shuffle=False, **_loader_kwargs)
test_loader = data.DataLoader(test_set, shuffle=False, **_loader_kwargs)

# %%
exmp_imgs = [train_set[i][0] for i in range(16)]
# Organize the images into a grid for nicer visualization
img_batch = torch.stack(exmp_imgs, dim=0)
img_grid = torchvision.utils.make_grid(img_batch, nrow=4, normalize=True, pad_value=0.5)
img_grid = img_grid.permute(1, 2, 0)  # Move the first dimension last for plotting

plt.figure(figsize=(8, 8))
plt.title("FashionMNIST examples")
plt.imshow(img_grid)
plt.axis("off")
plt.show()
plt.close()

# %% [markdown]
# ### Visualizing the gradient flow after initialization
#
# As mentioned previously, one important aspect of activation functions is how they propagate gradients through the network.
# Imagine we have a very deep neural network with more than 50 layers.
# The gradients for the input layer, i.e. the very first layer, have passed >50 times the activation function, but we still want them to be of a reasonable size.
# If the gradient through the activation function is (in expectation) considerably smaller than 1, our gradients will vanish until they reach the input layer.
# If the gradient through the activation function is larger than 1, the gradients exponentially increase and might explode.
#
# To get a feeling of how every activation function influences the
# gradients, we can look at a freshly initialized network and measure the
# gradients for each parameter for a batch of 256 images:


# %%
def visualize_gradients(net, color="C0"):
    """Plot one histogram of the weight gradients per layer, computed on one batch of 256 training images.

    Args:
        net: Object of class BaseNetwork
        color: Color in which we want to visualize the histogram (for easier separation of activation functions)
    """
    net.eval()
    small_loader = data.DataLoader(train_set, batch_size=256, shuffle=False)
    imgs, labels = next(iter(small_loader))
    imgs, labels = imgs.to(device), labels.to(device)

    # Pass one batch through the network, and calculate the gradients for the weights
    net.zero_grad()
    preds = net(imgs)
    loss = F.cross_entropy(preds, labels)
    loss.backward()
    # We limit our visualization to the weight parameters and exclude the bias to reduce the number of plots
    grads = {
        name: params.grad.data.view(-1).cpu().clone().numpy()
        for name, params in net.named_parameters()
        if "weight" in name
    }
    net.zero_grad()

    # Plotting
    columns = len(grads)
    # squeeze=False always returns a 2D array of axes, so a network with a single
    # weight matrix (one subplot) can be indexed like any other
    fig, ax = plt.subplots(1, columns, figsize=(columns * 3.5, 2.5), squeeze=False)
    for key_ax, (key, grad_values) in zip(ax[0], grads.items()):
        sns.histplot(data=grad_values, bins=30, ax=key_ax, color=color, kde=True)
        key_ax.set_title(str(key))
        key_ax.set_xlabel("Grad magnitude")
    fig.suptitle(
        f"Gradient magnitude distribution for activation function {net.config['act_fn']['name']}", fontsize=14, y=1.05
    )
    fig.subplots_adjust(wspace=0.45)
    plt.show()
    plt.close()


# %%
# Seaborn prints warnings if histogram has small values.
# We can ignore them for now
warnings.filterwarnings("ignore")
# Create a plot for every activation function
for i, (act_fn_name, act_fn_class) in enumerate(act_fn_by_name.items()):
    # Setting the seed ensures that we have the same weight initialization for each activation function
    set_seed(42)
    act_fn = act_fn_class()
    net_actfn = BaseNetwork(act_fn=act_fn).to(device)
    visualize_gradients(net_actfn, color=f"C{i}")

# %% [markdown]
# The sigmoid activation function shows a clearly undesirable behavior.
# While the gradients for the output layer are very large with up to 0.1, the input layer has the lowest gradient norm across all activation functions with only 1e-5.
# This is due to its small maximum gradient of 1/4, and finding a suitable learning rate across all layers is not possible in this setup.
# All the other activation functions show to have similar gradient norms across all layers.
# Interestingly, the ReLU activation has a spike around 0 which is caused by its zero-part on the left, and dead neurons (we will take a closer look at this later on).
#
# Note that additionally to the activation, the initialization of the weight parameters can be crucial.
# By default, PyTorch uses the [Kaiming](https://pytorch.org/docs/stable/nn.init.html#torch.nn.init.kaiming_uniform_) initialization for linear layers optimized for Tanh activations.
# In Tutorial 4, we will take a closer look at initialization, but assume
# for now that the Kaiming initialization works for all activation
# functions reasonably well.

# %% [markdown]
# ### Training a model
#
# Next, we want to train our model with different activation functions on FashionMNIST and compare the gained performance.
# All in all, our final goal is to achieve the best possible performance on a dataset of our choice.
+# Therefore, we write a training loop in the next cell including a +# validation after every epoch and a final test on the best model: + + +# %% +def train_model(net, model_name, max_epochs=50, patience=7, batch_size=256, overwrite=False): + """Train a model on the training set of FashionMNIST. + + Args: + net: Object of BaseNetwork + model_name: (str) Name of the model, used for creating the checkpoint names + max_epochs: Number of epochs we want to (maximally) train for + patience: If the performance on the validation set has not improved for #patience epochs, we stop training early + batch_size: Size of batches used in training + overwrite: Determines how to handle the case when there already exists a checkpoint. If True, it will be overwritten. Otherwise, we skip training. + """ + file_exists = os.path.isfile(_get_model_file(CHECKPOINT_PATH, model_name)) + if file_exists and not overwrite: + print("Model file already exists. Skipping training...") + else: + if file_exists: + print("Model file exists, but will be overwritten...") + + # Defining optimizer, loss and data loader + optimizer = optim.SGD(net.parameters(), lr=1e-2, momentum=0.9) # Default parameters, feel free to change + loss_module = nn.CrossEntropyLoss() + train_loader_local = data.DataLoader( + train_set, batch_size=batch_size, shuffle=True, drop_last=True, pin_memory=True + ) + + val_scores = [] + best_val_epoch = -1 + for epoch in range(max_epochs): + ############ + # Training # + ############ + net.train() + true_preds, count = 0.0, 0 + for imgs, labels in tqdm(train_loader_local, desc=f"Epoch {epoch+1}", leave=False): + imgs, labels = imgs.to(device), labels.to(device) # To GPU + optimizer.zero_grad() # Zero-grad can be placed anywhere before "loss.backward()" + preds = net(imgs) + loss = loss_module(preds, labels) + loss.backward() + optimizer.step() + # Record statistics during training + true_preds += (preds.argmax(dim=-1) == labels).sum() + count += labels.shape[0] + train_acc = 
true_preds / count + + ############## + # Validation # + ############## + val_acc = test_model(net, val_loader) + val_scores.append(val_acc) + print( + f"[Epoch {epoch+1:2i}] Training accuracy: {train_acc*100.0:05.2f}%, Validation accuracy: {val_acc*100.0:05.2f}%" + ) + + if len(val_scores) == 1 or val_acc > val_scores[best_val_epoch]: + print("\t (New best performance, saving model...)") + save_model(net, CHECKPOINT_PATH, model_name) + best_val_epoch = epoch + elif best_val_epoch <= epoch - patience: + print(f"Early stopping due to no improvement over the last {patience} epochs") + break + + # Plot a curve of the validation accuracy + plt.plot([i for i in range(1, len(val_scores) + 1)], val_scores) + plt.xlabel("Epochs") + plt.ylabel("Validation accuracy") + plt.title(f"Validation performance of {model_name}") + plt.show() + plt.close() + + load_model(CHECKPOINT_PATH, model_name, net=net) + test_acc = test_model(net, test_loader) + print((f" Test accuracy: {test_acc*100.0:4.2f}% ").center(50, "=") + "\n") + return test_acc + + +def test_model(net, data_loader): + """Test a model on a specified dataset. + + Args: + net: Trained model of type BaseNetwork + data_loader: DataLoader object of the dataset to test on (validation or test) + """ + net.eval() + true_preds, count = 0.0, 0 + for imgs, labels in data_loader: + imgs, labels = imgs.to(device), labels.to(device) + with torch.no_grad(): + preds = net(imgs).argmax(dim=-1) + true_preds += (preds == labels).sum().item() + count += labels.shape[0] + test_acc = true_preds / count + return test_acc + + +# %% [markdown] +# We train one model for each activation function. +# We recommend using the pretrained models to save time if you are running this notebook on CPU. 
# %%
for act_fn_name, act_fn_class in act_fn_by_name.items():
    print(f"Training BaseNetwork with {act_fn_name} activation...")
    # Same seed for every activation function => same initialization and batch order
    set_seed(42)
    act_fn = act_fn_class()
    net_actfn = BaseNetwork(act_fn=act_fn).to(device)
    train_model(net_actfn, f"FashionMNIST_{act_fn_name}", overwrite=False)

# %% [markdown]
# Not surprisingly, the model using the sigmoid activation function fails and does not improve upon random performance (10 classes => 1/10 for random chance).
#
# All the other activation functions gain similar performance.
# To have a more accurate conclusion, we would have to train the models for multiple seeds and look at the averages.
# However, the "optimal" activation function also depends on many other factors (hidden sizes, number of layers, type of layers, task, dataset, optimizer, learning rate, etc.)
# so that a thorough grid search would not be useful in our case.
# In the literature, activation functions that have shown to work well
# with deep networks are all types of ReLU functions we experiment with
# here, with small gains for specific activation functions in specific
# networks.

# %% [markdown]
# ### Visualizing the activation distribution

# %% [markdown]
# After we have trained the models, we can look at the actual activation values that we find inside the model.
# For instance, how many neurons are set to zero in ReLU?
# Where do we find most values in Tanh?
# To answer these questions, we can write a simple function which takes a
# trained model, applies it to a batch of images, and plots the histogram
# of the activations inside the network:


# %%
def visualize_activations(net, color="C0"):
    """Plot a histogram of the outputs of every layer (except the last) for one batch of training images.

    Args:
        net: Object of class BaseNetwork
        color: Color in which we want to visualize the histograms
    """
    activations = {}

    net.eval()
    small_loader = data.DataLoader(train_set, batch_size=1024)
    imgs, _ = next(iter(small_loader))
    with torch.no_grad():
        imgs = imgs.to(device)
        imgs = imgs.view(imgs.size(0), -1)
        # We need to manually loop through the layers to save all activations
        for layer_index, layer in enumerate(net.layers[:-1]):
            imgs = layer(imgs)
            activations[layer_index] = imgs.view(-1).cpu().numpy()

    # Plotting
    columns = 4
    rows = math.ceil(len(activations) / columns)
    # squeeze=False always returns a 2D array of axes, so shallow networks whose
    # plots fit into a single row can be indexed by (row, column) as well
    fig, ax = plt.subplots(rows, columns, figsize=(columns * 2.7, rows * 2.5), squeeze=False)
    for fig_index, (key, values) in enumerate(activations.items()):
        key_ax = ax[fig_index // columns, fig_index % columns]
        sns.histplot(data=values, bins=50, ax=key_ax, color=color, kde=True, stat="density")
        key_ax.set_title(f"Layer {key} - {net.layers[key].__class__.__name__}")
    fig.suptitle(f"Activation distribution for activation function {net.config['act_fn']['name']}", fontsize=14)
    fig.subplots_adjust(hspace=0.4, wspace=0.4)
    plt.show()
    plt.close()


# %%
for i, act_fn_name in enumerate(act_fn_by_name):
    net_actfn = load_model(model_path=CHECKPOINT_PATH, model_name=f"FashionMNIST_{act_fn_name}").to(device)
    visualize_activations(net_actfn, color=f"C{i}")

# %% [markdown]
# As the model with sigmoid activation was not able to train properly, the activations are also less informative and all gathered around 0.5 (the activation at input 0).
#
# The tanh shows a more diverse behavior.
# While for the input layer we experience a larger amount of neurons to be close to -1 and 1, where the gradients are close to zero, the activations in the two consecutive layers are closer to zero.
+# This is probably because the input layers look for specific features in the input image, and the consecutive layers combine those together. +# The activations for the last layer are again more biased to the extreme points because the classification layer can be seen as a weighted average of those values (the gradients push the activations to those extremes). +# +# The ReLU has a strong peak at 0, as we initially expected. +# The effect of having no gradients for negative values is that the network does not have a Gaussian-like distribution after the linear layers, but a longer tail towards the positive values. +# The LeakyReLU shows a very similar behavior while ELU follows again a more Gaussian-like distribution. +# The Swish activation seems to lie in between, although it is worth noting that Swish uses significantly higher values than other activation functions (up to 20). +# +# As all activation functions show slightly different behavior although +# obtaining similar performance for our simple network, it becomes +# apparent that the selection of the "optimal" activation function really +# depends on many factors, and is not the same for all possible networks. + +# %% [markdown] +# ### Finding dead neurons in ReLU networks + +# %% [markdown] +# One known drawback of the ReLU activation is the occurrence of "dead neurons", i.e. neurons with no gradient for any training input. +# The issue of dead neurons is that as no gradient is provided for the layer, we cannot train the parameters of this neuron in the previous layer to obtain output values besides zero. +# For dead neurons to happen, the output value of a specific neuron of the linear layer before the ReLU has to be negative for all input images. +# Considering the large number of neurons we have in a neural network, it is not unlikely for this to happen. 
#
# To get a better understanding of how much of a problem this is, and when we need to be careful, we will measure how many dead neurons different networks have.
# For this, we implement a function which runs the network on the whole
# training set and records whether a neuron is exactly 0 for all data
# points or not:


# %%
@torch.no_grad()
def measure_number_dead_neurons(net):
    """Count and print the dead neurons per hidden layer of a network.

    Every neuron starts with the flag "dead" (True). As soon as a neuron has an activation different from 0 for any
    input, its flag is cleared. After running through the whole training set, only dead neurons keep a True flag.
    """
    # One boolean vector per hidden linear layer, same shapes as hidden sizes in BaseNetwork
    neurons_dead = []
    for layer in net.layers[:-1]:
        if isinstance(layer, nn.Linear):
            neurons_dead.append(torch.ones(layer.weight.shape[0], device=device, dtype=torch.bool))

    net.eval()
    for imgs, _ in tqdm(train_loader, leave=False):  # Run through whole training set
        layer_index = 0
        imgs = imgs.to(device)
        imgs = imgs.view(imgs.size(0), -1)
        for layer in net.layers[:-1]:
            imgs = layer(imgs)
            if not isinstance(layer, ActivationFunction):
                continue
            # A neuron stays dead only if it was dead so far and is 0 for every sample of this batch
            all_zero_in_batch = (imgs == 0).all(dim=0)
            neurons_dead[layer_index] = torch.logical_and(neurons_dead[layer_index], all_zero_in_batch)
            layer_index += 1
    number_neurons_dead = [t.sum().item() for t in neurons_dead]
    print("Number of dead neurons:", number_neurons_dead)
    percentages = []
    for tens, num_dead in zip(neurons_dead, number_neurons_dead):
        percentages.append(f"{(100.0 * num_dead / tens.shape[0]):4.2f}%")
    print("In percentage:", ", ".join(percentages))


# %% [markdown]
# First, we can measure the number of dead neurons for an untrained network:

# %%
set_seed(42)
net_relu = BaseNetwork(act_fn=ReLU())
net_relu = net_relu.to(device)
measure_number_dead_neurons(net_relu)

# %% [markdown]
# We see that only a minor amount of neurons are dead, but that they increase with the depth of the layer.
# However, this is not a problem for the small number of dead neurons we have as the input to later layers is changed due to updates to the weights of previous layers.
# Therefore, dead neurons in later layers can potentially become "alive"/active again.
#
# How does this look like for a trained network (with the same initialization)?

# %%
net_relu = load_model(model_path=CHECKPOINT_PATH, model_name="FashionMNIST_relu")
net_relu = net_relu.to(device)
measure_number_dead_neurons(net_relu)

# %% [markdown]
# The number of dead neurons indeed decreased in the later layers.
# However, it should be noted that dead neurons are especially problematic in the input layer.
# As the input does not change over epochs (the training set is kept as it is), training the network cannot turn those neurons back active.
# Still, the input data has usually a sufficiently high standard deviation to reduce the risk of dead neurons.
#
# Finally, we check how the number of dead neurons behaves with increasing layer depth.
+# For instance, let's take the following 10-layer neural network: + +# %% +set_seed(42) +net_relu = BaseNetwork( + act_fn=ReLU(), + hidden_sizes=[256, 256, 256, 256, 256, 128, 128, 128, 128, 128], +).to(device) +measure_number_dead_neurons(net_relu) + +# %% [markdown] +# The number of dead neurons is significantly higher than before which harms the gradient flow especially in the first iterations. +# For instance, more than 56% of the neurons in the pre-last layer are dead which creates a considerable bottleneck. +# Hence, it is advisable to use other nonlinearities like Swish for very deep networks. + +# %% [markdown] +# ## Conclusion +# +# In this notebook, we have reviewed a set of six activation functions (sigmoid, tanh, ReLU, LeakyReLU, ELU, and Swish) in neural networks, and discussed how they influence the gradient distribution across layers. +# Sigmoid tends to fail in deep neural networks as the highest gradient it provides is 0.25 leading to vanishing gradients in early layers. +# All ReLU-based activation functions have been shown to perform well, and besides the original ReLU, do not have the issue of dead neurons. +# When implementing your own neural network, it is recommended to start +# with a ReLU-based network and select the specific activation function +# based on the properties of the network. + +# %% [markdown] +# ## References +# +# [1] Ramachandran, Prajit, Barret Zoph, and Quoc V. Le. +# "Searching for activation functions." +# arXiv preprint arXiv:1710.05941 (2017). 
+# [Paper link](https://arxiv.org/abs/1710.05941) diff --git a/_notebooks/course_UvA-DL/03-initialization-and-optimization/.meta.yml b/_notebooks/course_UvA-DL/03-initialization-and-optimization/.meta.yml new file mode 100644 index 0000000..dee86a0 --- /dev/null +++ b/_notebooks/course_UvA-DL/03-initialization-and-optimization/.meta.yml @@ -0,0 +1,24 @@ +title: "Tutorial 3: Initialization and Optimization" +author: Phillip Lippe +created: 2021-08-27 +updated: 2023-03-14 +license: CC BY-SA +tags: + - Image + - Initialization + - Optimizers +description: | + In this tutorial, we will review techniques for optimization and initialization of neural networks. + When increasing the depth of neural networks, there are various challenges we face. + Most importantly, we need to have a stable gradient flow through the network, as otherwise, we might encounter vanishing or exploding gradients. + This is why we will take a closer look at the following concepts: initialization and optimization. + This notebook is part of a lecture series on Deep Learning at the University of Amsterdam. + The full list of tutorials can be found at https://uvadlc-notebooks.rtfd.io. 
+requirements: + - torchvision + - matplotlib + - seaborn + - lightning>=2.0.0rc0 +accelerator: + - CPU + - GPU diff --git a/docs/_static/images/course_UvA-DL/03-initialization-and-optimization.jpg b/_notebooks/course_UvA-DL/03-initialization-and-optimization/.thumb.jpg similarity index 100% rename from docs/_static/images/course_UvA-DL/03-initialization-and-optimization.jpg rename to _notebooks/course_UvA-DL/03-initialization-and-optimization/.thumb.jpg diff --git a/_notebooks/course_UvA-DL/03-initialization-and-optimization/Initialization_and_Optimization.py b/_notebooks/course_UvA-DL/03-initialization-and-optimization/Initialization_and_Optimization.py new file mode 100644 index 0000000..4fd6e47 --- /dev/null +++ b/_notebooks/course_UvA-DL/03-initialization-and-optimization/Initialization_and_Optimization.py @@ -0,0 +1,1157 @@ +# %% [markdown] +#
+# In the first half of the notebook, we will review different initialization techniques, and go step by step from the simplest initialization to methods that are nowadays used in very deep networks. +# In the second half, we focus on optimization comparing the optimizers SGD, SGD with Momentum, and Adam. +# +# Let's start with importing our standard libraries: + +# %% +import copy +import json +import math +import os +import urllib.request +from urllib.error import HTTPError + +import lightning as L +import matplotlib.pyplot as plt + +# %matplotlib inline +import matplotlib_inline.backend_inline +import numpy as np +import seaborn as sns +import torch +import torch.nn as nn +import torch.nn.functional as F +import torch.utils.data as data +from matplotlib import cm +from torchvision import transforms +from torchvision.datasets import FashionMNIST +from tqdm.notebook import tqdm + +matplotlib_inline.backend_inline.set_matplotlib_formats("svg", "pdf") # For export +sns.set() + +# %% [markdown] +# Instead of the `set_seed` function as in Tutorial 3, we can use Lightning's built-in function `L.seed_everything`. +# We will reuse the path variables `DATASET_PATH` and `CHECKPOINT_PATH` as in Tutorial 3. +# Adjust the paths if necessary. + +# %% +# Path to the folder where the datasets are/should be downloaded (e.g. 
MNIST) +DATASET_PATH = os.environ.get("PATH_DATASETS", "data/") +# Path to the folder where the pretrained models are saved +CHECKPOINT_PATH = os.environ.get("PATH_CHECKPOINT", "saved_models/InitOptim/") + +# Seed everything +L.seed_everything(42) + +# Ensure that all operations are deterministic on GPU (if used) for reproducibility +torch.backends.cudnn.deterministic = True +torch.backends.cudnn.benchmark = False + +# Fetching the device that will be used throughout this notebook +device = torch.device("cpu") if not torch.cuda.is_available() else torch.device("cuda:0") +print("Using device", device) + +# %% [markdown] +# In the last part of the notebook, we will train models using three different optimizers. +# The pretrained models for those are downloaded below. + +# %% +# Github URL where saved models are stored for this tutorial +base_url = "https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial4/" +# Files to download +pretrained_files = [ + "FashionMNIST_SGD.config", + "FashionMNIST_SGD_results.json", + "FashionMNIST_SGD.tar", + "FashionMNIST_SGDMom.config", + "FashionMNIST_SGDMom_results.json", + "FashionMNIST_SGDMom.tar", + "FashionMNIST_Adam.config", + "FashionMNIST_Adam_results.json", + "FashionMNIST_Adam.tar", +] +# Create checkpoint path if it doesn't exist yet +os.makedirs(CHECKPOINT_PATH, exist_ok=True) + +# For each file, check whether it already exists. If not, try downloading it. +for file_name in pretrained_files: + file_path = os.path.join(CHECKPOINT_PATH, file_name) + if not os.path.isfile(file_path): + file_url = base_url + file_name + print(f"Downloading {file_url}...") + try: + urllib.request.urlretrieve(file_url, file_path) + except HTTPError as e: + print( + "Something went wrong. 
Please try to download the file from the GDrive folder, or contact the author with the full output including the following error:\n", + e, + ) + +# %% [markdown] +# ## Preparation + +# %% [markdown] +# Throughout this notebook, we will use a deep fully connected network, similar to our previous tutorial. +# We will also again apply the network to FashionMNIST, so you can relate to the results of Tutorial 3. +# We start by loading the FashionMNIST dataset: + +# %% + +# Transformations applied on each image => first make them a tensor, then normalize them with mean 0 and std 1 +transform = transforms.Compose([transforms.ToTensor(), transforms.Normalize((0.2861,), (0.3530,))]) + +# Loading the training dataset. We need to split it into a training and validation part +train_dataset = FashionMNIST(root=DATASET_PATH, train=True, transform=transform, download=True) +train_set, val_set = torch.utils.data.random_split(train_dataset, [50000, 10000]) + +# Loading the test set +test_set = FashionMNIST(root=DATASET_PATH, train=False, transform=transform, download=True) + +# %% [markdown] +# We define a set of data loaders that we can use for various purposes later. +# Note that for actually training a model, we will use different data loaders +# with a lower batch size. + +# %% +train_loader = data.DataLoader(train_set, batch_size=1024, shuffle=True, drop_last=False) +val_loader = data.DataLoader(val_set, batch_size=1024, shuffle=False, drop_last=False) +test_loader = data.DataLoader(test_set, batch_size=1024, shuffle=False, drop_last=False) + +# %% [markdown] +# In comparison to the previous tutorial, we have changed the parameters of the normalization transformation `transforms.Normalize`. +# The normalization is now designed to give us an expected mean of 0 and a standard deviation of 1 across pixels. +# This will be particularly relevant for the discussion about initialization we will look at below, and hence we change it here. 
class BaseNetwork(nn.Module):
    """Fully connected classifier: (Linear -> act_fn) for every hidden size, then a final Linear layer."""

    def __init__(self, act_fn, input_size=784, num_classes=10, hidden_sizes=(512, 256, 256, 128)):
        """
        Args:
            act_fn: Object of the activation function that should be used as non-linearity in the network.
                The same object is inserted after every hidden linear layer.
            input_size: Size of the input images in pixels
            num_classes: Number of classes we want to predict
            hidden_sizes: A sequence of integers (list or tuple) specifying the hidden layer sizes in the NN
        """
        super().__init__()

        # Copy into a fresh list: avoids a shared mutable default, decouples the stored config from
        # the caller's object, and keeps the config JSON-serializable as a list.
        hidden_sizes = list(hidden_sizes)

        # Create the network based on the specified hidden sizes
        layers = []
        layer_sizes = [input_size] + hidden_sizes
        for in_dim, out_dim in zip(layer_sizes[:-1], layer_sizes[1:]):
            layers += [nn.Linear(in_dim, out_dim), act_fn]
        layers += [nn.Linear(layer_sizes[-1], num_classes)]
        # A module list registers a list of modules as submodules (e.g. for parameters)
        self.layers = nn.ModuleList(layers)

        # Hyperparameters needed to re-create this network; written to disk by save_model
        self.config = {
            "act_fn": act_fn.__class__.__name__,
            "input_size": input_size,
            "num_classes": num_classes,
            "hidden_sizes": hidden_sizes,
        }

    def forward(self, x):
        """Flatten everything but the batch dimension and apply all layers in order."""
        x = x.view(x.size(0), -1)
        for layer in self.layers:
            x = layer(x)
        return x


class Identity(nn.Module):
    """Activation function that returns its input unchanged."""

    def forward(self, x):
        return x


# Lookup from lower-cased activation name to the class implementing it
act_fn_by_name = {"tanh": nn.Tanh, "relu": nn.ReLU, "identity": Identity}
##############################################################


def plot_dists(val_dict, color="C0", xlabel=None, stat="count", use_kde=True):
    """Draw one histogram per entry of ``val_dict`` in a single row of subplots.

    Args:
        val_dict: Mapping from a panel title to an array of values (the callers in this file pass
            NumPy arrays). Panels are drawn in sorted key order.
        color: Color used for every histogram.
        xlabel: Optional x-axis label applied to every panel.
        stat: Aggregate statistic forwarded to ``sns.histplot``.
        use_kde: If True, a kernel density estimate is overlaid on panels whose values are not
            (almost) constant.

    Returns:
        The created figure.
    """
    columns = len(val_dict)
    # squeeze=False always yields a 2D array of axes; without it a single-entry dict gives a bare
    # Axes object and indexing it fails.
    fig, axes = plt.subplots(1, columns, figsize=(columns * 3, 2.5), squeeze=False)
    for key_ax, key in zip(axes[0], sorted(val_dict.keys())):
        values = val_dict[key]
        sns.histplot(
            values,
            ax=key_ax,
            color=color,
            bins=50,
            stat=stat,
            kde=use_kde and ((values.max() - values.min()) > 1e-8),
        )  # Only plot kde if there is variance
        hidden_dim_str = r"(%i $\to$ %i)" % (values.shape[1], values.shape[0]) if len(values.shape) > 1 else ""
        key_ax.set_title(f"{key} {hidden_dim_str}")
        if xlabel is not None:
            key_ax.set_xlabel(xlabel)
    fig.subplots_adjust(wspace=0.4)
    return fig


##############################################################


def visualize_weight_distribution(model, color="C0"):
    """Show a histogram of the weight values of every layer of ``model`` (biases are skipped).

    Args:
        model: Module whose parameter names have the layer index as second dot-separated
            component (e.g. ``layers.0.weight``).
        color: Color in which the histograms are drawn.
    """
    weights = {}
    for name, param in model.named_parameters():
        if name.endswith(".bias"):
            continue
        key_name = f"Layer {name.split('.')[1]}"
        weights[key_name] = param.detach().view(-1).cpu().numpy()

    # Plotting
    fig = plot_dists(weights, color=color, xlabel="Weight vals")
    fig.suptitle("Weight distribution", fontsize=14, y=1.05)
    plt.show()
    plt.close()


##############################################################


def visualize_gradients(model, color="C0", print_variance=False):
    """Show the gradient distribution of every weight tensor for one batch of training data.

    Args:
        model: Network to analyze (e.g. an object of class BaseNetwork). It is put into eval mode.
        color: Color in which we want to visualize the histogram (for easier separation of activation functions)
        print_variance: If True, additionally print the gradient variance of every weight tensor.
    """
    model.eval()
    small_loader = data.DataLoader(train_set, batch_size=1024, shuffle=False)
    imgs, labels = next(iter(small_loader))
    imgs, labels = imgs.to(device), labels.to(device)

    # Pass one batch through the network, and calculate the gradients for the weights
    model.zero_grad()
    preds = model(imgs)
    loss = F.cross_entropy(preds, labels)  # Same as nn.CrossEntropyLoss, but as a function instead of module
    loss.backward()
    # We limit our visualization to the weight parameters and exclude the bias to reduce the number of plots
    grads = {
        name: params.grad.view(-1).cpu().clone().numpy()
        for name, params in model.named_parameters()
        if "weight" in name
    }
    model.zero_grad()

    # Plotting
    fig = plot_dists(grads, color=color, xlabel="Grad magnitude")
    fig.suptitle("Gradient distribution", fontsize=14, y=1.05)
    plt.show()
    plt.close()

    if print_variance:
        for key in sorted(grads.keys()):
            print(f"{key} - Variance: {np.var(grads[key])}")


##############################################################


def visualize_activations(model, color="C0", print_variance=False):
    """Show the distribution of the outputs of every linear layer for one batch of training data.

    Args:
        model: Network exposing its layers as the iterable ``model.layers``. It is put into eval mode.
        color: Color in which the histograms are drawn.
        print_variance: If True, additionally print the variance of every recorded layer output.
    """
    model.eval()
    small_loader = data.DataLoader(train_set, batch_size=1024, shuffle=False)
    imgs, labels = next(iter(small_loader))
    imgs, labels = imgs.to(device), labels.to(device)

    # Pass one batch through the network layer by layer, and record the output of every linear layer
    feats = imgs.view(imgs.shape[0], -1)
    activations = {}
    with torch.no_grad():
        for layer_index, layer in enumerate(model.layers):
            feats = layer(feats)
            if isinstance(layer, nn.Linear):
                activations[f"Layer {layer_index}"] = feats.view(-1).detach().cpu().numpy()

    # Plotting
    fig = plot_dists(activations, color=color, stat="density", xlabel="Activation vals")
    fig.suptitle("Activation distribution", fontsize=14, y=1.05)
    plt.show()
    plt.close()

    if print_variance:
        for key in sorted(activations.keys()):
            print(f"{key} - Variance: {np.var(activations[key])}")


##############################################################
blog post](https://pouannes.github.io/blog/initialization)). +# In case something remains unclear after this tutorial, we recommend skimming through these blog posts as well. +# +# When initializing a neural network, there are a few properties we would like to have. +# First, the variance of the input should be propagated through the model to the last layer, so that we have a similar standard deviation for the output neurons. +# If the variance would vanish the deeper we go in our model, it becomes much harder to optimize the model as the input to the next layer is basically a single constant value. +# Similarly, if the variance increases, it is likely to explode (i.e. head to infinity) the deeper we design our model. +# The second property we look out for in initialization techniques is a gradient distribution with equal variance across layers. +# If the first layer receives much smaller gradients than the last layer, we will have difficulties in choosing an appropriate learning rate. +# +# As a starting point for finding a good method, we will analyze different initialization based on our linear neural network with no activation function (i.e. an identity). +# We do this because initializations depend on the specific activation +# function used in the network, and we can adjust the initialization +# schemes later on for our specific choice. + +# %% +model = BaseNetwork(act_fn=Identity()).to(device) + +# %% [markdown] +# ### Constant initialization +# +# The first initialization we can consider is to initialize all weights with the same constant value. +# Intuitively, setting all weights to zero is not a good idea as the propagated gradient will be zero. +# However, what happens if we set all weights to a value slightly larger or smaller than 0? +# To find out, we can implement a function for setting all parameters below and visualize the gradients. 
def const_init(model, fill=0.0):
    """Set every parameter of ``model`` (weights and biases alike) to the constant ``fill``.

    Args:
        model: Module whose parameters are overwritten in place.
        fill: Value written into every parameter element.
    """
    for param in model.parameters():
        # nn.init works under torch.no_grad(), so no ``.data`` access is needed
        nn.init.constant_(param, fill)


def var_init(model, std=0.01):
    """Sample every parameter of ``model`` (weights and biases alike) from a zero-mean Gaussian.

    Args:
        model: Module whose parameters are overwritten in place.
        std: Standard deviation shared by all parameters.
    """
    for param in model.parameters():
        nn.init.normal_(param, mean=0.0, std=std)
+# If we changed the hidden sizes or number of layers, we would have +# to search all over again, which is neither efficient nor recommended. + +# %% [markdown] +# ### How to find appropriate initialization values +# +# From our experiments above, we have seen that we need to sample the weights from a distribution, but are not sure which one exactly. +# As a next step, we will try to find the optimal initialization from the perspective of the activation distribution. +# For this, we state two requirements: +# +# 1. The mean of the activations should be zero +# 2. The variance of the activations should stay the same across every layer +# +# Suppose we want to design an initialization for the following layer: $y=Wx+b$ with $y\in\mathbb{R}^{d_y}$, $x\in\mathbb{R}^{d_x}$. +# Our goal is that the variance of each element of $y$ is the same as the input, i.e. $\text{Var}(y_i)=\text{Var}(x_i)=\sigma_x^{2}$, and that the mean is zero. +# We assume $x$ to also have a mean of zero, because, in deep neural networks, $y$ would be the input of another layer. +# This requires the bias and weight to have an expectation of 0. +# Actually, as $b$ is a single element per output neuron and is constant across different inputs, we set it to 0 overall. +# +# Next, we need to calculate the variance with which we need to initialize the weight parameters. +# Along the calculation, we will need the following variance rule: given two independent variables, the variance of their product is $\text{Var}(X\cdot Y) = \mathbb{E}(Y)^2\text{Var}(X) + \mathbb{E}(X)^2\text{Var}(Y) + \text{Var}(X)\text{Var}(Y) = \mathbb{E}(Y^2)\mathbb{E}(X^2)-\mathbb{E}(Y)^2\mathbb{E}(X)^2$ ($X$ and $Y$ are not referring to $x$ and $y$, but any random variable). 
def equal_var_init(model):
    """Initialize ``model`` so that the activation variance is preserved by a linear layer.

    Parameters whose name ends in ``.bias`` are set to zero. Every other parameter is sampled
    from a zero-mean Gaussian with variance ``1 / d_x``, where ``d_x`` is the size of its second
    dimension (the input dimension of an ``nn.Linear`` weight).

    Args:
        model: Module whose parameters are overwritten in place.
    """
    for name, param in model.named_parameters():
        if name.endswith(".bias"):
            nn.init.zeros_(param)
        else:
            # nn.init works under torch.no_grad(), so no ``.data`` access is needed
            nn.init.normal_(param, mean=0.0, std=1.0 / math.sqrt(param.shape[1]))
def xavier_init(model):
    """Apply the uniform Xavier (Glorot) initialization to ``model``.

    Parameters whose name ends in ``.bias`` are set to zero. Every other parameter is sampled
    uniformly from ``[-b, b]`` with ``b = sqrt(6) / sqrt(d_x + d_y)``, where ``d_y`` and ``d_x``
    are the sizes of its first and second dimension.

    Args:
        model: Module whose parameters are overwritten in place.
    """
    for name, param in model.named_parameters():
        if name.endswith(".bias"):
            nn.init.zeros_(param)
        else:
            bound = math.sqrt(6) / math.sqrt(param.shape[0] + param.shape[1])
            # nn.init works under torch.no_grad(), so no ``.data`` access is needed
            nn.init.uniform_(param, -bound, bound)
+# We can check if that is the case for us as well: + +# %% +model = BaseNetwork(act_fn=nn.Tanh()).to(device) +xavier_init(model) +visualize_gradients(model, print_variance=True) +visualize_activations(model, print_variance=True) + +# %% [markdown] +# Although the variance decreases over depth, it is apparent that the activation distribution becomes more focused on the low values. +# Therefore, our variance will stabilize around 0.25 if we would go even deeper. +# Hence, we can conclude that the Xavier initialization works well for Tanh networks. +# But what about ReLU networks? +# Here, we cannot take the previous assumption of the non-linearity becoming linear for small values. +# The ReLU activation function sets (in expectation) half of the inputs to 0 so that also the expectation of the input is not zero. +# However, as long as the expectation of $W$ is zero and $b=0$, the expectation of the output is zero. +# The part where the calculation of the ReLU initialization differs from the identity is when determining $\text{Var}(w_{ij}x_{j})$: +# +# $$\text{Var}(w_{ij}x_{j})=\underbrace{\mathbb{E}[w_{ij}^2]}_{=\text{Var}(w_{ij})}\mathbb{E}[x_{j}^2]-\underbrace{\mathbb{E}[w_{ij}]^2}_{=0}\mathbb{E}[x_{j}]^2=\text{Var}(w_{ij})\mathbb{E}[x_{j}^2]$$ +# +# If we assume now that $x$ is the output of a ReLU activation (from a previous layer, $x=max(0,\tilde{y})$), we can calculate the expectation as follows: +# +# +# $$ +# \begin{split} +# \mathbb{E}[x^2] & =\mathbb{E}[\max(0,\tilde{y})^2]\\ +# & =\frac{1}{2}\mathbb{E}[{\tilde{y}}^2]\hspace{2cm}\tilde{y}\text{ is zero-centered and symmetric}\\ +# & =\frac{1}{2}\text{Var}(\tilde{y}) +# \end{split}$$ +# +# Thus, we see that we have an additional factor of 1/2 in the equation, so that our desired weight variance becomes $2/d_x$. +# This gives us the Kaiming initialization (see [He, K. et al. +# (2015)](https://arxiv.org/pdf/1502.01852.pdf)). 
def kaiming_init(model):
    """Apply the Kaiming (He) normal initialization for ReLU networks to ``model``.

    Parameters whose name ends in ``.bias`` are set to zero. Weights are sampled from a zero-mean
    Gaussian with variance ``2 / d_x``, except for parameters whose name starts with ``layers.0``,
    which use variance ``1 / d_x``. ``d_x`` is the size of the parameter's second dimension.

    Args:
        model: Module whose parameters are overwritten in place.
    """
    for name, param in model.named_parameters():
        if name.endswith(".bias"):
            nn.init.zeros_(param)
        elif name.startswith("layers.0"):  # The first layer does not have ReLU applied on its input
            nn.init.normal_(param, 0, 1 / math.sqrt(param.shape[1]))
        else:
            # The factor 2 compensates for ReLU zeroing (in expectation) half of the layer's inputs
            nn.init.normal_(param, 0, math.sqrt(2) / math.sqrt(param.shape[1]))
def _get_config_file(model_path, model_name):
    """Return the path of the JSON file storing the hyperparameters of ``model_name``."""
    return os.path.join(model_path, model_name + ".config")


def _get_model_file(model_path, model_name):
    """Return the path of the file storing the state dict of ``model_name``."""
    return os.path.join(model_path, model_name + ".tar")


def _get_result_file(model_path, model_name):
    """Return the path of the JSON file storing the training results of ``model_name``."""
    return os.path.join(model_path, model_name + "_results.json")


def load_model(model_path, model_name, net=None):
    """Load a saved model from disk.

    Args:
        model_path: Directory containing the config and state-dict files.
        model_name: Name of the model, used to derive both file names.
        net: Optional network to load the weights into. If None, a BaseNetwork is created from
            the stored config.

    Returns:
        The network with the stored weights loaded.

    Raises:
        AssertionError: If one of the files is missing or the stored activation function is unknown.
    """
    config_file = _get_config_file(model_path, model_name)
    model_file = _get_model_file(model_path, model_name)
    assert os.path.isfile(
        config_file
    ), f'Could not find the config file "{config_file}". Are you sure this is the correct path and you have your model config stored here?'
    assert os.path.isfile(
        model_file
    ), f'Could not find the model file "{model_file}". Are you sure this is the correct path and you have your model stored here?'
    with open(config_file) as f:
        config_dict = json.load(f)
    if net is None:
        # save_model stores the activation as a plain class name string. Remove the entry from the
        # config so that it is not passed to BaseNetwork a second time. A dict of the form
        # {"name": ..., **kwargs} is accepted as well.
        act_fn_cfg = config_dict.pop("act_fn")
        act_fn_kwargs = {}
        if isinstance(act_fn_cfg, dict):
            act_fn_kwargs = dict(act_fn_cfg)
            act_fn_cfg = act_fn_kwargs.pop("name")
        act_fn_name = act_fn_cfg.lower()
        assert (
            act_fn_name in act_fn_by_name
        ), f'Unknown activation function "{act_fn_name}". Please add it to the "act_fn_by_name" dict.'
        act_fn = act_fn_by_name[act_fn_name](**act_fn_kwargs)
        net = BaseNetwork(act_fn=act_fn, **config_dict)
    # map_location lets checkpoints written on a GPU be read on a machine without one
    net.load_state_dict(torch.load(model_file, map_location=device))
    return net


def save_model(model, model_path, model_name):
    """Write the config (JSON) and the state dict of ``model`` to ``model_path``.

    Args:
        model: Network exposing a JSON-serializable ``config`` attribute.
        model_path: Target directory; created if it does not exist.
        model_name: Name of the model, used to derive both file names.
    """
    config_dict = model.config
    os.makedirs(model_path, exist_ok=True)
    config_file = _get_config_file(model_path, model_name)
    model_file = _get_model_file(model_path, model_name)
    with open(config_file, "w") as f:
        json.dump(config_dict, f)
    torch.save(model.state_dict(), model_file)


def train_model(net, model_name, optim_func, max_epochs=50, batch_size=256, overwrite=False):
    """Train a model on the training set of FashionMNIST.

    Args:
        net: Object of BaseNetwork
        model_name: (str) Name of the model, used for creating the checkpoint names
        optim_func: Callable that receives the model parameters and returns the optimizer to train with
        max_epochs: Number of epochs we want to train for
        batch_size: Size of batches used in training
        overwrite: Determines how to handle the case when there already exists a checkpoint. If True, it will be overwritten. Otherwise, we skip training.

    Returns:
        Dictionary with the keys "test_acc", "val_scores", "train_losses" and "train_scores" when
        the model was trained; otherwise the content of the stored results file.
    """
    file_exists = os.path.isfile(_get_model_file(CHECKPOINT_PATH, model_name))
    if file_exists and not overwrite:
        print(f'Model file of "{model_name}" already exists. Skipping training...')
        with open(_get_result_file(CHECKPOINT_PATH, model_name)) as f:
            results = json.load(f)
    else:
        if file_exists:
            print("Model file exists, but will be overwritten...")

        # Defining optimizer, loss and data loader
        optimizer = optim_func(net.parameters())
        loss_module = nn.CrossEntropyLoss()
        train_loader_local = data.DataLoader(
            train_set, batch_size=batch_size, shuffle=True, drop_last=True, pin_memory=True
        )

        val_scores = []
        train_losses, train_scores = [], []
        best_val_epoch = -1
        for epoch in range(max_epochs):
            train_acc, val_acc, epoch_losses = epoch_iteration(
                net, loss_module, optimizer, train_loader_local, val_loader, epoch
            )
            train_scores.append(train_acc)
            val_scores.append(val_acc)
            train_losses += epoch_losses

            if len(val_scores) == 1 or val_acc > val_scores[best_val_epoch]:
                print("\t (New best performance, saving model...)")
                save_model(net, CHECKPOINT_PATH, model_name)
                best_val_epoch = epoch

        # Evaluate the checkpoint with the best validation accuracy, not the last epoch's weights
        load_model(CHECKPOINT_PATH, model_name, net=net)
        test_acc = test_model(net, test_loader)
        results = {
            "test_acc": test_acc,
            "val_scores": val_scores,
            "train_losses": train_losses,
            "train_scores": train_scores,
        }
        with open(_get_result_file(CHECKPOINT_PATH, model_name), "w") as f:
            json.dump(results, f)

    # Plot a curve of the validation accuracy
    sns.set()
    plt.plot(list(range(1, len(results["train_scores"]) + 1)), results["train_scores"], label="Train")
    plt.plot(list(range(1, len(results["val_scores"]) + 1)), results["val_scores"], label="Val")
    plt.xlabel("Epochs")
    plt.ylabel("Validation accuracy")
    plt.ylim(min(results["val_scores"]), max(results["train_scores"]) * 1.01)
    plt.title(f"Validation performance of {model_name}")
    plt.legend()
    plt.show()
    plt.close()

    print((f" Test accuracy: {results['test_acc']*100.0:4.2f}% ").center(50, "=") + "\n")
    return results


def epoch_iteration(net, loss_module, optimizer, train_loader_local, val_loader, epoch):
    """Run one training epoch followed by an evaluation on the validation set.

    Args:
        net: Network to train.
        loss_module: Callable computing the loss from predictions and labels.
        optimizer: Object providing ``zero_grad()`` and ``step()``.
        train_loader_local: Iterable of (images, labels) training batches.
        val_loader: Iterable of (images, labels) validation batches.
        epoch: Zero-based epoch index, only used for progress output.

    Returns:
        Tuple (training accuracy, validation accuracy, list with the loss of every training batch).
    """
    ############
    # Training #
    ############
    net.train()
    true_preds, count = 0.0, 0
    epoch_losses = []
    t = tqdm(train_loader_local, leave=False)
    for imgs, labels in t:
        imgs, labels = imgs.to(device), labels.to(device)
        optimizer.zero_grad()
        preds = net(imgs)
        loss = loss_module(preds, labels)
        loss.backward()
        optimizer.step()
        # Record statistics during training
        true_preds += (preds.argmax(dim=-1) == labels).sum().item()
        count += labels.shape[0]
        t.set_description(f"Epoch {epoch+1}: loss={loss.item():4.2f}")
        epoch_losses.append(loss.item())
    train_acc = true_preds / count

    ##############
    # Validation #
    ##############
    val_acc = test_model(net, val_loader)
    # "d" is the integer presentation type; "i" is only valid in %-style formatting
    print(
        f"[Epoch {epoch+1:2d}] Training accuracy: {train_acc*100.0:05.2f}%, Validation accuracy: {val_acc*100.0:05.2f}%"
    )
    return train_acc, val_acc, epoch_losses


def test_model(net, data_loader):
    """Test a model on a specified dataset.

    Args:
        net: Trained model of type BaseNetwork
        data_loader: DataLoader object of the dataset to test on (validation or test)

    Returns:
        Fraction of correctly classified samples.
    """
    net.eval()
    true_preds, count = 0.0, 0
    for imgs, labels in data_loader:
        imgs, labels = imgs.to(device), labels.to(device)
        with torch.no_grad():
            preds = net(imgs).argmax(dim=-1)
            true_preds += (preds == labels).sum().item()
            count += labels.shape[0]
    test_acc = true_preds / count
    return test_acc
# A higher learning rate means that we change the weights more in the direction of the gradients, a smaller means we take shorter steps.
#
# As most optimizers only differ in the implementation of $f$, we can define a template for an optimizer in PyTorch below.
# We take as input the parameters of a model and a learning rate.
# The function `zero_grad` sets the gradients of all parameters to zero, which we have to do before calling `loss.backward()`.
# Finally, the `step()` function tells the optimizer to update all weights based on their gradients.
# The template is set up below:


# %%
class OptimizerTemplate:
    """Base class for the hand-written optimizers: subclasses only implement ``update_param``."""

    def __init__(self, params, lr):
        # Materialise the iterable once so it can be traversed on every step
        self.lr = lr
        self.params = list(params)

    def zero_grad(self):
        """Reset the gradient of every parameter that currently has one."""
        for param in self.params:
            grad = param.grad
            if grad is None:
                continue
            grad.detach_()  # For second-order optimizers important
            grad.zero_()

    @torch.no_grad()
    def step(self):
        """Apply ``update_param`` to each parameter that received a gradient."""
        for param in self.params:
            if param.grad is not None:  # Parameters without any gradients are skipped
                self.update_param(param)

    def update_param(self, p):
        """Update a single parameter in place; provided by optimizer-specific subclasses."""
        raise NotImplementedError


# %% [markdown]
# The first optimizer we are going to implement is the standard Stochastic Gradient Descent (SGD).
# SGD updates the parameters using the following equation:
#
# $$
# \begin{split}
# w^{(t)} & = w^{(t-1)} - \eta \cdot g^{(t)}
# \end{split}
# $$
#
# As simple as the equation is also our implementation of SGD:


# %%
class SGD(OptimizerTemplate):
    """Plain stochastic gradient descent; the constructor is inherited as ``(params, lr)``."""

    def update_param(self, p):
        # In-place update => saves memory and does not create computation graph
        p.add_(-self.lr * p.grad)


# %% [markdown]
# In the lecture, we also have discussed the concept of momentum which replaces the gradient in the update by an exponential average of all past gradients including the current one:
#
# $$
# \begin{split}
# m^{(t)} & = \beta_1 m^{(t-1)} + (1 - \beta_1)\cdot g^{(t)}\\
# w^{(t)} & = w^{(t-1)} - \eta \cdot m^{(t)}\\
# \end{split}
# $$
#
# Let's also implement it below:


# %%
class SGDMomentum(OptimizerTemplate):
    """SGD whose step follows an exponential moving average of the gradients."""

    def __init__(self, params, lr, momentum=0.0):
        super().__init__(params, lr)
        self.momentum = momentum  # Corresponds to beta_1 in the equation above
        # One zero-initialised buffer per parameter to store m_t
        self.param_momentum = {}
        for param in self.params:
            self.param_momentum[param] = torch.zeros_like(param.data)

    def update_param(self, p):
        beta = self.momentum
        averaged = (1 - beta) * p.grad + beta * self.param_momentum[p]
        self.param_momentum[p] = averaged
        p.add_(-self.lr * averaged)


# %% [markdown]
# Finally, we arrive at Adam.
# Adam combines the idea of momentum with an adaptive learning rate, which is based on an exponential average of the squared gradients, i.e. the gradients norm.
# Furthermore, we add a bias correction for the momentum and adaptive learning rate for the first iterations:
#
# $$
# \begin{split}
# m^{(t)} & = \beta_1 m^{(t-1)} + (1 - \beta_1)\cdot g^{(t)}\\
# v^{(t)} & = \beta_2 v^{(t-1)} + (1 - \beta_2)\cdot \left(g^{(t)}\right)^2\\
# \hat{m}^{(t)} & = \frac{m^{(t)}}{1-\beta^{t}_1}, \hat{v}^{(t)} = \frac{v^{(t)}}{1-\beta^{t}_2}\\
# w^{(t)} & = w^{(t-1)} - \frac{\eta}{\sqrt{\hat{v}^{(t)}} + \epsilon}\circ \hat{m}^{(t)}\\
# \end{split}
# $$
#
# Epsilon is a small constant used to improve numerical stability for very small gradient norms.
# Remember that the adaptive learning rate does not replace the learning
# rate hyperparameter $\eta$, but rather acts as an extra factor and
# ensures that the gradients of various parameters have a similar norm.


# %%
class Adam(OptimizerTemplate):
    """Adam: bias-corrected first and second moment estimates with a per-element step size."""

    def __init__(self, params, lr, beta1=0.9, beta2=0.999, eps=1e-8):
        super().__init__(params, lr)
        self.beta1, self.beta2, self.eps = beta1, beta2, eps
        # Remembers "t" for each parameter for bias correction
        self.param_step = dict.fromkeys(self.params, 0)
        # Zero-initialised running averages of the gradient and of the squared gradient
        self.param_momentum = {}
        self.param_2nd_momentum = {}
        for param in self.params:
            self.param_momentum[param] = torch.zeros_like(param.data)
            self.param_2nd_momentum[param] = torch.zeros_like(param.data)

    def update_param(self, p):
        self.param_step[p] += 1
        t = self.param_step[p]
        grad = p.grad

        first = (1 - self.beta1) * grad + self.beta1 * self.param_momentum[p]
        second = (1 - self.beta2) * (grad) ** 2 + self.beta2 * self.param_2nd_momentum[p]
        self.param_momentum[p] = first
        self.param_2nd_momentum[p] = second

        # Both averages start at zero, so they are rescaled by 1 - beta^t
        second_hat = second / (1 - self.beta2**t)
        first_hat = first / (1 - self.beta1**t)
        step_size = self.lr / (torch.sqrt(second_hat) + self.eps)

        p.add_(-step_size * first_hat)


# %% [markdown]
# ### Comparing optimizers on model training
#
# After we have implemented three optimizers (SGD, SGD with momentum,
# and Adam), we can start to analyze and compare them.
# First, we test them on how well they can optimize a neural network on the FashionMNIST dataset.
# We use again our linear network, this time with a ReLU activation and the kaiming initialization, which we have found before to work well for ReLU-based networks.
# Note that the model is over-parameterized for this task, and we can achieve similar performance with a much smaller network (for example `100,100,100`).
# However, our main interest is in how well the optimizer can train *deep*
# neural networks, hence the over-parameterization.

# %%
# Shared starting point: every optimizer below trains its own deep copy of this network
base_model = BaseNetwork(act_fn=nn.ReLU(), hidden_sizes=[512, 256, 256, 128])
kaiming_init(base_model)

# %% [markdown]
# For a fair comparison, we train the exact same model with the same seed with the three optimizers below.
# Feel free to change the hyperparameters if you want (however, you have to train your own model then).

# %%
# Each lambda is the `optim_func` of train_model: it receives the parameters and builds the optimizer
SGD_model = copy.deepcopy(base_model).to(device)
SGD_results = train_model(
    SGD_model, "FashionMNIST_SGD", lambda params: SGD(params, lr=1e-1), max_epochs=40, batch_size=256
)

# %%
SGDMom_model = copy.deepcopy(base_model).to(device)
SGDMom_results = train_model(
    SGDMom_model,
    "FashionMNIST_SGDMom",
    lambda params: SGDMomentum(params, lr=1e-1, momentum=0.9),
    max_epochs=40,
    batch_size=256,
)

# %%
# Note the smaller learning rate for Adam (1e-3 instead of 1e-1)
Adam_model = copy.deepcopy(base_model).to(device)
Adam_results = train_model(
    Adam_model, "FashionMNIST_Adam", lambda params: Adam(params, lr=1e-3), max_epochs=40, batch_size=256
)

# %% [markdown]
# The result is that all optimizers perform similarly well with the given model.
# The differences are too small to find any significant conclusion.
# However, keep in mind that this can also be attributed to the initialization we chose.
# When changing the initialization to worse (e.g. constant initialization), Adam usually shows to be more robust because of its adaptive learning rate.
# To show the specific benefits of the optimizers, we will continue to
# look at some possible loss surfaces in which momentum and adaptive
# learning rate are crucial.

# %% [markdown]
# ### Pathological curvatures
#
# A pathological curvature is a type of surface that is similar to ravines and is particularly tricky for plain SGD optimization.
# In words, pathological curvatures typically have a steep gradient in one direction with an optimum at the center, while in a second direction we have a slower gradient towards a (global) optimum.
# Let's first create an example surface of this and visualize it:


# %%
def pathological_curve_loss(w1, w2):
    """Ravine-shaped example loss: steep around ``w1 = 0``, slowly decreasing along ``w2``."""
    # Example of a pathological curvature. There are many more possible, feel free to experiment here!
    x1_loss = torch.tanh(w1) ** 2 + 0.01 * torch.abs(w1)
    x2_loss = torch.sigmoid(w2)
    return x1_loss + x2_loss


# %%
def plot_curve(
    curve_fn, x_range=(-5, 5), y_range=(-5, 5), plot_3d=False, cmap=cm.viridis, title="Pathological curvature"
):
    """Plot ``curve_fn`` over a 100-step grid, either as a 3D surface or as a 2D image.

    Args:
        curve_fn: Callable mapping two equally shaped tensors ``(w1, w2)`` to a loss tensor.
        x_range: ``(min, max)`` of the grid along ``w1``.
        y_range: ``(min, max)`` of the grid along ``w2``.
        plot_3d: If True draw a surface plot, otherwise an image of the loss values.
        cmap: Matplotlib colormap used for the loss values.
        title: Figure title.

    Returns:
        The matplotlib axes the curve was drawn on.
    """
    fig = plt.figure()
    # Create exactly one axes with the right projection. Calling gca() first and then adding
    # a 3D subplot left an empty 2D axes drawn behind the surface.
    ax = fig.add_subplot(projection="3d") if plot_3d else fig.gca()

    x = torch.arange(x_range[0], x_range[1], (x_range[1] - x_range[0]) / 100.0)
    y = torch.arange(y_range[0], y_range[1], (y_range[1] - y_range[0]) / 100.0)
    # "ij" is what the implicit default produced; stating it avoids torch's deprecation warning
    x, y = torch.meshgrid(x, y, indexing="ij")
    z = curve_fn(x, y)
    x, y, z = x.numpy(), y.numpy(), z.numpy()

    if plot_3d:
        ax.plot_surface(x, y, z, cmap=cmap, linewidth=1, color="#000", antialiased=False)
        ax.set_zlabel("loss")
    else:
        # Transpose and flip so that w1 runs left-to-right and w2 bottom-to-top in the image
        ax.imshow(z.T[::-1], cmap=cmap, extent=(x_range[0], x_range[1], y_range[0], y_range[1]))
    plt.title(title)
    ax.set_xlabel(r"$w_1$")
    ax.set_ylabel(r"$w_2$")
    plt.tight_layout()
    return ax


sns.reset_orig()
_ = plot_curve(pathological_curve_loss, plot_3d=True)
plt.show()

# %% [markdown]
# In terms of optimization, you can imagine that $w_1$ and $w_2$ are weight parameters, and the curvature represents the loss surface over the space of $w_1$ and $w_2$.
# Note that in typical networks, we have many, many more parameters than two, and such curvatures can occur in multi-dimensional spaces as well.
#
# Ideally, our optimization algorithm would find the center of the ravine and focuses on optimizing the parameters towards the direction of $w_2$.
# However, if we encounter a point along the ridges, the gradient is much greater in $w_1$ than $w_2$, and we might end up jumping from one side to the other.
# Due to the large gradients, we would have to reduce our learning rate slowing down learning significantly.
#
# To test our algorithms, we can implement a simple function to train two parameters on such a surface:


# %%
def train_curve(optimizer_func, curve_func=pathological_curve_loss, num_updates=100, init=(5, 5)):
    """Optimize two parameters on a loss surface and record the trajectory.

    Args:
        optimizer_func: Constructor of the optimizer to use. Should only take a parameter list
        curve_func: Loss function (e.g. pathological curvature)
        num_updates: Number of updates/steps to take when optimizing
        init: Initial values of parameters. Must be a list/tuple with two elements representing w_1 and w_2
    Returns:
        Numpy array of shape [num_updates, 3] with [t,:2] being the parameter values at step t, and [t,2] the loss at t.
    """
    # torch.tensor copies `init`, so the caller's sequence is never touched by the in-place updates
    weights = nn.Parameter(torch.tensor(init, dtype=torch.float32), requires_grad=True)
    optimizer = optimizer_func([weights])

    list_points = []
    for _ in range(num_updates):
        loss = curve_func(weights[0], weights[1])
        # Record the point *before* the update; torch.cat copies, so later steps do not alter it
        list_points.append(torch.cat([weights.detach(), loss.detach().unsqueeze(dim=0)], dim=0))
        optimizer.zero_grad()
        loss.backward()
        optimizer.step()
    return torch.stack(list_points, dim=0).numpy()


# %% [markdown]
# Next, let's apply the different optimizers on our curvature.
# Note that we set a much higher learning rate for the optimization algorithms than you would in a standard neural network.
# This is because we only have 2 parameters instead of tens of thousands or even millions.

# %%
# One trajectory per optimizer, each started from train_curve's default initial point
SGD_points = train_curve(lambda params: SGD(params, lr=10))
SGDMom_points = train_curve(lambda params: SGDMomentum(params, lr=10, momentum=0.9))
Adam_points = train_curve(lambda params: Adam(params, lr=1))

# %% [markdown]
# To understand best how the different algorithms worked, we visualize the update step as a line plot through the loss surface.
# We will stick with a 2D representation for readability.

# %%
all_points = np.concatenate([SGD_points, SGDMom_points, Adam_points], axis=0)
# x-range is symmetric around 0 (largest |w_1| visited); y-range spans the visited w_2 values
ax = plot_curve(
    pathological_curve_loss,
    x_range=(-np.absolute(all_points[:, 0]).max(), np.absolute(all_points[:, 0]).max()),
    y_range=(all_points[:, 1].min(), all_points[:, 1].max()),
    plot_3d=False,
)
ax.plot(SGD_points[:, 0], SGD_points[:, 1], color="red", marker="o", zorder=1, label="SGD")
ax.plot(SGDMom_points[:, 0], SGDMom_points[:, 1], color="blue", marker="o", zorder=2, label="SGDMom")
ax.plot(Adam_points[:, 0], Adam_points[:, 1], color="grey", marker="o", zorder=3, label="Adam")
plt.legend()
plt.show()

# %% [markdown]
# We can clearly see that SGD is not able to find the center of the optimization curve and has a problem converging due to the steep gradients in $w_1$.
# In contrast, Adam and SGD with momentum nicely converge as the changing direction of $w_1$ is canceling itself out.
# On such surfaces, it is crucial to use momentum.

# %% [markdown]
# ### Steep optima
#
# A second type of challenging loss surfaces are steep optima.
# In those, we have a larger part of the surface having very small gradients while around the optimum, we have very large gradients.
# For instance, take the following loss surfaces:


# %%
def bivar_gaussian(w1, w2, x_mean=0.0, y_mean=0.0, x_sig=1.0, y_sig=1.0):
    """Density of an axis-aligned bivariate Gaussian evaluated at ``(w1, w2)``."""
    scale = 1 / (2 * np.pi * x_sig * y_sig)
    exponent_x = -((w1 - x_mean) ** 2) / (2 * x_sig**2)
    exponent_y = -((w2 - y_mean) ** 2) / (2 * y_sig**2)
    return scale * torch.exp(exponent_x + exponent_y)


def comb_func(w1, w2):
    """Loss surface with three narrow minima: the negated sum of three sharp Gaussians."""
    (first_x, first_y), *other_centers = ((1.0, -0.5), (-1.0, 0.5), (-0.5, -0.8))
    z = -bivar_gaussian(w1, w2, x_mean=first_x, y_mean=first_y, x_sig=0.2, y_sig=0.2)
    for center_x, center_y in other_centers:
        z = z - bivar_gaussian(w1, w2, x_mean=center_x, y_mean=center_y, x_sig=0.2, y_sig=0.2)
    return z


_ = plot_curve(comb_func, x_range=(-2, 2), y_range=(-2, 2), plot_3d=True, title="Steep optima")

# %% [markdown]
# Most of the loss surface has very little to no gradients.
# However, close to the optima, we have very steep gradients.
# To reach the minimum when starting in a region with lower gradients, we expect an adaptive learning rate to be crucial.
# To verify this hypothesis, we can run our three optimizers on the surface:

# %%
SGD_points = train_curve(lambda params: SGD(params, lr=0.5), comb_func, init=[0, 0])
SGDMom_points = train_curve(lambda params: SGDMomentum(params, lr=1, momentum=0.9), comb_func, init=[0, 0])
Adam_points = train_curve(lambda params: Adam(params, lr=0.2), comb_func, init=[0, 0])

all_points = np.concatenate([SGD_points, SGDMom_points, Adam_points], axis=0)
ax = plot_curve(comb_func, x_range=(-2, 2), y_range=(-2, 2), plot_3d=False, title="Steep optima")
ax.plot(SGD_points[:, 0], SGD_points[:, 1], color="red", marker="o", zorder=3, label="SGD", alpha=0.7)
ax.plot(SGDMom_points[:, 0], SGDMom_points[:, 1], color="blue", marker="o", zorder=2, label="SGDMom", alpha=0.7)
ax.plot(Adam_points[:, 0], Adam_points[:, 1], color="grey", marker="o", zorder=1, label="Adam", alpha=0.7)
ax.set_xlim(-2, 2)
ax.set_ylim(-2, 2)
plt.legend()
plt.show()

# %% [markdown]
# SGD first takes very small steps until it touches the border of the
optimum. +# First reaching a point around $(-0.75,-0.5)$, the gradient direction has changed and pushes the parameters to $(0.8,0.5)$ from which SGD cannot recover anymore (only with many, many steps). +# SGD with momentum has a similar problem, only that it keeps moving in the direction in which it first touched the optimum. +# The gradients from this time step are so much larger than at any other point that the momentum $m_t$ is overpowered by them. +# Finally, Adam is able to converge to the optimum, showing the importance of adaptive learning rates. + +# %% [markdown] +# ### What optimizer to take +# +# After seeing the results on optimization, what is our conclusion? +# Should we always use Adam and never look at SGD anymore? +# The short answer: no. +# There are many papers saying that in certain situations, SGD (with momentum) generalizes better where Adam often tends to overfit [5,6]. +# This is related to the idea of finding wider optima. +# For instance, see the illustration of different optima below (credit: [Keskar et al., 2017](https://arxiv.org/pdf/1609.04836.pdf)): +# +# 
+# +# The black line represents the training loss surface, while the dotted red line is the test loss. +# Finding sharp, narrow minima can be helpful for finding the minimal training loss. +# However, this doesn't mean that it also minimizes the test loss as especially flat minima have shown to generalize better. +# You can imagine that the test dataset has a slightly shifted loss surface due to the different examples than in the training set. +# A small change can have a significant influence for sharp minima, while flat minima are generally more robust to this change. +# +# In the next tutorial, we will see that some network types can still be better optimized with SGD and learning rate scheduling than Adam. +# Nevertheless, Adam is the most commonly used optimizer in Deep Learning +# as it usually performs better than other optimizers, especially for deep +# networks. + +# %% [markdown] +# ## Conclusion +# +# In this tutorial, we have looked at initialization and optimization techniques for neural networks. +# We have seen that a good initialization has to balance the preservation of the gradient variance as well as the activation variance. +# This can be achieved with the Xavier initialization for tanh-based networks, and the Kaiming initialization for ReLU-based networks. +# In optimization, concepts like momentum and adaptive learning rate can help with challenging loss surfaces but don't guarantee an increase in performance for neural networks. +# +# +# ## References +# +# [1] Glorot, Xavier, and Yoshua Bengio. +# "Understanding the difficulty of training deep feedforward neural networks." +# Proceedings of the thirteenth international conference on artificial intelligence and statistics. +# 2010. +# [link](http://proceedings.mlr.press/v9/glorot10a/glorot10a.pdf) +# +# [2] He, Kaiming, et al. +# "Delving deep into rectifiers: Surpassing human-level performance on imagenet classification." 
+# Proceedings of the IEEE international conference on computer vision. +# 2015. +# [link](https://www.cv-foundation.org/openaccess/content_iccv_2015/html/He_Delving_Deep_into_ICCV_2015_paper.html) +# +# [3] Kingma, Diederik P. & Ba, Jimmy. +# "Adam: A Method for Stochastic Optimization." +# Proceedings of the third international conference for learning representations (ICLR). +# 2015. +# [link](https://arxiv.org/abs/1412.6980) +# +# [4] Keskar, Nitish Shirish, et al. +# "On large-batch training for deep learning: Generalization gap and sharp minima." +# Proceedings of the fifth international conference for learning representations (ICLR). +# 2017. +# [link](https://arxiv.org/abs/1609.04836) +# +# [5] Wilson, Ashia C., et al. +# "The Marginal Value of Adaptive Gradient Methods in Machine Learning." +# Advances in neural information processing systems. +# 2017. +# [link](https://papers.nips.cc/paper/7003-the-marginal-value-of-adaptive-gradient-methods-in-machine-learning.pdf) +# +# [6] Ruder, Sebastian. +# "An overview of gradient descent optimization algorithms." +# arXiv preprint. +# 2017. 
+# [link](https://arxiv.org/abs/1609.04747) diff --git a/_notebooks/course_UvA-DL/03-initialization-and-optimization/flat_vs_sharp_minima.svg b/_notebooks/course_UvA-DL/03-initialization-and-optimization/flat_vs_sharp_minima.svg new file mode 100644 index 0000000..c7b6225 --- /dev/null +++ b/_notebooks/course_UvA-DL/03-initialization-and-optimization/flat_vs_sharp_minima.svg @@ -0,0 +1,1456 @@ + + + + + + image/svg+xmldiff --git a/_notebooks/course_UvA-DL/04-inception-resnet-densenet/.meta.yaml b/_notebooks/course_UvA-DL/04-inception-resnet-densenet/.meta.yaml new file mode 100644 index 0000000..dc7b7b0 --- /dev/null +++ b/_notebooks/course_UvA-DL/04-inception-resnet-densenet/.meta.yaml @@ -0,0 +1,23 @@ +title: "Tutorial 4: Inception, ResNet and DenseNet" +author: Phillip Lippe +created: 2021-08-27 +updated: 2023-03-14 +license: CC BY-SA +tags: + - Image +description: | + In this tutorial, we will implement and discuss variants of modern CNN architectures. + There have been many different architectures been proposed over the past few years. + Some of the most impactful ones, and still relevant today, are the following: [GoogleNet](https://arxiv.org/abs/1409.4842)/Inception architecture (winner of ILSVRC 2014), [ResNet](https://arxiv.org/abs/1512.03385) (winner of ILSVRC 2015), and [DenseNet](https://arxiv.org/abs/1608.06993) (best paper award CVPR 2017). + All of them were state-of-the-art models when being proposed, and the core ideas of these networks are the foundations for most current state-of-the-art architectures. + Thus, it is important to understand these architectures in detail and learn how to implement them. + This notebook is part of a lecture series on Deep Learning at the University of Amsterdam. + The full list of tutorials can be found at https://uvadlc-notebooks.rtfd.io. 
+requirements: + - torchvision + - matplotlib + - seaborn + - tabulate + - lightning>=2.0.0rc0 +accelerator: + - GPU diff --git a/docs/_static/images/course_UvA-DL/04-inception-resnet-densenet.jpg b/_notebooks/course_UvA-DL/04-inception-resnet-densenet/.thumb.jpg similarity index 100% rename from docs/_static/images/course_UvA-DL/04-inception-resnet-densenet.jpg rename to _notebooks/course_UvA-DL/04-inception-resnet-densenet/.thumb.jpg diff --git a/_notebooks/course_UvA-DL/04-inception-resnet-densenet/Inception_ResNet_DenseNet.py b/_notebooks/course_UvA-DL/04-inception-resnet-densenet/Inception_ResNet_DenseNet.py new file mode 100644 index 0000000..ffee8ff --- /dev/null +++ b/_notebooks/course_UvA-DL/04-inception-resnet-densenet/Inception_ResNet_DenseNet.py @@ -0,0 +1,1207 @@ +# %% [markdown] +#
# Let's start with importing our standard libraries here.

# %%
import os
import urllib.request
from types import SimpleNamespace
from urllib.error import HTTPError

import lightning as L
import matplotlib
import matplotlib.pyplot as plt
import matplotlib_inline.backend_inline
import numpy as np
import seaborn as sns
import tabulate
import torch
import torch.nn as nn
import torch.optim as optim
import torch.utils.data as data
import torchvision

# %matplotlib inline
from IPython.display import HTML, display
from lightning.pytorch.callbacks import LearningRateMonitor, ModelCheckpoint
from PIL import Image
from torchvision import transforms
from torchvision.datasets import CIFAR10

matplotlib_inline.backend_inline.set_matplotlib_formats("svg", "pdf")  # For export
matplotlib.rcParams["lines.linewidth"] = 2.0
sns.reset_orig()

# PyTorch
# Torchvision

# %% [markdown]
# We will use the same `set_seed` function as in the previous tutorials, as well as the path variables `DATASET_PATH` and `CHECKPOINT_PATH`.
# Adjust the paths if necessary.

# %%
# Path to the folder where the datasets are/should be downloaded (e.g. CIFAR10)
# (overridable through the PATH_DATASETS environment variable)
DATASET_PATH = os.environ.get("PATH_DATASETS", "data/")
# Path to the folder where the pretrained models are saved
# (overridable through the PATH_CHECKPOINT environment variable)
CHECKPOINT_PATH = os.environ.get("PATH_CHECKPOINT", "saved_models/ConvNets")


# Setting the seed (via Lightning's helper instead of a hand-written function)
L.seed_everything(42)

# Ensure that all operations are deterministic on GPU (if used) for reproducibility
torch.backends.cudnn.deterministic = True
torch.backends.cudnn.benchmark = False

# Use the first CUDA device when one is available, otherwise fall back to the CPU
device = torch.device("cuda:0") if torch.cuda.is_available() else torch.device("cpu")

# %% [markdown]
# We also have pretrained models and Tensorboards (more on this later) for this tutorial, and download them below.

# %%
# Github URL where saved models are stored for this tutorial
# NOTE(review): the remote folder is named "tutorial5" although this is Tutorial 4 —
# presumably the numbering of the upstream course repository; confirm before changing.
base_url = "https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial5/"
# Files to download
pretrained_files = [
    "GoogleNet.ckpt",
    "ResNet.ckpt",
    "ResNetPreAct.ckpt",
    "DenseNet.ckpt",
    "tensorboards/GoogleNet/events.out.tfevents.googlenet",
    "tensorboards/ResNet/events.out.tfevents.resnet",
    "tensorboards/ResNetPreAct/events.out.tfevents.resnetpreact",
    "tensorboards/DenseNet/events.out.tfevents.densenet",
]
# Create checkpoint path if it doesn't exist yet
os.makedirs(CHECKPOINT_PATH, exist_ok=True)

# For each file, check whether it already exists. If not, try downloading it.
for file_name in pretrained_files:
    file_path = os.path.join(CHECKPOINT_PATH, file_name)
    if "/" in file_name:
        # Entries with sub-folders need their parent directory created first
        os.makedirs(file_path.rsplit("/", 1)[0], exist_ok=True)
    if not os.path.isfile(file_path):
        file_url = base_url + file_name
        print(f"Downloading {file_url}...")
        try:
            urllib.request.urlretrieve(file_url, file_path)
        except HTTPError as e:
            # Best effort: a failed download is reported and the loop moves on to the next file.
            # Only HTTPError is handled here; other failures propagate.
            print(
                "Something went wrong. Please try to download the file from the GDrive folder, or contact the author with the full output including the following error:\n",
                e,
            )

# %% [markdown]
# Throughout this tutorial, we will train and evaluate the models on the CIFAR10 dataset.
# This allows you to compare the results obtained here with the model you have implemented in the first assignment.
# As we have learned from the previous tutorial about initialization, it is important to have the data preprocessed with a zero mean.
# Therefore, as a first step, we will calculate the mean and standard deviation of the CIFAR dataset:

# %%
train_dataset = CIFAR10(root=DATASET_PATH, train=True, download=True)
# Scale to [0, 1] and reduce over the first three axes, leaving one value per entry of the
# last axis (assumes `data` is laid out as (N, H, W, C) — TODO confirm)
DATA_MEANS = (train_dataset.data / 255.0).mean(axis=(0, 1, 2))
DATA_STD = (train_dataset.data / 255.0).std(axis=(0, 1, 2))
print("Data mean", DATA_MEANS)
print("Data std", DATA_STD)

# %% [markdown]
# We will use this information to define a `transforms.Normalize` module which will normalize our data accordingly.
# Additionally, we will use data augmentation during training.
# This reduces the risk of overfitting and helps CNNs to generalize better.
# Specifically, we will apply two random augmentations.
#
# First, we will flip each image horizontally by a chance of 50% (`transforms.RandomHorizontalFlip`).
# The object class usually does not change when flipping an image, and we don't expect any image information to be dependent on the horizontal orientation.
# This would be however different if we would try to detect digits or letters in an image, as those have a certain orientation.
#
# The second augmentation we use is called `transforms.RandomResizedCrop`.
# This transformation scales the image in a small range, while eventually changing the aspect ratio, and crops it afterward in the previous size.
# Therefore, the actual pixel values change while the content or overall semantics of the image stays the same.
#
# We will randomly split the training dataset into a training and a validation set.
# The validation set will be used for determining early stopping.
# After finishing the training, we test the models on the CIFAR test set.

# %%
# Evaluation pipeline: tensor conversion and normalization only, no augmentation
test_transform = transforms.Compose([transforms.ToTensor(), transforms.Normalize(DATA_MEANS, DATA_STD)])
# For training, we add some augmentation. Networks are too powerful and would overfit.
train_transform = transforms.Compose(
    [
        transforms.RandomHorizontalFlip(),
        transforms.RandomResizedCrop((32, 32), scale=(0.8, 1.0), ratio=(0.9, 1.1)),
        transforms.ToTensor(),
        transforms.Normalize(DATA_MEANS, DATA_STD),
    ]
)
# Loading the training dataset. We need to split it into a training and validation part
# We need to do a little trick because the validation set should not use the augmentation.
train_dataset = CIFAR10(root=DATASET_PATH, train=True, transform=train_transform, download=True)
val_dataset = CIFAR10(root=DATASET_PATH, train=True, transform=test_transform, download=True)
# The seed is reset before each split so that both random_split calls are expected to draw the
# same partition; the 45000 part is kept from the augmented copy and the 5000 part from the
# non-augmented copy.
L.seed_everything(42)
train_set, _ = torch.utils.data.random_split(train_dataset, [45000, 5000])
L.seed_everything(42)
_, val_set = torch.utils.data.random_split(val_dataset, [45000, 5000])

# Loading the test set
test_set = CIFAR10(root=DATASET_PATH, train=False, transform=test_transform, download=True)

# We define a set of data loaders that we can use for various purposes later.
# Only the training loader shuffles and drops the last incomplete batch.
train_loader = data.DataLoader(train_set, batch_size=128, shuffle=True, drop_last=True, pin_memory=True, num_workers=4)
val_loader = data.DataLoader(val_set, batch_size=128, shuffle=False, drop_last=False, num_workers=4)
test_loader = data.DataLoader(test_set, batch_size=128, shuffle=False, drop_last=False, num_workers=4)

# %% [markdown]
# To verify that our normalization works, we can print out the mean and standard deviation of the single batch.
# The mean should be close to 0 and the standard deviation close to 1 for each channel:

# %%
imgs, _ = next(iter(train_loader))
# Reduce over dims 0, 2 and 3, keeping dim 1 (presumably the channel dimension of a
# (batch, channel, height, width) tensor — confirm against the transforms)
print("Batch mean", imgs.mean(dim=[0, 2, 3]))
print("Batch std", imgs.std(dim=[0, 2, 3]))

# %% [markdown]
# Finally, let's visualize a few images from the training set, and how they look like after random data augmentation:

# %%
NUM_IMAGES = 4
# Augmented versions: indexing the dataset applies train_transform
images = [train_dataset[idx][0] for idx in range(NUM_IMAGES)]
# Reference versions: the raw arrays passed through the non-augmenting test_transform
orig_images = [Image.fromarray(train_dataset.data[idx]) for idx in range(NUM_IMAGES)]
orig_images = [test_transform(img) for img in orig_images]

# Augmented images come first in the stack, the originals after them (4 images per grid row)
img_grid = torchvision.utils.make_grid(torch.stack(images + orig_images, dim=0), nrow=4, normalize=True, pad_value=0.5)
# Move the first dimension to the end for plt.imshow
img_grid = img_grid.permute(1, 2, 0)

plt.figure(figsize=(8, 8))
plt.title("Augmentation examples on CIFAR10")
plt.imshow(img_grid)
plt.axis("off")
plt.show()
plt.close()

# %% [markdown]
# ## PyTorch Lightning
#
# In this notebook and in many following ones, we will make use of the library [PyTorch Lightning](https://www.lightning.ai/docs/pytorch/stable).
# PyTorch Lightning is a framework that simplifies your code needed to train, evaluate, and test a model in PyTorch.
# It also handles logging into [TensorBoard](https://pytorch.org/tutorials/intermediate/tensorboard_tutorial.html), a visualization toolkit for ML experiments, and saving model checkpoints automatically with minimal code overhead from our side.
# This is extremely helpful for us as we want to focus on implementing different model architectures and spend little time on other code overhead.
# Note that at the time of writing/teaching, the framework has been released in version 1.3.
# Future versions might have a slightly changed interface and thus might not work perfectly with the code (we will try to keep it up-to-date as much as possible).
#
# Now, we will take the first step in PyTorch Lightning, and continue to explore the framework in our other tutorials.
# PyTorch Lightning comes with a lot of useful functions, such as one for setting the seed as we have seen before:

# %%
# Setting the seed
L.seed_everything(42)

# %% [markdown]
# Thus, in the future, we don't have to define our own `set_seed` function anymore.
#
# In PyTorch Lightning, we define `L.LightningModule`'s (inheriting from `Module`) that organize our code into 5 main sections:
#
# 1. Initialization (`__init__`), where we create all necessary parameters/models
# 2. Optimizers (`configure_optimizers`) where we create the optimizers, learning rate scheduler, etc.
# 3. Training loop (`training_step`) where we only have to define the loss calculation for a single batch (the loop of optimizer.zero_grad(), loss.backward() and optimizer.step(), as well as any logging/saving operation, is done in the background)
# 4. Validation loop (`validation_step`) where similarly to the training, we only have to define what should happen per step
# 5. Test loop (`test_step`) which is the same as validation, only on a test set.
#
# Therefore, we don't abstract the PyTorch code, but rather organize it and define some default operations that are commonly used.
# If you need to change something else in your training/validation/test loop, there are many possible functions you can overwrite (see the [docs](https://lightning.ai/docs/pytorch/stable/common/lightning_module.html) for details).
#
# Now we can look at an example of what a Lightning Module for training a CNN looks like:


# %%
class CIFARModule(L.LightningModule):
    """Lightning module that trains and evaluates one of the notebook's CNNs as a classifier."""

    def __init__(self, model_name, model_hparams, optimizer_name, optimizer_hparams):
        """
        Inputs:
            model_name - Name of the model/CNN to run. Used for creating the model (see function below)
            model_hparams - Hyperparameters for the model, as dictionary.
            optimizer_name - Name of the optimizer to use. Currently supported: Adam, SGD
            optimizer_hparams - Hyperparameters for the optimizer, as dictionary.
                                This includes learning rate, weight decay, etc.
        """
        super().__init__()
        # Exports the hyperparameters to a YAML file, and create "self.hparams" namespace
        self.save_hyperparameters()
        # Create model
        self.model = create_model(model_name, model_hparams)
        # Create loss module
        self.loss_module = nn.CrossEntropyLoss()
        # Example input for visualizing the graph in Tensorboard
        self.example_input_array = torch.zeros((1, 3, 32, 32), dtype=torch.float32)

    def forward(self, imgs):
        """Run the wrapped model on `imgs`; this is the function traced when visualizing the graph."""
        return self.model(imgs)

    def configure_optimizers(self):
        """Create the optimizer selected by `optimizer_name` together with its learning rate scheduler.

        Returns:
            A list with the optimizer and a list with the scheduler.
        Raises:
            ValueError - if `optimizer_name` is neither "Adam" nor "SGD".
        """
        # We will support Adam or SGD as optimizers.
        if self.hparams.optimizer_name == "Adam":
            # AdamW is Adam with a correct implementation of weight decay (see here
            # for details: https://arxiv.org/pdf/1711.05101.pdf)
            optimizer = optim.AdamW(self.parameters(), **self.hparams.optimizer_hparams)
        elif self.hparams.optimizer_name == "SGD":
            optimizer = optim.SGD(self.parameters(), **self.hparams.optimizer_hparams)
        else:
            # Raise instead of `assert False`: asserts are removed under `python -O`, which would
            # let execution continue with `optimizer` undefined.
            raise ValueError(f'Unknown optimizer: "{self.hparams.optimizer_name}"')

        # We will reduce the learning rate by 0.1 after 100 and 150 epochs
        scheduler = optim.lr_scheduler.MultiStepLR(optimizer, milestones=[100, 150], gamma=0.1)
        return [optimizer], [scheduler]

    def training_step(self, batch, batch_idx):
        """Compute the loss for one training batch and log loss and accuracy."""
        # "batch" is the output of the training data loader.
        imgs, labels = batch
        preds = self.model(imgs)
        loss = self.loss_module(preds, labels)
        acc = (preds.argmax(dim=-1) == labels).float().mean()

        # Logs the accuracy per epoch to tensorboard (weighted average over batches)
        self.log("train_acc", acc, on_step=False, on_epoch=True)
        self.log("train_loss", loss)
        return loss  # Return tensor to call ".backward" on

    def validation_step(self, batch, batch_idx):
        """Log the accuracy of one validation batch under "val_acc"."""
        imgs, labels = batch
        preds = self.model(imgs).argmax(dim=-1)
        acc = (labels == preds).float().mean()
        # By default logs it per epoch (weighted average over batches)
        self.log("val_acc", acc)

    def test_step(self, batch, batch_idx):
        """Log the accuracy of one test batch under "test_acc"."""
        imgs, labels = batch
        preds = self.model(imgs).argmax(dim=-1)
        acc = (labels == preds).float().mean()
        # By default logs it per epoch (weighted average over batches), and returns it afterwards
        self.log("test_acc", acc)


# %% [markdown]
# We see that the code is organized and clear, which helps if someone else tries to understand your code.
#
# Another important part of PyTorch Lightning is the concept of callbacks.
# Callbacks are self-contained functions that contain the non-essential logic of your Lightning Module.
# They are usually called after finishing a training epoch, but can also influence other parts of your training loop.
# For instance, we will use the following two pre-defined callbacks: `LearningRateMonitor` and `ModelCheckpoint`.
# The learning rate monitor adds the current learning rate to our TensorBoard, which helps to verify that our learning rate scheduler works correctly.
# The model checkpoint callback allows you to customize the saving routine of your checkpoints.
# For instance, how many checkpoints to keep, when to save, which metric to look out for, etc.
# We import them below:

# %%
# Callbacks

# %% [markdown]
# To allow running multiple different models with the same Lightning module, we define a function below that maps a model name to the model class.
# At this stage, the dictionary `model_dict` is empty, but we will fill it throughout the notebook with our new models.

# %%
model_dict = {}


def create_model(model_name, model_hparams):
    """Instantiate the model registered in `model_dict` under `model_name`.

    Inputs:
        model_name - Key of the model class in `model_dict`
        model_hparams - Dictionary of keyword arguments passed to the model class
    Returns:
        The newly created model instance.
    Raises:
        ValueError - if no model is registered under `model_name`.
    """
    try:
        model_class = model_dict[model_name]
    except KeyError:
        # Raise instead of `assert False`: asserts are removed under `python -O`, in which case
        # the function would silently return None for an unknown name.
        raise ValueError(
            f'Unknown model name "{model_name}". Available models are: {list(model_dict)}'
        ) from None
    return model_class(**model_hparams)


# %% [markdown]
# Similarly, to use the activation function as another hyperparameter in
# our model, we define a "name to function" dict below:

# %%
act_fn_by_name = {"tanh": nn.Tanh, "relu": nn.ReLU, "leakyrelu": nn.LeakyReLU, "gelu": nn.GELU}

# %% [markdown]
# If we pass the classes or objects directly as an argument to the Lightning module, we couldn't take advantage of PyTorch Lightning's automatic hyperparameter saving and loading.
#
# Besides the Lightning module, the second most important module in PyTorch Lightning is the `Trainer`.
# The trainer is responsible for executing the training steps defined in the Lightning module and completes the framework.
# Similar to the Lightning module, you can override any key part that you don't want to be automated, but the default settings are often the best practice.
# For a full overview, see the [documentation](https://lightning.ai/docs/pytorch/stable/common/trainer.html).
# The most important functions we use below are:
#
# * `trainer.fit`: Takes as input a lightning module, a training dataset, and an (optional) validation dataset.
# This function trains the given module on the training dataset with occasional validation (default once per epoch, can be changed)
# * `trainer.test`: Takes as input a model and a dataset on which we want to test.
# It returns the test metric on the dataset.
#
# For training and testing, we don't have to worry about things like setting the model to eval mode (`model.eval()`) as this is all done automatically.
# See below how we define a training function for our models:


# %%
def train_model(model_name, save_name=None, **kwargs):
    """Train a `CIFARModule` for the given model, or load its pretrained checkpoint if one exists.

    Inputs:
        model_name - Name of the model you want to run. Is used to look up the class in "model_dict"
        save_name (optional) - If specified, this name will be used for creating the checkpoint and logging directory.
        kwargs - Remaining keyword arguments, forwarded to the `CIFARModule` constructor
    Returns:
        The (loaded or freshly trained) model and a dictionary with its accuracy under "test" and "val".
    """
    run_name = model_name if save_name is None else save_name

    # Keep only the weights of the checkpoint with the highest recorded val_acc (no optimizer state)
    checkpoint_callback = ModelCheckpoint(save_weights_only=True, mode="max", monitor="val_acc")
    # Log the learning rate once per epoch
    lr_monitor = LearningRateMonitor("epoch")
    trainer = L.Trainer(
        default_root_dir=os.path.join(CHECKPOINT_PATH, run_name),  # Where to save models
        accelerator="auto",  # Picks an available accelerator; we only use a single device of it
        devices=1,
        max_epochs=180,
        callbacks=[checkpoint_callback, lr_monitor],
    )
    trainer.logger._log_graph = True  # If True, we plot the computation graph in tensorboard
    trainer.logger._default_hp_metric = None  # Optional logging argument that we don't need

    # A checkpoint named after the run, directly in CHECKPOINT_PATH, counts as pretrained model
    pretrained_filename = os.path.join(CHECKPOINT_PATH, run_name + ".ckpt")
    if not os.path.isfile(pretrained_filename):
        L.seed_everything(42)  # To be reproducible
        model = CIFARModule(model_name=model_name, **kwargs)
        trainer.fit(model, train_loader, val_loader)
        # Continue with the best checkpoint of the run rather than the final weights
        best_checkpoint = trainer.checkpoint_callback.best_model_path
        model = CIFARModule.load_from_checkpoint(best_checkpoint)
    else:
        print(f"Found pretrained model at {pretrained_filename}, loading...")
        # Automatically loads the model with the saved hyperparameters
        model = CIFARModule.load_from_checkpoint(pretrained_filename)

    # Both evaluations go through `trainer.test`, hence both results are stored under "test_acc"
    val_result = trainer.test(model, dataloaders=val_loader, verbose=False)
    test_result = trainer.test(model, dataloaders=test_loader, verbose=False)
    return model, {"test": test_result[0]["test_acc"], "val": val_result[0]["test_acc"]}


# %% [markdown]
# Finally, we can focus on the Convolutional Neural Networks we want to
# implement today: GoogleNet, ResNet, and DenseNet.

# %% [markdown]
# ## Inception
#
#
#
# The [GoogleNet](https://arxiv.org/abs/1409.4842), proposed in 2014, won the ImageNet Challenge because of its usage of the Inception modules.
# In general, we will mainly focus on the concept of Inception in this tutorial instead of the specifics of the GoogleNet, as based on Inception, there have been many follow-up works ([Inception-v2](https://arxiv.org/abs/1512.00567), [Inception-v3](https://arxiv.org/abs/1512.00567), [Inception-v4](https://arxiv.org/abs/1602.07261), [Inception-ResNet](https://arxiv.org/abs/1602.07261),...).
# The follow-up works mainly focus on increasing efficiency and enabling very deep Inception networks.
# However, for a fundamental understanding, it is sufficient to look at the original Inception block.
#
# An Inception block applies four convolution blocks separately on the same feature map: a 1x1, 3x3, and 5x5 convolution, and a max pool operation.
# This allows the network to look at the same data with different receptive fields.
# Of course, learning only 5x5 convolutions would be theoretically more powerful.
# However, this is not only more computation and memory heavy but also tends to overfit much more easily.
# The overall inception block looks like below (figure credit - [Szegedy et al.](https://arxiv.org/abs/1409.4842)):
#
#
#
# The additional 1x1 convolutions before the 3x3 and 5x5 convolutions are used for dimensionality reduction.
# This is especially crucial as the feature maps of all branches are merged afterward, and we don't want any explosion of feature size.
# As 5x5 convolutions are 25 times more expensive than 1x1 convolutions, we can save a lot of computation and parameters by reducing the dimensionality before the large convolutions.
#
# We can now try to implement the Inception Block ourselves:


# %%
class InceptionBlock(nn.Module):
    """Inception block: four parallel branches whose outputs are concatenated along the channels."""

    def __init__(self, c_in, c_red: dict, c_out: dict, act_fn):
        """
        Inputs:
            c_in - Number of input feature maps from the previous layers
            c_red - Dictionary with keys "3x3" and "5x5" specifying the output of the dimensionality reducing 1x1 convolutions
            c_out - Dictionary with keys "1x1", "3x3", "5x5", and "max"
            act_fn - Activation class constructor (e.g. nn.ReLU)
        """
        super().__init__()

        # 1x1 convolution branch
        self.conv_1x1 = nn.Sequential(
            nn.Conv2d(c_in, c_out["1x1"], kernel_size=1), nn.BatchNorm2d(c_out["1x1"]), act_fn()
        )

        # 3x3 convolution branch
        self.conv_3x3 = nn.Sequential(
            nn.Conv2d(c_in, c_red["3x3"], kernel_size=1),
            nn.BatchNorm2d(c_red["3x3"]),
            act_fn(),
            nn.Conv2d(c_red["3x3"], c_out["3x3"], kernel_size=3, padding=1),
            nn.BatchNorm2d(c_out["3x3"]),
            act_fn(),
        )

        # 5x5 convolution branch
        self.conv_5x5 = nn.Sequential(
            nn.Conv2d(c_in, c_red["5x5"], kernel_size=1),
            nn.BatchNorm2d(c_red["5x5"]),
            act_fn(),
            nn.Conv2d(c_red["5x5"], c_out["5x5"], kernel_size=5, padding=2),
            nn.BatchNorm2d(c_out["5x5"]),
            act_fn(),
        )

        # Max-pool branch
        self.max_pool = nn.Sequential(
            nn.MaxPool2d(kernel_size=3, padding=1, stride=1),
            nn.Conv2d(c_in, c_out["max"], kernel_size=1),
            nn.BatchNorm2d(c_out["max"]),
            act_fn(),
        )

    def forward(self, x):
        """Apply all four branches to `x` and concatenate their outputs along dim 1."""
        x_1x1 = self.conv_1x1(x)
        x_3x3 = self.conv_3x3(x)
        x_5x5 = self.conv_5x5(x)
        x_max = self.max_pool(x)
        x_out = torch.cat([x_1x1, x_3x3, x_5x5, x_max], dim=1)
        return x_out


# %% [markdown]
# The GoogleNet architecture consists of stacking multiple Inception blocks with occasional max pooling to reduce the height and width of the feature maps.
# The original GoogleNet was designed for image sizes of ImageNet (224x224 pixels) and had almost 7 million parameters.
# As we train on CIFAR10 with image sizes of 32x32, we don't require such a heavy architecture, and instead, apply a reduced version.
# The number of channels for dimensionality reduction and output per filter (1x1, 3x3, 5x5, and max pooling) need to be manually specified and can be changed if interested.
# The general intuition is to have the most filters for the 3x3
# convolutions, as they are powerful enough to take the context into
# account while requiring almost a third of the parameters of the 5x5
# convolution.


# %%
class GoogleNet(nn.Module):
    """Reduced GoogleNet for 32x32 inputs: input convolution, stacked Inception blocks, linear classifier."""

    # `kaiming_normal_` only accepts the nonlinearity names known to `torch.nn.init.calculate_gain`.
    # The activation names "leakyrelu" and "gelu" are not among them and would raise a ValueError,
    # so they are translated here; every other name is passed through unchanged.
    _KAIMING_INIT_KWARGS = {
        "leakyrelu": {"nonlinearity": "leaky_relu", "a": 0.01},  # 0.01 is nn.LeakyReLU's default slope
        "gelu": {"nonlinearity": "relu"},  # No dedicated gain exists for GELU; ReLU's is used as stand-in
    }

    def __init__(self, num_classes=10, act_fn_name="relu", **kwargs):
        """
        Inputs:
            num_classes - Number of classification outputs
            act_fn_name - Name of the activation function to use, looked up in "act_fn_by_name"
            kwargs - Accepted for interface compatibility, not used
        """
        super().__init__()
        self.hparams = SimpleNamespace(
            num_classes=num_classes, act_fn_name=act_fn_name, act_fn=act_fn_by_name[act_fn_name]
        )
        self._create_network()
        self._init_params()

    def _create_network(self):
        """Build `input_net`, `inception_blocks` and `output_net`."""
        # A first convolution on the original image to scale up the channel size
        self.input_net = nn.Sequential(
            nn.Conv2d(3, 64, kernel_size=3, padding=1), nn.BatchNorm2d(64), self.hparams.act_fn()
        )
        # Stacking inception blocks. The input size of every block equals the sum of the
        # "c_out" values of the block before it, as all branch outputs are concatenated.
        self.inception_blocks = nn.Sequential(
            InceptionBlock(
                64,
                c_red={"3x3": 32, "5x5": 16},
                c_out={"1x1": 16, "3x3": 32, "5x5": 8, "max": 8},
                act_fn=self.hparams.act_fn,
            ),
            InceptionBlock(
                64,
                c_red={"3x3": 32, "5x5": 16},
                c_out={"1x1": 24, "3x3": 48, "5x5": 12, "max": 12},
                act_fn=self.hparams.act_fn,
            ),
            nn.MaxPool2d(3, stride=2, padding=1),  # 32x32 => 16x16
            InceptionBlock(
                96,
                c_red={"3x3": 32, "5x5": 16},
                c_out={"1x1": 24, "3x3": 48, "5x5": 12, "max": 12},
                act_fn=self.hparams.act_fn,
            ),
            InceptionBlock(
                96,
                c_red={"3x3": 32, "5x5": 16},
                c_out={"1x1": 16, "3x3": 48, "5x5": 16, "max": 16},
                act_fn=self.hparams.act_fn,
            ),
            InceptionBlock(
                96,
                c_red={"3x3": 32, "5x5": 16},
                c_out={"1x1": 16, "3x3": 48, "5x5": 16, "max": 16},
                act_fn=self.hparams.act_fn,
            ),
            InceptionBlock(
                96,
                c_red={"3x3": 32, "5x5": 16},
                c_out={"1x1": 32, "3x3": 48, "5x5": 24, "max": 24},
                act_fn=self.hparams.act_fn,
            ),
            nn.MaxPool2d(3, stride=2, padding=1),  # 16x16 => 8x8
            InceptionBlock(
                128,
                c_red={"3x3": 48, "5x5": 16},
                c_out={"1x1": 32, "3x3": 64, "5x5": 16, "max": 16},
                act_fn=self.hparams.act_fn,
            ),
            InceptionBlock(
                128,
                c_red={"3x3": 48, "5x5": 16},
                c_out={"1x1": 32, "3x3": 64, "5x5": 16, "max": 16},
                act_fn=self.hparams.act_fn,
            ),
        )
        # Mapping to classification output
        self.output_net = nn.Sequential(
            nn.AdaptiveAvgPool2d((1, 1)), nn.Flatten(), nn.Linear(128, self.hparams.num_classes)
        )

    def _init_params(self):
        """Initialize all convolutions (Kaiming normal) and batch norm layers (weight 1, bias 0)."""
        # Based on our discussion in Tutorial 4, we should initialize the
        # convolutions according to the activation function
        act_fn_name = self.hparams.act_fn_name
        init_kwargs = self._KAIMING_INIT_KWARGS.get(act_fn_name, {"nonlinearity": act_fn_name})
        for m in self.modules():
            if isinstance(m, nn.Conv2d):
                nn.init.kaiming_normal_(m.weight, **init_kwargs)
            elif isinstance(m, nn.BatchNorm2d):
                nn.init.constant_(m.weight, 1)
                nn.init.constant_(m.bias, 0)

    def forward(self, x):
        """Map a batch of images to class logits."""
        x = self.input_net(x)
        x = self.inception_blocks(x)
        x = self.output_net(x)
        return x


# %% [markdown]
# Now, we can integrate our model to the model dictionary we defined above:

# %%
model_dict["GoogleNet"] = GoogleNet

# %% [markdown]
# The training of the model is handled by PyTorch Lightning, and we just have to define the command to start.
# Note that we train for almost 200 epochs, which takes about an hour on Lisa's default GPUs (GTX1080Ti).
# We would recommend using the saved models and train your own model if you are interested.

# %%
# Hyperparameters of the GoogleNet run, spelled out before starting the training
googlenet_hparams = {"num_classes": 10, "act_fn_name": "relu"}
googlenet_optimizer_hparams = {"lr": 1e-3, "weight_decay": 1e-4}
googlenet_model, googlenet_results = train_model(
    model_name="GoogleNet",
    model_hparams=googlenet_hparams,
    optimizer_name="Adam",
    optimizer_hparams=googlenet_optimizer_hparams,
)

# %% [markdown]
# We will compare the results later in the notebooks, but we can already print them here for a first glance:

# %%
print("GoogleNet Results", googlenet_results)

# %% [markdown]
# ### Tensorboard log
#
# A nice extra of PyTorch Lightning is the automatic logging into TensorBoard.
# To give you a better intuition of what TensorBoard can be used for, we can look at the board that PyTorch Lightning has generated when training the GoogleNet.
# TensorBoard provides an inline functionality for Jupyter notebooks, and we use it here:

# %%
# Import tensorboard
# %load_ext tensorboard

# %%
# Opens tensorboard in notebook. Adjust the path to your CHECKPOINT_PATH!
# %tensorboard --logdir ../saved_models/tutorial5/tensorboards/GoogleNet/

# %% [markdown]
#
#
# TensorBoard is organized in multiple tabs.
# The main tab is the scalar tab where we can log the development of single numbers.
# For example, we have plotted the training loss, accuracy, learning rate, etc.
# If we look at the training or validation accuracy, we can really see the impact of using a learning rate scheduler.
# Reducing the learning rate gives our model a nice increase in training performance.
# Similarly, when looking at the training loss, we see a sudden decrease at this point.
# However, the high numbers on the training set compared to validation indicate that our model was overfitting, which is inevitable for such large networks.
#
# Another interesting tab in TensorBoard is the graph tab.
# It shows us the network architecture organized by building blocks from the input to the output.
# It basically shows the operations taken in the forward step of `CIFARModule`.
# Double-click on a module to open it.
# Feel free to explore the architecture from a different perspective.
# The graph visualization can often help you to validate that your model
# is actually doing what it is supposed to do, and you don't miss any
# layers in the computation graph.

# %% [markdown]
# ## ResNet
#
# The [ResNet](https://arxiv.org/abs/1512.03385) paper is one of the [most cited AI papers](https://www.natureindex.com/news-blog/google-scholar-reveals-most-influential-papers-research-citations-twenty-twenty), and has been the foundation for neural networks with more than 1,000 layers.
# Despite its simplicity, the idea of residual connections is highly effective as it supports stable gradient propagation through the network.
# Instead of modeling $x_{l+1}=F(x_{l})$, we model $x_{l+1}=x_{l}+F(x_{l})$ where $F$ is a non-linear mapping (usually a sequence of NN modules like convolutions, activation functions, and normalizations).
# If we do backpropagation on such residual connections, we obtain:
#
# $$\frac{\partial x_{l+1}}{\partial x_{l}} = \mathbf{I} + \frac{\partial F(x_{l})}{\partial x_{l}}$$
#
# The bias towards the identity matrix guarantees a stable gradient propagation that is less affected by $F$ itself.
# There have been many variants of ResNet proposed, which mostly concern the function $F$, or operations applied on the sum.
# In this tutorial, we look at two of them: the original ResNet block, and the [Pre-Activation ResNet block](https://arxiv.org/abs/1603.05027).
# We visually compare the blocks below (figure credit - [He et al.](https://arxiv.org/abs/1603.05027)):
#
#
#
# The original ResNet block applies a non-linear activation function, usually ReLU, after the skip connection.
# In contrast, the pre-activation ResNet block applies the non-linearity at the beginning of $F$.
# Both have their advantages and disadvantages.
# For very deep networks, however, the pre-activation ResNet has shown to perform better as the gradient flow is guaranteed to have the identity matrix as calculated above, and is not harmed by any non-linear activation applied to it.
# For comparison, in this notebook, we implement both ResNet types as shallow networks.
#
# Let's start with the original ResNet block.
# The visualization above already shows what layers are included in $F$.
# One special case we have to handle is when we want to reduce the image dimensions in terms of width and height.
# The basic ResNet block requires $F(x_{l})$ to be of the same shape as $x_{l}$.
# Thus, we need to change the dimensionality of $x_{l}$ as well before adding to $F(x_{l})$.
# The original implementation used an identity mapping with stride 2 and padded additional feature dimensions with 0.
# However, the more common implementation is to use a 1x1 convolution with stride 2 as it allows us to change the feature dimensionality while being efficient in parameter and computation cost.
# The code for the ResNet block is relatively simple, and shown below:

# %%


class ResNetBlock(nn.Module):
    """Original ResNet block: the activation function is applied after adding the skip connection."""

    def __init__(self, c_in, act_fn, subsample=False, c_out=-1):
        """
        Inputs:
            c_in - Number of input features
            act_fn - Activation class constructor (e.g. nn.ReLU)
            subsample - If True, we want to apply a stride inside the block and reduce the output shape by 2 in height and width
            c_out - Number of output features. Note that this is only relevant if subsample is True, as otherwise, c_out = c_in
        Raises:
            ValueError - if subsample is True but c_out is not a positive number.
        """
        super().__init__()
        if not subsample:
            c_out = c_in
        elif c_out < 1:
            # The default of -1 would otherwise only fail deep inside nn.Conv2d with an obscure message
            raise ValueError(f"c_out must be a positive number of channels when subsample=True, got {c_out}")

        # Network representing F
        self.net = nn.Sequential(
            nn.Conv2d(
                c_in, c_out, kernel_size=3, padding=1, stride=1 if not subsample else 2, bias=False
            ),  # No bias needed as the Batch Norm handles it
            nn.BatchNorm2d(c_out),
            act_fn(),
            nn.Conv2d(c_out, c_out, kernel_size=3, padding=1, bias=False),
            nn.BatchNorm2d(c_out),
        )

        # 1x1 convolution with stride 2 means we take the upper left value, and transform it to new output size
        self.downsample = nn.Conv2d(c_in, c_out, kernel_size=1, stride=2) if subsample else None
        self.act_fn = act_fn()

    def forward(self, x):
        """Return act_fn(F(x) + x), where x is downsampled first if the block subsamples."""
        z = self.net(x)
        if self.downsample is not None:
            x = self.downsample(x)
        out = z + x
        out = self.act_fn(out)
        return out


# %% [markdown]
# The second block we implement is the pre-activation ResNet block.
# For this, we have to change the order of layers in `self.net`, and do not apply an activation function on the output.
# Additionally, the downsampling operation has to apply a non-linearity as well, as the input, $x_l$, has not been processed by a non-linearity yet.
# Hence, the block looks as follows:


# %%
class PreActResNetBlock(nn.Module):
    """Pre-activation ResNet block: normalization and activation come first, the sum stays untouched."""

    def __init__(self, c_in, act_fn, subsample=False, c_out=-1):
        """
        Inputs:
            c_in - Number of input features
            act_fn - Activation class constructor (e.g. nn.ReLU)
            subsample - If True, we want to apply a stride inside the block and reduce the output shape by 2 in height and width
            c_out - Number of output features. Note that this is only relevant if subsample is True, as otherwise, c_out = c_in
        Raises:
            ValueError - if subsample is True but c_out is not a positive number.
        """
        super().__init__()
        if not subsample:
            c_out = c_in
        elif c_out < 1:
            # The default of -1 would otherwise only fail deep inside nn.Conv2d with an obscure message
            raise ValueError(f"c_out must be a positive number of channels when subsample=True, got {c_out}")

        # Network representing F
        self.net = nn.Sequential(
            nn.BatchNorm2d(c_in),
            act_fn(),
            nn.Conv2d(c_in, c_out, kernel_size=3, padding=1, stride=1 if not subsample else 2, bias=False),
            nn.BatchNorm2d(c_out),
            act_fn(),
            nn.Conv2d(c_out, c_out, kernel_size=3, padding=1, bias=False),
        )

        # 1x1 convolution needs to apply non-linearity as well as not done on skip connection
        self.downsample = (
            nn.Sequential(nn.BatchNorm2d(c_in), act_fn(), nn.Conv2d(c_in, c_out, kernel_size=1, stride=2, bias=False))
            if subsample
            else None
        )

    def forward(self, x):
        """Return F(x) + x, where x is downsampled first if the block subsamples."""
        z = self.net(x)
        if self.downsample is not None:
            x = self.downsample(x)
        out = z + x
        return out


# %% [markdown]
# Similarly to the model selection, we define a dictionary to create a mapping from string to block class.
# We will use the string name as hyperparameter value in our model to choose between the ResNet blocks.
# Feel free to implement any other ResNet block type and add it here as well.

# %%
resnet_blocks_by_name = {"ResNetBlock": ResNetBlock, "PreActResNetBlock": PreActResNetBlock}

# %% [markdown]
# The overall ResNet architecture consists of stacking multiple ResNet blocks, of which some are downsampling the input.
# When talking about ResNet blocks in the whole network, we usually group them by the same output shape.
# Hence, if we say the ResNet has `[3,3,3]` blocks, it means that we have 3 times a group of 3 ResNet blocks, where a subsampling is taking place in the fourth and seventh block.
# The ResNet with `[3,3,3]` blocks on CIFAR10 is visualized below.
#
#
#
# The three groups operate on the resolutions $32\times32$, $16\times16$ and $8\times8$ respectively.
# The blocks in orange denote ResNet blocks with downsampling.
# The same notation is used by many other implementations such as in the [torchvision library](https://pytorch.org/vision/0.11/models.html#torchvision.models.resnet18) from PyTorch.
# Thus, our code looks as follows:


# %%
class ResNet(nn.Module):
    """ResNet built from groups of residual blocks, followed by a linear classifier."""

    # `kaiming_normal_` only accepts the nonlinearity names known to `torch.nn.init.calculate_gain`.
    # The activation names "leakyrelu" and "gelu" are not among them and would raise a ValueError,
    # so they are translated here; every other name is passed through unchanged.
    _KAIMING_INIT_KWARGS = {
        "leakyrelu": {"nonlinearity": "leaky_relu", "a": 0.01},  # 0.01 is nn.LeakyReLU's default slope
        "gelu": {"nonlinearity": "relu"},  # No dedicated gain exists for GELU; ReLU's is used as stand-in
    }

    def __init__(
        self,
        num_classes=10,
        num_blocks=[3, 3, 3],
        c_hidden=[16, 32, 64],
        act_fn_name="relu",
        block_name="ResNetBlock",
        **kwargs,
    ):
        """
        Inputs:
            num_classes - Number of classification outputs (10 for CIFAR10)
            num_blocks - List with the number of ResNet blocks to use. The first block of each group uses downsampling, except the first.
            c_hidden - List with the hidden dimensionalities in the different blocks. Usually multiplied by 2 the deeper we go.
            act_fn_name - Name of the activation function to use, looked up in "act_fn_by_name"
            block_name - Name of the ResNet block, looked up in "resnet_blocks_by_name"
            kwargs - Accepted for interface compatibility, not used
        """
        super().__init__()
        assert block_name in resnet_blocks_by_name
        # NOTE: the list defaults above are shared between calls; they are only read here, never modified
        self.hparams = SimpleNamespace(
            num_classes=num_classes,
            c_hidden=c_hidden,
            num_blocks=num_blocks,
            act_fn_name=act_fn_name,
            act_fn=act_fn_by_name[act_fn_name],
            block_class=resnet_blocks_by_name[block_name],
        )
        self._create_network()
        self._init_params()

    def _create_network(self):
        """Build `input_net`, `blocks` and `output_net`."""
        c_hidden = self.hparams.c_hidden

        # A first convolution on the original image to scale up the channel size
        if self.hparams.block_class is PreActResNetBlock:  # => Don't apply non-linearity on output
            self.input_net = nn.Sequential(nn.Conv2d(3, c_hidden[0], kernel_size=3, padding=1, bias=False))
        else:
            self.input_net = nn.Sequential(
                nn.Conv2d(3, c_hidden[0], kernel_size=3, padding=1, bias=False),
                nn.BatchNorm2d(c_hidden[0]),
                self.hparams.act_fn(),
            )

        # Creating the ResNet blocks
        blocks = []
        for block_idx, block_count in enumerate(self.hparams.num_blocks):
            for bc in range(block_count):
                # Subsample the first block of each group, except the very first one.
                subsample = bc == 0 and block_idx > 0
                blocks.append(
                    self.hparams.block_class(
                        # A subsampling block still receives the channel count of the previous group
                        c_in=c_hidden[block_idx if not subsample else (block_idx - 1)],
                        act_fn=self.hparams.act_fn,
                        subsample=subsample,
                        c_out=c_hidden[block_idx],
                    )
                )
        self.blocks = nn.Sequential(*blocks)

        # Mapping to classification output
        self.output_net = nn.Sequential(
            nn.AdaptiveAvgPool2d((1, 1)), nn.Flatten(), nn.Linear(c_hidden[-1], self.hparams.num_classes)
        )

    def _init_params(self):
        """Initialize all convolutions (Kaiming normal, fan-out) and batch norm layers (weight 1, bias 0)."""
        # Based on our discussion in Tutorial 4, we should initialize the convolutions according to the activation function
        # Fan-out focuses on the gradient distribution, and is commonly used in ResNets
        act_fn_name = self.hparams.act_fn_name
        init_kwargs = self._KAIMING_INIT_KWARGS.get(act_fn_name, {"nonlinearity": act_fn_name})
        for m in self.modules():
            if isinstance(m, nn.Conv2d):
                nn.init.kaiming_normal_(m.weight, mode="fan_out", **init_kwargs)
            elif isinstance(m, nn.BatchNorm2d):
                nn.init.constant_(m.weight, 1)
                nn.init.constant_(m.bias, 0)

    def forward(self, x):
        """Map a batch of images to class logits."""
        x = self.input_net(x)
        x = self.blocks(x)
        x = self.output_net(x)
        return x


# %% [markdown]
# We also need to add the new ResNet class to our model dictionary:

# %%
model_dict["ResNet"] = ResNet

# %% [markdown]
# Finally, we can train our ResNet models.
# One difference to the GoogleNet training is that we explicitly use SGD with Momentum as optimizer instead of Adam.
# Adam often leads to a slightly worse accuracy on plain, shallow ResNets.
# It is not 100% clear why Adam performs worse in this context, but one possible explanation is related to ResNet's loss surface.
# ResNet has been shown to produce smoother loss surfaces than networks without skip connection (see [Li et al., 2018](https://arxiv.org/pdf/1712.09913.pdf) for details).
# A possible visualization of the loss surface with/out skip connections is below (figure credit - [Li et al.](https://arxiv.org/pdf/1712.09913.pdf)):
#
#
#
# The $x$ and $y$ axes show a projection of the parameter space, and the $z$ axis shows the loss values achieved by different parameter values.
# On smooth surfaces like the one on the right, we might not require an adaptive learning rate as Adam provides.
# Instead, Adam can get stuck in local optima while SGD finds the wider minima that tend to generalize better.
# However, to answer this question in detail, we would need an extra tutorial because it is not easy to answer.
# For now, we conclude: for ResNet architectures, consider the optimizer to be an important hyperparameter, and try training with both Adam and SGD.
# Let's train the model below with SGD:

# %%
# Hyperparameters of the ResNet run, spelled out before starting the training
resnet_hparams = {"num_classes": 10, "c_hidden": [16, 32, 64], "num_blocks": [3, 3, 3], "act_fn_name": "relu"}
resnet_optimizer_hparams = {"lr": 0.1, "momentum": 0.9, "weight_decay": 1e-4}
resnet_model, resnet_results = train_model(
    model_name="ResNet",
    model_hparams=resnet_hparams,
    optimizer_name="SGD",
    optimizer_hparams=resnet_optimizer_hparams,
)

# %% [markdown]
# Let's also train the pre-activation ResNet as comparison:

# %%
# Same settings as above, except for the block type and the name under which the run is stored
resnetpreact_hparams = {
    "num_classes": 10,
    "c_hidden": [16, 32, 64],
    "num_blocks": [3, 3, 3],
    "act_fn_name": "relu",
    "block_name": "PreActResNetBlock",
}
resnetpreact_optimizer_hparams = {"lr": 0.1, "momentum": 0.9, "weight_decay": 1e-4}
resnetpreact_model, resnetpreact_results = train_model(
    model_name="ResNet",
    model_hparams=resnetpreact_hparams,
    optimizer_name="SGD",
    optimizer_hparams=resnetpreact_optimizer_hparams,
    save_name="ResNetPreAct",
)

# %% [markdown]
# ### Tensorboard log
#
# Similarly to our GoogleNet model, we also have a TensorBoard log for the ResNet model. We can open it below.

# %%
# Opens tensorboard in notebook. Adjust the path to your CHECKPOINT_PATH! Feel free to change "ResNet" to "ResNetPreAct"
# %tensorboard --logdir ../saved_models/tutorial5/tensorboards/ResNet/

# %% [markdown]
#
+# +# Feel free to explore the TensorBoard yourself, including the computation graph. +# In general, we can see that with SGD, the ResNet has a higher training loss than the GoogleNet in the first stage of the training. +# After reducing the learning rate however, the model achieves even higher validation accuracies. +# We compare the precise scores at the end of the notebook. + +# %% [markdown] +# ## DenseNet +# +#
#
# [DenseNet](https://arxiv.org/abs/1608.06993) is another architecture for enabling very deep neural networks and takes a slightly different perspective on residual connections.
# Instead of modeling the difference between layers, DenseNet considers residual connections as a possible way to reuse features across layers, removing any necessity to learn redundant feature maps.
# If we go deeper into the network, the model learns abstract features to recognize patterns.
# However, some complex patterns consist of a combination of abstract features (e.g. hand, face, etc.), and low-level features (e.g. edges, basic color, etc.).
# To find these low-level features in the deep layers, standard CNNs have to learn to copy such feature maps, which wastes a lot of parameter complexity.
# DenseNet provides an efficient way of reusing features by having each convolution depend on all previous input features, while adding only a small number of filters to them.
# See the figure below for an illustration (figure credit - [Huang et al.](https://arxiv.org/abs/1608.06993)):
#
#
#
# The last layer, called the transition layer, is responsible for reducing the dimensionality of the feature maps in height, width, and channel size.
# Although those technically break the identity backpropagation, there are only a few in a network so that it doesn't affect the gradient flow much.
#
# We split the implementation of the layers in DenseNet into three parts: a `DenseLayer`, a `DenseBlock`, and a `TransitionLayer`.
# The module `DenseLayer` implements a single layer inside a dense block.
# It applies a 1x1 convolution for dimensionality reduction with a subsequent 3x3 convolution.
# The output channels are concatenated to the originals and returned.
# Note that we apply the Batch Normalization as the first layer of each block.
# This allows slightly different activations for the same features to different layers, depending on what is needed.
# Overall, we can implement it as follows:


# %%
class DenseLayer(nn.Module):
    """Single layer of a dense block: computes new feature maps and puts them in front of its input."""

    def __init__(self, c_in, bn_size, growth_rate, act_fn):
        """
        Inputs:
            c_in - Number of input channels
            bn_size - Bottleneck size (factor of growth rate) for the output of the 1x1 convolution. Typically between 2 and 4.
            growth_rate - Number of output channels of the 3x3 convolution
            act_fn - Activation class constructor (e.g. nn.ReLU)
        """
        super().__init__()
        # Width of the intermediate features between the 1x1 and the 3x3 convolution
        c_bottleneck = bn_size * growth_rate
        self.net = nn.Sequential(
            nn.BatchNorm2d(c_in),
            act_fn(),
            nn.Conv2d(c_in, c_bottleneck, kernel_size=1, bias=False),
            nn.BatchNorm2d(c_bottleneck),
            act_fn(),
            nn.Conv2d(c_bottleneck, growth_rate, kernel_size=3, padding=1, bias=False),
        )

    def forward(self, x):
        """Return the `growth_rate` new feature maps concatenated with `x` along dim 1."""
        new_features = self.net(x)
        return torch.cat([new_features, x], dim=1)


# %% [markdown]
# The module `DenseBlock` summarizes multiple dense layers applied in sequence.
class DenseBlock(nn.Module):
    """Stack of dense layers applied in sequence.

    Every layer receives the block input concatenated with the feature maps of
    all previous layers, so the channel count grows by `growth_rate` per layer.
    """

    def __init__(self, c_in, num_layers, bn_size, growth_rate, act_fn):
        """
        Inputs:
            c_in - Number of input channels
            num_layers - Number of dense layers to apply in the block
            bn_size - Bottleneck size to use in the dense layers
            growth_rate - Growth rate to use in the dense layers
            act_fn - Activation function to use in the dense layers
        """
        super().__init__()
        # Layer i sees the original channels plus i * growth_rate channels from earlier layers.
        dense_layers = [
            DenseLayer(
                c_in=c_in + depth * growth_rate,
                bn_size=bn_size,
                growth_rate=growth_rate,
                act_fn=act_fn,
            )
            for depth in range(num_layers)
        ]
        self.block = nn.Sequential(*dense_layers)

    def forward(self, x):
        """Run the input through all dense layers of the block."""
        return self.block(x)


class TransitionLayer(nn.Module):
    """Transition between dense blocks: 1x1 convolution followed by 2x2 average pooling."""

    def __init__(self, c_in, c_out, act_fn):
        """
        Inputs:
            c_in - Number of input channels
            c_out - Number of output channels of the 1x1 convolution
            act_fn - Activation class constructor (e.g. nn.ReLU)
        """
        super().__init__()
        normalize = nn.BatchNorm2d(c_in)
        activate = act_fn()
        reduce_channels = nn.Conv2d(c_in, c_out, kernel_size=1, bias=False)
        # Average the output for each 2x2 pixel group
        downsample = nn.AvgPool2d(kernel_size=2, stride=2)
        self.transition = nn.Sequential(normalize, activate, reduce_channels, downsample)

    def forward(self, x):
        """Apply normalization, activation, channel reduction and pooling."""
        return self.transition(x)
class DenseNet(nn.Module):
    """DenseNet classifier built from dense blocks separated by transition layers.

    The network consists of an input convolution on 3-channel images, a sequence
    of dense blocks (with a channel-halving transition layer after every block
    except the last), and a classification head using global average pooling.
    """

    def __init__(
        self, num_classes=10, num_layers=(6, 6, 6, 6), bn_size=2, growth_rate=16, act_fn_name="relu", **kwargs
    ):
        """
        Inputs:
            num_classes - Number of output classes of the final linear layer
            num_layers - Sequence of ints, the number of dense layers per dense block
            bn_size - Bottleneck size to use in the dense layers
            growth_rate - Growth rate to use in the dense layers
            act_fn_name - Key into `act_fn_by_name` selecting the activation function
            kwargs - Additional keyword arguments; accepted but not used by this class
        """
        super().__init__()
        self.hparams = SimpleNamespace(
            num_classes=num_classes,
            # Keep a private list copy: the default is an immutable tuple, and a list passed
            # by the caller is not aliased, so instances never share mutable state.
            num_layers=list(num_layers),
            bn_size=bn_size,
            growth_rate=growth_rate,
            act_fn_name=act_fn_name,
            act_fn=act_fn_by_name[act_fn_name],
        )
        self._create_network()
        self._init_params()

    def _create_network(self):
        """Build the input convolution, the dense/transition blocks and the output head."""
        c_hidden = self.hparams.growth_rate * self.hparams.bn_size  # The start number of hidden channels

        # A first convolution on the original image to scale up the channel size
        self.input_net = nn.Sequential(
            # No batch norm or activation function as done inside the Dense layers
            nn.Conv2d(3, c_hidden, kernel_size=3, padding=1)
        )

        # Creating the dense blocks, eventually including transition layers
        blocks = []
        last_block_idx = len(self.hparams.num_layers) - 1
        for block_idx, num_layers in enumerate(self.hparams.num_layers):
            blocks.append(
                DenseBlock(
                    c_in=c_hidden,
                    num_layers=num_layers,
                    bn_size=self.hparams.bn_size,
                    growth_rate=self.hparams.growth_rate,
                    act_fn=self.hparams.act_fn,
                )
            )
            c_hidden = c_hidden + num_layers * self.hparams.growth_rate  # Overall output of the dense block
            if block_idx < last_block_idx:  # Don't apply transition layer on last block
                blocks.append(TransitionLayer(c_in=c_hidden, c_out=c_hidden // 2, act_fn=self.hparams.act_fn))
                c_hidden = c_hidden // 2

        self.blocks = nn.Sequential(*blocks)

        # Mapping to classification output
        self.output_net = nn.Sequential(
            nn.BatchNorm2d(c_hidden),  # The features have not passed a non-linearity until here.
            self.hparams.act_fn(),
            nn.AdaptiveAvgPool2d((1, 1)),
            nn.Flatten(),
            nn.Linear(c_hidden, self.hparams.num_classes),
        )

    def _init_params(self):
        """Initialize convolutions with Kaiming-normal weights and batch norms to identity."""
        # Based on our discussion in Tutorial 4, we should initialize the
        # convolutions according to the activation function
        for m in self.modules():
            if isinstance(m, nn.Conv2d):
                nn.init.kaiming_normal_(m.weight, nonlinearity=self.hparams.act_fn_name)
            elif isinstance(m, nn.BatchNorm2d):
                nn.init.constant_(m.weight, 1)
                nn.init.constant_(m.bias, 0)

    def forward(self, x):
        """Map a batch of images to class logits."""
        x = self.input_net(x)
        x = self.blocks(x)
        x = self.output_net(x)
        return x
# Collect (name, results, model) for every architecture trained in this notebook.
all_models = [
    ("GoogleNet", googlenet_results, googlenet_model),
    ("ResNet", resnet_results, resnet_model),
    ("ResNetPreAct", resnetpreact_results, resnetpreact_model),
    ("DenseNet", densenet_results, densenet_model),
]


def _results_row(model_name, model_results, model):
    """Format one table row: name, validation/test accuracy in percent, parameter count."""
    return [
        model_name,
        f"{100.0*model_results['val']:4.2f}%",
        f"{100.0*model_results['test']:4.2f}%",
        f"{sum(np.prod(p.shape) for p in model.parameters()):,}",
    ]


table = [_results_row(*entry) for entry in all_models]
# Render the comparison as an HTML table in the notebook output.
display(
    HTML(
        tabulate.tabulate(table, tablefmt="html", headers=["Model", "Val Accuracy", "Test Accuracy", "Num Parameters"])
    )
)
+# We can conclude that for shallow networks, the place of the activation function does not seem to be crucial, although papers have reported the contrary for very deep networks (e.g. [He et al.](https://arxiv.org/abs/1603.05027)). +# +# In general, we can conclude that ResNet is a simple, but powerful architecture. +# If we applied the models to more complex tasks with larger images and more layers inside the networks, we would likely see a bigger gap between GoogleNet and skip-connection architectures like ResNet and DenseNet. +# A comparison with deeper models on CIFAR10 can, for example, be found [here](https://github.com/kuangliu/pytorch-cifar). +# Interestingly, DenseNet outperforms the original ResNet on their setup but comes close behind the Pre-Activation ResNet. +# The best model, a Dual Path Network ([Chen et al.](https://arxiv.org/abs/1707.01629)), +# is actually a combination of +# ResNet and DenseNet showing that both offer different advantages. + +# %% [markdown] +# ### Which model should I choose for my task? +# +# We have reviewed four different models. +# So, which one should we choose if we are given a new task? +# Usually, starting with a ResNet is a good idea given its superior performance on the CIFAR dataset and its simple implementation. +# Besides, for the parameter number we have chosen here, ResNet is the fastest as DenseNet and GoogleNet have many more layers that are applied in sequence in our primitive implementation. +# However, if you have a really difficult task, such as semantic +# segmentation on HD images, more complex variants of ResNet and DenseNet +# are recommended.
diff --git a/_notebooks/course_UvA-DL/04-inception-resnet-densenet/densenet_block.svg b/_notebooks/course_UvA-DL/04-inception-resnet-densenet/densenet_block.svg new file mode 100644 index 0000000..7b7c5a5 --- /dev/null +++ b/_notebooks/course_UvA-DL/04-inception-resnet-densenet/densenet_block.svg @@ -0,0 +1 @@ + diff --git a/_notebooks/course_UvA-DL/04-inception-resnet-densenet/inception_block.svg b/_notebooks/course_UvA-DL/04-inception-resnet-densenet/inception_block.svg new file mode 100644 index 0000000..be62455 --- /dev/null +++ b/_notebooks/course_UvA-DL/04-inception-resnet-densenet/inception_block.svg @@ -0,0 +1,1290 @@ + + + + + + image/svg+xmldiff --git a/_notebooks/course_UvA-DL/04-inception-resnet-densenet/resnet_block.svg b/_notebooks/course_UvA-DL/04-inception-resnet-densenet/resnet_block.svg new file mode 100644 index 0000000..f5977dc --- /dev/null +++ b/_notebooks/course_UvA-DL/04-inception-resnet-densenet/resnet_block.svg @@ -0,0 +1,1194 @@ + + + + + + image/svg+xmldiff --git a/_notebooks/course_UvA-DL/04-inception-resnet-densenet/resnet_loss_surface.png b/_notebooks/course_UvA-DL/04-inception-resnet-densenet/resnet_loss_surface.png new file mode 100644 index 0000000..01a97d8 Binary files /dev/null and b/_notebooks/course_UvA-DL/04-inception-resnet-densenet/resnet_loss_surface.png differ diff --git a/_notebooks/course_UvA-DL/04-inception-resnet-densenet/resnet_notation.svg b/_notebooks/course_UvA-DL/04-inception-resnet-densenet/resnet_notation.svg new file mode 100644 index 0000000..959a4f0 --- /dev/null +++ b/_notebooks/course_UvA-DL/04-inception-resnet-densenet/resnet_notation.svg @@ -0,0 +1,3 @@ + + +
ResNet Block 1
ResNet Block 1
ResNet Block 2
ResNet Block 2
ResNet Block 3
ResNet Block 3
ResNet Block 4
ResNet Block 4
ResNet Block 5
ResNet Block 5
ResNet Block 6
ResNet Block 6
ResNet Block 7
ResNet Block 7
ResNet Block 8
ResNet Block 8
ResNet Block 9
ResNet Block 9
Group 1 (32x32)
Group 1 (32x32)
Group 2 (16x16)
Group 2 (16x16)
Group 3 (8x8)
Group 3 (8x8)
diff --git a/_notebooks/course_UvA-DL/04-inception-resnet-densenet/tensorboard_screenshot_DenseNet.png b/_notebooks/course_UvA-DL/04-inception-resnet-densenet/tensorboard_screenshot_DenseNet.png new file mode 100644 index 0000000..7302773 Binary files /dev/null and b/_notebooks/course_UvA-DL/04-inception-resnet-densenet/tensorboard_screenshot_DenseNet.png differ diff --git a/_notebooks/course_UvA-DL/04-inception-resnet-densenet/tensorboard_screenshot_GoogleNet.png b/_notebooks/course_UvA-DL/04-inception-resnet-densenet/tensorboard_screenshot_GoogleNet.png new file mode 100644 index 0000000..36341ce Binary files /dev/null and b/_notebooks/course_UvA-DL/04-inception-resnet-densenet/tensorboard_screenshot_GoogleNet.png differ diff --git a/_notebooks/course_UvA-DL/04-inception-resnet-densenet/tensorboard_screenshot_ResNet.png b/_notebooks/course_UvA-DL/04-inception-resnet-densenet/tensorboard_screenshot_ResNet.png new file mode 100644 index 0000000..e40f156 Binary files /dev/null and b/_notebooks/course_UvA-DL/04-inception-resnet-densenet/tensorboard_screenshot_ResNet.png differ diff --git a/_notebooks/course_UvA-DL/05-transformers-and-MH-attention/.meta.yml b/_notebooks/course_UvA-DL/05-transformers-and-MH-attention/.meta.yml new file mode 100644 index 0000000..0c8a0ee --- /dev/null +++ b/_notebooks/course_UvA-DL/05-transformers-and-MH-attention/.meta.yml @@ -0,0 +1,24 @@ +title: "Tutorial 5: Transformers and Multi-Head Attention" +author: Phillip Lippe +created: 2021-06-30 +updated: 2023-03-14 +license: CC BY-SA +build: 0 +tags: + - Text +description: | + In this tutorial, we will discuss one of the most impactful architectures of the last 2 years: the Transformer model. + Since the paper Attention Is All You Need by Vaswani et al. had been published in 2017, + the Transformer architecture has continued to beat benchmarks in many domains, most importantly in Natural Language Processing. 
+ Transformers with an incredible amount of parameters can generate long, convincing essays, and opened up new application fields of AI. + As the hype of the Transformer architecture seems not to come to an end in the next years, + it is important to understand how it works, and have implemented it yourself, which we will do in this notebook. + This notebook is part of a lecture series on Deep Learning at the University of Amsterdam. + The full list of tutorials can be found at https://uvadlc-notebooks.rtfd.io. +requirements: + - torchvision + - matplotlib + - seaborn + - lightning>=2.0.0rc0 +accelerator: + - GPU diff --git a/docs/_static/images/course_UvA-DL/05-transformers-and-MH-attention.jpg b/_notebooks/course_UvA-DL/05-transformers-and-MH-attention/.thumb.jpg similarity index 100% rename from docs/_static/images/course_UvA-DL/05-transformers-and-MH-attention.jpg rename to _notebooks/course_UvA-DL/05-transformers-and-MH-attention/.thumb.jpg diff --git a/_notebooks/course_UvA-DL/05-transformers-and-MH-attention/Transformers_MHAttention.py b/_notebooks/course_UvA-DL/05-transformers-and-MH-attention/Transformers_MHAttention.py new file mode 100644 index 0000000..f74ed35 --- /dev/null +++ b/_notebooks/course_UvA-DL/05-transformers-and-MH-attention/Transformers_MHAttention.py @@ -0,0 +1,1606 @@ +# %% [markdown] +#
+# Despite the huge success of Transformers in NLP, we will _not_ include the NLP domain in our notebook here. +# There are many courses at the University of Amsterdam that focus on Natural Language Processing +# and take a closer look at the application of the Transformer architecture in NLP +# ([NLP2](https://studiegids.uva.nl/xmlpages/page/2020-2021/zoek-vak/vak/79628), +# [Advanced Topics in Computational Semantics](https://studiegids.uva.nl/xmlpages/page/2020-2021/zoek-vak/vak/80162)). +# Furthermore, and most importantly, there is so much more to the Transformer architecture. +# NLP is the domain the Transformer architecture has been originally proposed for and had the greatest impact on, +# but it also accelerated research in other domains, recently even [Computer Vision](https://arxiv.org/abs/2010.11929). +# Thus, we focus here on what makes the Transformer and self-attention so powerful in general. +# In a second notebook, we will look at Vision Transformers, i.e. Transformers for image classification +# ([link to notebook](https://uvadlc-notebooks.readthedocs.io/en/latest/tutorial_notebooks/tutorial15/Vision_Transformer.html)). +# +# Below, we import our standard libraries. 
+ +# %% +# Standard libraries +import math +import os +import urllib.request +from functools import partial +from urllib.error import HTTPError + +# PyTorch Lightning +import lightning as L + +# Plotting +import matplotlib +import matplotlib.pyplot as plt +import matplotlib_inline.backend_inline +import numpy as np +import seaborn as sns + +# PyTorch +import torch +import torch.nn as nn +import torch.nn.functional as F +import torch.optim as optim +import torch.utils.data as data + +# Torchvision +import torchvision +from lightning.pytorch.callbacks import ModelCheckpoint +from torchvision import transforms +from torchvision.datasets import CIFAR100 +from tqdm.notebook import tqdm + +plt.set_cmap("cividis") +# %matplotlib inline +matplotlib_inline.backend_inline.set_matplotlib_formats("svg", "pdf") # For export +matplotlib.rcParams["lines.linewidth"] = 2.0 +sns.reset_orig() + +# Path to the folder where the datasets are/should be downloaded (e.g. CIFAR10) +DATASET_PATH = os.environ.get("PATH_DATASETS", "data/") +# Path to the folder where the pretrained models are saved +CHECKPOINT_PATH = os.environ.get("PATH_CHECKPOINT", "saved_models/Transformers/") + +# Setting the seed +L.seed_everything(42) + +# Ensure that all operations are deterministic on GPU (if used) for reproducibility +torch.backends.cudnn.deterministic = True +torch.backends.cudnn.benchmark = False + +device = torch.device("cuda:0") if torch.cuda.is_available() else torch.device("cpu") +print("Device:", device) + +# %% [markdown] +# Two pre-trained models are downloaded below. +# Make sure to have adjusted your `CHECKPOINT_PATH` before running this code if not already done. 
# Github URL where saved models are stored for this tutorial
base_url = "https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial6/"
# Files to download
pretrained_files = ["ReverseTask.ckpt", "SetAnomalyTask.ckpt"]

# Make sure the checkpoint folder is present before writing into it
os.makedirs(CHECKPOINT_PATH, exist_ok=True)

# Fetch every checkpoint that is not available locally yet
for file_name in pretrained_files:
    file_path = os.path.join(CHECKPOINT_PATH, file_name)
    if "/" in file_name:
        # The file lives in a sub-folder of the checkpoint path; create it first
        parent_dir = file_path.rsplit("/", 1)[0]
        os.makedirs(parent_dir, exist_ok=True)
    if os.path.isfile(file_path):
        # Already downloaded, nothing to do
        continue
    file_url = base_url + file_name
    print("Downloading %s..." % file_url)
    try:
        urllib.request.urlretrieve(file_url, file_path)
    except HTTPError as e:
        # Report the failure but keep going with the remaining files
        print(
            "Something went wrong. Please try to download the file manually,"
            " or contact the author with the full output including the following error:\n",
            e,
        )
+# Below, we list a few that are worth exploring if you are interested in the topic +# and might want yet another perspective on the topic after this one: +# +# * [Transformer: A Novel Neural Network Architecture for Language Understanding +# (Jakob Uszkoreit, 2017)](https://ai.googleblog.com/2017/08/transformer-novel-neural-network.html) - The original Google blog post about the Transformer paper, focusing on the application in machine translation. +# * [The Illustrated Transformer (Jay Alammar, 2018)](http://jalammar.github.io/illustrated-transformer/) - A very popular and great blog post intuitively explaining the Transformer architecture with many nice visualizations. +# The focus is on NLP. +# * [Attention? +# Attention! +# (Lilian Weng, 2018)](https://lilianweng.github.io/lil-log/2018/06/24/attention-attention.html) - A nice blog post summarizing attention mechanisms in many domains including vision. +# * [Illustrated: Self-Attention (Raimi Karim, 2019)](https://towardsdatascience.com/illustrated-self-attention-2d627e33b20a) - A nice visualization of the steps of self-attention. +# Recommended going through if the explanation below is too abstract for you. +# * [The Transformer family (Lilian Weng, 2020)](https://lilianweng.github.io/lil-log/2020/04/07/the-transformer-family.html) - A very detailed blog post reviewing more variants of Transformers besides the original one. + +# %% [markdown] +# ### What is Attention? +# +# The attention mechanism describes a recent new group of layers in neural networks that has attracted +# a lot of interest in the past few years, especially in sequence tasks. +# There are a lot of different possible definitions of "attention" in the literature, +# but the one we will use here is the following: _the attention mechanism describes a weighted average +# of (sequence) elements with the weights dynamically computed based on an input query and elements' keys_. +# So what does this exactly mean? 
+# The goal is to take an average over the features of multiple elements. +# However, instead of weighting each element equally, we want to weight them depending on their actual values. +# In other words, we want to dynamically decide on which inputs we want to "attend" more than others. +# In particular, an attention mechanism has usually four parts we need to specify: +# +# * **Query**: The query is a feature vector that describes what we are looking for in the sequence, i.e. what would we maybe want to pay attention to. +# * **Keys**: For each input element, we have a key which is again a feature vector. +# This feature vector roughly describes what the element is "offering", or when it might be important. +# The keys should be designed such that we can identify the elements we want to pay attention to based on the query. +# * **Values**: For each input element, we also have a value vector. +# This feature vector is the one we want to average over. +# * **Score function**: To rate which elements we want to pay attention to, we need to specify a score function $f_{attn}$. +# The score function takes the query and a key as input, and output the score/attention weight of the query-key pair. +# It is usually implemented by simple similarity metrics like a dot product, or a small MLP. +# +# +# The weights of the average are calculated by a softmax over all score function outputs. +# Hence, we assign those value vectors a higher weight whose corresponding key is most similar to the query. +# If we try to describe it with pseudo-math, we can write: +# +# $$ +# \alpha_i = \frac{\exp\left(f_{attn}\left(\text{key}_i, \text{query}\right)\right)}{\sum_j \exp\left(f_{attn}\left(\text{key}_j, \text{query}\right)\right)}, \hspace{5mm} \text{out} = \sum_i \alpha_i \cdot \text{value}_i +# $$ +# +# Visually, we can show the attention over a sequence of words as follows: +# +#
+# +# For every word, we have one key and one value vector. +# The query is compared to all keys with a score function (in this case the dot product) to determine the weights. +# The softmax is not visualized for simplicity. +# Finally, the value vectors of all words are averaged using the attention weights. +# +# Most attention mechanisms differ in terms of what queries they use, how the key and value vectors are defined, +# and what score function is used. +# The attention applied inside the Transformer architecture is called **self-attention**. +# In self-attention, each sequence element provides a key, value, and query. +# For each element, we perform an attention layer where based on its query, +# we check the similarity of all sequence elements' keys, and return a different, +# averaged value vector for each element. +# We will now go into a bit more detail by first looking at the specific implementation of the attention mechanism +# which, in the Transformer case, is the scaled dot product attention. + +# %% [markdown] +# ### Scaled Dot Product Attention +# +# The core concept behind self-attention is the scaled dot product attention. +# Our goal is to have an attention mechanism with which any element in a sequence can attend to any other while +# still being efficient to compute. +# The dot product attention takes as input a set of queries +# $Q\in\mathbb{R}^{T\times d_k}$, keys $K\in\mathbb{R}^{T\times d_k}$ +# and values $V\in\mathbb{R}^{T\times d_v}$ where $T$ is the sequence length, +# and $d_k$ and $d_v$ are the hidden dimensionality for queries/keys and values respectively. +# For simplicity, we neglect the batch dimension for now. +# The attention value from element $i$ to $j$ is based on the similarity of the query $Q_i$ and key $K_j$, +# using the dot product as the similarity metric.
+# In math, we calculate the dot product attention as follows: +# +# $$\text{Attention}(Q,K,V)=\text{softmax}\left(\frac{QK^T}{\sqrt{d_k}}\right)V$$ +# +# The matrix multiplication $QK^T$ performs the dot product for every possible pair of queries and keys, +# resulting in a matrix of the shape $T\times T$. +# Each row represents the attention logits for a specific element $i$ to all other elements in the sequence. +# On these, we apply a softmax and multiply with the value vector to obtain a weighted mean +# (the weights being determined by the attention). +# Another perspective on this attention mechanism offers the computation graph which is visualized below +# (figure credit - [Vaswani et al., 2017](https://arxiv.org/abs/1706.03762)). +# +#
+# +# One aspect we haven't discussed yet is the scaling factor of $1/\sqrt{d_k}$. +# This scaling factor is crucial to maintain an appropriate variance of attention values after initialization. +# Remember that we initialize our layers with the intention of having equal variance throughout the model, and hence, +# $Q$ and $K$ might also have a variance close to $1$. +# However, performing a dot product over two vectors with a variance $\sigma^2$ results +# in a scalar having $d_k$-times higher variance: +# +# $$q_i \sim \mathcal{N}(0,\sigma^2), k_i \sim \mathcal{N}(0,\sigma^2) \to \text{Var}\left(\sum_{i=1}^{d_k} q_i\cdot k_i\right) = \sigma^4\cdot d_k$$ +# +# +# If we do not scale down the variance back to $\sim\sigma^2$, the softmax over the logits will already saturate +# to $1$ for one random element and $0$ for all others. +# The gradients through the softmax will be close to zero so that we can't learn the parameters appropriately. +# Note that the extra factor of $\sigma^2$ (i.e. $\sigma^4$ instead of $\sigma^2$) is usually not an issue, since we keep the original variance $\sigma^2$ close to $1$ anyway. +# +# The block `Mask (opt.)` in the diagram above represents the optional masking of specific entries in the attention matrix. +# This is for instance used if we stack multiple sequences with different lengths into a batch. +# To still benefit from parallelization in PyTorch, we pad the sentences to the same length and mask out the padding +# tokens during the calculation of the attention values. +# This is usually done by setting the respective attention logits to a very low value.
def scaled_dot_product(q, k, v, mask=None):
    """Compute scaled dot product attention.

    Inputs:
        q - Queries of shape [..., T, d_k]
        k - Keys of shape [..., T, d_k]
        v - Values of shape [..., T, d_v]
        mask - Optional tensor broadcastable to the attention logits [..., T, T].
               Positions where the mask equals 0 are excluded from the attention.
    Returns:
        values - Attention-weighted average of `v`, shape [..., T, d_v]
        attention - Attention weights after the softmax, shape [..., T, T]
    """
    d_k = q.size(-1)
    # Scale the logits by 1/sqrt(d_k) to keep their variance independent of d_k
    attn_logits = torch.matmul(q, k.transpose(-2, -1)) / math.sqrt(d_k)
    if mask is not None:
        # Fill masked positions with the most negative finite value of the logits' dtype.
        # A hard-coded constant such as -9e15 cannot be represented in float16, whereas
        # this works for every floating point dtype and still yields zero attention weight.
        mask_value = torch.finfo(attn_logits.dtype).min
        attn_logits = attn_logits.masked_fill(mask == 0, mask_value)
    attention = F.softmax(attn_logits, dim=-1)
    values = torch.matmul(attention, v)
    return values, attention
+# Specifically, given a query, key, and value matrix, we transform those into $h$ sub-queries, sub-keys, +# and sub-values, which we pass through the scaled dot product attention independently. +# Afterward, we concatenate the heads and combine them with a final weight matrix. +# Mathematically, we can express this operation as: +# +# $$ +# \begin{split} +# \text{Multihead}(Q,K,V) & = \text{Concat}(\text{head}_1,...,\text{head}_h)W^{O}\\ +# \text{where } \text{head}_i & = \text{Attention}(QW_i^Q,KW_i^K, VW_i^V) +# \end{split} +# $$ +# +# We refer to this as the Multi-Head Attention layer with the learnable parameters +# $W_{1...h}^{Q}\in\mathbb{R}^{D\times d_k}$, +# $W_{1...h}^{K}\in\mathbb{R}^{D\times d_k}$, +# $W_{1...h}^{V}\in\mathbb{R}^{D\times d_v}$, +# and $W^{O}\in\mathbb{R}^{h\cdot d_v\times d_{out}}$ ($D$ being the input dimensionality). +# Expressed in a computational graph, we can visualize it as below +# (figure credit - [Vaswani et al., 2017](https://arxiv.org/abs/1706.03762)). +# +#
class MultiheadAttention(nn.Module):
    """Multi-head self-attention layer.

    The input features are projected to queries, keys and values for all heads
    with a single stacked linear layer, passed through `scaled_dot_product`
    per head, and the concatenated head outputs are combined by an output projection.
    """

    def __init__(self, input_dim, embed_dim, num_heads):
        """
        Inputs:
            input_dim - Dimensionality of the input features
            embed_dim - Total dimensionality of the attention features over all heads;
                        must be divisible by `num_heads`
            num_heads - Number of attention heads
        """
        super().__init__()
        assert embed_dim % num_heads == 0, "Embedding dimension must be 0 modulo number of heads."

        self.embed_dim = embed_dim
        self.num_heads = num_heads
        self.head_dim = embed_dim // num_heads

        # Stack all weight matrices 1...h together for efficiency
        # Note that in many implementations you see "bias=False" which is optional
        self.qkv_proj = nn.Linear(input_dim, 3 * embed_dim)
        self.o_proj = nn.Linear(embed_dim, embed_dim)

        self._reset_parameters()

    def _reset_parameters(self):
        """Initialize projection weights with Xavier-uniform and biases with zero."""
        # Original Transformer initialization, see PyTorch documentation
        nn.init.xavier_uniform_(self.qkv_proj.weight)
        self.qkv_proj.bias.data.fill_(0)
        nn.init.xavier_uniform_(self.o_proj.weight)
        self.o_proj.bias.data.fill_(0)

    def forward(self, x, mask=None, return_attention=False):
        """Apply multi-head self-attention.

        Inputs:
            x - Input features of shape [Batch, SeqLen, input_dim]
            mask - Optional mask forwarded to `scaled_dot_product`
            return_attention - If True, additionally return the attention weights
        Returns:
            Output features of shape [Batch, SeqLen, embed_dim], and the attention
            weights as a second element if `return_attention` is True.
        """
        # Only batch size and sequence length are taken from the input; its feature size
        # is `input_dim`, which may differ from the attention width `self.embed_dim`.
        batch_size, seq_length, _ = x.size()
        qkv = self.qkv_proj(x)

        # Separate Q, K, V from linear output
        qkv = qkv.reshape(batch_size, seq_length, self.num_heads, 3 * self.head_dim)
        qkv = qkv.permute(0, 2, 1, 3)  # [Batch, Head, SeqLen, Dims]
        q, k, v = qkv.chunk(3, dim=-1)

        # Determine value outputs
        values, attention = scaled_dot_product(q, k, v, mask=mask)
        values = values.permute(0, 2, 1, 3)  # [Batch, SeqLen, Head, Dims]
        # Merge the heads again. Using self.embed_dim (not the input's last dimension)
        # keeps this valid when input_dim != embed_dim.
        values = values.reshape(batch_size, seq_length, self.embed_dim)
        o = self.o_proj(values)

        if return_attention:
            return o, attention
        return o
+# +# $n$ is the sequence length, $d$ is the representation dimension and $k$ is the kernel size of convolutions. +# In contrast to recurrent networks, the self-attention layer can parallelize all its operations making it much faster +# to execute for smaller sequence lengths. +# However, when the sequence length exceeds the hidden dimensionality, self-attention becomes more expensive than RNNs. +# One way of reducing the computational cost for long sequences is by restricting the self-attention to a neighborhood +# of inputs to attend over, denoted by $r$. +# Nevertheless, there has been recently a lot of work on more efficient Transformer architectures that still allow long +# dependencies, of which you can find an overview in the paper by [Tay et al. +# (2020)](https://arxiv.org/abs/2009.06732) if interested. + +# %% [markdown] +# ### Transformer Encoder +# +#
+# +# Next, we will look at how to apply the multi-head attention block inside the Transformer architecture. +# Originally, the Transformer model was designed for machine translation. +# Hence, it got an encoder-decoder structure where the encoder takes as input the sentence in the original language +# and generates an attention-based representation. +# On the other hand, the decoder attends over the encoded information and generates the translated sentence +# in an autoregressive manner, as in a standard RNN. +# While this structure is extremely useful for Sequence-to-Sequence tasks with the necessity of autoregressive decoding, +# we will focus here on the encoder part. +# Many advances in NLP have been made using pure encoder-based Transformer models (if interested, models include the +# [BERT](https://arxiv.org/abs/1810.04805)-family, +# the [Vision Transformer](https://arxiv.org/abs/2010.11929), and more), +# and in our tutorial, we will also mainly focus on the encoder part. +# If you have understood the encoder architecture, the decoder is a very small step to implement as well. +# The full Transformer architecture looks as follows +# (figure credit - [Vaswani et al., 2017](https://arxiv.org/abs/1706.03762)): +# +#
+# +# The encoder consists of $N$ identical blocks that are applied in sequence. +# Taking as input $x$, it is first passed through a Multi-Head Attention block as we have implemented above. +# The output is added to the original input using a residual connection, +# and we apply a consecutive Layer Normalization on the sum. +# Overall, it calculates $\text{LayerNorm}(x+\text{Multihead}(x,x,x))$ +# ($x$ being $Q$, $K$ and $V$ input to the attention layer). +# The residual connection is crucial in the Transformer architecture for two reasons: +# +# 1. +# Similar to ResNets, Transformers are designed to be very deep. +# Some models contain more than 24 blocks in the encoder. +# Hence, the residual connections are crucial for enabling a smooth gradient flow through the model. +# 2. +# Without the residual connection, the information about the original sequence is lost. +# Remember that the Multi-Head Attention layer ignores the position of elements in a sequence, +# and can only learn it based on the input features. +# Removing the residual connections would mean that this information is lost after the first attention layer +# (after initialization), and with a randomly initialized query and key vector, +# the output vectors for position $i$ has no relation to its original input. +# All outputs of the attention are likely to represent similar/same information, +# and there is no chance for the model to distinguish which information came from which input element. +# An alternative option to residual connection would be to fix at least one head to focus on its original input, +# but this is very inefficient and does not have the benefit of the improved gradient flow. +# +# The Layer Normalization also plays an important role in the Transformer architecture as it enables faster +# training and provides small regularization. +# Additionally, it ensures that the features are in a similar magnitude among the elements in the sequence. 
+# We are not using Batch Normalization because it depends on the batch size which is often small with Transformers +# (they require a lot of GPU memory), and BatchNorm has been shown to perform particularly badly in language +# as the features of words tend to have a much higher variance (there are many, very rare words +# which need to be considered for a good distribution estimate). +# +# In addition to the Multi-Head Attention, a small fully connected feed-forward network is added to the model, +# which is applied to each position separately and identically. +# Specifically, the model uses a Linear$\to$ReLU$\to$Linear MLP. +# The full transformation including the residual connection can be expressed as: +# +# $$ +# \begin{split} +# \text{FFN}(x) & = \max(0, xW_1+b_1)W_2 + b_2\\ +# x & = \text{LayerNorm}(x + \text{FFN}(x)) +# \end{split} +# $$ +# +# This MLP adds extra complexity to the model and allows transformations on each sequence element separately. +# You can think of this as allowing the model to "post-process" the new information added +# by the previous Multi-Head Attention, and prepare it for the next attention block. +# Usually, the inner dimensionality of the MLP is 2-8$\times$ larger than $d_{\text{model}}$, +# i.e. the dimensionality of the original input $x$. +# The general advantage of a wider layer instead of a narrow, multi-layer MLP is the faster, parallelizable execution. +# +# Finally, after looking at all parts of the encoder architecture, we can start implementing it below. +# We first start by implementing a single encoder block. +# In addition to the layers described above, we will add dropout layers in the MLP and on the output +# of the MLP and Multi-Head Attention for regularization.
# %%
class EncoderBlock(nn.Module):
    """One Transformer encoder block: self-attention and an MLP, each followed by
    dropout, a residual addition and a LayerNorm."""

    def __init__(self, input_dim, num_heads, dim_feedforward, dropout=0.0):
        """
        Args:
            input_dim: Dimensionality of the input
            num_heads: Number of heads to use in the attention block
            dim_feedforward: Dimensionality of the hidden layer in the MLP
            dropout: Dropout probability to use in the dropout layers
        """
        super().__init__()

        # Self-attention that keeps the feature size (embed_dim == input_dim)
        self.self_attn = MultiheadAttention(input_dim, input_dim, num_heads)

        # Position-wise two-layer MLP: input_dim -> dim_feedforward -> input_dim
        mlp_layers = [
            nn.Linear(input_dim, dim_feedforward),
            nn.Dropout(dropout),
            nn.ReLU(inplace=True),
            nn.Linear(dim_feedforward, input_dim),
        ]
        self.linear_net = nn.Sequential(*mlp_layers)

        # Normalization after each residual sum, plus the dropout shared by both sub-layers
        self.norm1 = nn.LayerNorm(input_dim)
        self.norm2 = nn.LayerNorm(input_dim)
        self.dropout = nn.Dropout(dropout)

    def forward(self, x, mask=None):
        """Return ``x`` after the attention and MLP sub-layers; ``mask`` goes to the attention."""
        # Attention sub-layer: LayerNorm(x + Dropout(Attention(x)))
        x = self.norm1(x + self.dropout(self.self_attn(x, mask=mask)))
        # MLP sub-layer: LayerNorm(x + Dropout(MLP(x)))
        return self.norm2(x + self.dropout(self.linear_net(x)))


# %% [markdown]
# Based on this block, we can implement a module for the full Transformer encoder.
# Additionally to a forward function that iterates through the sequence of encoder blocks,
# we also provide a function called `get_attention_maps`.
# The idea of this function is to return the attention probabilities for all Multi-Head Attention blocks in the encoder.
# This helps us in understanding, and in a sense, explaining the model.
# However, the attention probabilities should be interpreted with a grain of salt as it does not necessarily
# reflect the true interpretation of the model (there is a series of papers about this,
# including [Attention is not Explanation](https://arxiv.org/abs/1902.10186)
# and [Attention is not not Explanation](https://arxiv.org/abs/1908.04626)).
# %%
class TransformerEncoder(nn.Module):
    """A stack of ``num_layers`` ``EncoderBlock`` modules applied one after another.

    Args:
        num_layers: Number of encoder blocks to create.
        **block_args: Keyword arguments passed unchanged to every ``EncoderBlock``.
    """

    def __init__(self, num_layers, **block_args):
        super().__init__()
        self.layers = nn.ModuleList([EncoderBlock(**block_args) for _ in range(num_layers)])

    def forward(self, x, mask=None):
        """Run ``x`` through all blocks in order, giving each block the same ``mask``."""
        for layer in self.layers:
            x = layer(x, mask=mask)
        return x

    def get_attention_maps(self, x, mask=None):
        """Collect the attention of every block for the input ``x``.

        Args:
            x: Input to the first block.
            mask: Optional mask, used both for the recorded attention and for
                propagating ``x`` to the next block.

        Returns:
            A list with one entry per block, holding what that block's
            ``self_attn`` returns as attention.
        """
        attention_maps = []
        for layer in self.layers:
            _, attn_map = layer.self_attn(x, mask=mask, return_attention=True)
            attention_maps.append(attn_map)
            # Propagate with the mask, exactly like forward(); otherwise the maps of
            # later blocks would be computed on activations the model never sees.
            x = layer(x, mask=mask)
        return attention_maps


# %% [markdown]
# ### Positional encoding
#
# We have discussed before that the Multi-Head Attention block is permutation-equivariant,
# and cannot distinguish whether an input comes before another one in the sequence or not.
# In tasks like language understanding, however, the position is important for interpreting the input words.
# The position information can therefore be added via the input features.
# We could learn an embedding for every possible position, but this would not generalize to a dynamical
# input sequence length.
# Hence, the better option is to use feature patterns that the network can identify from the features
# and potentially generalize to larger sequences.
# The specific pattern chosen by Vaswani et al.
# are sine and cosine functions of different frequencies, as follows:
#
# $$
# PE_{(pos,i)} = \begin{cases}
# \sin\left(\frac{pos}{10000^{i/d_{\text{model}}}}\right) & \text{if}\hspace{3mm} i \text{ mod } 2=0\\
# \cos\left(\frac{pos}{10000^{(i-1)/d_{\text{model}}}}\right) & \text{otherwise}\\
# \end{cases}
# $$
#
# $PE_{(pos,i)}$ represents the position encoding at position $pos$ in the sequence, and hidden dimensionality $i$.
# These values, concatenated for all hidden dimensions, are added to the original input features
# (in the Transformer visualization above, see "Positional encoding"), and constitute the position information.
# We distinguish between even ($i \text{ mod } 2=0$) and uneven ($i \text{ mod } 2=1$)
# hidden dimensionalities where we apply a sine/cosine respectively.
# The intuition behind this encoding is that you can represent $PE_{(pos+k,:)}$ as a linear function
# of $PE_{(pos,:)}$, which might allow the model to easily attend to relative positions.
# The wavelengths in different dimensions range from $2\pi$ to $10000\cdot 2\pi$.
#
# The positional encoding is implemented below.
# The code is taken from the [PyTorch tutorial](https://pytorch.org/tutorials/beginner/transformer_tutorial.html#define-the-model)
# about Transformers on NLP and adjusted for our purposes.


# %%
class PositionalEncoding(nn.Module):
    """Adds fixed sine/cosine positional encodings to a [Batch, SeqLen, d_model] input."""

    def __init__(self, d_model, max_len=5000):
        """
        Args:
            d_model: Hidden dimensionality of the input (even or odd).
            max_len: Maximum length of a sequence to expect.
        """
        super().__init__()

        # Create matrix of [SeqLen, HiddenDim] representing the positional encoding for max_len inputs
        pe = torch.zeros(max_len, d_model)
        position = torch.arange(0, max_len, dtype=torch.float).unsqueeze(1)
        div_term = torch.exp(torch.arange(0, d_model, 2).float() * (-math.log(10000.0) / d_model))
        angles = position * div_term  # [max_len, ceil(d_model / 2)]
        pe[:, 0::2] = torch.sin(angles)
        # For odd d_model there is one cosine column fewer than sine columns,
        # so only the first d_model // 2 frequencies are used here.
        pe[:, 1::2] = torch.cos(angles[:, : d_model // 2])
        pe = pe.unsqueeze(0)

        # register_buffer => Tensor which is not a parameter, but should be part of the modules state.
        # Used for tensors that need to be on the same device as the module.
        # persistent=False tells PyTorch to not add the buffer to the state dict (e.g. when we save the model)
        self.register_buffer("pe", pe, persistent=False)

    def forward(self, x):
        """Return ``x`` plus the encodings of the first ``x.size(1)`` positions."""
        x = x + self.pe[:, : x.size(1)]
        return x


# %% [markdown]
# To understand the positional encoding, we can visualize it below.
# We will generate an image of the positional encoding over hidden dimensionality and position in a sequence.
# Each pixel, therefore, represents the change of the input feature we perform to encode the specific position.
# Let's do it below.

# %%
# Encoding table as a [HiddenDim, SeqLen] numpy array
encod_block = PositionalEncoding(d_model=48, max_len=96)
pe = encod_block.pe.squeeze().T.cpu().numpy()

fig, ax = plt.subplots(nrows=1, ncols=1, figsize=(8, 3))
# The extent makes both axes start at 1 instead of 0
pos = ax.imshow(pe, cmap="RdGy", extent=(1, pe.shape[1] + 1, pe.shape[0] + 1, 1))
fig.colorbar(pos, ax=ax)
ax.set_xlabel("Position in sequence")
ax.set_ylabel("Hidden dimension")
ax.set_title("Positional encoding over hidden dimensions")
# Ticks at 1 and at every multiple of 10 that fits on the axis
ax.set_xticks([1] + list(range(10, 10 * (pe.shape[1] // 10) + 1, 10)))
ax.set_yticks([1] + list(range(10, 10 * (pe.shape[0] // 10) + 1, 10)))
plt.show()

# %% [markdown]
# You can clearly see the sine and cosine waves with different wavelengths that encode the position
# in the hidden dimensions.
# Specifically, we can look at the sine/cosine wave for each hidden dimension separately,
# to get a better intuition of the pattern.
# Below we visualize the positional encoding for the hidden dimensions $1$, $2$, $3$ and $4$.

# %%
sns.set_theme()
fig, ax = plt.subplots(2, 2, figsize=(12, 4))
# Flatten the 2x2 grid of axes row by row
ax = list(ax.flat)
for i, panel in enumerate(ax):
    # One panel per hidden dimension, showing the first 16 positions
    panel.plot(np.arange(1, 17), pe[i, :16], color="C%i" % i, marker="o", markersize=6, markeredgecolor="black")
    panel.set_title("Encoding in hidden dimension %i" % (i + 1))
    panel.set_xlabel("Position in sequence", fontsize=10)
    panel.set_ylabel("Positional encoding", fontsize=10)
    panel.set_xticks(np.arange(1, 17))
    panel.tick_params(axis="both", which="major", labelsize=10)
    panel.tick_params(axis="both", which="minor", labelsize=8)
    panel.set_ylim(-1.2, 1.2)
fig.subplots_adjust(hspace=0.8)
sns.reset_orig()
plt.show()

# %% [markdown]
# As we can see, the patterns between the hidden dimension $1$ and $2$ only differ in the starting angle.
# The wavelength is $2\pi$, hence the repetition after position $6$.
+# The hidden dimensions $3$ and $4$ share a longer wavelength, about $1.5\times$ that of dimensions $1$ and $2$ for $d_{\text{model}}=48$. + +# %% [markdown] +# ### Learning rate warm-up +# +# One commonly used technique for training a Transformer is learning rate warm-up. +# This means that we gradually increase the learning rate from 0 up to our originally specified +# learning rate in the first few iterations. +# Thus, we slowly start learning instead of taking very large steps from the beginning. +# In fact, training a deep Transformer without learning rate warm-up can make the model diverge +# and achieve a much worse performance on training and testing. +# Take for instance the following plot by [Liu et al. +# (2019)](https://arxiv.org/pdf/1908.03265.pdf) comparing Adam-vanilla (i.e. Adam without warm-up) +# vs Adam with a warm-up: +# +#
+# +# Clearly, the warm-up is a crucial hyperparameter in the Transformer architecture. +# Why is it so important? +# There are currently two common explanations. +# Firstly, Adam uses the bias correction factors which however can lead to a higher variance in the adaptive +# learning rate during the first iterations. +# Improved optimizers like [RAdam](https://arxiv.org/abs/1908.03265) have been shown to overcome this issue, +# not requiring warm-up for training Transformers. +# Secondly, the iteratively applied Layer Normalization across layers can lead to very high gradients during +# the first iterations, which can be solved by using Pre-Layer Normalization +# (similar to Pre-Activation ResNet), or replacing Layer Normalization by other techniques +# (Adaptive Normalization, +# [Power Normalization](https://arxiv.org/abs/2003.07845)). +# +# Nevertheless, many applications and papers still use the original Transformer architecture with Adam, +# because warm-up is a simple, yet effective way of solving the gradient problem in the first iterations. +# There are many different schedulers we could use. +# For instance, the original Transformer paper used an exponential decay scheduler with a warm-up. +# However, the currently most popular scheduler is the cosine warm-up scheduler, +# which combines warm-up with a cosine-shaped learning rate decay. +# We can implement it below, and visualize the learning rate factor over epochs. 
# %%
class CosineWarmupScheduler(optim.lr_scheduler._LRScheduler):
    """Learning rate schedule with a linear warm-up multiplied onto a cosine decay.

    Args:
        optimizer: Optimizer whose learning rates are scheduled.
        warmup: Number of warm-up steps. ``0`` disables the warm-up.
        max_iters: Step at which the cosine factor reaches 0.
    """

    def __init__(self, optimizer, warmup, max_iters):
        # Must be set before the base constructor runs, since it already queries get_lr()
        self.warmup = warmup
        self.max_num_iters = max_iters
        super().__init__(optimizer)

    def get_lr(self):
        """Scale every base learning rate by the factor of the current step."""
        lr_factor = self.get_lr_factor(epoch=self.last_epoch)
        return [base_lr * lr_factor for base_lr in self.base_lrs]

    def get_lr_factor(self, epoch):
        """Return ``0.5 * (1 + cos(pi * epoch / max_iters))``, additionally scaled by
        ``epoch / warmup`` while ``epoch <= warmup``."""
        lr_factor = 0.5 * (1 + np.cos(np.pi * epoch / self.max_num_iters))
        # warmup == 0 means "no warm-up"; without this guard step 0 would divide by zero
        if self.warmup > 0 and epoch <= self.warmup:
            lr_factor *= epoch * 1.0 / self.warmup
        return lr_factor


# %%
# Needed for initializing the lr scheduler
p = nn.Parameter(torch.empty(4, 4))
optimizer = optim.Adam([p], lr=1e-3)
lr_scheduler = CosineWarmupScheduler(optimizer=optimizer, warmup=100, max_iters=2000)

# Plotting
epochs = list(range(2000))
sns.set()
plt.figure(figsize=(8, 3))
plt.plot(epochs, [lr_scheduler.get_lr_factor(e) for e in epochs])
plt.ylabel("Learning rate factor")
plt.xlabel("Iterations (in batches)")
plt.title("Cosine Warm-up Learning Rate Scheduler")
plt.show()
sns.reset_orig()

# %% [markdown]
# In the first 100 iterations, we increase the learning rate factor from 0 to 1,
# whereas for all later iterations, we decay it using the cosine wave.
# Pre-implementations of this scheduler can be found in the popular NLP Transformer library
# [huggingface](https://huggingface.co/transformers/main_classes/optimizer_schedules.html?highlight=cosine#transformers.get_cosine_schedule_with_warmup).

# %% [markdown]
# ### PyTorch Lightning Module
#
# Finally, we can embed the Transformer architecture into a PyTorch lightning module.
# From Tutorial 5, you know that PyTorch Lightning simplifies our training and test code,
# as well as structures the code nicely in separate functions.
# We will implement a template for a classifier based on the Transformer encoder.
# Thereby, we have a prediction output per sequence element.
# If we would need a classifier over the whole sequence, the common approach is to add an additional
# `[CLS]` token to the sequence, representing the classifier token.
# However, here we focus on tasks where we have an output per element.
#
# Additionally to the Transformer architecture, we add a small input network (maps input dimensions to model dimensions),
# the positional encoding, and an output network (transforms output encodings to predictions).
# We also add the learning rate scheduler, which takes a step each iteration instead of once per epoch.
# This is needed for the warmup and the smooth cosine decay.
# The training, validation, and test step is left empty for now and will be filled for our task-specific models.


# %%
class TransformerPredictor(L.LightningModule):
    """Template for a per-element classifier built around ``TransformerEncoder``.

    Subclasses provide ``training_step``, ``validation_step`` and ``test_step``.
    """

    def __init__(
        self,
        input_dim,
        model_dim,
        num_classes,
        num_heads,
        num_layers,
        lr,
        warmup,
        max_iters,
        dropout=0.0,
        input_dropout=0.0,
    ):
        """
        Args:
            input_dim: Hidden dimensionality of the input
            model_dim: Hidden dimensionality to use inside the Transformer
            num_classes: Number of classes to predict per sequence element
            num_heads: Number of heads to use in the Multi-Head Attention blocks
            num_layers: Number of encoder blocks to use.
            lr: Learning rate in the optimizer
            warmup: Number of warmup steps. Usually between 50 and 500
            max_iters: Number of maximum iterations the model is trained for.
                This is needed for the CosineWarmup scheduler
            dropout: Dropout to apply inside the model
            input_dropout: Dropout to apply on the input features
        """
        super().__init__()
        # Stores all constructor arguments in self.hparams
        self.save_hyperparameters()
        self._create_model()

    def _create_model(self):
        """Build the input network, positional encoding, encoder and output network."""
        hp = self.hparams
        # Input dim -> Model dim
        self.input_net = nn.Sequential(nn.Dropout(hp.input_dropout), nn.Linear(hp.input_dim, hp.model_dim))
        # Positional encoding for sequences
        self.positional_encoding = PositionalEncoding(d_model=hp.model_dim)
        # Transformer
        self.transformer = TransformerEncoder(
            num_layers=hp.num_layers,
            input_dim=hp.model_dim,
            dim_feedforward=2 * hp.model_dim,
            num_heads=hp.num_heads,
            dropout=hp.dropout,
        )
        # Output classifier per sequence element
        self.output_net = nn.Sequential(
            nn.Linear(hp.model_dim, hp.model_dim),
            nn.LayerNorm(hp.model_dim),
            nn.ReLU(inplace=True),
            nn.Dropout(hp.dropout),
            nn.Linear(hp.model_dim, hp.num_classes),
        )

    def _embed_input(self, x, add_positional_encoding):
        """Map the raw features to model dimension and optionally add the positional encoding."""
        x = self.input_net(x)
        return self.positional_encoding(x) if add_positional_encoding else x

    def forward(self, x, mask=None, add_positional_encoding=True):
        """
        Args:
            x: Input features of shape [Batch, SeqLen, input_dim]
            mask: Mask to apply on the attention outputs (optional)
            add_positional_encoding: If True, we add the positional encoding to the input.
                                      Might not be desired for some tasks.
        """
        x = self._embed_input(x, add_positional_encoding)
        x = self.transformer(x, mask=mask)
        return self.output_net(x)

    @torch.no_grad()
    def get_attention_maps(self, x, mask=None, add_positional_encoding=True):
        """Function for extracting the attention matrices of the whole Transformer for a single batch.

        Input arguments same as the forward pass.
        """
        x = self._embed_input(x, add_positional_encoding)
        return self.transformer.get_attention_maps(x, mask=mask)

    def configure_optimizers(self):
        """Create the Adam optimizer and keep the warm-up scheduler on ``self``."""
        optimizer = optim.Adam(self.parameters(), lr=self.hparams.lr)

        # We don't return the lr scheduler because we need to apply it per iteration, not per epoch
        self.lr_scheduler = CosineWarmupScheduler(
            optimizer, warmup=self.hparams.warmup, max_iters=self.hparams.max_iters
        )
        return optimizer

    def optimizer_step(self, *args, **kwargs):
        """Run the regular optimizer step, then advance the scheduler by one step."""
        super().optimizer_step(*args, **kwargs)
        self.lr_scheduler.step()  # Step per iteration

    def training_step(self, batch, batch_idx):
        raise NotImplementedError

    def validation_step(self, batch, batch_idx):
        raise NotImplementedError

    def test_step(self, batch, batch_idx):
        raise NotImplementedError


# %% [markdown]
# ## Experiments
#
#
#
# After having finished the implementation of the Transformer architecture, we can start experimenting
# and apply it to various tasks.
# In this notebook, we will focus on two tasks: parallel Sequence-to-Sequence, and set anomaly detection.
# The two tasks focus on different properties of the Transformer architecture, and we go through them below.
#
# ### Sequence to Sequence
#
# A Sequence-to-Sequence task represents a task where the input _and_ the output is a sequence,
# not necessarily of the same length.
# Popular tasks in this domain include machine translation and summarization.
# For this, we usually have a Transformer encoder for interpreting the input sequence,
# and a decoder for generating the output in an autoregressive manner.
# Here, however, we will go back to a much simpler example task and use only the encoder.
# Given a sequence of $N$ numbers between $0$ and $M$, the task is to reverse the input sequence.
# In Numpy notation, if our input is $x$, the output should be $x$[::-1].
# Although this task sounds very simple, RNNs can have issues with such because the task requires long-term dependencies.
# Transformers are built to support such, and hence, we expect it to perform very well.
#
# First, let's create a dataset class below.


# %%
class ReverseDataset(data.Dataset):
    """Random integer sequences paired with the same sequence in reversed order."""

    def __init__(self, num_categories, seq_len, size):
        """
        Args:
            num_categories: Exclusive upper bound of the integers drawn for the sequences.
            seq_len: Length of every sequence.
            size: Number of sequences in the dataset.
        """
        super().__init__()
        self.num_categories = num_categories
        self.seq_len = seq_len
        self.size = size

        # All sequences are drawn once, up front, as a [size, seq_len] integer tensor
        self.data = torch.randint(num_categories, size=(size, seq_len))

    def __len__(self):
        return self.size

    def __getitem__(self, idx):
        """Return ``(sequence, sequence flipped along its first dimension)``."""
        sequence = self.data[idx]
        return sequence, sequence.flip(0)


# %% [markdown]
# We create an arbitrary number of random sequences of numbers between 0 and `num_categories-1`.
# The label is simply the tensor flipped over the sequence dimension.
# We can create the corresponding data loaders below.
# %%
# Factory with the first two ReverseDataset arguments fixed to 10 and 16;
# only the remaining argument (the dataset size) differs between the splits.
dataset = partial(ReverseDataset, 10, 16)
# Only the training loader shuffles and drops the last incomplete batch
train_loader = data.DataLoader(dataset(50000), batch_size=128, shuffle=True, drop_last=True, pin_memory=True)
val_loader = data.DataLoader(dataset(1000), batch_size=128)
test_loader = data.DataLoader(dataset(10000), batch_size=128)

# %% [markdown]
# Let's look at an arbitrary sample of the dataset:

# %%
# Index the underlying dataset directly to get a single (input, label) pair
inp_data, labels = train_loader.dataset[0]
print("Input data:", inp_data)
print("Labels: ", labels)

# %% [markdown]
# During training, we pass the input sequence through the Transformer encoder and predict the output for each input token.
# We use the standard Cross-Entropy loss to perform this.
# Every number is represented as a one-hot vector.
# Remember that representing the categories as single scalars decreases the expressiveness of the model extremely
# as $0$ and $1$ are not closer related than $0$ and $9$ in our example.
# An alternative to a one-hot vector is using a learned embedding vector as it is provided by the PyTorch module `nn.Embedding`.
# However, using a one-hot vector with an additional linear layer as in our case has the same effect
# as an embedding layer (`self.input_net` maps one-hot vector to a dense vector,
# where each column of the `nn.Linear` weight matrix represents the embedding for a specific category).
#
# To implement the training dynamic, we create a new class inheriting from `TransformerPredictor`
# and overwriting the training, validation and test step functions.
# %%
class ReversePredictor(TransformerPredictor):
    """``TransformerPredictor`` whose steps compute cross-entropy and accuracy on (input, label) batches."""

    def _calculate_loss(self, batch, mode="train"):
        """Compute, log and return ``(loss, accuracy)`` for one batch.

        Args:
            batch: Tuple ``(inp_data, labels)`` of integer category tensors.
            mode: Prefix for the logged metric names.
        """
        tokens, labels = batch
        # Integer categories -> one-hot float features
        features = F.one_hot(tokens, num_classes=self.hparams.num_classes).float()

        preds = self.forward(features, add_positional_encoding=True)
        # Merge all leading dimensions so the loss sees [N, num_classes] logits and [N] targets
        flat_logits = preds.view(-1, preds.size(-1))
        loss = F.cross_entropy(flat_logits, labels.view(-1))
        acc = (preds.argmax(dim=-1) == labels).float().mean()

        # Logging
        self.log("%s_loss" % mode, loss)
        self.log("%s_acc" % mode, acc)
        return loss, acc

    def training_step(self, batch, batch_idx):
        # Only the loss is returned to Lightning
        return self._calculate_loss(batch, mode="train")[0]

    def validation_step(self, batch, batch_idx):
        self._calculate_loss(batch, mode="val")

    def test_step(self, batch, batch_idx):
        self._calculate_loss(batch, mode="test")


# %% [markdown]
# Finally, we can create a training function similar to the one we have seen in Tutorial 5 for PyTorch Lightning.
# We create a `L.Trainer` object, running for $N$ epochs, logging in TensorBoard, and saving our best model based on the validation.
# Afterward, we test our models on the test set.
# An additional parameter we pass to the trainer here is `gradient_clip_val`.
# This clips the norm of the gradients for all parameters before taking an optimizer step and prevents the model
# from diverging if we obtain very high gradients at, for instance, sharp loss surfaces (see many good blog posts
# on gradient clipping, like [DeepAI glossary](https://deepai.org/machine-learning-glossary-and-terms/gradient-clipping)).
# For Transformers, gradient clipping can help to further stabilize the training during the first few iterations, and also afterward.
# In plain PyTorch, you can apply gradient clipping via `torch.nn.utils.clip_grad_norm_(...)`
# (see [documentation](https://pytorch.org/docs/stable/generated/torch.nn.utils.clip_grad_norm_.html#torch.nn.utils.clip_grad_norm_)).
# The clip value is usually between 0.5 and 10, depending on how harsh you want to clip large gradients.
# After having explained this, let's implement the training function:


# %%
def train_reverse(**kwargs):
    """Train (or load) a ``ReversePredictor`` and evaluate it on the validation and test loaders.

    Args:
        **kwargs: Constructor arguments for ``ReversePredictor`` other than ``max_iters``;
            only used when no pretrained checkpoint file is found.

    Returns:
        Tuple ``(model, result)`` where ``result`` maps ``"test_acc"`` and ``"val_acc"``
        to the accuracies measured with ``trainer.test``.
    """
    # Trainer that checkpoints on the highest "val_acc" and clips gradients
    root_dir = os.path.join(CHECKPOINT_PATH, "ReverseTask")
    os.makedirs(root_dir, exist_ok=True)
    checkpoint_callback = ModelCheckpoint(save_weights_only=True, mode="max", monitor="val_acc")
    trainer = L.Trainer(
        default_root_dir=root_dir,
        callbacks=[checkpoint_callback],
        accelerator="auto",
        devices=1,
        max_epochs=10,
        gradient_clip_val=5,
    )
    trainer.logger._default_hp_metric = None  # Optional logging argument that we don't need

    # Train from scratch unless a pretrained checkpoint file exists
    pretrained_filename = os.path.join(CHECKPOINT_PATH, "ReverseTask.ckpt")
    if not os.path.isfile(pretrained_filename):
        # The scheduler steps once per batch, hence epochs * batches-per-epoch iterations
        model = ReversePredictor(max_iters=trainer.max_epochs * len(train_loader), **kwargs)
        trainer.fit(model, train_loader, val_loader)
    else:
        print("Found pretrained model, loading...")
        model = ReversePredictor.load_from_checkpoint(pretrained_filename)

    # Evaluate this model object on both splits. The test loop logs under "test_acc",
    # so the validation accuracy is read from that key as well.
    val_result = trainer.test(model, dataloaders=val_loader, verbose=False)
    test_result = trainer.test(model, dataloaders=test_loader, verbose=False)
    result = {"test_acc": test_result[0]["test_acc"], "val_acc": val_result[0]["test_acc"]}

    return model.to(device), result


# %% [markdown]
# Finally, we can train the model.
# In this setup, we will use a single encoder block and a single head in the Multi-Head Attention.
# This is chosen because of the simplicity of the task, and in this case, the attention can actually be interpreted
# as an "explanation" of the predictions (compared to the other papers above dealing with deep Transformers).

# %%
# Input and output sizes both equal the number of categories, because the inputs
# are fed in as one-hot vectors and one class is predicted per category.
reverse_model, reverse_result = train_reverse(
    input_dim=train_loader.dataset.num_categories,
    model_dim=32,
    num_heads=1,
    num_classes=train_loader.dataset.num_categories,
    num_layers=1,
    dropout=0.0,
    lr=5e-4,
    warmup=50,
)

# %% [markdown]
# The warning of PyTorch Lightning regarding the number of workers can be ignored for now.
# As the data set is so simple and the `__getitem__` finishes in a negligible time, we don't need subprocesses
# to provide us the data (in fact, more workers can slow down the training as we have communication overhead among processes/threads).
# First, let's print the results:

# %%
# Accuracies are stored as fractions; print them as percentages
print("Val accuracy: %4.2f%%" % (100.0 * reverse_result["val_acc"]))
print("Test accuracy: %4.2f%%" % (100.0 * reverse_result["test_acc"]))

# %% [markdown]
# As we would have expected, the Transformer can correctly solve the task.
# However, what does the attention in the Multi-Head Attention block look like for an arbitrary input?
# Let's try to visualize it below.

# %%
# Take the first validation batch and prepare it as in ReversePredictor._calculate_loss (one-hot floats)
data_input, labels = next(iter(val_loader))
inp_data = F.one_hot(data_input, num_classes=reverse_model.hparams.num_classes).float()
inp_data = inp_data.to(device)
attention_maps = reverse_model.get_attention_maps(inp_data)

# %% [markdown]
# The object `attention_maps` is a list of length $N$ where $N$ is the number of layers.
# Each element is a tensor of shape [Batch, Heads, SeqLen, SeqLen], which we can verify below.

# %%
attention_maps[0].shape

# %% [markdown]
# Next, we will write a plotting function that takes as input the sequences, attention maps, and an index
# indicating for which batch element we want to visualize the attention map.
# We will create a plot where over rows, we have different layers, while over columns, we show the different heads.
# Remember that the softmax has been applied for each row separately.


# %%
def plot_attention_maps(input_data, attn_maps, idx=0):
    """Plot the attention maps of one batch element as a grid (rows: layers, columns: heads).

    Args:
        input_data: Batch of input sequences used for the tick labels, or None to
            label the ticks with the positions 0..SeqLen-1.
        attn_maps: List with one attention tensor per layer; each is indexed as
            ``m[idx]`` and then per head.
        idx: Index of the batch element to visualize.
    """
    if input_data is None:
        input_data = np.arange(attn_maps[0][idx].shape[-1])
    else:
        input_data = input_data[idx].detach().cpu().numpy()
    attn_maps = [m[idx].detach().cpu().numpy() for m in attn_maps]

    num_layers = len(attn_maps)
    num_heads = attn_maps[0].shape[0]
    seq_len = input_data.shape[0]
    fig_size = 4 if num_heads == 1 else 3
    # squeeze=False always yields a 2D grid of axes, even for a single layer or head
    fig, ax = plt.subplots(
        num_layers, num_heads, figsize=(num_heads * fig_size, num_layers * fig_size), squeeze=False
    )
    for row, layer_maps in enumerate(attn_maps):
        for column in range(num_heads):
            panel = ax[row][column]
            panel.imshow(layer_maps[column], origin="lower", vmin=0)
            # Label both axes with the sequence elements
            panel.set_xticks(list(range(seq_len)))
            panel.set_xticklabels(input_data.tolist())
            panel.set_yticks(list(range(seq_len)))
            panel.set_yticklabels(input_data.tolist())
            panel.set_title("Layer %i, Head %i" % (row + 1, column + 1))
    fig.subplots_adjust(hspace=0.5)
    plt.show()


# %% [markdown]
# Finally, we can plot the attention map of our trained Transformer on the reverse task:

# %%
plot_attention_maps(data_input, attention_maps, idx=0)

# %% [markdown]
# The model has learned to attend to the token that is on the flipped index of itself.
# Hence, it actually does what we intended it to do.
# We see that it however also pays some attention to values close to the flipped index.
# This is because the model doesn't need the perfect, hard attention to solve this problem,
# but is fine with this approximate, noisy attention map.
# The close-by indices are caused by the similarity of the positional encoding,
# which we also intended with the positional encoding.
+ +# %% [markdown] +# ### Set Anomaly Detection +# +# Besides sequences, sets are another data structure that is relevant for many applications. +# In contrast to sequences, elements are unordered in a set. +# RNNs can only be applied on sets by assuming an order in the data, which however biases the model towards +# a non-existing order in the data. +# [Vinyals et al. +# (2015)](https://arxiv.org/abs/1511.06391) and other papers have shown that the assumed order can have a significant +# impact on the model's performance, and hence, we should try to not use RNNs on sets. +# Ideally, our model should be permutation-equivariant/invariant such that the output is the same no matter how we sort the elements in a set. +# +# Transformers offer the perfect architecture for this as the Multi-Head Attention is permutation-equivariant, and thus, +# outputs the same values no matter in what order we enter the inputs (inputs and outputs are permuted equally). +# The task we are looking at for sets is _Set Anomaly Detection_ which means that we try to find the element(s) +# in a set that does not fit the others. +# In the research community, the common application of anomaly detection is performed on a set of images, +# where $N-1$ images belong to the same category/have the same high-level features while one belongs to another category. +# Note that category does not necessarily have to relate to a class in a standard classification problem, +# but could be the combination of multiple features. +# For instance, on a face dataset, this could be people with glasses, male, beard, etc. +# An example of distinguishing different animals can be seen below. +# The first four images show foxes, while the last represents a different animal. +# We want to recognize that the last image shows a different animal, but it is not relevant which class of animal it is. +# +#
#
# In this tutorial, we will use the CIFAR100 dataset.
# CIFAR100 has 600 images for 100 classes each with a resolution of 32x32, similar to CIFAR10.
# The larger amount of classes requires the model to attend to specific features in the images instead
# of coarse features as in CIFAR10, therefore making the task harder.
# We will show the model a set of 9 images of one class, and 1 image from another class.
# The task is to find the image that is from a different class than the other images.
# Using the raw images directly as input to the Transformer is not a good idea, because it is not translation
# invariant as a CNN, and would need to learn to detect image features from high-dimensional input first of all.
# Instead, we will use a pre-trained ResNet34 model from the torchvision package to obtain high-level,
# low-dimensional features of the images.
# The ResNet model has been pre-trained on the [ImageNet](http://image-net.org/) dataset which contains
# 1 million images of 1k classes and varying resolutions.
# However, during training and testing, the images are usually scaled to a resolution of 224x224,
# and hence we rescale our CIFAR images to this resolution as well.
# Below, we will load the dataset, and prepare the data for being processed by the ResNet model.

# %%
# ImageNet statistics (one value per color channel)
DATA_MEANS = np.array([0.485, 0.456, 0.406])
DATA_STD = np.array([0.229, 0.224, 0.225])
# As torch tensors for later preprocessing; the [1, 3, 1, 1] view lets them broadcast against a
# batch of channel-first images when the normalization is undone for plotting
TORCH_DATA_MEANS = torch.from_numpy(DATA_MEANS).view(1, 3, 1, 1)
TORCH_DATA_STD = torch.from_numpy(DATA_STD).view(1, 3, 1, 1)

# Resize to 224x224, and normalize to ImageNet statistics
transform = transforms.Compose(
    [transforms.Resize((224, 224)), transforms.ToTensor(), transforms.Normalize(DATA_MEANS, DATA_STD)]
)
# Loading the training dataset.
train_set = CIFAR100(root=DATASET_PATH, train=True, transform=transform, download=True)

# Loading the test set
test_set = CIFAR100(root=DATASET_PATH, train=False, transform=transform, download=True)

# %% [markdown]
# Next, we want to run the pre-trained ResNet model on the images, and extract the features before the classification layer.
# These are the most high-level features, and should sufficiently describe the images.
# CIFAR100 has some similarity to ImageNet, and thus we are not retraining the ResNet model in any form.
# However, if you would want to get the best performance and have a very large dataset,
# it would be better to add the ResNet to the computation graph during training and finetune its parameters as well.
# As we don't have a large enough dataset and want to train our model efficiently, we will extract the features beforehand.
# Let's load and prepare the model below.

# %%
# TORCH_HOME is set before the model is created so the weights are stored under CHECKPOINT_PATH
os.environ["TORCH_HOME"] = CHECKPOINT_PATH
# NOTE(review): newer torchvision releases replace `pretrained=True` with a `weights=` argument;
# confirm against the torchvision version this notebook is pinned to before changing it.
pretrained_model = torchvision.models.resnet34(pretrained=True)
# Remove classification layer
# In some models, it is called "fc", others have "classifier"
# Setting both to an empty sequential represents an identity map of the final features.
pretrained_model.fc = nn.Sequential()
pretrained_model.classifier = nn.Sequential()
# To GPU
pretrained_model = pretrained_model.to(device)

# Only eval, no gradient required
pretrained_model.eval()
for p in pretrained_model.parameters():
    p.requires_grad = False

# %% [markdown]
# We will now write an extraction function for the features below.
# This cell requires access to a GPU, as the model is rather deep and the images relatively large.
# The GPUs on GoogleColab are sufficient, but running this cell can take 2-3 minutes.
# Once it is run, the features are exported on disk so they don't have to be recalculated every time you run the notebook.
# However, this requires >150MB free disk space.
# So it is recommended to run this only on a local computer if you have enough free disk and a GPU (GoogleColab is fine for this).
# If you do not have a GPU, you can download the features from the
# [GoogleDrive folder](https://drive.google.com/drive/folders/1DF7POc6j03pRiWQPWSl5QJX5iY-xK0sV?usp=sharing).


# %%
@torch.no_grad()
def extract_features(dataset, save_file):
    """Return the pre-trained model's outputs for every image in ``dataset``, cached in ``save_file``.

    Args:
        dataset: Dataset yielding ``(image, label)`` pairs; the labels are ignored.
        save_file: Path of the feature cache. If the file already exists, it is loaded and nothing
            is recomputed.

    Returns:
        The per-batch model outputs concatenated along dim 0, in dataset order.
    """
    # Fast path: the features were already exported by an earlier run
    if os.path.isfile(save_file):
        return torch.load(save_file)

    # shuffle=False / drop_last=False keep a one-to-one, in-order mapping between images and feature rows
    loader = data.DataLoader(dataset, batch_size=128, shuffle=False, drop_last=False, num_workers=4)
    batch_feats = [pretrained_model(imgs.to(device)) for imgs, _ in tqdm(loader)]
    features = torch.cat(batch_feats, dim=0).detach().cpu()
    torch.save(features, save_file)
    return features


train_feat_file = os.path.join(CHECKPOINT_PATH, "train_set_features.tar")
train_set_feats = extract_features(train_set, train_feat_file)

test_feat_file = os.path.join(CHECKPOINT_PATH, "test_set_features.tar")
test_feats = extract_features(test_set, test_feat_file)

# %% [markdown]
# Let's verify the feature shapes below.
# The training should have 50k elements, and the test 10k images.
# The feature dimension is 512 for the ResNet34.
# If you experiment with other models, you likely see a different feature dimension.

# %%
print("Train:", train_set_feats.shape)
print("Test: ", test_feats.shape)

# %% [markdown]
# As usual, we want to create a validation set to detect when we should stop training.
# In this case, we will split the training set into 90% training, 10% validation.
# However, the difficulty is here that we need to ensure that the validation set has the same number of images for all 100 labels.
# Otherwise, we have a class imbalance which is not good for creating the image sets.
# Hence, we take 10% of the images for each class, and move them into the validation set.
# The code below does exactly this.

# %%
# Split train into train+val
# Get labels from train set
labels = train_set.targets

# Get indices of images per class
# (the reshape below only works if every class has the same number of images)
labels = torch.LongTensor(labels)
num_labels = labels.max() + 1
sorted_indices = torch.argsort(labels).reshape(num_labels, -1)  # [classes, num_imgs per class]

# Determine number of validation images per class
num_val_exmps = sorted_indices.shape[1] // 10

# Get image indices for validation and training
val_indices = sorted_indices[:, :num_val_exmps].reshape(-1)
train_indices = sorted_indices[:, num_val_exmps:].reshape(-1)

# Group corresponding image features and labels
train_feats, train_labels = train_set_feats[train_indices], labels[train_indices]
val_feats, val_labels = train_set_feats[val_indices], labels[val_indices]

# %% [markdown]
# Now we can prepare a dataset class for the set anomaly task.
# We define an epoch to be the sequence in which each image has been exactly once as an "anomaly".
# Hence, the length of the dataset is the number of images in it.
# For the training set, each time we access an item with `__getitem__`, we sample a random,
# different class than the image at the corresponding index `idx` has.
# In a second step, we sample $N-1$ images of this sampled class.
# The set of 10 images is finally returned.
# The randomness in the `__getitem__` allows us to see a slightly different set during each iteration.
# However, we can't use the same strategy for the test set as we want the test dataset to be the same every time we iterate over it.
# Hence, we sample the sets in the `__init__` method, and return those in `__getitem__`.
# The code below implements exactly this dynamic.


# %%
class SetAnomalyDataset(data.Dataset):
    """Dataset of image-feature sets in which the last element is the anomaly."""

    def __init__(self, img_feats, labels, set_size=10, train=True):
        """
        Args:
            img_feats: Tensor of shape [num_imgs, img_dim] holding the high-level image features.
            labels: Tensor of shape [num_imgs] with the class label of every image.
            set_size: Total number of elements in a set: set_size-1 images of one class plus one
                image of another class.
            train: If True, a new set is sampled on every __getitem__ call. Otherwise the sets are
                generated once here and reused.
        """
        super().__init__()
        self.train = train
        self.img_feats = img_feats
        self.labels = labels
        # Stored as the number of non-anomalous images, i.e. one less than the requested set size
        self.set_size = set_size - 1

        # Row c of img_idx_by_label lists the indices of all images with label c
        self.num_labels = labels.max() + 1
        self.img_idx_by_label = torch.argsort(self.labels).reshape(self.num_labels, -1)

        if not self.train:
            self.test_sets = self._create_test_sets()

    def _create_test_sets(self):
        """Pre-generate one fixed image set per dataset element."""
        # Re-seeding numpy's global RNG makes the generated sets repeatable between runs
        np.random.seed(42)
        sets_per_image = [self.sample_img_set(self.labels[i]) for i in range(self.img_feats.shape[0])]
        return torch.stack(sets_per_image, dim=0)

    def sample_img_set(self, anomaly_label):
        """Sample the indices of ``self.set_size`` images that share one class.

        The sampled images come from a different class than anomaly_label.
        """
        # Draw among num_labels-1 candidates and shift every draw at or above anomaly_label up by one,
        # which skips anomaly_label itself
        set_label = np.random.randint(self.num_labels - 1)
        if set_label >= anomaly_label:
            set_label += 1

        # Choose distinct columns of the per-class index table, then look up the image indices
        columns = np.random.choice(self.img_idx_by_label.shape[1], size=self.set_size, replace=False)
        return self.img_idx_by_label[set_label, columns]

    def __len__(self):
        return len(self.img_feats)

    def __getitem__(self, idx):
        # Training: sample a new set on the fly. Evaluation: reuse the pre-generated one.
        img_indices = self.sample_img_set(self.labels[idx]) if self.train else self.test_sets[idx]

        # The anomaly is appended last for simplicity, so its position is always the final one
        anomaly = self.img_feats[idx]
        img_set = torch.cat([self.img_feats[img_indices], anomaly[None]], dim=0)
        indices = torch.cat([img_indices, torch.LongTensor([idx])], dim=0)
        label = img_set.shape[0] - 1

        # The image indices are returned for visualization; "label" is the position of the anomaly
        return img_set, indices, label


# %% [markdown]
# Next, we can setup our datasets and data loaders below.
# Here, we will use a set size of 10, i.e. 9 images from one category + 1 anomaly.
# Feel free to change it if you want to experiment with the sizes.

# %%
SET_SIZE = 10
test_labels = torch.LongTensor(test_set.targets)

train_anom_dataset = SetAnomalyDataset(train_feats, train_labels, set_size=SET_SIZE, train=True)
val_anom_dataset = SetAnomalyDataset(val_feats, val_labels, set_size=SET_SIZE, train=False)
test_anom_dataset = SetAnomalyDataset(test_feats, test_labels, set_size=SET_SIZE, train=False)

train_anom_loader = data.DataLoader(
    train_anom_dataset, batch_size=64, shuffle=True, drop_last=True, num_workers=4, pin_memory=True
)
val_anom_loader = data.DataLoader(val_anom_dataset, batch_size=64, shuffle=False, drop_last=False, num_workers=4)
test_anom_loader = data.DataLoader(test_anom_dataset, batch_size=64, shuffle=False, drop_last=False, num_workers=4)

# %% [markdown]
# To understand the dataset a little better, we can plot below a few sets from the test dataset.
# Each row shows a different input set, where the first 9 are from the same class.


# %%
def visualize_exmp(indices, orig_dataset):
    """Plot the images referenced by ``indices`` as a grid with SET_SIZE images per row.

    Args:
        indices: Tensor of image indices into ``orig_dataset``; it is flattened before the lookup.
        orig_dataset: Dataset whose items are ``(image, label)`` pairs; only the image is used.
    """
    flat_indices = indices.reshape(-1)
    images = torch.stack([orig_dataset[i][0] for i in flat_indices], dim=0)
    # Undo the ImageNet normalization before plotting
    images = images * TORCH_DATA_STD + TORCH_DATA_MEANS

    grid = torchvision.utils.make_grid(images, nrow=SET_SIZE, normalize=True, pad_value=0.5, padding=16)
    grid = grid.permute(1, 2, 0)  # move the channel dimension last for imshow

    plt.figure(figsize=(12, 8))
    plt.title("Anomaly examples on CIFAR100")
    plt.imshow(grid)
    plt.axis("off")
    plt.show()
    plt.close()


_, indices, _ = next(iter(test_anom_loader))
visualize_exmp(indices[:4], test_set)

# %% [markdown]
# We can already see that for some sets the task might be easier than for others.
# Difficulties can especially arise if the anomaly is in a different, but yet visually similar class
# (e.g. train vs bus, flour vs worm, etc.).
#
# After having prepared the data, we can look closer at the model.
# Here, we have a classification of the whole set.
# For the prediction to be permutation-equivariant, we will output one logit for each image.
# Over these logits, we apply a softmax and train the anomaly image to have the highest score/probability.
# This is a bit different than a standard classification layer as the softmax is applied over images,
# not over output classes in the classical sense.
# However, if we swap two images in their position, we effectively swap their position in the output softmax.
# Hence, the prediction is equivariant with respect to the input.
# We implement this idea below in the subclass of the Transformer Lightning module.


# %%
class AnomalyPredictor(TransformerPredictor):
    """Transformer that outputs one logit per set element; the anomaly should get the highest one."""

    def _calculate_loss(self, batch, mode="train"):
        """Compute and log the cross-entropy loss and accuracy over the set dimension.

        Args:
            batch: Tuple ``(img_sets, indices, labels)``; the indices are not used here.
            mode: Prefix of the logged metric names, e.g. "train", "val" or "test".

        Returns:
            Tuple ``(loss, acc)``.
        """
        img_sets, _, labels = batch
        # No positional encodings as it is a set, not a sequence!
        logits = self.forward(img_sets, add_positional_encoding=False).squeeze(dim=-1)  # [Batch_size, set_size]
        loss = F.cross_entropy(logits, labels)  # Softmax/CE over set dimension
        predicted_position = logits.argmax(dim=-1)
        acc = (predicted_position == labels).float().mean()
        self.log("%s_loss" % mode, loss)
        self.log("%s_acc" % mode, acc, on_step=False, on_epoch=True)
        return loss, acc

    def training_step(self, batch, batch_idx):
        # Only the loss is returned for optimization
        return self._calculate_loss(batch, mode="train")[0]

    def validation_step(self, batch, batch_idx):
        self._calculate_loss(batch, mode="val")

    def test_step(self, batch, batch_idx):
        self._calculate_loss(batch, mode="test")


# %% [markdown]
# Finally, we write our train function below.
# It has the exact same structure as the reverse task one, hence not much of an explanation is needed here.


# %%
def train_anomaly(**kwargs):
    """Train an AnomalyPredictor, or load a saved checkpoint, and evaluate it on all three loaders.

    Args:
        **kwargs: Forwarded to the AnomalyPredictor constructor when no saved checkpoint is found.

    Returns:
        Tuple ``(model, result)`` where ``result`` maps "test_acc", "val_acc" and "train_acc" to the
        accuracies measured on the test, validation and training loaders.
    """
    root_dir = os.path.join(CHECKPOINT_PATH, "SetAnomalyTask")
    os.makedirs(root_dir, exist_ok=True)
    # Keep only the weights of the checkpoint with the highest validation accuracy
    best_val_checkpoint = ModelCheckpoint(save_weights_only=True, mode="max", monitor="val_acc")
    trainer = L.Trainer(
        default_root_dir=root_dir,
        callbacks=[best_val_checkpoint],
        accelerator="auto",
        devices=1,
        max_epochs=100,
        gradient_clip_val=2,
    )
    trainer.logger._default_hp_metric = None  # Optional logging argument that we don't need

    # Check whether pretrained model exists. If yes, load it and skip training
    pretrained_filename = os.path.join(CHECKPOINT_PATH, "SetAnomalyTask.ckpt")
    if os.path.isfile(pretrained_filename):
        print("Found pretrained model, loading...")
        checkpoint_to_load = pretrained_filename
    else:
        fresh_model = AnomalyPredictor(max_iters=trainer.max_epochs * len(train_anom_loader), **kwargs)
        trainer.fit(fresh_model, train_anom_loader, val_anom_loader)
        checkpoint_to_load = trainer.checkpoint_callback.best_model_path
    model = AnomalyPredictor.load_from_checkpoint(checkpoint_to_load)

    def accuracy_on(loader):
        # trainer.test runs test_step, so every loader reports its accuracy under the "test_acc" key
        return trainer.test(model, dataloaders=loader, verbose=False)[0]["test_acc"]

    # Evaluate the loaded model on the training, validation and test loaders (in that order)
    train_acc = accuracy_on(train_anom_loader)
    val_acc = accuracy_on(val_anom_loader)
    test_acc = accuracy_on(test_anom_loader)
    result = {"test_acc": test_acc, "val_acc": val_acc, "train_acc": train_acc}

    return model.to(device), result


# %% [markdown]
# Let's finally train our model.
# We will use 4 layers with 4 attention heads each.
# The hidden dimensionality of the model is 256, and we use a dropout of 0.1 throughout the model for good regularization.
# Note that we also apply the dropout on the input features, as this makes the model more robust against
# image noise and generalizes better.
# Again, we use warmup to slowly start our model training.

# %%
anomaly_model, anomaly_result = train_anomaly(
    input_dim=train_anom_dataset.img_feats.shape[-1],
    model_dim=256,
    num_heads=4,
    num_classes=1,
    num_layers=4,
    dropout=0.1,
    input_dropout=0.1,
    lr=5e-4,
    warmup=100,
)

# %% [markdown]
# We can print the achieved accuracy below.

# %%
print("Train accuracy: %4.2f%%" % (100.0 * anomaly_result["train_acc"]))
print("Val accuracy: %4.2f%%" % (100.0 * anomaly_result["val_acc"]))
print("Test accuracy: %4.2f%%" % (100.0 * anomaly_result["test_acc"]))

# %% [markdown]
# With ~94% validation and test accuracy, the model generalizes quite well.
# It should be noted that you might see slightly different scores depending on what computer/device you are running this notebook.
# This is because despite setting the seed before generating the test dataset, it is not the same across platforms and numpy versions.
# Nevertheless, we can conclude that the model performs quite well and can solve the task for most sets.
# Before trying to interpret the model, let's verify that our model is permutation-equivariant,
# and assigns the same predictions for different permutations of the input set.
# For this, we sample a batch from the test set and run it through the model to obtain the probabilities.

# %%
# These names (inp_data, indices, labels, preds) are reused by the visualization cells further down
inp_data, indices, labels = next(iter(test_anom_loader))
inp_data = inp_data.to(device)

anomaly_model.eval()

with torch.no_grad():
    preds = anomaly_model.forward(inp_data, add_positional_encoding=False)
    preds = F.softmax(preds.squeeze(dim=-1), dim=-1)

    # Permute the input data along the set dimension (dim 1)
    permut = np.random.permutation(inp_data.shape[1])
    perm_inp_data = inp_data[:, permut]
    perm_preds = anomaly_model.forward(perm_inp_data, add_positional_encoding=False)
    perm_preds = F.softmax(perm_preds.squeeze(dim=-1), dim=-1)

# Equivariance: permuting the original predictions the same way must reproduce the permuted predictions
assert (preds[:, permut] - perm_preds).abs().max() < 1e-5, "Predictions are not permutation equivariant"

print("Preds\n", preds[0, permut].cpu().numpy())
print("Permuted preds\n", perm_preds[0].cpu().numpy())

# %% [markdown]
# You can see that the predictions are almost exactly the same, and only differ because of slight numerical
# differences inside the network operation.
#
# To interpret the model a little more, we can plot the attention maps inside the model.
# This will give us an idea of what information the model is sharing/communicating between images,
# and what each head might represent.
# First, we need to extract the attention maps for the test batch above, and determine the discrete predictions for simplicity.

# %%
attention_maps = anomaly_model.get_attention_maps(inp_data, add_positional_encoding=False)
predictions = preds.argmax(dim=-1)

# %% [markdown]
# Below we write a plot function which plots the images in the input set, the prediction of the model,
# and the attention maps of the different heads on layers of the transformer.
# Feel free to explore the attention maps for different input examples as well.


# %%
def visualize_prediction(idx):
    """Show the image set at position ``idx`` of the test batch, print the prediction, and plot its attention maps."""
    # Slice instead of index so the leading dimension is kept
    single_set_indices = indices[idx : idx + 1]
    visualize_exmp(single_set_indices, test_set)

    predicted_position = predictions[idx].item()
    print("Prediction:", predicted_position)

    # input_data=None labels the attention axes with the positions inside the set
    plot_attention_maps(input_data=None, attn_maps=attention_maps, idx=idx)


visualize_prediction(0)

# %% [markdown]
# Depending on the random seed, you might see a slightly different input set.
# For the version on the website, we compare 9 tree images with a volcano.
# We see that multiple heads, for instance, Layer 2 Head 1, Layer 2 Head 3, and Layer 3 Head 1 focus on the last image.
# Additionally, the heads in Layer 4 all seem to ignore the last image and assign a very low attention probability to it.
# This shows that the model has indeed recognized that the image doesn't fit the setting, and hence predicted it to be the anomaly.
# Layer 3 Head 2-4 seems to take a slightly weighted average of all images.
# That might indicate that the model extracts the "average" information of all images, to compare it to the image features itself.
#
# Let's try to find where the model actually makes a mistake.
# We can do this by identifying the sets where the model predicts something else than 9, as in the dataset,
# we ensured that the anomaly is always at the last position in the set.

# %%
# The anomaly is always the last element of a set, so any other predicted position is a mistake.
# Deriving the position from SET_SIZE (9 for the default set size of 10) keeps this cell correct
# when the set size is changed above.
anomaly_position = SET_SIZE - 1
mistakes = torch.where(predictions != anomaly_position)[0].cpu().numpy()
print("Indices with mistake:", mistakes)

# %% [markdown]
# As our model achieves ~94% accuracy, we only have a very small number of mistakes in a batch of 64 sets.
# Still, let's visualize one of them, for example the last one:

# %%
if len(mistakes) > 0:
    last_mistake = mistakes[-1]
    visualize_prediction(last_mistake)
    print("Probabilities:")
    for i, p in enumerate(preds[last_mistake].cpu().numpy()):
        print("Image %i: %4.2f%%" % (i, 100.0 * p))
else:
    # A batch without a single mistake is possible; indexing mistakes[-1] would then raise an IndexError
    print("No mistakes in this batch.")

# %% [markdown]
# In this example, the model confuses a palm tree with a building, giving a probability of ~90% to image 2, and 8% to the actual anomaly.
# However, the difficulty here is that the picture of the building has been taken at a similar angle as the palms.
# Meanwhile, image 2 shows a rather unusual palm with a different color palette, which is why the model fails here.
# Nevertheless, in general, the model performs quite well.

# %% [markdown]
# ## Conclusion
#
# In this tutorial, we took a closer look at the Multi-Head Attention layer which uses a scaled dot product between
# queries and keys to find correlations and similarities between input elements.
# The Transformer architecture is based on the Multi-Head Attention layer and applies multiple of them in a ResNet-like block.
# The Transformer is a very important, recent architecture that can be applied to many tasks and datasets.
# Although it is best known for its success in NLP, there is so much more to it.
# We have seen its application on sequence-to-sequence tasks and set anomaly detection.
# Its property of being permutation-equivariant if we do not provide any positional encodings, allows it to generalize to many settings.
# Hence, it is important to know the architecture, but also its possible issues such as the gradient problem during
# the first iterations solved by learning rate warm-up.
+# If you are interested in continuing with the study of the Transformer architecture, +# please have a look at the blog posts listed at the beginning of the tutorial notebook. diff --git a/_notebooks/course_UvA-DL/05-transformers-and-MH-attention/attention_example.svg b/_notebooks/course_UvA-DL/05-transformers-and-MH-attention/attention_example.svg new file mode 100644 index 0000000..bd290ad --- /dev/null +++ b/_notebooks/course_UvA-DL/05-transformers-and-MH-attention/attention_example.svg @@ -0,0 +1 @@ + diff --git a/_notebooks/course_UvA-DL/05-transformers-and-MH-attention/cifar100_example_anomaly.png b/_notebooks/course_UvA-DL/05-transformers-and-MH-attention/cifar100_example_anomaly.png new file mode 100644 index 0000000..7e06e5a Binary files /dev/null and b/_notebooks/course_UvA-DL/05-transformers-and-MH-attention/cifar100_example_anomaly.png differ diff --git a/_notebooks/course_UvA-DL/05-transformers-and-MH-attention/comparison_conv_rnn.svg b/_notebooks/course_UvA-DL/05-transformers-and-MH-attention/comparison_conv_rnn.svg new file mode 100644 index 0000000..7af315f --- /dev/null +++ b/_notebooks/course_UvA-DL/05-transformers-and-MH-attention/comparison_conv_rnn.svg @@ -0,0 +1,1803 @@ + + + + + + image/svg+xmldiff --git a/_notebooks/course_UvA-DL/05-transformers-and-MH-attention/multihead_attention.svg b/_notebooks/course_UvA-DL/05-transformers-and-MH-attention/multihead_attention.svg new file mode 100644 index 0000000..1019553 --- /dev/null +++ b/_notebooks/course_UvA-DL/05-transformers-and-MH-attention/multihead_attention.svg @@ -0,0 +1,282 @@ + + + + + + image/svg+xml + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/_notebooks/course_UvA-DL/05-transformers-and-MH-attention/scaled_dot_product_attn.svg b/_notebooks/course_UvA-DL/05-transformers-and-MH-attention/scaled_dot_product_attn.svg new file mode 100644 index 
0000000..7ca74ea --- /dev/null +++ b/_notebooks/course_UvA-DL/05-transformers-and-MH-attention/scaled_dot_product_attn.svg @@ -0,0 +1,346 @@ + + + + + + image/svg+xml + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/_notebooks/course_UvA-DL/05-transformers-and-MH-attention/transformer_architecture.svg b/_notebooks/course_UvA-DL/05-transformers-and-MH-attention/transformer_architecture.svg new file mode 100644 index 0000000..5b6b0f4 --- /dev/null +++ b/_notebooks/course_UvA-DL/05-transformers-and-MH-attention/transformer_architecture.svg @@ -0,0 +1,112 @@ + + + + + + + image/svg+xml + + + + + + + + + + + + + + + Encoder + Decoder + + diff --git a/_notebooks/course_UvA-DL/05-transformers-and-MH-attention/warmup_loss_plot.svg b/_notebooks/course_UvA-DL/05-transformers-and-MH-attention/warmup_loss_plot.svg new file mode 100644 index 0000000..e38f81c --- /dev/null +++ b/_notebooks/course_UvA-DL/05-transformers-and-MH-attention/warmup_loss_plot.svg @@ -0,0 +1,1573 @@ + + + + + + image/svg+xmldiff --git a/_notebooks/course_UvA-DL/06-graph-neural-networks/.meta.yml b/_notebooks/course_UvA-DL/06-graph-neural-networks/.meta.yml new file mode 100644 index 0000000..cfd63af --- /dev/null +++ b/_notebooks/course_UvA-DL/06-graph-neural-networks/.meta.yml @@ -0,0 +1,31 @@ +title: "Tutorial 6: Basics of Graph Neural Networks" +author: Phillip Lippe +created: 2021-06-07 +updated: 2023-03-14 +license: CC BY-SA +build: 0 +tags: + - Graph +description: | + In this tutorial, we will discuss the application of neural networks on graphs. + Graph Neural Networks (GNNs) have recently gained increasing popularity in both applications and research, + including domains such as social networks, knowledge graphs, recommender systems, and bioinformatics. 
+ While the theory and math behind GNNs might first seem complicated, + the implementation of those models is quite simple and helps in understanding the methodology. + Therefore, we will discuss the implementation of basic network layers of a GNN, + namely graph convolutions, and attention layers. + Finally, we will apply a GNN on semi-supervised node classification and molecule categorization. + This notebook is part of a lecture series on Deep Learning at the University of Amsterdam. + The full list of tutorials can be found at https://uvadlc-notebooks.rtfd.io. +requirements: + - torch-scatter + - torch-sparse + - torch-cluster + - torch-spline-conv + - torch-geometric + - lightning>=2.0.0rc0 +pip__find-link: + # - https://pytorch-geometric.com/whl/torch-1.8.0+cu101.html + - https://pytorch-geometric.com/whl/torch-%(TORCH_MAJOR_DOT_MINOR)s.0+%(DEVICE)s.html +accelerator: + - GPU diff --git a/docs/_static/images/course_UvA-DL/06-graph-neural-networks.jpg b/_notebooks/course_UvA-DL/06-graph-neural-networks/.thumb.jpg similarity index 100% rename from docs/_static/images/course_UvA-DL/06-graph-neural-networks.jpg rename to _notebooks/course_UvA-DL/06-graph-neural-networks/.thumb.jpg diff --git a/_notebooks/course_UvA-DL/06-graph-neural-networks/GNN_overview.py b/_notebooks/course_UvA-DL/06-graph-neural-networks/GNN_overview.py new file mode 100644 index 0000000..443f442 --- /dev/null +++ b/_notebooks/course_UvA-DL/06-graph-neural-networks/GNN_overview.py @@ -0,0 +1,993 @@ +# %% [markdown] +#
# We start by importing our standard libraries below.

# %%
# Standard libraries
import os

# For downloading pre-trained models
import urllib.request
from urllib.error import HTTPError

# PyTorch Lightning
import lightning as L

# PyTorch
import torch
import torch.nn as nn
import torch.nn.functional as F
import torch.optim as optim

# PyTorch geometric
import torch_geometric
import torch_geometric.data as geom_data
import torch_geometric.nn as geom_nn

# PL callbacks
from lightning.pytorch.callbacks import ModelCheckpoint
from torch import Tensor

# 1 if at least one CUDA device is visible, otherwise 0; a larger batch is used when a GPU is available
AVAIL_GPUS = min(1, torch.cuda.device_count())
BATCH_SIZE = 256 if AVAIL_GPUS else 64
# Path to the folder where the datasets are/should be downloaded
DATASET_PATH = os.environ.get("PATH_DATASETS", "data/")
# Path to the folder where the pretrained models are saved
CHECKPOINT_PATH = os.environ.get("PATH_CHECKPOINT", "saved_models/GNNs/")

# Setting the seed
L.seed_everything(42)

# Ensure that all operations are deterministic on GPU (if used) for reproducibility
torch.backends.cudnn.deterministic = True
torch.backends.cudnn.benchmark = False

# %% [markdown]
# We also have a few pre-trained models we download below.

# %%
# Github URL where saved models are stored for this tutorial
base_url = "https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial7/"
# Files to download
pretrained_files = ["NodeLevelMLP.ckpt", "NodeLevelGNN.ckpt", "GraphLevelGraphConv.ckpt"]

# Create checkpoint path if it doesn't exist yet
os.makedirs(CHECKPOINT_PATH, exist_ok=True)

# Download every checkpoint that is not on disk yet; files that already exist are left untouched.
for file_name in pretrained_files:
    file_path = os.path.join(CHECKPOINT_PATH, file_name)
    # File names containing a sub-folder need that folder to exist before the download
    if "/" in file_name:
        os.makedirs(file_path.rsplit("/", 1)[0], exist_ok=True)
    if os.path.isfile(file_path):
        continue
    file_url = base_url + file_name
    print("Downloading %s..." % file_url)
    try:
        urllib.request.urlretrieve(file_url, file_path)
    except HTTPError as e:
        # Best effort: report the problem and carry on with the remaining files
        print(
            "Something went wrong. Please try to download the file from the GDrive folder,"
            " or contact the author with the full output including the following error:\n",
            e,
        )

# %% [markdown]
# ## Graph Neural Networks

# %% [markdown]
# ### Graph representation
#
# Before starting the discussion of specific neural network operations on graphs, we should consider how to represent a graph.
# Mathematically, a graph $\mathcal{G}$ is defined as a tuple of a set of nodes/vertices $V$, and a set of edges/links $E$: $\mathcal{G}=(V,E)$.
# Each edge is a pair of two vertices, and represents a connection between them.
# For instance, let's look at the following graph:
#
#
#
# The vertices are $V=\{1,2,3,4\}$, and edges $E=\{(1,2), (2,3), (2,4), (3,4)\}$.
# Note that for simplicity, we assume the graph to be undirected and hence don't add mirrored pairs like $(2,1)$.
# In applications, vertices and edges can often have specific attributes, and edges can even be directed.
# The question is how we could represent this diversity in an efficient way for matrix operations.
# Usually, for the edges, we decide between two variants: an adjacency matrix, or a list of paired vertex indices.
#
# The **adjacency matrix** $A$ is a square matrix whose elements indicate whether pairs of vertices are adjacent,
# i.e. connected, or not.
# In the simplest case, $A_{ij}$ is 1 if there is a connection from node $i$ to $j$, and otherwise 0.
# If we have edge attributes or different categories of edges in a graph, this information can be added to the matrix as well.
# For an undirected graph, keep in mind that $A$ is a symmetric matrix ($A_{ij}=A_{ji}$).
# For the example graph above, we have the following adjacency matrix:
#
# $$
# A = \begin{bmatrix}
# 0 & 1 & 0 & 0\\
# 1 & 0 & 1 & 1\\
# 0 & 1 & 0 & 1\\
# 0 & 1 & 1 & 0
# \end{bmatrix}
# $$
#
# While expressing a graph as a list of edges is more efficient in terms of memory and (possibly) computation,
# using an adjacency matrix is more intuitive and simpler to implement.
# In our implementations below, we will rely on the adjacency matrix to keep the code simple.
# However, common libraries use edge lists, which we will discuss in more detail later.
# Alternatively, we could also use the list of edges to define a sparse adjacency matrix with which we can work
# as if it was a dense matrix, but which allows more memory-efficient operations.
# PyTorch supports this with the sub-package `torch.sparse`
# ([documentation](https://pytorch.org/docs/stable/sparse.html)) which is however still in a beta-stage
# (API might change in future).
+ +# %% [markdown] +# ### Graph Convolutions +# +# Graph Convolutional Networks have been introduced by [Kipf et al. ](https://openreview.net/pdf?id=SJU4ayYgl) +# in 2016 at the University of Amsterdam. +# He also wrote a great [blog post](https://tkipf.github.io/graph-convolutional-networks/) about this topic, +# which is recommended if you want to read about GCNs from a different perspective. +# GCNs are similar to convolutions in images in the sense that the "filter" parameters are typically shared over all locations in the graph. +# At the same time, GCNs rely on message passing methods, which means that vertices exchange information with the neighbors, +# and send "messages" to each other. +# Before looking at the math, we can try to visually understand how GCNs work. +# The first step is that each node creates a feature vector that represents the message it wants to send to all its neighbors. +# In the second step, the messages are sent to the neighbors, so that a node receives one message per adjacent node. +# Below we have visualized the two steps for our example graph. +# +#
#
# If we want to formulate that in more mathematical terms, we need to first decide how to combine
# all the messages a node receives.
# As the number of messages varies across nodes, we need an operation that works for any number.
# Hence, the usual way to go is to sum or take the mean.
# Given the previous features of nodes $H^{(l)}$, the GCN layer is defined as follows:
#
# $$H^{(l+1)} = \sigma\left(\hat{D}^{-1/2}\hat{A}\hat{D}^{-1/2}H^{(l)}W^{(l)}\right)$$
#
# $W^{(l)}$ are the weight parameters with which we transform the input features into messages ($H^{(l)}W^{(l)}$).
# To the adjacency matrix $A$ we add the identity matrix so that each node sends its own message also to itself:
# $\hat{A}=A+I$.
# Finally, to take the average instead of summing, we calculate the matrix $\hat{D}$ which is a diagonal
# matrix with $\hat{D}_{ii}$ denoting the number of neighbors node $i$ has.
# $\sigma$ represents an arbitrary activation function, and not necessarily the sigmoid (usually a ReLU-based
# activation function is used in GNNs).
#
# When implementing the GCN layer in PyTorch, we can take advantage of the flexible operations on tensors.
# Instead of defining a matrix $\hat{D}$, we can simply divide the summed messages by the number of neighbors afterward.
# Additionally, we replace the weight matrix with a linear layer, which additionally allows us to add a bias.
# Written as a PyTorch module, the GCN layer is defined as follows:


# %%
class GCNLayer(nn.Module):
    """Graph convolution layer: project node features, then average them over each node's neighbourhood."""

    def __init__(self, c_in, c_out):
        """
        Args:
            c_in: Dimensionality of the input node features
            c_out: Dimensionality of the output node features (messages)
        """
        super().__init__()
        self.projection = nn.Linear(c_in, c_out)

    def forward(self, node_feats, adj_matrix):
        """
        Args:
            node_feats: Tensor with node features of shape [batch_size, num_nodes, c_in]
            adj_matrix: Batch of adjacency matrices of the graph. Node i aggregates the message of
                        every node j for which adj_matrix[b,i,j] is non-zero (1 for a plain edge).
                        Supports directed edges by non-symmetric matrices.
                        Assumes to already have added the identity connections.
                        Shape: [batch_size, num_nodes, num_nodes]

        Returns:
            Tensor of shape [batch_size, num_nodes, c_out] holding, for every node, the sum of its
            neighbours' messages divided by the corresponding row sum of ``adj_matrix``.
        """
        # Row sum = number of messages node i receives (for a 0/1 adjacency matrix)
        num_neighbours = adj_matrix.sum(dim=-1, keepdim=True)
        # A node without any connection (all-zero row) would otherwise cause 0/0 = NaN.
        # Its summed message is zero anyway, so dividing by 1 simply yields a zero vector.
        num_neighbours = num_neighbours.masked_fill(num_neighbours == 0, 1)
        node_feats = self.projection(node_feats)
        node_feats = torch.bmm(adj_matrix, node_feats)
        return node_feats / num_neighbours


# %% [markdown]
# To further understand the GCN layer, we can apply it to our example graph above.
# First, let's specify some node features and the adjacency matrix with added self-connections:

# %%
node_feats = torch.arange(8, dtype=torch.float32).view(1, 4, 2)
adj_matrix = Tensor([[[1, 1, 0, 0], [1, 1, 1, 1], [0, 1, 1, 1], [0, 1, 1, 1]]])

print("Node features:\n", node_feats)
print("\nAdjacency matrix:\n", adj_matrix)

# %% [markdown]
# Next, let's apply a GCN layer to it.
# For simplicity, we initialize the linear weight matrix as an identity matrix so that the input features are equal to the messages.
# This makes it easier for us to verify the message passing operation.

# %%
layer = GCNLayer(c_in=2, c_out=2)
layer.projection.weight.data = Tensor([[1.0, 0.0], [0.0, 1.0]])
layer.projection.bias.data = Tensor([0.0, 0.0])

with torch.no_grad():
    out_feats = layer(node_feats, adj_matrix)

print("Adjacency matrix", adj_matrix)
print("Input features", node_feats)
print("Output features", out_feats)

# %% [markdown]
# As we can see, the first node's output values are the average of itself and the second node.
# Similarly, we can verify all other nodes.
# However, in a GNN, we would also want to allow feature exchange between nodes beyond their direct neighbors.
# This can be achieved by applying multiple GCN layers, which gives us the final layout of a GNN.
# The GNN can be built up by a sequence of GCN layers and non-linearities such as ReLU.
# For a visualization, see below (figure credit - [Thomas Kipf, 2016](https://tkipf.github.io/graph-convolutional-networks/)).
#
#
#
# However, one issue we can see from looking at the example above is that the output features for nodes 3 and 4 are
# the same because they have the same adjacent nodes (including themselves).
# Therefore, GCN layers can make the network forget node-specific information if we just take a mean over all messages.
# Multiple possible improvements have been proposed.
# While the simplest option might be using residual connections, the more common approach is to either weigh
# the self-connections higher or define a separate weight matrix for the self-connections.
# Alternatively, we can use a well-known concept: attention.

# %% [markdown]
# ### Graph Attention
#
# Attention describes a weighted average of multiple elements with the weights dynamically computed based on an input
# query and elements' keys (if you don't know what attention is, it is recommended to at least go through
# the very first section called [What is Attention?](https://uvadlc-notebooks.readthedocs.io/en/latest/tutorial_notebooks/tutorial6/Transformers_and_MHAttention.html#What-is-Attention?)).
# This concept can be similarly applied to graphs; one such application is the Graph Attention Network
# (called GAT, proposed by [Velickovic et al., 2017](https://arxiv.org/abs/1710.10903)).
# Similarly to the GCN, the graph attention layer creates a message for each node using a linear layer/weight matrix.
# For the attention part, it uses the message from the node itself as a query, and the messages to average as both
# keys and values (note that this also includes the message to itself).
# The score function $f_{attn}$ is implemented as a one-layer MLP which maps the query and key to a single value.
# The MLP looks as follows (figure credit - [Velickovic et al.](https://arxiv.org/abs/1710.10903)):
#
#
+# +# $h_i$ and $h_j$ are the original features from node $i$ and $j$ respectively, and represent the messages +# of the layer with $\mathbf{W}$ as weight matrix. +# $\mathbf{a}$ is the weight matrix of the MLP, which has the shape $[1,2\times d_{\text{message}}]$, +# and $\alpha_{ij}$ the final attention weight from node $i$ to $j$. +# The calculation can be described as follows: +# +# $$\alpha_{ij} = \frac{\exp\left(\text{LeakyReLU}\left(\mathbf{a}\left[\mathbf{W}h_i||\mathbf{W}h_j\right]\right)\right)}{\sum_{k\in\mathcal{N}_i} \exp\left(\text{LeakyReLU}\left(\mathbf{a}\left[\mathbf{W}h_i||\mathbf{W}h_k\right]\right)\right)}$$ +# +# The operator $||$ represents the concatenation, and $\mathcal{N}_i$ the indices of the neighbors of node $i$. +# Note that in contrast to usual practice, we apply a non-linearity (here LeakyReLU) before the softmax over elements. +# Although it seems like a minor change at first, it is crucial for the attention to depend on the original input. +# Specifically, let's remove the non-linearity for a second, and try to simplify the expression: +# +# $$ +# \begin{split} +# \alpha_{ij} & = \frac{\exp\left(\mathbf{a}\left[\mathbf{W}h_i||\mathbf{W}h_j\right]\right)}{\sum_{k\in\mathcal{N}_i} \exp\left(\mathbf{a}\left[\mathbf{W}h_i||\mathbf{W}h_k\right]\right)}\\[5pt] +# & = \frac{\exp\left(\mathbf{a}_{:,:d/2}\mathbf{W}h_i+\mathbf{a}_{:,d/2:}\mathbf{W}h_j\right)}{\sum_{k\in\mathcal{N}_i} \exp\left(\mathbf{a}_{:,:d/2}\mathbf{W}h_i+\mathbf{a}_{:,d/2:}\mathbf{W}h_k\right)}\\[5pt] +# & = \frac{\exp\left(\mathbf{a}_{:,:d/2}\mathbf{W}h_i\right)\cdot\exp\left(\mathbf{a}_{:,d/2:}\mathbf{W}h_j\right)}{\sum_{k\in\mathcal{N}_i} \exp\left(\mathbf{a}_{:,:d/2}\mathbf{W}h_i\right)\cdot\exp\left(\mathbf{a}_{:,d/2:}\mathbf{W}h_k\right)}\\[5pt] +# & = \frac{\exp\left(\mathbf{a}_{:,d/2:}\mathbf{W}h_j\right)}{\sum_{k\in\mathcal{N}_i} \exp\left(\mathbf{a}_{:,d/2:}\mathbf{W}h_k\right)}\\ +# \end{split} +# $$ +# +# We can see that without the non-linearity, the 
attention term with $h_i$ actually cancels itself out, +# resulting in the attention being independent of the node itself. +# Hence, we would have the same issue as the GCN of creating the same output features for nodes with the same neighbors. +# This is why the LeakyReLU is crucial and adds some dependency on $h_i$ to the attention. +# +# Once we obtain all attention factors, we can calculate the output features for each node by performing +# the weighted average: +# +# $$h_i'=\sigma\left(\sum_{j\in\mathcal{N}_i}\alpha_{ij}\mathbf{W}h_j\right)$$ +# +# $\sigma$ is yet another non-linearity, as in the GCN layer. +# Visually, we can represent the full message passing in an attention layer as follows +# (figure credit - [Velickovic et al. ](https://arxiv.org/abs/1710.10903)): +# +#
#
# To increase the expressiveness of the graph attention network, [Velickovic et al.](https://arxiv.org/abs/1710.10903)
# proposed to extend it to multiple heads similar to the Multi-Head Attention block in Transformers.
# This results in $N$ attention layers being applied in parallel.
# In the image above, it is visualized as three different colors of arrows (green, blue, and purple)
# that are afterward concatenated.
# The average is only applied for the very final prediction layer in a network.
#
# After having discussed the graph attention layer in detail, we can implement it below:


# %%
class GATLayer(nn.Module):
    """Multi-head graph attention layer operating on dense (batched) adjacency matrices."""

    def __init__(self, c_in, c_out, num_heads=1, concat_heads=True, alpha=0.2):
        """
        Args:
            c_in: Dimensionality of input features
            c_out: Dimensionality of output features
            num_heads: Number of heads, i.e. attention mechanisms to apply in parallel. The
                        output features are equally split up over the heads if concat_heads=True.
            concat_heads: If True, the output of the different heads is concatenated instead of averaged.
            alpha: Negative slope of the LeakyReLU activation.
        """
        super().__init__()
        self.num_heads = num_heads
        self.concat_heads = concat_heads
        if self.concat_heads:
            assert c_out % num_heads == 0, "Number of output features must be a multiple of the count of heads."
            c_out = c_out // num_heads

        # Sub-modules and parameters needed in the layer
        self.projection = nn.Linear(c_in, c_out * num_heads)
        # One attention vector per head; allocated uninitialised and filled by the Xavier init below
        self.a = nn.Parameter(torch.empty(num_heads, 2 * c_out))
        self.leakyrelu = nn.LeakyReLU(alpha)

        # Initialization from the original implementation
        nn.init.xavier_uniform_(self.projection.weight.data, gain=1.414)
        nn.init.xavier_uniform_(self.a.data, gain=1.414)

    def forward(self, node_feats, adj_matrix, print_attn_probs=False):
        """
        Args:
            node_feats: Input features of the nodes. Shape: [batch_size, num_nodes, c_in]
            adj_matrix: Adjacency matrix including self-connections. Every non-zero entry is
                        treated as an edge. Shape: [batch_size, num_nodes, num_nodes]
            print_attn_probs: If True, the attention weights are printed during the forward pass
                        (for debugging purposes)

        Returns:
            Tensor of shape [batch_size, num_nodes, F], where F is the per-head feature size times
            num_heads if concat_heads=True, and the per-head feature size otherwise.
        """
        batch_size, num_nodes = node_feats.size(0), node_feats.size(1)

        # Apply linear layer and sort nodes by head
        node_feats = self.projection(node_feats)
        node_feats = node_feats.view(batch_size, num_nodes, self.num_heads, -1)

        # We need to calculate the attention logits for every edge in the adjacency matrix
        # Doing this on all possible combinations of nodes is very expensive
        # => Create a tensor of [W*h_i||W*h_j] with i and j being the indices of all edges
        # A single boolean mask defines what counts as an edge. It is used both to gather the
        # edge list and to scatter the logits back, so the two can never disagree in size
        # (the previous "== 1" write-back broke for adjacency entries other than 0/1).
        edge_mask = adj_matrix != 0
        edges = edge_mask.nonzero(as_tuple=False)  # Rows of (batch index, i, j)
        node_feats_flat = node_feats.view(batch_size * num_nodes, self.num_heads, -1)
        edge_indices_row = edges[:, 0] * num_nodes + edges[:, 1]
        edge_indices_col = edges[:, 0] * num_nodes + edges[:, 2]
        a_input = torch.cat(
            [
                torch.index_select(input=node_feats_flat, index=edge_indices_row, dim=0),
                torch.index_select(input=node_feats_flat, index=edge_indices_col, dim=0),
            ],
            dim=-1,
        )  # Index select returns a tensor with node_feats_flat being indexed at the desired positions

        # Calculate attention MLP output (independent for each head)
        attn_logits = torch.einsum("bhc,hc->bh", a_input, self.a)
        attn_logits = self.leakyrelu(attn_logits)

        # Map list of attention values back into a matrix; non-edges keep a very negative logit
        # so that they receive (practically) zero probability in the softmax
        attn_matrix = attn_logits.new_full(tuple(adj_matrix.shape) + (self.num_heads,), -9e15)
        # Boolean indexing visits the edges in the same row-major order as `nonzero` above
        attn_matrix[edge_mask] = attn_logits

        # Weighted average of attention
        attn_probs = F.softmax(attn_matrix, dim=2)
        if print_attn_probs:
            print("Attention probs\n", attn_probs.permute(0, 3, 1, 2))
        node_feats = torch.einsum("bijh,bjhc->bihc", attn_probs, node_feats)

        # If heads should be concatenated, we can do this by reshaping. Otherwise, take mean
        if self.concat_heads:
            node_feats = node_feats.reshape(batch_size, num_nodes, -1)
        else:
            node_feats = node_feats.mean(dim=2)

        return node_feats


# %% [markdown]
# Again, we can apply the graph attention layer on our example graph above to understand the dynamics better.
# As before, the input layer is initialized as an identity matrix, but we set $\mathbf{a}$
# to be a vector of arbitrary numbers to obtain different attention values.
# We use two heads to show the parallel, independent attention mechanisms working in the layer.

# %%
layer = GATLayer(2, 2, num_heads=2)
layer.projection.weight.data = Tensor([[1.0, 0.0], [0.0, 1.0]])
layer.projection.bias.data = Tensor([0.0, 0.0])
layer.a.data = Tensor([[-0.2, 0.3], [0.1, -0.1]])

with torch.no_grad():
    out_feats = layer(node_feats, adj_matrix, print_attn_probs=True)

print("Adjacency matrix", adj_matrix)
print("Input features", node_feats)
print("Output features", out_feats)

# %% [markdown]
# We recommend that you try to calculate the attention matrix at least for one head and one node for yourself.
# The entries are 0 where there does not exist an edge between $i$ and $j$.
# For the others, we see a diverse set of attention probabilities.
# Moreover, the output features of node 3 and 4 are now different although they have the same neighbors.

# %% [markdown]
# ## PyTorch Geometric
#
# We had mentioned before that implementing graph networks with adjacency matrix is simple and straight-forward
# but can be computationally expensive for large graphs.
# Many real-world graphs can reach over 200k nodes, for which adjacency matrix-based implementations fail.
# There are a lot of optimizations possible when implementing GNNs, and luckily, there exist packages that provide such layers.
# The most popular packages for PyTorch are [PyTorch Geometric](https://pytorch-geometric.readthedocs.io/en/latest/)
# and the [Deep Graph Library](https://www.dgl.ai/) (the latter being actually framework agnostic).
# Which one to use depends on the project you are planning to do and personal taste.
# In this tutorial, we will look at PyTorch Geometric as part of the PyTorch family.
#
# PyTorch Geometric provides us a set of common graph layers, including the GCN and GAT layer we implemented above.
# Additionally, similar to PyTorch's torchvision, it provides the common graph datasets and transformations
# on those to simplify training.
# Compared to our implementation above, PyTorch Geometric uses a list of index pairs to represent the edges.
# The details of this library will be explored further in our experiments.
#
# In our tasks below, we want to be able to pick from a multitude of graph layers.
# Thus, we again define a dictionary below to access those using a string:

# %%
# Lookup table from a short layer name to the PyTorch Geometric layer class it stands for
gnn_layer_by_name = {"GCN": geom_nn.GCNConv, "GAT": geom_nn.GATConv, "GraphConv": geom_nn.GraphConv}

# %% [markdown]
# In addition to GCN and GAT, we added the layer `geom_nn.GraphConv`
# ([documentation](https://pytorch-geometric.readthedocs.io/en/latest/modules/nn.html#torch_geometric.nn.conv.GraphConv)).
# GraphConv is a GCN with a separate weight matrix for the self-connections.
# Mathematically, this would be:
#
# $$
# \mathbf{x}_i^{(l+1)} = \mathbf{W}^{(l + 1)}_1 \mathbf{x}_i^{(l)} + \mathbf{W}^{(l + 1)}_2 \sum_{j \in \mathcal{N}_i} \mathbf{x}_j^{(l)}
# $$
#
# In this formula, the neighbor's messages are added instead of averaged.
# However, PyTorch Geometric provides the argument `aggr` to switch between summing, averaging, and max pooling.

# %% [markdown]
# ## Experiments on graph structures
#
#
#
# Tasks on graph-structured data can be grouped into three groups: node-level, edge-level and graph-level.
# The different levels describe on which level we want to perform classification/regression.
# We will discuss all three types in more detail below.

# %% [markdown]
# ### Node-level tasks: Semi-supervised node classification
#
# Node-level tasks have the goal to classify nodes in a graph.
# Usually, we are given a single, large graph with >1000 nodes of which a certain amount of nodes are labeled.
# We learn to classify those labeled examples during training and try to generalize to the unlabeled nodes.
#
# A popular example that we will use in this tutorial is the Cora dataset, a citation network among papers.
# The Cora dataset consists of 2708 scientific publications with links between each other representing
# the citation of one paper by another.
# The task is to classify each publication into one of seven classes.
# Each publication is represented by a bag-of-words vector.
# This means that we have a vector of 1433 elements for each publication, where a 1 at feature $i$ indicates
# that the $i$-th word of a pre-defined dictionary is in the article.
# Binary bag-of-words representations are commonly used when we need very simple encodings,
# and already have an intuition of what words to expect in a network.
# There exist much better approaches, but we will leave this to the NLP courses to discuss.
#
# We will load the dataset below:

# %%
# Files are stored under DATASET_PATH (presumably downloaded there on first use - confirm)
cora_dataset = torch_geometric.datasets.Planetoid(root=DATASET_PATH, name="Cora")

# %% [markdown]
# Let's look at how PyTorch Geometric represents the graph data.
# Note that although we have a single graph, PyTorch Geometric returns a dataset for compatibility with other datasets.

# %%
cora_dataset[0]

# %% [markdown]
# The graph is represented by a `Data` object
# ([documentation](https://pytorch-geometric.readthedocs.io/en/latest/modules/data.html#torch_geometric.data.Data))
# which we can access as a standard Python namespace.
# The edge index tensor is the list of edges in the graph and contains the mirrored version of each edge for undirected graphs.
# The `train_mask`, `val_mask`, and `test_mask` are boolean masks that indicate which nodes we should use for training,
# validation, and testing.
# The `x` tensor is the feature tensor of our 2708 publications, and `y` the labels for all nodes.
#
# After having seen the data, we can implement a simple graph neural network.
# The GNN applies a sequence of graph layers (GCN, GAT, or GraphConv), ReLU as activation function,
# and dropout for regularization.
# See below for the specific implementation.


# %%
class GNNModel(nn.Module):
    """Stack of graph layers with ReLU and dropout in between; the last graph layer has no activation."""

    def __init__(
        self,
        c_in,
        c_hidden,
        c_out,
        num_layers=2,
        layer_name="GCN",
        dp_rate=0.1,
        **kwargs,
    ):
        """
        Args:
            c_in: Dimension of input features
            c_hidden: Dimension of hidden features
            c_out: Dimension of the output features. Usually number of classes in classification
            num_layers: Total number of graph layers; the first ``num_layers - 1`` are "hidden" layers
                        followed by ReLU and dropout
            layer_name: String of the graph layer to use (a key of ``gnn_layer_by_name``)
            dp_rate: Dropout rate to apply throughout the network
            kwargs: Additional arguments for the graph layer (e.g. number of heads for GAT)
        """
        super().__init__()
        gnn_layer = gnn_layer_by_name[layer_name]

        layers = []
        in_channels, out_channels = c_in, c_hidden
        for _ in range(num_layers - 1):
            layers += [
                gnn_layer(in_channels=in_channels, out_channels=out_channels, **kwargs),
                nn.ReLU(inplace=True),
                nn.Dropout(dp_rate),
            ]
            in_channels = c_hidden
        layers += [gnn_layer(in_channels=in_channels, out_channels=c_out, **kwargs)]
        self.layers = nn.ModuleList(layers)

    def forward(self, x, edge_index):
        """
        Args:
            x: Input features per node
            edge_index: List of vertex index pairs representing the edges in the graph (PyTorch geometric notation)

        Returns:
            Output of the last layer for every node.
        """
        for layer in self.layers:
            # For graph layers, we need to add the "edge_index" tensor as additional input
            # All PyTorch Geometric graph layer inherit the class "MessagePassing", hence
            # we can simply check the class type.
            if isinstance(layer, geom_nn.MessagePassing):
                x = layer(x, edge_index)
            else:
                x = layer(x)
        return x


# %% [markdown]
# Good practice in node-level tasks is to create an MLP baseline that is applied to each node independently.
# This way we can verify whether adding the graph information to the model indeed improves the prediction, or not.
# It might also be that the features per node are already expressive enough to clearly point towards a specific class.
# To check this, we implement a simple MLP below.


# %%
class MLPModel(nn.Module):
    """Per-node MLP baseline that ignores the graph structure."""

    def __init__(self, c_in, c_hidden, c_out, num_layers=2, dp_rate=0.1):
        """
        Args:
            c_in: Dimension of input features
            c_hidden: Dimension of hidden features
            c_out: Dimension of the output features. Usually number of classes in classification
            num_layers: Total number of linear layers; the first ``num_layers - 1`` are hidden layers
                        followed by ReLU and dropout
            dp_rate: Dropout rate to apply throughout the network
        """
        super().__init__()
        layers = []
        in_channels, out_channels = c_in, c_hidden
        for _ in range(num_layers - 1):
            layers += [nn.Linear(in_channels, out_channels), nn.ReLU(inplace=True), nn.Dropout(dp_rate)]
            in_channels = c_hidden
        layers += [nn.Linear(in_channels, c_out)]
        self.layers = nn.Sequential(*layers)

    def forward(self, x, *args, **kwargs):
        """
        Args:
            x: Input features per node
            *args, **kwargs: Ignored; accepted so the model can be called like ``GNNModel``
                        (e.g. with an additional ``edge_index`` argument)
        """
        return self.layers(x)


# %% [markdown]
# Finally, we can merge the models into a PyTorch Lightning module which handles the training,
# validation, and testing for us.


# %%
class NodeLevelGNN(L.LightningModule):
    """Lightning module for masked node classification with either the MLP baseline or a GNN."""

    def __init__(self, model_name, **model_kwargs):
        """
        Args:
            model_name: "MLP" selects ``MLPModel``; any other value selects ``GNNModel``
            model_kwargs: Keyword arguments forwarded to the selected model's constructor
        """
        super().__init__()
        # Saving hyperparameters
        self.save_hyperparameters()

        if model_name == "MLP":
            self.model = MLPModel(**model_kwargs)
        else:
            self.model = GNNModel(**model_kwargs)
        self.loss_module = nn.CrossEntropyLoss()

    def forward(self, data, mode="train"):
        """
        Args:
            data: Graph object providing ``x``, ``edge_index``, ``y`` and the train/val/test masks
            mode: One of "train", "val" or "test"; selects the node mask used for loss and accuracy

        Returns:
            Tuple ``(loss, acc)`` computed only on the nodes selected by the mask.

        Raises:
            AssertionError: If ``mode`` is not one of the supported values.
        """
        x, edge_index = data.x, data.edge_index
        x = self.model(x, edge_index)

        # Only calculate the loss on the nodes corresponding to the mask
        if mode == "train":
            mask = data.train_mask
        elif mode == "val":
            mask = data.val_mask
        elif mode == "test":
            mask = data.test_mask
        else:
            # Raised explicitly (instead of "assert False") so the check also survives "python -O"
            raise AssertionError("Unknown forward mode: %s" % mode)

        loss = self.loss_module(x[mask], data.y[mask])
        acc = (x[mask].argmax(dim=-1) == data.y[mask]).sum().float() / mask.sum()
        return loss, acc

    def configure_optimizers(self):
        # We use SGD here, but Adam works as well
        optimizer = optim.SGD(self.parameters(), lr=0.1, momentum=0.9, weight_decay=2e-3)
        return optimizer

    def training_step(self, batch, batch_idx):
        loss, acc = self.forward(batch, mode="train")
        self.log("train_loss", loss)
        self.log("train_acc", acc)
        return loss

    def validation_step(self, batch, batch_idx):
        _, acc = self.forward(batch, mode="val")
        self.log("val_acc", acc)

    def test_step(self, batch, batch_idx):
        _, acc = self.forward(batch, mode="test")
        self.log("test_acc", acc)


# %% [markdown]
# In addition to the Lightning module, we define a training function below.
# As we have a single graph, we use a batch size of 1 for the data loader and share the same data loader for the train,
# validation, and test set (the mask is picked inside the Lightning module).
# Besides, we set the argument `enable_progress_bar` to False as it usually shows the progress per epoch,
# but an epoch only consists of a single step.
# If you have downloaded the pre-trained models in the beginning of the tutorial, we load those instead of training from scratch.
# Finally, we test the model and return the results.


# %%
def train_node_classifier(model_name, dataset, **model_kwargs):
    """Train (or load) a node classifier and report its accuracy on all three masks.

    Args:
        model_name: "MLP" for the baseline, anything else for a GNN (see ``NodeLevelGNN``)
        dataset: Dataset holding the single graph; must expose ``num_node_features`` and ``num_classes``
        model_kwargs: Additional keyword arguments forwarded to the model constructor

    Returns:
        Tuple ``(model, result)`` where ``result`` maps "train", "val" and "test" to accuracies.
    """
    L.seed_everything(42)
    node_data_loader = geom_data.DataLoader(dataset, batch_size=1)

    # Create a PyTorch Lightning trainer
    root_dir = os.path.join(CHECKPOINT_PATH, "NodeLevel" + model_name)
    os.makedirs(root_dir, exist_ok=True)
    trainer = L.Trainer(
        default_root_dir=root_dir,
        callbacks=[ModelCheckpoint(save_weights_only=True, mode="max", monitor="val_acc")],
        accelerator="auto",
        devices=AVAIL_GPUS,
        max_epochs=200,
        enable_progress_bar=False,
    )  # Progress bar disabled because an epoch consists of a single step
    trainer.logger._default_hp_metric = None  # Optional logging argument that we don't need

    # Check whether pretrained model exists. If yes, load it and skip training
    pretrained_filename = os.path.join(CHECKPOINT_PATH, "NodeLevel%s.ckpt" % model_name)
    if os.path.isfile(pretrained_filename):
        print("Found pretrained model, loading...")
        model = NodeLevelGNN.load_from_checkpoint(pretrained_filename)
    else:
        # Re-seed right before the model is constructed (no explicit seed is passed here)
        L.seed_everything()
        model = NodeLevelGNN(
            model_name=model_name, c_in=dataset.num_node_features, c_out=dataset.num_classes, **model_kwargs
        )
        trainer.fit(model, node_data_loader, node_data_loader)
        model = NodeLevelGNN.load_from_checkpoint(trainer.checkpoint_callback.best_model_path)

    # Test best model on the test set
    test_result = trainer.test(model, dataloaders=node_data_loader, verbose=False)
    batch = next(iter(node_data_loader))
    batch = batch.to(model.device)
    # The trainer may hand the module back in training mode; evaluate explicitly in eval mode
    # and without gradient tracking so that dropout does not perturb the reported accuracies.
    model.eval()
    with torch.no_grad():
        _, train_acc = model.forward(batch, mode="train")
        _, val_acc = model.forward(batch, mode="val")
    result = {"train": train_acc, "val": val_acc, "test": test_result[0]["test_acc"]}
    return model, result


# %% [markdown]
# Now, we can train our models. First, let's train the simple MLP:


# %%
# Small function for printing the test scores
def print_results(result_dict):
    """Print the accuracies in ``result_dict`` as percentages ("train"/"val" optional, "test" required)."""
    if "train" in result_dict:
        print(f"Train accuracy: {100.0 * result_dict['train']:4.2f}%")
    if "val" in result_dict:
        print(f"Val accuracy: {100.0 * result_dict['val']:4.2f}%")
    print(f"Test accuracy: {100.0 * result_dict['test']:4.2f}%")


# %%
node_mlp_model, node_mlp_result = train_node_classifier(
    model_name="MLP", dataset=cora_dataset, c_hidden=16, num_layers=2, dp_rate=0.1
)

print_results(node_mlp_result)

# %% [markdown]
# Although the MLP can overfit on the training dataset because of the high-dimensional input features,
# it does not perform too well on the test set.
# Let's see if we can beat this score with our graph networks:

# %%
# Same hyperparameters as the MLP baseline above, but with GCN layers instead of linear layers
node_gnn_model, node_gnn_result = train_node_classifier(
    model_name="GNN", layer_name="GCN", dataset=cora_dataset, c_hidden=16, num_layers=2, dp_rate=0.1
)
print_results(node_gnn_result)

# %% [markdown]
# As we would have hoped for, the GNN model outperforms the MLP by quite a margin.
# This shows that using the graph information indeed improves our predictions and lets us generalize better.
#
# The hyperparameters in the model have been chosen to create a relatively small network.
# This is because the first layer with an input dimension of 1433 can be relatively expensive to perform for large graphs.
# In general, GNNs can become relatively expensive for very big graphs.
# This is why such GNNs either have a small hidden size or use a special batching strategy
# where we sample a connected subgraph of the big, original graph.

# %% [markdown]
# ### Edge-level tasks: Link prediction
#
# In some applications, we might have to predict on an edge level instead of a node level.
# The most common edge-level task in GNNs is link prediction.
# Link prediction means that given a graph, we want to predict whether there will be/should be an edge between two nodes or not.
# For example, in a social network, this is used by Facebook and others to propose new friends to you.
# Again, graph-level information can be crucial to perform this task.
# The output prediction is usually done by applying a similarity metric to the pair of node features,
# which should be 1 if there should be a link, and otherwise close to 0.
# To keep the tutorial short, we will not implement this task ourselves.
# Nevertheless, there are many good resources out there if you are interested in looking closer at this task.
+# Tutorials and papers for this topic include: +# +# * [PyTorch Geometric example](https://github.com/rusty1s/pytorch_geometric/blob/master/examples/link_pred.py) +# * [Graph Neural Networks: A Review of Methods and Applications](https://arxiv.org/pdf/1812.08434.pdf), Zhou et al. +# 2019 +# * [Link Prediction Based on Graph Neural Networks](https://papers.nips.cc/paper/2018/file/53f0d7c537d99b3824f0f99d62ea2428-Paper.pdf), Zhang and Chen, 2018. + +# %% [markdown] +# ### Graph-level tasks: Graph classification +# +# Finally, in this part of the tutorial, we will have a closer look at how to apply GNNs to the task of graph classification. +# The goal is to classify an entire graph instead of single nodes or edges. +# Therefore, we are also given a dataset of multiple graphs that we need to classify based on some structural graph properties. +# The most common task for graph classification is molecular property prediction, in which molecules are represented as graphs. +# Each atom is linked to a node, and edges in the graph are the bonds between atoms. +# For example, look at the figure below. +# +#
#
# On the left, we have an arbitrary, small molecule with different atoms, whereas the right part of the image shows the graph representation.
# The atom types are abstracted as node features (e.g. a one-hot vector), and the different bond types are used as edge features.
# For simplicity, we will neglect the edge attributes in this tutorial, but you can include them by using methods like the
# [Relational Graph Convolution](https://arxiv.org/abs/1703.06103) that uses a different weight matrix for each edge type.
#
# The dataset we will use below is called the MUTAG dataset.
# It is a common small benchmark for graph classification algorithms, and contains 188 graphs with 18 nodes
# and 20 edges on average for each graph.
# The graph nodes have 7 different labels/atom types, and the binary graph labels represent "their mutagenic effect
# on a specific gram negative bacterium" (the specific meaning of the labels is not too important here).
# The dataset is part of a large collection of different graph classification datasets, known as the
# [TUDatasets](https://chrsmrrs.github.io/datasets/), which is directly accessible
# via `torch_geometric.datasets.TUDataset` ([documentation](https://pytorch-geometric.readthedocs.io/en/latest/modules/datasets.html#torch_geometric.datasets.TUDataset)) in PyTorch Geometric.
# We can load the dataset below.

# %%
tu_dataset = torch_geometric.datasets.TUDataset(root=DATASET_PATH, name="MUTAG")

# %% [markdown]
# Let's look at some statistics for the dataset:

# %%
# `tu_dataset.data` is the dataset's underlying storage object; its `y` attribute holds the graph labels
print("Data object:", tu_dataset.data)
print("Length:", len(tu_dataset))
print("Average label: %4.2f" % (tu_dataset.data.y.float().mean().item()))

# %% [markdown]
# The first line shows how the dataset stores different graphs.
# The nodes, edges, and labels of each graph are concatenated to one tensor, and the dataset stores the indices
# where to split the tensors correspondingly.
+# The length of the dataset is the number of graphs we have, and the "average label" +# denotes the percentage of the graphs with label 1. +# As long as the percentage is close to 0.5, we have a relatively balanced dataset. +# It happens quite often that graph datasets are very imbalanced, hence checking the class balance +# is always a good thing to do. +# +# Next, we will split our dataset into a training and test part. +# Note that we do not use a validation set this time because of the small size of the dataset. +# Therefore, our model might overfit slightly on the validation set due to the noise of the evaluation, +# but we still get an estimate of the performance on untrained data. + +# %% +torch.manual_seed(42) +tu_dataset.shuffle() +train_dataset = tu_dataset[:150] +test_dataset = tu_dataset[150:] + +# %% [markdown] +# When using a data loader, we encounter a problem with batching $N$ graphs. +# Each graph in the batch can have a different number of nodes and edges, and hence we would require a lot of padding to obtain a single tensor. +# Torch geometric uses a different, more efficient approach: we can view the $N$ graphs in a batch as a single large graph with concatenated node and edge list. +# As there is no edge between the $N$ graphs, running GNN layers on the large graph gives us the same output as running the GNN on each graph separately. +# Visually, this batching strategy is visualized below (figure credit - PyTorch Geometric team, +# [tutorial here](https://colab.research.google.com/drive/1I8a0DfQ3fI7Njc62__mVXUlcAleUclnb)). +# +#
+# +# The adjacency matrix is zero for any nodes that come from two different graphs, and otherwise according to the adjacency matrix of the individual graph. +# Luckily, this strategy is already implemented in torch geometric, and hence we can use the corresponding data loader: + +# %% +graph_train_loader = geom_data.DataLoader(train_dataset, batch_size=BATCH_SIZE, shuffle=True) +graph_val_loader = geom_data.DataLoader(test_dataset, batch_size=BATCH_SIZE) # Additional loader for a larger datasets +graph_test_loader = geom_data.DataLoader(test_dataset, batch_size=BATCH_SIZE) + +# %% [markdown] +# Let's load a batch below to see the batching in action: + +# %% +batch = next(iter(graph_test_loader)) +print("Batch:", batch) +print("Labels:", batch.y[:10]) +print("Batch indices:", batch.batch[:40]) + +# %% [markdown] +# We have 38 graphs stacked together for the test dataset. +# The batch indices, stored in `batch`, show that the first 12 nodes belong to the first graph, +# the next 22 to the second graph, and so on. +# These indices are important for performing the final prediction. +# To perform a prediction over a whole graph, we usually perform a pooling operation over all nodes after running the GNN model. +# In this case, we will use the average pooling. +# Hence, we need to know which nodes should be included in which average pool. +# Using this pooling, we can already create our graph network below. +# Specifically, we re-use our class `GNNModel` from before, +# and simply add an average pool and single linear layer for the graph prediction task. 
# %%
class GraphGNNModel(nn.Module):
    """Graph-level predictor: GNN backbone, mean pooling over nodes, then a linear head."""

    def __init__(self, c_in, c_hidden, c_out, dp_rate_linear=0.5, **kwargs):
        """
        Args:
            c_in: Dimension of input features
            c_hidden: Dimension of hidden features
            c_out: Dimension of output features (usually number of classes)
            dp_rate_linear: Dropout rate before the linear layer (usually much higher than inside the GNN)
            kwargs: Additional arguments for the GNNModel object
        """
        super().__init__()
        # The backbone outputs hidden features per node (c_out=c_hidden);
        # the actual prediction is produced by the head after pooling.
        self.GNN = GNNModel(c_in=c_in, c_hidden=c_hidden, c_out=c_hidden, **kwargs)
        dropout = nn.Dropout(dp_rate_linear)
        classifier = nn.Linear(c_hidden, c_out)
        self.head = nn.Sequential(dropout, classifier)

    def forward(self, x, edge_index, batch_idx):
        """
        Args:
            x: Input features per node
            edge_index: List of vertex index pairs representing the edges in the graph (PyTorch geometric notation)
            batch_idx: Index of batch element for each node
        """
        node_feats = self.GNN(x, edge_index)
        # Average the node features of every graph in the batch
        graph_feats = geom_nn.global_mean_pool(node_feats, batch_idx)
        return self.head(graph_feats)


# %% [markdown]
# Finally, we can create a PyTorch Lightning module to handle the training.
# It is similar to the modules we have seen before and does nothing surprising in terms of training.
# As we have a binary classification task, we use the Binary Cross Entropy loss.
# %%
class GraphLevelGNN(L.LightningModule):
    """Lightning wrapper that trains and evaluates a `GraphGNNModel` on graph classification."""

    def __init__(self, **model_kwargs):
        super().__init__()
        # Store all constructor arguments in self.hparams (and in checkpoints)
        self.save_hyperparameters()

        self.model = GraphGNNModel(**model_kwargs)
        # A single output neuron means binary classification on logits
        if self.hparams.c_out == 1:
            self.loss_module = nn.BCEWithLogitsLoss()
        else:
            self.loss_module = nn.CrossEntropyLoss()

    def forward(self, data, mode="train"):
        """Return (loss, accuracy) for one batch of graphs.

        `mode` is accepted for interface compatibility; it is not used in the computation.
        """
        logits = self.model(data.x, data.edge_index, data.batch)
        logits = logits.squeeze(dim=-1)

        if self.hparams.c_out == 1:
            # Logit > 0 corresponds to class 1; BCE expects float targets
            preds = (logits > 0).float()
            data.y = data.y.float()
        else:
            preds = logits.argmax(dim=-1)

        loss = self.loss_module(logits, data.y)
        n_correct = (preds == data.y).sum().float()
        acc = n_correct / preds.shape[0]
        return loss, acc

    def configure_optimizers(self):
        # High lr because of small dataset and small model
        return optim.AdamW(self.parameters(), lr=1e-2, weight_decay=0.0)

    def training_step(self, batch, batch_idx):
        loss, acc = self.forward(batch, mode="train")
        self.log("train_loss", loss)
        self.log("train_acc", acc)
        return loss

    def validation_step(self, batch, batch_idx):
        _, acc = self.forward(batch, mode="val")
        self.log("val_acc", acc)

    def test_step(self, batch, batch_idx):
        _, acc = self.forward(batch, mode="test")
        self.log("test_acc", acc)


# %% [markdown]
# Below we train the model on our dataset. It resembles the typical training functions we have seen so far.
# %%
def train_graph_classifier(model_name, **model_kwargs):
    """Train (or load) a graph-level GNN and report its train/test accuracy.

    Args:
        model_name: Name used for the log directory and the pretrained checkpoint file
        model_kwargs: Additional arguments forwarded to `GraphLevelGNN`

    Returns:
        Tuple of the model and a dict with the keys "test" and "train" holding the accuracies.
    """
    L.seed_everything(42)

    # Trainer that keeps the weights of the epoch with the best validation accuracy
    log_dir = os.path.join(CHECKPOINT_PATH, "GraphLevel" + model_name)
    os.makedirs(log_dir, exist_ok=True)
    best_val_checkpoint = ModelCheckpoint(save_weights_only=True, mode="max", monitor="val_acc")
    trainer = L.Trainer(
        default_root_dir=log_dir,
        callbacks=[best_val_checkpoint],
        accelerator="cuda",
        devices=AVAIL_GPUS,
        max_epochs=500,
        enable_progress_bar=False,
    )
    trainer.logger._default_hp_metric = None

    # Use a pretrained checkpoint if one exists; otherwise train from scratch
    checkpoint_file = os.path.join(CHECKPOINT_PATH, "GraphLevel%s.ckpt" % model_name)
    if not os.path.isfile(checkpoint_file):
        L.seed_everything(42)
        n_classes = tu_dataset.num_classes
        model = GraphLevelGNN(
            c_in=tu_dataset.num_node_features,
            c_out=1 if n_classes == 2 else n_classes,
            **model_kwargs,
        )
        trainer.fit(model, graph_train_loader, graph_val_loader)
        model = GraphLevelGNN.load_from_checkpoint(trainer.checkpoint_callback.best_model_path)
    else:
        print("Found pretrained model, loading...")
        model = GraphLevelGNN.load_from_checkpoint(checkpoint_file)

    # Evaluate the selected model on the training and the test set
    train_acc = trainer.test(model, dataloaders=graph_train_loader, verbose=False)[0]["test_acc"]
    test_acc = trainer.test(model, dataloaders=graph_test_loader, verbose=False)[0]["test_acc"]
    return model, {"test": test_acc, "train": train_acc}


# %% [markdown]
# Finally, let's perform the training and testing.
# Feel free to experiment with different GNN layers, hyperparameters, etc.
+ +# %% +model, result = train_graph_classifier( + model_name="GraphConv", c_hidden=256, layer_name="GraphConv", num_layers=3, dp_rate_linear=0.5, dp_rate=0.0 +) + +# %% +print("Train performance: %4.2f%%" % (100.0 * result["train"])) +print("Test performance: %4.2f%%" % (100.0 * result["test"])) + +# %% [markdown] +# The test performance shows that we obtain quite good scores on an unseen part of the dataset. +# It should be noted that as we have been using the test set for validation as well, we might have overfitted slightly to this set. +# Nevertheless, the experiment shows us that GNNs can be indeed powerful to predict the properties of graphs and/or molecules. + +# %% [markdown] +# ## Conclusion +# +# In this tutorial, we have seen the application of neural networks to graph structures. +# We looked at how a graph can be represented (adjacency matrix or edge list), +# and discussed the implementation of common graph layers: GCN and GAT. +# The implementations showed the practical side of the layers, which is often easier than the theory. +# Finally, we experimented with different tasks, on node-, edge- and graph-level. +# Overall, we have seen that including graph information in the predictions can be crucial for achieving high performance. +# There are a lot of applications that benefit from GNNs, +# and the importance of these networks will likely increase over the next years. diff --git a/_notebooks/course_UvA-DL/06-graph-neural-networks/example_graph.svg b/_notebooks/course_UvA-DL/06-graph-neural-networks/example_graph.svg new file mode 100644 index 0000000..1d85c94 --- /dev/null +++ b/_notebooks/course_UvA-DL/06-graph-neural-networks/example_graph.svg @@ -0,0 +1,3 @@ + + +
1
1
4
4
3
3
2
2
diff --git a/_notebooks/course_UvA-DL/06-graph-neural-networks/gcn_network.png b/_notebooks/course_UvA-DL/06-graph-neural-networks/gcn_network.png new file mode 100644 index 0000000..d191107 Binary files /dev/null and b/_notebooks/course_UvA-DL/06-graph-neural-networks/gcn_network.png differ diff --git a/_notebooks/course_UvA-DL/06-graph-neural-networks/graph_attention.jpeg b/_notebooks/course_UvA-DL/06-graph-neural-networks/graph_attention.jpeg new file mode 100644 index 0000000..4f382cb Binary files /dev/null and b/_notebooks/course_UvA-DL/06-graph-neural-networks/graph_attention.jpeg differ diff --git a/_notebooks/course_UvA-DL/06-graph-neural-networks/graph_attention_MLP.svg b/_notebooks/course_UvA-DL/06-graph-neural-networks/graph_attention_MLP.svg new file mode 100644 index 0000000..66d219d --- /dev/null +++ b/_notebooks/course_UvA-DL/06-graph-neural-networks/graph_attention_MLP.svg @@ -0,0 +1,553 @@ + + + + + + image/svg+xml + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/_notebooks/course_UvA-DL/06-graph-neural-networks/graph_message_passing.svg b/_notebooks/course_UvA-DL/06-graph-neural-networks/graph_message_passing.svg new file mode 100644 index 0000000..35f9915 --- /dev/null +++ b/_notebooks/course_UvA-DL/06-graph-neural-networks/graph_message_passing.svg @@ -0,0 +1,3 @@ + + +
1
1
4
4
3
3
2
2
1
1
4
4
3
3
2
2
Message passing
Message passing
diff --git a/_notebooks/course_UvA-DL/06-graph-neural-networks/molecule_graph.svg b/_notebooks/course_UvA-DL/06-graph-neural-networks/molecule_graph.svg new file mode 100644 index 0000000..d5c8e1d --- /dev/null +++ b/_notebooks/course_UvA-DL/06-graph-neural-networks/molecule_graph.svg @@ -0,0 +1,434 @@ + + + + + + image/svg+xml + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/_notebooks/course_UvA-DL/06-graph-neural-networks/torch_geometric_stacking_graphs.png b/_notebooks/course_UvA-DL/06-graph-neural-networks/torch_geometric_stacking_graphs.png new file mode 100644 index 0000000..14bccb9 Binary files /dev/null and b/_notebooks/course_UvA-DL/06-graph-neural-networks/torch_geometric_stacking_graphs.png differ diff --git a/_notebooks/course_UvA-DL/07-deep-energy-based-generative-models/.meta.yml b/_notebooks/course_UvA-DL/07-deep-energy-based-generative-models/.meta.yml new file mode 100644 index 0000000..a5d7c01 --- /dev/null +++ b/_notebooks/course_UvA-DL/07-deep-energy-based-generative-models/.meta.yml @@ -0,0 +1,28 @@ +title: "Tutorial 7: Deep Energy-Based Generative Models" +author: Phillip Lippe +created: 2021-07-12 +updated: 2023-03-14 +license: CC BY-SA +build: 0 +tags: + - Image +description: | + In this tutorial, we will look at energy-based deep learning models, and focus on their application as generative models. + Energy models have been a popular tool before the huge deep learning hype around 2012 hit. + However, in recent years, energy-based models have gained increasing attention because of improved training methods and tricks being proposed. 
+ Although they are still in a research stage, they have shown to outperform strong Generative Adversarial Networks + in certain cases which have been the state of the art of generating images + ([blog post](https://ajolicoeur.wordpress.com/the-new-contender-to-gans-score-matching-with-langevin-sampling/)about strong energy-based models, + [blog post](https://medium.com/syncedreview/nvidia-open-sources-hyper-realistic-face-generator-stylegan-f346e1a73826) about the power of GANs). + Hence, it is important to be aware of energy-based models, and as the theory can be abstract sometimes, + we will show the idea of energy-based models with a lot of examples. + This notebook is part of a lecture series on Deep Learning at the University of Amsterdam. + The full list of tutorials can be found at https://uvadlc-notebooks.rtfd.io. +requirements: + - torchvision + - matplotlib + - tensorboard + - lightning>=2.0.0rc0 +accelerator: + - CPU + - GPU diff --git a/docs/_static/images/course_UvA-DL/07-deep-energy-based-generative-models.jpg b/_notebooks/course_UvA-DL/07-deep-energy-based-generative-models/.thumb.jpg similarity index 100% rename from docs/_static/images/course_UvA-DL/07-deep-energy-based-generative-models.jpg rename to _notebooks/course_UvA-DL/07-deep-energy-based-generative-models/.thumb.jpg diff --git a/_notebooks/course_UvA-DL/07-deep-energy-based-generative-models/Deep_Energy_Models.py b/_notebooks/course_UvA-DL/07-deep-energy-based-generative-models/Deep_Energy_Models.py new file mode 100644 index 0000000..6cd07a4 --- /dev/null +++ b/_notebooks/course_UvA-DL/07-deep-energy-based-generative-models/Deep_Energy_Models.py @@ -0,0 +1,887 @@ +# %% [markdown] +#
+# First, let's import our standard libraries below. + +# %% +# Standard libraries +import os +import random +import urllib.request +from urllib.error import HTTPError + +# PyTorch Lightning +import lightning as L + +# Plotting +import matplotlib +import matplotlib.pyplot as plt + +# %matplotlib inline +import matplotlib_inline.backend_inline +import numpy as np + +# PyTorch +import torch +import torch.nn as nn +import torch.optim as optim +import torch.utils.data as data + +# Torchvision +import torchvision +from lightning.pytorch.callbacks import Callback, LearningRateMonitor, ModelCheckpoint +from torchvision import transforms +from torchvision.datasets import MNIST + +matplotlib_inline.backend_inline.set_matplotlib_formats("svg", "pdf") # For export +matplotlib.rcParams["lines.linewidth"] = 2.0 + +# Path to the folder where the datasets are/should be downloaded (e.g. CIFAR10) +DATASET_PATH = os.environ.get("PATH_DATASETS", "data") +# Path to the folder where the pretrained models are saved +CHECKPOINT_PATH = os.environ.get("PATH_CHECKPOINT", "saved_models/tutorial8") + +# Setting the seed +L.seed_everything(42) + +# Ensure that all operations are deterministic on GPU (if used) for reproducibility +torch.backends.cudnn.deterministic = True +torch.backends.cudnn.benchmark = False + +device = torch.device("cuda:0") if torch.cuda.is_available() else torch.device("cpu") + +# %% [markdown] +# We also have pre-trained models that we download below. + +# %% +# Github URL where saved models are stored for this tutorial +base_url = "https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial8/" +# Files to download +pretrained_files = ["MNIST.ckpt", "tensorboards/events.out.tfevents.MNIST"] + +# Create checkpoint path if it doesn't exist yet +os.makedirs(CHECKPOINT_PATH, exist_ok=True) + +# For each file, check whether it already exists. If not, try downloading it. 
+for file_name in pretrained_files: + file_path = os.path.join(CHECKPOINT_PATH, file_name) + if "/" in file_name: + os.makedirs(file_path.rsplit("/", 1)[0], exist_ok=True) + if not os.path.isfile(file_path): + file_url = base_url + file_name + print("Downloading %s..." % file_url) + try: + urllib.request.urlretrieve(file_url, file_path) + except HTTPError as e: + print( + "Something went wrong. Please try to download the files manually," + " or contact the author with the full output including the following error:\n", + e, + ) + +# %% [markdown] +# ## Energy Models +# +# In the first part of this tutorial, we will review the theory of the energy-based models +# (the same theory has been discussed in Lecture 8). +# While most of the previous models had the goal of classification or regression, +# energy-based models are motivated from a different perspective: density estimation. +# Given a dataset with a lot of elements, we want to estimate the probability distribution over the whole data space. +# As an example, if we model images from CIFAR10, our goal would be to have a probability distribution +# over all possible images of size $32\times32\times3$ where those images have a high likelihood +# that look realistic and are one of the 10 CIFAR classes. +# Simple methods like interpolation between images don't work because images are extremely high-dimensional +# (especially for large HD images). +# Hence, we turn to deep learning methods that have performed well on complex data. +# +# However, how do we predict a probability distribution $p(\mathbf{x})$ over so many dimensions using a simple neural network? +# The problem is that we cannot just predict a score between 0 and 1, +# because a probability distribution over data needs to fulfill two properties: +# +# 1. +# The probability distribution needs to assign any possible value of +# $\mathbf{x}$ a non-negative value: $p(\mathbf{x}) \geq 0$. +# 2. 
+# The probability density must sum/integrate to 1 over **all** possible inputs: +# $\int_{\mathbf{x}} p(\mathbf{x}) d\mathbf{x} = 1$. +# +# Luckily, there are actually many approaches for this, and one of them is energy-based models. +# The fundamental idea of energy-based models is that you can turn any function +# that predicts values larger than zero into a probability distribution by dividing by its volume. +# Imagine we have a neural network, which has as output a single neuron, like in regression. +# We can call this network $E_{\theta}(\mathbf{x})$, where $\theta$ are our parameters of the network, +# and $\mathbf{x}$ the input data (e.g. an image). +# The output of $E_{\theta}$ is a scalar value between $-\infty$ and $\infty$. +# Now, we can use basic probability theory to *normalize* the scores of all possible inputs: +# +# $$ +# q_{\theta}(\mathbf{x}) = \frac{\exp\left(-E_{\theta}(\mathbf{x})\right)}{Z_{\theta}} \hspace{5mm}\text{where}\hspace{5mm} +# Z_{\theta} = \begin{cases} +# \int_{\mathbf{x}}\exp\left(-E_{\theta}(\mathbf{x})\right) d\mathbf{x} & \text{if }x\text{ is continuous}\\ +# \sum_{\mathbf{x}}\exp\left(-E_{\theta}(\mathbf{x})\right) & \text{if }x\text{ is discrete} +# \end{cases} +# $$ +# +# The $\exp$-function ensures that we assign a probability greater than zero to any possible input. +# We use a negative sign in front of $E$ because we call $E_{\theta}$ to be the energy function: +# data points with high likelihood have a low energy, while data points with low likelihood have a high energy. +# $Z_{\theta}$ is our normalization term that ensures that the density integrates/sums to 1. 
+# We can show this by integrating over $q_{\theta}(\mathbf{x})$: +# +# $$ +# \int_{\mathbf{x}}q_{\theta}(\mathbf{x})d\mathbf{x} = +# \int_{\mathbf{x}}\frac{\exp\left(-E_{\theta}(\mathbf{x})\right)}{\int_{\mathbf{\tilde{x}}}\exp\left(-E_{\theta}(\mathbf{\tilde{x}})\right) d\mathbf{\tilde{x}}}d\mathbf{x} = +# \frac{\int_{\mathbf{x}}\exp\left(-E_{\theta}(\mathbf{x})\right)d\mathbf{x}}{\int_{\mathbf{\tilde{x}}}\exp\left(-E_{\theta}(\mathbf{\tilde{x}})\right) d\mathbf{\tilde{x}}} = 1 +# $$ +# +# Note that we call the probability distribution $q_{\theta}(\mathbf{x})$ because this is the learned distribution by the model, +# and is trained to be as close as possible to the *true*, unknown distribution $p(\mathbf{x})$. +# +# The main benefit of this formulation of the probability distribution is its great flexibility as we can choose +# $E_{\theta}$ in whatever way we like, without any constraints. +# Nevertheless, when looking at the equation above, we can see a fundamental issue: How do we calculate $Z_{\theta}$? +# There is no chance that we can calculate $Z_{\theta}$ analytically for high-dimensional input +# and/or larger neural networks, but the task requires us to know $Z_{\theta}$. +# Although we can't determine the exact likelihood of a point, there exist methods with which we can train energy-based models. +# Thus, we will look next at "Contrastive Divergence" for training the model. + +# %% [markdown] +# ### Contrastive Divergence +# +# When we train a model on generative modeling, it is usually done by maximum likelihood estimation. +# In other words, we try to maximize the likelihood of the examples in the training set. +# As the exact likelihood of a point cannot be determined due to the unknown normalization constant $Z_{\theta}$, +# we need to train energy-based models slightly differently. 
+# We cannot just maximize the un-normalized probability $\exp(-E_{\theta}(\mathbf{x}_{\text{train}}))$ +# because there is no guarantee that $Z_{\theta}$ stays constant, or that $\mathbf{x}_{\text{train}}$ +# is becoming more likely than the others. +# However, if we base our training on comparing the likelihood of points, we can create a stable objective. +# Namely, we can re-write our maximum likelihood objective where we maximize the probability +# of $\mathbf{x}_{\text{train}}$ compared to a randomly sampled data point of our model: +# +# $$ +# \begin{split} +# \nabla_{\theta}\mathcal{L}_{\text{MLE}}(\mathbf{\theta};p) & = -\mathbb{E}_{p(\mathbf{x})}\left[\nabla_{\theta}\log q_{\theta}(\mathbf{x})\right]\\[5pt] +# & = \mathbb{E}_{p(\mathbf{x})}\left[\nabla_{\theta}E_{\theta}(\mathbf{x})\right] - \mathbb{E}_{q_{\theta}(\mathbf{x})}\left[\nabla_{\theta}E_{\theta}(\mathbf{x})\right] +# \end{split} +# $$ +# +# Note that the loss is still an objective we want to minimize. +# Thus, we try to minimize the energy for data points from the dataset, while maximizing the energy for randomly +# sampled data points from our model (how we sample will be explained below). +# Although this objective sounds intuitive, how is it actually derived from our original distribution $q_{\theta}(\mathbf{x})$? +# The trick is that we approximate $Z_{\theta}$ by a single Monte-Carlo sample. +# This gives us the exact same objective as written above. +# +# Visually, we can look at the objective as follows (figure credit +# - [Stefano Ermon and Aditya Grover](https://deepgenerativemodels.github.io/assets/slides/cs236_lecture11.pdf)): +# +#
+# +# $f_{\theta}$ represents $\exp(-E_{\theta}(\mathbf{x}))$ in our case. +# The point on the right, called "correct answer", represents a data point from the dataset +# (i.e. $x_{\text{train}}$), and the left point, "wrong answer", a sample from our model (i.e. $x_{\text{sample}}$). +# Thus, we try to "pull up" the probability of the data points in the dataset, +# while "pushing down" randomly sampled points. +# The two forces for pulling and pushing are in balance iff $q_{\theta}(\mathbf{x})=p(\mathbf{x})$. + +# %% [markdown] +# ### Sampling from Energy-Based Models +# +# For sampling from an energy-based model, we can apply a Markov Chain Monte Carlo using Langevin Dynamics. +# The idea of the algorithm is to start from a random point, and slowly move towards the direction +# of higher probability using the gradients of $E_{\theta}$. +# Nevertheless, this is not enough to fully capture the probability distribution. +# We need to add noise $\omega$ at each gradient step to the current sample. +# Under certain conditions such as that we perform the gradient steps an infinite amount of times, +# we would be able to create an exact sample from our modeled distribution. +# However, as this is not practically possible, we usually limit the chain to $K$ steps +# ($K$ a hyperparameter that needs to be finetuned). +# Overall, the sampling procedure can be summarized in the following algorithm: +# +#
+ +# %% [markdown] +# ### Applications of Energy-based models beyond generation +# +# Modeling the probability distribution for sampling new data is not the only application of energy-based models. +# Any application which requires us to compare two elements is much simpler to learn +# because we just need to go for the higher energy. +# A couple of examples are shown below (figure credit +# - [Stefano Ermon and Aditya Grover](https://deepgenerativemodels.github.io/assets/slides/cs236_lecture11.pdf)). +# A classification setup like object recognition or sequence labeling can be considered as an energy-based +# task as we just need to find the $Y$ input that minimizes the output $E(X, Y)$ (hence maximizes probability). +# Similarly, a popular application of energy-based models is denoising of images. +# Given an image $X$ with a lot of noise, we try to minimize the energy by finding the true input image $Y$. +# +#
+# +# Nonetheless, we will focus on generative modeling here as in the next couple of lectures, +# we will discuss more generative deep learning approaches. + +# %% [markdown] +# ## Image generation +# +#
+# +# As an example for energy-based models, we will train a model on image generation. +# Specifically, we will look at how we can generate MNIST digits with a very simple CNN model. +# However, it should be noted that energy models are not easy to train and often diverge +# if the hyperparameters are not well tuned. +# We will rely on training tricks proposed in the paper +# [Implicit Generation and Generalization in Energy-Based Models](https://arxiv.org/abs/1903.08689) +# by Yilun Du and Igor Mordatch ([blog](https://openai.com/blog/energy-based-models/)). +# The important part of this notebook is however to see how the theory above can actually be used in a model. +# +# ### Dataset +# +# First, we can load the MNIST dataset below. +# Note that we need to normalize the images between -1 and 1 instead of mean 0 and std 1 because during sampling, +# we have to limit the input space. +# Scaling between -1 and 1 makes it easier to implement it. + +# %% +# Transformations applied on each image => make them a tensor and normalize between -1 and 1 +transform = transforms.Compose([transforms.ToTensor(), transforms.Normalize((0.5,), (0.5,))]) + +# Loading the training dataset. We need to split it into a training and validation part +train_set = MNIST(root=DATASET_PATH, train=True, transform=transform, download=True) + +# Loading the test set +test_set = MNIST(root=DATASET_PATH, train=False, transform=transform, download=True) + +# We define a set of data loaders that we can use for various purposes later. +# Note that for actually training a model, we will use different data loaders +# with a lower batch size. +train_loader = data.DataLoader(train_set, batch_size=128, shuffle=True, drop_last=True, num_workers=4, pin_memory=True) +test_loader = data.DataLoader(test_set, batch_size=256, shuffle=False, drop_last=False, num_workers=4) + +# %% [markdown] +# ### CNN Model +# +# First, we implement our CNN model. 
# The MNIST images are of size 28x28, hence we only need a small model.
# As an example, we will apply several convolutions with stride 2 that downscale the images.
# If you are interested, you can also use a deeper model such as a small ResNet, but for simplicity,
# we will stick with the tiny network.
#
# It is a good practice to use a smooth activation function like Swish instead of ReLU in the energy model.
# This is because we will rely on the gradients we get back with respect to the input image, which should not be sparse.


# %%
class CNNModel(nn.Module):
    """Small strided CNN with Swish (SiLU) activations that maps an image to `out_dim` values."""

    def __init__(self, hidden_features=32, out_dim=1, **kwargs):
        """
        Args:
            hidden_features: Base channel width; the convolutions use half, one and two times this value
            out_dim: Number of outputs of the final linear layer
            kwargs: Accepted for interface compatibility and ignored
        """
        super().__init__()
        # Channel widths of the four convolutions (the hidden dimension grows over layers)
        widths = (hidden_features // 2, hidden_features, hidden_features * 2, hidden_features * 2)

        # First convolution: larger kernel and padding, 28x28 input -> 16x16 feature map
        layers = [nn.Conv2d(1, widths[0], kernel_size=5, stride=2, padding=4), nn.SiLU()]
        # Remaining convolutions halve the resolution each: 16x16 -> 8x8 -> 4x4 -> 2x2
        for c_prev, c_next in zip(widths[:-1], widths[1:]):
            layers.append(nn.Conv2d(c_prev, c_next, kernel_size=3, stride=2, padding=1))
            layers.append(nn.SiLU())
        # Flattened 2x2 map -> hidden vector -> output
        c_last = widths[-1]
        layers.extend([nn.Flatten(), nn.Linear(c_last * 4, c_last), nn.SiLU(), nn.Linear(c_last, out_dim)])

        self.cnn_layers = nn.Sequential(*layers)

    def forward(self, x):
        # Drop the trailing dimension when it has size 1 (i.e. for out_dim == 1)
        return self.cnn_layers(x).squeeze(dim=-1)


# %% [markdown]
# In the rest of the notebook, the output of the model will actually not represent
# $E_{\theta}(\mathbf{x})$, but $-E_{\theta}(\mathbf{x})$.
# This is a standard implementation practice for energy-based models, as some people also write the energy probability
# density as $q_{\theta}(\mathbf{x}) = \frac{\exp\left(f_{\theta}(\mathbf{x})\right)}{Z_{\theta}}$.
# In that case, the model would actually represent $f_{\theta}(\mathbf{x})$.
+# In the training loss etc., we need to be careful to not switch up the signs. + +# %% [markdown] +# ### Sampling buffer +# +# In the next part, we look at the training with sampled elements. +# To use the contrastive divergence objective, we need to generate samples during training. +# Previous work has shown that due to the high dimensionality of images, we need a lot of iterations +# inside the MCMC sampling to obtain reasonable samples. +# However, there is a training trick that significantly reduces the sampling cost: using a sampling buffer. +# The idea is that we store the samples of the last couple of batches in a buffer, +# and re-use those as the starting point of the MCMC algorithm for the next batches. +# This reduces the sampling cost because the model requires a significantly +# lower number of steps to converge to reasonable samples. +# However, to not solely rely on previous samples and allow novel samples as well, +# we re-initialize 5% of our samples from scratch (random noise between -1 and 1). +# +# Below, we implement the sampling buffer. +# The function `sample_new_exmps` returns a new batch of "fake" images. +# We refer to those as fake images because they have been generated, but are not actually part of the dataset. +# As mentioned before, we initialize 5% randomly, and 95% are randomly picked from our buffer. +# On this initial batch, we perform MCMC for 60 iterations to improve the image quality +# and come closer to samples from $q_{\theta}(\mathbf{x})$. +# In the function `generate_samples`, we implemented the MCMC for images. +# Note that the hyperparameters of `step_size`, `steps`, the noise standard deviation +# $\sigma$ are specifically set for MNIST, and need to be finetuned for a different dataset if you want to use such. 
# %%
class Sampler:
    """Sampling buffer plus MCMC sampler used to draw "fake" images from the energy model."""

    def __init__(self, model, img_shape, sample_size, max_len=8192):
        """
        Args:
            model: Neural network to use for modeling E_theta
            img_shape: Shape of the images to model
            sample_size: Batch size of the samples
            max_len: Maximum number of data points to keep in the buffer
        """
        super().__init__()
        self.model = model
        self.img_shape = img_shape
        self.sample_size = sample_size
        self.max_len = max_len
        # Buffer of single images (leading dimension 1), initialized with uniform noise in [-1, 1)
        self.examples = [(torch.rand((1,) + img_shape) * 2 - 1) for _ in range(self.sample_size)]

    def sample_new_exmps(self, steps=60, step_size=10):
        """Function for getting a new batch of "fake" images.

        Args:
            steps: Number of iterations in the MCMC algorithm
            step_size: Learning rate nu in the algorithm above

        Returns:
            The batch of sampled images (on the module-level `device`).
        """
        # Choose 95% of the batch from the buffer, 5% generate from scratch
        n_new = np.random.binomial(self.sample_size, 0.05)
        n_old = self.sample_size - n_new
        start_imgs = [torch.rand((n_new,) + self.img_shape) * 2 - 1]
        # The binomial draw can make the whole batch "new" (likely for small sample sizes);
        # torch.cat cannot handle an empty list, so only add buffer images if there are any.
        if n_old > 0:
            start_imgs.extend(random.choices(self.examples, k=n_old))
        inp_imgs = torch.cat(start_imgs, dim=0).detach().to(device)

        # Perform MCMC sampling
        inp_imgs = Sampler.generate_samples(self.model, inp_imgs, steps=steps, step_size=step_size)

        # Add new images to the front of the buffer and drop the oldest ones if needed.
        # Detach first so that buffer entries do not keep autograd history alive.
        new_examples = list(inp_imgs.detach().to(torch.device("cpu")).chunk(self.sample_size, dim=0))
        self.examples = (new_examples + self.examples)[: self.max_len]
        return inp_imgs

    @staticmethod
    def generate_samples(model, inp_imgs, steps=60, step_size=10, return_img_per_step=False):
        """Function for sampling images for a given model.

        The model's train/eval mode, the `requires_grad` flag of every parameter and the global
        gradient mode are restored to their values from before the call, also if an error occurs.

        Args:
            model: Neural network to use for modeling E_theta
            inp_imgs: Images to start from for sampling. If you want to generate new images, enter noise between -1 and 1.
                The tensor is updated in-place and gets `requires_grad=True`.
            steps: Number of iterations in the MCMC algorithm.
            step_size: Learning rate nu in the algorithm above
            return_img_per_step: If True, we return the sample at every iteration of the MCMC

        Returns:
            `inp_imgs` after the last step, or the stacked per-step samples if `return_img_per_step` is True.
        """
        # Remember the state we are about to change so that it can be restored exactly.
        # In particular, parameters that were frozen by the caller must stay frozen.
        is_training = model.training
        params = list(model.parameters())
        prev_requires_grad = [p.requires_grad for p in params]
        had_gradients_enabled = torch.is_grad_enabled()

        # List for storing generations at each step (for later analysis)
        imgs_per_step = []

        try:
            # Before MCMC: we are only interested in the gradients of the input,
            # so gradients for the model parameters are switched off.
            model.eval()
            for p in params:
                p.requires_grad = False
            inp_imgs.requires_grad = True

            # Enable gradient calculation if not already the case
            torch.set_grad_enabled(True)

            # We use a buffer tensor in which we generate noise each loop iteration.
            # More efficient than creating a new tensor every iteration.
            noise = torch.randn(inp_imgs.shape, device=inp_imgs.device)

            # Loop over K (steps)
            for _ in range(steps):
                # Part 1: Add noise to the input.
                noise.normal_(0, 0.005)
                inp_imgs.data.add_(noise.data)
                inp_imgs.data.clamp_(min=-1.0, max=1.0)

                # Part 2: calculate gradients for the current input.
                out_imgs = -model(inp_imgs)
                out_imgs.sum().backward()
                inp_imgs.grad.data.clamp_(-0.03, 0.03)  # For stabilizing and preventing too high gradients

                # Apply gradients to our current samples
                inp_imgs.data.add_(-step_size * inp_imgs.grad.data)
                inp_imgs.grad.detach_()
                inp_imgs.grad.zero_()
                inp_imgs.data.clamp_(min=-1.0, max=1.0)

                if return_img_per_step:
                    imgs_per_step.append(inp_imgs.clone().detach())
        finally:
            # Restore parameter flags, model mode and gradient mode to the state before this function
            for p, flag in zip(params, prev_requires_grad):
                p.requires_grad = flag
            model.train(is_training)
            torch.set_grad_enabled(had_gradients_enabled)

        if return_img_per_step:
            return torch.stack(imgs_per_step, dim=0)
        return inp_imgs


# %% [markdown]
# The idea of the buffer becomes a bit clearer in the following algorithm.
+ +# %% [markdown] +# ### Training algorithm +# +# With the sampling buffer being ready, we can complete our training algorithm. +# Below is shown a summary of the full training algorithm of an energy model on image modeling: +# +#
#
# The first few statements in each training iteration concern the sampling of the real and fake data,
# as we have seen above with the sample buffer.
# Next, we calculate the contrastive divergence objective using our energy model $E_{\theta}$.
# However, one additional training trick we need is to add a regularization loss on the output of $E_{\theta}$.
# As the output of the network is not constrained and adding a large bias or not to the output
# doesn't change the contrastive divergence loss, we need to ensure somehow else that the output values are in a reasonable range.
# Without the regularization loss, the output values will fluctuate in a very large range.
# With this, we ensure that the values for the real data are around 0, and the fake data likely slightly lower
# (for noise or outliers the score can be still significantly lower).
# As the regularization loss is less important than the Contrastive Divergence, we have a weight factor
# $\alpha$ which is usually considerably smaller than 1.
# Finally, we perform an update step with an optimizer on the combined loss and add the new samples to the buffer.
#
# Below, we put this training dynamic into a PyTorch Lightning module:


# %%
class DeepEnergyModel(L.LightningModule):
    """Lightning module that trains a CNN energy model with contrastive divergence."""

    def __init__(self, img_shape, batch_size, alpha=0.1, lr=1e-4, beta1=0.0, **CNN_args):
        """
        Args:
            img_shape: Shape of a single image, passed on to the sampler
            batch_size: Number of fake images the sampler produces per step
            alpha: Weight of the regularization loss
            lr: Learning rate of the Adam optimizer
            beta1: First beta coefficient of the Adam optimizer
            CNN_args: Keyword arguments forwarded to ``CNNModel``
        """
        super().__init__()
        # Makes the constructor arguments available as self.hparams
        self.save_hyperparameters()

        self.cnn = CNNModel(**CNN_args)
        self.sampler = Sampler(self.cnn, img_shape=img_shape, sample_size=batch_size)
        self.example_input_array = torch.zeros(1, *img_shape)

    def forward(self, x):
        """Return the output of the CNN for the images ``x``."""
        return self.cnn(x)

    def configure_optimizers(self):
        """Create the Adam optimizer and a per-epoch step-decay scheduler."""
        # Energy models can have issues with momentum as the loss surfaces changes with its parameters.
        # Hence, we set it to 0 by default.
        hparams = self.hparams
        adam = optim.Adam(self.parameters(), lr=hparams.lr, betas=(hparams.beta1, 0.999))
        decay = optim.lr_scheduler.StepLR(adam, 1, gamma=0.97)  # Exponential decay over epochs
        return [adam], [decay]

    def training_step(self, batch, batch_idx):
        """Compute the regularized contrastive divergence loss for one batch."""
        # We add minimal noise to the original images to prevent the model from focusing on purely "clean" inputs
        real_imgs, _ = batch
        real_imgs.add_(torch.randn_like(real_imgs) * 0.005)
        real_imgs.clamp_(min=-1.0, max=1.0)

        # Obtain samples
        fake_imgs = self.sampler.sample_new_exmps(steps=60, step_size=10)

        # Predict energy score for all images
        scores = self.cnn(torch.cat([real_imgs, fake_imgs], dim=0))
        real_out, fake_out = scores.chunk(2, dim=0)

        # Calculate losses
        reg_loss = self.hparams.alpha * (real_out**2 + fake_out**2).mean()
        cdiv_loss = fake_out.mean() - real_out.mean()
        loss = reg_loss + cdiv_loss

        # Logging
        metrics = {
            "loss": loss,
            "loss_regularization": reg_loss,
            "loss_contrastive_divergence": cdiv_loss,
            "metrics_avg_real": real_out.mean(),
            "metrics_avg_fake": fake_out.mean(),
        }
        for name, value in metrics.items():
            self.log(name, value)
        return loss

    def validation_step(self, batch, batch_idx):
        """Log the contrastive divergence between uniform noise images and the batch."""
        # For validating, we calculate the contrastive divergence between purely random images and unseen examples
        # Note that the validation/test step of energy-based models depends on what we are interested in the model
        real_imgs, _ = batch
        noise_imgs = torch.rand_like(real_imgs) * 2 - 1

        scores = self.cnn(torch.cat([real_imgs, noise_imgs], dim=0))
        real_out, fake_out = scores.chunk(2, dim=0)

        self.log("val_contrastive_divergence", fake_out.mean() - real_out.mean())
        self.log("val_fake_out", fake_out.mean())
        self.log("val_real_out", real_out.mean())


# %% [markdown]
# We do not implement a test step because energy-based, generative models are usually not evaluated on a test set.
+# The validation step, however, is used to get an idea of the difference between the energy/likelihood +# of random images and unseen examples of the dataset. + +# %% [markdown] +# ### Callbacks +# +# To track the performance of our model during training, we will make extensive use of PyTorch Lightning's callback framework. +# Remember that callbacks can be used for running small functions at any point of the training, +# for instance after finishing an epoch. +# Here, we will use three different callbacks we define ourselves. +# +# The first callback, called `GenerateCallback`, is used for adding image generations to TensorBoard during training. +# After every $N$ epochs (usually $N=5$ to reduce output to TensorBoard), we take a small batch +# of random images and perform many MCMC iterations until the model's generation converges. +# Compared to the training that used 60 iterations, we use 256 here because +# (1) we only have to do it once compared to the training that has to do it every iteration, and +# (2) we do not start from a buffer here, but from scratch. 
# It is implemented as follows:


# %%
class GenerateCallback(Callback):
    """Callback that generates images from noise via MCMC and logs them to the trainer's logger."""

    def __init__(self, batch_size=8, vis_steps=8, num_steps=256, every_n_epochs=5):
        super().__init__()
        self.batch_size = batch_size  # Number of images to generate
        self.vis_steps = vis_steps  # Number of steps within generation to visualize
        self.num_steps = num_steps  # Number of steps to take during generation
        # Only save those images every N epochs (otherwise tensorboard gets quite large)
        self.every_n_epochs = every_n_epochs

    def on_train_epoch_end(self, trainer, pl_module):
        """Generate images and add one grid per generated image to the logger.

        This uses the ``on_train_epoch_end`` hook because the generic ``on_epoch_end``
        hook is not part of the Lightning 2.x callback API.
        """
        # Skip for all other epochs
        if trainer.current_epoch % self.every_n_epochs != 0:
            return
        # Generate images
        imgs_per_step = self.generate_imgs(pl_module)
        # Distance between two visualized MCMC steps (at least 1 so the slice below stays valid)
        step_size = max(1, self.num_steps // self.vis_steps)
        # Plot and add to tensorboard
        for i in range(imgs_per_step.shape[1]):
            imgs_to_plot = imgs_per_step[step_size - 1 :: step_size, i]
            # `value_range` is the current name of the deprecated `range` argument
            grid = torchvision.utils.make_grid(
                imgs_to_plot, nrow=imgs_to_plot.shape[0], normalize=True, value_range=(-1, 1)
            )
            trainer.logger.experiment.add_image("generation_%i" % i, grid, global_step=trainer.current_epoch)

    def generate_imgs(self, pl_module):
        """Run ``num_steps`` MCMC steps from uniform noise and return the sample of every step.

        The train/eval mode that ``pl_module`` had before the call is restored afterwards.
        """
        was_training = pl_module.training
        pl_module.eval()
        start_imgs = torch.rand((self.batch_size,) + pl_module.hparams["img_shape"]).to(pl_module.device)
        start_imgs = start_imgs * 2 - 1
        imgs_per_step = Sampler.generate_samples(
            pl_module.cnn, start_imgs, steps=self.num_steps, step_size=10, return_img_per_step=True
        )
        pl_module.train(was_training)
        return imgs_per_step


# %% [markdown]
# The second callback is called `SamplerCallback`, and simply adds a randomly picked subset of images
# in the sampling buffer to the TensorBoard.
# This helps to understand what images are currently shown to the model as "fake".
# %%
class SamplerCallback(Callback):
    """Callback that logs a random subset of the sampling buffer as an image grid."""

    def __init__(self, num_imgs=32, every_n_epochs=5):
        super().__init__()
        self.num_imgs = num_imgs  # Number of images to plot
        # Only save those images every N epochs (otherwise tensorboard gets quite large)
        self.every_n_epochs = every_n_epochs

    def on_train_epoch_end(self, trainer, pl_module):
        """Add a grid of randomly picked buffer images to the logger.

        This uses the ``on_train_epoch_end`` hook because the generic ``on_epoch_end``
        hook is not part of the Lightning 2.x callback API.
        """
        if trainer.current_epoch % self.every_n_epochs != 0:
            return
        exmp_imgs = torch.cat(random.choices(pl_module.sampler.examples, k=self.num_imgs), dim=0)
        # `value_range` is the current name of the deprecated `range` argument
        grid = torchvision.utils.make_grid(exmp_imgs, nrow=4, normalize=True, value_range=(-1, 1))
        trainer.logger.experiment.add_image("sampler", grid, global_step=trainer.current_epoch)


# %% [markdown]
# Finally, our last callback is `OutlierCallback`.
# This callback evaluates the model by recording the (negative) energy assigned to random noise.
# While our training loss is almost constant across iterations,
# this score is likely showing the progress of the model to detect "outliers".


# %%
class OutlierCallback(Callback):
    """Callback that logs the mean model output for a batch of uniform noise images."""

    def __init__(self, batch_size=1024):
        super().__init__()
        self.batch_size = batch_size

    def on_train_epoch_end(self, trainer, pl_module):
        """Score ``batch_size`` noise images and log the mean as ``rand_out``.

        The train/eval mode that ``pl_module`` had before the call is restored afterwards.
        """
        was_training = pl_module.training
        with torch.no_grad():
            pl_module.eval()
            rand_imgs = torch.rand((self.batch_size,) + pl_module.hparams["img_shape"]).to(pl_module.device)
            rand_imgs = rand_imgs * 2 - 1.0
            rand_out = pl_module.cnn(rand_imgs).mean()
            pl_module.train(was_training)

        trainer.logger.experiment.add_scalar("rand_out", rand_out, global_step=trainer.current_epoch)


# %% [markdown]
# ### Running the model
#
# Finally, we can add everything together to create our final training function.
# The function is very similar to any other PyTorch Lightning training function we have seen so far.
# However, there is the small difference of that we do not test the model on a test set
# because we will analyse the model afterward by checking its prediction and ability to perform outlier detection.
# %%
def train_model(**kwargs):
    """Return a trained ``DeepEnergyModel``, loading the pretrained checkpoint if one exists.

    Args:
        kwargs: Keyword arguments forwarded to ``DeepEnergyModel`` when training from scratch
    """
    monitoring = [
        ModelCheckpoint(save_weights_only=True, mode="min", monitor="val_contrastive_divergence"),
        GenerateCallback(every_n_epochs=5),
        SamplerCallback(every_n_epochs=5),
        OutlierCallback(),
        LearningRateMonitor("epoch"),
    ]
    # Create a PyTorch Lightning trainer with the generation callback
    trainer = L.Trainer(
        default_root_dir=os.path.join(CHECKPOINT_PATH, "MNIST"),
        accelerator="auto",
        devices=1,
        max_epochs=60,
        gradient_clip_val=0.1,
        callbacks=monitoring,
    )

    # Check whether pretrained model exists. If yes, load it and skip training
    pretrained_filename = os.path.join(CHECKPOINT_PATH, "MNIST.ckpt")
    if os.path.isfile(pretrained_filename):
        print("Found pretrained model, loading...")
        return DeepEnergyModel.load_from_checkpoint(pretrained_filename)

    L.seed_everything(42)
    fresh_model = DeepEnergyModel(**kwargs)
    trainer.fit(fresh_model, train_loader, test_loader)
    # No testing as we are more interested in other properties
    return DeepEnergyModel.load_from_checkpoint(trainer.checkpoint_callback.best_model_path)


# %%
model = train_model(img_shape=(1, 28, 28), batch_size=train_loader.batch_size, lr=1e-4, beta1=0.0)

# %% [markdown]
# ## Analysis
#
# In the last part of the notebook, we will try to take the trained energy-based generative model,
# and analyse its properties.

# %% [markdown]
# ### TensorBoard
#
# The first thing we can look at is the TensorBoard generated during training.
# This can help us to understand the training dynamic even better, and shows potential issues.
# Let's load the TensorBoard below:

# %%
# Uncomment the following two lines to open a tensorboard in the notebook.
# Adjust the path to your CHECKPOINT_PATH if needed.
# %load_ext tensorboard
# %tensorboard --logdir ../saved_models/tutorial8/tensorboards/

# %% [markdown]
#
+ +# %% [markdown] +# We see that the contrastive divergence as well as the regularization converge quickly to 0. +# However, the training continues although the loss is always close to zero. +# This is because our "training" data changes with the model by sampling. +# The progress of training can be best measured by looking at the samples across iterations, +# and the score for random images that decreases constantly over time. + +# %% [markdown] +# ### Image Generation +# +# Another way of evaluating generative models is by sampling a few generated images. +# Generative models need to be good at generating realistic images as this truly shows that they have modeled the true data distribution. +# Thus, let's sample a few images of the model below: + +# %% +model.to(device) +L.seed_everything(43) +callback = GenerateCallback(batch_size=4, vis_steps=8, num_steps=256) +imgs_per_step = callback.generate_imgs(model) +imgs_per_step = imgs_per_step.cpu() + +# %% [markdown] +# The characteristic of sampling with energy-based models is that they require the iterative MCMC algorithm. 
# To gain an insight in how the images change over iterations, we plot a few intermediate samples in the MCMC as well:

# %%
# Distance between two visualized MCMC steps; it is the same for every generated image
step_size = callback.num_steps // callback.vis_steps
for i in range(imgs_per_step.shape[1]):
    # Every `step_size`-th sample of image i, preceded by the sample after the very first step
    imgs_to_plot = imgs_per_step[step_size - 1 :: step_size, i]
    imgs_to_plot = torch.cat([imgs_per_step[0:1, i], imgs_to_plot], dim=0)
    # `value_range` is the current name of the deprecated `range` argument
    grid = torchvision.utils.make_grid(
        imgs_to_plot, nrow=imgs_to_plot.shape[0], normalize=True, value_range=(-1, 1), pad_value=0.5, padding=2
    )
    grid = grid.permute(1, 2, 0)
    plt.figure(figsize=(8, 8))
    plt.imshow(grid)
    plt.xlabel("Generation iteration")
    # One tick in the middle of every image (image width plus the padding of 2)
    plt.xticks(
        [(imgs_per_step.shape[-1] + 2) * (0.5 + j) for j in range(callback.vis_steps + 1)],
        labels=[1] + list(range(step_size, imgs_per_step.shape[0] + 1, step_size)),
    )
    plt.yticks([])
    plt.show()

# %% [markdown]
# We see that although starting from noise in the very first step, the sampling algorithm obtains reasonable shapes after only 32 steps.
# Over the next 200 steps, the shapes become clearer and changed towards realistic digits.
# The specific samples can differ when you run the code on Colab, hence the following description is specific to the plots shown on the website.
# The first row shows an 8, where we remove unnecessary white parts over iterations.
# The transformation across iterations can be seen at best for the second sample, which creates a digit of 2.
# While the first sample after 32 iterations looks a bit like a digit, but not really,
# the sample is transformed more and more to a typical image of the digit 2.

# %% [markdown]
# ### Out-of-distribution detection
#
# A very common and strong application of energy-based models is out-of-distribution detection
# (sometimes referred to as "anomaly" detection).
# As more and more deep learning models are applied in production and applications,
# a crucial aspect of these models is to know what the models don't know.
+# Deep learning models are usually overconfident, meaning that they classify even random images sometimes with 100% probability. +# Clearly, this is not something that we want to see in applications. +# Energy-based models can help with this problem because they are trained to detect images that do not fit the training dataset distribution. +# Thus, in those applications, you could train an energy-based model along with the classifier, +# and only output predictions if the energy-based models assign a (unnormalized) probability higher than $\delta$ to the image. +# You can actually combine classifiers and energy-based objectives in a single model, +# as proposed in this [paper](https://arxiv.org/abs/1912.03263). +# +# In this part of the analysis, we want to test the out-of-distribution capability of our energy-based model. +# Remember that a lower output of the model denotes a low probability. +# Thus, we hope to see low scores if we enter random noise to the model: + +# %% +with torch.no_grad(): + rand_imgs = torch.rand((128,) + model.hparams.img_shape).to(model.device) + rand_imgs = rand_imgs * 2 - 1.0 + rand_out = model.cnn(rand_imgs).mean() + print("Average score for random images: %4.2f" % (rand_out.item())) + +# %% [markdown] +# As we hoped, the model assigns very low probability to those noisy images. +# As another reference, let's look at predictions for a batch of images from the training set: + +# %% +with torch.no_grad(): + train_imgs, _ = next(iter(train_loader)) + train_imgs = train_imgs.to(model.device) + train_out = model.cnn(train_imgs).mean() + print("Average score for training images: %4.2f" % (train_out.item())) + +# %% [markdown] +# The scores are close to 0 because of the regularization objective that was added to the training. +# So clearly, the model can distinguish between noise and real digits. +# However, what happens if we change the training images a little, and see which ones gets a very low score? 
# %%
@torch.no_grad()
def compare_images(img1, img2):
    """Plot two images side by side and print the model score of each.

    Args:
        img1: The original image
        img2: The transformed image, same shape as ``img1``
    """
    imgs = torch.stack([img1, img2], dim=0).to(model.device)
    score1, score2 = model.cnn(imgs).cpu().chunk(2, dim=0)
    # `value_range` is the current name of the deprecated `range` argument
    grid = torchvision.utils.make_grid(
        [img1.cpu(), img2.cpu()], nrow=2, normalize=True, value_range=(-1, 1), pad_value=0.5, padding=2
    )
    grid = grid.permute(1, 2, 0)
    plt.figure(figsize=(4, 4))
    plt.imshow(grid)
    # One tick in the middle of each image (image width plus the padding of 2)
    plt.xticks([(img1.shape[2] + 2) * (0.5 + j) for j in range(2)], labels=["Original image", "Transformed image"])
    plt.yticks([])
    plt.show()
    # Each chunk holds the score of a single image; convert it to a Python float for printing
    print("Score original image: %4.2f" % score1.item())
    print("Score transformed image: %4.2f" % score2.item())


# %% [markdown]
# We use a random test image for this. Feel free to change it to experiment with the model yourself.

# %%
test_imgs, _ = next(iter(test_loader))
exmp_img = test_imgs[0].to(model.device)

# %% [markdown]
# The first transformation is to add some random noise to the image:

# %%
img_noisy = exmp_img + torch.randn_like(exmp_img) * 0.3
img_noisy.clamp_(min=-1.0, max=1.0)
compare_images(exmp_img, img_noisy)

# %% [markdown]
# We can see that the score considerably drops.
# Hence, the model can detect random Gaussian noise on the image.
# This is also to expect as initially, the "fake" samples are pure noise images.
#
# Next, we flip an image and check how this influences the score:

# %%
img_flipped = exmp_img.flip(dims=(1, 2))
compare_images(exmp_img, img_flipped)

# %% [markdown]
# If the digit can only be read in this way, for example, the 7, then we can see that the score drops.
# However, the score only drops slightly.
# This is likely because of the small size of our model.
# Keep in mind that generative modeling is a much harder task than classification,
# as we do not only need to distinguish between classes but learn **all** details/characteristics of the digits.
# With a deeper model, this could eventually be captured better (but at the cost of greater training instability).
+# +# Finally, we check what happens if we reduce the digit significantly in size: + +# %% +img_tiny = torch.zeros_like(exmp_img) - 1 +img_tiny[:, exmp_img.shape[1] // 2 :, exmp_img.shape[2] // 2 :] = exmp_img[:, ::2, ::2] +compare_images(exmp_img, img_tiny) + +# %% [markdown] +# The score again drops but not by a large margin, although digits in the MNIST dataset usually are much larger. +# +# Overall, we can conclude that our model is good for detecting Gaussian noise and smaller transformations to existing digits. +# Nonetheless, to obtain a very good out-of-distribution model, we would need to train deeper models and for more iterations. + +# %% [markdown] +# ### Instability +# +# Finally, we should discuss the possible instabilities of energy-based models, +# in particular for the example of image generation that we have implemented in this notebook. +# In the process of hyperparameter search for this notebook, there have been several models that diverged. +# Divergence in energy-based models means that the models assign a high probability to examples of the training set which is a good thing. +# However, at the same time, the sampling algorithm fails and only generates noise images that obtain minimal probability scores. +# This happens because the model has created many local maxima in which the generated noise images fall. +# The energy surface over which we calculate the gradients to reach data points with high probability has "diverged" and is not useful for our MCMC sampling. +# +# Besides finding the optimal hyperparameters, a common trick in energy-based models is to reload stable checkpoints. +# If we detect that the model is diverging, we stop the training, load the model from one epoch ago where it did not diverge yet. +# Afterward, we continue training and hope that with a different seed the model is not diverging again. 
+# Nevertheless, this should be considered as the "last hope" for stabilizing the models, +# and careful hyperparameter tuning is the better way to do so. +# Sensitive hyperparameters include `step_size`, `steps` and the noise standard deviation in the sampler, +# and the learning rate and feature dimensionality in the CNN model. + +# %% [markdown] +# ## Conclusion +# +# In this tutorial, we have discussed energy-based models for generative modeling. +# The concept relies on the idea that any strictly positive function can be turned into a probability +# distribution by normalizing over the whole dataset. +# As this is not reasonable to calculate for high dimensional data like images, +# we train the model using contrastive divergence and sampling via MCMC. +# While the idea allows us to turn any neural network into an energy-based model, +# we have seen that there are multiple training tricks needed to stabilize the training. +# Furthermore, the training time of these models is relatively long as, during every training iteration, +# we need to sample new "fake" images, even with a sampling buffer. +# In the next lectures and assignment, we will see different generative models (e.g. VAE, GAN, NF) +# that allow us to do generative modeling more stably, but with the cost of more parameters. 
diff --git a/_notebooks/course_UvA-DL/07-deep-energy-based-generative-models/contrastive_divergence.svg b/_notebooks/course_UvA-DL/07-deep-energy-based-generative-models/contrastive_divergence.svg new file mode 100644 index 0000000..bc084ae --- /dev/null +++ b/_notebooks/course_UvA-DL/07-deep-energy-based-generative-models/contrastive_divergence.svg @@ -0,0 +1,84 @@ + + + + + + image/svg+xml + + + + + + + + + + + + + + + + + + diff --git a/_notebooks/course_UvA-DL/07-deep-energy-based-generative-models/energy_models_application.png b/_notebooks/course_UvA-DL/07-deep-energy-based-generative-models/energy_models_application.png new file mode 100644 index 0000000..71fee99 Binary files /dev/null and b/_notebooks/course_UvA-DL/07-deep-energy-based-generative-models/energy_models_application.png differ diff --git a/_notebooks/course_UvA-DL/07-deep-energy-based-generative-models/sampling.svg b/_notebooks/course_UvA-DL/07-deep-energy-based-generative-models/sampling.svg new file mode 100644 index 0000000..b6fbd2a --- /dev/null +++ b/_notebooks/course_UvA-DL/07-deep-energy-based-generative-models/sampling.svg @@ -0,0 +1,2562 @@ + + + + + + image/svg+xmldiff --git a/_notebooks/course_UvA-DL/07-deep-energy-based-generative-models/tensorboard_screenshot.png b/_notebooks/course_UvA-DL/07-deep-energy-based-generative-models/tensorboard_screenshot.png new file mode 100644 index 0000000..e514684 Binary files /dev/null and b/_notebooks/course_UvA-DL/07-deep-energy-based-generative-models/tensorboard_screenshot.png differ diff --git a/_notebooks/course_UvA-DL/07-deep-energy-based-generative-models/training_algorithm.svg b/_notebooks/course_UvA-DL/07-deep-energy-based-generative-models/training_algorithm.svg new file mode 100644 index 0000000..b1c76d6 --- /dev/null +++ b/_notebooks/course_UvA-DL/07-deep-energy-based-generative-models/training_algorithm.svg @@ -0,0 +1,5567 @@ + + + + + + image/svg+xmldiff --git a/_notebooks/course_UvA-DL/08-deep-autoencoders/.meta.yml 
b/_notebooks/course_UvA-DL/08-deep-autoencoders/.meta.yml new file mode 100644 index 0000000..5c4df67 --- /dev/null +++ b/_notebooks/course_UvA-DL/08-deep-autoencoders/.meta.yml @@ -0,0 +1,28 @@ +title: "Tutorial 8: Deep Autoencoders" +author: Phillip Lippe +created: 2021-07-12 +updated: 2023-03-14 +license: CC BY-SA +build: 0 +tags: + - Image +description: | + In this tutorial, we will take a closer look at autoencoders (AE). + Autoencoders are trained on encoding input data such as images into a smaller feature vector, + and afterward, reconstruct it by a second neural network, called a decoder. + The feature vector is called the "bottleneck" of the network as we aim to compress the input data into a smaller amount of features. + This property is useful in many applications, in particular in compressing data or comparing images on a metric beyond pixel-level comparisons. + Besides learning about the autoencoder framework, we will also see the "deconvolution" + (or transposed convolution) operator in action for scaling up feature maps in height and width. + Such deconvolution networks are necessary wherever we start from a small feature vector + and need to output an image of full size (e.g. in VAE, GANs, or super-resolution applications). + This notebook is part of a lecture series on Deep Learning at the University of Amsterdam. + The full list of tutorials can be found at https://uvadlc-notebooks.rtfd.io. 
+requirements: + - torchvision + - matplotlib + - seaborn + - lightning>=2.0.0rc0 +accelerator: + - CPU + - GPU diff --git a/docs/_static/images/course_UvA-DL/08-deep-autoencoders.jpg b/_notebooks/course_UvA-DL/08-deep-autoencoders/.thumb.jpg similarity index 100% rename from docs/_static/images/course_UvA-DL/08-deep-autoencoders.jpg rename to _notebooks/course_UvA-DL/08-deep-autoencoders/.thumb.jpg diff --git a/_notebooks/course_UvA-DL/08-deep-autoencoders/Deep_Autoencoders.py b/_notebooks/course_UvA-DL/08-deep-autoencoders/Deep_Autoencoders.py new file mode 100644 index 0000000..da289b9 --- /dev/null +++ b/_notebooks/course_UvA-DL/08-deep-autoencoders/Deep_Autoencoders.py @@ -0,0 +1,713 @@ +# %% [markdown] +#
+ +# %% +import os +import urllib.request +from urllib.error import HTTPError + +import lightning as L +import matplotlib +import matplotlib.pyplot as plt +import matplotlib_inline.backend_inline +import seaborn as sns +import torch +import torch.nn as nn +import torch.nn.functional as F +import torch.optim as optim +import torch.utils.data as data +import torchvision +from lightning.pytorch.callbacks import Callback, LearningRateMonitor, ModelCheckpoint +from torch.utils.tensorboard import SummaryWriter +from torchvision import transforms +from torchvision.datasets import CIFAR10 +from tqdm.notebook import tqdm + +# %matplotlib inline +matplotlib_inline.backend_inline.set_matplotlib_formats("svg", "pdf") # For export +matplotlib.rcParams["lines.linewidth"] = 2.0 +sns.reset_orig() +sns.set() + +# Tensorboard extension (for visualization purposes later) +# %load_ext tensorboard + +# Path to the folder where the datasets are/should be downloaded (e.g. CIFAR10) +DATASET_PATH = os.environ.get("PATH_DATASETS", "data") +# Path to the folder where the pretrained models are saved +CHECKPOINT_PATH = os.environ.get("PATH_CHECKPOINT", "saved_models/tutorial9") + +# Setting the seed +L.seed_everything(42) + +# Ensure that all operations are deterministic on GPU (if used) for reproducibility +torch.backends.cudnn.deterministic = True +torch.backends.cudnn.benchmark = False + +device = torch.device("cuda:0") if torch.cuda.is_available() else torch.device("cpu") +print("Device:", device) + +# %% [markdown] +# We have 4 pretrained models that we have to download. +# Remember the adjust the variables `DATASET_PATH` and `CHECKPOINT_PATH` if needed. 
+ +# %% +# Github URL where saved models are stored for this tutorial +base_url = "https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial9/" +# Files to download +pretrained_files = ["cifar10_64.ckpt", "cifar10_128.ckpt", "cifar10_256.ckpt", "cifar10_384.ckpt"] +# Create checkpoint path if it doesn't exist yet +os.makedirs(CHECKPOINT_PATH, exist_ok=True) + +# For each file, check whether it already exists. If not, try downloading it. +for file_name in pretrained_files: + file_path = os.path.join(CHECKPOINT_PATH, file_name) + if not os.path.isfile(file_path): + file_url = base_url + file_name + print("Downloading %s..." % file_url) + try: + urllib.request.urlretrieve(file_url, file_path) + except HTTPError as e: + print( + "Something went wrong. Please try to download the files manually," + " or contact the author with the full output including the following error:\n", + e, + ) + +# %% [markdown] +# In this tutorial, we work with the CIFAR10 dataset. +# In CIFAR10, each image has 3 color channels and is 32x32 pixels large. +# As autoencoders do not have the constrain of modeling images probabilistic, we can work on more complex image data +# (i.e. 3 color channels instead of black-and-white) much easier than for VAEs. +# In case you have downloaded CIFAR10 already in a different directory, make sure to set DATASET_PATH +# accordingly to prevent another download. +# +# In contrast to previous tutorials on CIFAR10 like +# [Tutorial 5](https://uvadlc-notebooks.readthedocs.io/en/latest/tutorial_notebooks/tutorial5/Inception_ResNet_DenseNet.html) +# (CNN classification), we do not normalize the data explicitly with a mean of 0 and std of 1, +# but roughly estimate it scaling the data between -1 and 1. +# This is because limiting the range will make our task of predicting/reconstructing images easier. 
# %%
# Transformations applied on each image => make them a tensor and scale the values to [-1, 1]
transform = transforms.Compose([transforms.ToTensor(), transforms.Normalize((0.5,), (0.5,))])

# Loading the training dataset. We need to split it into a training and validation part
train_dataset = CIFAR10(root=DATASET_PATH, train=True, transform=transform, download=True)
L.seed_everything(42)
train_set, val_set = torch.utils.data.random_split(train_dataset, [45000, 5000])

# Loading the test set
test_set = CIFAR10(root=DATASET_PATH, train=False, transform=transform, download=True)

# We define a set of data loaders that we can use for various purposes later.
# Only the training loader shuffles, drops the last incomplete batch and pins memory.
train_loader = data.DataLoader(train_set, batch_size=256, shuffle=True, drop_last=True, pin_memory=True, num_workers=4)
eval_loader_kwargs = dict(batch_size=256, shuffle=False, drop_last=False, num_workers=4)
val_loader = data.DataLoader(val_set, **eval_loader_kwargs)
test_loader = data.DataLoader(test_set, **eval_loader_kwargs)


def get_train_images(num):
    """Return the first ``num`` images of ``train_dataset`` stacked along a new first dimension."""
    images = []
    for idx in range(num):
        image, _ = train_dataset[idx]
        images.append(image)
    return torch.stack(images, dim=0)


# %% [markdown]
# ## Building the autoencoder
#
# In general, an autoencoder consists of an **encoder** that maps the input $x$ to a lower-dimensional feature vector $z$,
# and a **decoder** that reconstructs the input $\hat{x}$ from $z$.
# We train the model by comparing $x$ to $\hat{x}$ and optimizing the parameters to increase the similarity between $x$ and $\hat{x}$.
# See below for a small illustration of the autoencoder framework.

# %% [markdown]
#
# %% [markdown]
# We first start by implementing the encoder.
# The encoder effectively consists of a deep convolutional network, where we scale down the image layer-by-layer using strided convolutions.
# After downscaling the image three times, we flatten the features and apply linear layers.
# The latent representation $z$ is therefore a vector of size *d* which can be flexibly selected.


# %%
class Encoder(nn.Module):
    """Convolutional encoder that maps a 32x32 image to a latent vector."""

    def __init__(self, num_input_channels: int, base_channel_size: int, latent_dim: int, act_fn: object = nn.GELU):
        """
        Args:
           num_input_channels : Number of input channels of the image. For CIFAR, this parameter is 3
           base_channel_size : Number of channels we use in the first convolutional layers. Deeper layers might use a duplicate of it.
           latent_dim : Dimensionality of latent representation z
           act_fn : Activation function used throughout the encoder network
        """
        super().__init__()
        width = base_channel_size
        # (in_channels, out_channels, stride) of each 3x3 convolution; a stride of 2 halves the resolution
        conv_specs = [
            (num_input_channels, width, 2),  # 32x32 => 16x16
            (width, width, 1),
            (width, 2 * width, 2),  # 16x16 => 8x8
            (2 * width, 2 * width, 1),
            (2 * width, 2 * width, 2),  # 8x8 => 4x4
        ]
        layers = []
        for in_channels, out_channels, stride in conv_specs:
            layers.append(nn.Conv2d(in_channels, out_channels, kernel_size=3, padding=1, stride=stride))
            layers.append(act_fn())
        layers.append(nn.Flatten())  # Image grid to single feature vector
        layers.append(nn.Linear(2 * 16 * width, latent_dim))
        self.net = nn.Sequential(*layers)

    def forward(self, x):
        """Encode the image batch ``x`` into latent vectors."""
        latent = self.net(x)
        return latent


# %% [markdown]
# Note that we do not apply Batch Normalization here.
# This is because we want the encoding of each image to be independent of all the other images.
# Otherwise, we might introduce correlations into the encoding or decoding that we do not want to have.
# In some implementations, you still can see Batch Normalization being used, because it can also serve as a form of regularization.
+# Nevertheless, the better practice is to go with other normalization techniques if necessary like Instance Normalization or Layer Normalization. +# Given the small size of the model, we can neglect normalization for now. + +# %% [markdown] +# The decoder is a mirrored, flipped version of the encoder. +# The only difference is that we replace strided convolutions by transposed convolutions +# (i.e. deconvolutions) to upscale the features. +# Transposed convolutions can be imagined as adding the stride to the input instead of the output, +# and can thus upscale the input. +# For an illustration of a `nn.ConvTranspose2d` layer with kernel size 3, stride 2, and padding 1, +# see below (figure credit - [Vincent Dumoulin and Francesco Visin](https://arxiv.org/abs/1603.07285)): +# +#
class Decoder(nn.Module):
    """Mirror image of the encoder: maps a latent vector back to an image.

    A linear layer expands the latent vector, the result is reshaped to a 4x4 feature map, and three
    transposed convolutions double the spatial size each time (4x4 => 8x8 => 16x16 => 32x32).
    """

    def __init__(self, num_input_channels: int, base_channel_size: int, latent_dim: int, act_fn: object = nn.GELU):
        """
        Args:
           num_input_channels : Number of channels of the image to reconstruct. For CIFAR, this parameter is 3
           base_channel_size : Number of channels used in the last convolutional layers. Early layers use twice as many.
           latent_dim : Dimensionality of latent representation z
           act_fn : Activation function class instantiated after every hidden layer
        """
        super().__init__()
        narrow = base_channel_size
        wide = 2 * narrow

        def upsample(in_channels, out_channels):
            # `output_padding=1` makes the stride-2 transposed convolution exactly double the size.
            return nn.ConvTranspose2d(
                in_channels, out_channels, kernel_size=3, output_padding=1, padding=1, stride=2
            )

        def refine(channels):
            return nn.Conv2d(channels, channels, kernel_size=3, padding=1)

        self.linear = nn.Sequential(nn.Linear(latent_dim, 16 * wide), act_fn())
        self.net = nn.Sequential(
            upsample(wide, wide),  # 4x4 => 8x8
            act_fn(),
            refine(wide),
            act_fn(),
            upsample(wide, narrow),  # 8x8 => 16x16
            act_fn(),
            refine(narrow),
            act_fn(),
            upsample(narrow, num_input_channels),  # 16x16 => 32x32
            nn.Tanh(),  # The input images are scaled between -1 and 1, hence the output has to be bounded as well
        )

    def forward(self, x):
        """Decode the latent batch ``x`` into images."""
        features = self.linear(x)
        # Fold the flat feature vector back into a 4x4 grid; the channel count is inferred.
        features = features.reshape(features.shape[0], -1, 4, 4)
        return self.net(features)
class Autoencoder(L.LightningModule):
    """Lightning module that chains an encoder and a decoder and trains them on reconstruction error."""

    def __init__(
        self,
        base_channel_size: int,
        latent_dim: int,
        encoder_class: object = Encoder,
        decoder_class: object = Decoder,
        num_input_channels: int = 3,
        width: int = 32,
        height: int = 32,
    ):
        """
        Args:
            base_channel_size: Channel count handed to the encoder and decoder.
            latent_dim: Dimensionality of the latent representation z.
            encoder_class: Class instantiated as ``encoder_class(num_input_channels, base_channel_size, latent_dim)``.
            decoder_class: Class instantiated as ``decoder_class(num_input_channels, base_channel_size, latent_dim)``.
            num_input_channels: Number of image channels.
            width: Image width, used only for the example input array.
            height: Image height, used only for the example input array.
        """
        super().__init__()
        # Saving hyperparameters of autoencoder
        self.save_hyperparameters()
        # Creating encoder and decoder
        self.encoder = encoder_class(num_input_channels, base_channel_size, latent_dim)
        self.decoder = decoder_class(num_input_channels, base_channel_size, latent_dim)
        # Example input array needed for visualizing the graph of the network.
        # PyTorch image batches are laid out as (N, C, H, W), so height comes before width.
        self.example_input_array = torch.zeros(2, num_input_channels, height, width)

    def forward(self, x):
        """The forward function takes in an image and returns the reconstructed image."""
        z = self.encoder(x)
        x_hat = self.decoder(z)
        return x_hat

    def _get_reconstruction_loss(self, batch):
        """Given a batch of images, this function returns the reconstruction loss (MSE in our case).

        The squared error is summed over dimensions 1-3 of every sample and then averaged over the batch dimension.
        """
        x, _ = batch  # We do not need the labels
        x_hat = self.forward(x)
        loss = F.mse_loss(x, x_hat, reduction="none")
        loss = loss.sum(dim=[1, 2, 3]).mean(dim=[0])
        return loss

    def configure_optimizers(self):
        """Return Adam together with a ``ReduceLROnPlateau`` scheduler that monitors ``val_loss``."""
        optimizer = optim.Adam(self.parameters(), lr=1e-3)
        # Using a scheduler is optional but can be helpful.
        # The scheduler reduces the LR if the validation performance hasn't improved for the last N epochs
        scheduler = optim.lr_scheduler.ReduceLROnPlateau(optimizer, mode="min", factor=0.2, patience=20, min_lr=5e-5)
        return {"optimizer": optimizer, "lr_scheduler": scheduler, "monitor": "val_loss"}

    def training_step(self, batch, batch_idx):
        """Compute, log (as ``train_loss``) and return the reconstruction loss of the batch."""
        loss = self._get_reconstruction_loss(batch)
        self.log("train_loss", loss)
        return loss

    def validation_step(self, batch, batch_idx):
        """Log the reconstruction loss of the batch as ``val_loss``."""
        loss = self._get_reconstruction_loss(batch)
        self.log("val_loss", loss)

    def test_step(self, batch, batch_idx):
        """Log the reconstruction loss of the batch as ``test_loss``."""
        loss = self._get_reconstruction_loss(batch)
        self.log("test_loss", loss)
def compare_imgs(img1, img2, title_prefix=""):
    """Plot two images side by side and show their summed squared error in the title.

    Args:
        img1: First image tensor.
        img2: Second image tensor, stacked with ``img1`` into one grid.
        title_prefix: Text placed in front of the loss value in the plot title.
    """
    # Calculate MSE loss between both images
    loss = F.mse_loss(img1, img2, reduction="sum")
    # Plot images for visual comparison.
    # `value_range` is the current name of make_grid's former `range` keyword, which torchvision removed.
    grid = torchvision.utils.make_grid(
        torch.stack([img1, img2], dim=0), nrow=2, normalize=True, value_range=(-1, 1)
    )
    grid = grid.permute(1, 2, 0)  # channels last, as expected by imshow
    plt.figure(figsize=(4, 2))
    plt.title(f"{title_prefix} Loss: {loss.item():4.2f}")
    plt.imshow(grid)
    plt.axis("off")
    plt.show()
class GenerateCallback(Callback):
    """Callback that logs reconstructions of a fixed image batch to the trainer's logger during training."""

    def __init__(self, input_imgs, every_n_epochs=1):
        """
        Args:
            input_imgs: Images to reconstruct during training.
            every_n_epochs: Reconstructions are logged only on epochs divisible by this value.
        """
        super().__init__()
        self.input_imgs = input_imgs  # Images to reconstruct during training
        # Only save those images every N epochs (otherwise tensorboard gets quite large)
        self.every_n_epochs = every_n_epochs

    def on_train_epoch_end(self, trainer, pl_module):
        """Reconstruct the stored images and add an input/reconstruction grid to the logger."""
        if trainer.current_epoch % self.every_n_epochs == 0:
            # Reconstruct images
            input_imgs = self.input_imgs.to(pl_module.device)
            with torch.no_grad():
                pl_module.eval()
                reconst_imgs = pl_module(input_imgs)
                pl_module.train()
            # Interleave inputs and reconstructions so each grid row shows one pair
            imgs = torch.stack([input_imgs, reconst_imgs], dim=1).flatten(0, 1)
            # `value_range` is the current name of make_grid's former `range` keyword, which torchvision removed.
            grid = torchvision.utils.make_grid(imgs, nrow=2, normalize=True, value_range=(-1, 1))
            trainer.logger.experiment.add_image("Reconstructions", grid, global_step=trainer.global_step)
def train_cifar(latent_dim):
    """Obtain an autoencoder with the given latent size and evaluate it.

    A checkpoint named ``cifar10_<latent_dim>.ckpt`` inside ``CHECKPOINT_PATH`` is loaded when present;
    otherwise a new model is trained. In both cases the model is then run through ``trainer.test``
    on the validation and test loaders.

    Returns:
        ``(model, result)`` where ``result`` is ``{"test": ..., "val": ...}`` holding the two ``trainer.test`` outputs.
    """
    run_dir = os.path.join(CHECKPOINT_PATH, "cifar10_%i" % latent_dim)
    callbacks = [
        ModelCheckpoint(save_weights_only=True),
        GenerateCallback(get_train_images(8), every_n_epochs=10),
        LearningRateMonitor("epoch"),
    ]
    # Create a PyTorch Lightning trainer with the generation callback
    trainer = L.Trainer(
        default_root_dir=run_dir,
        accelerator="auto",
        devices=1,
        max_epochs=500,
        callbacks=callbacks,
    )
    trainer.logger._log_graph = True  # If True, we plot the computation graph in tensorboard
    trainer.logger._default_hp_metric = None  # Optional logging argument that we don't need

    # Train only when no pretrained checkpoint is available
    checkpoint_file = os.path.join(CHECKPOINT_PATH, "cifar10_%i.ckpt" % latent_dim)
    if not os.path.isfile(checkpoint_file):
        model = Autoencoder(base_channel_size=32, latent_dim=latent_dim)
        trainer.fit(model, train_loader, val_loader)
    else:
        print("Found pretrained model, loading...")
        model = Autoencoder.load_from_checkpoint(checkpoint_file)

    # Evaluate the model on validation and test set
    val_result = trainer.test(model, dataloaders=val_loader, verbose=False)
    test_result = trainer.test(model, dataloaders=test_loader, verbose=False)
    return model, {"test": test_result, "val": val_result}
# %%
# One autoencoder per latent size; the model and its evaluation results are stored together
model_dict = {}
for latent_dim in (64, 128, 256, 384):
    model_ld, result_ld = train_cifar(latent_dim)
    model_dict[latent_dim] = dict(model=model_ld, result=result_ld)

# %% [markdown]
# After training the models, we can plot the reconstruction loss over the latent dimensionality to get an intuition
# how these two properties are correlated:

# %%
latent_dims = sorted(model_dict)
# The validation loader was evaluated through `trainer.test`, hence the "test_loss" key
val_scores = [model_dict[dim]["result"]["val"][0]["test_loss"] for dim in latent_dims]

fig = plt.figure(figsize=(6, 4))
plt.plot(
    latent_dims,
    val_scores,
    "--",
    color="#000",
    marker="*",
    markeredgecolor="#000",
    markerfacecolor="y",
    markersize=16,
)
plt.xscale("log")
plt.xticks(latent_dims, labels=latent_dims)
plt.title("Reconstruction error over latent dimensionality", fontsize=14)
plt.xlabel("Latent dimensionality")
plt.ylabel("Reconstruction error")
plt.minorticks_off()
plt.ylim(0, 100)
plt.show()
def visualize_reconstructions(model, input_imgs):
    """Plot the given images next to the reconstructions produced by ``model``.

    Args:
        model: Autoencoder to evaluate; it is switched to eval mode and called on ``model.device``.
        input_imgs: Batch of images to reconstruct.
    """
    # Reconstruct images
    model.eval()
    with torch.no_grad():
        reconst_imgs = model(input_imgs.to(model.device))
    reconst_imgs = reconst_imgs.cpu()

    # Interleave inputs and reconstructions so that each original is followed by its reconstruction
    imgs = torch.stack([input_imgs, reconst_imgs], dim=1).flatten(0, 1)
    # `value_range` is the current name of make_grid's former `range` keyword, which torchvision removed.
    grid = torchvision.utils.make_grid(imgs, nrow=4, normalize=True, value_range=(-1, 1))
    grid = grid.permute(1, 2, 0)  # channels last, as expected by imshow
    plt.figure(figsize=(7, 4.5))
    plt.title("Reconstructed from %i latents" % (model.hparams.latent_dim))
    plt.imshow(grid)
    plt.axis("off")
    plt.show()
# %%
# Uniform noise in [-1, 1), the value range the model was trained on
rand_imgs = torch.rand(2, 3, 32, 32) * 2 - 1
visualize_reconstructions(model_dict[256]["model"], rand_imgs)

# %% [markdown]
# The reconstruction of the noise is quite poor, and seems to introduce some rough patterns.
# As the input does not follow the patterns of the CIFAR dataset, the model has issues reconstructing it accurately.
#
# We can also check how well the model can reconstruct other manually-coded patterns:

# %%
plain_imgs = torch.zeros(4, 3, 32, 32)

# Single color channel
plain_imgs[1, 0] = 1
# Checkerboard pattern
plain_imgs[2, :, :16, :16] = 1
plain_imgs[2, :, 16:, 16:] = -1
# Color progression.
# `indexing="ij"` states the matrix-style indexing explicitly: calling meshgrid without it
# emits a warning and relies on a default that is announced to change.
xx, yy = torch.meshgrid(torch.linspace(-1, 1, 32), torch.linspace(-1, 1, 32), indexing="ij")
plain_imgs[3, 0, :, :] = xx
plain_imgs[3, 1, :, :] = yy

visualize_reconstructions(model_dict[256]["model"], plain_imgs)
# %%
model = model_dict[256]["model"]
# Sample latent vectors from a standard normal distribution and decode them
latent_vectors = torch.randn(8, model.hparams.latent_dim, device=model.device)
with torch.no_grad():
    imgs = model.decoder(latent_vectors)
    imgs = imgs.cpu()

# `value_range` is the current name of make_grid's former `range` keyword, which torchvision removed.
grid = torchvision.utils.make_grid(imgs, nrow=4, normalize=True, value_range=(-1, 1), pad_value=0.5)
grid = grid.permute(1, 2, 0)  # channels last, as expected by imshow
plt.figure(figsize=(8, 5))
plt.imshow(grid)
plt.axis("off")
plt.show()
def find_similar_images(query_img, query_z, key_embeds, K=8):
    """Plot a query image followed by its ``K`` closest corpus images in latent space.

    Args:
        query_img: Image of the query; shown first in the plotted row.
        query_z: Latent encoding of the query image.
        key_embeds: Pair ``(images, encodings)`` of the search corpus, in the format returned by ``embed_imgs``.
        K: Number of neighbours to display.
    """
    key_imgs, key_z = key_embeds[0], key_embeds[1]
    # Find closest K images. We use the euclidean distance here but others like cosine distance can also be used.
    dist = torch.cdist(query_z[None, :], key_z, p=2)
    dist = dist.squeeze(dim=0)
    dist, indices = torch.sort(dist)
    # The encodings (and thus the indices) sit on the model's device while the images stay on the
    # data loader's device; move the indices over so the lookup also works with a model on GPU.
    nearest = indices[:K].to(key_imgs.device)
    # Plot K closest images
    imgs_to_display = torch.cat([query_img[None], key_imgs[nearest]], dim=0)
    # `value_range` is the current name of make_grid's former `range` keyword, which torchvision removed.
    grid = torchvision.utils.make_grid(imgs_to_display, nrow=K + 1, normalize=True, value_range=(-1, 1))
    grid = grid.permute(1, 2, 0)  # channels last, as expected by imshow
    plt.figure(figsize=(12, 3))
    plt.imshow(grid)
    plt.axis("off")
    plt.show()
# %%
# We use the following model throughout this section.
# If you want to try a different latent dimensionality, change it here!
model = model_dict[128]["model"]

# %%
# Create a summary writer
writer = SummaryWriter("tensorboard/")

# %% [markdown]
# The function `add_embedding` allows us to add high-dimensional feature vectors to TensorBoard on which we can perform clustering.
# What we have to provide in the function are the feature vectors, additional metadata such as the labels,
# and the original images so that we can identify a specific image in the clustering.

# %%
# In case you obtain the following error in the next cell, execute the import statements and last line in this cell
# AttributeError: module 'tensorflow._api.v2.io.gfile' has no attribute 'get_filesystem'

# import tensorflow as tf
# import tensorboard as tb
# tf.io.gfile = tb.compat.tensorflow_stub.io.gfile

# %%
# Note: the embedding projector in tensorboard is computationally heavy.
# Reduce the image amount below if your computer struggles with visualizing all 10k points
NUM_IMGS = len(test_set)

embedding_kwargs = {
    # Adding the labels per image to the plot
    "metadata": [test_set[i][1] for i in range(NUM_IMGS)],
    # Adding the original images to the plot, mapped from [-1, 1] back to [0, 1]
    "label_img": (test_img_embeds[0][:NUM_IMGS] + 1) / 2.0,
}
# Encodings per image come first
writer.add_embedding(test_img_embeds[1][:NUM_IMGS], **embedding_kwargs)
+# +# Overall, we can see that the model indeed clustered images together that are visually similar. +# Especially the background color seems to be a crucial factor in the encoding. +# This correlates to the chosen loss function, here Mean Squared Error on pixel-level +# because the background is responsible for more than half of the pixels in an average image. +# Hence, the model learns to focus on it. +# Nevertheless, we can see that the encodings also separate a couple of classes in the latent space although it hasn't seen any labels. +# This shows again that autoencoding can also be used as a "pre-training"/transfer learning task before classification. + +# %% +# Closing the summary writer +writer.close() + +# %% [markdown] +# ## Conclusion +# +# In this tutorial, we have implemented our own autoencoder on small RGB images and explored various properties of the model. +# In contrast to variational autoencoders, vanilla AEs are not generative and can work on MSE loss functions. +# This makes them often easier to train. +# Both versions of AE can be used for dimensionality reduction, as we have seen for finding visually similar images beyond pixel distances. +# Despite autoencoders gaining less interest in the research community due to their more "theoretically" +# challenging counterpart of VAEs, autoencoders still find usage in a lot of applications like denoising and compression. +# Hence, AEs are an essential tool that every Deep Learning engineer/researcher should be familiar with. diff --git a/_notebooks/course_UvA-DL/08-deep-autoencoders/autoencoder_visualization.svg b/_notebooks/course_UvA-DL/08-deep-autoencoders/autoencoder_visualization.svg new file mode 100644 index 0000000..f6c0411 --- /dev/null +++ b/_notebooks/course_UvA-DL/08-deep-autoencoders/autoencoder_visualization.svg @@ -0,0 +1,3 @@ + + +
Encoder
Encoder
Decoder
Decoder
Input 𝑥
Input 𝑥
𝑧
𝑧
Reconstruction 𝑥
Reconstruction 𝑥
ˆ
ˆ
diff --git a/_notebooks/course_UvA-DL/08-deep-autoencoders/deconvolution.gif b/_notebooks/course_UvA-DL/08-deep-autoencoders/deconvolution.gif new file mode 100644 index 0000000..894c1d6 Binary files /dev/null and b/_notebooks/course_UvA-DL/08-deep-autoencoders/deconvolution.gif differ diff --git a/_notebooks/course_UvA-DL/08-deep-autoencoders/tensorboard_projector_screenshot.jpeg b/_notebooks/course_UvA-DL/08-deep-autoencoders/tensorboard_projector_screenshot.jpeg new file mode 100644 index 0000000..c638110 Binary files /dev/null and b/_notebooks/course_UvA-DL/08-deep-autoencoders/tensorboard_projector_screenshot.jpeg differ diff --git a/_notebooks/course_UvA-DL/09-normalizing-flows/.meta.yml b/_notebooks/course_UvA-DL/09-normalizing-flows/.meta.yml new file mode 100644 index 0000000..d366a99 --- /dev/null +++ b/_notebooks/course_UvA-DL/09-normalizing-flows/.meta.yml @@ -0,0 +1,31 @@ +title: "Tutorial 9: Normalizing Flows for Image Modeling" +author: Phillip Lippe +created: 2021-06-07 +updated: 2023-03-14 +license: CC BY-SA +build: 0 +tags: + - Image +description: | + In this tutorial, we will take a closer look at complex, deep normalizing flows. + The most popular, current application of deep normalizing flows is to model datasets of images. + As for other generative models, images are a good domain to start working on because + (1) CNNs are widely studied and strong models exist, + (2) images are high-dimensional and complex, + and (3) images are discrete integers. + In this tutorial, we will review current advances in normalizing flows for image modeling, + and get hands-on experience on coding normalizing flows. + Note that normalizing flows are commonly parameter heavy and therefore computationally expensive. + We will use relatively simple and shallow flows to save computational cost and allow you to run the notebook on CPU, + but keep in mind that a simple way to improve the scores of the flows we study here is to make them deeper. 
+ This notebook is part of a lecture series on Deep Learning at the University of Amsterdam. + The full list of tutorials can be found at https://uvadlc-notebooks.rtfd.io. +requirements: + - torchvision + - matplotlib + - seaborn + - tabulate + - lightning>=2.0.0rc0 +accelerator: + - CPU + - GPU diff --git a/docs/_static/images/course_UvA-DL/09-normalizing-flows.jpg b/_notebooks/course_UvA-DL/09-normalizing-flows/.thumb.jpg similarity index 100% rename from docs/_static/images/course_UvA-DL/09-normalizing-flows.jpg rename to _notebooks/course_UvA-DL/09-normalizing-flows/.thumb.jpg diff --git a/_notebooks/course_UvA-DL/09-normalizing-flows/NF_image_modeling.py b/_notebooks/course_UvA-DL/09-normalizing-flows/NF_image_modeling.py new file mode 100644 index 0000000..28821f6 --- /dev/null +++ b/_notebooks/course_UvA-DL/09-normalizing-flows/NF_image_modeling.py @@ -0,0 +1,1417 @@ +# %% [markdown] +#
+# Throughout this notebook, we make use of [PyTorch Lightning](https://lightning.ai/docs/pytorch/stable/). +# The first cell imports our usual libraries. + +# %% +import math +import os +import time +import urllib.request +from urllib.error import HTTPError + +import lightning as L +import matplotlib +import matplotlib.pyplot as plt +import matplotlib_inline.backend_inline +import numpy as np +import seaborn as sns +import tabulate +import torch +import torch.nn as nn +import torch.nn.functional as F +import torch.optim as optim +import torch.utils.data as data +import torchvision +from IPython.display import HTML, display +from lightning.pytorch.callbacks import LearningRateMonitor, ModelCheckpoint +from matplotlib.colors import to_rgb +from torch import Tensor +from torchvision import transforms +from torchvision.datasets import MNIST +from tqdm.notebook import tqdm + +# %matplotlib inline +matplotlib_inline.backend_inline.set_matplotlib_formats("svg", "pdf") # For export +matplotlib.rcParams["lines.linewidth"] = 2.0 +sns.reset_orig() + +# Path to the folder where the datasets are/should be downloaded (e.g. MNIST) +DATASET_PATH = os.environ.get("PATH_DATASETS", "data") +# Path to the folder where the pretrained models are saved +CHECKPOINT_PATH = os.environ.get("PATH_CHECKPOINT", "saved_models/tutorial11") + +# Setting the seed +L.seed_everything(42) + +# Ensure that all operations are deterministic on GPU (if used) for reproducibility +torch.backends.cudnn.deterministic = True +torch.backends.cudnn.benchmark = False + +# Fetching the device that will be used throughout this notebook +device = torch.device("cpu") if not torch.cuda.is_available() else torch.device("cuda:0") +print("Using device", device) + +# %% [markdown] +# Again, we have a few pretrained models. We download them below to the specified path above. 
# Convert images from 0-1 to 0-255 (integers)
def discretize(sample):
    """Scale ``sample`` by 255 and cast the result to ``torch.int32``."""
    scaled = sample * 255
    return scaled.to(dtype=torch.int32)
def show_imgs(imgs, title=None, row_size=4):
    """Display a batch of images as a grid.

    Args:
        imgs: Either a single tensor holding all images or a sequence of image tensors.
        title: Optional title placed above the grid.
        row_size: Maximum number of images per grid row.
    """
    # Number of images and their dtype, for both accepted input forms
    if isinstance(imgs, Tensor):
        num_imgs, img_dtype = imgs.shape[0], imgs.dtype
    else:
        num_imgs, img_dtype = len(imgs), imgs[0].dtype
    is_int = img_dtype == torch.int32

    # `nrow` is the number of images per row (make_grid's meaning); `ncol` is the resulting row count
    nrow = min(num_imgs, row_size)
    ncol = int(math.ceil(num_imgs / nrow))
    # Mid-grey padding: 128 for integer images, 0.5 otherwise
    pad_value = 128 if is_int else 0.5
    grid = torchvision.utils.make_grid(imgs, nrow=nrow, pad_value=pad_value)
    np_grid = grid.cpu().numpy()

    # Plot the grid
    plt.figure(figsize=(1.5 * nrow, 1.5 * ncol))
    plt.imshow(np.transpose(np_grid, (1, 2, 0)), interpolation="nearest")
    plt.axis("off")
    if title is not None:
        plt.title(title)
    plt.show()
    plt.close()
#
# The major difference compared to VAEs is that flows use *invertible* functions $f$
# to map the input data $x$ to a latent representation $z$.
# To realize this, $z$ must be of the same shape as $x$.
# This is in contrast to VAEs where $z$ is usually much lower dimensional than the original input data.
# However, an invertible mapping also means that for every data point $x$, we have a corresponding latent representation
# $z$ which allows us to perform lossless reconstruction ($z$ to $x$).
# In the visualization above, this means that $x=x'$ for flows, no matter what invertible function $f$ and input $x$ we choose.
#
# Nonetheless, how are normalizing flows modeling a probability density with an invertible function?
# The answer to this question is the rule for change of variables.
# Specifically, given a prior density $p_z(z)$ (e.g. Gaussian) and an invertible function $f$,
# we can determine $p_x(x)$ as follows:
#
# $$
# \begin{split}
# \int p_x(x) dx & = \int p_z(z) dz = 1 \hspace{1cm}\text{(by definition of a probability distribution)}\\
# \Leftrightarrow p_x(x) & = p_z(z) \left|\frac{dz}{dx}\right| = p_z(f(x)) \left|\frac{df(x)}{dx}\right|
# \end{split}
# $$
#
# Hence, in order to determine the probability of $x$, we only need to determine its probability in latent space,
# and get the derivative of $f$.
# Note that this is for a univariate distribution, and $f$ is required to be invertible and smooth.
# For a multivariate case, the derivative becomes a Jacobian of which we need to take the determinant.
# As we usually use the log-likelihood as objective, we write the multivariate term with logarithms below:
#
# $$
# \log p_x(\mathbf{x}) = \log p_z(f(\mathbf{x})) + \log{} \left|\det \frac{df(\mathbf{x})}{d\mathbf{x}}\right|
# $$
#
# Although we now know how a normalizing flow obtains its likelihood, it might not be clear what a normalizing flow does intuitively.
+# For this, we should look from the inverse perspective of the flow starting with the prior probability density $p_z(z)$. +# If we apply an invertible function on it, we effectively "transform" its probability density. +# For instance, if $f^{-1}(z)=z+1$, we shift the density by one while still remaining a valid probability distribution, +# and being invertible. +# We can also apply more complex transformations, like scaling: $f^{-1}(z)=2z+1$, but there you might see a difference. +# When you scale, you also change the volume of the probability density, as for example on uniform distributions +# (figure credit - [Eric Jang](https://blog.evjang.com/2018/01/nf1.html)): +# +#
#
# You can see that the height of $p(y)$ should be lower than $p(x)$ after scaling.
# This change in volume represents $\left|\frac{df(x)}{dx}\right|$ in our equation above,
# and ensures that even after scaling, we still have a valid probability distribution.
# We can go on with making our function $f$ more complex.
# However, the more complex $f$ becomes, the harder it will be to find the inverse $f^{-1}$ of it,
# and to calculate the log-determinant of the Jacobian $\log{} \left|\det \frac{df(\mathbf{x})}{d\mathbf{x}}\right|$.
# An easier trick is to stack multiple invertible functions $f_{1,...,K}$ after each other, as all together,
# they still represent a single, invertible function.
# Using multiple, learnable invertible functions, a normalizing flow attempts to transform
# $p_z(z)$ slowly into a more complex distribution which should finally be $p_x(x)$.
# We visualize the idea below
# (figure credit - [Lilian Weng](https://lilianweng.github.io/lil-log/2018/10/13/flow-based-deep-generative-models.html)):
#
#
+# +# Starting from $z_0$, which follows the prior Gaussian distribution, we sequentially apply the invertible +# functions $f_1,f_2,...,f_K$, until $z_K$ represents $x$. +# Note that in the figure above, the functions $f$ represent the inverted function from $f$ we had above +# (here: $f:Z\to X$, above: $f:X\to Z$). +# This is just a different notation and has no impact on the actual flow design because all $f$ need to be invertible anyways. +# When we estimate the log likelihood of a data point $x$ as in the equations above, +# we run the flows in the opposite direction than visualized above. +# Multiple flow layers have been proposed that use a neural network as learnable parameters, +# such as the planar and radial flow. +# However, we will focus here on flows that are commonly used in image +# modeling, and will discuss them in the rest of the notebook along with +# the details of how to train a normalizing flow. + +# %% [markdown] +# ## Normalizing Flows on images +# +#
+# +# To become familiar with normalizing flows, especially for the application of image modeling, +# it is best to discuss the different elements in a flow along with the implementation. +# As a general concept, we want to build a normalizing flow that maps an input image (here MNIST) to an equally sized latent space: +# +#
+# +# As a first step, we will implement a template of a normalizing flow in PyTorch Lightning. +# During training and validation, a normalizing flow performs density estimation in the forward direction. +# For this, we apply a series of flow transformations on the input $x$ and estimate the probability +# of the input by determining the probability of the transformed point $z$ given a prior, +# and the change of volume caused by the transformations. +# During inference, we can do both density estimation and sampling new points by inverting the flow transformations. +# Therefore, we define a function `_get_likelihood` which performs density estimation, +# and `sample` to generate new examples. +# The functions `training_step`, `validation_step` and `test_step` all make use of `_get_likelihood`. +# +# The standard metric used in generative models, and in particular normalizing flows, is bits per dimensions (bpd). +# Bpd is motivated from an information theory perspective and describes how many bits we would need to encode a particular example in our modeled distribution. +# The less bits we need, the more likely the example in our distribution. +# When we test for the bits per dimension of our test dataset, we can judge whether our model generalizes to new samples of the dataset and didn't memorize the training dataset. +# In order to calculate the bits per dimension score, we can rely on the negative log-likelihood and change the log base (as bits are binary while NLL is usually exponential): +# +# $$\text{bpd} = \text{nll} \cdot \log_2\left(\exp(1)\right) \cdot \left(\prod d_i\right)^{-1}$$ +# +# where $d_1,...,d_K$ are the dimensions of the input. +# For images, this would be the height, width and channel number. +# We divide the log likelihood by these extra dimensions to have a metric which we can compare for different image resolutions. 
# In the original image space, MNIST examples have a bits per dimension
# score of 8 (we need 8 bits to encode each pixel as there are 256
# possible values).


# %%
class ImageFlow(L.LightningModule):
    """Lightning module that chains flow layers and trains them on bits per dimension."""

    def __init__(self, flows, import_samples=8):
        """
        Args:
            flows: A list of flows (each a nn.Module) that should be applied on the images.
            import_samples: Number of importance samples to use during testing (see explanation below). Can be changed at any time
        """
        super().__init__()
        self.flows = nn.ModuleList(flows)
        self.import_samples = import_samples
        # Create prior distribution for final latent space
        self.prior = torch.distributions.normal.Normal(loc=0.0, scale=1.0)
        # Example input for visualizing the graph
        self.example_input_array = train_set[0][0].unsqueeze(dim=0)

    def forward(self, imgs):
        # The forward function is only used for visualizing the graph
        return self._get_likelihood(imgs)

    def encode(self, imgs):
        """Given a batch of images, return the latent representation z and the ldj of the transformations."""
        z, ldj = imgs, torch.zeros(imgs.shape[0], device=self.device)
        for flow in self.flows:
            z, ldj = flow(z, ldj, reverse=False)
        return z, ldj

    def _get_likelihood(self, imgs, return_ll=False):
        """Given a batch of images, return the likelihood of those.

        If return_ll is True, this function returns the log likelihood of each input image. Otherwise, the
        output metric is the batch mean of the bits per dimension (scaled negative log likelihood).
        """
        z, ldj = self.encode(imgs)
        log_pz = self.prior.log_prob(z).sum(dim=[1, 2, 3])
        log_px = ldj + log_pz
        if return_ll:
            return log_px
        # Calculating bits per dimension: change the log base to 2 and normalize by the number of dimensions
        nll = -log_px
        bpd = nll * np.log2(np.exp(1)) / np.prod(imgs.shape[1:])
        return bpd.mean()

    @torch.no_grad()
    def sample(self, img_shape, z_init=None):
        """Sample a batch of images from the flow.

        Args:
            img_shape: Shape of the batch to generate; its first entry is used as the batch size.
            z_init: Optional latent tensor to start from instead of sampling from the prior.
        """
        # Use the module's own device (as `encode` does) rather than a module-level `device` global,
        # so that sampling works wherever the model has been moved to.
        if z_init is None:
            z = self.prior.sample(sample_shape=img_shape).to(self.device)
        else:
            z = z_init.to(self.device)

        # Transform z to x by inverting the flows
        ldj = torch.zeros(img_shape[0], device=self.device)
        for flow in reversed(self.flows):
            z, ldj = flow(z, ldj, reverse=True)
        return z

    def configure_optimizers(self):
        optimizer = optim.Adam(self.parameters(), lr=1e-3)
        # A scheduler is optional, but can help in flows to get the last bpd improvement
        scheduler = optim.lr_scheduler.StepLR(optimizer, 1, gamma=0.99)
        return [optimizer], [scheduler]

    def training_step(self, batch, batch_idx):
        # Normalizing flows are trained by maximum likelihood => return bpd
        loss = self._get_likelihood(batch[0])
        self.log("train_bpd", loss)
        return loss

    def validation_step(self, batch, batch_idx):
        loss = self._get_likelihood(batch[0])
        self.log("val_bpd", loss)

    def test_step(self, batch, batch_idx):
        # Perform importance sampling during testing => estimate likelihood M times for each image
        samples = [self._get_likelihood(batch[0], return_ll=True) for _ in range(self.import_samples)]
        img_ll = torch.stack(samples, dim=-1)

        # To average the probabilities, we need to go from log-space to exp, and back to log.
        # Logsumexp provides us a stable implementation for this
        img_ll = torch.logsumexp(img_ll, dim=-1) - np.log(self.import_samples)

        # Calculate final bpd
        bpd = -img_ll * np.log2(np.exp(1)) / np.prod(batch[0].shape[1:])
        bpd = bpd.mean()

        self.log("test_bpd", bpd)


# %% [markdown]
# The `test_step` function differs from the training and validation step in that it makes use of importance sampling.
# We will discuss the motivation and details behind this after
# understanding how flows model discrete images in continuous space.

# %% [markdown]
# ### Dequantization
#
# Normalizing flows rely on the rule of change of variables, which is naturally defined in continuous space.
# Applying flows directly on discrete data leads to undesired density models where arbitrarily high likelihoods are placed on a few, particular values.
# See the illustration below:
#
#
#
# The black points represent the discrete points, and the green volume the density modeled by a normalizing flow in continuous space.
# The flow would continue to increase the likelihood for $x=0,1,2,3$ while having no volume on any other point.
# Remember that in continuous space, we have the constraint that the overall volume of the probability density must be 1 ($\int p(x)dx=1$).
# Otherwise, we don't model a probability distribution anymore.
# However, the discrete points $x=0,1,2,3$ represent delta peaks with no width in continuous space.
# This is why the flow can place an infinitely high likelihood on these few points while still representing a distribution in continuous space.
# Nonetheless, the learned density does not tell us anything about the distribution among the discrete points,
# as in discrete space, the likelihoods of those four points would have to sum to 1, not to infinity.
#
# To prevent such degenerate solutions, a common solution is to add a small amount of noise to each discrete value, which is also referred to as dequantization.
# Considering $x$ as an integer (as it is the case for images), the dequantized representation $v$ can be formulated as $v=x+u$ where $u\in[0,1)^D$.
# Thus, the discrete value $1$ is modeled by a distribution over the interval $[1.0, 2.0)$, the value $2$ by a volume over $[2.0, 3.0)$, etc.
# Our objective of modeling $p(x)$ becomes:
#
# $$ p(x) = \int p(x+u)du = \int \frac{q(u|x)}{q(u|x)}p(x+u)du = \mathbb{E}_{u\sim q(u|x)}\left[\frac{p(x+u)}{q(u|x)} \right]$$
#
# with $q(u|x)$ being the noise distribution.
# For now, we assume it to be uniform, which can also be written as $p(x)=\mathbb{E}_{u\sim U(0,1)^D}\left[p(x+u) \right]$.
#
# In the following, we will implement Dequantization as a flow transformation itself.
# After adding noise to the discrete values, we additionally transform the volume into a Gaussian-like shape.
# This is done by scaling $x+u$ between $0$ and $1$, and applying the inverse of the sigmoid function $\sigma^{-1}(z) = \log z - \log(1-z)$.
# If we would not do this, we would face two problems:
#
# 1.
# The input is scaled between 0 and 256 while the prior distribution is a Gaussian with mean $0$ and standard deviation $1$.
# In the first iterations after initializing the parameters of the flow, we would have extremely low likelihoods for large values like $256$.
# This would cause the training to diverge instantaneously.
# 2.
# As the output distribution is a Gaussian, it is beneficial for the flow to have a similarly shaped input distribution.
# This will reduce the modeling complexity that is required by the flow.
#
# Overall, we can implement dequantization as follows:


# %%
class Dequantization(nn.Module):
    """Flow layer mapping discrete pixel values to continuous values (and back by quantizing)."""

    def __init__(self, alpha=1e-5, quants=256):
        """
        Args:
            alpha: small constant that is used to scale the original input.
                    Prevents dealing with values very close to 0 and 1 when inverting the sigmoid
            quants: Number of possible discrete values (usually 256 for 8-bit image)
        """
        super().__init__()
        self.alpha = alpha
        self.quants = quants

    def forward(self, z, ldj, reverse=False):
        """Dequantize `z` (reverse=False) or quantize it back to int32 (reverse=True).

        `ldj` is updated in place by the sub-steps and returned together with the transformed `z`.
        """
        if reverse:
            # Continuous -> discrete: squash to (0, 1), rescale to [0, quants) and round down
            z, ldj = self.sigmoid(z, ldj, reverse=False)
            z = z * self.quants
            ldj += np.log(self.quants) * np.prod(z.shape[1:])
            z = torch.floor(z).clamp(min=0, max=self.quants - 1).to(torch.int32)
        else:
            # Discrete -> continuous: add noise, then apply the inverse sigmoid
            z, ldj = self.dequant(z, ldj)
            z, ldj = self.sigmoid(z, ldj, reverse=True)
        return z, ldj

    def sigmoid(self, z, ldj, reverse=False):
        """Apply the sigmoid (reverse=False) or the alpha-scaled inverse sigmoid (reverse=True).

        NOTE(review): only the reverse=True branch applies the alpha rescaling; the reverse=False branch
        does not undo it, so the two branches are inverses of each other only up to that rescaling.
        """
        if reverse:
            z = z * (1 - self.alpha) + 0.5 * self.alpha  # Scale to prevent boundaries 0 and 1
            ldj += np.log(1 - self.alpha) * np.prod(z.shape[1:])
            ldj += (-torch.log(z) - torch.log(1 - z)).sum(dim=[1, 2, 3])
            z = torch.log(z) - torch.log(1 - z)
        else:
            ldj += (-z - 2 * F.softplus(-z)).sum(dim=[1, 2, 3])
            z = torch.sigmoid(z)
        return z, ldj

    def dequant(self, z, ldj):
        """Transform discrete values to continuous volumes by adding uniform noise and dividing by `quants`."""
        continuous = z.to(torch.float32)
        continuous = continuous + torch.rand_like(continuous).detach()
        continuous = continuous / self.quants
        ldj -= np.log(self.quants) * np.prod(continuous.shape[1:])
        return continuous, ldj


# %% [markdown]
# A good check whether a flow is correctly implemented or not, is to verify that it is invertible.
# Hence, we will dequantize a randomly chosen training image, and then quantize it again.
# We would expect that we would get the exact same image out:

# %%
# Testing invertibility of dequantization layer
L.seed_everything(42)
orig_img = train_set[0][0].unsqueeze(dim=0)
ldj = torch.zeros(1)
dequant_module = Dequantization()
deq_img, ldj = dequant_module(orig_img, ldj, reverse=False)
reconst_img, ldj = dequant_module(deq_img, ldj, reverse=True)

# Row/column positions of all pixels that were not reconstructed exactly
d1, d2 = torch.where(orig_img.squeeze() != reconst_img.squeeze())
if len(d1) == 0:
    print("Successfully inverted dequantization")
else:
    print("Dequantization was not invertible.")
    for i in range(d1.shape[0]):
        print("Original value:", orig_img[0, 0, d1[i], d2[i]].item())
        print("Reconstructed value:", reconst_img[0, 0, d1[i], d2[i]].item())

# Layer is not strictly invertible due to float precision constraints
# assert (orig_img == reconst_img).all().item()

# %% [markdown]
# In contrast to our expectation, the test fails.
# However, this is no reason to doubt our implementation here as only one single value is not equal to the original.
# This is caused due to numerical inaccuracies in the sigmoid invert.
# While the input space to the inverted sigmoid is scaled between 0 and 1, the output space is between $-\infty$ and $\infty$.
# And as we use 32 bits to represent the numbers (in addition to applying logs over and over again),
# such inaccuracies can occur and should not be worrisome.
# Nevertheless, it is good to be aware of them, and can be improved by using a double tensor (float64).
#
# Finally, we can take our dequantization and actually visualize the
# distribution it transforms the discrete values into:

# %%


def visualize_dequantization(quants, prior=None):
    """Function for visualizing the dequantization values of discrete values in continuous space.

    Args:
        quants: Number of discrete values to visualize.
        prior: Optional weights over the discrete values (array or any sequence of numbers).
            It is normalized to sum to one. If not given, a uniform distribution is assumed.
    """
    # Prior over discrete values. If not given, a uniform is assumed
    if prior is None:
        prior = np.ones(quants, dtype=np.float32) / quants
    # Accept plain lists/tuples as well: `.sum()` and integer-array indexing below need an ndarray
    prior = np.asarray(prior)
    prior = prior / prior.sum()  # Ensure proper categorical distribution

    inp = torch.arange(-4, 4, 0.01).view(-1, 1, 1, 1)  # Possible continuous values we want to consider
    ldj = torch.zeros(inp.shape[0])
    dequant_module = Dequantization(quants=quants)
    # Invert dequantization on continuous values to find corresponding discrete value
    out, ldj = dequant_module.forward(inp, ldj, reverse=True)
    inp, out, prob = inp.squeeze().numpy(), out.squeeze().numpy(), ldj.exp().numpy()
    prob = prob * prior[out]  # Probability scaled by categorical prior

    # Plot volumes and continuous distribution
    sns.set_style("white")
    _ = plt.figure(figsize=(6, 3))
    x_ticks = []
    for v in np.unique(out):
        # Positions of all continuous inputs that are quantized to the discrete value v
        idx = np.flatnonzero(out == v)
        first, last = idx[0], idx[-1]
        color = to_rgb("C%i" % v)
        plt.fill_between(inp[idx], prob[idx], np.zeros(idx.shape[0]), color=color + (0.5,), label=str(v))
        # Vertical borders of the volume
        plt.plot([inp[first]] * 2, [0, prob[first]], color=color)
        plt.plot([inp[last]] * 2, [0, prob[last]], color=color)
        x_ticks.append(inp[first])
    x_ticks.append(inp.max())
    plt.xticks(x_ticks, ["%.1f" % x for x in x_ticks])
    plt.plot(inp, prob, color=(0.0, 0.0, 0.0))
    # Set final plot properties
    plt.ylim(0, prob.max() * 1.1)
    plt.xlim(inp.min(), inp.max())
    plt.xlabel("z")
    plt.ylabel("Probability")
    plt.title("Dequantization distribution for %i discrete values" % quants)
    plt.legend()
    plt.show()
    plt.close()


visualize_dequantization(quants=8)

# %% [markdown]
# The visualized distribution shows the sub-volumes that are
# assigned to the different discrete values.
# The value $0$ has its volume between $(-\infty, -1.9)$, the value $1$ is represented by the interval $[-1.9, -1.1)$, etc.
# The volume for each discrete value has the same probability mass.
# That's why the volumes close to the center (e.g. 3 and 4) have a smaller area on the z-axis than others
# ($z$ is being used to denote the output of the whole dequantization flow).
#
# Effectively, the consecutive normalizing flow models discrete images by the following objective:
#
# $$\log p(x) = \log \mathbb{E}_{u\sim q(u|x)}\left[\frac{p(x+u)}{q(u|x)} \right] \geq \mathbb{E}_{u}\left[\log \frac{p(x+u)}{q(u|x)} \right]$$
#
# Although normalizing flows are exact in likelihood, we have a lower bound.
# Specifically, this is an example of the Jensen inequality because we need to move the log into the expectation so we can use Monte Carlo estimates.
# In general, this bound is considerably tighter than the ELBO in variational autoencoders.
# Actually, we can tighten the bound ourselves by estimating the expectation not by one, but by $M$ samples.
# In other words, we can apply importance sampling which leads to the following inequality:
#
# $$\log p(x) = \log \mathbb{E}_{u\sim q(u|x)}\left[\frac{p(x+u)}{q(u|x)} \right] \geq \mathbb{E}_{u}\left[\log \frac{1}{M} \sum_{m=1}^{M} \frac{p(x+u_m)}{q(u_m|x)} \right] \geq \mathbb{E}_{u}\left[\log \frac{p(x+u)}{q(u|x)} \right]$$
#
# The importance sampling $\frac{1}{M} \sum_{m=1}^{M} \frac{p(x+u_m)}{q(u_m|x)}$ becomes
# $\mathbb{E}_{u\sim q(u|x)}\left[\frac{p(x+u)}{q(u|x)} \right]$ if $M\to \infty$,
# so that the more samples we use, the tighter the bound is.
# During testing, we can make use of this property and have it implemented in `test_step` in `ImageFlow`.
# In theory, we could also use this tighter bound during training.
+# However, related work has shown that this does not necessarily lead to +# an improvement given the additional computational cost, and it is more +# efficient to stick with a single estimate [5]. + +# %% [markdown] +# ### Variational Dequantization +# +# Dequantization uses a uniform distribution for the noise $u$ which effectively leads to images being represented as hypercubes +# (cube in high dimensions) with sharp borders. +# However, modeling such sharp borders is not easy for a flow as it uses smooth transformations to convert it into a Gaussian distribution. +# +# Another way of looking at it is if we change the prior distribution in the previous visualization. +# Imagine we have independent Gaussian noise on pixels which is commonly the case for any real-world taken picture. +# Therefore, the flow would have to model a distribution as above, but with the individual volumes scaled as follows: + +# %% +visualize_dequantization(quants=8, prior=np.array([0.075, 0.2, 0.4, 0.2, 0.075, 0.025, 0.0125, 0.0125])) + +# %% [markdown] +# Transforming such a probability into a Gaussian is a difficult task, especially with such hard borders. +# Dequantization has therefore been extended to more sophisticated, learnable distributions beyond uniform in a variational framework. +# In particular, if we remember the learning objective +# $\log p(x) = \log \mathbb{E}_{u}\left[\frac{p(x+u)}{q(u|x)} \right]$, +# the uniform distribution can be replaced by a learned distribution $q_{\theta}(u|x)$ with support over $u\in[0,1)^D$. +# This approach is called Variational Dequantization and has been proposed by Ho et al. +# [3]. +# How can we learn such a distribution? +# We can use a second normalizing flow that takes $x$ as external input and learns a flexible distribution over $u$. +# To ensure a support over $[0,1)^D$, we can apply a sigmoid activation function as final flow transformation. 
#
# Inheriting the original dequantization class, we can implement variational dequantization as follows:


# %%
class VariationalDequantization(Dequantization):
    """Dequantization whose noise distribution q(u|x) is modeled by a conditional flow."""

    def __init__(self, var_flows, alpha=1e-5, quants=256):
        """
        Args:
            var_flows: A list of flow transformations to use for modeling q(u|x)
            alpha: Small constant, see Dequantization for details
            quants: Number of possible discrete values, see Dequantization for details
        """
        super().__init__(alpha=alpha, quants=quants)
        self.flows = nn.ModuleList(var_flows)

    def dequant(self, z, ldj):
        """Add learned noise to the discrete input `z` and scale the result by `quants`.

        `ldj` is updated in place by the sub-steps and returned together with the dequantized `z`.
        """
        z = z.to(torch.float32)
        # We condition the flows on x, i.e. the original image, rescaled from [0, quants - 1] to [-1, 1]
        img = (z / (self.quants - 1)) * 2 - 1

        # Prior of u is a uniform distribution as before
        # As most flow transformations are defined on [-infinity,+infinity], we apply an inverse sigmoid first.
        deq_noise = torch.rand_like(z).detach()
        deq_noise, ldj = self.sigmoid(deq_noise, ldj, reverse=True)
        for flow in self.flows:
            deq_noise, ldj = flow(deq_noise, ldj, reverse=False, orig_img=img)
        deq_noise, ldj = self.sigmoid(deq_noise, ldj, reverse=False)

        # After the flows, apply u as in standard dequantization.
        # `self.quants` replaces the former hard-coded 256 so that the layer agrees with the base class.
        z = (z + deq_noise) / self.quants
        ldj -= np.log(self.quants) * np.prod(z.shape[1:])
        return z, ldj


# %% [markdown]
# Variational dequantization can be used as a substitute for dequantization.
# We will compare dequantization and variational dequantization in later experiments.

# %% [markdown]
# ### Coupling layers
#
#
+# +# Next, we look at possible transformations to apply inside the flow. +# A recent popular flow layer, which works well in combination with deep neural networks, +# is the coupling layer introduced by Dinh et al. +# [1]. +# The input $z$ is arbitrarily split into two parts, $z_{1:j}$ and $z_{j+1:d}$, of which the first remains unchanged by the flow. +# Yet, $z_{1:j}$ is used to parameterize the transformation for the second part, $z_{j+1:d}$. +# Various transformations have been proposed in recent time [3,4], but here we will settle for the simplest and most efficient one: affine coupling. +# In this coupling layer, we apply an affine transformation by shifting the input by a bias $\mu$ and scale it by $\sigma$. +# In other words, our transformation looks as follows: +# +# $$z'_{j+1:d} = \mu_{\theta}(z_{1:j}) + \sigma_{\theta}(z_{1:j}) \odot z_{j+1:d}$$ +# +# The functions $\mu$ and $\sigma$ are implemented as a shared neural network, +# and the sum and multiplication are performed element-wise. +# The LDJ is thereby the sum of the logs of the scaling factors: $\sum_i \left[\log \sigma_{\theta}(z_{1:j})\right]_i$. +# Inverting the layer can as simply be done as subtracting the bias and dividing by the scale: +# +# $$z_{j+1:d} = \left(z'_{j+1:d} - \mu_{\theta}(z_{1:j})\right) / \sigma_{\theta}(z_{1:j})$$ +# +# We can also visualize the coupling layer in form of a computation graph, +# where $z_1$ represents $z_{1:j}$, and $z_2$ represents $z_{j+1:d}$: +# +#
#
# In our implementation, we will realize the splitting of variables as masking.
# The variables to be transformed, $z_{j+1:d}$, are masked when passing $z$ to the shared network to predict the transformation parameters.
# When applying the transformation, we mask the parameters for $z_{1:j}$
# so that we have an identity operation for those variables:


# %%
class CouplingLayer(nn.Module):
    def __init__(self, network, mask, c_in):
        """Coupling layer inside a normalizing flow.

        Args:
            network: A PyTorch nn.Module constituting the deep neural network for mu and sigma.
                      Output shape should be twice the channel size as the input.
            mask: Binary mask (0 or 1) where 0 denotes that the element should be transformed,
                   while 1 means the latent will be used as input to the NN.
            c_in: Number of input channels
        """
        super().__init__()
        self.network = network
        self.scaling_factor = nn.Parameter(torch.zeros(c_in))
        # Register mask as buffer as it is a tensor which is not a parameter,
        # but should be part of the modules state.
        self.register_buffer("mask", mask)

    def forward(self, z, ldj, reverse=False, orig_img=None):
        """
        Args:
            z: Latent input to the flow
            ldj: The current ldj of the previous flows.
                  The ldj of this layer will be added to this tensor.
            reverse: If True, we apply the inverse of the layer.
            orig_img (optional): Only needed in VarDeq. Allows external
                                  input to condition the flow on (e.g. original image)
        """
        # The network only sees the masked (untransformed) part, optionally with the conditioning image
        net_in = z * self.mask
        if orig_img is not None:
            net_in = torch.cat([net_in, orig_img], dim=1)
        s, t = self.network(net_in).chunk(2, dim=1)

        # Stabilize scaling output
        s_fac = self.scaling_factor.exp().view(1, -1, 1, 1)
        s = torch.tanh(s / s_fac) * s_fac

        # Mask outputs (only transform the second part)
        transformed = 1 - self.mask
        s = s * transformed
        t = t * transformed

        # Affine transformation
        if reverse:
            z = (z * torch.exp(-s)) - t
            ldj -= s.sum(dim=[1, 2, 3])
        else:
            # Whether we first shift and then scale, or the other way round,
            # is a design choice, and usually does not have a big impact
            z = (z + t) * torch.exp(s)
            ldj += s.sum(dim=[1, 2, 3])

        return z, ldj


# %% [markdown]
# For stabilization purposes, we apply a $\tanh$ activation function on the scaling output.
# This prevents sudden large output values for the scaling that can destabilize training.
# To still allow scaling factors smaller or larger than -1 and 1 respectively,
# we have a learnable parameter per dimension, called `scaling_factor`.
# This scales the tanh to different limits.
# Below, we visualize the effect of the scaling factor on the output activation of the scaling terms:

# %%
with torch.no_grad():
    x = torch.arange(-5, 5, 0.01)
    scaling_factors = [0.5, 1, 2]
    sns.set()
    fig, ax = plt.subplots(1, 3, figsize=(12, 3))
    # One subplot per scaling factor, all sharing the same y-range for comparison
    for i, scale in enumerate(scaling_factors):
        y = torch.tanh(x / scale) * scale
        ax[i].plot(x.numpy(), y.numpy())
        ax[i].set_title("Scaling factor: " + str(scale))
        ax[i].set_ylim(-3, 3)
    plt.subplots_adjust(wspace=0.4)
    sns.reset_orig()
    plt.show()

# %% [markdown]
# Coupling layers generalize to any masking technique we could think of.
# However, the most common approach for images is to split the input $z$ in half, using a checkerboard mask or channel mask.
# A checkerboard mask splits the variables across the height and width dimensions and assigns each other pixel to $z_{j+1:d}$.
# Thereby, the mask is shared across channels.
# In contrast, the channel mask assigns half of the channels to $z_{j+1:d}$, and the other half to $z_{1:j}$.
# Note that when we apply multiple coupling layers, we invert the masking for each other layer so that each variable is transformed a similar amount of times.
#
# Let's implement a function that creates a checkerboard mask and a channel mask for us:


# %%
def create_checkerboard_mask(h, w, invert=False):
    """Create a float32 checkerboard mask of shape (1, 1, h, w).

    The entry at row i and column j is (i + j) mod 2; with invert=True, zeros and ones are swapped.
    """
    # Broadcasting a column of row indices against a row of column indices yields i + j for every
    # position, without torch.meshgrid (which warns when called without an explicit `indexing`).
    rows = torch.arange(h, dtype=torch.int32).view(-1, 1)
    cols = torch.arange(w, dtype=torch.int32).view(1, -1)
    mask = torch.fmod(rows + cols, 2)
    mask = mask.to(torch.float32).view(1, 1, h, w)
    if invert:
        mask = 1 - mask
    return mask


def create_channel_mask(c_in, invert=False):
    """Create a float32 channel mask of shape (1, c_in, 1, 1).

    The first c_in // 2 channels are one and the remaining channels zero; invert=True swaps them.
    """
    num_ones = c_in // 2
    mask = torch.cat([torch.ones(num_ones, dtype=torch.float32), torch.zeros(c_in - num_ones, dtype=torch.float32)])
    mask = mask.view(1, c_in, 1, 1)
    if invert:
        mask = 1 - mask
    return mask


# %% [markdown]
# We can also visualize the corresponding masks for an image of size $8\times 8\times 2$ (2 channels):

# %%
checkerboard_mask = create_checkerboard_mask(h=8, w=8).expand(-1, 2, -1, -1)
channel_mask = create_channel_mask(c_in=2).expand(-1, -1, 8, 8)

show_imgs(checkerboard_mask.transpose(0, 1), "Checkerboard mask")
show_imgs(channel_mask.transpose(0, 1), "Channel mask")

# %% [markdown]
# As a last aspect of coupling layers, we need to decide for the deep neural network we want to apply in the coupling layers.
# The input to the layers is an image, and hence we stick with a CNN.
# Because the input to a transformation depends on all transformations before,
# it is crucial to ensure a good gradient flow through the CNN back to the input,
# which can be optimally achieved by a ResNet-like architecture.
# Specifically, we use a Gated ResNet that adds a $\sigma$-gate to the skip connection,
# similarly to the input gate in LSTMs.
# The details are not necessarily important here, and the network is
# strongly inspired by Flow++ [3] in case you are interested in building
# even stronger models.


# %%
class ConcatELU(nn.Module):
    """Activation function that applies ELU in both directions (inverted and plain).

    The two activations are concatenated along dim 1, so the output has twice as many channels as the input.
    Allows non-linearity while providing strong gradients for any input (important for final convolution)
    """

    def forward(self, x):
        return torch.cat([F.elu(x), F.elu(-x)], dim=1)


class LayerNormChannels(nn.Module):
    """Layer norm across the channel dimension (dim 1) of an image tensor."""

    def __init__(self, c_in, eps=1e-5):
        """
        Args:
            c_in: Number of channels of the input
            eps: Small constant to stabilize std
        """
        super().__init__()
        self.gamma = nn.Parameter(torch.ones(1, c_in, 1, 1))
        self.beta = nn.Parameter(torch.zeros(1, c_in, 1, 1))
        self.eps = eps

    def forward(self, x):
        # Statistics are computed per position over the channels (biased variance).
        mean = x.mean(dim=1, keepdim=True)
        var = x.var(dim=1, unbiased=False, keepdim=True)
        y = (x - mean) / torch.sqrt(var + self.eps)
        y = y * self.gamma + self.beta
        return y


class GatedConv(nn.Module):
    """Two-layer convolutional ResNet block with a sigmoid input gate."""

    def __init__(self, c_in, c_hidden):
        """
        Args:
            c_in: Number of channels of the input
            c_hidden: Number of hidden dimensions we want to model (usually similar to c_in)
        """
        super().__init__()
        # Each ConcatELU doubles the channel count, hence the factor 2 on the conv inputs.
        # The last conv emits 2 * c_in channels: one half is the value, the other the gate.
        self.net = nn.Sequential(
            ConcatELU(),
            nn.Conv2d(2 * c_in, c_hidden, kernel_size=3, padding=1),
            ConcatELU(),
            nn.Conv2d(2 * c_hidden, 2 * c_in, kernel_size=1),
        )

    def forward(self, x):
        out = self.net(x)
        val, gate = out.chunk(2, dim=1)
        return x + val * torch.sigmoid(gate)


class GatedConvNet(nn.Module):
    """Module that summarizes the previous blocks to a full convolutional neural network."""

    def __init__(self, c_in, c_hidden=32, c_out=-1, num_layers=3):
        """
        Args:
            c_in: Number of input channels
            c_hidden: Number of hidden dimensions to use within the network
            c_out: Number of output channels. If -1, 2 times the input channels are used (affine coupling)
            num_layers: Number of gated ResNet blocks to apply
        """
        super().__init__()
        c_out = c_out if c_out > 0 else 2 * c_in
        layers = [nn.Conv2d(c_in, c_hidden, kernel_size=3, padding=1)]
        for _ in range(num_layers):
            layers += [GatedConv(c_hidden, c_hidden), LayerNormChannels(c_hidden)]
        layers += [ConcatELU(), nn.Conv2d(2 * c_hidden, c_out, kernel_size=3, padding=1)]
        self.nn = nn.Sequential(*layers)

        # Zero-initialise the output convolution so the freshly built network outputs all zeros.
        # nn.init.zeros_ does this without touching `.data`, which bypasses autograd bookkeeping.
        nn.init.zeros_(self.nn[-1].weight)
        nn.init.zeros_(self.nn[-1].bias)

    def forward(self, x):
        return self.nn(x)


# %% [markdown]
# ### Training loop
#
# Finally, we can add Dequantization, Variational Dequantization and Coupling Layers together to build our full normalizing flow on MNIST images.
# We apply 8 coupling layers in the main flow, and 4 for variational dequantization if applied.
# We apply a checkerboard mask throughout the network as with a single channel (black-white images),
# we cannot apply channel mask.
# The overall architecture is visualized below.
#
#
#
# %%
def create_simple_flow(use_vardeq=True):
    """Build the single-scale flow: one dequantization layer followed by 8 coupling layers.

    Args:
        use_vardeq: If True, the first layer is a ``VariationalDequantization`` built from 4 coupling layers;
            otherwise a plain ``Dequantization`` layer is used.

    Returns:
        An ``ImageFlow`` wrapping the layer list, moved to the module-level ``device``.
    """
    flow_layers = []
    if use_vardeq:
        # Checkerboard masks alternate between plain and inverted from layer to layer.
        vardeq_layers = [
            CouplingLayer(
                network=GatedConvNet(c_in=2, c_out=2, c_hidden=16),
                mask=create_checkerboard_mask(h=28, w=28, invert=(i % 2 == 1)),
                c_in=1,
            )
            for i in range(4)
        ]
        flow_layers += [VariationalDequantization(var_flows=vardeq_layers)]
    else:
        flow_layers += [Dequantization()]

    for i in range(8):
        flow_layers += [
            CouplingLayer(
                network=GatedConvNet(c_in=1, c_hidden=32),
                mask=create_checkerboard_mask(h=28, w=28, invert=(i % 2 == 1)),
                c_in=1,
            )
        ]

    flow_model = ImageFlow(flow_layers).to(device)
    return flow_model


# %% [markdown]
# For implementing the training loop, we use the framework of PyTorch Lightning and reduce the code overhead.
# If interested, you can take a look at the generated tensorboard file,
# in particular the graph to see an overview of flow transformations that are applied.
# Note that we again provide pre-trained models (see later on in the notebook)
# as normalizing flows are particularly expensive to train.
# We have also run validation and testing as this can take some time as well with the added importance sampling.


# %%
def train_flow(flow, model_name="MNISTFlow"):
    """Load a pretrained checkpoint for ``flow`` if one exists, otherwise train it, then evaluate it.

    Args:
        flow: The flow model to train or to load weights into.
        model_name: Name used for the trainer's root directory and for the ``<model_name>.ckpt`` lookup
            inside ``CHECKPOINT_PATH``.

    Returns:
        A tuple ``(flow, result)``. ``result`` is the ``"result"`` entry stored in the checkpoint if present;
        otherwise a dict with keys ``"test"``, ``"val"`` and ``"time"`` computed here.
    """
    # Create a PyTorch Lightning trainer
    trainer = L.Trainer(
        default_root_dir=os.path.join(CHECKPOINT_PATH, model_name),
        accelerator="auto",
        devices=1,
        max_epochs=200,
        gradient_clip_val=1.0,
        callbacks=[
            ModelCheckpoint(save_weights_only=True, mode="min", monitor="val_bpd"),
            LearningRateMonitor("epoch"),
        ],
    )
    trainer.logger._log_graph = True
    trainer.logger._default_hp_metric = None  # Optional logging argument that we don't need

    train_data_loader = data.DataLoader(
        train_set, batch_size=128, shuffle=True, drop_last=True, pin_memory=True, num_workers=8
    )
    result = None

    # Check whether pretrained model exists. If yes, load it and skip training
    pretrained_filename = os.path.join(CHECKPOINT_PATH, model_name + ".ckpt")
    if os.path.isfile(pretrained_filename):
        print("Found pretrained model, loading...")
        ckpt = torch.load(pretrained_filename, map_location=device)
        flow.load_state_dict(ckpt["state_dict"])
        # Checkpoints may carry precomputed evaluation results; None if the key is absent.
        result = ckpt.get("result", None)
    else:
        print("Start training", model_name)
        trainer.fit(flow, train_data_loader, val_loader)

    # Test best model on validation and test set if no result has been found
    # Testing can be expensive due to the importance sampling.
    # NOTE(review): `flow` is evaluated with whatever weights it holds at this point; no checkpoint
    # is reloaded in this function after `trainer.fit` - confirm that this is intended.
    if result is None:
        val_result = trainer.test(flow, dataloaders=val_loader, verbose=False)
        start_time = time.time()
        test_result = trainer.test(flow, dataloaders=test_loader, verbose=False)
        duration = time.time() - start_time
        # "time" is the test-set wall time divided by the number of test batches and by flow.import_samples.
        result = {"test": test_result, "val": val_result, "time": duration / len(test_loader) / flow.import_samples}

    return flow, result


# %% [markdown]
# ## Multi-scale architecture
#
#
+# +# One disadvantage of normalizing flows is that they operate on the exact same dimensions as the input. +# If the input is high-dimensional, so is the latent space, which requires larger computational cost to learn suitable transformations. +# However, particularly in the image domain, many pixels contain less information in the sense +# that we could remove them without losing the semantic information of the image. +# +# Based on this intuition, deep normalizing flows on images commonly apply a multi-scale architecture [1]. +# After the first $N$ flow transformations, we split off half of the latent dimensions and directly evaluate them on the prior. +# The other half is run through $N$ more flow transformations, and depending on the size of the input, +# we split it again in half or stop overall at this position. +# The two operations involved in this setup are `Squeeze` and `Split` which +# we will review more closely and implement below. + +# %% [markdown] +# ### Squeeze and Split +# +# When we want to remove half of the pixels in an image, we have the problem of deciding which variables to cut, +# and how to rearrange the image. +# Thus, the squeezing operation is commonly used before split, which divides the image into subsquares +# of shape $2\times 2\times C$, and reshapes them into $1\times 1\times 4C$ blocks. +# Effectively, we reduce the height and width of the image by a factor of 2 while scaling the number of channels by 4. +# Afterwards, we can perform the split operation over channels without the need of rearranging the pixels. +# The smaller scale also makes the overall architecture more efficient. +# Visually, the squeeze operation should transform the input as follows: +# +#
#
# The input of $4\times 4\times 1$ is scaled to $2\times 2\times 4$ following
# the idea of grouping the pixels in $2\times 2\times 1$ subsquares.
# Next, let's try to implement this layer:


# %%
class SqueezeFlow(nn.Module):
    """Trade spatial resolution for channels by regrouping 2x2 pixel patches.

    The layer only rearranges values, so ``ldj`` is handed back unchanged.
    """

    def forward(self, z, ldj, reverse=False):
        batch, channels, height, width = z.shape
        if reverse:
            # Reverse direction: H/2 x W/2 x 4C => H x W x C
            out_channels = channels // 4
            patches = z.reshape(batch, out_channels, 2, 2, height, width)
            interleaved = patches.permute(0, 1, 4, 2, 5, 3)
            return interleaved.reshape(batch, out_channels, height * 2, width * 2), ldj

        # Forward direction: H x W x C => H/2 x W/2 x 4C
        half_h, half_w = height // 2, width // 2
        patches = z.reshape(batch, channels, half_h, 2, half_w, 2)
        stacked = patches.permute(0, 1, 3, 5, 2, 4)
        return stacked.reshape(batch, 4 * channels, half_h, half_w), ldj


# %% [markdown]
# Before moving on, we can verify our implementation by comparing our output with the example figure above:

# %%
sq_flow = SqueezeFlow()
rand_img = torch.arange(1, 17).view(1, 1, 4, 4)
print("Image (before)\n", rand_img)
forward_img, _ = sq_flow(rand_img, ldj=None, reverse=False)
print("\nImage (forward)\n", forward_img.permute(0, 2, 3, 1))  # Permute for readability
reconst_img, _ = sq_flow(forward_img, ldj=None, reverse=True)
print("\nImage (reverse)\n", reconst_img)

# %% [markdown]
# The split operation divides the input into two parts, and evaluates one part directly on the prior.
# So that our flow operation fits to the implementation of the previous layers,
# we will return the prior probability of the first part as the log determinant jacobian of the layer.
# It has the same effect as if we would combine all variable splits at the
# end of the flow, and evaluate them together on the prior.
# %%
class SplitFlow(nn.Module):
    """Split the channels in half and evaluate the second half directly on a standard normal prior.

    Forward: the second half of the channels is removed from ``z`` and its log-probability under the
    prior is added to ``ldj``. Reverse: new values for the removed half are sampled from the prior,
    concatenated to ``z`` along dim 1, and their log-probability is subtracted from ``ldj``.
    """

    def __init__(self):
        super().__init__()
        self.prior = torch.distributions.normal.Normal(loc=0.0, scale=1.0)

    def forward(self, z, ldj, reverse=False):
        """
        Args:
            z: Input tensor; the log-probability is summed over dims 1, 2 and 3.
            ldj: Per-sample log-determinant accumulator. It is updated in place.
            reverse: If True, run the sampling direction.

        Returns:
            Tuple ``(z, ldj)`` with half (forward) or double (reverse) the number of channels in ``z``.
        """
        if not reverse:
            z, z_split = z.chunk(2, dim=1)
            ldj += self.prior.log_prob(z_split).sum(dim=[1, 2, 3])
        else:
            # Place the sampled half on the same device as `z` rather than on a module-level
            # global, so the layer works wherever the model actually lives.
            z_split = self.prior.sample(sample_shape=z.shape).to(z.device)
            z = torch.cat([z, z_split], dim=1)
            ldj -= self.prior.log_prob(z_split).sum(dim=[1, 2, 3])
        return z, ldj


# %% [markdown]
# ### Building a multi-scale flow
#
# After defining the squeeze and split operation, we are finally able to build our own multi-scale flow.
# Deep normalizing flows such as Glow and Flow++ [2,3] often apply a split operation directly after squeezing.
# However, with shallow flows, we need to be more thoughtful about where to place the split operation as we need at least a minimum amount of transformations on each variable.
# Our setup is inspired by the original RealNVP architecture [1] which is shallower than other,
# more recent state-of-the-art architectures.
#
# Hence, for the MNIST dataset, we will apply the first squeeze operation after two coupling layers, but don't apply a split operation yet.
# Because we have only used two coupling layers and each variable has only been transformed once, a split operation would be too early.
# We apply two more coupling layers before finally applying a split flow and squeeze again.
# The last four coupling layers operate on a scale of $7\times 7\times 8$.
# The full flow architecture is shown below.
#
#
#
# Note that while the feature maps inside the coupling layers reduce with the height and width of the input,
# the increased number of channels is not directly considered.
# To counteract this, we increase the hidden dimensions for the coupling layers on the squeezed input.
# The dimensions are often scaled by 2 as this approximately increases the computation cost by 4 canceling with the squeezing operation.
# However, we will choose the hidden dimensionalities $32, 48, 64$ for the
# three scales respectively to keep the number of parameters reasonable
# and show the efficiency of multi-scale architectures.


# %%
def create_multiscale_flow():
    """Build the multi-scale flow.

    Layer order: variational dequantization (4 coupling layers), 2 checkerboard coupling layers,
    squeeze, 2 channel-mask coupling layers on 4 channels, split, squeeze, and 4 channel-mask
    coupling layers on 8 channels.

    Returns:
        An ``ImageFlow`` wrapping the layer list, moved to the module-level ``device``.
    """
    flow_layers = []

    vardeq_layers = [
        CouplingLayer(
            network=GatedConvNet(c_in=2, c_out=2, c_hidden=16),
            mask=create_checkerboard_mask(h=28, w=28, invert=(i % 2 == 1)),
            c_in=1,
        )
        for i in range(4)
    ]
    flow_layers += [VariationalDequantization(vardeq_layers)]

    # First scale: checkerboard masks, alternating plain / inverted.
    flow_layers += [
        CouplingLayer(
            network=GatedConvNet(c_in=1, c_hidden=32),
            mask=create_checkerboard_mask(h=28, w=28, invert=(i % 2 == 1)),
            c_in=1,
        )
        for i in range(2)
    ]
    flow_layers += [SqueezeFlow()]
    # Second scale: 4 channels after the squeeze, so channel masks are used from here on.
    for i in range(2):
        flow_layers += [
            CouplingLayer(
                network=GatedConvNet(c_in=4, c_hidden=48), mask=create_channel_mask(c_in=4, invert=(i % 2 == 1)), c_in=4
            )
        ]
    flow_layers += [SplitFlow(), SqueezeFlow()]
    # Third scale: 8 channels after split + squeeze.
    for i in range(4):
        flow_layers += [
            CouplingLayer(
                network=GatedConvNet(c_in=8, c_hidden=64), mask=create_channel_mask(c_in=8, invert=(i % 2 == 1)), c_in=8
            )
        ]

    flow_model = ImageFlow(flow_layers).to(device)
    return flow_model


# %% [markdown]
# We can show the difference in number of parameters below:


# %%
def print_num_params(model):
    """Print the total number of elements over all of ``model.parameters()``."""
    num_params = sum(np.prod(p.shape) for p in model.parameters())
    print(f"Number of parameters: {num_params:,}")


print_num_params(create_simple_flow(use_vardeq=False))
print_num_params(create_simple_flow(use_vardeq=True))
print_num_params(create_multiscale_flow())

# %% [markdown]
# Although the multi-scale flow has almost 3 times the parameters of the single scale flow,
# it is not necessarily more computationally expensive than its counterpart.
# We will compare the runtime in the following experiments as well.

# %% [markdown]
# ## Analysing the flows
#
# In the last part of the notebook, we will train all the models we have implemented above,
# and try to analyze the effect of the multi-scale architecture and variational dequantization.
#
# ### Training flow variants
#
# Before we can analyse the flow models, we need to train them first.
# We provide pre-trained models that contain the validation and test performance, and run-time information.
# As flow models are computationally expensive, we advise you to rely on
# those pretrained models for a first run through the notebook.

# %%
# One entry per model variant; each holds the (trained or loaded) model and its evaluation result.
flow_dict = {"simple": {}, "vardeq": {}, "multiscale": {}}
flow_dict["simple"]["model"], flow_dict["simple"]["result"] = train_flow(
    create_simple_flow(use_vardeq=False), model_name="MNISTFlow_simple"
)
flow_dict["vardeq"]["model"], flow_dict["vardeq"]["result"] = train_flow(
    create_simple_flow(use_vardeq=True), model_name="MNISTFlow_vardeq"
)
flow_dict["multiscale"]["model"], flow_dict["multiscale"]["result"] = train_flow(
    create_multiscale_flow(), model_name="MNISTFlow_multiscale"
)

# %% [markdown]
# ### Density modeling and sampling
#
# Firstly, we can compare the models on their quantitative results.
# The following table shows all important statistics.
# The inference time specifies the time needed to determine the
# probability for a batch of 64 images for each model, and the sampling
# time the duration it took to sample a batch of 64 images.

# %% language="html"
#
#

# %%

# One row per model: name, validation/test bpd, inference and sampling time in ms, parameter count.
# "samp_time" is optional in the result dict and is shown as 0 when missing.
table = [
    [
        key,
        "%4.3f bpd" % flow_dict[key]["result"]["val"][0]["test_bpd"],
        "%4.3f bpd" % flow_dict[key]["result"]["test"][0]["test_bpd"],
        "%2.0f ms" % (1000 * flow_dict[key]["result"]["time"]),
        "%2.0f ms" % (1000 * flow_dict[key]["result"].get("samp_time", 0)),
        "{:,}".format(sum(np.prod(p.shape) for p in flow_dict[key]["model"].parameters())),
    ]
    for key in flow_dict
]
display(
    HTML(
        tabulate.tabulate(
            table,
            tablefmt="html",
            headers=["Model", "Validation Bpd", "Test Bpd", "Inference time", "Sampling time", "Num Parameters"],
        )
    )
)

# %% [markdown]
# As we have initially expected, using variational dequantization improves upon standard dequantization in terms of bits per dimension.
# Although the difference of 0.04bpd doesn't seem impressive at first, it is a considerable step for generative models
# (most state-of-the-art models improve upon previous models in a range of 0.02-0.1bpd on CIFAR with three times as high bpd).
# While it takes longer to evaluate the probability of an image due to the variational dequantization,
# which also leads to a longer training time, it does not have an effect on the sampling time.
# This is because inverting variational dequantization is the same as dequantization: finding the next lower integer.
#
# When we compare the two models to the multi-scale architecture, we can see that the bits per dimension score again dropped by about 0.04bpd.
# Additionally, the inference time and sampling time improved notably despite having more parameters.
# Thus, we see that the multi-scale flow is not only stronger for density modeling, but also more efficient.
#
# Next, we can test the sampling quality of the models.
# We should note that the samples for variational dequantization and standard dequantization are very similar,
# and hence we visualize here only the ones for variational dequantization and the multi-scale model.
# However, feel free to also test out the `"simple"` model.
# The seeds are set to obtain reproducible generations and are not cherry picked.

# %%
L.seed_everything(44)
samples = flow_dict["vardeq"]["model"].sample(img_shape=[16, 1, 28, 28])
show_imgs(samples.cpu())

# %%
L.seed_everything(44)
# The multi-scale model is sampled in the shape of its final latent (8 x 7 x 7).
samples = flow_dict["multiscale"]["model"].sample(img_shape=[16, 8, 7, 7])
show_imgs(samples.cpu())

# %% [markdown]
# From the few samples, we can see a clear difference between the simple and the multi-scale model.
# The single-scale model has only learned local, small correlations while the multi-scale model was able to learn full,
# global relations that form digits.
# This show-cases another benefit of the multi-scale model.
# In contrast to VAEs, the outputs are sharp as normalizing flows can naturally model complex,
# multi-modal distributions while VAEs have the independent decoder output noise.
# Nevertheless, the samples from this flow are far from perfect as not all samples show true digits.

# %% [markdown]
# ### Interpolation in latent space
#
# Another popular test for the smoothness of the latent space of generative models is to interpolate between two training examples.
# As normalizing flows are strictly invertible, we can guarantee that any image is represented in the latent space.
# We again compare the variational dequantization model with the multi-scale model below.


# %%
@torch.no_grad()
def interpolate(model, img1, img2, num_steps=8):
    """Encode two images, linearly interpolate their latents, decode the result and display it.

    Args:
        model: object of ImageFlow class that represents the (trained) flow model
        img1, img2: Image tensors of shape [1, 28, 28]. Images between which should be interpolated.
        num_steps: Number of interpolation steps. 8 interpolation steps mean 6 intermediate pictures besides img1 and img2

    Returns:
        None. The decoded images are passed to ``show_imgs``.
    """
    imgs = torch.stack([img1, img2], dim=0).to(model.device)
    z, _ = model.encode(imgs)
    alpha = torch.linspace(0, 1, steps=num_steps, device=z.device).view(-1, 1, 1, 1)
    # alpha weights the latent of img1, so the sequence starts at img2 (alpha=0) and ends at img1 (alpha=1).
    interpolations = z[0:1] * alpha + z[1:2] * (1 - alpha)
    interp_imgs = model.sample(interpolations.shape[:1] + imgs.shape[1:], z_init=interpolations)
    # NOTE(review): row_size is fixed at 8 and does not follow num_steps - confirm this is intended.
    show_imgs(interp_imgs, row_size=8)


exmp_imgs, _ = next(iter(train_loader))

# %%
L.seed_everything(42)
for i in range(2):
    interpolate(flow_dict["vardeq"]["model"], exmp_imgs[2 * i], exmp_imgs[2 * i + 1])

# %%
L.seed_everything(42)
for i in range(2):
    interpolate(flow_dict["multiscale"]["model"], exmp_imgs[2 * i], exmp_imgs[2 * i + 1])

# %% [markdown]
# The interpolations of the multi-scale model result in more realistic digits
# (first row $7\leftrightarrow 8\leftrightarrow 6$, second row $9\leftrightarrow 4\leftrightarrow 6$),
# while the variational dequantization model focuses on local patterns that globally do not form a digit.
# For the multi-scale model, we actually did not do the "true" interpolation between the two images
# as we did not consider the variables that were split along the flow (they have been sampled randomly for all samples).
# However, as we will see in the next experiment, the early variables do not affect the overall image much.

# %% [markdown]
# ### Visualization of latents in different levels of multi-scale
#
# In the following we will focus more on the multi-scale flow.
# We want to analyse what information is being stored in the variables split at early layers,
# and what information for the final variables.
# For this, we sample 8 images where each of them share the same final latent variables,
# but differ in the other part of the latent variables.
# Below we visualize three examples of this:

# %%
L.seed_everything(44)
for _ in range(3):
    # Draw one final latent and repeat it 8 times, so the 8 samples share the same final latent.
    z_init = flow_dict["multiscale"]["model"].prior.sample(sample_shape=[1, 8, 7, 7])
    z_init = z_init.expand(8, -1, -1, -1)
    samples = flow_dict["multiscale"]["model"].sample(img_shape=z_init.shape, z_init=z_init)
    show_imgs(samples.cpu())

# %% [markdown]
# We see that the early split variables indeed have a smaller effect on the image.
# Still, small differences can be spotted when we look carefully at the borders of the digits.
# For instance, the hole at the top of the 8 changes for different samples although all of them represent the same coarse structure.
# This shows that the flow indeed learns to separate the higher-level
# information in the final variables, while the early split ones contain
# local noise patterns.

# %% [markdown]
# ### Visualizing Dequantization
#
# As a final part of this notebook, we will look at the effect of variational dequantization.
# We have motivated variational dequantization by the issue of sharp edges/borders being difficult to model,
# and a flow would rather prefer smooth, prior-like distributions.
# To check what noise distribution $q(u|x)$ the flows in the
# variational dequantization module have learned, we can plot a histogram
# of output values from the dequantization and variational dequantization
# module.
# %%
def visualize_dequant_distribution(model: ImageFlow, imgs: Tensor, title: str = None):
    """Plot a histogram of the values produced by the first layer of ``model`` for ``imgs``.

    The first flow layer (``model.flows[0]``) is applied 8 times to the same images and all outputs
    are pooled into one 256-bin density histogram.

    Args:
        model: The flow of which we want to visualize the dequantization distribution
        imgs: Example training images of which we want to visualize the dequantization distribution
        title: Optional title of the plot; no title is set when it is None.
    """
    imgs = imgs.to(device)
    ldj = torch.zeros(imgs.shape[0], dtype=torch.float32).to(device)
    with torch.no_grad():
        dequant_vals = []
        for _ in tqdm(range(8), leave=False):
            # Only the transformed values are kept; the returned ldj is discarded.
            d, _ = model.flows[0](imgs, ldj, reverse=False)
            dequant_vals.append(d)
        dequant_vals = torch.cat(dequant_vals, dim=0)
    dequant_vals = dequant_vals.view(-1).cpu().numpy()
    sns.set()
    plt.figure(figsize=(10, 3))
    # Fill colour is "C0" with 50% alpha appended to the RGB tuple.
    plt.hist(dequant_vals, bins=256, color=to_rgb("C0") + (0.5,), edgecolor="C0", density=True)
    if title is not None:
        plt.title(title)
    plt.show()
    plt.close()


sample_imgs, _ = next(iter(train_loader))

# %%
visualize_dequant_distribution(flow_dict["simple"]["model"], sample_imgs, title="Dequantization")

# %%
visualize_dequant_distribution(flow_dict["vardeq"]["model"], sample_imgs, title="Variational dequantization")

# %% [markdown]
# The dequantization distribution in the first plot shows that the MNIST images have a strong bias towards 0 (black),
# and the distribution of them has a sharp border as mentioned before.
# The variational dequantization module has indeed learned a much smoother distribution with a Gaussian-like curve which can be modeled much better.
# For the other values, we would need to visualize the distribution $q(u|x)$ on a deeper level, depending on $x$.
# However, as all $u$'s interact and depend on each other, we would need
# to visualize a distribution in 784 dimensions, which is not that
# intuitive anymore.

# %% [markdown]
# ## Conclusion
#
# In conclusion, we have seen how to implement our own normalizing flow, and what difficulties arise if we want to apply them on images.
+# Dequantization is a crucial step in mapping the discrete images into continuous space to prevent undesirable delta-peak solutions. +# While dequantization creates hypercubes with hard borders, variational dequantization allows us to fit a flow much better on the data. +# This allows us to obtain a lower bits per dimension score, while not affecting the sampling speed. +# The most common flow element, the coupling layer, is simple to implement, and yet effective. +# Furthermore, multi-scale architectures help to capture the global image context while allowing us to efficiently scale up the flow. +# Normalizing flows are an interesting alternative to VAEs as they allow an exact likelihood estimate in continuous space, +# and we have the guarantee that every possible input $x$ has a corresponding latent vector $z$. +# However, even beyond continuous inputs and images, flows can be applied and allow us to exploit +# the data structure in latent space, as e.g. on graphs for the task of molecule generation [6]. +# Recent advances in [Neural ODEs](https://arxiv.org/pdf/1806.07366.pdf) allow a flow with an infinite number of layers, +# called Continuous Normalizing Flows, whose potential is yet to be fully explored. +# Overall, normalizing flows are an exciting research area which will continue over the next couple of years. + +# %% [markdown] +# ## References +# +# [1] Dinh, L., Sohl-Dickstein, J., and Bengio, S. (2017). +# “Density estimation using Real NVP,” In: 5th International Conference on Learning Representations, ICLR 2017. +# [Link](https://arxiv.org/abs/1605.08803) +# +# [2] Kingma, D. P., and Dhariwal, P. (2018). +# “Glow: Generative Flow with Invertible 1x1 Convolutions,” In: Advances in Neural Information Processing Systems, vol. +# 31, pp. +# 10215--10224. +# [Link](http://papers.nips.cc/paper/8224-glow-generative-flow-with-invertible-1x1-convolutions.pdf) +# +# [3] Ho, J., Chen, X., Srinivas, A., Duan, Y., and Abbeel, P. (2019).
+# “Flow++: Improving Flow-Based Generative Models with Variational Dequantization and Architecture Design,” +# in Proceedings of the 36th International Conference on Machine Learning, vol. +# 97, pp. +# 2722–2730. +# [Link](https://arxiv.org/abs/1902.00275) +# +# [4] Durkan, C., Bekasov, A., Murray, I., and Papamakarios, G. (2019). +# “Neural Spline Flows,” In: Advances in Neural Information Processing Systems, pp. +# 7509–7520. +# [Link](http://papers.neurips.cc/paper/8969-neural-spline-flows.pdf) +# +# [5] Hoogeboom, E., Cohen, T. S., and Tomczak, J. M. (2020). +# “Learning Discrete Distributions by Dequantization,” arXiv preprint arXiv2001.11235v1. +# [Link](https://arxiv.org/abs/2001.11235) +# +# [6] Lippe, P., and Gavves, E. (2021). +# “Categorical Normalizing Flows via Continuous Transformations,” +# In: International Conference on Learning Representations, ICLR 2021. +# [Link](https://openreview.net/pdf?id=-GLNZeVDuik) diff --git a/_notebooks/course_UvA-DL/09-normalizing-flows/Squeeze_operation.svg b/_notebooks/course_UvA-DL/09-normalizing-flows/Squeeze_operation.svg new file mode 100644 index 0000000..cf66772 --- /dev/null +++ b/_notebooks/course_UvA-DL/09-normalizing-flows/Squeeze_operation.svg @@ -0,0 +1,3 @@ + + +
16
16
15
15
12
12
14
14
13
13
10
10
8
8
7
7
4
4
6
6
5
5
1
1
2
2
3
3
4
4
5
5
6
6
7
7
8
8
9
9
10
10
11
11
12
12
13
13
14
14
15
15
16
16
2
2
3
3
9
9
11
11
1
1
H x W x C
H x W x C
H/2 x W/2 x 4C
H/2 x W/2 x 4C
diff --git a/_notebooks/course_UvA-DL/09-normalizing-flows/comparison_GAN_VAE_NF.png b/_notebooks/course_UvA-DL/09-normalizing-flows/comparison_GAN_VAE_NF.png new file mode 100644 index 0000000..fffe9d2 Binary files /dev/null and b/_notebooks/course_UvA-DL/09-normalizing-flows/comparison_GAN_VAE_NF.png differ diff --git a/_notebooks/course_UvA-DL/09-normalizing-flows/coupling_flow.svg b/_notebooks/course_UvA-DL/09-normalizing-flows/coupling_flow.svg new file mode 100644 index 0000000..817758c --- /dev/null +++ b/_notebooks/course_UvA-DL/09-normalizing-flows/coupling_flow.svg @@ -0,0 +1,926 @@ + + + + + + image/svg+xmldiff --git a/_notebooks/course_UvA-DL/09-normalizing-flows/dequantization_issue.svg b/_notebooks/course_UvA-DL/09-normalizing-flows/dequantization_issue.svg new file mode 100644 index 0000000..f254085 --- /dev/null +++ b/_notebooks/course_UvA-DL/09-normalizing-flows/dequantization_issue.svg @@ -0,0 +1,417 @@ + + + + + + + + 2020-09-10T14:01:01.731212 + image/svg+xml + + + Matplotlib v3.3.0, https://matplotlib.org/ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/_notebooks/course_UvA-DL/09-normalizing-flows/image_to_gaussian.svg b/_notebooks/course_UvA-DL/09-normalizing-flows/image_to_gaussian.svg new file mode 100644 index 0000000..f287768 --- /dev/null +++ b/_notebooks/course_UvA-DL/09-normalizing-flows/image_to_gaussian.svg @@ -0,0 +1,3 @@ + + +
p(z)
p(z)
1x28x28
1x28x28
p(x)
p(x)
1x28x28
1x28x28
Normalizing Flow
Normalizing F...
diff --git a/_notebooks/course_UvA-DL/09-normalizing-flows/multiscale_flow.svg b/_notebooks/course_UvA-DL/09-normalizing-flows/multiscale_flow.svg new file mode 100644 index 0000000..db7af24 --- /dev/null +++ b/_notebooks/course_UvA-DL/09-normalizing-flows/multiscale_flow.svg @@ -0,0 +1,3 @@ + + +
(Variational) Dequantization
(Variational) Dequantizati...
Coupling layer
Coupling layer
Coupling layer
Coupling layer
Coupling layer
Coupling layer
Coupling layer
Coupling layer
Coupling layer
Coupling layer
Coupling layer
Coupling layer
Coupling layer
Coupling layer
Coupling layer
Coupling layer
p(x)
p(x)
p(z)
p(z)
1x28x28
1x28x28
1x28x28
1x28x28
Squeeze flow
Squeeze flow
1x28x28
=>
 4x14x14
1x28x28...
Squeeze flow
Squeeze flow
Split flow
Split flow
2x14x14
2x14x14
2x14x14
=>
8x7x7
2x14x14...
Concatenate and reshape
Concatenate and reshape
diff --git a/_notebooks/course_UvA-DL/09-normalizing-flows/normalizing_flow_layout.png b/_notebooks/course_UvA-DL/09-normalizing-flows/normalizing_flow_layout.png new file mode 100644 index 0000000..9a164b9 Binary files /dev/null and b/_notebooks/course_UvA-DL/09-normalizing-flows/normalizing_flow_layout.png differ diff --git a/_notebooks/course_UvA-DL/09-normalizing-flows/uniform_flow.png b/_notebooks/course_UvA-DL/09-normalizing-flows/uniform_flow.png new file mode 100644 index 0000000..34a08cf Binary files /dev/null and b/_notebooks/course_UvA-DL/09-normalizing-flows/uniform_flow.png differ diff --git a/_notebooks/course_UvA-DL/09-normalizing-flows/vanilla_flow.svg b/_notebooks/course_UvA-DL/09-normalizing-flows/vanilla_flow.svg new file mode 100644 index 0000000..6220752 --- /dev/null +++ b/_notebooks/course_UvA-DL/09-normalizing-flows/vanilla_flow.svg @@ -0,0 +1,3 @@ + + +
(Variational) Dequantization
(Variational) Dequantizati...
Coupling layer
Coupling layer
Coupling layer
Coupling layer
Coupling layer
Coupling layer
Coupling layer
Coupling layer
Coupling layer
Coupling layer
Coupling layer
Coupling layer
Coupling layer
Coupling layer
Coupling layer
Coupling layer
p(x)
p(x)
p(z)
p(z)
1x28x28
1x28x28
1x28x28
1x28x28
diff --git a/_notebooks/course_UvA-DL/10-autoregressive-image-modeling/.meta.yml b/_notebooks/course_UvA-DL/10-autoregressive-image-modeling/.meta.yml new file mode 100644 index 0000000..ac181f2 --- /dev/null +++ b/_notebooks/course_UvA-DL/10-autoregressive-image-modeling/.meta.yml @@ -0,0 +1,23 @@ +title: "Tutorial 10: Autoregressive Image Modeling" +author: Phillip Lippe +created: 2021-07-12 +updated: 2023-03-14 +license: CC BY-SA +build: 0 +tags: + - Image +description: | + In this tutorial, we implement an autoregressive likelihood model for the task of image modeling. + Autoregressive models are naturally strong generative models that constitute one of the current + state-of-the-art architectures on likelihood-based image modeling, + and are also the basis for large language generation models such as GPT3. + We will focus on the PixelCNN architecture in this tutorial, and apply it to MNIST modeling. + This notebook is part of a lecture series on Deep Learning at the University of Amsterdam. + The full list of tutorials can be found at https://uvadlc-notebooks.rtfd.io. +requirements: + - torchvision + - matplotlib + - seaborn + - lightning>=2.0.0rc0 +accelerator: + - GPU diff --git a/docs/_static/images/course_UvA-DL/10-autoregressive-image-modeling.jpg b/_notebooks/course_UvA-DL/10-autoregressive-image-modeling/.thumb.jpg similarity index 100% rename from docs/_static/images/course_UvA-DL/10-autoregressive-image-modeling.jpg rename to _notebooks/course_UvA-DL/10-autoregressive-image-modeling/.thumb.jpg diff --git a/_notebooks/course_UvA-DL/10-autoregressive-image-modeling/Autoregressive_Image_Modeling.py b/_notebooks/course_UvA-DL/10-autoregressive-image-modeling/Autoregressive_Image_Modeling.py new file mode 100644 index 0000000..5adb928 --- /dev/null +++ b/_notebooks/course_UvA-DL/10-autoregressive-image-modeling/Autoregressive_Image_Modeling.py @@ -0,0 +1,977 @@ +# %% [markdown] +#
+# +# Similar to the language generation you have seen in assignment 2, autoregressive models work on images by modeling the likelihood of a pixel given all previous ones. +# For instance, in the picture below, we model the pixel $x_i$ as a conditional probability distribution +# based on all previous (here blue) pixels (figure credit - [Aaron van den Oord et al. ](https://arxiv.org/abs/1601.06759)): +# +#
+# +# Generally, autoregressive models over high-dimensional data $\mathbf{x}$ factor the joint distribution as the following product of conditionals: +# +# $$p(\mathbf{x})=p(x_1, ..., x_n)=\prod_{i=1}^{n} p(x_i|x_1,...,x_{i-1})$$ +# +# Learning these conditionals is often much simpler than learning the joint distribution $p(\mathbf{x})$ all together. +# However, disadvantages of autoregressive models include slow sampling, especially for large images, +# as we need height-times-width forward passes through the model. +# In addition, for some applications, we require a latent space as modeled in VAEs and Normalizing Flows. +# For instance, in autoregressive models, we cannot interpolate between two images because of the lack of a latent representation. +# We will explore and discuss these benefits and drawbacks alongside our implementation. +# +# Our implementation will focus on the [PixelCNN](https://arxiv.org/pdf/1606.05328.pdf) [2] model which has been discussed in detail in the lecture. +# Most current SOTA models use PixelCNN as their fundamental architecture, +# and various additions have been proposed to improve the performance +# (e.g. [PixelCNN++](https://arxiv.org/pdf/1701.05517.pdf) and [PixelSNAIL](http://proceedings.mlr.press/v80/chen18h/chen18h.pdf)). +# Hence, implementing PixelCNN is a good starting point for our short tutorial. +# +# First of all, we need to import our standard libraries. As in +# the last couple of tutorials, we will use [PyTorch +# Lightning](https://lightning.ai/docs/pytorch/stable/) here as +# well. 

# %%

import math
import os
import urllib.request
from urllib.error import HTTPError

import lightning as L

# Imports for plotting
import matplotlib.pyplot as plt
import matplotlib_inline.backend_inline
import numpy as np
import seaborn as sns
import torch
import torch.nn as nn
import torch.nn.functional as F
import torch.optim as optim
import torch.utils.data as data
import torchvision
from lightning.pytorch.callbacks import LearningRateMonitor, ModelCheckpoint
from matplotlib.colors import to_rgb
from torch import Tensor
from torchvision import transforms
from torchvision.datasets import MNIST
from tqdm.notebook import tqdm

plt.set_cmap("cividis")
# %matplotlib inline
matplotlib_inline.backend_inline.set_matplotlib_formats("svg", "pdf")  # For export

# Path to the folder where the datasets are/should be downloaded (e.g. MNIST)
DATASET_PATH = os.environ.get("PATH_DATASETS", "data")
# Path to the folder where the pretrained models are saved.
# NOTE: the default folder name ("tutorial12") mirrors the folder used in `base_url` below.
CHECKPOINT_PATH = os.environ.get("PATH_CHECKPOINT", "saved_models/tutorial12")

# Setting the seed
L.seed_everything(42)

# Ensure that all operations are deterministic on GPU (if used) for reproducibility.
# The flag is spelled `deterministic`; a misspelled attribute would be created silently
# on the module and leave cuDNN's non-deterministic algorithms enabled.
torch.backends.cudnn.deterministic = True
torch.backends.cudnn.benchmark = False

# Fetching the device that will be used throughout this notebook
device = torch.device("cpu") if not torch.cuda.is_available() else torch.device("cuda:0")
print("Using device", device)

# %% [markdown]
# We again provide a pretrained model, which is downloaded below:

# %%
# Github URL where saved models are stored for this tutorial
base_url = "https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial12/"
# Files to download
pretrained_files = ["PixelCNN.ckpt"]
# Create checkpoint path if it doesn't exist yet
os.makedirs(CHECKPOINT_PATH, exist_ok=True)

# For each file, check whether it already exists. If not, try downloading it.
for file_name in pretrained_files:
    file_path = os.path.join(CHECKPOINT_PATH, file_name)
    # Only fetch files that are not already present locally
    if not os.path.isfile(file_path):
        file_url = base_url + file_name
        print("Downloading %s..." % file_url)
        try:
            urllib.request.urlretrieve(file_url, file_path)
        except HTTPError as e:
            # Only HTTP errors are reported here; the notebook continues without the file
            print(
                "Something went wrong. Please try to download the file from the GDrive folder, or contact the author with the full output including the following error:\n",
                e,
            )

# %% [markdown]
# Similar to the Normalizing Flows in Tutorial 11, we will work on the
# MNIST dataset and use 8-bits per pixel (values between 0 and 255). The
# dataset is loaded below:


# %%
# Convert images from 0-1 to 0-255 (integers). We use the long datatype as we will use the images as labels as well
def discretize(sample):
    """Scale `sample` by 255 and cast the result to `torch.long`."""
    return (sample * 255).to(torch.long)


# Transformations applied on each image => only make them a tensor
transform = transforms.Compose([transforms.ToTensor(), discretize])

# Loading the training dataset. We need to split it into a training and validation part
train_dataset = MNIST(root=DATASET_PATH, train=True, transform=transform, download=True)
# Re-seed right before the split so that the train/validation partition is reproducible
L.seed_everything(42)
train_set, val_set = torch.utils.data.random_split(train_dataset, [50000, 10000])

# Loading the test set
test_set = MNIST(root=DATASET_PATH, train=False, transform=transform, download=True)

# We define a set of data loaders that we can use for various purposes later.
train_loader = data.DataLoader(
    train_set,
    batch_size=128,
    shuffle=True,
    drop_last=True,
    pin_memory=True,
    num_workers=4,
)
val_loader = data.DataLoader(
    val_set,
    batch_size=128,
    shuffle=False,
    drop_last=False,
    num_workers=4,
)
test_loader = data.DataLoader(
    test_set,
    batch_size=128,
    shuffle=False,
    drop_last=False,
    num_workers=4,
)

# %% [markdown]
# A good practice is to always visualize some data examples to get an intuition of the data:


# %%
def show_imgs(imgs):
    """Plot a batch of images as a grid with at most four images per row.

    Args:
        imgs: Either a tensor whose first dimension indexes the images, or a
            sequence of image tensors.
    """
    if isinstance(imgs, Tensor):
        count = imgs.shape[0]
    else:
        count = len(imgs)
    per_row = min(count, 4)
    row_count = math.ceil(count / per_row)

    # Arrange the images in a grid and keep the values inside the 8-bit range
    grid = torchvision.utils.make_grid(imgs, nrow=per_row, pad_value=128).clamp(min=0, max=255)
    # Channels-first -> channels-last, as expected by matplotlib
    grid_hwc = np.transpose(grid.cpu().numpy(), (1, 2, 0))

    plt.figure(figsize=(1.5 * per_row, 1.5 * row_count))
    plt.imshow(grid_hwc, interpolation="nearest")
    plt.axis("off")
    plt.show()
    plt.close()


show_imgs([train_set[i][0] for i in range(8)])

# %% [markdown]
# ## Masked autoregressive convolutions
#
# The core module of PixelCNN is its masked convolutions.
# In contrast to language models, we don't apply an LSTM on each pixel one-by-one.
# This would be inefficient because images are grids instead of sequences.
# Thus, it is better to rely on convolutions that have shown great success in deep CNN classification models.
#
# Nevertheless, we cannot just apply standard convolutions without any changes.
# Remember that during training of autoregressive models, we want to use teacher forcing which both helps the model training, and significantly reduces the time needed for training.
# For image modeling, teacher forcing is implemented by using a training image as input to the model, and we want to obtain as output the prediction for each pixel based on *only* its predecessors.
# Thus, we need to ensure that the prediction for a specific pixel can only be influenced by its predecessors and not by its own value or any "future" pixels.
+# For this, we apply convolutions with a mask. +# +# Which mask we use depends on the ordering of pixels we decide on, i.e. which is the first pixel we predict, +# which is the second one, etc. +# The most commonly used ordering is to denote the upper left pixel as the start pixel, +# and sort the pixels row by row, as shown in the visualization at the top of the tutorial. +# Thus, the second pixel is on the right of the first one (first row, second column), +# and once we reach the end of the row, we start in the second row, first column. +# If we now want to apply this to our convolutions, we need to ensure that the prediction of pixel 1 +# is not influenced by its own "true" input, and all pixels on its right and in any lower row. +# In convolutions, this means that we want to set those entries of the weight matrix to zero that take pixels on the right and below into account. +# As an example for a 5x5 kernel, see a mask below (figure credit - [Aaron van den Oord](https://arxiv.org/pdf/1606.05328.pdf)): +# +#
#
# Before looking into the application of masked convolutions in PixelCNN
# in detail, let's first implement a module that allows us to apply an
# arbitrary mask to a convolution:


# %%
class MaskedConvolution(nn.Module):
    def __init__(self, c_in, c_out, mask, **kwargs):
        """Convolution whose kernel is multiplied element-wise with a fixed mask.

        Args:
            c_in: Number of input channels
            c_out: Number of output channels
            mask: Tensor of shape [kernel_size_H, kernel_size_W] with 0s where
                   the convolution should be masked, and 1s otherwise.
            kwargs: Additional arguments for the convolution
        """
        super().__init__()
        # The kernel extent is dictated by the mask; the padding is derived from it
        # (and from the dilation, if one is passed through kwargs)
        kernel_h, kernel_w = mask.shape[0], mask.shape[1]
        dilation = kwargs.get("dilation", 1)
        padding = (dilation * (kernel_h - 1) // 2, dilation * (kernel_w - 1) // 2)
        self.conv = nn.Conv2d(c_in, c_out, (kernel_h, kernel_w), padding=padding, **kwargs)

        # Registered as a buffer: not trained, but moved between devices with the module.
        # Two leading singleton dims let the mask broadcast over output and input channels.
        self.register_buffer("mask", mask[None, None])

    def forward(self, x):
        # Zero the masked weight entries in place before every convolution
        self.conv.weight.data.mul_(self.mask)
        return self.conv(x)


# %% [markdown]
# ### Vertical and horizontal convolution stacks
#
# To build our own autoregressive image model, we could simply stack a few masked convolutions on top of each other.
# This was actually the case for the original PixelCNN model, discussed in the paper
# [Pixel Recurrent Neural Networks](https://arxiv.org/pdf/1601.06759.pdf), but this leads to a considerable issue.
# When sequentially applying a couple of masked convolutions, the receptive field of a pixel
# is shown to have a "blind spot" on the right upper side, as shown in the figure below
# (figure credit - [Aaron van den Oord et al. ](https://arxiv.org/pdf/1606.05328.pdf)):
#
#
#
# Although a pixel should be able to take into account all other pixels above and left of it,
# a stack of masked convolutions does not allow us to look to the upper pixels on the right.
# This is because the features of the pixels above, which we use for convolution,
# do not contain any information of the pixels on the right of the same row.
# If they would, we would be "cheating" and actually looking into the future.
# To overcome this issue, van den Oord et al. [2]
# proposed to split the convolutions into a vertical and a horizontal stack.
# The vertical stack looks at all pixels above the current one, while the horizontal takes into account all on the left.
# While keeping both of them separate, we can actually look at the pixels on the right with the vertical stack without breaking any of our assumptions.
# The two convolutions are also shown in the figure above.
#
# Let us implement them here as follows:


# %%
class VerticalStackConvolution(MaskedConvolution):
    def __init__(self, c_in, c_out, kernel_size=3, mask_center=False, **kwargs):
        """Square masked convolution that ignores every kernel row below the center.

        Args:
            c_in: Number of input channels
            c_out: Number of output channels
            kernel_size: Height and width of the kernel
            mask_center: If True, the center row is masked as well
            kwargs: Additional arguments for the convolution
        """
        center_row = kernel_size // 2
        # First kernel row that gets zeroed. For efficiency, we could also reduce
        # the kernel size in height, but for simplicity, we stick with masking here.
        first_masked_row = center_row if mask_center else center_row + 1
        mask = torch.ones(kernel_size, kernel_size)
        mask[first_masked_row:, :] = 0

        super().__init__(c_in, c_out, mask, **kwargs)


class HorizontalStackConvolution(MaskedConvolution):
    def __init__(self, c_in, c_out, kernel_size=3, mask_center=False, **kwargs):
        """Single-row masked convolution that ignores every kernel column right of the center.

        Args:
            c_in: Number of input channels
            c_out: Number of output channels
            kernel_size: Width of the kernel (its height is always 1)
            mask_center: If True, the center pixel is masked as well
            kwargs: Additional arguments for the convolution
        """
        center_col = kernel_size // 2
        # Mask out all pixels on the right. The kernel has a height of 1
        # because we only look at pixels in the same row.
        first_masked_col = center_col if mask_center else center_col + 1
        mask = torch.ones(1, kernel_size)
        mask[0, first_masked_col:] = 0

        super().__init__(c_in, c_out, mask, **kwargs)


# %% [markdown]
# Note that we have an input argument called `mask_center`. Remember that
# the input to the model is the actual input image. Hence, the very first
# convolution we apply cannot use the center pixel as input, but must be
# masked. All consecutive convolutions, however, should use the center
# pixel as we otherwise lose the features of the previous layer. Hence,
# the input argument `mask_center` is True for the very first
# convolutions, and False for all others.

# %% [markdown]
# ### Visualizing the receptive field
#
# To validate our implementation of masked convolutions, we can visualize the receptive field we obtain with such convolutions.
# We should see that with increasing number of convolutional layers, the receptive field grows in both vertical and horizontal direction, without the issue of a blind spot.
# The receptive field can be empirically measured by backpropagating an arbitrary loss for the output features of a specific pixel with respect to the input.
# We implement this idea below, and visualize the receptive field below.

# %%
inp_img = torch.zeros(1, 1, 11, 11)
inp_img.requires_grad_()


def show_center_recep_field(img, out):
    """Visualize which input pixels influence the center pixel of `out`.

    The sum over the channels of the output center pixel is backpropagated to
    `img`; the absolute input gradients are plotted once as-is and once binarized.

    Args:
        img: Input image for which we want to calculate the receptive field on.
              It must be part of the computation graph of `out`.
        out: Output features/loss which is used for backpropagation, and should be
              the output of the network/computation graph.
    """
    # Sum of the center pixel's features acts as the (arbitrary) loss
    center_loss = out[0, :, img.shape[2] // 2, img.shape[3] // 2].sum()
    # The graph is retained because later calls backpropagate through the same graph again
    center_loss.backward(retain_graph=True)
    grad_map = img.grad.abs().squeeze().cpu().numpy()
    img.grad.fill_(0)  # Reset grads so that repeated calls do not accumulate

    # Left: gradient magnitudes, right: binary "has gradient" map
    _, axes = plt.subplots(1, 2)
    axes[0].imshow(grad_map)
    axes[1].imshow(grad_map > 0)

    # Mark the center pixel in red if it doesn't have any gradients (should be
    # the case for standard autoregressive models)
    mark_center = grad_map[grad_map.shape[0] // 2, grad_map.shape[1] // 2] == 0
    overlay = None
    if mark_center:
        overlay = np.zeros(grad_map.shape + (4,))
        overlay[overlay.shape[0] // 2, overlay.shape[1] // 2, :] = np.array([1.0, 0.0, 0.0, 1.0])
    for axis in axes:
        axis.axis("off")
        if mark_center:
            axis.imshow(overlay)

    axes[0].set_title("Weighted receptive field")
    axes[1].set_title("Binary receptive field")
    plt.show()
    plt.close()


show_center_recep_field(inp_img, inp_img)

# %% [markdown]
# Let's first visualize the receptive field of a horizontal convolution
# without the center pixel. We use a small, arbitrary input image
# ($11\times 11$ pixels), and calculate the loss for the center pixel. For
# simplicity, we initialize all weights with 1 and the bias with 0, and
# use a single channel. This is sufficient for our visualization purposes.

# %%
horiz_conv = HorizontalStackConvolution(c_in=1, c_out=1, kernel_size=3, mask_center=True)
horiz_conv.conv.weight.data.fill_(1)
horiz_conv.conv.bias.data.fill_(0)
horiz_img = horiz_conv(inp_img)
show_center_recep_field(inp_img, horiz_img)

# %% [markdown]
# The receptive field is shown in yellow, the center pixel in red, and all other pixels outside of the receptive field are dark blue.
# As expected, the receptive field of a single horizontal convolution with the center pixel masked and a $3\times3$ kernel is only the pixel on the left.
# If we use a larger kernel size, more pixels would be taken into account on the left.
#
# Next, let's take a look at the vertical convolution:

# %%
vert_conv = VerticalStackConvolution(c_in=1, c_out=1, kernel_size=3, mask_center=True)
vert_conv.conv.weight.data.fill_(1)
vert_conv.conv.bias.data.fill_(0)
vert_img = vert_conv(inp_img)
show_center_recep_field(inp_img, vert_img)

# %% [markdown]
# The vertical convolution takes all pixels above into account. Combining
# these two, we get the L-shaped receptive field of the original masked
# convolution:

# %%
# `horiz_img` from the previous cell is overwritten with the sum of both streams
horiz_img = vert_img + horiz_img
show_center_recep_field(inp_img, horiz_img)

# %% [markdown]
# If we stack multiple horizontal and vertical convolutions, we need to take two aspects into account:
#
# 1.
# The center should not be masked anymore for the following convolutions as the features at the pixel's position are already independent of its actual value.
# If it is hard to imagine why we can do this, just change the value below to `mask_center=True` and see what happens.
# 2.
# The vertical convolution is not allowed to work on features from the horizontal convolution.
# In the feature map of the horizontal convolutions, a pixel contains information about all of the "true" pixels on the left.
# If we apply a vertical convolution which also uses features from the right, we effectively expand our receptive field to the true input which we want to prevent.
# Thus, the feature maps can only be merged for the horizontal convolution.
#
# Using this, we can stack the convolutions in the following way. We have
# two feature streams: one for the vertical stack, and one for the
# horizontal stack. The horizontal convolutions can operate on the joint
# features of the previous horizontal and vertical convolutions, while
# the vertical stack only takes its own previous features as input. For a
# quick implementation, we can therefore sum the horizontal and vertical
# output features at each layer, and use those as final output features to
# calculate the loss on. An implementation of 4 consecutive layers is
# shown below. Note that we reuse the features from the other convolutions
# with `mask_center=True` from above.

# %%
# Initialize convolutions with equal weight to all input pixels
horiz_conv = HorizontalStackConvolution(c_in=1, c_out=1, kernel_size=3, mask_center=False)
horiz_conv.conv.weight.data.fill_(1)
horiz_conv.conv.bias.data.fill_(0)
vert_conv = VerticalStackConvolution(c_in=1, c_out=1, kernel_size=3, mask_center=False)
vert_conv.conv.weight.data.fill_(1)
vert_conv.conv.bias.data.fill_(0)

# We reuse our convolutions for the 4 layers here. Note that in a standard network,
# we don't do that, and instead learn 4 separate convolutions. As this cell is only for
# visualization purposes, we reuse the convolutions for all layers.
for l_idx in range(4):
    # The vertical stream only ever sees its own previous features
    vert_img = vert_conv(vert_img)
    # The horizontal stream additionally receives the updated vertical features
    horiz_img = horiz_conv(horiz_img) + vert_img
    # Layer 1 is the masked-center layer computed in the cells above, hence the offset of 2
    print("Layer %i" % (l_idx + 2))
    show_center_recep_field(inp_img, horiz_img)

# %% [markdown]
# The receptive field above is visualized for the horizontal stack, which includes the features of the vertical convolutions.
# It grows over layers without any blind spot as we had before.
# The difference between "weighted" and "binary" receptive field is that for the latter, we check whether there are any gradients flowing back to this pixel.
# This indicates that the center pixel indeed can use information from this pixel.
# Nevertheless, due to the convolution weights, some pixels have a stronger effect on the prediction than others.
# This is visualized in the weighted receptive field by plotting the gradient magnitude for each pixel instead of a binary yes/no.
#
#
# Another receptive field we can check is the one for the vertical stack
# as the one above is for the horizontal stack. Let's visualize it below:

# %%
show_center_recep_field(inp_img, vert_img)

# %% [markdown]
# As we have discussed before, the vertical stack only looks at pixels above the one we want to predict.
# Hence, we can validate that our implementation works as we initially expected it to.
# As a final step, let's clean up the computation graph we still had kept
# in memory for the visualization of the receptive field:

# %%
del inp_img, horiz_conv, vert_conv

# %% [markdown]
# ## Gated PixelCNN
#
#
+# +# In the next step, we will use the masked convolutions to build a full autoregressive model, called Gated PixelCNN. +# The difference between the original PixelCNN and Gated PixelCNN is the use of separate horizontal and vertical stacks. +# However, in literature, you often see that people refer to the Gated PixelCNN simply as "PixelCNN". +# Hence, in the following, if we say "PixelCNN", we usually mean the gated version. +# What "Gated" refers to in the model name is explained next. +# +# ### Gated Convolutions +# +# For visualizing the receptive field, we assumed a very simplified stack of vertical and horizontal convolutions. +# Obviously, there are more sophisticated ways of doing it, and PixelCNN uses gated convolutions for this. +# Specifically, the Gated Convolution block in PixelCNN looks as follows +# (figure credit - [Aaron van den Oord et al. ](https://arxiv.org/pdf/1606.05328.pdf)): +# +#
+# +# The left path is the vertical stack (the $N\times N$ convolution is masked correspondingly), +# and the right path is the horizontal stack. +# Gated convolutions are implemented by having a twice as large output channel size, +# and combining the two halves by an element-wise multiplication of a $\tanh$ and a sigmoid. +# For a linear layer, we can express a gated activation unit as follows: +# +# $$\mathbf{y} = \tanh\left(\mathbf{W}_{f}\mathbf{x}\right)\odot\sigma\left(\mathbf{W}_{g}\mathbf{x}\right)$$ +# +# For simplicity, biases have been neglected and the linear layer split into two parts, $\mathbf{W}_{f}$ and $\mathbf{W}_{g}$. +# This concept resembles the input and modulation gate in an LSTM, and has been used in many other architectures as well. +# The main motivation behind this gated activation is that it might allow the model to capture more complex interactions and simplify learning. +# But as in any other architecture, this is mostly a design choice and can be considered a hyperparameter. +# +# Besides the gated convolutions, we also see that the horizontal stack uses a residual connection while the vertical stack does not. +# This is because we use the output of the horizontal stack for prediction. +# Each convolution in the vertical stack also receives a strong gradient signal +# as it is only two $1\times 1$ convolutions away from the residual connection, +# and does not require another residual connection to all its earlier layers. 
#
# The implementation in PyTorch is fairly straight forward for this block,
# because the visualization above gives us a computation graph to follow:


# %%
class GatedMaskedConv(nn.Module):
    def __init__(self, c_in, **kwargs):
        """Gated convolution block implementing the computation graph shown above.

        Args:
            c_in: Number of channels of both the vertical and the horizontal stack
            kwargs: Additional arguments forwarded to both masked convolutions
        """
        super().__init__()
        gated_channels = 2 * c_in  # one half for the tanh path, one half for the sigmoid gate
        self.conv_vert = VerticalStackConvolution(c_in, c_out=gated_channels, **kwargs)
        self.conv_horiz = HorizontalStackConvolution(c_in, c_out=gated_channels, **kwargs)
        self.conv_vert_to_horiz = nn.Conv2d(gated_channels, gated_channels, kernel_size=1, padding=0)
        self.conv_horiz_1x1 = nn.Conv2d(c_in, c_in, kernel_size=1, padding=0)

    @staticmethod
    def _gate(features):
        """Split `features` in two along the channel dim and return tanh(first) * sigmoid(second)."""
        value, gate = features.chunk(2, dim=1)
        return torch.tanh(value) * torch.sigmoid(gate)

    def forward(self, v_stack, h_stack):
        """Return the updated `(v_stack, h_stack)` feature pair."""
        # Vertical stack (left): masked convolution followed by the gate
        vert_pre_gate = self.conv_vert(v_stack)
        v_stack_out = self._gate(vert_pre_gate)

        # Horizontal stack (right): add the 1x1-projected, not yet gated vertical features
        horiz_pre_gate = self.conv_horiz(h_stack) + self.conv_vert_to_horiz(vert_pre_gate)
        horiz_gated = self._gate(horiz_pre_gate)
        # 1x1 convolution plus the residual connection to the block input
        h_stack_out = self.conv_horiz_1x1(horiz_gated) + h_stack

        return v_stack_out, h_stack_out


# %% [markdown]
# ### Building the model
#
# Using the gated convolutions, we can now build our PixelCNN model.
# The architecture consists of multiple stacked GatedMaskedConv blocks, where we add an additional dilation factor to a few convolutions.
# This is used to increase the receptive field of the model and allows to take a larger context into account during generation.
# As a reminder, dilation on a convolution looks as follows
# (figure credit - [Vincent Dumoulin and Francesco Visin](https://arxiv.org/pdf/1603.07285.pdf)):
#
#
#
# Note that the smaller output size is only because the animation assumes no padding.
# In our implementation, we will pad the input image correspondingly.
# Alternatively to dilated convolutions, we could downsample the input and use an encoder-decoder architecture as in PixelCNN++ [3].
# This is especially beneficial if we want to build a very deep autoregressive model.
# Nonetheless, as we seek to train a reasonably small model, dilated convolutions are the more efficient option to use here.
#
# Below, we implement the PixelCNN model as a PyTorch Lightning module.
# Besides the stack of gated convolutions, we also have the initial
# horizontal and vertical convolutions which mask the center pixel, and a
# final $1\times 1$ convolution which maps the output features to class
# predictions. To determine the likelihood of a batch of images, we first
# create our initial features using the masked horizontal and vertical
# input convolution. Next, we forward the features through the stack of
# gated convolutions. Finally, we take the output features of the
# horizontal stack, and apply the $1\times 1$ convolution for
# classification. We use the bits per dimension metric for the likelihood,
# similarly to Tutorial 11 and assignment 3.


# %%
class PixelCNN(L.LightningModule):
    def __init__(self, c_in, c_hidden):
        """Gated PixelCNN predicting a 256-way distribution for every pixel and channel.

        Args:
            c_in: Number of image channels
            c_hidden: Number of feature channels used inside the network
        """
        super().__init__()
        self.save_hyperparameters()

        # Initial convolutions skipping the center pixel
        self.conv_vstack = VerticalStackConvolution(c_in, c_hidden, mask_center=True)
        self.conv_hstack = HorizontalStackConvolution(c_in, c_hidden, mask_center=True)
        # Convolution block of PixelCNN. We use dilation instead of downscaling
        self.conv_layers = nn.ModuleList(
            [
                GatedMaskedConv(c_hidden),
                GatedMaskedConv(c_hidden, dilation=2),
                GatedMaskedConv(c_hidden),
                GatedMaskedConv(c_hidden, dilation=4),
                GatedMaskedConv(c_hidden),
                GatedMaskedConv(c_hidden, dilation=2),
                GatedMaskedConv(c_hidden),
            ]
        )
        # Output classification convolution (1x1): 256 logits per input channel
        self.conv_out = nn.Conv2d(c_hidden, c_in * 256, kernel_size=1, padding=0)

        # A single training image with an added batch dimension (taken from the
        # notebook-level `train_set`)
        self.example_input_array = train_set[0][0][None]

    def forward(self, x):
        """Forward image through model and return logits for each pixel.

        Args:
            x: Image tensor with integer values between 0 and 255.

        Returns:
            Logits of shape [Batch, Classes (256), Channels, Height, Width].
        """
        # Scale input from 0 to 255 back to -1 to 1
        x = (x.float() / 255.0) * 2 - 1

        # Initial convolutions
        v_stack = self.conv_vstack(x)
        h_stack = self.conv_hstack(x)
        # Gated Convolutions
        for layer in self.conv_layers:
            v_stack, h_stack = layer(v_stack, h_stack)
        # 1x1 classification convolution
        # Apply ELU before 1x1 convolution for non-linearity on residual connection
        out = self.conv_out(F.elu(h_stack))

        # Output dimensions: [Batch, Classes, Channels, Height, Width]
        out = out.reshape(out.shape[0], 256, out.shape[1] // 256, out.shape[2], out.shape[3])
        return out

    def calc_likelihood(self, x):
        """Return the batch-averaged bits per dimension of the images `x`."""
        # Forward pass with bpd likelihood calculation; the images serve as their own labels
        pred = self.forward(x)
        nll = F.cross_entropy(pred, x, reduction="none")
        # Average over channels/height/width and convert from nats to bits
        bpd = nll.mean(dim=[1, 2, 3]) * np.log2(np.exp(1))
        return bpd.mean()

    @torch.no_grad()
    def sample(self, img_shape, img=None):
        """Sampling function for the autoregressive model.

        Args:
            img_shape: Shape of the image to generate (B,C,H,W)
            img (optional): If given, this tensor will be used as
                             a starting image. The pixels to fill
                             should be -1 in the input tensor.
                             The tensor is modified in place.

        Returns:
            The image tensor with all -1 entries replaced by sampled values.
        """
        # Create empty image on the device the module currently lives on, rather than
        # on a notebook-level global that may differ from where the weights are
        if img is None:
            img = torch.full(img_shape, -1, dtype=torch.long, device=self.device)
        # Generation loop
        for h in tqdm(range(img_shape[2]), leave=False):
            for w in range(img_shape[3]):
                for c in range(img_shape[1]):
                    # Skip if no image in the batch needs this value filled (-1)
                    to_fill = img[:, c, h, w] == -1
                    if not to_fill.any().item():
                        continue
                    # For efficiency, we only have to input the upper part of the image
                    # as all other parts will be skipped by the masked convolutions anyways
                    pred = self.forward(img[:, :, : h + 1, :])
                    probs = F.softmax(pred[:, :, c, h, w], dim=-1)
                    drawn = torch.multinomial(probs, num_samples=1).squeeze(dim=-1)
                    # Only overwrite the entries that were marked with -1, so that values
                    # given in a starting image are kept even if other images in the
                    # batch still need this position to be sampled
                    img[:, c, h, w] = torch.where(to_fill, drawn, img[:, c, h, w])
        return img

    def configure_optimizers(self):
        """Adam with a learning rate that is multiplied by 0.99 at every scheduler step."""
        optimizer = optim.Adam(self.parameters(), lr=1e-3)
        scheduler = optim.lr_scheduler.StepLR(optimizer, 1, gamma=0.99)
        return [optimizer], [scheduler]

    def training_step(self, batch, batch_idx):
        # batch[0] holds the images; the second entry of the batch is not used
        loss = self.calc_likelihood(batch[0])
        self.log("train_bpd", loss)
        return loss

    def validation_step(self, batch, batch_idx):
        loss = self.calc_likelihood(batch[0])
        self.log("val_bpd", loss)

    def test_step(self, batch, batch_idx):
        loss = self.calc_likelihood(batch[0])
        self.log("test_bpd", loss)


# %% [markdown]
# To sample from the autoregressive model, we need to iterate over all dimensions of the input.
# We start with an empty image, and fill the pixels one by one, starting from the upper left corner.
# Note that as for predicting $x_i$, all pixels below it have no influence on the prediction.
# Hence, we can cut the image in height without changing the prediction while increasing efficiency.
# Nevertheless, all the loops in the sampling function already show that it will take us quite some time to sample.
# A lot of computation could be reused across loop iterations as the features of the already predicted pixels will not change over iterations.
# Nevertheless, this takes quite some effort to implement, and is often not done in implementations because in the end,
# autoregressive sampling remains sequential and slow.
# Hence, we settle with the default implementation here.
#
# Before training the model, we can check the full receptive field of the model on an MNIST image of size $28\times 28$:

# %%
test_model = PixelCNN(c_in=1, c_hidden=64)
inp = torch.zeros(1, 1, 28, 28)
inp.requires_grad_()
out = test_model(inp)
show_center_recep_field(inp, out.squeeze(dim=2))
del inp, out, test_model

# %% [markdown]
# The visualization shows that for predicting any pixel, we can take almost half of the image into account.
# However, keep in mind that this is the "theoretical" receptive field and not necessarily
# the [effective receptive field](https://arxiv.org/pdf/1701.04128.pdf), which is usually much smaller.
# For a stronger model, we should therefore try to increase the receptive
# field even further. Especially, for the pixel on the bottom right, the
# very last pixel, we would be allowed to take into account the whole
# image. However, our current receptive field only spans across 1/4 of the
# image. An encoder-decoder architecture can help with this, but it also
# shows that we require a much deeper, more complex network in
# autoregressive models than in VAEs or energy-based models.

# %% [markdown]
# ### Training loop
#
# To train the model, we again can rely on PyTorch Lightning and write a
# function below for loading the pretrained model if it exists. To reduce
# the computational cost, we have saved the validation and test score in
# the checkpoint already:


# %%
def train_model(**kwargs):
    """Load the pretrained PixelCNN if its checkpoint exists, otherwise train a new one.

    Args:
        kwargs: Constructor arguments for `PixelCNN`; only used when training from scratch.

    Returns:
        Tuple of the model and a result object: either the "result" entry stored in the
        pretrained checkpoint, or a dict with the "test" and "val" outputs of `trainer.test`.
    """
    # Trainer that checkpoints on the lowest validation bpd and logs the learning rate per epoch
    callbacks = [
        ModelCheckpoint(save_weights_only=True, mode="min", monitor="val_bpd"),
        LearningRateMonitor("epoch"),
    ]
    trainer = L.Trainer(
        default_root_dir=os.path.join(CHECKPOINT_PATH, "PixelCNN"),
        accelerator="auto",
        devices=1,
        max_epochs=150,
        callbacks=callbacks,
    )

    # Check whether pretrained model exists. If yes, load it and skip training
    pretrained_filename = os.path.join(CHECKPOINT_PATH, "PixelCNN.ckpt")
    result = None
    if not os.path.isfile(pretrained_filename):
        model = PixelCNN(**kwargs)
        trainer.fit(model, train_loader, val_loader)
    else:
        print("Found pretrained model, loading...")
        model = PixelCNN.load_from_checkpoint(pretrained_filename)
        # The checkpoint file may additionally carry precomputed scores under "result"
        ckpt = torch.load(pretrained_filename, map_location=device)
        result = ckpt.get("result")
    model = model.to(device)

    if result is not None:
        return model, result

    # No stored scores: evaluate the model on the validation and test set.
    # NOTE(review): after a fresh training run this evaluates the weights held by `model`
    # at the end of `fit`, not the best checkpoint tracked by ModelCheckpoint.
    val_result = trainer.test(model, dataloaders=val_loader, verbose=False)
    test_result = trainer.test(model, dataloaders=test_loader, verbose=False)
    return model, {"test": test_result, "val": val_result}


# %% [markdown]
# Training the model is time consuming and we recommend using the provided pre-trained model for going through this notebook.
# However, feel free to play around with the hyperparameters, like the number of layers etc.,
# if you want to get a feeling for those.
+# +# When calling the training function with a pre-trained model, we automatically load it and print its test performance: + +# %% +model, result = train_model(c_in=1, c_hidden=64) +test_res = result["test"][0] +print( + "Test bits per dimension: %4.3fbpd" % (test_res["test_loss"] if "test_loss" in test_res else test_res["test_bpd"]) +) + +# %% [markdown] +# With a test performance of 0.809bpd, the PixelCNN significantly outperforms the normalizing flows we have seen in Tutorial 11. +# Considering image modeling as an autoregressive problem simplifies the learning process as predicting +# one pixel given the ground truth of all others is much easier than predicting all pixels at once. +# In addition, PixelCNN can explicitly predict the pixel values by a discrete softmax while +# Normalizing Flows have to learn transformations in continuous latent space. +# These two aspects allow the PixelCNN to achieve a notably better performance. +# +# To fully compare the models, let's also measure the number of parameters of the PixelCNN: + +# %% +num_params = sum(np.prod(param.shape) for param in model.parameters()) +print(f"Number of parameters: {num_params:,}") + +# %% [markdown] +# Compared to the multi-scale normalizing flows, the PixelCNN has considerably less parameters. +# Of course, the number of parameters depend on our hyperparameter choices. +# Nevertheless, in general, it can be said that autoregressive models +# require considerably less parameters than normalizing flows to reach +# good performance, based on the reasons stated above. Still, +# autoregressive models are much slower in sampling than normalizing +# flows, which limits their possible applications. + +# %% [markdown] +# ## Sampling +# +# One way of qualitatively analysing generative models is by looking at the actual samples. 
+# Let's therefore use our sampling function to generate a few digits: + +# %% +L.seed_everything(1) +samples = model.sample(img_shape=(16, 1, 28, 28)) +show_imgs(samples.cpu()) + +# %% [markdown] +# Most of the samples can be identified as digits, and overall we achieve a better quality than we had in normalizing flows. +# This goes along with the lower likelihood we achieved with autoregressive models. +# Nevertheless, we also see that there is still place for improvement +# as a considerable amount of samples cannot be identified (for example the first row). +# Deeper autoregressive models are expected to achieve better quality, +# as they can take more context into account for generating the pixels. +# +# Note that on Google Colab, you might see different results, specifically with a white line at the top. +# After some debugging, it seemed that the difference occurs inside the dilated convolution, +# as it gives different results for different batch sizes. +# However, it is hard to debug this further as it might be a bug of the installed PyTorch version on Google Colab. +# +# The trained model itself is not restricted to any specific image size. +# However, what happens if we actually sample a larger image than we had +# seen in our training dataset? Let's try below to sample images of size +# $64\times64$ instead of $28\times28$: + +# %% +L.seed_everything(1) +samples = model.sample(img_shape=(8, 1, 64, 64)) +show_imgs(samples.cpu()) + +# %% [markdown] +# The larger images show that changing the size of the image during testing confuses the model +# and generates abstract figures (you can sometimes spot a digit in the upper left corner). +# In addition, sampling for images of 64x64 pixels take more than a minute on a GPU. +# Clearly, autoregressive models cannot be scaled to large images without changing the sampling procedure such as with [forecasting](https://arxiv.org/abs/2002.09928). 
# Our implementation is also not the most efficient as many computations can be stored and reused throughout the sampling process.
# Nevertheless, the sampling procedure stays sequential which is
# inherently slower than parallel generation like done in normalizing
# flows.

# %% [markdown]
# ### Autocompletion
#
# One common application done with autoregressive models is
# auto-completing an image. As autoregressive models predict pixels one by
# one, we can set the first $N$ pixels to predefined values and check how
# the model completes the image. For implementing this, we just need to
# skip the iterations in the sampling loop that already have a value
# unequals -1. See above in our PyTorch Lightning module for the specific
# implementation. In the cell below, we randomly take three images from
# the training set, mask about the lower half of the image, and let the
# model autocomplete it. To see the diversity of samples, we do this 12
# times for each image:


# %%
def autocomplete_image(img):
    """Mask the lower part of ``img`` and show 12 completions sampled from the model.

    Inputs:
        img - 3-dimensional image tensor (presumably [C, H, W]); it is not modified,
              the masking is done on a clone.
    """
    # Everything from index 10 onwards along the second dimension is set to -1,
    # which marks those positions as "to be generated" for the sampler.
    masked = img.clone()
    masked[:, 10:, :] = -1
    print("Original image and input image to sampling:")
    show_imgs([img, masked])
    # Stack 12 views of the masked image into one batch on the target device
    batch = masked.unsqueeze(dim=0).expand(12, -1, -1, -1).to(device)
    # Fixed seed so that the shown completions are reproducible
    L.seed_everything(1)
    completions = model.sample(batch.shape, batch)
    print("Autocompletion samples:")
    show_imgs(completions)


for i in range(1, 4):
    img = train_set[i][0]
    autocomplete_image(img)

# %% [markdown]
# For the first two digits (7 and 6), we see that the 12 samples all
# result in a shape which resemble the original digit. Nevertheless, there
# are some style difference in writing the 7, and some deformed sixes in
# the samples. When autocompleting the 9 below, we see that the model can
# fit multiple digits to it. We obtain diverse samples from 0, 3, 8 and 9.
+# This shows that despite having no latent space, we can still obtain +# diverse samples from an autoregressive model. + +# %% [markdown] +# ### Visualization of the predictive distribution (softmax) +# +# Autoregressive models use a softmax over 256 values to predict the next pixel. +# This gives the model a large flexibility as the probabilities for each pixel value can be learned independently if necessary. +# However, the values are actually not independent because the values 32 and 33 are much closer than 32 and 255. +# In the following, we visualize the softmax distribution that the model predicts to gain insights how it has learned the relationships of close-by pixels. +# +# To do this, we first run the model on a batch of images and store the output softmax distributions: + +# %% +det_loader = data.DataLoader(train_set, batch_size=128, shuffle=False, drop_last=False) +imgs, _ = next(iter(det_loader)) +imgs = imgs.to(device) +with torch.no_grad(): + out = model(imgs) + out = F.softmax(out, dim=1) + mean_out = out.mean(dim=[0, 2, 3, 4]).cpu().numpy() + out = out.cpu().numpy() + +# %% [markdown] +# Before diving into the model, let's visualize the distribution of the pixel values in the whole dataset: + +# %% +sns.set() +plot_args = {"color": to_rgb("C0") + (0.5,), "edgecolor": "C0", "linewidth": 0.5, "width": 1.0} +plt.hist(imgs.view(-1).cpu().numpy(), bins=256, density=True, **plot_args) +plt.yscale("log") +plt.xticks([0, 64, 128, 192, 256]) +plt.show() +plt.close() + +# %% [markdown] +# As we would expect from the seen images, the pixel value 0 (black) is the dominant value, followed by a batch of values between 250 and 255. +# Note that we use a log scale on the y-axis due to the big imbalance in the dataset. +# Interestingly, the pixel values 64, 128 and 191 also stand out which is likely due to the quantization used during the creation of the dataset. 
+# For RGB images, we would also see two peaks around 0 and 255, +# but the values in between would be much more frequent than in MNIST +# (see Figure 1 in the [PixelCNN++](https://arxiv.org/pdf/1701.05517.pdf) for a visualization on CIFAR10). +# +# Next, we can visualize the distribution our model predicts (on average): + +# %% +plt.bar(np.arange(mean_out.shape[0]), mean_out, **plot_args) +plt.yscale("log") +plt.xticks([0, 64, 128, 192, 256]) +plt.show() +plt.close() + +# %% [markdown] +# This distribution is very close to the actual dataset distribution. +# This is in general a good sign, but we can see a slightly smoother histogram than above. +# +# Finally, to take a closer look at learned value relations, we can +# visualize the distribution for individual pixel predictions to get a +# better intuition. For this, we pick 4 random images and pixels, and +# visualize their distribution below: + +# %% +fig, ax = plt.subplots(2, 2, figsize=(10, 6)) +for i in range(4): + ax_sub = ax[i // 2][i % 2] + ax_sub.bar(np.arange(out.shape[1], dtype=np.int32), out[i + 4, :, 0, 14, 14], **plot_args) + ax_sub.set_yscale("log") + ax_sub.set_xticks([0, 64, 128, 192, 256]) +plt.show() +plt.close() + +# %% [markdown] +# Overall we see a very diverse set of distributions, with a usual peak +# for 0 and close to 1. However, the distributions in the first row show a +# potentially undesirable behavior. For instance, the value 242 has a +# 1000x lower likelihood than 243 although they are extremely close and +# can often not be distinguished. This shows that the model might not have +# generalized well over pixel values. The better solution to this problem +# is to use discrete logistic mixtures instead of a softmax distribution. +# A discrete logistic distribution can be imagined as discretized, binned +# Gaussians. Using a mixture of discrete logistics instead of a softmax +# introduces an inductive bias to the model to assign close-by values +# similar likelihoods.
# We can visualize a discrete logistic below:

# %%
mu = Tensor([128])
sigma = Tensor([2.0])


def discrete_logistic(x, mu, sigma):
    """Probability mass that a logistic distribution assigns to the unit bin around ``x``.

    Inputs:
        x - Tensor of bin centers (e.g. integer pixel values)
        mu - Location of the logistic distribution
        sigma - Scale of the logistic distribution
    Returns the difference of the logistic CDF (a sigmoid) evaluated at the
    upper edge ``x + 0.5`` and at the lower edge ``x - 0.5`` of each bin.
    """
    cdf_upper = torch.sigmoid((x + 0.5 - mu) / sigma)
    cdf_lower = torch.sigmoid((x - 0.5 - mu) / sigma)
    return cdf_upper - cdf_lower


x = torch.arange(256)
p = discrete_logistic(x, mu, sigma)

# Visualization
plt.figure(figsize=(6, 3))
plt.bar(x.numpy(), p.numpy(), **plot_args)
plt.xlim(96, 160)
plt.title("Discrete logistic distribution")
plt.xlabel("Pixel value")
plt.ylabel("Probability")
plt.show()
plt.close()

# %% [markdown]
# Instead of the softmax, the model would output mean and standard
# deviations for the $K$ logistics we use in the mixture. This is one of
# the improvements in autoregressive models that PixelCNN++ [3] has
# introduced compared to the original PixelCNN.

# %% [markdown]
# ## Conclusion
#
# In this tutorial, we have looked at autoregressive image modeling, and
# implemented the PixelCNN architecture. With the usage of masked
# convolutions, we are able to apply a convolutional network in which a
# pixel is only influenced by all its predecessors. Separating the masked
# convolution into a horizontal and vertical stack allowed us to remove
# the known blind spot on the right upper row of a pixel. In experiments,
# autoregressive models outperformed normalizing flows in terms of bits
# per dimension, but are much slower to sample from. Improvements, that we
# have not implemented ourselves here, are discrete logistic mixtures, a
# downsampling architecture, and changing the pixel order in a diagonal
# fashion (see PixelSNAIL). Overall, autoregressive models are another,
# strong family of generative models, which however are mostly used in
# sequence tasks because of their linear scaling in sampling time rather than
# quadratic as on images.

# %% [markdown]
# ## References
# [1] van den Oord, A., et al.
# "Pixel Recurrent Neural Networks."
# arXiv preprint arXiv:1601.06759 (2016).
+# [Link](https://arxiv.org/abs/1601.06759) +# +# [2] van den Oord, A., et al. +# "Conditional Image Generation with PixelCNN Decoders." +# In Advances in Neural Information Processing Systems 29, pp. +# 4790–4798 (2016). +# [Link](http://papers.nips.cc/paper/6527-conditional-image-generation-with-pixelcnn-decoders.pdf) +# +# [3] Salimans, Tim, et al. +# "PixelCNN++: Improving the PixelCNN with Discretized Logistic Mixture Likelihood and Other Modifications." +# arXiv preprint arXiv:1701.05517 (2017). +# [Link](https://arxiv.org/abs/1701.05517) diff --git a/_notebooks/course_UvA-DL/10-autoregressive-image-modeling/PixelCNN_GatedConv.svg b/_notebooks/course_UvA-DL/10-autoregressive-image-modeling/PixelCNN_GatedConv.svg new file mode 100644 index 0000000..2104663 --- /dev/null +++ b/_notebooks/course_UvA-DL/10-autoregressive-image-modeling/PixelCNN_GatedConv.svg @@ -0,0 +1,2195 @@ + + + + + + image/svg+xmldiff --git a/_notebooks/course_UvA-DL/10-autoregressive-image-modeling/autoregressive_image_modeling.svg b/_notebooks/course_UvA-DL/10-autoregressive-image-modeling/autoregressive_image_modeling.svg new file mode 100644 index 0000000..8584a8b --- /dev/null +++ b/_notebooks/course_UvA-DL/10-autoregressive-image-modeling/autoregressive_image_modeling.svg @@ -0,0 +1,961 @@ + + + + + + image/svg+xmldiff --git a/_notebooks/course_UvA-DL/10-autoregressive-image-modeling/masked_convolution.svg b/_notebooks/course_UvA-DL/10-autoregressive-image-modeling/masked_convolution.svg new file mode 100644 index 0000000..925dc48 --- /dev/null +++ b/_notebooks/course_UvA-DL/10-autoregressive-image-modeling/masked_convolution.svg @@ -0,0 +1,923 @@ + + + + + + image/svg+xmldiff --git a/_notebooks/course_UvA-DL/10-autoregressive-image-modeling/pixelcnn_blind_spot.svg b/_notebooks/course_UvA-DL/10-autoregressive-image-modeling/pixelcnn_blind_spot.svg new file mode 100644 index 0000000..18ade2f --- /dev/null +++ 
b/_notebooks/course_UvA-DL/10-autoregressive-image-modeling/pixelcnn_blind_spot.svg @@ -0,0 +1,1091 @@ + + + + + + image/svg+xmldiff --git a/_notebooks/course_UvA-DL/11-vision-transformer/.meta.yml b/_notebooks/course_UvA-DL/11-vision-transformer/.meta.yml new file mode 100644 index 0000000..171d877 --- /dev/null +++ b/_notebooks/course_UvA-DL/11-vision-transformer/.meta.yml @@ -0,0 +1,23 @@ +title: "Tutorial 11: Vision Transformers" +author: Phillip Lippe +created: 2021-08-21 +updated: 2023-03-14 +license: CC BY-SA +description: | + In this tutorial, we will take a closer look at a recent new trend: Transformers for Computer Vision. + Since [Alexey Dosovitskiy et al.](https://openreview.net/pdf?id=YicbFdNTTy) successfully applied a Transformer on a variety of image recognition benchmarks, there have been an incredible amount of follow-up works showing that CNNs might not be optimal architecture for Computer Vision anymore. + But how do Vision Transformers work exactly, and what benefits and drawbacks do they offer in contrast to CNNs? + We will answer these questions by implementing a Vision Transformer ourselves, and train it on the popular, small dataset CIFAR10. + We will compare these results to popular convolutional architectures such as Inception, ResNet and DenseNet. + This notebook is part of a lecture series on Deep Learning at the University of Amsterdam. + The full list of tutorials can be found at https://uvadlc-notebooks.rtfd.io. 
+tags: + - Image +requirements: + - torchvision + - matplotlib + - seaborn + - lightning>=2.0.0rc0 +accelerator: + - CPU + - GPU diff --git a/docs/_static/images/course_UvA-DL/11-vision-transformer.jpg b/_notebooks/course_UvA-DL/11-vision-transformer/.thumb.jpg similarity index 100% rename from docs/_static/images/course_UvA-DL/11-vision-transformer.jpg rename to _notebooks/course_UvA-DL/11-vision-transformer/.thumb.jpg diff --git a/_notebooks/course_UvA-DL/11-vision-transformer/Vision_Transformer.py b/_notebooks/course_UvA-DL/11-vision-transformer/Vision_Transformer.py new file mode 100644 index 0000000..9d8cef8 --- /dev/null +++ b/_notebooks/course_UvA-DL/11-vision-transformer/Vision_Transformer.py @@ -0,0 +1,530 @@ +# %% [markdown] +#
+# Let's start with importing our standard set of libraries. + +# %% +import os +import urllib.request +from urllib.error import HTTPError + +import lightning as L +import matplotlib +import matplotlib.pyplot as plt +import matplotlib_inline.backend_inline +import seaborn as sns +import torch +import torch.nn as nn +import torch.nn.functional as F +import torch.optim as optim +import torch.utils.data as data +import torchvision +from lightning.pytorch.callbacks import LearningRateMonitor, ModelCheckpoint +from torchvision import transforms +from torchvision.datasets import CIFAR10 + +plt.set_cmap("cividis") +# %matplotlib inline +matplotlib_inline.backend_inline.set_matplotlib_formats("svg", "pdf") # For export +matplotlib.rcParams["lines.linewidth"] = 2.0 +sns.reset_orig() + +# %load_ext tensorboard + +# Path to the folder where the datasets are/should be downloaded (e.g. CIFAR10) +DATASET_PATH = os.environ.get("PATH_DATASETS", "data/") +# Path to the folder where the pretrained models are saved +CHECKPOINT_PATH = os.environ.get("PATH_CHECKPOINT", "saved_models/VisionTransformers/") + +# Setting the seed +L.seed_everything(42) + +# Ensure that all operations are deterministic on GPU (if used) for reproducibility +torch.backends.cudnn.deterministic = True +torch.backends.cudnn.benchmark = False + +device = torch.device("cuda:0") if torch.cuda.is_available() else torch.device("cpu") +print("Device:", device) + +# %% [markdown] +# We provide a pre-trained Vision Transformer which we download in the next cell. +# However, Vision Transformers can be relatively quickly trained on CIFAR10 with an overall training time of less than an hour on an NVIDIA TitanRTX. +# Feel free to experiment with training your own Transformer once you went through the whole notebook. 
+ +# %% +# Github URL where saved models are stored for this tutorial +base_url = "https://raw.githubusercontent.com/phlippe/saved_models/main/" +# Files to download +pretrained_files = [ + "tutorial15/ViT.ckpt", + "tutorial15/tensorboards/ViT/events.out.tfevents.ViT", + "tutorial5/tensorboards/ResNet/events.out.tfevents.resnet", +] +# Create checkpoint path if it doesn't exist yet +os.makedirs(CHECKPOINT_PATH, exist_ok=True) + +# For each file, check whether it already exists. If not, try downloading it. +for file_name in pretrained_files: + file_path = os.path.join(CHECKPOINT_PATH, file_name.split("/", 1)[1]) + if "/" in file_name.split("/", 1)[1]: + os.makedirs(file_path.rsplit("/", 1)[0], exist_ok=True) + if not os.path.isfile(file_path): + file_url = base_url + file_name + print("Downloading %s..." % file_url) + try: + urllib.request.urlretrieve(file_url, file_path) + except HTTPError as e: + print( + "Something went wrong. Please try to download the file from the GDrive folder, or contact the author with the full output including the following error:\n", + e, + ) + +# %% [markdown] +# We load the CIFAR10 dataset below. +# We use the same setup of the datasets and data augmentations as for the CNNs in Tutorial 5 to keep a fair comparison. +# The constants in the `transforms.Normalize` correspond to the values +# that scale and shift the data to a zero mean and standard deviation of +# one. + +# %% +test_transform = transforms.Compose( + [ + transforms.ToTensor(), + transforms.Normalize([0.49139968, 0.48215841, 0.44653091], [0.24703223, 0.24348513, 0.26158784]), + ] +) +# For training, we add some augmentation. Networks are too powerful and would overfit. 
+train_transform = transforms.Compose( + [ + transforms.RandomHorizontalFlip(), + transforms.RandomResizedCrop((32, 32), scale=(0.8, 1.0), ratio=(0.9, 1.1)), + transforms.ToTensor(), + transforms.Normalize([0.49139968, 0.48215841, 0.44653091], [0.24703223, 0.24348513, 0.26158784]), + ] +) +# Loading the training dataset. We need to split it into a training and validation part +# We need to do a little trick because the validation set should not use the augmentation. +train_dataset = CIFAR10(root=DATASET_PATH, train=True, transform=train_transform, download=True) +val_dataset = CIFAR10(root=DATASET_PATH, train=True, transform=test_transform, download=True) +L.seed_everything(42) +train_set, _ = torch.utils.data.random_split(train_dataset, [45000, 5000]) +L.seed_everything(42) +_, val_set = torch.utils.data.random_split(val_dataset, [45000, 5000]) + +# Loading the test set +test_set = CIFAR10(root=DATASET_PATH, train=False, transform=test_transform, download=True) + +# We define a set of data loaders that we can use for various purposes later. 
+train_loader = data.DataLoader(train_set, batch_size=128, shuffle=True, drop_last=True, pin_memory=True, num_workers=4) +val_loader = data.DataLoader(val_set, batch_size=128, shuffle=False, drop_last=False, num_workers=4) +test_loader = data.DataLoader(test_set, batch_size=128, shuffle=False, drop_last=False, num_workers=4) + +# Visualize some examples +NUM_IMAGES = 4 +CIFAR_images = torch.stack([val_set[idx][0] for idx in range(NUM_IMAGES)], dim=0) +img_grid = torchvision.utils.make_grid(CIFAR_images, nrow=4, normalize=True, pad_value=0.9) +img_grid = img_grid.permute(1, 2, 0) + +plt.figure(figsize=(8, 8)) +plt.title("Image examples of the CIFAR10 dataset") +plt.imshow(img_grid) +plt.axis("off") +plt.show() +plt.close() + +# %% [markdown] +# ## Transformers for image classification +# +# Transformers have been originally proposed to process sets since it is a permutation-equivariant architecture, i.e., producing the same output permuted if the input is permuted. +# To apply Transformers to sequences, we have simply added a positional encoding to the input feature vectors, and the model learned by itself what to do with it. +# So, why not do the same thing on images? +# This is exactly what [Alexey Dosovitskiy et al. ](https://openreview.net/pdf?id=YicbFdNTTy) proposed in their paper "An Image is Worth 16x16 Words: Transformers for Image Recognition at Scale". +# Specifically, the Vision Transformer is a model for image classification that views images as sequences of smaller patches. +# As a preprocessing step, we split an image of, for example, $48\times 48$ pixels into 9 $16\times 16$ patches. +# Each of those patches is considered to be a "word"/"token", and projected to a feature space. +# With adding positional encodings and a token for classification on top, we can apply a Transformer as usual to this sequence and start training it for our task. 
+# A nice GIF visualization of the architecture is shown below (figure credit - [Phil Wang](https://github.com/lucidrains/vit-pytorch/blob/main/images/vit.gif)): +# +#
#
# We will walk step by step through the Vision Transformer, and implement all parts by ourselves.
# First, let's implement the image preprocessing: an image of size $N\times N$ has to be split into $(N/M)^2$ patches of size $M\times M$.
# These represent the input words to the Transformer.


# %%
def img_to_patch(x, patch_size, flatten_channels=True):
    """
    Split a batch of images into a sequence of square patches.

    Inputs:
        x - Tensor representing the image of shape [B, C, H, W]
        patch_size - Number of pixels per dimension of the patches (integer)
        flatten_channels - If True, each patch is returned as a flat feature vector
                           of size C*patch_size*patch_size; otherwise it keeps its
                           [C, patch_size, patch_size] image layout.
    """
    batch, channels, height, width = x.shape
    rows, cols = height // patch_size, width // patch_size
    # Cut both spatial axes into (number of patches, pixels inside a patch)
    patches = x.reshape(batch, channels, rows, patch_size, cols, patch_size)
    # Bring the two patch-grid axes to the front and merge them into one sequence axis
    patches = patches.permute(0, 2, 4, 1, 3, 5).flatten(1, 2)  # [B, H'*W', C, p_H, p_W]
    if not flatten_channels:
        return patches
    return patches.flatten(2, 4)  # [B, H'*W', C*p_H*p_W]


# %% [markdown]
# Let's take a look at how that works for our CIFAR examples above.
# For our images of size $32\times 32$, we choose a patch size of 4.
# Hence, we obtain sequences of 64 patches of size $4\times 4$.
# We visualize them below:

# %%
img_patches = img_to_patch(CIFAR_images, patch_size=4, flatten_channels=False)

fig, ax = plt.subplots(CIFAR_images.shape[0], 1, figsize=(14, 3))
fig.suptitle("Images as input sequences of patches")
for i in range(CIFAR_images.shape[0]):
    img_grid = torchvision.utils.make_grid(img_patches[i], nrow=64, normalize=True, pad_value=0.9)
    img_grid = img_grid.permute(1, 2, 0)
    ax[i].imshow(img_grid)
    ax[i].axis("off")
plt.show()
plt.close()

# %% [markdown]
# Compared to the original images, it is much harder to recognize the objects from those patch lists now.
# Still, this is the input we provide to the Transformer for classifying the images.
# The model has to learn itself how it has to combine the patches to recognize the objects.
+# The inductive bias in CNNs that an image is a grid of pixels, is lost in this input format. +# +# After we have looked at the preprocessing, we can now start building the Transformer model. +# Since we have discussed the fundamentals of Multi-Head Attention in [Tutorial 6](https://uvadlc-notebooks.readthedocs.io/en/latest/tutorial_notebooks/tutorial6/Transformers_and_MHAttention.html), we will use the PyTorch module `nn.MultiheadAttention` ([docs](https://pytorch.org/docs/stable/generated/torch.nn.MultiheadAttention.html?highlight=multihead#torch.nn.MultiheadAttention)) here. +# Further, we use the Pre-Layer Normalization version of the Transformer blocks proposed by [Ruibin Xiong et al.](http://proceedings.mlr.press/v119/xiong20b/xiong20b.pdf) in 2020. +# The idea is to apply Layer Normalization not in between residual blocks, but instead as a first layer in the residual blocks. +# This reorganization of the layers supports better gradient flow and removes the necessity of a warm-up stage. +# A visualization of the difference between the standard Post-LN and the Pre-LN version is shown below. +# +#
#
# The implementation of the Pre-LN attention block looks as follows:


# %%
class AttentionBlock(nn.Module):
    """Pre-LN Transformer encoder block: self-attention followed by a feed-forward network.

    Both sub-layers are wrapped in a residual connection, and Layer Normalization
    is applied to the input of each sub-layer rather than to its output.
    """

    def __init__(self, embed_dim, hidden_dim, num_heads, dropout=0.0):
        """
        Inputs:
            embed_dim - Dimensionality of input and attention feature vectors
            hidden_dim - Dimensionality of hidden layer in feed-forward network
                         (usually 2-4x larger than embed_dim)
            num_heads - Number of heads to use in the Multi-Head Attention block
            dropout - Amount of dropout to apply in the feed-forward network
        """
        super().__init__()

        # Attribute names and creation order are part of the checkpoint format
        # (state-dict keys) and of the seeded initialization, so they stay fixed.
        self.layer_norm_1 = nn.LayerNorm(embed_dim)
        self.attn = nn.MultiheadAttention(embed_dim, num_heads)
        self.layer_norm_2 = nn.LayerNorm(embed_dim)
        feed_forward = [
            nn.Linear(embed_dim, hidden_dim),
            nn.GELU(),
            nn.Dropout(dropout),
            nn.Linear(hidden_dim, embed_dim),
            nn.Dropout(dropout),
        ]
        self.linear = nn.Sequential(*feed_forward)

    def forward(self, x):
        # `x` is sequence-first, since `nn.MultiheadAttention` is created with its
        # default `batch_first=False`.
        normed = self.layer_norm_1(x)
        # Self-attention: queries, keys and values are all the normalized input;
        # the returned attention weights are not needed.
        attended, _ = self.attn(normed, normed, normed)
        x = x + attended
        return x + self.linear(self.layer_norm_2(x))


# %% [markdown]
# Now we have all modules ready to build our own Vision Transformer.
# Besides the Transformer encoder, we need the following modules:
#
# * A **linear projection** layer that maps the input patches to a feature vector of larger size.
# It is implemented by a simple linear layer that takes each $M\times M$ patch independently as input.
# * A **classification token** that is added to the input sequence.
# We will use the output feature vector of the classification token (CLS token in short) for determining the classification prediction.
# * Learnable **positional encodings** that are added to the tokens before being processed by the Transformer.
# Those are needed to learn position-dependent information, and convert the set to a sequence.
# Since we usually work with a fixed resolution, we can learn the positional encodings instead of having the pattern of sine and cosine functions.
# * A **MLP head** that takes the output feature vector of the CLS token, and maps it to a classification prediction.
# This is usually implemented by a small feed-forward network or even a single linear layer.
#
# With those components in mind, let's implement the full Vision Transformer below:


# %%
class VisionTransformer(nn.Module):
    """Vision Transformer: patch embedding, CLS token, positional encoding, encoder and MLP head."""

    def __init__(
        self,
        embed_dim,
        hidden_dim,
        num_channels,
        num_heads,
        num_layers,
        num_classes,
        patch_size,
        num_patches,
        dropout=0.0,
    ):
        """
        Inputs:
            embed_dim - Dimensionality of the input feature vectors to the Transformer
            hidden_dim - Dimensionality of the hidden layer in the feed-forward networks
                         within the Transformer
            num_channels - Number of channels of the input (3 for RGB)
            num_heads - Number of heads to use in the Multi-Head Attention block
            num_layers - Number of layers to use in the Transformer
            num_classes - Number of classes to predict
            patch_size - Number of pixels that the patches have per dimension
            num_patches - Maximum number of patches an image can have
            dropout - Amount of dropout to apply in the feed-forward network and
                      on the input encoding
        """
        super().__init__()

        self.patch_size = patch_size

        # Layers/Networks (attribute names and creation order are kept fixed so that
        # checkpoints and seeded initialization stay compatible)
        patch_dim = num_channels * (patch_size**2)
        self.input_layer = nn.Linear(patch_dim, embed_dim)
        encoder_blocks = [
            AttentionBlock(embed_dim, hidden_dim, num_heads, dropout=dropout) for _ in range(num_layers)
        ]
        self.transformer = nn.Sequential(*encoder_blocks)
        self.mlp_head = nn.Sequential(nn.LayerNorm(embed_dim), nn.Linear(embed_dim, num_classes))
        self.dropout = nn.Dropout(dropout)

        # Parameters/Embeddings
        self.cls_token = nn.Parameter(torch.randn(1, 1, embed_dim))
        self.pos_embedding = nn.Parameter(torch.randn(1, 1 + num_patches, embed_dim))

    def forward(self, x):
        # Preprocess input: image -> sequence of flattened patches -> embeddings
        patches = img_to_patch(x, self.patch_size)
        batch_size, num_tokens, _ = patches.shape
        tokens = self.input_layer(patches)

        # Prepend the CLS token and add the positional encoding of the used positions
        cls_tokens = self.cls_token.repeat(batch_size, 1, 1)
        tokens = torch.cat([cls_tokens, tokens], dim=1)
        tokens = tokens + self.pos_embedding[:, : num_tokens + 1]

        # Apply Transformer (the attention blocks expect sequence-first input)
        tokens = self.dropout(tokens)
        encoded = self.transformer(tokens.transpose(0, 1))

        # Perform classification prediction from the CLS token, which sits at position 0
        return self.mlp_head(encoded[0])


# %% [markdown]
# Finally, we can put everything into a PyTorch Lightning Module as usual.
# We use `torch.optim.AdamW` as the optimizer, which is Adam with a corrected weight decay implementation.
# Since we use the Pre-LN Transformer version, we do not need to use a learning rate warmup stage anymore.
# Instead, we use the same learning rate scheduler as the CNNs in our previous tutorial on image classification.


# %%
class ViT(L.LightningModule):
    """Lightning wrapper that trains a `VisionTransformer` with cross-entropy loss."""

    def __init__(self, model_kwargs, lr):
        """
        Inputs:
            model_kwargs - Dictionary of keyword arguments for `VisionTransformer`
            lr - Learning rate of the AdamW optimizer
        """
        super().__init__()
        self.save_hyperparameters()
        self.model = VisionTransformer(**model_kwargs)
        # One batch of training images serves as the example input of the module
        self.example_input_array = next(iter(train_loader))[0]

    def forward(self, x):
        return self.model(x)

    def configure_optimizers(self):
        # AdamW with a step-wise decay of the learning rate by 0.1 at epochs 100 and 150
        optimizer = optim.AdamW(self.parameters(), lr=self.hparams.lr)
        scheduler = optim.lr_scheduler.MultiStepLR(optimizer, milestones=[100, 150], gamma=0.1)
        return [optimizer], [scheduler]

    def _calculate_loss(self, batch, mode="train"):
        # Shared by all three steps; `mode` only selects the prefix of the logged metrics
        images, targets = batch
        logits = self.model(images)
        loss = F.cross_entropy(logits, targets)
        accuracy = (logits.argmax(dim=-1) == targets).float().mean()

        self.log("%s_loss" % mode, loss)
        self.log("%s_acc" % mode, accuracy)
        return loss

    def training_step(self, batch, batch_idx):
        return self._calculate_loss(batch, mode="train")

    def validation_step(self, batch, batch_idx):
        self._calculate_loss(batch, mode="val")

    def test_step(self, batch, batch_idx):
        self._calculate_loss(batch, mode="test")


# %% [markdown]
# ## Experiments
#
# Commonly, Vision Transformers are applied to large-scale image classification benchmarks such as ImageNet to leverage their full potential.
# However, here we take a step back and ask: can Vision Transformer also succeed on classical, small benchmarks such as CIFAR10?
# To find this out, we train a Vision Transformer from scratch on the CIFAR10 dataset.
# Let's first create a training function for our PyTorch Lightning module
# which also loads the pre-trained model if you have downloaded it above.


# %%
def train_model(**kwargs):
    """Train a ViT, or load the pretrained one, and evaluate it.

    If ``ViT.ckpt`` exists in ``CHECKPOINT_PATH`` it is loaded and training is
    skipped. Otherwise a model is built from ``kwargs``, trained, and the
    checkpoint with the highest ``val_acc`` is loaded for evaluation.

    Returns the model and a dictionary ``{"test": ..., "val": ...}`` with the
    accuracy on the test and validation set.
    """
    trainer = L.Trainer(
        default_root_dir=os.path.join(CHECKPOINT_PATH, "ViT"),
        accelerator="auto",
        devices=1,
        max_epochs=180,
        callbacks=[
            ModelCheckpoint(save_weights_only=True, mode="max", monitor="val_acc"),
            LearningRateMonitor("epoch"),
        ],
    )
    trainer.logger._log_graph = True  # If True, we plot the computation graph in tensorboard
    trainer.logger._default_hp_metric = None  # Optional logging argument that we don't need

    pretrained_filename = os.path.join(CHECKPOINT_PATH, "ViT.ckpt")
    if not os.path.isfile(pretrained_filename):
        # No pretrained model available: train from scratch
        L.seed_everything(42)  # To be reproducible
        model = ViT(**kwargs)
        trainer.fit(model, train_loader, val_loader)
        # Continue with the best checkpoint found during training
        model = ViT.load_from_checkpoint(trainer.checkpoint_callback.best_model_path)
    else:
        print("Found pretrained model at %s, loading..." % pretrained_filename)
        # Automatically loads the model with the saved hyperparameters
        model = ViT.load_from_checkpoint(pretrained_filename)

    # Both runs go through `test_step`, hence the metric is called "test_acc" in both
    val_outputs = trainer.test(model, dataloaders=val_loader, verbose=False)
    test_outputs = trainer.test(model, dataloaders=test_loader, verbose=False)
    result = {"test": test_outputs[0]["test_acc"], "val": val_outputs[0]["test_acc"]}

    return model, result


# %% [markdown]
# Now, we can already start training our model.
# As seen in our implementation, we have a couple of hyperparameters that we have to choose.
+# When creating this notebook, we performed a small grid search over hyperparameters and listed the best hyperparameters in the cell below. +# Nevertheless, it is worth discussing the influence that each hyperparameter has, and what intuition we have for choosing its value. +# +# First, let's consider the patch size. +# The smaller we make the patches, the longer the input sequences to the Transformer become. +# While in general, this allows the Transformer to model more complex functions, it requires a longer computation time due to its quadratic memory usage in the attention layer. +# Furthermore, small patches can make the task more difficult since the Transformer has to learn which patches are close-by, and which are far away. +# We experimented with patch sizes of 2, 4 and 8, which give us input sequence lengths of 256, 64, and 16 respectively. +# We found 4 to result in the best performance, and hence pick it below. +# +# Next, the embedding and hidden dimensionality have a similar impact on a Transformer as on an MLP. +# The larger the sizes, the more complex the model becomes, and the longer it takes to train. +# In a Transformer, however, we have one more aspect to consider: the query-key sizes in the Multi-Head Attention layers. +# Each key has the feature dimensionality of `embed_dim/num_heads`. +# Considering that we have an input sequence length of 64, a minimum reasonable size for the key vectors is 16 or 32. +# Lower dimensionalities can restrain the possible attention maps too much. +# We observed that more than 8 heads are not necessary for the Transformer, and therefore pick an embedding dimensionality of `256`. +# The hidden dimensionality in the feed-forward networks is usually 2-4x larger than the embedding dimensionality, and thus we pick `512`. +# +# Finally, the learning rate for Transformers is usually relatively small, and in papers, a common value to use is 3e-5.
+# However, since we work with a smaller dataset and have a potentially easier task, we found that we are able to increase the learning rate to 3e-4 without any problems. +# To reduce overfitting, we use a dropout value of 0.2. +# Remember that we also use small image augmentations as regularization during training. +# +# Feel free to explore the hyperparameters yourself by changing the values below. +# In general, the Vision Transformer did not show to be too sensitive to +# the hyperparameter choices on the CIFAR10 dataset. + +# %% +model, results = train_model( + model_kwargs={ + "embed_dim": 256, + "hidden_dim": 512, + "num_heads": 8, + "num_layers": 6, + "patch_size": 4, + "num_channels": 3, + "num_patches": 64, + "num_classes": 10, + "dropout": 0.2, + }, + lr=3e-4, +) +print("ViT results", results) + +# %% [markdown] +# The Vision Transformer achieves a validation and test performance of about 75%. +# In comparison, almost all CNN architectures that we have tested in [Tutorial 5](https://uvadlc-notebooks.readthedocs.io/en/latest/tutorial_notebooks/tutorial5/Inception_ResNet_DenseNet.html) obtained a classification performance of around 90%. +# This is a considerable gap and shows that although Vision Transformers perform strongly on ImageNet with potential pretraining, they cannot come close to simple CNNs on CIFAR10 when being trained from scratch. +# The differences between a CNN and Transformer can be well observed in the training curves. +# Let's look at them in a tensorboard below: + +# %% +# Opens tensorboard in notebook. Adjust the path to your CHECKPOINT_PATH! +# %tensorboard --logdir ../saved_models/tutorial15/tensorboards/ + +# %% [markdown] +#
+ +# %% [markdown] +# The tensorboard compares the Vision Transformer to a ResNet trained on CIFAR10. +# When looking at the training losses, we see that the ResNet learns much more quickly in the first iterations. +# While the learning rate might have an influence on the initial learning speed, we see the same trend in the validation accuracy. +# The ResNet achieves the best performance of the Vision Transformer after just 5 epochs (2000 iterations). +# Further, while the ResNet training loss and validation accuracy have a similar trend, the validation performance of the Vision Transformer changes only marginally after 10k iterations while the training loss has almost just started going down. +# Yet, the Vision Transformer is also able to achieve close to 100% accuracy on the training set. +# +# All those observed phenomena can be explained with a concept that we have visited before: inductive biases. +# Convolutional Neural Networks have been designed with the assumption that images are translation invariant. +# Hence, we apply convolutions with shared filters across the image. +# Furthermore, a CNN architecture integrates the concept of distance in an image: two pixels that are close to each other are more related than two distant pixels. +# Local patterns are combined into larger patterns, until we perform our classification prediction. +# All those aspects are inductive biases of a CNN. +# In contrast, a Vision Transformer does not know which two pixels are close to each other, and which are far apart. +# It has to learn this information solely from the sparse learning signal of the classification task. +# This is a huge disadvantage when we have a small dataset since such information is crucial for generalizing to an unseen test dataset. +# With large enough datasets and/or good pre-training, a Transformer can learn this information without the need for inductive biases, and instead is more flexible than a CNN.
+# Especially long-distance relations between local patterns can be difficult to process in CNNs, while in Transformers, all patches have the distance of one. +# This is why Vision Transformers are so strong on large-scale datasets +# such as ImageNet, but underperform a lot when being applied to a small +# dataset such as CIFAR10. + +# %% [markdown] +# ## Conclusion +# +# In this tutorial, we have implemented our own Vision Transformer from scratch and applied it to the task of image classification. +# Vision Transformers work by splitting an image into a sequence of smaller patches, and using those as input to a standard Transformer encoder. +# While Vision Transformers achieved outstanding results on large-scale image recognition benchmarks such as ImageNet, they considerably underperform when being trained from scratch on small-scale datasets like CIFAR10. +# The reason is that in contrast to CNNs, Transformers do not have the inductive biases of translation invariance and the feature hierarchy (i.e. larger patterns consist of many smaller patterns). +# However, these aspects can be learned when enough data is provided, or the model has been pre-trained on other large-scale tasks. +# Considering that Vision Transformers were only proposed at the end of 2020, there is likely a lot more to come on Transformers for Computer Vision. +# +# +# ### References +# +# Dosovitskiy, Alexey, et al. +# "An image is worth 16x16 words: Transformers for image recognition at scale." +# International Conference on Learning Representations (2021). +# [link](https://arxiv.org/pdf/2010.11929.pdf) +# +# Chen, Xiangning, et al. +# "When Vision Transformers Outperform ResNets without Pretraining or Strong Data Augmentations." +# arXiv preprint arXiv:2106.01548 (2021). +# [link](https://arxiv.org/abs/2106.01548) +# +# Tolstikhin, Ilya, et al. +# "MLP-mixer: An all-MLP Architecture for Vision." +# arXiv preprint arXiv:2105.01601 (2021).
+# [link](https://arxiv.org/abs/2105.01601) +# +# Xiong, Ruibin, et al. +# "On layer normalization in the transformer architecture." +# International Conference on Machine Learning. +# PMLR, 2020. +# [link](http://proceedings.mlr.press/v119/xiong20b/xiong20b.pdf) diff --git a/_notebooks/course_UvA-DL/11-vision-transformer/pre_layer_norm.svg b/_notebooks/course_UvA-DL/11-vision-transformer/pre_layer_norm.svg new file mode 100644 index 0000000..cb7fbd4 --- /dev/null +++ b/_notebooks/course_UvA-DL/11-vision-transformer/pre_layer_norm.svg @@ -0,0 +1,810 @@ + + + + + + image/svg+xml + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/_notebooks/course_UvA-DL/11-vision-transformer/tensorboard_screenshot.png b/_notebooks/course_UvA-DL/11-vision-transformer/tensorboard_screenshot.png new file mode 100644 index 0000000..626e930 Binary files /dev/null and b/_notebooks/course_UvA-DL/11-vision-transformer/tensorboard_screenshot.png differ diff --git a/_notebooks/course_UvA-DL/11-vision-transformer/vit_architecture.png b/_notebooks/course_UvA-DL/11-vision-transformer/vit_architecture.png new file mode 100644 index 0000000..446aa44 Binary files /dev/null and b/_notebooks/course_UvA-DL/11-vision-transformer/vit_architecture.png differ diff --git a/_notebooks/course_UvA-DL/12-meta-learning/.meta.yml b/_notebooks/course_UvA-DL/12-meta-learning/.meta.yml new file mode 100644 index 0000000..18f459d --- /dev/null +++ b/_notebooks/course_UvA-DL/12-meta-learning/.meta.yml @@ -0,0 +1,29 @@ +title: "Tutorial 12: Meta-Learning - Learning to Learn" +author: Phillip Lippe +created: 2021-08-21 +updated: 2023-03-14 +license: CC 
BY-SA +tags: + - Few-shot-learning + - MAML + - ProtoNet +description: | + In this tutorial, we will discuss algorithms that learn models which can quickly adapt to new classes and/or tasks with few samples. + This area of machine learning is called _Meta-Learning_, which aims at "learning to learn". + Learning from very few examples is a natural task for humans. In contrast to current deep learning models, we need to see only a few examples of a police car or firetruck to recognize them in daily traffic. + This is a crucial ability since, in real-world applications, it is rarely the case that the data stays static and does not change over time. + For example, an object detection system for mobile phones trained on data from 2000 will have trouble detecting today's common mobile phones, and thus, needs to adapt to new data without excessive label effort. + The optimization techniques we have discussed so far struggle with this because they only aim at obtaining a good performance on a test set that had similar data. + However, what if the test set has classes that we do not have in the training set? + Or what if we want to test the model on a completely different task? + We will discuss and implement three common Meta-Learning algorithms for such situations. + This notebook is part of a lecture series on Deep Learning at the University of Amsterdam. + The full list of tutorials can be found at https://uvadlc-notebooks.rtfd.io.
+requirements: + - torchvision + - matplotlib + - seaborn + - lightning>=2.0.0rc0 +accelerator: + - CPU + - GPU diff --git a/docs/_static/images/course_UvA-DL/12-meta-learning.jpg b/_notebooks/course_UvA-DL/12-meta-learning/.thumb.jpg similarity index 100% rename from docs/_static/images/course_UvA-DL/12-meta-learning.jpg rename to _notebooks/course_UvA-DL/12-meta-learning/.thumb.jpg diff --git a/_notebooks/course_UvA-DL/12-meta-learning/MAML_algorithm.svg b/_notebooks/course_UvA-DL/12-meta-learning/MAML_algorithm.svg new file mode 100644 index 0000000..1812df4 --- /dev/null +++ b/_notebooks/course_UvA-DL/12-meta-learning/MAML_algorithm.svg @@ -0,0 +1,5318 @@ + + + + + + image/svg+xml + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + 
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/_notebooks/course_UvA-DL/12-meta-learning/MAML_figure.svg b/_notebooks/course_UvA-DL/12-meta-learning/MAML_figure.svg new file mode 100644 index 0000000..9e5838b --- /dev/null +++ b/_notebooks/course_UvA-DL/12-meta-learning/MAML_figure.svg @@ -0,0 +1,935 @@ + + + + + + image/svg+xmldiff --git a/_notebooks/course_UvA-DL/12-meta-learning/Meta_Learning.py b/_notebooks/course_UvA-DL/12-meta-learning/Meta_Learning.py new file mode 100644 index 0000000..5fdd66a --- /dev/null +++ b/_notebooks/course_UvA-DL/12-meta-learning/Meta_Learning.py @@ -0,0 +1,1332 @@ +# %% [markdown] +#
+# Meta-Learning offers solutions to these situations, and we will discuss three popular algorithms: __Prototypical Networks__ ([Snell et al., 2017](https://arxiv.org/pdf/1703.05175.pdf)), __Model-Agnostic Meta-Learning / MAML__ ([Finn et al., 2017](http://proceedings.mlr.press/v70/finn17a.html)), and __Proto-MAML__ ([Triantafillou et al., 2020](https://openreview.net/pdf?id=rkgAGAVKPr)). +# We will focus on the task of few-shot classification where the training and test set have distinct sets of classes. +# For instance, we would train the model on the binary classifications of cats-birds and flowers-bikes, but during test time, the model would need to learn from 4 examples each the difference between dogs and otters, two classes we have not seen during training (Figure credit - [Lilian Weng](https://lilianweng.github.io/lil-log/2018/11/30/meta-learning.html)). +# +#
+# +# A different setup, which is very common in Reinforcement Learning and recently Natural Language Processing, is to aim at few-shot learning of a completely new task. +# For example, a robot agent that has learned to run, jump and pick up boxes should quickly adapt to collecting and stacking boxes. +# In NLP, we can think of a model which was trained on sentiment classification, hate speech detection and sarcasm classification, and should adapt to classifying the emotion of a text. +# All methods we will discuss in this notebook can be easily applied to these settings since we only use a different definition of a 'task'. +# For few-shot classification, we consider a task to distinguish between $M$ novel classes. +# Here, we would not only have novel classes, but also a completely different dataset. +# +# First of all, let's start with importing our standard libraries. We will again be using PyTorch Lightning. + +# %% +import json +import os +import random +import urllib.request +from collections import defaultdict +from copy import deepcopy +from statistics import mean, stdev +from urllib.error import HTTPError + +import lightning as L +import matplotlib +import matplotlib.pyplot as plt +import matplotlib_inline.backend_inline +import numpy as np +import seaborn as sns +import torch +import torch.nn.functional as F +import torch.optim as optim +import torch.utils.data as data +import torchvision +from lightning.pytorch.callbacks import LearningRateMonitor, ModelCheckpoint +from PIL import Image +from torchvision import transforms +from torchvision.datasets import CIFAR100, SVHN +from tqdm.auto import tqdm + +plt.set_cmap("cividis") +# %matplotlib inline +matplotlib_inline.backend_inline.set_matplotlib_formats("svg", "pdf") # For export +matplotlib.rcParams["lines.linewidth"] = 2.0 +sns.reset_orig() + +# Import tensorboard +# %load_ext tensorboard + +# Path to the folder where the datasets are/should be downloaded (e.g.
CIFAR10) +DATASET_PATH = os.environ.get("PATH_DATASETS", "data/") +# Path to the folder where the pretrained models are saved +CHECKPOINT_PATH = os.environ.get("PATH_CHECKPOINT", "saved_models/MetaLearning/") + +# Setting the seed +L.seed_everything(42) + +# Ensure that all operations are deterministic on GPU (if used) for reproducibility +torch.backends.cudnn.deterministic = True +torch.backends.cudnn.benchmark = False + +device = torch.device("cuda:0") if torch.cuda.is_available() else torch.device("cpu") +print("Device:", device) + +# %% [markdown] +# Training the models in this notebook can take between 2 and 8 hours, and the evaluation time of some algorithms is in the span of couples of minutes. +# Hence, we download pre-trained models and results below. + +# %% +# Github URL where saved models are stored for this tutorial +base_url = "https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial16/" +# Files to download +pretrained_files = [ + "ProtoNet.ckpt", + "ProtoMAML.ckpt", + "tensorboards/ProtoNet/events.out.tfevents.ProtoNet", + "tensorboards/ProtoMAML/events.out.tfevents.ProtoMAML", + "protomaml_fewshot.json", + "protomaml_svhn_fewshot.json", +] +# Create checkpoint path if it doesn't exist yet +os.makedirs(CHECKPOINT_PATH, exist_ok=True) + +# For each file, check whether it already exists. If not, try downloading it. +for file_name in pretrained_files: + file_path = os.path.join(CHECKPOINT_PATH, file_name) + if "/" in file_name: + os.makedirs(file_path.rsplit("/", 1)[0], exist_ok=True) + if not os.path.isfile(file_path): + file_url = base_url + file_name + print("Downloading %s..." % file_url) + try: + urllib.request.urlretrieve(file_url, file_path) + except HTTPError as e: + print( + "Something went wrong. 
Please try to download the file from the GDrive folder, or contact the author with the full output including the following error:\n", + e, + ) + +# %% [markdown] +# ## Few-shot classification +# +# We start our implementation by discussing the dataset setup. +# In this notebook, we will use CIFAR100 which we have already seen in Tutorial 6. +# CIFAR100 has 100 classes each with 600 images of size $32\times 32$ pixels. +# Instead of splitting the training, validation and test set over examples, we will split them over classes: we will use 80 classes for training, and 10 for validation and 10 for testing. +# Our overall goal is to obtain a model that can distinguish between the 10 test classes with seeing very little examples. +# First, let's load the dataset and visualize some examples. + +# %% +# Loading CIFAR100 dataset +cifar_train_set = CIFAR100(root=DATASET_PATH, train=True, download=True, transform=transforms.ToTensor()) +cifar_test_set = CIFAR100(root=DATASET_PATH, train=False, download=True, transform=transforms.ToTensor()) + +# %% +# Visualize some examples +NUM_IMAGES = 12 +cifar_images = [cifar_train_set[np.random.randint(len(cifar_train_set))][0] for idx in range(NUM_IMAGES)] +cifar_images = torch.stack(cifar_images, dim=0) +img_grid = torchvision.utils.make_grid(cifar_images, nrow=6, normalize=True, pad_value=0.9) +img_grid = img_grid.permute(1, 2, 0) + +plt.figure(figsize=(8, 8)) +plt.title("Image examples of the CIFAR100 dataset") +plt.imshow(img_grid) +plt.axis("off") +plt.show() +plt.close() + +# %% [markdown] +# ### Data preprocessing +# +# Next, we need to prepare the dataset in the training, validation and test split as mentioned before. +# The torchvision package gives us the training and test set as two separate dataset objects. +# The next code cells will merge the original training and test set, and then create the new train-val-test split. 
class ImageDataset(data.Dataset):
    """Minimal dataset that pairs an image array with a tensor of labels."""

    def __init__(self, imgs, targets, img_transform=None):
        """
        Inputs:
            imgs - Numpy array of shape [N,32,32,3] containing all images.
            targets - PyTorch array of shape [N] containing all labels.
            img_transform - A torchvision transformation that should be applied
                            to the images before returning. If none, no transformation
                            is applied.
        """
        super().__init__()
        self.imgs = imgs
        self.targets = targets
        self.img_transform = img_transform

    def __len__(self):
        """Number of images, i.e. the size of the first axis of `imgs`."""
        return self.imgs.shape[0]

    def __getitem__(self, idx):
        """Return the (optionally transformed) PIL image and the label stored at `idx`."""
        raw_img = self.imgs[idx]
        target = self.targets[idx]
        # Transformations operate on PIL images, so convert the array first
        pil_img = Image.fromarray(raw_img)

        if self.img_transform is None:
            return pil_img, target
        return self.img_transform(pil_img), target
def dataset_from_labels(imgs, targets, class_set, **kwargs):
    """Build an `ImageDataset` restricted to the examples whose label is in `class_set`.

    Inputs:
        imgs - Array of images, indexed along its first axis.
        targets - Tensor holding the label of every image.
        class_set - Tensor of the class labels that should be kept.
        **kwargs - Extra keyword arguments forwarded to `ImageDataset`.
    """
    # Compare every label against every class; entry (i, j) is True when
    # example i carries class j.
    label_matches = targets[:, None] == class_set[None, :]
    # An example is kept as soon as it matches any of the requested classes
    keep = label_matches.any(dim=-1)
    kept_imgs = imgs[keep]
    kept_targets = targets[keep]
    return ImageDataset(imgs=kept_imgs, targets=kept_targets, **kwargs)
+ +# %% +DATA_MEANS = (cifar_train_set.data / 255.0).mean(axis=(0, 1, 2)) +DATA_STD = (cifar_train_set.data / 255.0).std(axis=(0, 1, 2)) + +test_transform = transforms.Compose([transforms.ToTensor(), transforms.Normalize(DATA_MEANS, DATA_STD)]) +# For training, we add some augmentation. +train_transform = transforms.Compose( + [ + transforms.RandomHorizontalFlip(), + transforms.RandomResizedCrop((32, 32), scale=(0.8, 1.0), ratio=(0.9, 1.1)), + transforms.ToTensor(), + transforms.Normalize(DATA_MEANS, DATA_STD), + ] +) + +train_set = dataset_from_labels(cifar_all_images, cifar_all_targets, train_classes, img_transform=train_transform) +val_set = dataset_from_labels(cifar_all_images, cifar_all_targets, val_classes, img_transform=test_transform) +test_set = dataset_from_labels(cifar_all_images, cifar_all_targets, test_classes, img_transform=test_transform) + +# %% [markdown] +# ### Data sampling +# +# The strategy of how to use the available training data for learning few-shot adaptation is crucial in meta-learning. +# All three algorithms that we discuss here have a similar idea: simulate few-shot learning during training. +# Specifically, at each training step, we randomly select a small number of classes, and sample a small number of examples for each class. +# This represents our few-shot training batch, which we also refer to as **support set**. +# Additionally, we sample a second set of examples from the same classes, and refer to this batch as **query set**. +# Our training objective is to classify the query set correctly from seeing the support set and its corresponding labels. +# The main difference between our three methods (ProtoNet, MAML, and Proto-MAML) is in how they use the support set to adapt to the training classes. +# +# This subsection summarizes the code that is needed to create such training batches. 
class FewShotBatchSampler:
    """Batch sampler that yields lists of dataset indices forming N-way K-shot batches."""

    def __init__(self, dataset_targets, N_way, K_shot, include_query=False, shuffle=True, shuffle_once=False):
        """
        Inputs:
            dataset_targets - PyTorch tensor of the labels of the data elements.
            N_way - Number of classes to sample per batch.
            K_shot - Number of examples to sample per class in the batch.
            include_query - If True, returns batch of size N_way*K_shot*2, which
                            can be split into support and query set. Simplifies
                            the implementation of sampling the same classes but
                            distinct examples for support and query set.
            shuffle - If True, examples and classes are newly shuffled in each
                      iteration (for training)
            shuffle_once - If True, examples and classes are shuffled once in
                           the beginning, but kept constant across iterations
                           (for validation)
        """
        super().__init__()
        self.dataset_targets = dataset_targets
        self.N_way = N_way
        # With a query set, each class contributes K support plus K query examples
        self.K_shot = K_shot * 2 if include_query else K_shot
        self.shuffle = shuffle
        self.include_query = include_query
        self.batch_size = self.N_way * self.K_shot  # Number of overall images per batch

        # Group the example indices by class and count how many K-shot
        # batches every class can provide.
        self.classes = torch.unique(self.dataset_targets).tolist()
        self.num_classes = len(self.classes)
        self.indices_per_class = {}
        self.batches_per_class = {}
        for cls in self.classes:
            cls_indices = torch.where(self.dataset_targets == cls)[0]
            self.indices_per_class[cls] = cls_indices
            self.batches_per_class[cls] = cls_indices.shape[0] // self.K_shot

        # Every class appears in the class list once per K-shot batch it can
        # provide; consecutive groups of N entries form the batches.
        self.iterations = sum(self.batches_per_class.values()) // self.N_way
        self.class_list = []
        for cls in self.classes:
            self.class_list.extend([cls] * self.batches_per_class[cls])

        if shuffle_once or self.shuffle:
            self.shuffle_data()
        else:
            # For testing, we iterate over classes instead of shuffling them:
            # the p-th occurrence of the i-th class gets key i + p * num_classes,
            # so sorting by key interleaves the classes round-robin.
            sort_keys = []
            for pos, cls in enumerate(self.classes):
                for rep in range(self.batches_per_class[cls]):
                    sort_keys.append(pos + rep * self.num_classes)
            order = np.argsort(sort_keys)
            self.class_list = np.array(self.class_list)[order].tolist()

    def shuffle_data(self):
        """Randomly permute the examples of every class and the class list."""
        for cls in self.classes:
            cls_indices = self.indices_per_class[cls]
            order = torch.randperm(cls_indices.shape[0])
            self.indices_per_class[cls] = cls_indices[order]
        # Note that this way of shuffling the class list does not prevent the
        # same class from being chosen twice in a batch. However, for training
        # and validation, this is not a problem.
        random.shuffle(self.class_list)

    def __iter__(self):
        """Yield one list of dataset indices per few-shot batch."""
        if self.shuffle:
            self.shuffle_data()

        # Position of the next unused example of each class
        consumed = defaultdict(int)
        for batch_no in range(self.iterations):
            first = batch_no * self.N_way
            batch_classes = self.class_list[first : first + self.N_way]  # The N classes of this batch
            batch_indices = []
            for cls in batch_classes:  # Take the next K examples of every selected class
                begin = consumed[cls]
                batch_indices.extend(self.indices_per_class[cls][begin : begin + self.K_shot])
                consumed[cls] = begin + self.K_shot
            if self.include_query:
                # Even positions first, odd positions second, so that the batch
                # can be split in the middle into support and query set.
                batch_indices = batch_indices[::2] + batch_indices[1::2]
            yield batch_indices

    def __len__(self):
        """Number of batches produced per iteration over the sampler."""
        return self.iterations
def split_batch(imgs, targets):
    """Split a sampled batch into its support and query part.

    Both tensors are cut into two chunks along the first dimension; the first
    chunk is the support set and the second chunk the query set.

    Returns:
        Tuple (support_imgs, query_imgs, support_targets, query_targets).
    """
    halves = []
    for tensor in (imgs, targets):
        support_part, query_part = tensor.chunk(2, dim=0)
        halves.append((support_part, query_part))
    (support_imgs, query_imgs), (support_targets, query_targets) = halves
    return support_imgs, query_imgs, support_targets, query_targets
# %%
imgs, targets = next(iter(val_data_loader))  # We use the validation set since it does not apply augmentations
support_imgs, query_imgs, _, _ = split_batch(imgs, targets)
# One row per class; channels are moved last so that matplotlib can display the grid
support_grid = torchvision.utils.make_grid(support_imgs, nrow=K_SHOT, normalize=True, pad_value=0.9).permute(1, 2, 0)
query_grid = torchvision.utils.make_grid(query_imgs, nrow=K_SHOT, normalize=True, pad_value=0.9).permute(1, 2, 0)

fig, ax = plt.subplots(1, 2, figsize=(8, 5))
for panel, grid, title in zip(ax, (support_grid, query_grid), ("Support set", "Query set")):
    panel.imshow(grid)
    panel.set_title(title)
    panel.axis("off")
fig.suptitle("Few Shot Batch", weight="bold")
fig.show()
plt.close(fig)

# %% [markdown]
# As we can see, the support and query set have the same five classes, but different examples.
# The models will be tasked to classify the examples in the query set by learning from the support set and its labels.
# With the data sampling in place, we can now start to implement our first meta-learning model: Prototypical Networks.

# %% [markdown]
# ## Prototypical Networks
#
#
+ +# %% [markdown] +# The Prototypical Network, or ProtoNet for short, is a metric-based meta-learning algorithm which operates similar to a nearest neighbor classification. +# Metric-based meta-learning methods classify a new example $\mathbf{x}$ based on some distance function $d_{\varphi}$ between $x$ and all elements in the support set. +# ProtoNets implements this idea with the concept of prototypes in a learned feature space. +# First, ProtoNet uses an embedding function $f_{\theta}$ to encode each input in the support set into a $L$-dimensional feature vector. +# Next, for each class $c$, we collect the feature vectors of all examples with label $c$, and average their feature vectors. +# Formally, we can define this as: +# +# $$\mathbf{v}_c=\frac{1}{|S_c|}\sum_{(\mathbf{x}_i,y_i)\in S_c}f_{\theta}(\mathbf{x}_i)$$ +# +# where $S_c$ is the part of the support set $S$ for which $y_i=c$, and $\mathbf{v}_c$ represents the _prototype_ of class $c$. +# The prototype calculation is visualized below for a 2-dimensional feature space and 3 classes (Figure credit - [Snell et al.](https://arxiv.org/pdf/1703.05175.pdf)). +# The colored dots represent encoded support elements with color-corresponding class label, and the black dots next to the class label are the averaged prototypes. +# +#
+# +# Based on these prototypes, we want to classify a new example. +# Remember that since we want to learn the encoding function $f_{\theta}$, this classification must be differentiable and hence, we need to define a probability distribution across classes. +# For this, we will make use of the distance function $d_{\varphi}$: the closer a new example $\mathbf{x}$ is to a prototype $\mathbf{v}_c$, the higher the probability for $\mathbf{x}$ belonging to class $c$. +# Formally, we can simply use a softmax over the distances of $\mathbf{x}$ to all class prototypes: +# +# $$p(y=c\vert\mathbf{x})=\text{softmax}(-d_{\varphi}(f_{\theta}(\mathbf{x}), \mathbf{v}_c))=\frac{\exp\left(-d_{\varphi}(f_{\theta}(\mathbf{x}), \mathbf{v}_c)\right)}{\sum_{c'\in \mathcal{C}}\exp\left(-d_{\varphi}(f_{\theta}(\mathbf{x}), \mathbf{v}_{c'})\right)}$$ +# +# Note that the negative sign is necessary since we want to increase the probability for close-by vectors and have a low probability for distant vectors. +# We train the network $f_{\theta}$ based on the cross entropy error of the training query set examples. +# Thereby, the gradient flows through both the prototypes $\mathbf{v}_c$ and the query set encodings $f_{\theta}(\mathbf{x})$. +# For the distance function $d_{\varphi}$, we can choose any function as long as it is differentiable with respect to both of its inputs. +# The most common function, which we also use here, is the squared +# euclidean distance, but there have been several works on different +# distance functions as well. + +# %% [markdown] +# ### ProtoNet implementation + +# %% [markdown] +# Now that we know how a ProtoNet works in principle, let's look at how we can apply it to our specific problem of few-shot image classification, and implement it below. +# First, we need to define the encoder function $f_{\theta}$. 
# Since we work with CIFAR images, we can take a look back at Tutorial 5 where we compared common Computer Vision architectures, and choose one of the best performing ones.
# Here, we go with a DenseNet since it is in general more parameter efficient than ResNet.
# Luckily, we do not need to implement DenseNet ourselves again and can rely on torchvision's model package instead.
# We use common hyperparameters of 64 initial feature channels, add 32 per block, and use a bottleneck size of 64 (i.e. 2 times the growth rate).
# We use 4 stages of 6 layers each, which results in overall about 1 million parameters.
# Note that the torchvision package assumes that the last layer is used for classification and hence calls its output size `num_classes`.
# However, we can instead just use it as the feature space of ProtoNet, and choose an arbitrary dimensionality.
# We will use the same network for other algorithms in this notebook to ensure a fair comparison.


# %%
def get_convnet(output_size):
    """Create the DenseNet encoder shared by the algorithms in this notebook.

    output_size - Size of the final linear layer, i.e. the dimensionality of the feature space
    """
    densenet_config = {
        "growth_rate": 32,
        "block_config": (6, 6, 6, 6),
        "bn_size": 2,
        "num_init_features": 64,
        "num_classes": output_size,  # Output dimensionality
    }
    return torchvision.models.DenseNet(**densenet_config)


# %% [markdown]
# Next, we can look at implementing ProtoNet.
# We will define it as PyTorch Lightning module to use all functionalities of PyTorch Lightning.
# The first step during training is to encode all images in a batch with our network.
# Next, we calculate the class prototypes from the support set (function `calculate_prototypes`), and classify the query set examples according to the prototypes (function `classify_feats`).
# Keep in mind that we use the data sampling described before, such that the support and query set are stacked together in the batch.
# Thus, we use our previously defined function `split_batch` to split them apart.
# The full code can be found below.
# %%
class ProtoNet(L.LightningModule):
    """Prototypical Network: classifies query examples by their distance to class prototypes."""

    def __init__(self, proto_dim, lr):
        """Inputs.

        proto_dim - Dimensionality of prototype feature space
        lr - Learning rate of Adam optimizer
        """
        super().__init__()
        self.save_hyperparameters()
        self.model = get_convnet(output_size=self.hparams.proto_dim)

    def configure_optimizers(self):
        """Return an AdamW optimizer with a step-wise learning rate decay (x0.1 at epochs 140 and 180)."""
        optimizer = optim.AdamW(self.parameters(), lr=self.hparams.lr)
        scheduler = optim.lr_scheduler.MultiStepLR(optimizer, milestones=[140, 180], gamma=0.1)
        return [optimizer], [scheduler]

    @staticmethod
    def calculate_prototypes(features, targets):
        """Average the feature vectors of each class.

        features - shape [N, proto_dim], targets - shape [N]
        Returns the prototypes (one row per class) and the 'classes' tensor that tells
        which prototype belongs to which class.
        """
        classes, _ = torch.unique(targets).sort()  # Determine which classes we have
        prototypes = torch.stack(
            [features[torch.where(targets == c)[0]].mean(dim=0) for c in classes],  # Average class feature vectors
            dim=0,
        )
        return prototypes, classes

    def classify_feats(self, prototypes, classes, feats, targets):
        """Classify new examples with prototypes.

        Returns the log-probabilities over prototypes, the targets re-indexed to
        prototype positions, and the mean accuracy.
        """
        dist = torch.pow(prototypes[None, :] - feats[:, None], 2).sum(dim=2)  # Squared euclidean distance
        preds = F.log_softmax(-dist, dim=1)
        # Map every target to the row index of its class in 'classes'
        labels = (classes[None, :] == targets[:, None]).long().argmax(dim=-1)
        acc = (preds.argmax(dim=1) == labels).float().mean()
        return preds, labels, acc

    def calculate_loss(self, batch, mode):
        """Determine and log the loss and accuracy for a stacked support+query batch."""
        imgs, targets = batch
        features = self.model(imgs)  # Encode all images of support and query set
        support_feats, query_feats, support_targets, query_targets = split_batch(features, targets)
        prototypes, classes = ProtoNet.calculate_prototypes(support_feats, support_targets)
        preds, labels, acc = self.classify_feats(prototypes, classes, query_feats, query_targets)
        loss = F.cross_entropy(preds, labels)

        self.log(f"{mode}_loss", loss)
        self.log(f"{mode}_acc", acc)
        return loss

    def training_step(self, batch, batch_idx):
        return self.calculate_loss(batch, mode="train")

    def validation_step(self, batch, batch_idx):
        self.calculate_loss(batch, mode="val")


# %% [markdown]
# For validation, we use the same principle as training and sample support and query sets from the hold-out 10 classes.
# However, this gives us noisy scores depending on which query sets are chosen to which support sets.
# This is why we will use a different strategy during testing.
# For validation, our training strategy is sufficient since it is much
# faster than testing, and gives a good estimate of the training
# generalization as long as we keep the support-query sets constant across
# validation iterations.

# %% [markdown]
# ### Training
#
# After implementing the model, we can already start training it.
# We use our common PyTorch Lightning training function, and train the model for 200 epochs.
# The training function takes `model_class` as input argument, i.e. the
# PyTorch Lightning module class that should be trained, since we will
# reuse this function for other algorithms as well.


# %%
def train_model(model_class, train_loader, val_loader, **kwargs):
    """Train `model_class`, or load its pretrained checkpoint if one exists.

    model_class - PyTorch Lightning module class that should be trained
    train_loader - Data loader of the training episodes
    val_loader - Data loader of the validation episodes
    kwargs - Hyperparameters passed to the constructor of `model_class`
    Returns the model loaded from the pretrained or the best validation checkpoint.
    """
    trainer = L.Trainer(
        default_root_dir=os.path.join(CHECKPOINT_PATH, model_class.__name__),
        accelerator="auto",
        devices=1,
        max_epochs=200,
        callbacks=[
            ModelCheckpoint(save_weights_only=True, mode="max", monitor="val_acc"),
            LearningRateMonitor("epoch"),
        ],
        enable_progress_bar=False,
        # This function is reused for models that fine-tune with gradients inside
        # `validation_step` (e.g. ProtoMAML). Autograd cannot be re-enabled within
        # `torch.inference_mode()`, so evaluation must run under `torch.no_grad()` instead.
        inference_mode=False,
    )
    trainer.logger._default_hp_metric = None

    # Check whether pretrained model exists. If yes, load it and skip training
    pretrained_filename = os.path.join(CHECKPOINT_PATH, model_class.__name__ + ".ckpt")
    if os.path.isfile(pretrained_filename):
        print(f"Found pretrained model at {pretrained_filename}, loading...")
        # Automatically loads the model with the saved hyperparameters
        return model_class.load_from_checkpoint(pretrained_filename)

    L.seed_everything(42)  # To be reproducible
    model = model_class(**kwargs)
    trainer.fit(model, train_loader, val_loader)
    # Load best checkpoint after training
    return model_class.load_from_checkpoint(trainer.checkpoint_callback.best_model_path)


# %% [markdown]
# Below is the training call for our ProtoNet.
# We use a 64-dimensional feature space.
# Larger feature spaces showed to give noisier results since the squared euclidean distance becomes proportionally larger in expectation, and smaller feature spaces might not allow for enough flexibility.
# We recommend to load the pre-trained model here at first, but feel free
# to play around with the hyperparameters yourself.

# %%
protonet_model = train_model(
    ProtoNet, proto_dim=64, lr=2e-4, train_loader=train_data_loader, val_loader=val_data_loader
)

# %% [markdown]
# We can also take a closer look at the TensorBoard below.

# %%
# Opens tensorboard in notebook. Adjust the path to your CHECKPOINT_PATH if needed
# # %tensorboard --logdir ../saved_models/tutorial16/tensorboards/ProtoNet/

# %% [markdown]
#
#
# In contrast to standard supervised learning, we see that ProtoNet does not overfit as much as we would expect.
# The validation accuracy is of course lower than the average training, but the training loss does not stick close to zero.
# This is because no training batch is like any other, and we also mix new examples in the support set and query set.
# This gives us slightly different prototypes in every iteration, and makes it harder for the network to fully overfit.

# %% [markdown]
# ### Testing
#
# Our goal of meta-learning is to obtain a model that can quickly adapt to a new task, or in this case, new classes to distinguish between.
# To test this, we will use our trained ProtoNet and adapt it to the 10 test classes.
# Thereby, we pick $k$ examples per class from which we determine the prototypes, and test the classification accuracy on all other examples.
# This can be seen as using the $k$ examples per class as support set, and the rest of the dataset as a query set.
# We iterate through the dataset such that each example has been once included in a support set.
# The average performance over all support sets tells us how well we can expect ProtoNet to perform when seeing only $k$ examples per class.
# During training, we used $k=4$.
# In testing, we will experiment with $k=\{2,4,8,16,32\}$ to get a better sense of how $k$ influences the results.
# We would expect that we achieve higher accuracies the more examples we have in the support set, but we don't know how it scales.
# Hence, let's first implement a function that executes the testing procedure for a given $k$:


# %%
@torch.no_grad()
def test_proto_net(model, dataset, data_feats=None, k_shot=4):
    """Evaluate a ProtoNet in the k-shot setting.

    Inputs:
        model - Pretrained ProtoNet model
        dataset - The dataset on which the test should be performed.
                  Should be instance of ImageDataset
        data_feats - The encoded features of all images in the dataset.
                     If None, they will be newly calculated, and returned
                     for later usage.
        k_shot - Number of examples per class in the support set.

    Returns:
        ((mean accuracy, standard deviation over support sets), (img_features, img_targets)).
        The standard deviation is 0.0 if only a single support set could be formed.

    Raises:
        ValueError - If k_shot is not positive, or if there are not more than
                     k_shot examples per class (no query examples would remain).
    """
    if k_shot < 1:
        raise ValueError(f"k_shot must be a positive integer, got {k_shot}")
    model = model.to(device)
    model.eval()

    # The encoder network remains unchanged across k-shot settings. Hence, we only need
    # to extract the features for all images once.
    if data_feats is None:
        num_classes = dataset.targets.unique().shape[0]
        exmps_per_class = dataset.targets.shape[0] // num_classes  # We assume uniform example distribution here
        # Dataset preparation
        dataloader = data.DataLoader(dataset, batch_size=128, num_workers=4, shuffle=False, drop_last=False)

        img_features = []
        img_targets = []
        for imgs, targets in tqdm(dataloader, "Extracting image features", leave=False):
            imgs = imgs.to(device)
            feats = model.model(imgs)
            img_features.append(feats.detach().cpu())
            img_targets.append(targets)
        img_features = torch.cat(img_features, dim=0)
        img_targets = torch.cat(img_targets, dim=0)
        # Sort by classes, so that we obtain tensors of shape [num_classes, exmps_per_class, ...]
        # Makes it easier to process later
        img_targets, sort_idx = img_targets.sort()
        img_targets = img_targets.reshape(num_classes, exmps_per_class).transpose(0, 1)
        img_features = img_features[sort_idx].reshape(num_classes, exmps_per_class, -1).transpose(0, 1)
    else:
        img_features, img_targets = data_feats

    num_exmps = img_features.shape[0]  # Examples per class (first dimension after the transpose)
    if num_exmps <= k_shot:
        raise ValueError(
            f"Need more than k_shot={k_shot} examples per class to have query examples left, got {num_exmps}"
        )
    # Only complete chunks are used as support sets: a trailing partial chunk would
    # contain fewer than k examples per class and hence not be a k-shot support set.
    num_support_sets = num_exmps // k_shot

    # We iterate through the full dataset in two manners. First, to select the k-shot batch.
    # Second, to evaluate the model on all other examples
    accuracies = []
    for k_idx in tqdm(
        range(0, num_support_sets * k_shot, k_shot), "Evaluating prototype classification", leave=False
    ):
        # Select support set and calculate prototypes
        k_img_feats = img_features[k_idx : k_idx + k_shot].flatten(0, 1)
        k_targets = img_targets[k_idx : k_idx + k_shot].flatten(0, 1)
        prototypes, proto_classes = model.calculate_prototypes(k_img_feats, k_targets)
        # Evaluate accuracy on the rest of the dataset. Chunks are weighted by their number of
        # examples, so that a smaller trailing chunk does not distort the average.
        num_correct = 0.0
        num_evaluated = 0
        for e_idx in range(0, num_exmps, k_shot):
            if k_idx == e_idx:  # Do not evaluate on the support set examples
                continue
            e_img_feats = img_features[e_idx : e_idx + k_shot].flatten(0, 1)
            e_targets = img_targets[e_idx : e_idx + k_shot].flatten(0, 1)
            _, _, acc = model.classify_feats(prototypes, proto_classes, e_img_feats, e_targets)
            num_correct += acc.item() * e_targets.shape[0]
            num_evaluated += e_targets.shape[0]
        accuracies.append(num_correct / num_evaluated)

    # The sample standard deviation is undefined for a single support set
    acc_std = stdev(accuracies) if len(accuracies) > 1 else 0.0
    return (mean(accuracies), acc_std), (img_features, img_targets)


# %% [markdown]
# Testing ProtoNet is relatively quick if we have processed all images once.
# Hence, we can do this in the notebook:

# %%
protonet_accuracies = {}
data_feats = None
for k in [2, 4, 8, 16, 32]:
    protonet_accuracies[k], data_feats = test_proto_net(protonet_model, test_set, data_feats=data_feats, k_shot=k)
    print(
        "Accuracy for k=%i: %4.2f%% (+-%4.2f%%)"
        % (k, 100.0 * protonet_accuracies[k][0], 100 * protonet_accuracies[k][1])
    )

# %% [markdown]
# Before discussing the results above, let's first plot the accuracies over number of examples in the support set:


# %%
def plot_few_shot(acc_dict, name, color=None, ax=None):
    """Plot mean accuracy (with a +-std band) over the number of shots.

    acc_dict - Dictionary mapping the number of shots to a (mean, std) pair
    name - Label of the curve; also appended to the axis title
    color - Color of the curve and its band
    ax - Axis to draw on. If None, a new figure is created
    Returns the axis that was drawn on.
    """
    sns.set()
    if ax is None:
        _, ax = plt.subplots(1, 1, figsize=(5, 3))

    ks = sorted(acc_dict)
    mean_accs = [acc_dict[k][0] for k in ks]
    std_accs = [acc_dict[k][1] for k in ks]
    lower_band = [m - s for m, s in zip(mean_accs, std_accs)]
    upper_band = [m + s for m, s in zip(mean_accs, std_accs)]

    ax.plot(ks, mean_accs, marker="o", markeredgecolor="k", markersize=6, label=name, color=color)
    ax.fill_between(ks, lower_band, upper_band, alpha=0.2, color=color)
    ax.set_xticks(ks)
    ax.set_xlim([ks[0] - 1, ks[-1] + 1])
    ax.set_xlabel("Number of shots per class", weight="bold")
    ax.set_ylabel("Accuracy", weight="bold")

    # Extend an existing title when several curves share one axis
    current_title = ax.get_title()
    if current_title:
        new_title = current_title + " and " + name
    else:
        new_title = "Few-Shot Performance " + name
    ax.set_title(new_title, weight="bold")
    ax.legend()
    return ax


# %%
ax = plot_few_shot(protonet_accuracies, name="ProtoNet", color="C1")
plt.show()
plt.close()

# %% [markdown]
# As we initially expected, the performance of ProtoNet indeed increases the more samples we have.
# However, even with just two samples per class, we classify almost half of the images correctly, which is well above random accuracy (10%).
# The curve shows an exponentially dampened trend, meaning that adding 2 extra examples to $k=2$ has a much higher impact than adding 2 extra samples if we already have $k=16$.
# Nonetheless, we can say that ProtoNet adapts fairly well to new classes.
+ +# %% [markdown] +# ## MAML and ProtoMAML +# +#
+ +# %% [markdown] +# The second meta-learning algorithm we will look at is MAML, short for Model-Agnostic Meta-Learning. +# MAML is an optimization-based meta-learning algorithm, which means that it tries to adjust the standard optimization procedure to a few-shot setting. +# The idea of MAML is relatively simple: given a model, support and query set during training, we optimize the model for $m$ steps on the support set, and evaluate the gradients of the query loss with respect to the original model's parameters. +# For the same model, we do it for a few different support-query sets and accumulate the gradients. +# This results in learning a model that provides a good initialization for being quickly adapted to the training tasks. +# If we denote the model parameters with $\theta$, we can visualize the procedure as follows (Figure credit - [Finn et al. ](http://proceedings.mlr.press/v70/finn17a.html)). +# +#
+ +# %% [markdown] +# The full algorithm of MAML is therefore as follows. +# At each training step, we sample a batch of tasks, i.e., a batch of support-query set pairs. +# For each task $\mathcal{T}_i$, we optimize a model $f_{\theta}$ on the support set via SGD, and denote this model as $f_{\theta_i'}$. +# We refer to this optimization as _inner loop_. +# Using this new model, we calculate the gradients of the original parameters, $\theta$, with respect to the query loss on $f_{\theta_i'}$. +# These gradients are accumulated over all tasks, and used to update $\theta$. +# This is called _outer loop_ since we iterate over tasks. +# The full MAML algorithm is summarized below (Figure credit - [Finn et al. ](http://proceedings.mlr.press/v70/finn17a.html)). +# +#
+ +# %% [markdown] +# To obtain gradients for the initial parameters $\theta$ from the optimized model $f_{\theta_i'}$, we actually need second-order gradients, i.e. gradients of gradients, as the support set gradients depend on $\theta$ as well. +# This makes MAML computationally expensive, especially when using multiple inner loop steps. +# A simpler, yet almost equally well performing alternative is First-Order MAML (FOMAML) which only uses first-order gradients. +# This means that the second-order gradients are ignored, and we can calculate the outer loop gradients (line 10 in algorithm 2) simply by calculating the gradients with respect to $\theta_i'$, and use those as update to $\theta$. +# Hence, the new update rule becomes: +# $$\theta\leftarrow\theta-\beta\sum_{\mathcal{T}_i\sim p(\mathcal{T})}\nabla_{\theta_i'}\mathcal{L}_{\mathcal{T}_i}(f_{\theta_i'})$$ +# Note the change of $\theta$ to $\theta_i'$ for $\nabla$. + +# %% [markdown] +# ### ProtoMAML +# +# A problem of MAML is how to design the output classification layer. +# In case all tasks have a different number of classes, we need to initialize the output layer with zeros or randomly in every iteration. +# Even if we always have the same number of classes, we just start from random predictions. +# This requires several inner loop steps to reach a reasonable classification result. +# To overcome this problem, Triantafillou et al. +# (2020) propose to combine the merits of Prototypical Networks and MAML. +# Specifically, we can use prototypes to initialize our output layer to have a strong initialization. +# Thereby, it can be shown that the softmax over euclidean distances can be reformulated as a linear layer with softmax. 
+# To see this, let's first write out the negative euclidean distance between a feature vector $f_{\theta}(\mathbf{x}^{*})$ of a new data point $\mathbf{x}^{*}$ to a prototype $\mathbf{v}_c$ of class $c$: +# $$ +# -||f_{\theta}(\mathbf{x}^{*})-\mathbf{v}_c||^2=-f_{\theta}(\mathbf{x}^{*})^Tf_{\theta}(\mathbf{x}^{*})+2\mathbf{v}_c^{T}f_{\theta}(\mathbf{x}^{*})-\mathbf{v}_c^T\mathbf{v}_c +# $$ +# +# We perform the classification across all classes $c\in\mathcal{C}$ and take a softmax on the distance. +# Hence, any term that is same for all classes can be removed without changing the output probabilities. +# In the equation above, this is true for $-f_{\theta}(\mathbf{x}^{*})^Tf_{\theta}(\mathbf{x}^{*})$ since it is independent of any class prototype. +# Thus, we can write: +# +# $$ +# -||f_{\theta}(\mathbf{x}^{*})-\mathbf{v}_c||^2=2\mathbf{v}_c^{T}f_{\theta}(\mathbf{x}^{*})-||\mathbf{v}_c||^2+\text{constant} +# $$ +# +# Taking a second look at the equation above, it looks a lot like a linear layer. +# For this, we use $\mathbf{W}_{c,\cdot}=2\mathbf{v}_c$ and $b_c=-||\mathbf{v}_c||^2$ which gives us the linear layer $\mathbf{W}f_{\theta}(\mathbf{x}^{*})+\mathbf{b}$. +# Hence, if we initialize the output weight with twice the prototypes, and the biases by the negative squared L2 norm of the prototypes, we start with a Prototypical Network. +# MAML allows us to adapt this layer and the rest of the network further. +# +# In the following, we will implement First-Order ProtoMAML for few-shot classification. +# The implementation of MAML would be the same except the output layer initialization. + +# %% [markdown] +# ### ProtoMAML implementation +# +# For implementing ProtoMAML, we can follow Algorithm 2 with minor modifications. +# At each training step, we first sample a batch of tasks, and a support and query set for each task. +# In our case of few-shot classification, this means that we simply sample multiple support-query set pairs from our sampler. 
+# For each task, we finetune our current model on the support set. +# However, since we need to remember the original parameters for the other tasks, the outer loop gradient update and future training steps, we need to create a copy of our model, and finetune only the copy. +# We can copy a model by using standard Python functions like `deepcopy`. +# The inner loop is implemented in the function `adapt_few_shot` in the PyTorch Lightning module below. +# +# After finetuning the model, we apply it on the query set and calculate the first-order gradients with respect to the original parameters $\theta$. +# In contrast to simple MAML, we also have to consider the gradients with respect to the output layer initialization, i.e. the prototypes, since they directly rely on $\theta$. +# To realize this efficiently, we take two steps. +# First, we calculate the prototypes by applying the original model, i.e. not the copied model, on the support elements. +# When initializing the output layer, we detach the prototypes to stop the gradients. +# This is because in the inner loop itself, we do not want to consider gradients through the prototypes back to the original model. +# However, after the inner loop is finished, we re-attach the computation graph of the prototypes by writing `output_weight = (output_weight - init_weight).detach() + init_weight`. +# While this line does not change the value of the variable `output_weight`, it adds its dependency on the prototype initialization `init_weight`. +# Thus, if we call `.backward` on `output_weight`, we will automatically calculate the first-order gradients with respect to the prototype initialization in the original model. +# +# After calculating all gradients and summing them together in the original model, we can take a standard optimizer step. +# PyTorch Lightning's method is however designed to return a loss-tensor on which we call `.backward` first. 
# Since this is not possible here, we need to perform the optimization step ourselves.
# All details can be found in the code below.
#
# For implementing (Proto-)MAML with second-order gradients, it is recommended to use libraries such as [$\nabla$higher](https://github.com/facebookresearch/higher) from Facebook AI Research.
# For simplicity, we stick with first-order methods here.


# %%
class ProtoMAML(L.LightningModule):
    """First-order ProtoMAML: MAML whose output layer is initialized from class prototypes."""

    def __init__(self, proto_dim, lr, lr_inner, lr_output, num_inner_steps):
        """Inputs.

        proto_dim - Dimensionality of prototype feature space
        lr - Learning rate of the outer loop Adam optimizer
        lr_inner - Learning rate of the inner loop SGD optimizer
        lr_output - Learning rate for the output layer in the inner loop
        num_inner_steps - Number of inner loop updates to perform
        """
        super().__init__()
        self.save_hyperparameters()
        self.model = get_convnet(output_size=self.hparams.proto_dim)

    def configure_optimizers(self):
        """Return the outer-loop AdamW optimizer with a step-wise learning rate decay."""
        optimizer = optim.AdamW(self.parameters(), lr=self.hparams.lr)
        scheduler = optim.lr_scheduler.MultiStepLR(optimizer, milestones=[140, 180], gamma=0.1)
        return [optimizer], [scheduler]

    def run_model(self, local_model, output_weight, output_bias, imgs, labels):
        """Execute a model with given output layer weights and inputs.

        Returns the cross entropy loss, the logits, and the per-example accuracy (0/1 floats).
        """
        feats = local_model(imgs)
        preds = F.linear(feats, output_weight, output_bias)
        loss = F.cross_entropy(preds, labels)
        acc = (preds.argmax(dim=1) == labels).float()
        return loss, preds, acc

    def adapt_few_shot(self, support_imgs, support_targets):
        """Inner loop: finetune a copy of the model on the support set.

        Returns the finetuned copy, the adapted output layer (weight and bias, re-attached
        to the prototype computation graph of the original model), and the class tensor.
        """
        # Determine prototype initialization
        support_feats = self.model(support_imgs)
        prototypes, classes = ProtoNet.calculate_prototypes(support_feats, support_targets)
        support_labels = (classes[None, :] == support_targets[:, None]).long().argmax(dim=-1)
        # Create inner-loop model and optimizer
        local_model = deepcopy(self.model)
        local_model.train()
        local_optim = optim.SGD(local_model.parameters(), lr=self.hparams.lr_inner)
        local_optim.zero_grad()
        # Create output layer weights with prototype-based initialization
        init_weight = 2 * prototypes
        init_bias = -torch.norm(prototypes, dim=1) ** 2
        output_weight = init_weight.detach().requires_grad_()
        output_bias = init_bias.detach().requires_grad_()

        # Optimize inner loop model on support set
        for _ in range(self.hparams.num_inner_steps):
            # Determine loss on the support set
            loss, _, _ = self.run_model(local_model, output_weight, output_bias, support_imgs, support_labels)
            # Calculate gradients and perform inner loop update
            loss.backward()
            local_optim.step()
            # Update output layer via SGD. The update itself must not be tracked by autograd.
            with torch.no_grad():
                output_weight -= self.hparams.lr_output * output_weight.grad
                output_bias -= self.hparams.lr_output * output_bias.grad
            # Reset gradients
            local_optim.zero_grad()
            output_weight.grad.zero_()
            output_bias.grad.zero_()

        # Re-attach computation graph of prototypes
        output_weight = (output_weight - init_weight).detach() + init_weight
        output_bias = (output_bias - init_bias).detach() + init_bias

        return local_model, output_weight, output_bias, classes

    def outer_loop(self, batch, mode="train"):
        """Outer loop: adapt to every task of the batch and, in training, update the base model.

        batch - List of (imgs, targets) tasks, each a stacked support+query set
        mode - "train" to accumulate gradients and step the optimizer; any other value only logs
        """
        accuracies = []
        losses = []
        self.model.zero_grad()

        # Determine gradients for batch of tasks
        for task_batch in batch:
            imgs, targets = task_batch
            support_imgs, query_imgs, support_targets, query_targets = split_batch(imgs, targets)
            # Perform inner loop adaptation
            local_model, output_weight, output_bias, classes = self.adapt_few_shot(support_imgs, support_targets)
            # Determine loss of query set
            query_labels = (classes[None, :] == query_targets[:, None]).long().argmax(dim=-1)
            loss, preds, acc = self.run_model(local_model, output_weight, output_bias, query_imgs, query_labels)
            # Calculate gradients for query set loss
            if mode == "train":
                loss.backward()

                # First-order approx. -> add gradients of finetuned and base model
                for p_global, p_local in zip(self.model.parameters(), local_model.parameters()):
                    if p_local.grad is None:  # Parameter did not contribute to the query loss
                        continue
                    if p_global.grad is None:  # No gradient through the prototypes for this parameter
                        p_global.grad = p_local.grad.detach().clone()
                    else:
                        p_global.grad += p_local.grad

            accuracies.append(acc.mean().detach())
            losses.append(loss.detach())

        # Perform update of base model
        if mode == "train":
            opt = self.optimizers()
            opt.step()
            opt.zero_grad()

        self.log(f"{mode}_loss", sum(losses) / len(losses))
        self.log(f"{mode}_acc", sum(accuracies) / len(accuracies))

    def training_step(self, batch, batch_idx):
        self.outer_loop(batch, mode="train")
        return None  # Returning None means we skip the default training optimizer steps by PyTorch Lightning

    def validation_step(self, batch, batch_idx):
        # Validation requires to finetune a model, hence we need to enable gradients.
        # The context manager restores the previous grad mode, also if an exception is raised.
        with torch.enable_grad():
            self.outer_loop(batch, mode="val")


# %% [markdown]
# ### Training
#
# To train ProtoMAML, we need to change our sampling slightly.
# Instead of a single support-query set batch, we need to sample multiple.
# To implement this, we use yet another Sampler which combines multiple batches from a `FewShotBatchSampler`, and returns it afterwards.
# Additionally, we define a `collate_fn` for our data loader which takes the stack of support-query set images, and returns the tasks as a list.
# This makes it easier to process in the PyTorch Lightning module we defined before.
# The implementation of the sampler can be found below.


# %%
class TaskBatchSampler:
    def __init__(self, dataset_targets, batch_size, N_way, K_shot, include_query=False, shuffle=True):
        """
        Inputs:
            dataset_targets - PyTorch tensor of the labels of the data elements.
            batch_size - Number of tasks to aggregate in a batch
            N_way - Number of classes to sample per batch.
            K_shot - Number of examples to sample per class in the batch.
            include_query - If True, returns batch of size N_way*K_shot*2, which
                            can be split into support and query set. Simplifies
                            the implementation of sampling the same classes but
                            distinct examples for support and query set.
            shuffle - If True, examples and classes are newly shuffled in each
                      iteration (for training)
        """
        super().__init__()
        self.batch_sampler = FewShotBatchSampler(dataset_targets, N_way, K_shot, include_query, shuffle)
        self.task_batch_size = batch_size
        self.local_batch_size = self.batch_sampler.batch_size

    def __iter__(self):
        # Aggregate multiple batches before returning the indices.
        # A trailing, incomplete group of tasks is dropped, consistent with __len__.
        batch_list = []
        for batch_idx, batch in enumerate(self.batch_sampler):
            batch_list.extend(batch)
            if (batch_idx + 1) % self.task_batch_size == 0:
                yield batch_list
                batch_list = []

    def __len__(self):
        return len(self.batch_sampler) // self.task_batch_size

    def get_collate_fn(self):
        # Returns a collate function that converts one big tensor into a list of task-specific tensors
        def collate_fn(item_list):
            imgs = torch.stack([img for img, target in item_list], dim=0)
            targets = torch.stack([target for img, target in item_list], dim=0)
            imgs = imgs.chunk(self.task_batch_size, dim=0)
            targets = targets.chunk(self.task_batch_size, dim=0)
            return list(zip(imgs, targets))

        return collate_fn


# %% [markdown]
# With this sampler, the creation of the data loaders is straightforward.
# Note that since many images need to be loaded for a training batch, it is recommended to use fewer workers than usual.
# %%
# Training constants (same as for ProtoNet)
N_WAY = 5
K_SHOT = 4

# Training set: the sampler aggregates 16 tasks into every batch
train_protomaml_sampler = TaskBatchSampler(
    train_set.targets,
    batch_size=16,
    N_way=N_WAY,
    K_shot=K_SHOT,
    include_query=True,
)
train_protomaml_loader = data.DataLoader(
    dataset=train_set,
    batch_sampler=train_protomaml_sampler,
    collate_fn=train_protomaml_sampler.get_collate_fn(),
    num_workers=2,
)

# Validation set
val_protomaml_sampler = TaskBatchSampler(
    val_set.targets,
    batch_size=1,  # We do not update the parameters, hence the batch size is irrelevant here
    N_way=N_WAY,
    K_shot=K_SHOT,
    include_query=True,
    shuffle=False,
)
val_protomaml_loader = data.DataLoader(
    dataset=val_set,
    batch_sampler=val_protomaml_sampler,
    collate_fn=val_protomaml_sampler.get_collate_fn(),
    num_workers=2,
)

# %% [markdown]
# Now, we are ready to train our ProtoMAML.
# We use the same feature space size as for ProtoNet, but can use a higher learning rate since the outer loop gradients are accumulated over 16 batches.
# The inner loop learning rate is set to 0.1, which is much higher than the outer loop lr because we use SGD in the inner loop instead of Adam.
# Commonly, the learning rate for the output layer is higher than the base model if the base model is very deep or pre-trained.
# However, for our setup, we observed no noticeable impact of using a different learning rate than the base model.
# The number of inner loop updates is another crucial hyperparameter, and depends on the similarity of our training tasks.
# Since all tasks are on images from the same dataset, we notice that a single inner loop update achieves similar performance as 3 or 5 while training considerably faster.
# However, especially in RL and NLP, larger number of inner loop steps are often needed.

# %%
protomaml_model = train_model(
    ProtoMAML,
    proto_dim=64,
    lr=1e-3,
    lr_inner=0.1,
    lr_output=0.1,
    num_inner_steps=1,  # Often values between 1 and 10
    train_loader=train_protomaml_loader,
    val_loader=val_protomaml_loader,
)

# %% [markdown]
# Let's have a look at the training TensorBoard.

# %%
# Opens tensorboard in notebook. Adjust the path to your CHECKPOINT_PATH if needed
# # %tensorboard --logdir ../saved_models/tutorial16/tensorboards/ProtoMAML/

# %% [markdown]
#
#
# One obvious difference to ProtoNet is that the loss curves look much less noisy.
# This is because we average the outer loop gradients over multiple tasks, and thus have a smoother training curve.
# Additionally, we only have 15k training iterations after 200 epochs.
# This is again because of the task batches, which cause 16 times fewer iterations.
# However, each iteration has seen 16 times more data in this experiment.
# Thus, we still have a fair comparison between ProtoMAML and ProtoNet.
# At first sight on the validation accuracy, one would assume that
# ProtoNet performs superior to ProtoMAML, but we have to verify that with
# proper testing below.

# %% [markdown]
# ### Testing
#
# We test ProtoMAML in the same manner as ProtoNet, namely by picking random examples in the test set as support sets and using the rest of the dataset as query set.
# Instead of just calculating the prototypes for all examples, we need to finetune a separate model for each support set.
# This is why this process is more expensive than ProtoNet, and in our case, testing $k=\{2,4,8,16,32\}$ can take almost an hour.
# Hence, we provide evaluation files besides the pretrained models.


# %%
def test_protomaml(model, dataset, k_shot=4):
    """Evaluate a ProtoMAML model with k-shot finetuning on ``dataset``.

    For every support set produced by the ``FewShotBatchSampler``, the model is
    adapted via ``model.adapt_few_shot`` and then scored on the full dataset.
    The support examples themselves are excluded from the accuracy.

    Inputs:
        model - Module exposing ``adapt_few_shot`` and ``run_model``.
        dataset - Dataset with a ``targets`` tensor; used for support and query.
        k_shot - Number of support examples per class.
    Returns:
        Tuple (mean, standard deviation) of the accuracy over all support sets.
    """
    L.seed_everything(42)
    model = model.to(device)
    n_classes = dataset.targets.unique().shape[0]

    # Loader over the complete dataset, which acts as the query set
    full_dataloader = data.DataLoader(dataset, batch_size=128, num_workers=4, shuffle=False, drop_last=False)
    # Sampler and loader that deliver one k-shot support set per iteration
    sampler = FewShotBatchSampler(
        dataset.targets, include_query=False, N_way=n_classes, K_shot=k_shot, shuffle=False, shuffle_once=False
    )
    sample_dataloader = data.DataLoader(dataset, batch_sampler=sampler, num_workers=2)

    # The dataset is traversed in two ways: the loader provides the support tensors,
    # while the sampler provides the matching indices so they can be masked out later
    accuracies = []
    support_stream = zip(sample_dataloader, sampler)
    for (support_imgs, support_targets), support_indices in tqdm(support_stream, "Performing few-shot finetuning"):
        support_imgs, support_targets = support_imgs.to(device), support_targets.to(device)
        # Finetune a fresh copy of the model on this support set
        local_model, output_weight, output_bias, classes = model.adapt_few_shot(support_imgs, support_targets)
        with torch.no_grad():  # The query pass needs no gradients
            local_model.eval()
            per_example_acc = torch.zeros((0,), dtype=torch.float32, device=device)
            # Score every example of the dataset with the adapted model
            for query_imgs, query_targets in full_dataloader:
                query_imgs = query_imgs.to(device)
                query_targets = query_targets.to(device)
                # Map dataset labels to positions in ``classes``
                query_labels = (classes[None, :] == query_targets[:, None]).long().argmax(dim=-1)
                _, _, acc = model.run_model(local_model, output_weight, output_bias, query_imgs, query_labels)
                per_example_acc = torch.cat([per_example_acc, acc.detach()], dim=0)
            # Support examples must not count: zero their entries and shrink the denominator
            for s_idx in support_indices:
                per_example_acc[s_idx] = 0
            num_queries = per_example_acc.shape[0] - len(support_indices)
            accuracies.append(per_example_acc.sum().item() / num_queries)
    return mean(accuracies), stdev(accuracies)


# %% [markdown]
# In contrast to training, it is recommended to use many more inner loop updates during testing.
# During training, we are not interested in getting the best model from the inner loop, but the model which can provide the best gradients.
# Hence, one update might be already sufficient in training, but for testing, it was often observed that larger number of updates can give a considerable performance boost.
# Thus, we change the inner loop updates to 200 before testing.

# %%
protomaml_model.hparams.num_inner_steps = 200

# %% [markdown]
# Now, we can test our model.
# For the pre-trained models, we provide a json file with the results to reduce evaluation time.
# %%
protomaml_result_file = os.path.join(CHECKPOINT_PATH, "protomaml_fewshot.json")

if not os.path.isfile(protomaml_result_file):
    # No cached results: perform the same experiments as for ProtoNet and export them
    protomaml_accuracies = {k: test_protomaml(protomaml_model, test_set, k_shot=k) for k in [2, 4, 8, 16, 32]}
    with open(protomaml_result_file, "w") as f:
        json.dump(protomaml_accuracies, f, indent=4)
else:
    # Load pre-computed results and turn the keys back into integers
    with open(protomaml_result_file) as f:
        protomaml_accuracies = {int(k): v for k, v in json.load(f).items()}

# Each entry holds (mean accuracy, standard deviation)
for k, stats in protomaml_accuracies.items():
    print("Accuracy for k=%i: %4.2f%% (+-%4.2f%%)" % (k, 100.0 * stats[0], 100.0 * stats[1]))

# %% [markdown]
# Again, let's plot the results in our plot from before.

# %%
ax = plot_few_shot(protonet_accuracies, name="ProtoNet", color="C1")
plot_few_shot(protomaml_accuracies, name="ProtoMAML", color="C2", ax=ax)
plt.show()
plt.close()

# %% [markdown]
# We can observe that ProtoMAML is indeed able to outperform ProtoNet for $k>4$.
# This is because with more samples, it becomes more relevant to also adapt the base model's parameters.
# Meanwhile, for $k=2$, ProtoMAML achieves lower performance than ProtoNet.
# This is likely also related to choosing 200 inner loop updates since with more updates, there exists the risk of overfitting.
# Nonetheless, the high standard deviation for $k=2$ makes it hard to draw any statistically valid conclusion.
#
# Overall, we can conclude that ProtoMAML slightly outperforms ProtoNet for larger shot counts.
# However, one disadvantage of ProtoMAML is its much longer training and testing time.
# ProtoNet provides a simple, efficient, yet strong baseline for
# ProtoMAML, and might be the better solution in situations where limited
# resources are available.
# %% [markdown]
# ## Domain adaptation
#
# So far, we have evaluated our meta-learning algorithms on the same dataset on which we have trained them.
# However, meta-learning algorithms are especially interesting when we want to move from one to another dataset.
# So, what happens if we apply them on a quite different dataset than CIFAR?
# This is what we try out below, and evaluate ProtoNet and ProtoMAML on the SVHN dataset.

# %% [markdown]
# ### SVHN dataset
#
# The Street View House Numbers (SVHN) dataset is a real-world image dataset for house number detection.
# It is similar to MNIST by having the classes 0 to 9, but is more difficult due to its real-world setting and possible distracting numbers left and right.
# Let's first load the dataset, and visualize some images to get an impression of the dataset.

# %%
SVHN_test_dataset = SVHN(
    root=DATASET_PATH,
    split="test",
    download=True,
    transform=transforms.ToTensor(),
)

# %%
# Visualize some randomly picked examples
NUM_IMAGES = 12
SVHN_images = torch.stack(
    [SVHN_test_dataset[np.random.randint(len(SVHN_test_dataset))][0] for _ in range(NUM_IMAGES)],
    dim=0,
)
# make_grid returns channels first; matplotlib expects channels last
img_grid = torchvision.utils.make_grid(SVHN_images, nrow=6, normalize=True, pad_value=0.9).permute(1, 2, 0)

plt.figure(figsize=(8, 8))
plt.title("Image examples of the SVHN dataset")
plt.imshow(img_grid)
plt.axis("off")
plt.show()
plt.close()

# %% [markdown]
# Each image is labeled with one class between 0 and 9 representing the main digit in the image.
# Can our ProtoNet and ProtoMAML learn to classify the digits from only a few examples?
# This is what we will test out below.
# The images have the same size as CIFAR, so that we can use the images without changes.
# We first prepare the dataset, for which we take the first 500 images per class.
# For this dataset, we use our test functions as before to get an estimated performance for different number of shots.
# %%
# Reorder the image array's axes before handing it to ImageDataset
imgs = np.transpose(SVHN_test_dataset.data, axes=(0, 2, 3, 1))
targets = SVHN_test_dataset.labels
# Limit number of examples to 500 to reduce test time
min_label_count = min(500, np.bincount(targets).min())

# Keep the first `min_label_count` indices of every class, class by class
idxs = np.concatenate(
    [np.flatnonzero(targets == c)[:min_label_count] for c in range(targets.max() + 1)],
    axis=0,
)
imgs = imgs[idxs]
targets = torch.from_numpy(targets[idxs]).long()

svhn_fewshot_dataset = ImageDataset(imgs, targets, img_transform=test_transform)
svhn_fewshot_dataset.imgs.shape

# %% [markdown]
# ### Experiments
#
# First, we can apply ProtoNet to the SVHN dataset:

# %%
protonet_svhn_accuracies = {}
data_feats = None  # Filled by the first call and passed back in on later iterations
for k in [2, 4, 8, 16, 32]:
    protonet_svhn_accuracies[k], data_feats = test_proto_net(
        protonet_model,
        svhn_fewshot_dataset,
        data_feats=data_feats,
        k_shot=k,
    )
    k_mean, k_std = protonet_svhn_accuracies[k][0], protonet_svhn_accuracies[k][1]
    print("Accuracy for k=%i: %4.2f%% (+-%4.2f%%)" % (k, 100.0 * k_mean, 100 * k_std))

# %% [markdown]
# It becomes clear that the results are much lower than the ones on CIFAR, and just slightly above random for $k=2$.
# How about ProtoMAML?
# We provide again evaluation files since the evaluation can take several minutes to complete.
# %%
protomaml_result_file = os.path.join(CHECKPOINT_PATH, "protomaml_svhn_fewshot.json")

if not os.path.isfile(protomaml_result_file):
    # No cached results: perform the same experiments as for ProtoNet and export them
    protomaml_svhn_accuracies = {
        k: test_protomaml(protomaml_model, svhn_fewshot_dataset, k_shot=k) for k in [2, 4, 8, 16, 32]
    }
    with open(protomaml_result_file, "w") as f:
        json.dump(protomaml_svhn_accuracies, f, indent=4)
else:
    # Load pre-computed results and turn the keys back into integers
    with open(protomaml_result_file) as f:
        protomaml_svhn_accuracies = {int(k): v for k, v in json.load(f).items()}

# Each entry holds (mean accuracy, standard deviation)
for k, stats in protomaml_svhn_accuracies.items():
    print("Accuracy for k=%i: %4.2f%% (+-%4.2f%%)" % (k, 100.0 * stats[0], 100.0 * stats[1]))

# %% [markdown]
# While ProtoMAML shows similar performance to ProtoNet for $k\leq 4$, it considerably outperforms ProtoNet for more than 8 shots.
# This is because we can adapt the base model, which is crucial when the data does not fit the original training data.
# For $k=32$, ProtoMAML achieves $13\%$ higher classification accuracy than ProtoNet which already starts to flatten out.
# We can see the trend more clearly in our plot below.

# %%
ax = plot_few_shot(protonet_svhn_accuracies, name="ProtoNet", color="C1")
plot_few_shot(protomaml_svhn_accuracies, name="ProtoMAML", color="C2", ax=ax)
plt.show()
plt.close()

# %% [markdown]
# ## Conclusion
#
# In this notebook, we have discussed meta-learning algorithms that learn to adapt to new classes and/or tasks with just a few samples.
# We have discussed three popular algorithms, namely ProtoNet, MAML and ProtoMAML.
# On the few-shot image classification task of CIFAR100, ProtoNet and ProtoMAML showed to perform similarly well, with slight benefits of ProtoMAML for larger shot sizes.
+# However, for out-of-distribution data (SVHN), the ability to optimize the base model showed to be crucial and gave ProtoMAML considerable performance gains over ProtoNet. +# Nonetheless, ProtoNet offers other advantages compared to ProtoMAML, namely a very cheap training and test cost as well as a simpler implementation. +# Hence, it is recommended to consider whether the additional complexity +# of ProtoMAML is worth the extra training computation cost, or whether +# ProtoNet is already sufficient for the task at hand. + +# %% [markdown] +# ### References +# +# [1] Snell, Jake, Kevin Swersky, and Richard S. Zemel. +# "Prototypical networks for few-shot learning." +# NeurIPS 2017. +# ([link](https://arxiv.org/pdf/1703.05175.pdf)) +# +# [2] Chelsea Finn, Pieter Abbeel, Sergey Levine. +# "Model-Agnostic Meta-Learning for Fast Adaptation of Deep Networks." +# ICML 2017. +# ([link](http://proceedings.mlr.press/v70/finn17a.html)) +# +# [3] Triantafillou, Eleni, Tyler Zhu, Vincent Dumoulin, Pascal Lamblin, Utku Evci, Kelvin Xu, Ross Goroshin et al. +# "Meta-dataset: A dataset of datasets for learning to learn from few examples." +# ICLR 2020.
+# ([link](https://openreview.net/pdf?id=rkgAGAVKPr)) diff --git a/_notebooks/course_UvA-DL/12-meta-learning/few-shot-classification.png b/_notebooks/course_UvA-DL/12-meta-learning/few-shot-classification.png new file mode 100644 index 0000000..d0146d1 Binary files /dev/null and b/_notebooks/course_UvA-DL/12-meta-learning/few-shot-classification.png differ diff --git a/_notebooks/course_UvA-DL/12-meta-learning/protonet_classification.svg b/_notebooks/course_UvA-DL/12-meta-learning/protonet_classification.svg new file mode 100644 index 0000000..716fbe3 --- /dev/null +++ b/_notebooks/course_UvA-DL/12-meta-learning/protonet_classification.svg @@ -0,0 +1,612 @@ + + + + + + image/svg+xml + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/_notebooks/course_UvA-DL/12-meta-learning/tensorboard_screenshot_ProtoMAML.png b/_notebooks/course_UvA-DL/12-meta-learning/tensorboard_screenshot_ProtoMAML.png new file mode 100644 index 0000000..13f2993 Binary files /dev/null and b/_notebooks/course_UvA-DL/12-meta-learning/tensorboard_screenshot_ProtoMAML.png differ diff --git a/_notebooks/course_UvA-DL/12-meta-learning/tensorboard_screenshot_ProtoNet.png b/_notebooks/course_UvA-DL/12-meta-learning/tensorboard_screenshot_ProtoNet.png new file mode 100644 index 0000000..e420ef8 Binary files /dev/null and b/_notebooks/course_UvA-DL/12-meta-learning/tensorboard_screenshot_ProtoNet.png differ diff --git a/_notebooks/course_UvA-DL/13-contrastive-learning/.meta.yml b/_notebooks/course_UvA-DL/13-contrastive-learning/.meta.yml new file mode 100644 index 0000000..6f9832f --- /dev/null +++ b/_notebooks/course_UvA-DL/13-contrastive-learning/.meta.yml @@ -0,0 +1,26 @@ +title: "Tutorial 13: Self-Supervised Contrastive 
Learning with SimCLR" +author: Phillip Lippe +created: 2021-08-30 +updated: 2023-03-14 +license: CC BY-SA +tags: + - Image + - Self-Supervised + - Contrastive-Learning +description: | + In this tutorial, we will take a closer look at self-supervised contrastive learning. + Self-supervised learning, or also sometimes called unsupervised learning, describes the scenario where we have given input data, but no accompanying labels to train in a classical supervised way. + However, this data still contains a lot of information from which we can learn: how are the images different from each other? + What patterns are descriptive for certain images? + Can we cluster the images? + To get an insight into these questions, we will implement a popular, simple contrastive learning method, SimCLR, and apply it to the STL10 dataset. + This notebook is part of a lecture series on Deep Learning at the University of Amsterdam. + The full list of tutorials can be found at https://uvadlc-notebooks.rtfd.io. +requirements: + - torchvision + - matplotlib + - seaborn + - lightning>=2.0.0rc0 +accelerator: + - CPU + - GPU diff --git a/docs/_static/images/course_UvA-DL/13-contrastive-learning.jpg b/_notebooks/course_UvA-DL/13-contrastive-learning/.thumb.jpg similarity index 100% rename from docs/_static/images/course_UvA-DL/13-contrastive-learning.jpg rename to _notebooks/course_UvA-DL/13-contrastive-learning/.thumb.jpg diff --git a/_notebooks/course_UvA-DL/13-contrastive-learning/SimCLR.py b/_notebooks/course_UvA-DL/13-contrastive-learning/SimCLR.py new file mode 100644 index 0000000..1bc97bb --- /dev/null +++ b/_notebooks/course_UvA-DL/13-contrastive-learning/SimCLR.py @@ -0,0 +1,841 @@ +# %% [markdown] +#
+# Methods for self-supervised learning try to learn as much as possible from the data alone, so it can quickly be finetuned for a specific classification task. +# The benefit of self-supervised learning is that a large dataset can often easily be obtained. +# For instance, if we want to train a vision model on semantic segmentation for autonomous driving, we can collect large amounts of data by simply installing a camera in a car, and driving through a city for an hour. +# In contrast, if we wanted to do supervised learning, we would have to manually label all those images before training a model. +# This is extremely expensive, and would likely take a couple of months to manually label the same amount of data. +# Further, self-supervised learning can provide an alternative to transfer learning from models pretrained on ImageNet since we could pretrain a model on a specific dataset/situation, e.g. traffic scenarios for autonomous driving. +# +# Within the last two years, a lot of new approaches have been proposed for self-supervised learning, in particular for images, that have resulted in great improvements over supervised models when few labels are available. +# The subfield that we will focus on in this tutorial is contrastive learning. +# Contrastive learning is motivated by the question mentioned above: how are images different from each other? +# Specifically, contrastive learning methods train a model to cluster an image and its slightly augmented version in latent space, while the distance to other images should be maximized. +# A very recent and simple method for this is [SimCLR](https://arxiv.org/abs/2002.05709), which is visualized below (figure credit - [Ting Chen et al. ](https://simclr.github.io/)). +# +#
![simclr contrastive learning](simclr_contrastive_learning.png){width="500px"}
+# +# The general setup is that we are given a dataset of images without any labels, and want to train a model on this data such that it can quickly adapt to any image recognition task afterward. +# During each training iteration, we sample a batch of images as usual. +# For each image, we create two versions by applying data augmentation techniques like cropping, Gaussian noise, blurring, etc. +# An example of such is shown on the left with the image of the dog. +# We will go into the details and effects of the chosen augmentation techniques later. +# On those images, we apply a CNN like ResNet and obtain as output a 1D feature vector on which we apply a small MLP. +# The output features of the two augmented images are then trained to be close to each other, while all other images in that batch should be as different as possible. +# This way, the model has to learn to recognize the content of the image that remains unchanged under the data augmentations, such as objects which we usually care about in supervised tasks. +# +# We will now implement this framework ourselves and discuss further details along the way. 
# Let's first start with importing our standard libraries below:

# %%
import os
import urllib.request
from copy import deepcopy
from urllib.error import HTTPError

import lightning as L
import matplotlib
import matplotlib.pyplot as plt
import matplotlib_inline.backend_inline
import seaborn as sns
import torch
import torch.nn as nn
import torch.nn.functional as F
import torch.optim as optim
import torch.utils.data as data
import torchvision
from lightning.pytorch.callbacks import LearningRateMonitor, ModelCheckpoint
from torchvision import transforms
from torchvision.datasets import STL10
from tqdm.notebook import tqdm

plt.set_cmap("cividis")
# %matplotlib inline
matplotlib_inline.backend_inline.set_matplotlib_formats("svg", "pdf")  # For export
matplotlib.rcParams["lines.linewidth"] = 2.0
sns.set()

# Import tensorboard
# %load_ext tensorboard

# Path to the folder where the datasets are/should be downloaded (e.g. CIFAR10)
DATASET_PATH = os.environ.get("PATH_DATASETS", "data/")
# Path to the folder where the pretrained models are saved
CHECKPOINT_PATH = os.environ.get("PATH_CHECKPOINT", "saved_models/ContrastiveLearning/")
# In this notebook, we use data loaders with heavier computational processing. It is recommended to use as many
# workers as possible in a data loader, which corresponds to the number of CPU cores
NUM_WORKERS = os.cpu_count()

# Setting the seed
L.seed_everything(42)

# Ensure that all operations are deterministic on GPU (if used) for reproducibility.
# NOTE: the flag is spelled `deterministic`; a misspelled name would only create an
# unused attribute and leave cuDNN free to pick non-deterministic algorithms.
torch.backends.cudnn.deterministic = True
torch.backends.cudnn.benchmark = False

device = torch.device("cuda:0") if torch.cuda.is_available() else torch.device("cpu")
print("Device:", device)
print("Number of workers:", NUM_WORKERS)

# %% [markdown]
# As in many tutorials before, we provide pre-trained models.
# Note that those models are slightly larger than normal (~100MB overall) since we use the default ResNet-18 architecture.
# If you are running this notebook locally, make sure to have sufficient disk space available.

# %%
# Github URL where saved models are stored for this tutorial
base_url = "https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial17/"
# Files to download
pretrained_files = [
    "SimCLR.ckpt",
    "ResNet.ckpt",
    "tensorboards/SimCLR/events.out.tfevents.SimCLR",
    "tensorboards/classification/ResNet/events.out.tfevents.ResNet",
]
pretrained_files.extend(f"LogisticRegression_{size}.ckpt" for size in (10, 20, 50, 100, 200, 500))
# Create checkpoint path if it doesn't exist yet
os.makedirs(CHECKPOINT_PATH, exist_ok=True)

# Fetch every file that is not available locally yet
for file_name in pretrained_files:
    file_path = os.path.join(CHECKPOINT_PATH, file_name)
    if "/" in file_name:
        # Nested files need their parent folder before the download can write to it
        os.makedirs(os.path.dirname(file_path), exist_ok=True)
    if os.path.isfile(file_path):
        continue
    file_url = base_url + file_name
    print(f"Downloading {file_url}...")
    try:
        urllib.request.urlretrieve(file_url, file_path)
    except HTTPError as e:
        # Best effort: report the failure and continue with the remaining files
        print(
            "Something went wrong. Please try to download the file from the GDrive folder, or contact the author with the full output including the following error:\n",
            e,
        )

# %% [markdown]
# ## SimCLR
#
# We will start our exploration of contrastive learning by discussing the effect of different data augmentation techniques, and how we can implement an efficient data loader for such.
# Next, we implement SimCLR with PyTorch Lightning, and finally train it on a large, unlabeled dataset.

# %% [markdown]
# ### Data Augmentation for Contrastive Learning
#
# To allow efficient training, we need to prepare the data loading such that we sample two different, random augmentations for each image in the batch.
# The easiest way to do this is by creating a transformation that, when being called, applies a set of data augmentations to an image twice.
# This is implemented in the class `ContrastiveTransformations` below:


# %%
class ContrastiveTransformations:
    """Callable that applies the same transformation pipeline several times to one input.

    Inputs:
        base_transforms - Callable applied to the input once per view.
        n_views - Number of views to create per input.
    """

    def __init__(self, base_transforms, n_views=2):
        self.n_views = n_views
        self.base_transforms = base_transforms

    def __call__(self, x):
        # One independent call of the pipeline per requested view
        views = []
        for _ in range(self.n_views):
            views.append(self.base_transforms(x))
        return views


# %% [markdown]
# The contrastive learning framework can easily be extended to have more _positive_ examples by sampling more than two augmentations of the same image.
# However, the most efficient training is usually obtained by using only two.
#
# Next, we can look at the specific augmentations we want to apply.
# The choice of the data augmentation to use is the most crucial hyperparameter in SimCLR since it directly affects how the latent space is structured, and what patterns might be learned from the data.
# Let's first take a look at some of the most popular data augmentations (figure credit - [Ting Chen and Geoffrey Hinton](https://ai.googleblog.com/2020/04/advancing-self-supervised-and-semi.html)):
#
#
+# +# All of them can be used, but it turns out that two augmentations stand out in their importance: crop-and-resize, and color distortion. +# Interestingly, however, they only lead to strong performance if they have been used together as discussed by [Ting Chen et al. ](https://arxiv.org/abs/2002.05709) in their SimCLR paper. +# When performing random cropping and resizing, we can distinguish between two situations: (a) cropped image A provides a local view of cropped image B, or (b) cropped images C and D show neighboring views of the same image (figure credit - [Ting Chen and Geoffrey Hinton](https://ai.googleblog.com/2020/04/advancing-self-supervised-and-semi.html)). +# +#
+# +# While situation (a) requires the model to learn some sort of scale invariance to make crops A and B similar in latent space, situation (b) is more challenging since the model needs to recognize an object beyond its limited view. +# However, without color distortion, there is a loophole that the model can exploit, namely that different crops of the same image usually look very similar in color space. +# Consider the picture of the dog above. +# Simply from the color of the fur and the green color tone of the background, you can reason that two patches belong to the same image without actually recognizing the dog in the picture. +# In this case, the model might end up focusing only on the color histograms of the images, and ignore other more generalizable features. +# If, however, we distort the colors in the two patches randomly and independently of each other, the model cannot rely on this simple feature anymore. +# Hence, by combining random cropping and color distortions, the model can only match two patches by learning generalizable representations. +# +# Overall, for our experiments, we apply a set of 5 transformations following the original SimCLR setup: random horizontal flip, crop-and-resize, color distortion, random grayscale, and gaussian blur. +# In comparison to the [original implementation](https://github.com/google-research/simclr), we reduce the effect of the color jitter slightly (0.5 instead of 0.8 for brightness, contrast, and saturation, and 0.1 instead of 0.2 for hue). +# In our experiments, this setting obtained better performance and was faster and more stable to train. +# If, for instance, the brightness scale highly varies in a dataset, the +# original settings can be more beneficial since the model can't rely on +# this information anymore to distinguish between images. 
# %%
# Augmentation pipeline; ContrastiveTransformations calls it once per view
contrast_transforms = transforms.Compose(
    transforms=[
        transforms.RandomHorizontalFlip(p=0.5),
        transforms.RandomResizedCrop(size=96),
        # Color distortion is applied to 80% of the views
        transforms.RandomApply(
            transforms=[transforms.ColorJitter(brightness=0.5, contrast=0.5, saturation=0.5, hue=0.1)],
            p=0.8,
        ),
        transforms.RandomGrayscale(p=0.2),
        transforms.GaussianBlur(kernel_size=9),
        transforms.ToTensor(),
        transforms.Normalize(mean=(0.5,), std=(0.5,)),
    ]
)

# %% [markdown]
# After discussing the data augmentation techniques, we can now focus on the dataset.
# In this tutorial, we will use the [STL10 dataset](https://cs.stanford.edu/~acoates/stl10/), which, similarly to CIFAR10, contains images of 10 classes: airplane, bird, car, cat, deer, dog, horse, monkey, ship, truck.
# However, the images have a higher resolution, namely $96\times 96$ pixels, and we are only provided with 500 labeled images per class.
# Additionally, we have a much larger set of $100,000$ unlabeled images which are similar to the training images but are sampled from a wider range of animals and vehicles.
# This makes the dataset ideal to showcase the benefits that self-supervised learning offers.
#
# Luckily, the STL10 dataset is provided through torchvision.
# Keep in mind, however, that since this dataset is relatively large and has a considerably higher resolution than CIFAR10, it requires more disk space (~3GB) and takes a bit of time to download.
# For our initial discussion of self-supervised learning and SimCLR, we
# will create two data loaders with our contrastive transformations above:
# the `unlabeled_data` will be used to train our model via contrastive
# learning, and `train_data_contrast` will be used as a validation set in
# contrastive learning.
# %%
# Both splits share every setting except the split name; each one gets its own
# two-view contrastive transformation wrapper.
unlabeled_data, train_data_contrast = (
    STL10(
        root=DATASET_PATH,
        split=split_name,
        download=True,
        transform=ContrastiveTransformations(contrast_transforms, n_views=2),
    )
    for split_name in ("unlabeled", "train")
)

# %% [markdown]
# Finally, before starting with our implementation of SimCLR, let's look
# at some example image pairs sampled with our augmentations:

# %%
# Visualize some examples
L.seed_everything(42)
NUM_IMAGES = 6
# Every dataset item carries a list of augmented views; flatten them into one batch
imgs = torch.stack(
    [view for idx in range(NUM_IMAGES) for view in unlabeled_data[idx][0]],
    dim=0,
)
# make_grid returns channels first; matplotlib expects channels last
img_grid = torchvision.utils.make_grid(imgs, nrow=6, normalize=True, pad_value=0.9).permute(1, 2, 0)

plt.figure(figsize=(10, 5))
plt.title("Augmented image examples of the STL10 dataset")
plt.imshow(img_grid)
plt.axis("off")
plt.show()
plt.close()

# %% [markdown]
# We see the wide variety of our data augmentation, including randomly cropping, grayscaling, gaussian blur, and color distortion.
# Thus, it remains a challenging task for the model to match two, independently augmented patches of the same image.

# %% [markdown]
# ### SimCLR implementation
#
# Using the data loader pipeline above, we can now implement SimCLR.
# At each iteration, we get for every image $x$ two differently augmented versions, which we refer to as $\tilde{x}_i$ and $\tilde{x}_j$.
# Both of these images are encoded into a one-dimensional feature vector, between which we want to maximize similarity while minimizing it to all other images in the batch.
# The encoder network is split into two parts: a base encoder network $f(\cdot)$, and a projection head $g(\cdot)$.
# The base network is usually a deep CNN as we have seen in e.g.
[Tutorial 5](https://uvadlc-notebooks.readthedocs.io/en/latest/tutorial_notebooks/tutorial5/Inception_ResNet_DenseNet.html) before, and is responsible for extracting a representation vector from the augmented data examples. +# In our experiments, we will use the common ResNet-18 architecture as $f(\cdot)$, and refer to the output as $f(\tilde{x}_i)=h_i$. +# The projection head $g(\cdot)$ maps the representation $h$ into a space where we apply the contrastive loss, i.e., compare similarities between vectors. +# It is often chosen to be a small MLP with non-linearities, and for simplicity, we follow the original SimCLR paper setup by defining it as a two-layer MLP with ReLU activation in the hidden layer. +# Note that in the follow-up paper, [SimCLRv2](https://arxiv.org/abs/2006.10029), the authors mention that larger/wider MLPs can boost the performance considerably. +# This is why we apply an MLP with four times larger hidden dimensions, but deeper MLPs were shown to overfit on the given dataset. +# The general setup is visualized below (figure credit - [Ting Chen et al.](https://arxiv.org/abs/2006.10029)): +# +#
+# +# After finishing the training with contrastive learning, we will remove the projection head $g(\cdot)$, and use $f(\cdot)$ as a pretrained feature extractor. +# The representations $z$ that come out of the projection head $g(\cdot)$ have been shown to perform worse than those of the base network $f(\cdot)$ when finetuning the network for a new task. +# This is likely because the representations $z$ are trained to become invariant to many features like the color that can be important for downstream tasks. +# Thus, $g(\cdot)$ is only needed for the contrastive learning stage. +# +# Now that the architecture is described, let's take a closer look at how we train the model. +# As mentioned before, we want to maximize the similarity between the representations of the two augmented versions of the same image, i.e., $z_i$ and $z_j$ in the figure above, while minimizing it to all other examples in the batch. +# SimCLR thereby applies the InfoNCE loss, originally proposed by [Aaron van den Oord et al. ](https://arxiv.org/abs/1807.03748) for contrastive learning. +# In short, the InfoNCE loss compares the similarity of $z_i$ and $z_j$ to the similarity of $z_i$ to any other representation in the batch by performing a softmax over the similarity values. +# The loss can be formally written as: +# $$ +# \ell_{i,j}=-\log \frac{\exp(\text{sim}(z_i,z_j)/\tau)}{\sum_{k=1}^{2N}\mathbb{1}_{[k\neq i]}\exp(\text{sim}(z_i,z_k)/\tau)}=-\text{sim}(z_i,z_j)/\tau+\log\left[\sum_{k=1}^{2N}\mathbb{1}_{[k\neq i]}\exp(\text{sim}(z_i,z_k)/\tau)\right] +# $$ +# The function $\text{sim}$ is a similarity metric, and the hyperparameter $\tau$ is called temperature determining how peaked the distribution is. +# Since many similarity metrics are bounded, the temperature parameter allows us to balance the influence of many dissimilar image patches versus one similar patch. 
# %%
class SimCLR(L.LightningModule):
    """SimCLR: a ResNet-18 encoder f(.) with an MLP projection head g(.), trained with the InfoNCE loss.

    Args:
        hidden_dim: Output size of the projection head. Its hidden layer is ``4 * hidden_dim`` wide.
        lr: Initial learning rate for AdamW; the cosine schedule anneals it down to ``lr / 50``.
        temperature: Temperature dividing the cosine similarities in the loss. Must be positive.
        weight_decay: Weight decay for AdamW.
        max_epochs: ``T_max`` of the cosine annealing schedule.
    """

    def __init__(self, hidden_dim, lr, temperature, weight_decay, max_epochs=500):
        super().__init__()
        self.save_hyperparameters()
        assert self.hparams.temperature > 0.0, "The temperature must be a positive float!"
        # Base model f(.)
        # No pretrained weights are requested: random initialisation is the default. The deprecated
        # `pretrained=False` flag is deliberately omitted so that no deprecation warning is raised.
        # `num_classes` is the output size of the last linear layer.
        self.convnet = torchvision.models.resnet18(num_classes=4 * hidden_dim)
        # The MLP for g(.) consists of Linear->ReLU->Linear
        self.convnet.fc = nn.Sequential(
            self.convnet.fc,  # Linear(ResNet output, 4*hidden_dim)
            nn.ReLU(inplace=True),
            nn.Linear(4 * hidden_dim, hidden_dim),
        )

    def configure_optimizers(self):
        """Return AdamW together with a cosine-annealing learning-rate schedule."""
        optimizer = optim.AdamW(self.parameters(), lr=self.hparams.lr, weight_decay=self.hparams.weight_decay)
        lr_scheduler = optim.lr_scheduler.CosineAnnealingLR(
            optimizer, T_max=self.hparams.max_epochs, eta_min=self.hparams.lr / 50
        )
        return [optimizer], [lr_scheduler]

    def info_nce_loss(self, batch, mode="train"):
        """Compute the InfoNCE loss for a batch and log the loss plus ranking metrics.

        Args:
            batch: Pair ``(imgs, _)``. ``imgs`` is a sequence of image tensors that is concatenated
                along dim 0; the second element is ignored.
                NOTE(review): the positive-pair lookup below assumes exactly two views per image,
                concatenated view-by-view -- confirm against the data pipeline.
            mode: Prefix for the logged metric names (e.g. ``"train"`` or ``"val"``).

        Returns:
            The mean negative log-likelihood over all rows of the similarity matrix.
        """
        imgs, _ = batch
        imgs = torch.cat(imgs, dim=0)

        # Encode all images
        feats = self.convnet(imgs)
        # Pairwise cosine similarity between every two feature vectors (square matrix)
        cos_sim = F.cosine_similarity(feats[:, None, :], feats[None, :, :], dim=-1)
        # Mask out cosine similarity to itself
        self_mask = torch.eye(cos_sim.shape[0], dtype=torch.bool, device=cos_sim.device)
        cos_sim.masked_fill_(self_mask, -9e15)
        # Find positive example -> batch_size//2 away from the original example
        pos_mask = self_mask.roll(shifts=cos_sim.shape[0] // 2, dims=0)
        # InfoNCE loss
        cos_sim = cos_sim / self.hparams.temperature
        nll = -cos_sim[pos_mask] + torch.logsumexp(cos_sim, dim=-1)
        nll = nll.mean()

        # Logging loss
        self.log(mode + "_loss", nll)
        # Get ranking position of positive example: column 0 holds the positive similarity, the
        # remaining columns hold all similarities with the positive entry masked out.
        comb_sim = torch.cat(
            [cos_sim[pos_mask][:, None], cos_sim.masked_fill(pos_mask, -9e15)],  # First position positive example
            dim=-1,
        )
        # Position of column 0 in the descending ordering, i.e. the rank of the positive (0 = best)
        sim_argsort = comb_sim.argsort(dim=-1, descending=True).argmin(dim=-1)
        # Logging ranking metrics
        self.log(mode + "_acc_top1", (sim_argsort == 0).float().mean())
        self.log(mode + "_acc_top5", (sim_argsort < 5).float().mean())
        self.log(mode + "_acc_mean_pos", 1 + sim_argsort.float().mean())

        return nll

    def training_step(self, batch, batch_idx):
        """Return the InfoNCE loss, logged under the ``train`` prefix."""
        return self.info_nce_loss(batch, mode="train")

    def validation_step(self, batch, batch_idx):
        """Log the InfoNCE loss and ranking metrics under the ``val`` prefix."""
        self.info_nce_loss(batch, mode="val")
# %%
def train_simclr(batch_size, max_epochs=500, **kwargs):
    """Return a SimCLR model, loaded from a pretrained checkpoint if one exists, otherwise freshly trained.

    Args:
        batch_size: Batch size for both the training and the validation loader.
        max_epochs: Maximum number of training epochs; also forwarded to the model.
        **kwargs: Remaining ``SimCLR`` constructor arguments.

    Returns:
        The pretrained model, or the best checkpoint (by ``val_acc_top5``) of the new training run.
    """
    checkpoint_cb = ModelCheckpoint(save_weights_only=True, mode="max", monitor="val_acc_top5")
    lr_monitor_cb = LearningRateMonitor("epoch")
    trainer = L.Trainer(
        default_root_dir=os.path.join(CHECKPOINT_PATH, "SimCLR"),
        accelerator="auto",
        devices=1,
        max_epochs=max_epochs,
        callbacks=[checkpoint_cb, lr_monitor_cb],
    )
    # Optional logging argument that we don't need
    trainer.logger._default_hp_metric = None

    # A pretrained checkpoint short-circuits training entirely.
    pretrained_filename = os.path.join(CHECKPOINT_PATH, "SimCLR.ckpt")
    if os.path.isfile(pretrained_filename):
        print(f"Found pretrained model at {pretrained_filename}, loading...")
        # The hyperparameters are restored from the checkpoint itself
        return SimCLR.load_from_checkpoint(pretrained_filename)

    # Settings common to both loaders
    shared_loader_args = dict(batch_size=batch_size, pin_memory=True, num_workers=NUM_WORKERS)
    train_loader = data.DataLoader(unlabeled_data, shuffle=True, drop_last=True, **shared_loader_args)
    val_loader = data.DataLoader(train_data_contrast, shuffle=False, drop_last=False, **shared_loader_args)

    L.seed_everything(42)  # For reproducibility
    fresh_model = SimCLR(max_epochs=max_epochs, **kwargs)
    trainer.fit(fresh_model, train_loader, val_loader)
    # Hand back the best checkpoint rather than the last training state
    return SimCLR.load_from_checkpoint(trainer.checkpoint_callback.best_model_path)
![tensorboard simclr](tensorboard_simclr.png){width="1200px"}
+# +# One thing to note is that contrastive learning benefits a lot from long training. +# The plot shown above is from a training run that took approx. +# 1 day on an NVIDIA TitanRTX. +# Training the model for even longer might reduce its loss further, but we did not experience any gains from it for the downstream task on image classification. +# In general, contrastive learning can also benefit from using larger models, if sufficient unlabeled data is available. + +# %% [markdown] +# ## Logistic Regression +# +#
+# After we have trained our model via contrastive learning, we can deploy it on downstream tasks and see how well it performs with little data. +# A common setup, which also verifies whether the model has learned generalized representations, is to perform Logistic Regression on the features. +# In other words, we learn a single, linear layer that maps the representations to a class prediction. +# Since the base network $f(\cdot)$ is not changed during the training process, the model can only perform well if the representations of $h$ describe all features that might be necessary for the task. +# Further, we do not have to worry too much about overfitting since we have very few parameters that are trained. +# Hence, we might expect that the model can perform well even with very little data. +# +# First, let's implement a simple Logistic Regression setup for which we assume that the images already have been encoded in their feature vectors. +# If very little data is available, it might be beneficial to dynamically encode the images during training so that we can also apply data augmentations. +# However, the way we implement it here is much more efficient and can be trained within a few seconds. +# Further, using data augmentations did not show any significant gain in this simple setup. 
# %%
class LogisticRegression(L.LightningModule):
    """A single linear layer trained with cross-entropy on precomputed feature vectors.

    Args:
        feature_dim: Size of each input feature vector.
        num_classes: Number of output classes.
        lr: Initial learning rate for AdamW.
        weight_decay: Weight decay for AdamW.
        max_epochs: Training length; the learning rate drops by 10x at 60% and 80% of it.
    """

    def __init__(self, feature_dim, num_classes, lr, weight_decay, max_epochs=100):
        super().__init__()
        self.save_hyperparameters()
        # Linear map from a representation h to class logits
        self.model = nn.Linear(feature_dim, num_classes)

    def configure_optimizers(self):
        """Return AdamW together with a two-milestone step schedule."""
        hp = self.hparams
        optimizer = optim.AdamW(self.parameters(), lr=hp.lr, weight_decay=hp.weight_decay)
        decay_epochs = [int(hp.max_epochs * 0.6), int(hp.max_epochs * 0.8)]
        scheduler = optim.lr_scheduler.MultiStepLR(optimizer, milestones=decay_epochs, gamma=0.1)
        return [optimizer], [scheduler]

    def _calculate_loss(self, batch, mode="train"):
        """Compute cross-entropy and accuracy for ``batch``, log both under ``mode``, and return the loss."""
        feats, labels = batch
        logits = self.model(feats)
        loss = F.cross_entropy(logits, labels)
        is_correct = logits.argmax(dim=-1) == labels
        acc = is_correct.float().mean()

        self.log(mode + "_loss", loss)
        self.log(mode + "_acc", acc)
        return loss

    def training_step(self, batch, batch_idx):
        return self._calculate_loss(batch, mode="train")

    def validation_step(self, batch, batch_idx):
        self._calculate_loss(batch, mode="val")

    def test_step(self, batch, batch_idx):
        self._calculate_loss(batch, mode="test")
# %%
@torch.no_grad()
def prepare_data_features(model, dataset):
    """Encode every image of ``dataset`` with the model's base network and return the features as a dataset.

    Args:
        model: Object whose ``convnet`` attribute is the encoder including the projection head ``fc``.
        dataset: Dataset yielding ``(image, label)`` pairs.

    Returns:
        A ``TensorDataset`` of ``(features, labels)`` on the CPU, ordered by ascending label.
    """
    # Work on a copy so that the caller's model keeps its projection head
    encoder = deepcopy(model.convnet)
    encoder.fc = nn.Identity()  # Drop the projection head g(.)
    encoder.eval()
    encoder.to(device)

    loader = data.DataLoader(dataset, batch_size=64, num_workers=NUM_WORKERS, shuffle=False, drop_last=False)
    feat_chunks, label_chunks = [], []
    for batch_imgs, batch_labels in tqdm(loader):
        encoded = encoder(batch_imgs.to(device))
        feat_chunks.append(encoded.detach().cpu())
        label_chunks.append(batch_labels)

    all_feats = torch.cat(feat_chunks, dim=0)
    all_labels = torch.cat(label_chunks, dim=0)

    # Group the samples by class: sort the labels and reorder the features to match
    sorted_labels, order = all_labels.sort()
    return data.TensorDataset(all_feats[order], sorted_labels)
# %%
def train_logreg(batch_size, train_feats_data, test_feats_data, model_suffix, max_epochs=100, **kwargs):
    """Train (or load) a logistic regression model on precomputed features and evaluate it.

    Args:
        batch_size: Batch size for both loaders.
        train_feats_data: Dataset of training features and labels.
        test_feats_data: Dataset of test features and labels; also used for validation during fitting.
        model_suffix: Suffix of the pretrained checkpoint name ``LogisticRegression_<suffix>.ckpt``.
        max_epochs: Maximum number of training epochs for the trainer.
        **kwargs: ``LogisticRegression`` constructor arguments.

    Returns:
        Tuple ``(model, result)`` where ``result`` maps ``"train"`` and ``"test"`` to accuracies.
    """

    def _make_loader(dataset, shuffle):
        # The features already live in memory, so no worker processes are needed
        return data.DataLoader(
            dataset, batch_size=batch_size, shuffle=shuffle, drop_last=False, pin_memory=True, num_workers=0
        )

    checkpoint_cb = ModelCheckpoint(save_weights_only=True, mode="max", monitor="val_acc")
    trainer = L.Trainer(
        default_root_dir=os.path.join(CHECKPOINT_PATH, "LogisticRegression"),
        accelerator="auto",
        devices=1,
        max_epochs=max_epochs,
        callbacks=[checkpoint_cb, LearningRateMonitor("epoch")],
        enable_progress_bar=False,
        check_val_every_n_epoch=10,
    )
    trainer.logger._default_hp_metric = None

    train_loader = _make_loader(train_feats_data, shuffle=True)
    test_loader = _make_loader(test_feats_data, shuffle=False)

    # Reuse a pretrained checkpoint when available, otherwise train from scratch
    pretrained_filename = os.path.join(CHECKPOINT_PATH, f"LogisticRegression_{model_suffix}.ckpt")
    if not os.path.isfile(pretrained_filename):
        L.seed_everything(42)  # For reproducibility
        model = LogisticRegression(**kwargs)
        trainer.fit(model, train_loader, test_loader)
        model = LogisticRegression.load_from_checkpoint(trainer.checkpoint_callback.best_model_path)
    else:
        print(f"Found pretrained model at {pretrained_filename}, loading...")
        model = LogisticRegression.load_from_checkpoint(pretrained_filename)

    # Evaluate the selected model on the training loader first, then on the test loader
    train_result = trainer.test(model, dataloaders=train_loader, verbose=False)
    test_result = trainer.test(model, dataloaders=test_loader, verbose=False)
    result = {"train": train_result[0]["test_acc"], "test": test_result[0]["test_acc"]}

    return model, result
# %%
def get_smaller_dataset(original_dataset, num_imgs_per_label, num_classes=10):
    """Return a sub-dataset that keeps only the first ``num_imgs_per_label`` samples of each class.

    The tensors of ``original_dataset`` must be sorted by label and hold the same number of samples
    for every class, so that samples of class ``c`` occupy one contiguous, equally sized block.

    Args:
        original_dataset: ``TensorDataset`` whose tensors all share the same first dimension.
        num_imgs_per_label: Number of samples to keep per class. Values larger than the class size
            keep the whole class.
        num_classes: Number of classes, i.e. of equally sized label blocks. The per-class sample
            count is inferred from the data instead of being fixed to 500.

    Returns:
        A new ``TensorDataset`` with ``num_classes * min(num_imgs_per_label, class size)`` samples.

    Raises:
        RuntimeError: Raised by ``unflatten`` if the number of samples is not divisible by ``num_classes``.
    """
    new_dataset = data.TensorDataset(
        # (N, ...) -> (num_classes, N // num_classes, ...), cut every class block, then flatten back.
        *(
            t.unflatten(0, (num_classes, -1))[:, :num_imgs_per_label].flatten(0, 1)
            for t in original_dataset.tensors
        )
    )
    return new_dataset
# %%
# Plot the test accuracy against the number of labeled images per class.
# Iterating a dict yields its keys, so `sorted(results)` needs no generator wrapper.
dataset_sizes = sorted(results)
test_scores = [results[k]["test"] for k in dataset_sizes]

fig = plt.figure(figsize=(6, 4))
plt.plot(
    dataset_sizes,
    test_scores,
    "--",
    color="#000",
    marker="*",
    markeredgecolor="#000",
    markerfacecolor="y",
    markersize=16,
)
# The dataset sizes grow roughly geometrically, hence the logarithmic x-axis with explicit ticks
plt.xscale("log")
plt.xticks(dataset_sizes, labels=dataset_sizes)
plt.title("STL10 classification over dataset size", fontsize=14)
plt.xlabel("Number of images per class")
plt.ylabel("Test accuracy")
plt.minorticks_off()
plt.show()

for k, score in zip(dataset_sizes, test_scores):
    print(f"Test accuracy for {k:3d} images per label: {100*score:4.2f}%")
# %%
class ResNet(L.LightningModule):
    """Supervised baseline: a randomly initialised ResNet-18 trained with cross-entropy.

    Args:
        num_classes: Number of output classes (size of the final linear layer).
        lr: Initial learning rate for AdamW.
        weight_decay: Weight decay for AdamW.
        max_epochs: Training length; the learning rate drops by 10x at 70% and 90% of it.
    """

    def __init__(self, num_classes, lr, weight_decay, max_epochs=100):
        super().__init__()
        self.save_hyperparameters()
        # No pretrained weights are requested: random initialisation is the default. The deprecated
        # `pretrained=False` flag is deliberately omitted so that no deprecation warning is raised.
        self.model = torchvision.models.resnet18(num_classes=num_classes)

    def configure_optimizers(self):
        """Return AdamW together with a two-milestone step schedule."""
        optimizer = optim.AdamW(self.parameters(), lr=self.hparams.lr, weight_decay=self.hparams.weight_decay)
        lr_scheduler = optim.lr_scheduler.MultiStepLR(
            optimizer, milestones=[int(self.hparams.max_epochs * 0.7), int(self.hparams.max_epochs * 0.9)], gamma=0.1
        )
        return [optimizer], [lr_scheduler]

    def _calculate_loss(self, batch, mode="train"):
        """Compute cross-entropy and accuracy for ``batch``, log both under ``mode``, and return the loss."""
        imgs, labels = batch
        preds = self.model(imgs)
        loss = F.cross_entropy(preds, labels)
        acc = (preds.argmax(dim=-1) == labels).float().mean()

        self.log(mode + "_loss", loss)
        self.log(mode + "_acc", acc)
        return loss

    def training_step(self, batch, batch_idx):
        """Return the training loss so that the trainer can optimise it."""
        return self._calculate_loss(batch, mode="train")

    def validation_step(self, batch, batch_idx):
        """Log validation loss and accuracy."""
        self._calculate_loss(batch, mode="val")

    def test_step(self, batch, batch_idx):
        """Log test loss and accuracy."""
        self._calculate_loss(batch, mode="test")
# %%
def train_resnet(batch_size, max_epochs=100, **kwargs):
    """Train (or load) the supervised ResNet baseline and evaluate it.

    Args:
        batch_size: Batch size for both loaders.
        max_epochs: Maximum number of training epochs for the trainer.
        **kwargs: ``ResNet`` constructor arguments.

    Returns:
        Tuple ``(model, result)`` where ``result`` maps ``"train"`` and ``"test"`` to accuracies.
    """
    trainer = L.Trainer(
        default_root_dir=os.path.join(CHECKPOINT_PATH, "ResNet"),
        accelerator="auto",
        devices=1,
        max_epochs=max_epochs,
        callbacks=[
            ModelCheckpoint(save_weights_only=True, mode="max", monitor="val_acc"),
            LearningRateMonitor("epoch"),
        ],
        check_val_every_n_epoch=2,
    )
    trainer.logger._default_hp_metric = None

    # Data loaders
    train_loader = data.DataLoader(
        train_img_aug_data,
        batch_size=batch_size,
        shuffle=True,
        drop_last=True,
        pin_memory=True,
        num_workers=NUM_WORKERS,
    )
    test_loader = data.DataLoader(
        test_img_data, batch_size=batch_size, shuffle=False, drop_last=False, pin_memory=True, num_workers=NUM_WORKERS
    )

    # Check whether pretrained model exists. If yes, load it and skip training
    pretrained_filename = os.path.join(CHECKPOINT_PATH, "ResNet.ckpt")
    if os.path.isfile(pretrained_filename):
        # f-string for consistency with the other training functions; the printed text is unchanged
        print(f"Found pretrained model at {pretrained_filename}, loading...")
        model = ResNet.load_from_checkpoint(pretrained_filename)
    else:
        L.seed_everything(42)  # For reproducibility
        model = ResNet(**kwargs)
        # The test loader doubles as the validation loader during fitting
        trainer.fit(model, train_loader, test_loader)
        model = ResNet.load_from_checkpoint(trainer.checkpoint_callback.best_model_path)

    # Evaluate the selected model on the (augmented) training loader and on the test loader
    train_result = trainer.test(model, dataloaders=train_loader, verbose=False)
    val_result = trainer.test(model, dataloaders=test_loader, verbose=False)
    result = {"train": train_result[0]["test_acc"], "test": val_result[0]["test_acc"]}

    return model, result
](https://arxiv.org/abs/2006.10029) showed similar trends for larger datasets like ImageNet. +# Besides the discussed hyperparameters, the size of the model seems to be important in contrastive learning as well. +# If a lot of unlabeled data is available, larger models can achieve much stronger results and come close to their supervised baselines. +# Further, there are also approaches for combining contrastive and supervised learning, leading to performance gains beyond supervision (see [Khosla et al.](https://arxiv.org/abs/2004.11362)). +# Moreover, contrastive learning is not the only approach to self-supervised learning that has come up in the last two years and showed great results. +# Other methods include distillation-based methods like [BYOL](https://arxiv.org/abs/2006.07733) and redundancy reduction techniques like [Barlow Twins](https://arxiv.org/abs/2103.03230). +# There is a lot more to explore in the self-supervised domain, and more, impressive steps ahead are to be expected. +# +# ### References +# +# [1] Chen, T., Kornblith, S., Norouzi, M., and Hinton, G. (2020). +# A simple framework for contrastive learning of visual representations. +# In International conference on machine learning (pp. +# 1597-1607). +# PMLR. +# ([link](https://arxiv.org/abs/2002.05709)) +# +# [2] Chen, T., Kornblith, S., Swersky, K., Norouzi, M., and Hinton, G. (2020). +# Big self-supervised models are strong semi-supervised learners. +# NeurIPS 2021 ([link](https://arxiv.org/abs/2006.10029)). +# +# [3] Oord, A. V. D., Li, Y., and Vinyals, O. +# (2018). +# Representation learning with contrastive predictive coding. +# arXiv preprint arXiv:1807.03748. +# ([link](https://arxiv.org/abs/1807.03748)) +# +# [4] Grill, J.B., Strub, F., Altché, F., Tallec, C., Richemond, P.H., Buchatskaya, E., Doersch, C., Pires, B.A., Guo, Z.D., Azar, M.G. +# and Piot, B. +# (2020). +# Bootstrap your own latent: A new approach to self-supervised learning. +# arXiv preprint arXiv:2006.07733. 
+# ([link](https://arxiv.org/abs/2006.07733)) +# +# [5] Khosla, P., Teterwak, P., Wang, C., Sarna, A., Tian, Y., Isola, P., Maschinot, A., Liu, C. and Krishnan, D. (2020). +# Supervised contrastive learning. +# arXiv preprint arXiv:2004.11362. +# ([link](https://arxiv.org/abs/2004.11362)) +# +# [6] Zbontar, J., Jing, L., Misra, I., LeCun, Y. and Deny, S. (2021). +# Barlow twins: Self-supervised learning via redundancy reduction. +# arXiv preprint arXiv:2103.03230. +# ([link](https://arxiv.org/abs/2103.03230)) diff --git a/_notebooks/course_UvA-DL/13-contrastive-learning/crop_views.svg b/_notebooks/course_UvA-DL/13-contrastive-learning/crop_views.svg new file mode 100644 index 0000000..6ea2ba9 --- /dev/null +++ b/_notebooks/course_UvA-DL/13-contrastive-learning/crop_views.svg @@ -0,0 +1 @@ + diff --git a/_notebooks/course_UvA-DL/13-contrastive-learning/simclr_contrastive_learning.png b/_notebooks/course_UvA-DL/13-contrastive-learning/simclr_contrastive_learning.png new file mode 100644 index 0000000..622b411 Binary files /dev/null and b/_notebooks/course_UvA-DL/13-contrastive-learning/simclr_contrastive_learning.png differ diff --git a/_notebooks/course_UvA-DL/13-contrastive-learning/simclr_data_augmentations.jpg b/_notebooks/course_UvA-DL/13-contrastive-learning/simclr_data_augmentations.jpg new file mode 100644 index 0000000..57a440c Binary files /dev/null and b/_notebooks/course_UvA-DL/13-contrastive-learning/simclr_data_augmentations.jpg differ diff --git a/_notebooks/course_UvA-DL/13-contrastive-learning/simclr_network_setup.svg b/_notebooks/course_UvA-DL/13-contrastive-learning/simclr_network_setup.svg new file mode 100644 index 0000000..687a62d --- /dev/null +++ b/_notebooks/course_UvA-DL/13-contrastive-learning/simclr_network_setup.svg @@ -0,0 +1,228 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + 
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/_notebooks/course_UvA-DL/13-contrastive-learning/tensorboard_simclr.png b/_notebooks/course_UvA-DL/13-contrastive-learning/tensorboard_simclr.png new file mode 100644 index 0000000..bfe6859 Binary files /dev/null and b/_notebooks/course_UvA-DL/13-contrastive-learning/tensorboard_simclr.png differ diff --git a/_notebooks/flash_tutorials/electricity_forecasting/.meta.yml b/_notebooks/flash_tutorials/electricity_forecasting/.meta.yml new file mode 100644 index 0000000..ab165e1 --- /dev/null +++ b/_notebooks/flash_tutorials/electricity_forecasting/.meta.yml @@ -0,0 +1,24 @@ +title: Electricity Price Forecasting with N-BEATS +author: Ethan Harris (ethan@pytorchlightning.ai) +created: 2021-11-23 +updated: 2021-12-16 +license: CC BY-SA +build: 3 +tags: + - Tabular + - Forecasting + - Timeseries +description: | + This tutorial covers using Lightning Flash and it's integration with PyTorch Forecasting to train an autoregressive + model (N-BEATS) on hourly electricity pricing data. We show how the built-in interpretability tools from PyTorch + Forecasting can be used with Flash to plot the trend and daily seasonality in our data discovered by the model. We + also cover how features from PyTorch Lightning such as the learning rate finder can be used easily with Flash. As a + bonus, we show hat we can resample daily observations from the data to discover weekly trends instead. 
+requirements: + - pandas==1.1.5 + - lightning-flash[tabular]>=0.6.0 + - pytorch-lightning==1.3.6 # todo: update to latest + - numpy<1.24 +accelerator: + - GPU + - CPU diff --git a/_notebooks/flash_tutorials/electricity_forecasting/.thumb.svg b/_notebooks/flash_tutorials/electricity_forecasting/.thumb.svg new file mode 100644 index 0000000..3f8037e --- /dev/null +++ b/_notebooks/flash_tutorials/electricity_forecasting/.thumb.svg @@ -0,0 +1 @@ + diff --git a/_notebooks/flash_tutorials/electricity_forecasting/diagram.png b/_notebooks/flash_tutorials/electricity_forecasting/diagram.png new file mode 100644 index 0000000..47120db Binary files /dev/null and b/_notebooks/flash_tutorials/electricity_forecasting/diagram.png differ diff --git a/_notebooks/flash_tutorials/electricity_forecasting/electricity_forecasting.py b/_notebooks/flash_tutorials/electricity_forecasting/electricity_forecasting.py new file mode 100644 index 0000000..621cd30 --- /dev/null +++ b/_notebooks/flash_tutorials/electricity_forecasting/electricity_forecasting.py @@ -0,0 +1,311 @@ +# %% [markdown] +# In this tutorial we'll look at using [Lightning Flash](https://github.com/Lightning-AI/lightning-flash) and it's +# integration with [PyTorch Forecasting](https://github.com/jdb78/pytorch-forecasting) for autoregressive modelling of +# electricity prices using [the N-BEATS model](https://arxiv.org/abs/1905.10437). +# We'll start by using N-BEATS to uncover daily patterns (seasonality) from hourly observations and then show how we can +# resample daily averages to uncover weekly patterns too. +# +# Along the way, we'll see how the built-in tools from PyTorch Lightning, like the learning rate finder, can be used +# seamlessly with Flash to help make the process of putting a model together as smooth as possible. 
+ +# %% + +import os +from typing import Any, Dict + +import flash +import matplotlib.pyplot as plt +import pandas as pd +import torch +from flash.core.data.utils import download_data +from flash.core.integrations.pytorch_forecasting import convert_predictions +from flash.tabular.forecasting import TabularForecaster, TabularForecastingData + +DATASET_PATH = os.environ.get("PATH_DATASETS", "data/") + +# %% [markdown] +# ## Loading the data +# +# We'll use the Spanish hourly energy demand generation and weather data set from Kaggle: +# https://www.kaggle.com/nicholasjhana/energy-consumption-generation-prices-and-weather +# +# First, download the data: + +# %% +download_data("https://pl-flash-data.s3.amazonaws.com/kaggle_electricity.zip", DATASET_PATH) + +# %% [markdown] +# ## Data loading +# +# To load the data, we start by loading the CSV file into a pandas DataFrame: + +# %% +df_energy_hourly = pd.read_csv(f"{DATASET_PATH}/energy_dataset.csv", parse_dates=["time"]) + +# %% [markdown] +# Before we can load the data into Flash, there are a few preprocessing steps we need to take. +# The first preprocessing step is to set the `time` field as the index (formatted as a datetime). +# The second step is to resample the data to the desired frequency in case it is different from the desired observation +# frequency. +# Since we are performing autoregressive modelling, we can remove all columns except for `"price actual"`. +# +# For the third preprocessing step, we need to create a "time_idx" column. +# The "time_idx" column should contain integers corresponding to the observation index (e.g. in our case the difference +# between two "time_idx" values is the number of hours between the observations). +# To do this we convert the datetime to an index by taking the nanoseconds value and dividing by the number of +# nanoseconds in a single unit of our chosen frequency. +# We then subtract the minimum value so it starts at zero (although it would still work without this step). 
def preprocess(df: pd.DataFrame, frequency: str = "1H") -> pd.DataFrame:
    """Turn the raw energy table into a single-series frame ready for forecasting.

    The ``time`` column is parsed as UTC timestamps and used as the index, the
    ``"price actual"`` column is averaged over bins of width ``frequency``, and
    two helper columns are added: ``time_idx`` (number of ``frequency`` steps
    since the first bin, starting at zero) and ``constant`` (always ``0``, so
    that every row carries the same group id).

    Args:
        df: Frame with a ``time`` column and, normally, a ``"price actual"``
            column. It is not modified; a new frame is returned.
        frequency: Fixed-width offset alias used both for resampling and as the
            ``time_idx`` step, so it must also be accepted by ``pd.Timedelta``.

    Returns:
        A new frame indexed by the resampled UTC timestamps with the columns
        ``"price actual"``, ``time_idx`` and ``constant``.
    """
    # ``assign`` works on a copy, so the caller's frame keeps its ``time`` column.
    frame = df.assign(time=pd.to_datetime(df["time"], utc=True)).set_index("time")

    # Select the target before averaging so non-numeric columns never reach ``mean``.
    frame = frame.filter(["price actual"]).resample(frequency).mean()

    # Whole steps elapsed since the first bin. Floor-dividing timedeltas keeps the
    # arithmetic in integers and does not depend on how timestamps are stored.
    elapsed = frame.index - frame.index.min()
    frame["time_idx"] = (elapsed // pd.Timedelta(frequency)).astype("int64")

    frame["constant"] = 0

    return frame
+ +# %% +max_prediction_length = 24 +max_encoder_length = 24 * 2 + +training_cutoff = df_energy_hourly["time_idx"].max() - max_prediction_length + +datamodule = TabularForecastingData.from_data_frame( + time_idx="time_idx", + target="price actual", + group_ids=["constant"], + max_encoder_length=max_encoder_length, + max_prediction_length=max_prediction_length, + time_varying_unknown_reals=["price actual"], + train_data_frame=df_energy_hourly[df_energy_hourly["time_idx"] <= training_cutoff], + val_data_frame=df_energy_hourly, + batch_size=256, +) + +# %% [markdown] +# ## Creating the Flash Task +# +# Now, we're ready to create a `TabularForecaster`. +# The N-BEATS model has two primary hyper-parameters:`"widths"`, and `"backcast_loss_ratio"`. +# In the [PyTorch Forecasting Documentation](https://pytorch-forecasting.readthedocs.io/en/latest/api/pytorch_forecasting.models.nbeats.NBeats.html), +# the authors recommend using `"widths"` of `[32, 512]`. +# In order to prevent overfitting with smaller datasets, a good rule of thumb is to limit the number of parameters of +# your model. +# For this reason, we use `"widths"` of `[16, 256]`. +# +# To understand the `"backcast_loss_ratio"`, let's take a look at this diagram of the model taken from +# [the arXiv paper](https://arxiv.org/abs/1905.10437): +# +# ![N-BEATS diagram](diagram.png) +# +# Each 'block' within the N-BEATS architecture includes a forecast output and a backcast which can each yield their own +# loss. +# The `"backcast_loss_ratio"` is the ratio of the backcast loss to the forecast loss. +# A value of `1.0` means that the loss function is simply the sum of the forecast and backcast losses. + +# %% +model = TabularForecaster( + datamodule.parameters, backbone="n_beats", backbone_kwargs={"widths": [16, 256], "backcast_loss_ratio": 1.0} +) + +# %% [markdown] +# ## Finding the learning rate +# +# Tabular models can be particularly sensitive to the choice of learning rate. 
+# Helpfully, PyTorch Lightning provides a built-in learning rate finder that suggests a suitable learning rate +# automatically. +# To use it, we first create our Trainer. +# We apply gradient clipping (a common technique for tabular tasks) with ``gradient_clip_val=0.01`` in order to help +# prevent our model from over-fitting. +# Here's how to find the learning rate: + +# %% +trainer = flash.Trainer( + max_epochs=3, + gpus=int(torch.cuda.is_available()), + gradient_clip_val=0.01, +) + +res = trainer.tuner.lr_find(model, datamodule=datamodule, min_lr=1e-5) +print(f"Suggested learning rate: {res.suggestion()}") +res.plot(show=True, suggest=True).show() + +# %% [markdown] +# Once the suggested learning rate has been found, we can update our model with it: + +# %% +model.learning_rate = res.suggestion() + +# %% [markdown] +# ## Training the model +# Now all we have to do is train the model! + +# %% +trainer.fit(model, datamodule=datamodule) + +# %% [markdown] +# ## Plot the interpretation +# +# An important feature of the N-BEATS model is that it can be configured to produce an interpretable prediction that is +# split into both a low frequency (trend) component and a high frequency (seasonality) component. +# For hourly observations, we might expect the trend component to show us how electricity prices are changing from one +# day to the next (for example, whether prices were generally higher or lower than yesterday). +# In contrast, the seasonality component would be expected to show us the general pattern in prices through the day +# (for example, if there is typically a peak in price around lunch time or a drop at night). +# +# It is often useful to visualize this decomposition and the `TabularForecaster` makes it simple. +# First, we load the best model from our training run and generate some predictions. +# Next, we convert the predictions to the format expected by PyTorch Forecasting using the `convert_predictions` utility +# function.
def plot_interpretation(model_path: str, predict_df: pd.DataFrame, parameters: Dict[str, Any]):
    """Reload a trained forecaster and plot the interpretation of its predictions.

    Args:
        model_path: Checkpoint location passed to ``TabularForecaster.load_from_checkpoint``.
        predict_df: Frame to generate predictions for.
        parameters: Data parameters forwarded to ``TabularForecastingData.from_data_frame``.
    """
    forecaster = TabularForecaster.load_from_checkpoint(model_path)
    predict_data = TabularForecastingData.from_data_frame(
        parameters=parameters,
        predict_data_frame=predict_df,
        batch_size=256,
    )
    # Use one GPU when CUDA is available, otherwise none.
    predictor = flash.Trainer(gpus=int(torch.cuda.is_available()))
    raw_predictions = predictor.predict(forecaster, datamodule=predict_data)
    # Convert the Flash predictions before handing them to the plotting helper.
    converted, model_inputs = convert_predictions(raw_predictions)
    forecaster.pytorch_forecasting_model.plot_interpretation(model_inputs, converted, idx=0)
    plt.show()
+ +# %% +df_energy_daily = pd.read_csv(f"{DATASET_PATH}/energy_dataset.csv", parse_dates=["time"]) +df_energy_daily = preprocess(df_energy_daily, frequency="1D") + +# %% [markdown] +# Now let's create our `TabularForecastingData` as before, this time with a four week encoding window and a one week +# prediction window. + +# %% +max_prediction_length = 1 * 7 +max_encoder_length = 4 * 7 + +training_cutoff = df_energy_daily["time_idx"].max() - max_prediction_length + +datamodule = TabularForecastingData.from_data_frame( + time_idx="time_idx", + target="price actual", + group_ids=["constant"], + max_encoder_length=max_encoder_length, + max_prediction_length=max_prediction_length, + time_varying_unknown_reals=["price actual"], + train_data_frame=df_energy_daily[df_energy_daily["time_idx"] <= training_cutoff], + val_data_frame=df_energy_daily, + batch_size=256, +) + +# %% [markdown] +# Now it's time to create a new model and trainer. +# We run for 24 times the number of epochs this time as we now have around 1/24th of the number of observations. +# This time, instead of using the learning rate finder we just set the learning rate manually: + +# %% +model = TabularForecaster( + datamodule.parameters, + backbone="n_beats", + backbone_kwargs={"widths": [16, 256], "backcast_loss_ratio": 1.0}, + learning_rate=5e-4, +) + +trainer = flash.Trainer( + max_epochs=3 * 24, + check_val_every_n_epoch=24, + gpus=int(torch.cuda.is_available()), + gradient_clip_val=0.01, +) + +# %% [markdown] +# Finally, we train the new model: + +# %% +trainer.fit(model, datamodule=datamodule) + +# %% [markdown] +# Now let's look at what it learned: + +# %% +# Todo: Make sure to uncomment the line below if you want to run predictions and visualize the graph +# plot_interpretation(trainer.checkpoint_callback.best_model_path, df_energy_daily, datamodule.parameters) + +# %% [markdown] +# Success! We can now also see weekly trends / seasonality uncovered by our new model. 
+# +# ## Closing thoughts and next steps! +# +# This tutorial has shown how Flash and PyTorch Forecasting can be used to train state-of-the-art auto-regressive +# forecasting models (such as N-BEATS). +# We've seen how we can influence the kinds of trends and patterns uncovered by the model by resampling the data and +# changing the hyper-parameters. +# +# There are plenty of ways you could take this tutorial further. +# For example, you could try a more complex model, such as the +# [temporal fusion transformer](https://pytorch-forecasting.readthedocs.io/en/latest/api/pytorch_forecasting.models.temporal_fusion_transformer.TemporalFusionTransformer.html), +# which can handle additional inputs (the kaggle data set we used also includes weather data). +# +# Alternatively, if you want to be a bit more adventurous, you could look at +# [some of the other problems that can be solved with Lightning Flash](https://lightning-flash.readthedocs.io/en/stable/?badge=stable). diff --git a/_notebooks/flash_tutorials/image_classification/.meta.yml b/_notebooks/flash_tutorials/image_classification/.meta.yml new file mode 100644 index 0000000..e4f1cfc --- /dev/null +++ b/_notebooks/flash_tutorials/image_classification/.meta.yml @@ -0,0 +1,19 @@ +title: Image Classification on Hymenoptera Dataset +author: Ethan Harris (ethan@pytorchlightning.ai) +created: 2021-11-23 +updated: 2022-08-26 +license: CC BY-SA +build: 3 +tags: + - Image Classification + - Image +description: | + In this tutorial, we'll go over the basics of lightning Flash by finetuning/predicting with an ImageClassifier on [Hymenoptera Dataset](https://www.kaggle.com/ajayrana/hymenoptera-data) containing ants and bees images.
+requirements: + - pytorch-lightning==1.6.* + - lightning-flash[image]>=0.7.0 + - torchmetrics<0.11 # todo: task argument is missing + - numpy<1.24 +accelerator: + - GPU + - CPU diff --git a/_notebooks/flash_tutorials/image_classification/image_classification.py b/_notebooks/flash_tutorials/image_classification/image_classification.py new file mode 100644 index 0000000..ba34a8b --- /dev/null +++ b/_notebooks/flash_tutorials/image_classification/image_classification.py @@ -0,0 +1,115 @@ +# %% [markdown] +# In this tutorial, we'll go over the basics of lightning Flash by finetuning/predicting with an ImageClassifier on [Hymenoptera Dataset](https://www.kaggle.com/ajayrana/hymenoptera-data) containing ants and bees images. +# +# # Finetuning +# +# Finetuning consists of four steps: +# +# - 1. Train a source neural network model on a source dataset. For computer vision, it is traditionally the [ImageNet dataset](http://www.image-net.org). As training is costly, libraries such as [Torchvision](https://pytorch.org/vision/stable/index.html) provide popular pre-trained model architectures. In this notebook, we will be using their [resnet-18](https://pytorch.org/hub/pytorch_vision_resnet/). +# +# - 2. Create a new neural network called the target model. Its architecture replicates the source model and parameters, except the last layer, which is removed. This model without its last layer is traditionally called a backbone. +# +# - 3. Add new layers after the backbone where the last output size is the number of target dataset categories. Those new layers, traditionally called the head, will be randomly initialized while the backbone will conserve its pre-trained weights from ImageNet. +# +# - 4. Train the target model on a target dataset, such as Hymenoptera Dataset with ants and bees. However, freezing some layers at training start such as the backbone tends to be more stable. In Flash, it can easily be done with `trainer.finetune(..., strategy="freeze")`.
It is also common to `freeze/unfreeze` the backbone. In `Flash`, it can be done with `trainer.finetune(..., strategy="freeze_unfreeze")`. If one wants more control on the unfreeze flow, Flash supports `trainer.finetune(..., strategy=MyFinetuningStrategy())` where `MyFinetuningStrategy` is subclassing `pytorch_lightning.callbacks.BaseFinetuning`. + +# %% + +import flash +from flash.core.data.utils import download_data +from flash.image import ImageClassificationData, ImageClassifier + +# %% [markdown] +# ## Download data +# The data are downloaded from a URL, and save in a 'data' directory. + +# %% +download_data("https://pl-flash-data.s3.amazonaws.com/hymenoptera_data.zip", "data/") + + +# %% [markdown] +# ## Load the data +# +# Flash Tasks have built-in DataModules that you can use to organize your data. Pass in a train, validation and test folders and Flash will take care of the rest. +# Creates a ImageClassificationData object from folders of images arranged in this way: +# +# train/dog/xxx.png +# train/dog/xxy.png +# train/dog/xxz.png +# train/cat/123.png +# train/cat/nsdf3.png +# train/cat/asd932.png + +# %% +datamodule = ImageClassificationData.from_folders( + train_folder="data/hymenoptera_data/train/", + val_folder="data/hymenoptera_data/val/", + test_folder="data/hymenoptera_data/test/", + batch_size=1, +) + + +# %% [markdown] +# ## Build the model +# Create the ImageClassifier task. By default, the ImageClassifier task uses a [resnet-18](https://pytorch.org/hub/pytorch_vision_resnet/) backbone to train or finetune your model. +# For [Hymenoptera Dataset](https://www.kaggle.com/ajayrana/hymenoptera-data) containing ants and bees images, ``datamodule.num_classes`` will be 2. +# Backbone can easily be changed with `ImageClassifier(backbone="resnet50")` or you could provide your own `ImageClassifier(backbone=my_backbone)` + +# %% +model = ImageClassifier(num_classes=datamodule.num_classes) + + +# %% [markdown] +# ## Create the trainer. 
Run once on data +# The trainer object can be used for training or fine-tuning tasks on new sets of data. +# You can pass in parameters to control the training routine- limit the number of epochs, run on GPUs or TPUs, etc. +# For more details, read the [Trainer Documentation](https://pytorch-lightning.readthedocs.io/en/stable/api/pytorch_lightning.trainer.trainer.Trainer.html?highlight=Trainer). +# In this demo, we will limit the fine-tuning to run just one epoch using `max_epochs=1`. + +# %% +trainer = flash.Trainer(max_epochs=1) + + +# %% [markdown] +# ## Finetune the model + +# %% +trainer.finetune(model, datamodule=datamodule, strategy="freeze") + + +# %% [markdown] +# ## Test the model + +# %% +trainer.test(model, datamodule=datamodule) + + +# %% [markdown] +# ## Save it! + +# %% +trainer.save_checkpoint("image_classification_model.pt") + +# %% [markdown] +# ## Predicting +# **Load the model from a checkpoint** + +# %% +model = ImageClassifier.load_from_checkpoint( + "https://flash-weights.s3.amazonaws.com/0.7.0/image_classification_model.pt" +) + +# %% [markdown] +# **Predict what's on a few images!
ants or bees?** + +# %% +datamodule = ImageClassificationData.from_files( + predict_files=[ + "data/hymenoptera_data/val/bees/65038344_52a45d090d.jpg", + "data/hymenoptera_data/val/bees/590318879_68cf112861.jpg", + "data/hymenoptera_data/val/ants/540543309_ddbb193ee5.jpg", + ], + batch_size=1, +) +predictions = trainer.predict(model, datamodule=datamodule) +print(predictions) diff --git a/_notebooks/flash_tutorials/tabular_classification/.meta.yml b/_notebooks/flash_tutorials/tabular_classification/.meta.yml new file mode 100644 index 0000000..8e885a9 --- /dev/null +++ b/_notebooks/flash_tutorials/tabular_classification/.meta.yml @@ -0,0 +1,18 @@ +title: Tabular Classification on Titanic Dataset +author: Ethan Harris (ethan@pytorchlightning.ai) +created: 2021-11-23 +updated: 2022-08-26 +license: CC BY-SA +build: 3 +tags: + - Tabular Classification + - Tabular +description: | + In this notebook, we'll go over the basics of lightning Flash by training a TabularClassifier on [Titanic Dataset](https://www.kaggle.com/c/titanic). +requirements: + - lightning-flash[tabular]>=0.6.0 + - pytorch-lightning==1.3.6 # todo: update to latest + - numpy<1.24 +accelerator: + - GPU + - CPU diff --git a/_notebooks/flash_tutorials/tabular_classification/tabular_classification.py b/_notebooks/flash_tutorials/tabular_classification/tabular_classification.py new file mode 100644 index 0000000..a2089ca --- /dev/null +++ b/_notebooks/flash_tutorials/tabular_classification/tabular_classification.py @@ -0,0 +1,98 @@ +# %% [markdown] +# In this notebook, we'll go over the basics of lightning Flash by training a TabularClassifier on [Titanic Dataset](https://www.kaggle.com/c/titanic). + +# # Training + +# %% + +import flash +from flash.core.data.utils import download_data +from flash.tabular import TabularClassificationData, TabularClassifier + +# %% [markdown] +# ## Download the data +# The data are downloaded from a URL, and save in a 'data' directory. 
+ +# %% +download_data("https://pl-flash-data.s3.amazonaws.com/titanic.zip", "data/") + + +# %% [markdown] +# ## Load the data +# Flash Tasks have built-in DataModules that you can use to organize your data. Pass in a train, validation and test folders and Flash will take care of the rest. +# +# Creates a TabularData relies on [Pandas DataFrame](https://pandas.pydata.org/pandas-docs/stable/reference/api/pandas.DataFrame.html). + +# %% +datamodule = TabularClassificationData.from_csv( + ["Sex", "Age", "SibSp", "Parch", "Ticket", "Cabin", "Embarked"], + ["Fare"], + target_fields="Survived", + train_file="./data/titanic/titanic.csv", + test_file="./data/titanic/test.csv", + val_split=0.25, + batch_size=8, +) + + +# %% [markdown] +# ## Build the model +# +# Note: Categorical columns will be mapped to the embedding space. Embedding space is set of tensors to be trained associated to each categorical column. + +# %% +model = TabularClassifier.from_data(datamodule) + + +# %% [markdown] +# ## Create the trainer. Run 10 times on data + +# %% +trainer = flash.Trainer(max_epochs=10) + + +# %% [markdown] +# ## Train the model + +# %% +trainer.fit(model, datamodule=datamodule) + +# %% [markdown] +# ## Test model + +# %% +trainer.test(model, datamodule=datamodule) + + +# %% [markdown] +# ## Save it! + +# %% +trainer.save_checkpoint("tabular_classification_model.pt") + + +# %% [markdown] +# # Predicting +# ## Load the model from a checkpoint +# +# `TabularClassifier.load_from_checkpoint` supports both url or local_path to a checkpoint. If provided with an url, the checkpoint will first be downloaded and loaded to re-create the model. + +# %% +model = TabularClassifier.load_from_checkpoint( + "https://flash-weights.s3.amazonaws.com/0.7.0/tabular_classification_model.pt" +) + + +# %% [markdown] +# ## Generate predictions from a sheet file! Who would survive? +# +# `TabularClassifier.predict` supports both DataFrame and path to `.csv` file.
+ +# %% +datamodule = TabularClassificationData.from_csv( + predict_file="data/titanic/titanic.csv", + parameters=datamodule.parameters, + batch_size=8, +) +predictions = trainer.predict(model, datamodule=datamodule) +print(predictions) diff --git a/_notebooks/flash_tutorials/text_classification/.meta.yml b/_notebooks/flash_tutorials/text_classification/.meta.yml new file mode 100644 index 0000000..1b1592a --- /dev/null +++ b/_notebooks/flash_tutorials/text_classification/.meta.yml @@ -0,0 +1,19 @@ +title: Finetuning a Text Classifier on IMDB Dataset +author: Ethan Harris (ethan@pytorchlightning.ai) +created: 2021-11-23 +updated: 2022-08-26 +license: CC BY-SA +build: 3 +tags: + - Text Classification + - Text +description: | + In this notebook, we'll go over the basics of lightning Flash by finetuning a TextClassifier on IMDB Dataset. +requirements: + - pytorch-lightning==1.6.* + - lightning-flash[text]>=0.7.0 + - torchmetrics<0.11 # todo: update to use task=... + - numpy<1.24 +accelerator: + - GPU + - CPU diff --git a/_notebooks/flash_tutorials/text_classification/text_classification.py b/_notebooks/flash_tutorials/text_classification/text_classification.py new file mode 100644 index 0000000..f83bac5 --- /dev/null +++ b/_notebooks/flash_tutorials/text_classification/text_classification.py @@ -0,0 +1,110 @@ +# %% [markdown] +# In this notebook, we'll go over the basics of lightning Flash by finetuning a TextClassifier on [IMDB Dataset](https://paperswithcode.com/dataset/imdb-movie-reviews). +# +# # Finetuning +# +# Finetuning consists of four steps: +# +# - 1. Train a source neural network model on a source dataset. For text classification, it is traditionally a transformer model such as BERT [Bidirectional Encoder Representations from Transformers](https://arxiv.org/abs/1810.04805) trained on wikipedia.
+# As those models are costly to train, the [Transformers](https://github.com/huggingface/transformers) or [FairSeq](https://github.com/pytorch/fairseq) libraries provide popular pre-trained model architectures for NLP. In this notebook, we will be using [tiny-bert](https://huggingface.co/prajjwal1/bert-tiny). +# +# - 2. Create a new neural network called the target model. Its architecture replicates all model designs and their parameters on the source model, except the last layer, which is removed. This model without its last layers is traditionally called a backbone. +# +# - 3. Add new layers after the backbone where the last output size is the number of target dataset categories. Those new layers, traditionally called the head, will be randomly initialized while the backbone will conserve its pre-trained weights from the source dataset. +# +# - 4. Train the target model on a target dataset, such as the IMDB movie review dataset. However, freezing some layers at training start such as the backbone tends to be more stable. In Flash, it can easily be done with `trainer.finetune(..., strategy="freeze")`. It is also common to `freeze/unfreeze` the backbone. In `Flash`, it can be done with `trainer.finetune(..., strategy="freeze_unfreeze")`. If one wants more control on the unfreeze flow, Flash supports `trainer.finetune(..., strategy=MyFinetuningStrategy())` where `MyFinetuningStrategy` is subclassing `pytorch_lightning.callbacks.BaseFinetuning`. + +# %% + +import flash +from flash.core.data.utils import download_data +from flash.text import TextClassificationData, TextClassifier + +# %% [markdown] +# ## Download the data +# The data are downloaded from a URL, and saved in a 'data' directory. + +# %% +download_data("https://pl-flash-data.s3.amazonaws.com/imdb.zip", "data/") + + +# %% [markdown] +# ## Load the data +# +# Flash Tasks have built-in DataModules that you can use to organize your data. Pass in a train, validation and test folders and Flash will take care of the rest.
+# Creates a TextClassificationData object from csv file. + +# %% +datamodule = TextClassificationData.from_csv( + "review", + "sentiment", + train_file="data/imdb/train.csv", + val_file="data/imdb/valid.csv", + test_file="data/imdb/test.csv", + batch_size=512, # just increased for the example to run fast +) + + +# %% [markdown] +# ## Build the model +# +# Create the TextClassifier task. By default, the TextClassifier task uses a [tiny-bert](https://huggingface.co/prajjwal1/bert-tiny) backbone to train or finetune your model demo. You could use any models from [transformers - Text Classification](https://huggingface.co/models?filter=text-classification,pytorch) +# +# Backbone can easily be changed, for example with `TextClassifier(backbone='bert-tiny-mnli')` + +# %% +model = TextClassifier(num_classes=datamodule.num_classes, backbone="prajjwal1/bert-tiny") + + +# %% [markdown] +# ## Create the trainer. Run once on data + +# %% +trainer = flash.Trainer(max_epochs=1) + + +# %% [markdown] +# ## Fine-tune the model +# +# With `strategy="freeze"` the backbone is kept frozen while the rest of the model is finetuned on the imdb dataset + +# %% +trainer.finetune(model, datamodule=datamodule, strategy="freeze") + + +# %% [markdown] +# ## Test model + +# %% +trainer.test(model, datamodule=datamodule) + + +# %% [markdown] +# ## Save it! + +# %% +trainer.save_checkpoint("text_classification_model.pt") + + +# %% [markdown] +# ## Predicting +# **Load the model from a checkpoint** + +# %% +model = TextClassifier.load_from_checkpoint("text_classification_model.pt") + + +# %% [markdown] +# **Classify a few sentences!
How was the movie?** + +# %% +datamodule = TextClassificationData.from_lists( + predict_data=[ + "Turgid dialogue, feeble characterization - Harvey Keitel a judge?.", + "The worst movie in the history of cinema.", + "I come from Bulgaria where it 's almost impossible to have a tornado.", + ], + batch_size=4, +) +predictions = trainer.predict(model, datamodule=datamodule) +print(predictions) diff --git a/_notebooks/lightning_examples/augmentation_kornia/.meta.yml b/_notebooks/lightning_examples/augmentation_kornia/.meta.yml new file mode 100644 index 0000000..7f5c11c --- /dev/null +++ b/_notebooks/lightning_examples/augmentation_kornia/.meta.yml @@ -0,0 +1,24 @@ +title: GPU and batched data augmentation with Kornia and PyTorch-Lightning +author: PL/Kornia team +created: 2021-06-11 +updated: 2023-03-15 +license: CC BY-SA +build: 0 +tags: + - Image +description: | + In this tutorial we will show how to combine both Kornia and PyTorch Lightning + to perform efficient data augmentation to train a simple model using the GPU in batch + mode without additional effort. 
+requirements: + - kornia + - lightning + - torchmetrics + - torchvision + - matplotlib + - pandas + - seaborn + - lightning>=2.0.0rc0 +accelerator: + - CPU + - GPU diff --git a/docs/_static/icon.svg b/_notebooks/lightning_examples/augmentation_kornia/.thumb.svg similarity index 100% rename from docs/_static/icon.svg rename to _notebooks/lightning_examples/augmentation_kornia/.thumb.svg diff --git a/_notebooks/lightning_examples/augmentation_kornia/augmentation.py b/_notebooks/lightning_examples/augmentation_kornia/augmentation.py new file mode 100644 index 0000000..46ab969 --- /dev/null +++ b/_notebooks/lightning_examples/augmentation_kornia/augmentation.py @@ -0,0 +1,206 @@ +# %% +import os + +import lightning as L +import matplotlib.pyplot as plt +import numpy as np +import pandas as pd +import seaborn as sn +import torch +import torch.nn as nn +import torchmetrics +import torchvision +from IPython.display import display +from kornia import image_to_tensor, tensor_to_image +from kornia.augmentation import ColorJitter, RandomChannelShuffle, RandomHorizontalFlip, RandomThinPlateSpline +from lightning.pytorch.loggers import CSVLogger +from torch import Tensor +from torch.nn import functional as F +from torch.utils.data import DataLoader +from torchvision.datasets import CIFAR10 + +sn.set() + +# %% [markdown] +# ## Define Data Augmentations module +# +# [Kornia](https://github.com/kornia/kornia) is a low level Computer Vision library that provides a dedicated +# [`kornia.augmentation`](https://kornia.readthedocs.io/en/latest/augmentation.html) module implementing +# an extensive set of data augmentation techniques for image and video. +# +# Similar to Lightning, in Kornia it's promoted to encapsulate functionalities inside classes for readability +# and efficiency purposes.
class DataAugmentation(nn.Module):
    """Batched Kornia augmentation pipeline operating on torch tensors.

    A fixed chain of random transforms is always applied; colour jitter is
    applied afterwards only when enabled at construction time.
    """

    def __init__(self, apply_color_jitter: bool = False) -> None:
        super().__init__()
        self._apply_color_jitter = apply_color_jitter

        # Every transform in the chain is created with p=0.75.
        chained_ops = [
            RandomHorizontalFlip(p=0.75),
            RandomChannelShuffle(p=0.75),
            RandomThinPlateSpline(p=0.75),
        ]
        self.transforms = nn.Sequential(*chained_ops)

        # Built unconditionally; only used when ``apply_color_jitter`` is set.
        self.jitter = ColorJitter(0.5, 0.5, 0.5, 0.5)

    @torch.no_grad()  # disable gradients for efficiency
    def forward(self, x: Tensor) -> Tensor:
        """Run the transform chain on ``x``, then the optional colour jitter."""
        augmented = self.transforms(x)  # BxCxHxW
        if not self._apply_color_jitter:
            return augmented
        return self.jitter(augmented)
class Preprocess(nn.Module):
    """Per-sample conversion of a dataset image into a float tensor scaled by 1/255."""

    @torch.no_grad()  # pure data conversion, no gradients needed
    def forward(self, x) -> Tensor:
        """Convert one image to a channel-first float tensor.

        The input is first turned into a NumPy array (HxWxC), then
        ``image_to_tensor`` produces the CxHxW tensor (``keepdim=True`` keeps
        it unbatched), and finally the values are divided by 255.
        """
        as_array: np.ndarray = np.array(x)
        return image_to_tensor(as_array, keepdim=True).float() / 255.0
class CoolSystem(L.LightningModule):
    """Baseline CIFAR10 classifier that augments whole batches after device transfer.

    ``Preprocess`` is handed to the datasets and therefore runs per sample,
    while ``DataAugmentation`` runs once per batch inside
    ``on_after_batch_transfer`` and only while the trainer is training.
    """

    def __init__(self):
        super().__init__()
        # not the best model: experiment yourself
        self.model = torchvision.models.resnet18(pretrained=True)
        self.preprocess = Preprocess()  # per sample transforms
        self.transform = DataAugmentation()  # per batch augmentation_kornia
        metric_kwargs = {"task": "multiclass", "num_classes": 1000}
        self.train_accuracy = torchmetrics.Accuracy(**metric_kwargs)
        self.val_accuracy = torchmetrics.Accuracy(**metric_kwargs)

    def forward(self, x):
        """Run the backbone on a batch of images."""
        return self.model(x)

    def compute_loss(self, y_hat, y):
        """Cross-entropy between logits ``y_hat`` and integer targets ``y``."""
        return F.cross_entropy(y_hat, y)

    def show_batch(self, win_size=(10, 10)):
        """Plot the first training batch before and after augmentation."""
        # get a batch from the training set: try with `val_dataloader` :)
        imgs, labels = next(iter(self.train_dataloader()))
        imgs_aug = self.transform(imgs)  # apply transforms
        # one matplotlib figure per image grid: originals first, augmented second
        for image_batch in (imgs, imgs_aug):
            plt.figure(figsize=win_size)
            plt.imshow(tensor_to_image(torchvision.utils.make_grid(image_batch, nrow=8)))

    def on_after_batch_transfer(self, batch, dataloader_idx):
        """Augment the inputs of training batches; pass other batches through unchanged."""
        inputs, targets = batch
        if not self.trainer.training:
            return inputs, targets
        # batched augmentation on whatever device the batch was moved to
        return self.transform(inputs), targets

    def training_step(self, batch, batch_idx):
        """Compute the loss, update the training accuracy and log both."""
        inputs, targets = batch
        logits = self(inputs)
        loss = self.compute_loss(logits, targets)
        self.train_accuracy.update(logits, targets)
        self.log("train_loss", loss, prog_bar=False)
        self.log("train_acc", self.train_accuracy, prog_bar=False)
        return loss

    def validation_step(self, batch, batch_idx):
        """Compute the loss, update the validation accuracy and log both."""
        inputs, targets = batch
        logits = self(inputs)
        loss = self.compute_loss(logits, targets)
        self.val_accuracy.update(logits, targets)
        self.log("valid_loss", loss, prog_bar=False)
        self.log("valid_acc", self.val_accuracy, prog_bar=True)

    def configure_optimizers(self):
        """AdamW on the backbone parameters with cosine annealing over ``max_epochs``."""
        optimizer = torch.optim.AdamW(self.model.parameters(), lr=1e-4)
        scheduler = torch.optim.lr_scheduler.CosineAnnealingLR(
            optimizer, T_max=self.trainer.max_epochs, eta_min=0
        )
        return [optimizer], [scheduler]

    def prepare_data(self):
        """Instantiate both CIFAR10 splits with ``download=True`` in the working directory."""
        for is_train in (True, False):
            CIFAR10(os.getcwd(), train=is_train, download=True, transform=self.preprocess)

    def train_dataloader(self):
        """Loader over the CIFAR10 training split, batch size 32."""
        train_set = CIFAR10(os.getcwd(), train=True, download=True, transform=self.preprocess)
        return DataLoader(train_set, batch_size=32)

    def val_dataloader(self):
        """Loader over the CIFAR10 test split, batch size 32."""
        val_set = CIFAR10(os.getcwd(), train=False, download=True, transform=self.preprocess)
        return DataLoader(val_set, batch_size=32)
The simplicity of the loss function and its effectiveness + in comparison to the current state of the art makes Barlow Twins an interesting + case study. +requirements: + - torchvision + - matplotlib + - lightning>=2.0.0rc0 +accelerator: + - GPU + - CPU diff --git a/_notebooks/lightning_examples/barlow-twins/barlow_twins.py b/_notebooks/lightning_examples/barlow-twins/barlow_twins.py new file mode 100644 index 0000000..85a3132 --- /dev/null +++ b/_notebooks/lightning_examples/barlow-twins/barlow_twins.py @@ -0,0 +1,437 @@ +# %% [markdown] +# ## Barlow Twins +# +# Barlow Twins finds itself in a unique place amongst the current state-of-the-art self-supervised learning methods. It does not fall under the existing categories of contrastive learning, knowledge distillation or clustering based methods. Instead, it creates its own category of redundancy reduction and achieves competitive performance with a simple yet effective loss function. In this tutorial, we look at coding up a small version of the Barlow Twins algorithm using PyTorch Lightning. + +# %% +from functools import partial +from typing import Sequence, Tuple, Union + +import lightning as L +import matplotlib.pyplot as plt +import numpy as np +import torch +import torch.nn as nn +import torch.nn.functional as F +import torchvision.transforms as transforms +import torchvision.transforms.functional as VisionF +from lightning.pytorch.callbacks import Callback, ModelCheckpoint +from torch import Tensor +from torch.utils.data import DataLoader +from torchmetrics.functional import accuracy +from torchvision.datasets import CIFAR10 +from torchvision.models.resnet import resnet18 +from torchvision.utils import make_grid + +batch_size = 32 +num_workers = 0 # to run notebook on CPU +max_epochs = 200 +z_dim = 128 + + +# %% [markdown] +# ### Transforms +# +# We first define the data augmentation pipeline used in Barlow Twins.
class BarlowTwinsTransform:
    """Produce two augmented views plus one fine-tuning view of an image.

    The two pre-training views come from the same random pipeline: random
    resized crop, horizontal flip, colour jitter / grayscale (optionally
    Gaussian blur), conversion to tensor and optional normalization. The
    third view feeds the online fine-tuner: random crop + flip when
    ``train`` is true, a plain ``ToTensor`` otherwise.

    Args:
        train: selects the augmented (True) or plain (False) fine-tuning view.
        input_height: side length passed to ``RandomResizedCrop``; also sets
            the blur kernel size (10% of it, forced to be odd).
        gaussian_blur: whether to append a random Gaussian blur.
        jitter_strength: multiplier applied to the colour jitter parameters.
        normalize: optional transform applied after ``ToTensor``.
    """

    def __init__(self, train=True, input_height=224, gaussian_blur=True, jitter_strength=1.0, normalize=None):
        self.input_height = input_height
        self.gaussian_blur = gaussian_blur
        self.jitter_strength = jitter_strength
        self.normalize = normalize
        self.train = train

        color_jitter = transforms.ColorJitter(
            0.8 * self.jitter_strength,
            0.8 * self.jitter_strength,
            0.8 * self.jitter_strength,
            0.2 * self.jitter_strength,
        )

        color_transform = [transforms.RandomApply([color_jitter], p=0.8), transforms.RandomGrayscale(p=0.2)]

        if self.gaussian_blur:
            # GaussianBlur needs an odd kernel size
            kernel_size = int(0.1 * self.input_height)
            if kernel_size % 2 == 0:
                kernel_size += 1

            color_transform.append(transforms.RandomApply([transforms.GaussianBlur(kernel_size=kernel_size)], p=0.5))

        self.color_transform = transforms.Compose(color_transform)

        if normalize is None:
            self.final_transform = transforms.ToTensor()
        else:
            self.final_transform = transforms.Compose([transforms.ToTensor(), normalize])

        self.transform = transforms.Compose(
            [
                transforms.RandomResizedCrop(self.input_height),
                transforms.RandomHorizontalFlip(p=0.5),
                self.color_transform,
                self.final_transform,
            ]
        )

        # view consumed by the online fine-tuner: augmented only during training
        if self.train:
            self.finetune_transform = transforms.Compose(
                [
                    transforms.RandomCrop(32, padding=4, padding_mode="reflect"),
                    transforms.RandomHorizontalFlip(),
                    transforms.ToTensor(),
                ]
            )
        else:
            self.finetune_transform = transforms.ToTensor()

    def __call__(self, sample):
        """Return ``(view_1, view_2, finetune_view)`` for one input image."""
        return self.transform(sample), self.transform(sample), self.finetune_transform(sample)


def cifar10_normalization():
    """Return the per-channel CIFAR10 normalization (mean/std given on the 0-255 scale)."""
    normalize = transforms.Normalize(
        mean=[x / 255.0 for x in [125.3, 123.0, 113.9]], std=[x / 255.0 for x in [63.0, 62.1, 66.7]]
    )
    return normalize


train_transform = BarlowTwinsTransform(
    train=True, input_height=32, gaussian_blur=False, jitter_strength=0.5, normalize=cifar10_normalization()
)
train_dataset = CIFAR10(root=".", train=True, download=True, transform=train_transform)

val_transform = BarlowTwinsTransform(
    train=False, input_height=32, gaussian_blur=False, jitter_strength=0.5, normalize=cifar10_normalization()
)
# The validation split must use `val_transform` (train=False) so the fine-tuning
# view is not randomly cropped/flipped; it was previously given `train_transform`.
val_dataset = CIFAR10(root=".", train=False, download=True, transform=val_transform)

train_loader = DataLoader(train_dataset, batch_size=batch_size, shuffle=True, num_workers=num_workers, drop_last=True)
val_loader = DataLoader(val_dataset, batch_size=batch_size, shuffle=False, num_workers=num_workers, drop_last=True)
# Take the first validation batch; only its first augmented view is plotted.
for batch in val_loader:
    (img1, img2, _), label = batch
    break

img_grid = make_grid(img1, normalize=True)


def show(imgs):
    """Display one image tensor, or a list of them, side by side without axis ticks."""
    images = imgs if isinstance(imgs, list) else [imgs]
    _, axs = plt.subplots(ncols=len(images), squeeze=False)
    # squeeze=False keeps `axs` two-dimensional, so row 0 holds one axis per image
    for axis, image in zip(axs[0], images):
        pil_image = VisionF.to_pil_image(image.detach())
        axis.imshow(np.asarray(pil_image))
        axis.set(xticklabels=[], yticklabels=[], xticks=[], yticks=[])


show(img_grid)
class BarlowTwinsLoss(nn.Module):
    """Barlow Twins redundancy-reduction loss.

    Both inputs are standardized per feature over the batch, their DxD
    cross-correlation matrix is computed, and the loss is the squared
    distance of the diagonal from 1 plus ``lambda_coeff`` times the sum of
    squared off-diagonal entries.

    Args:
        batch_size: nominal batch size; stored for reference. The matrix is
            scaled by the number of rows actually passed to ``forward`` so
            partial batches are not mis-scaled.
        lambda_coeff: weight of the off-diagonal (redundancy) term.
        z_dim: projection dimensionality; stored for reference.
    """

    def __init__(self, batch_size, lambda_coeff=5e-3, z_dim=128):
        super().__init__()

        self.z_dim = z_dim
        self.batch_size = batch_size
        self.lambda_coeff = lambda_coeff

    def off_diagonal_ele(self, x):
        """Return the off-diagonal elements of a square matrix as a flat tensor.

        Taken from https://github.com/facebookresearch/barlowtwins/blob/main/main.py

        Raises:
            ValueError: if ``x`` is not square.
        """
        n, m = x.shape
        if n != m:
            raise ValueError(f"expected a square matrix, got shape {tuple(x.shape)}")
        # Dropping the last element and viewing as (n-1, n+1) puts every
        # diagonal entry in column 0, which is then sliced away.
        return x.flatten()[:-1].view(n - 1, n + 1)[:, 1:].flatten()

    def forward(self, z1, z2):
        """Compute the loss for two N x D batches of projections.

        N is the number of samples and D the projection-head output size.
        """
        num_samples = z1.shape[0]

        z1_norm = (z1 - torch.mean(z1, dim=0)) / torch.std(z1, dim=0)
        z2_norm = (z2 - torch.mean(z2, dim=0)) / torch.std(z2, dim=0)

        cross_corr = torch.matmul(z1_norm.T, z2_norm) / num_samples

        # out-of-place ops: `cross_corr` itself is left untouched
        on_diag = (torch.diagonal(cross_corr) - 1).pow(2).sum()
        off_diag = self.off_diagonal_ele(cross_corr).pow(2).sum()

        return on_diag + self.lambda_coeff * off_diag
class ProjectionHead(nn.Module):
    """Two-layer MLP projecting encoder features into the embedding space.

    Layout: Linear (with bias) -> BatchNorm1d -> ReLU -> Linear (no bias).

    Args:
        input_dim: size of the incoming feature vector.
        hidden_dim: width of the hidden layer.
        output_dim: size of the produced embedding.
    """

    def __init__(self, input_dim=2048, hidden_dim=2048, output_dim=128):
        super().__init__()

        layers = [
            nn.Linear(input_dim, hidden_dim, bias=True),
            nn.BatchNorm1d(hidden_dim),
            nn.ReLU(),
            nn.Linear(hidden_dim, output_dim, bias=False),
        ]
        self.projection_head = nn.Sequential(*layers)

    def forward(self, x):
        """Project a batch of feature vectors."""
        return self.projection_head(x)


def fn(warmup_steps, step):
    """Learning-rate multiplier: ramps linearly from 0 to 1 over ``warmup_steps``, then stays at 1."""
    return float(step) / float(max(1, warmup_steps)) if step < warmup_steps else 1.0


def linear_warmup_decay(warmup_steps):
    """Return ``fn`` with ``warmup_steps`` bound, as a one-argument callable of the step."""
    schedule = partial(fn, warmup_steps)
    return schedule
class BarlowTwins(L.LightningModule):
    """LightningModule that pre-trains an encoder with the Barlow Twins loss.

    Args:
        encoder: backbone network producing feature vectors.
        encoder_out_dim: size of the encoder output; also used as the
            projection head's hidden width.
        num_training_samples: training-set size, used to derive steps per epoch.
        batch_size: batch size, used for the loss and steps per epoch.
        lambda_coeff: weight of the off-diagonal term of the loss.
        z_dim: output size of the projection head.
        learning_rate: Adam learning rate.
        warmup_epochs: number of epochs of linear learning-rate warmup.
        max_epochs: stored on the module; not otherwise used in this class.
    """

    def __init__(
        self,
        encoder,
        encoder_out_dim,
        num_training_samples,
        batch_size,
        lambda_coeff=5e-3,
        z_dim=128,
        learning_rate=1e-4,
        warmup_epochs=10,
        max_epochs=200,
    ):
        super().__init__()

        self.encoder = encoder
        self.projection_head = ProjectionHead(input_dim=encoder_out_dim, hidden_dim=encoder_out_dim, output_dim=z_dim)
        self.loss_fn = BarlowTwinsLoss(batch_size=batch_size, lambda_coeff=lambda_coeff, z_dim=z_dim)

        self.learning_rate = learning_rate
        self.warmup_epochs = warmup_epochs
        self.max_epochs = max_epochs

        self.train_iters_per_epoch = num_training_samples // batch_size

    def forward(self, x):
        """Return encoder features (the projection head is not applied)."""
        return self.encoder(x)

    def shared_step(self, batch):
        """Embed the two augmented views and return the Barlow Twins loss."""
        # the third view and the labels are only used by the online fine-tuner
        (view_a, view_b, _), _ = batch
        embeddings = [self.projection_head(self.encoder(view)) for view in (view_a, view_b)]
        return self.loss_fn(*embeddings)

    def training_step(self, batch, batch_idx):
        """Log the per-step training loss and return it."""
        loss = self.shared_step(batch)
        self.log("train_loss", loss, on_step=True, on_epoch=False)
        return loss

    def validation_step(self, batch, batch_idx):
        """Log the epoch-aggregated validation loss."""
        self.log("val_loss", self.shared_step(batch), on_step=False, on_epoch=True)

    def configure_optimizers(self):
        """Adam with a per-step linear warmup schedule."""
        optimizer = torch.optim.Adam(self.parameters(), lr=self.learning_rate)

        warmup_steps = self.train_iters_per_epoch * self.warmup_epochs
        warmup = torch.optim.lr_scheduler.LambdaLR(optimizer, linear_warmup_decay(warmup_steps))

        # step the scheduler after every optimizer step rather than every epoch
        scheduler = {"scheduler": warmup, "interval": "step", "frequency": 1}
        return [optimizer], [scheduler]
class OnlineFineTuner(Callback):
    """Train a linear classifier on frozen encoder features alongside pre-training.

    A linear layer is attached to the module as ``online_finetuner`` when
    fitting starts and optimized with its own Adam optimizer after every
    training batch. Encoder features are computed under ``torch.no_grad``
    so no gradient reaches the encoder.

    Args:
        encoder_output_dim: size of the feature vector returned by the module.
        num_classes: number of target classes; sizes the linear layer and is
            passed to the accuracy metric.
    """

    def __init__(
        self,
        encoder_output_dim: int,
        num_classes: int,
    ) -> None:
        super().__init__()

        self.optimizer: torch.optim.Optimizer

        self.encoder_output_dim = encoder_output_dim
        self.num_classes = num_classes

    def on_fit_start(self, trainer: L.Trainer, pl_module: L.LightningModule) -> None:
        """Attach the linear evaluation layer and create its optimizer."""
        pl_module.online_finetuner = nn.Linear(self.encoder_output_dim, self.num_classes).to(pl_module.device)
        self.optimizer = torch.optim.Adam(pl_module.online_finetuner.parameters(), lr=1e-4)

    def extract_online_finetuning_view(
        self, batch: Sequence, device: Union[str, torch.device]
    ) -> Tuple[Tensor, Tensor]:
        """Return the fine-tuning view and labels of ``batch``, moved to ``device``."""
        (_, _, finetune_view), y = batch
        finetune_view = finetune_view.to(device)
        y = y.to(device)

        return finetune_view, y

    def _classify(self, pl_module: L.LightningModule, batch: Sequence) -> Tuple[Tensor, Tensor, Tensor]:
        """Return ``(logits, labels, cross-entropy loss)`` of the linear head on frozen features."""
        x, y = self.extract_online_finetuning_view(batch, pl_module.device)

        with torch.no_grad():
            feats = pl_module(x)

        feats = feats.detach()
        preds = pl_module.online_finetuner(feats)
        return preds, y, F.cross_entropy(preds, y)

    def _accuracy(self, preds: Tensor, y: Tensor) -> Tensor:
        """Multiclass accuracy using the configured class count instead of a hard-coded 10."""
        return accuracy(F.softmax(preds, dim=1), y, task="multiclass", num_classes=self.num_classes)

    def on_train_batch_end(
        self,
        trainer: L.Trainer,
        pl_module: L.LightningModule,
        outputs: Sequence,
        batch: Sequence,
        batch_idx: int,
    ) -> None:
        """Take one optimizer step on the linear head and log its accuracy and loss."""
        preds, y, loss = self._classify(pl_module, batch)

        loss.backward()
        self.optimizer.step()
        self.optimizer.zero_grad()

        acc = self._accuracy(preds, y)
        pl_module.log("online_train_acc", acc, on_step=True, on_epoch=False)
        pl_module.log("online_train_loss", loss, on_step=True, on_epoch=False)

    def on_validation_batch_end(
        self,
        trainer: L.Trainer,
        pl_module: L.LightningModule,
        outputs: Sequence,
        batch: Sequence,
        batch_idx: int,
    ) -> None:
        """Evaluate the linear head on a validation batch and log epoch-level metrics."""
        preds, y, loss = self._classify(pl_module, batch)

        acc = self._accuracy(preds, y)
        pl_module.log("online_val_acc", acc, on_step=False, on_epoch=True, sync_dist=True)
        pl_module.log("online_val_loss", loss, on_step=False, on_epoch=True, sync_dist=True)
+ +# %% +# ckpt_model = torch.load('') # upload checkpoint to aws +# encoder = ckpt_model.encoder +encoder = model.encoder + +downstream_dataset = CIFAR10(root=".", train=False, transform=transforms.ToTensor()) +dataloader = DataLoader(downstream_dataset, batch_size=4, shuffle=False) + +for batch in dataloader: + img, label = batch + print(encoder(img).shape) + break diff --git a/_notebooks/lightning_examples/basic-gan/.meta.yaml b/_notebooks/lightning_examples/basic-gan/.meta.yaml new file mode 100644 index 0000000..dca0517 --- /dev/null +++ b/_notebooks/lightning_examples/basic-gan/.meta.yaml @@ -0,0 +1,20 @@ +title: PyTorch Lightning Basic GAN Tutorial +author: PL team +created: 2020-12-21 +updated: 2023-03-15 +license: CC BY-SA +build: 0 +tags: + - Image +description: | + How to train a GAN! + + Main takeaways: + 1. Generator and discriminator are arbitrary PyTorch modules. + 2. training_step does both the generator and discriminator training. +requirements: + - torchvision + - lightning>=2.0.0rc0 +accelerator: + - CPU + - GPU diff --git a/_notebooks/lightning_examples/basic-gan/gan.py b/_notebooks/lightning_examples/basic-gan/gan.py new file mode 100644 index 0000000..b8e3827 --- /dev/null +++ b/_notebooks/lightning_examples/basic-gan/gan.py @@ -0,0 +1,266 @@ +# %% +import os + +import lightning as L +import numpy as np +import torch +import torch.nn as nn +import torch.nn.functional as F +import torchvision +import torchvision.transforms as transforms +from torch.utils.data import DataLoader, random_split +from torchvision.datasets import MNIST + +PATH_DATASETS = os.environ.get("PATH_DATASETS", ".") +BATCH_SIZE = 256 if torch.cuda.is_available() else 64 +NUM_WORKERS = int(os.cpu_count() / 2) + +# %% [markdown] +# ### MNIST DataModule +# +# Below, we define a DataModule for the MNIST Dataset. To learn more about DataModules, check out our tutorial +# on them or see the [latest release docs](https://lightning.ai/docs/pytorch/stable/data/datamodule.html). 
class MNISTDataModule(L.LightningDataModule):
    """DataModule serving MNIST with a fixed 55000/5000 train/validation split.

    Args:
        data_dir: directory where MNIST is downloaded and read from.
        batch_size: batch size shared by all three loaders.
        num_workers: worker count shared by all three loaders.
    """

    def __init__(
        self,
        data_dir: str = PATH_DATASETS,
        batch_size: int = BATCH_SIZE,
        num_workers: int = NUM_WORKERS,
    ):
        super().__init__()
        self.data_dir = data_dir
        self.batch_size = batch_size
        self.num_workers = num_workers

        to_tensor = transforms.ToTensor()
        standardize = transforms.Normalize((0.1307,), (0.3081,))
        self.transform = transforms.Compose([to_tensor, standardize])

        self.dims = (1, 28, 28)
        self.num_classes = 10

    def prepare_data(self):
        """Download both MNIST splits."""
        for is_train in (True, False):
            MNIST(self.data_dir, train=is_train, download=True)

    def setup(self, stage=None):
        """Create the datasets needed for ``stage`` (all of them when ``stage`` is None)."""
        if stage is None or stage == "fit":
            full_train = MNIST(self.data_dir, train=True, transform=self.transform)
            self.mnist_train, self.mnist_val = random_split(full_train, [55000, 5000])

        if stage is None or stage == "test":
            self.mnist_test = MNIST(self.data_dir, train=False, transform=self.transform)

    def _make_loader(self, dataset):
        """Build a loader with the module's batch size and worker count."""
        return DataLoader(dataset, batch_size=self.batch_size, num_workers=self.num_workers)

    def train_dataloader(self):
        """Loader over the 55000-sample training subset."""
        return self._make_loader(self.mnist_train)

    def val_dataloader(self):
        """Loader over the 5000-sample validation subset."""
        return self._make_loader(self.mnist_val)

    def test_dataloader(self):
        """Loader over the MNIST test split."""
        return self._make_loader(self.mnist_test)
class Generator(nn.Module):
    """MLP mapping a latent vector to an image of shape ``img_shape``.

    Hidden widths are 128 -> 256 -> 512 -> 1024 with LeakyReLU(0.2); every
    hidden layer except the first is followed by batch normalization. The
    output layer is a Linear + Tanh reshaped to ``img_shape``.

    Args:
        latent_dim: size of the input noise vector.
        img_shape: shape of one generated image, without the batch dimension.
    """

    def __init__(self, latent_dim, img_shape):
        super().__init__()
        self.img_shape = img_shape

        widths = (latent_dim, 128, 256, 512, 1024)
        layers = []
        for index, (in_feat, out_feat) in enumerate(zip(widths[:-1], widths[1:])):
            layers.append(nn.Linear(in_feat, out_feat))
            if index > 0:  # the first hidden layer is not normalized
                # NOTE(review): the second positional argument of BatchNorm1d is
                # `eps`, so 0.8 is the epsilon here, not the momentum. Behaviour is
                # kept as-is; confirm whether momentum=0.8 was intended.
                layers.append(nn.BatchNorm1d(out_feat, eps=0.8))
            layers.append(nn.LeakyReLU(0.2, inplace=True))
        layers.append(nn.Linear(1024, int(np.prod(img_shape))))
        layers.append(nn.Tanh())

        self.model = nn.Sequential(*layers)

    def forward(self, z):
        """Generate a batch of images from a batch of latent vectors."""
        flat = self.model(z)
        return flat.view(flat.size(0), *self.img_shape)


class Discriminator(nn.Module):
    """MLP scoring flattened images with a sigmoid output of shape (batch, 1).

    Args:
        img_shape: shape of one input image, without the batch dimension.
    """

    def __init__(self, img_shape):
        super().__init__()

        layers = [
            nn.Linear(int(np.prod(img_shape)), 512),
            nn.LeakyReLU(0.2, inplace=True),
            nn.Linear(512, 256),
            nn.LeakyReLU(0.2, inplace=True),
            nn.Linear(256, 1),
            nn.Sigmoid(),
        ]
        self.model = nn.Sequential(*layers)

    def forward(self, img):
        """Flatten each image and return its validity score."""
        return self.model(img.view(img.size(0), -1))
class GAN(L.LightningModule):
    """GAN trained with manual optimization: one generator and one discriminator step per batch.

    Args:
        channels, width, height: combined into the image shape handed to the
            generator and discriminator.
        latent_dim: size of the noise vector fed to the generator.
        lr: learning rate for both Adam optimizers.
        b1, b2: Adam beta coefficients for both optimizers.
        batch_size: captured by ``save_hyperparameters``; not read elsewhere in this class.
        **kwargs: accepted and captured as hyperparameters.
    """

    def __init__(
        self,
        channels,
        width,
        height,
        latent_dim: int = 100,
        lr: float = 0.0002,
        b1: float = 0.5,
        b2: float = 0.999,
        batch_size: int = BATCH_SIZE,
        **kwargs,
    ):
        super().__init__()
        self.save_hyperparameters()
        # both optimizers are stepped by hand inside `training_step`
        self.automatic_optimization = False

        # networks
        data_shape = (channels, width, height)
        self.generator = Generator(latent_dim=self.hparams.latent_dim, img_shape=data_shape)
        self.discriminator = Discriminator(img_shape=data_shape)

        # fixed noise reused at the end of every validation epoch
        self.validation_z = torch.randn(8, self.hparams.latent_dim)

        self.example_input_array = torch.zeros(2, self.hparams.latent_dim)

    def forward(self, z):
        """Generate images from latent vectors ``z``."""
        return self.generator(z)

    def adversarial_loss(self, y_hat, y):
        """Binary cross-entropy between discriminator outputs ``y_hat`` and targets ``y``."""
        return F.binary_cross_entropy(y_hat, y)

    def training_step(self, batch):
        """Run one generator update followed by one discriminator update."""
        imgs, _ = batch

        optimizer_g, optimizer_d = self.optimizers()

        # sample noise with the same dtype/device as the real images
        z = torch.randn(imgs.shape[0], self.hparams.latent_dim)
        z = z.type_as(imgs)

        # train generator
        # generate images
        self.toggle_optimizer(optimizer_g)
        self.generated_imgs = self(z)

        # log sampled images (always written with step 0)
        # NOTE(review): assumes `self.logger.experiment` exposes `add_image`
        # (TensorBoard SummaryWriter style) -- confirm against the configured logger
        sample_imgs = self.generated_imgs[:6]
        grid = torchvision.utils.make_grid(sample_imgs)
        self.logger.experiment.add_image("generated_images", grid, 0)

        # generator targets are all ones: it is rewarded when the discriminator
        # scores its samples as real
        # `type_as` matches the batch because this tensor is created inside the step
        valid = torch.ones(imgs.size(0), 1)
        valid = valid.type_as(imgs)

        # adversarial loss is binary cross-entropy
        g_loss = self.adversarial_loss(self.discriminator(self(z)), valid)
        self.log("g_loss", g_loss, prog_bar=True)
        self.manual_backward(g_loss)
        optimizer_g.step()
        optimizer_g.zero_grad()
        self.untoggle_optimizer(optimizer_g)

        # train discriminator
        # Measure discriminator's ability to classify real from generated samples
        self.toggle_optimizer(optimizer_d)

        # how well can it label as real?
        valid = torch.ones(imgs.size(0), 1)
        valid = valid.type_as(imgs)

        real_loss = self.adversarial_loss(self.discriminator(imgs), valid)

        # how well can it label as fake?
        fake = torch.zeros(imgs.size(0), 1)
        fake = fake.type_as(imgs)

        # `.detach()` keeps the discriminator loss from back-propagating into the generator
        fake_loss = self.adversarial_loss(self.discriminator(self(z).detach()), fake)

        # discriminator loss is the average of these
        d_loss = (real_loss + fake_loss) / 2
        self.log("d_loss", d_loss, prog_bar=True)
        self.manual_backward(d_loss)
        optimizer_d.step()
        optimizer_d.zero_grad()
        self.untoggle_optimizer(optimizer_d)

    def configure_optimizers(self):
        """Return one Adam optimizer per network (generator first) and no schedulers."""
        lr = self.hparams.lr
        b1 = self.hparams.b1
        b2 = self.hparams.b2

        opt_g = torch.optim.Adam(self.generator.parameters(), lr=lr, betas=(b1, b2))
        opt_d = torch.optim.Adam(self.discriminator.parameters(), lr=lr, betas=(b1, b2))
        return [opt_g, opt_d], []

    def on_validation_epoch_end(self):
        """Log a grid of images generated from the fixed validation noise."""
        # match the dtype/device of the generator's first layer weights
        z = self.validation_z.type_as(self.generator.model[0].weight)

        # log sampled images
        sample_imgs = self(z)
        grid = torchvision.utils.make_grid(sample_imgs)
        self.logger.experiment.add_image("generated_images", grid, self.current_epoch)
def split_dataset(dataset, val_split=0.2, train=True):
    """Split ``dataset`` into train and validation subsets and return one of them.

    The split uses a generator seeded with 42, so calling this once with
    ``train=True`` and once with ``train=False`` on datasets of equal length
    yields complementary index sets.

    Args:
        dataset: any dataset supporting ``len``.
        val_split: validation size, as a sample count (int) or fraction (float).
        train: return the training subset when true, else the validation subset.

    Raises:
        ValueError: if ``val_split`` has an unsupported type or is out of range.
    """
    splits = get_splits(len(dataset), val_split)
    dataset_train, dataset_val = random_split(dataset, splits, generator=torch.Generator().manual_seed(42))
    return dataset_train if train else dataset_val


def get_splits(len_dataset, val_split):
    """Compute ``[train_len, val_len]`` for a dataset of ``len_dataset`` samples.

    Args:
        len_dataset: total number of samples.
        val_split: an int is taken as the number of validation samples; a
            float is taken as the fraction of the dataset (rounded down).

    Raises:
        ValueError: if ``val_split`` is neither int nor float, or if the
            resulting validation size is negative or exceeds ``len_dataset``.
    """
    if isinstance(val_split, int):
        val_len = val_split
    elif isinstance(val_split, float):
        val_len = int(val_split * len_dataset)
    else:
        raise ValueError(f"Unsupported type {type(val_split)}")

    # Fail here with a clear message instead of handing negative lengths to random_split.
    if not 0 <= val_len <= len_dataset:
        raise ValueError(
            f"val_split={val_split!r} gives {val_len} validation samples, "
            f"which is outside the range [0, {len_dataset}]"
        )

    return [len_dataset - val_len, val_len]
def create_model():
    """Build a torchvision ResNet-18 adapted to 32x32 CIFAR10 inputs.

    The stock first convolution is replaced by a 3x3, stride-1 convolution and the
    max-pool layer by an identity, as described in the notebook text for small images.

    Returns:
        A randomly initialised ``torchvision.models.ResNet`` with 10 output classes.
    """
    # `weights=None` replaces the deprecated `pretrained=False` flag; both mean random init.
    model = torchvision.models.resnet18(weights=None, num_classes=10)
    model.conv1 = nn.Conv2d(3, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)
    model.maxpool = nn.Identity()
    return model
class SWAResnet(LitResnet):
    """Fine-tune an already trained network while keeping a stochastic weight average of it.

    The trained network is stored as ``self.model`` and wrapped in
    ``torch.optim.swa_utils.AveragedModel`` (``self.swa_model``). ``forward`` runs the
    averaged model, while optimisation and validation use ``self.model`` directly.

    Args:
        trained_model: The network to continue training and to average.
        lr: Learning rate for the SGD optimizer.
    """

    def __init__(self, trained_model, lr=0.01):
        super().__init__()

        self.save_hyperparameters("lr")
        self.model = trained_model
        self.swa_model = AveragedModel(self.model)

    def forward(self, x):
        """Return log-probabilities computed by the averaged model."""
        out = self.swa_model(x)
        return F.log_softmax(out, dim=1)

    def on_train_epoch_end(self):
        """Fold the current weights of ``self.model`` into the running average."""
        self.swa_model.update_parameters(self.model)

    def validation_step(self, batch, batch_idx, stage=None):
        """Log ``val_loss`` and ``val_acc`` of the non-averaged model on one batch."""
        x, y = batch
        logits = F.log_softmax(self.model(x), dim=1)
        loss = F.nll_loss(logits, y)
        preds = torch.argmax(logits, dim=1)
        acc = accuracy(preds, y, task="multiclass", num_classes=10)

        self.log("val_loss", loss, prog_bar=True)
        self.log("val_acc", acc, prog_bar=True)

    def configure_optimizers(self):
        """Return a plain SGD optimizer over ``self.model``'s parameters (no scheduler)."""
        optimizer = torch.optim.SGD(self.model.parameters(), lr=self.hparams.lr, momentum=0.9, weight_decay=5e-4)
        return optimizer

    def on_train_end(self):
        """Recompute the batch-norm statistics of the averaged model on the training data."""
        # The trainer may have been fitted with plain dataloaders, in which case
        # `trainer.datamodule` is None; fall back to the loader the trainer was given.
        datamodule = self.trainer.datamodule
        if datamodule is not None:
            train_loader = datamodule.train_dataloader()
        else:
            train_loader = self.trainer.train_dataloader
        update_bn(train_loader, self.swa_model, device=self.device)
# Wrap the network trained above so its weights get averaged during further training.
swa_model = SWAResnet(model.model, lr=0.01)

swa_trainer = L.Trainer(
    max_epochs=20,
    accelerator="auto",
    devices=1,
    logger=CSVLogger(save_dir="logs/"),
)

# `Trainer.fit` names this argument `val_dataloaders` (plural); `val_dataloader=` raises a TypeError.
swa_trainer.fit(swa_model, train_dataloader, val_dataloaders=val_dataloader)
swa_trainer.test(swa_model, test_dataloader)

# %%

# Read the metrics written by the SWA run, not those of the first `trainer`.
metrics = pd.read_csv(f"{swa_trainer.logger.log_dir}/metrics.csv")
del metrics["step"]
metrics.set_index("epoch", inplace=True)
display(metrics.dropna(axis=1, how="all").head())
sn.relplot(data=metrics, kind="line")
class LitMNIST(L.LightningModule):
    """MNIST classifier that carries its own data pipeline.

    The dataset-specific pieces (input dimensions, number of classes, transform and the
    dataloader hooks) are deliberately hard-coded in this module; the notebook later
    moves them into a ``LightningDataModule``.

    Args:
        data_dir: Directory the MNIST files are downloaded to and read from.
        hidden_size: Width of the two hidden linear layers.
        learning_rate: Learning rate passed to Adam.
    """

    def __init__(self, data_dir=PATH_DATASETS, hidden_size=64, learning_rate=2e-4):
        super().__init__()

        # We hardcode dataset specific stuff here.
        self.data_dir = data_dir
        self.num_classes = 10
        self.dims = (1, 28, 28)
        channels, width, height = self.dims
        self.transform = transforms.Compose(
            [
                transforms.ToTensor(),
                transforms.Normalize((0.1307,), (0.3081,)),
            ]
        )

        self.hidden_size = hidden_size
        self.learning_rate = learning_rate

        # Build model
        self.model = nn.Sequential(
            nn.Flatten(),
            nn.Linear(channels * width * height, hidden_size),
            nn.ReLU(),
            nn.Dropout(0.1),
            nn.Linear(hidden_size, hidden_size),
            nn.ReLU(),
            nn.Dropout(0.1),
            nn.Linear(hidden_size, self.num_classes),
        )

    def forward(self, x):
        """Return per-class log-probabilities for a batch of images."""
        x = self.model(x)
        return F.log_softmax(x, dim=1)

    def training_step(self, batch):
        """Return the negative log-likelihood loss for one training batch."""
        x, y = batch
        logits = self(x)
        loss = F.nll_loss(logits, y)
        return loss

    def validation_step(self, batch, batch_idx):
        """Log ``val_loss`` and ``val_acc`` for one validation batch."""
        x, y = batch
        logits = self(x)
        loss = F.nll_loss(logits, y)
        preds = torch.argmax(logits, dim=1)
        # Use the attribute set in `__init__` so the class count is declared in one place.
        acc = accuracy(preds, y, task="multiclass", num_classes=self.num_classes)
        self.log("val_loss", loss, prog_bar=True)
        self.log("val_acc", acc, prog_bar=True)

    def configure_optimizers(self):
        """Return an Adam optimizer over all module parameters."""
        optimizer = torch.optim.Adam(self.parameters(), lr=self.learning_rate)
        return optimizer

    ####################
    # DATA RELATED HOOKS
    ####################

    def prepare_data(self):
        """Download the MNIST train and test files into ``self.data_dir``."""
        # download
        MNIST(self.data_dir, train=True, download=True)
        MNIST(self.data_dir, train=False, download=True)

    def setup(self, stage=None):
        """Create the datasets needed for ``stage`` (``"fit"``, ``"test"`` or ``None`` for both)."""
        # Assign train/val datasets for use in dataloaders
        if stage == "fit" or stage is None:
            mnist_full = MNIST(self.data_dir, train=True, transform=self.transform)
            self.mnist_train, self.mnist_val = random_split(mnist_full, [55000, 5000])

        # Assign test dataset for use in dataloader(s)
        if stage == "test" or stage is None:
            self.mnist_test = MNIST(self.data_dir, train=False, transform=self.transform)

    def train_dataloader(self):
        """Return the training dataloader (batch size 128)."""
        return DataLoader(self.mnist_train, batch_size=128)

    def val_dataloader(self):
        """Return the validation dataloader (batch size 128)."""
        return DataLoader(self.mnist_val, batch_size=128)

    def test_dataloader(self):
        """Return the test dataloader (batch size 128)."""
        return DataLoader(self.mnist_test, batch_size=128)
class LitModel(L.LightningModule):
    """Dataset-agnostic MLP classifier whose layer sizes come from constructor arguments.

    Args:
        channels: Number of input channels.
        width: Input width in pixels.
        height: Input height in pixels.
        num_classes: Number of target classes (size of the output layer).
        hidden_size: Width of the two hidden linear layers.
        learning_rate: Learning rate passed to Adam.
    """

    def __init__(self, channels, width, height, num_classes, hidden_size=64, learning_rate=2e-4):
        super().__init__()

        # We take in input dimensions as parameters and use those to dynamically build model.
        self.channels = channels
        self.width = width
        self.height = height
        self.num_classes = num_classes
        self.hidden_size = hidden_size
        self.learning_rate = learning_rate

        self.model = nn.Sequential(
            nn.Flatten(),
            nn.Linear(channels * width * height, hidden_size),
            nn.ReLU(),
            nn.Dropout(0.1),
            nn.Linear(hidden_size, hidden_size),
            nn.ReLU(),
            nn.Dropout(0.1),
            nn.Linear(hidden_size, num_classes),
        )

    def forward(self, x):
        """Return per-class log-probabilities for a batch of inputs."""
        x = self.model(x)
        return F.log_softmax(x, dim=1)

    def training_step(self, batch):
        """Return the negative log-likelihood loss for one training batch."""
        x, y = batch
        logits = self(x)
        loss = F.nll_loss(logits, y)
        return loss

    def validation_step(self, batch, batch_idx):
        """Log ``val_loss`` and ``val_acc`` for one validation batch."""
        x, y = batch
        logits = self(x)
        loss = F.nll_loss(logits, y)
        preds = torch.argmax(logits, dim=1)
        # Use the configured class count; a literal 10 would break datasets with another count.
        acc = accuracy(preds, y, task="multiclass", num_classes=self.num_classes)
        self.log("val_loss", loss, prog_bar=True)
        self.log("val_acc", acc, prog_bar=True)

    def configure_optimizers(self):
        """Return an Adam optimizer over all module parameters."""
        optimizer = torch.optim.Adam(self.parameters(), lr=self.learning_rate)
        return optimizer
class CIFAR10DataModule(L.LightningDataModule):
    """``LightningDataModule`` that downloads CIFAR10 and serves train/val/test dataloaders.

    Args:
        data_dir: Directory the CIFAR10 files are downloaded to and read from. Defaults to
            ``PATH_DATASETS``, the same location the MNIST examples in this notebook use.
    """

    def __init__(self, data_dir: str = PATH_DATASETS):
        super().__init__()
        self.data_dir = data_dir
        self.transform = transforms.Compose(
            [
                transforms.ToTensor(),
                transforms.Normalize((0.5, 0.5, 0.5), (0.5, 0.5, 0.5)),
            ]
        )

        # Read by the notebook to size the model: `LitModel(*dm.dims, dm.num_classes)`.
        self.dims = (3, 32, 32)
        self.num_classes = 10

    def prepare_data(self):
        """Download the CIFAR10 train and test files; no state is assigned here."""
        # download
        CIFAR10(self.data_dir, train=True, download=True)
        CIFAR10(self.data_dir, train=False, download=True)

    def setup(self, stage=None):
        """Create the datasets needed for ``stage`` (``"fit"``, ``"test"`` or ``None`` for both)."""
        # Assign train/val datasets for use in dataloaders
        if stage == "fit" or stage is None:
            cifar_full = CIFAR10(self.data_dir, train=True, transform=self.transform)
            self.cifar_train, self.cifar_val = random_split(cifar_full, [45000, 5000])

        # Assign test dataset for use in dataloader(s)
        if stage == "test" or stage is None:
            self.cifar_test = CIFAR10(self.data_dir, train=False, transform=self.transform)

    def train_dataloader(self):
        """Return the training dataloader."""
        return DataLoader(self.cifar_train, batch_size=BATCH_SIZE)

    def val_dataloader(self):
        """Return the validation dataloader."""
        return DataLoader(self.cifar_val, batch_size=BATCH_SIZE)

    def test_dataloader(self):
        """Return the test dataloader."""
        return DataLoader(self.cifar_test, batch_size=BATCH_SIZE)
# %%
# Swap in the CIFAR10 datamodule; the model is sized from the datamodule's `dims` and `num_classes`.
dm = CIFAR10DataModule()
model = LitModel(*dm.dims, dm.num_classes, hidden_size=256)
trainer = L.Trainer(
    max_epochs=5,
    accelerator="auto",
    devices=1,
)
# The datamodule passed to `fit` supplies the dataloaders for this run.
trainer.fit(model, dm)
+requirements: + - finetuning-scheduler[examples]>=0.4.0 + - datasets<2.8.0 # todo: AttributeError: module 'datasets.arrow_dataset' has no attribute 'Batch' + - lightning>=2.0.0rc0 +accelerator: + - GPU diff --git a/_notebooks/lightning_examples/finetuning-scheduler/RteBoolqModule_ft_schedule_deberta_base.yaml b/_notebooks/lightning_examples/finetuning-scheduler/RteBoolqModule_ft_schedule_deberta_base.yaml new file mode 100644 index 0000000..62bdbae --- /dev/null +++ b/_notebooks/lightning_examples/finetuning-scheduler/RteBoolqModule_ft_schedule_deberta_base.yaml @@ -0,0 +1,18 @@ + +0: + params: + - model.classifier.bias + - model.classifier.weight + - model.pooler.dense.bias + - model.pooler.dense.weight + - model.deberta.encoder.LayerNorm.bias + - model.deberta.encoder.LayerNorm.weight + - model.deberta.encoder.rel_embeddings.weight + - model.deberta.encoder.layer.{0,11}.(output|attention|intermediate).* +1: + params: + - model.deberta.embeddings.LayerNorm.bias + - model.deberta.embeddings.LayerNorm.weight +2: + params: + - model.deberta.embeddings.word_embeddings.weight diff --git a/_notebooks/lightning_examples/finetuning-scheduler/emphasized_yaml.png b/_notebooks/lightning_examples/finetuning-scheduler/emphasized_yaml.png new file mode 100644 index 0000000..492be1d Binary files /dev/null and b/_notebooks/lightning_examples/finetuning-scheduler/emphasized_yaml.png differ diff --git a/_notebooks/lightning_examples/finetuning-scheduler/finetuning-scheduler.py b/_notebooks/lightning_examples/finetuning-scheduler/finetuning-scheduler.py new file mode 100644 index 0000000..956897d --- /dev/null +++ b/_notebooks/lightning_examples/finetuning-scheduler/finetuning-scheduler.py @@ -0,0 +1,708 @@ +# %% [markdown] +# ## Scheduled Fine-Tuning with the Fine-Tuning Scheduler Extension +# +# ![Fine-Tuning Scheduler logo](logo_fts.png){height="55px" width="401px"} +# +# The [Fine-Tuning Scheduler](https://finetuning-scheduler.readthedocs.io/en/stable/index.html) extension 
accelerates and enhances model experimentation with flexible fine-tuning schedules. +# +# Training with the extension is simple and confers a host of benefits: +# +# - it dramatically increases fine-tuning flexibility +# - expedites and facilitates exploration of model tuning dynamics +# - enables marginal performance improvements of fine-tuned models +# +# Setup is straightforward, just install from PyPI! Since this notebook-based example requires a few additional packages (e.g. +# ``transformers``, ``sentencepiece``), we installed the ``finetuning-scheduler`` package with the ``[examples]`` extra above. +# Once the ``finetuning-scheduler`` package is installed, the [FinetuningScheduler](https://finetuning-scheduler.readthedocs.io/en/stable/api/finetuning_scheduler.fts.html#finetuning_scheduler.fts.FinetuningScheduler) callback is available for use with PyTorch Lightning. +# For additional installation options, please see the Fine-Tuning Scheduler [README](https://github.com/speediedan/finetuning-scheduler/blob/main/README.md). +# +# +# +#
+# +# Fundamentally, [Fine-Tuning Scheduler](https://finetuning-scheduler.readthedocs.io/en/stable/index.html) enables +# scheduled, multi-phase, fine-tuning of foundation models. Gradual unfreezing (i.e. thawing) can help maximize +# foundation model knowledge retention while allowing (typically upper layers of) the model to +# optimally adapt to new tasks during transfer learning [1, 2, 3](#f1) +# +#
+# +# The [FinetuningScheduler](https://finetuning-scheduler.readthedocs.io/en/stable/api/finetuning_scheduler.fts.html#finetuning_scheduler.fts.FinetuningScheduler) callback orchestrates the gradual unfreezing +# of models via a fine-tuning schedule that is either implicitly generated (the default) or explicitly provided by the user +# (more computationally efficient). Fine-tuning phase transitions are driven by +# [FTSEarlyStopping](https://finetuning-scheduler.readthedocs.io/en/stable/api/finetuning_scheduler.fts_supporters.html#finetuning_scheduler.fts_supporters.FTSEarlyStopping) +# criteria (a multi-phase extension of ``EarlyStopping`` packaged with FinetuningScheduler), user-specified epoch transitions or a composition of the two (the default mode). +# A [FinetuningScheduler](https://finetuning-scheduler.readthedocs.io/en/stable/api/finetuning_scheduler.fts.html#finetuning_scheduler.fts.FinetuningScheduler) training session completes when the +# final phase of the schedule has its stopping criteria met. See +# the [early stopping documentation](https://lightning.ai/docs/pytorch/stable/api/pytorch_lightning.callbacks.EarlyStopping.html) for more details on that callback's configuration. +# +# ![FinetuningScheduler explicit loss animation](fts_explicit_loss_anim.gif){height="272px" width="376px"} + +# %% [markdown] +# +# ## Basic Usage +# +#
+# +# If no fine-tuning schedule is provided by the user, [FinetuningScheduler](https://finetuning-scheduler.readthedocs.io/en/stable/api/finetuning_scheduler.fts.html#finetuning_scheduler.fts.FinetuningScheduler) will generate a +# [default schedule](#The-Default-Finetuning-Schedule) and proceed to fine-tune according to the generated schedule, +# using default [FTSEarlyStopping](https://finetuning-scheduler.readthedocs.io/en/stable/api/finetuning_scheduler.fts_supporters.html#finetuning_scheduler.fts_supporters.FTSEarlyStopping) and [FTSCheckpoint](https://finetuning-scheduler.readthedocs.io/en/stable/api/finetuning_scheduler.fts_supporters.html#finetuning_scheduler.fts_supporters.FTSCheckpoint) callbacks with ``monitor=val_loss``. +# +#
+# +# ```python +# from pytorch_lightning import Trainer +# from finetuning_scheduler import FinetuningScheduler +# trainer = Trainer(callbacks=[FinetuningScheduler()]) +# ``` + +# %% [markdown] +# ## The Default Fine-Tuning Schedule +# +# Schedule definition is facilitated via the [gen_ft_schedule](https://finetuning-scheduler.readthedocs.io/en/stable/api/finetuning_scheduler.fts_supporters.html#finetuning_scheduler.fts_supporters.ScheduleImplMixin.gen_ft_schedule) method which dumps a default fine-tuning schedule (by default using a naive, 2-parameters per level heuristic) which can be adjusted as +# desired by the user and/or subsequently passed to the callback. Using the default/implicitly generated schedule will likely be less computationally efficient than a user-defined fine-tuning schedule but is useful for exploring a model's fine-tuning behavior and can serve as a good baseline for subsequent explicit schedule refinement. +# While the current version of [FinetuningScheduler](https://finetuning-scheduler.readthedocs.io/en/stable/api/finetuning_scheduler.fts.html#finetuning_scheduler.fts.FinetuningScheduler) only supports single optimizer and (optional) lr_scheduler configurations, per-phase maximum learning rates can be set as demonstrated in the next section. + +# %% [markdown] +# ## Specifying a Fine-Tuning Schedule +# +# To specify a fine-tuning schedule, it's convenient to first generate the default schedule and then alter the thawed/unfrozen parameter groups associated with each fine-tuning phase as desired. Fine-tuning phases are zero-indexed and executed in ascending order. +# +# 1. First, generate the default schedule to ``Trainer.log_dir``. It will be named after your +# ``LightningModule`` subclass with the suffix ``_ft_schedule.yaml``. +# +# ```python +# from pytorch_lightning import Trainer +# from finetuning_scheduler import FinetuningScheduler +# trainer = Trainer(callbacks=[FinetuningScheduler(gen_ft_sched_only=True)]) +# ``` +# +# 2. 
Alter the schedule as desired. +# +# ![side_by_side_yaml](side_by_side_yaml.png){height="327px" width="800px"} +# +# 3. Once the fine-tuning schedule has been altered as desired, pass it to +# [FinetuningScheduler](https://finetuning-scheduler.readthedocs.io/en/stable/api/finetuning_scheduler.fts.html#finetuning_scheduler.fts.FinetuningScheduler) to commence scheduled training: +# +# ```python +# from pytorch_lightning import Trainer +# from finetuning_scheduler import FinetuningScheduler +# +# trainer = Trainer(callbacks=[FinetuningScheduler(ft_schedule="/path/to/my/schedule/my_schedule.yaml")]) +# ``` + +# %% [markdown] +# ## Early-Stopping and Epoch-Driven Phase Transition Criteria +# +# +# By default, [FTSEarlyStopping](https://finetuning-scheduler.readthedocs.io/en/stable/api/finetuning_scheduler.fts_supporters.html#finetuning_scheduler.fts_supporters.FTSEarlyStopping) and epoch-driven +# transition criteria are composed. If a ``max_transition_epoch`` is specified for a given phase, the next fine-tuning phase will begin at that epoch unless [FTSEarlyStopping](https://finetuning-scheduler.readthedocs.io/en/stable/api/finetuning_scheduler.fts_supporters.html#finetuning_scheduler.fts_supporters.FTSEarlyStopping) criteria are met first. +# If [FinetuningScheduler.epoch_transitions_only](https://finetuning-scheduler.readthedocs.io/en/stable/api/finetuning_scheduler.fts.html#finetuning_scheduler.fts.FinetuningScheduler.params.epoch_transitions_only) is ``True``, [FTSEarlyStopping](https://finetuning-scheduler.readthedocs.io/en/stable/api/finetuning_scheduler.fts_supporters.html#finetuning_scheduler.fts_supporters.FTSEarlyStopping) will not be used +# and transitions will be exclusively epoch-driven. +# +# +#
+# +# **Tip:** Use of regex expressions can be convenient for specifying more complex schedules. Also, a per-phase base maximum lr can be specified: +# +# ![emphasized_yaml](emphasized_yaml.png){height="380px" width="800px"} +# +#
+# +# +# +# The end-to-end example in this notebook ([Scheduled Fine-Tuning For SuperGLUE](#superglue)) uses [FinetuningScheduler](https://finetuning-scheduler.readthedocs.io/en/stable/api/finetuning_scheduler.fts.html#finetuning_scheduler.fts.FinetuningScheduler) in explicit mode to fine-tune a small foundation model on the [RTE](https://huggingface.co/datasets/viewer/?dataset=super_glue&config=rte) task of [SuperGLUE](https://super.gluebenchmark.com/). +# Please see the [official Fine-Tuning Scheduler documentation](https://finetuning-scheduler.readthedocs.io/en/stable/index.html) if you are interested in a similar [CLI-based example](https://finetuning-scheduler.readthedocs.io/en/stable/index.html#example-scheduled-fine-tuning-for-superglue) using the LightningCLI. + +# %% [markdown] +# ## Resuming Scheduled Fine-Tuning Training Sessions +# +# Resumption of scheduled fine-tuning training is identical to the continuation of +# [other training sessions](https://lightning.ai/docs/pytorch/stable/common/trainer.html) with the caveat that the provided checkpoint must have been saved by a [FinetuningScheduler](https://finetuning-scheduler.readthedocs.io/en/stable/api/finetuning_scheduler.fts.html#finetuning_scheduler.fts.FinetuningScheduler) session. +# [FinetuningScheduler](https://finetuning-scheduler.readthedocs.io/en/stable/api/finetuning_scheduler.fts.html#finetuning_scheduler.fts.FinetuningScheduler) uses [FTSCheckpoint](https://finetuning-scheduler.readthedocs.io/en/stable/api/finetuning_scheduler.fts_supporters.html#finetuning_scheduler.fts_supporters.FTSCheckpoint) (an extension of ``ModelCheckpoint``) to maintain schedule state with special metadata. 
+# +# +# ```python +# from pytorch_lightning import Trainer +# from finetuning_scheduler import FinetuningScheduler +# trainer = Trainer(callbacks=[FinetuningScheduler()]) +# trainer.fit(..., ckpt_path="some/path/to/my_checkpoint.ckpt") +# ``` +# +# Training will resume at the depth/level of the provided checkpoint according to the specified schedule. Schedules can be altered between training sessions but schedule compatibility is left to the user for maximal flexibility. If executing a user-defined schedule, typically the same schedule should be provided for the original and resumed training sessions. +# +# By default ([FinetuningScheduler.restore_best](https://finetuning-scheduler.readthedocs.io/en/stable/api/finetuning_scheduler.fts.html?highlight=restore_best#finetuning_scheduler.fts.FinetuningScheduler.params.restore_best) is ``True``), [FinetuningScheduler](https://finetuning-scheduler.readthedocs.io/en/stable/api/finetuning_scheduler.fts.html#finetuning_scheduler.fts.FinetuningScheduler) will attempt to restore the best available checkpoint before fine-tuning depth transitions. +# +# ```python +# trainer = Trainer(callbacks=[FinetuningScheduler()]) +# trainer.fit(..., ckpt_path="some/path/to/my_kth_best_checkpoint.ckpt") +# ``` +# +# Note that similar to the behavior of [ModelCheckpoint](https://lightning.ai/docs/pytorch/stable/api/pytorch_lightning.callbacks.ModelCheckpoint.html), (specifically [this PR](https://github.com/Lightning-AI/lightning/pull/12045)), +# when resuming training with a different [FTSCheckpoint](https://finetuning-scheduler.readthedocs.io/en/stable/api/finetuning_scheduler.fts_supporters.html#finetuning_scheduler.fts_supporters.FTSCheckpoint) ``dirpath`` from the provided +# checkpoint, the new training session's checkpoint state will be re-initialized at the resumption depth with the provided checkpoint being set as the best checkpoint. + +# %% [markdown] +#
+# +# **Note:** Currently, [FinetuningScheduler](https://finetuning-scheduler.readthedocs.io/en/stable/api/finetuning_scheduler.fts.html#finetuning_scheduler.fts.FinetuningScheduler) supports the following strategy types: +# +# - ``ddp`` (and alias ``ddp_find_unused_parameters_false``) +# - ``fsdp_native`` (and alias ``fsdp_native_full_shard_offload``) +# - ``ddp_spawn`` (and aliases ``ddp_fork``, ``ddp_notebook``) +# - ``dp`` +# - ``ddp_sharded`` (deprecated, to be removed in 2.0) +# - ``ddp_sharded_spawn`` (deprecated, to be removed in 2.0) +# +# Custom or officially unsupported strategies can be used by setting [FinetuningScheduler.allow_untested](https://finetuning-scheduler.readthedocs.io/en/stable/api/finetuning_scheduler.fts.html?highlight=allow_untested#finetuning_scheduler.fts.FinetuningScheduler.params.allow_untested) to ``True``. +# Note that most currently unsupported strategies are so because they require varying degrees of modification to be compatible. For example, ``deepspeed`` will require a [StrategyAdapter](https://finetuning-scheduler.readthedocs.io/en/stable/api/finetuning_scheduler.strategy_adapters.html#finetuning_scheduler.strategy_adapters.StrategyAdapter) to be written (similar to the one for ``FSDP``, [FSDPStrategyAdapter](https://finetuning-scheduler.readthedocs.io/en/stable/api/finetuning_scheduler.strategy_adapters.html#finetuning_scheduler.strategy_adapters.FSDPStrategyAdapter)) before support can be added (PRs welcome!), +# while ``tpu_spawn`` would require an override of the current broadcast method to include python objects. +#
+ +# %% [markdown] +#
+# +# ## Scheduled Fine-Tuning For SuperGLUE +# +# The following example demonstrates the use of [FinetuningScheduler](https://finetuning-scheduler.readthedocs.io/en/stable/api/finetuning_scheduler.fts.html#finetuning_scheduler.fts.FinetuningScheduler) to fine-tune a small foundation model on the [RTE](https://huggingface.co/datasets/viewer/?dataset=super_glue&config=rte) task of [SuperGLUE](https://super.gluebenchmark.com/). Iterative early-stopping will be applied according to a user-specified schedule. +# + +# %% +import os +import warnings +from datetime import datetime +from typing import Any, Dict, List, Optional + +from packaging.version import Version + +import sentencepiece as sp # noqa: F401 # isort: split +import datasets +import evaluate +import pytorch_lightning as pl +import torch +from datasets import logging as datasets_logging +from lightning_fabric.accelerators.cuda import is_cuda_available +from pytorch_lightning.callbacks import EarlyStopping, ModelCheckpoint +from pytorch_lightning.loggers.tensorboard import TensorBoardLogger +from pytorch_lightning.utilities import rank_zero_warn +from torch.optim.lr_scheduler import CosineAnnealingWarmRestarts +from torch.utils.data import DataLoader +from transformers import AutoConfig, AutoModelForSequenceClassification, AutoTokenizer +from transformers import logging as transformers_logging +from transformers.tokenization_utils_base import BatchEncoding + +if Version(torch.__version__) == Version("1.12.0") or torch.__version__.startswith("1.12.0"): + # we need to use a patched version of AdamW to fix https://github.com/pytorch/pytorch/issues/80809 + # and allow examples to succeed with torch 1.12.0 (this torch bug is fixed in 1.12.1) + from fts_examples.patched_adamw import AdamW +else: + from torch.optim.adamw import AdamW + +# %% +# Import the `FinetuningScheduler` PyTorch Lightning extension module we want to use. This will import all necessary callbacks. 
import finetuning_scheduler as fts  # isort: split

# set notebook-level variables
TASK_NUM_LABELS = {"boolq": 2, "rte": 2}
DEFAULT_TASK = "rte"

# reduce hf logging verbosity to focus on tutorial-relevant code/messages
for hflogger in [transformers_logging, datasets_logging]:
    hflogger.set_verbosity_error()
# ignore warnings related to the tokenizers_parallelism/DataLoader parallelism trade-off and
# expected logging behavior
for warnf in [
    r".*does not have many workers.*",
    r".*The number of training samples.*",
    r".*converting to a fast.*",
    r".*number of training batches.*",
]:
    warnings.filterwarnings("ignore", warnf)


# %%
class RteBoolqDataModule(pl.LightningDataModule):
    """A ``LightningDataModule`` designed for both the RTE or BoolQ SuperGLUE Hugging Face datasets."""

    # maps each supported task to the pair of raw text columns that are tokenized together
    TASK_TEXT_FIELD_MAP = {"rte": ("premise", "hypothesis"), "boolq": ("question", "passage")}
    # only dataset columns named here are exposed to the dataloaders (see ``setup``)
    LOADER_COLUMNS = (
        "datasets_idx",
        "input_ids",
        "token_type_ids",
        "attention_mask",
        "start_positions",
        "end_positions",
        "labels",
    )

    def __init__(
        self,
        model_name_or_path: str,
        task_name: str = DEFAULT_TASK,
        max_seq_length: int = 128,
        train_batch_size: int = 16,
        eval_batch_size: int = 16,
        tokenizers_parallelism: bool = True,
        **dataloader_kwargs: Any,
    ):
        r"""Initialize the ``LightningDataModule`` designed for both the RTE or BoolQ SuperGLUE Hugging Face
        datasets.

        Args:
            model_name_or_path (str):
                Can be either:
                    - A string, the ``model id`` of a pretrained model hosted inside a model repo on huggingface.co.
                        Valid model ids can be located at the root-level, like ``bert-base-uncased``, or namespaced
                        under a user or organization name, like ``dbmdz/bert-base-german-cased``.
                    - A path to a ``directory`` containing model weights saved using
                        :meth:`~transformers.PreTrainedModel.save_pretrained`, e.g., ``./my_model_directory/``.
            task_name (str, optional): Name of the SuperGLUE task to execute. This module supports 'rte' or 'boolq'.
                Any other value triggers a warning and falls back to DEFAULT_TASK, which is 'rte'.
            max_seq_length (int, optional): Length to which we will pad sequences or truncate input. Defaults to 128.
            train_batch_size (int, optional): Training batch size. Defaults to 16.
            eval_batch_size (int, optional): Batch size to use for validation and testing splits. Defaults to 16.
            tokenizers_parallelism (bool, optional): Whether to use parallelism in the tokenizer. Defaults to True.
            \**dataloader_kwargs: Arguments passed when initializing the dataloader. Only ``num_workers`` and
                ``pin_memory`` are read; any other key is ignored.
        """
        super().__init__()
        if task_name not in TASK_NUM_LABELS:
            # warn instead of silently switching tasks, matching what ``RteBoolqModule`` does below
            rank_zero_warn(f"Invalid task_name {task_name!r}. Proceeding with the default task: {DEFAULT_TASK!r}")
            task_name = DEFAULT_TASK
        self.text_fields = self.TASK_TEXT_FIELD_MAP[task_name]
        self.dataloader_kwargs = {
            "num_workers": dataloader_kwargs.get("num_workers", 0),
            "pin_memory": dataloader_kwargs.get("pin_memory", False),
        }
        self.save_hyperparameters()
        # the tokenizers library reads this environment variable, so set it before building the tokenizer
        os.environ["TOKENIZERS_PARALLELISM"] = "true" if self.hparams.tokenizers_parallelism else "false"
        self.tokenizer = AutoTokenizer.from_pretrained(
            self.hparams.model_name_or_path, use_fast=True, local_files_only=False
        )

    def prepare_data(self):
        """Load the SuperGLUE dataset for the configured task, discarding the returned object."""
        # N.B. PL calls prepare_data from a single process (rank 0) so do not use it to assign
        # state (e.g. self.x=y)
        datasets.load_dataset("super_glue", self.hparams.task_name)

    def setup(self, stage):
        """Load the dataset, tokenize every split and restrict each split to the loader columns.

        Args:
            stage: Stage identifier supplied by the trainer. It is not inspected; all splits are always prepared.
        """
        self.dataset = datasets.load_dataset("super_glue", self.hparams.task_name)
        for split in self.dataset.keys():
            self.dataset[split] = self.dataset[split].map(
                self._convert_to_features, batched=True, remove_columns=["label"]
            )
            # keep only the columns present in this split that the dataloaders should expose
            self.columns = [c for c in self.dataset[split].column_names if c in self.LOADER_COLUMNS]
            self.dataset[split].set_format(type="torch", columns=self.columns)

        self.eval_splits = [x for x in self.dataset.keys() if "validation" in x]

    def train_dataloader(self):
        """Return a ``DataLoader`` over the ``train`` split using ``train_batch_size``."""
        return DataLoader(self.dataset["train"], batch_size=self.hparams.train_batch_size, **self.dataloader_kwargs)

    def val_dataloader(self):
        """Return a ``DataLoader`` over the ``validation`` split using ``eval_batch_size``."""
        return DataLoader(self.dataset["validation"], batch_size=self.hparams.eval_batch_size, **self.dataloader_kwargs)

    def _convert_to_features(self, example_batch: datasets.arrow_dataset.LazyDict) -> BatchEncoding:
        """Convert raw text examples to a :class:`~transformers.tokenization_utils_base.BatchEncoding` container
        (derived from python dict) of features that includes helpful methods for translating between word/character
        space and token space.

        Args:
            example_batch: The batch of raw examples to convert to token space. It is indexed by the two text
                field names of the configured task and by ``"label"``.

        Returns:
            ``BatchEncoding``: A batch of encoded examples (note default tokenizer batch_size=1000).
        """
        text_pairs = list(zip(example_batch[self.text_fields[0]], example_batch[self.text_fields[1]]))
        # Tokenize the text/text pairs
        features = self.tokenizer.batch_encode_plus(
            text_pairs, max_length=self.hparams.max_seq_length, padding="longest", truncation=True
        )
        # Rename label to labels to make it easier to pass to model forward
        features["labels"] = example_batch["label"]
        return features


# %%
class RteBoolqModule(pl.LightningModule):
    """A ``LightningModule`` that can be used to fine-tune a foundation model on either the RTE or BoolQ SuperGLUE
    tasks using Hugging Face implementations of a given model and the SuperGLUE Hugging Face dataset."""

    def __init__(
        self,
        model_name_or_path: str,
        optimizer_init: Dict[str, Any],
        lr_scheduler_init: Dict[str, Any],
        model_cfg: Optional[Dict[str, Any]] = None,
        task_name: str = DEFAULT_TASK,
        experiment_tag: str = "default",
    ):
        """
        Args:
            model_name_or_path (str): Path to pretrained model or identifier from https://huggingface.co/models.
            optimizer_init (Dict[str, Any]): The desired optimizer configuration.
            lr_scheduler_init (Dict[str, Any]): The desired learning rate scheduler config.
            model_cfg (Optional[Dict[str, Any]], optional): Defines overrides of the default model config. Defaults to
                ``None``.
            task_name (str, optional): The SuperGLUE task to execute, one of ``'rte'``, ``'boolq'``. Defaults to "rte".
            experiment_tag (str, optional): The tag to use for the experiment and tensorboard logs. Defaults to
                "default".
        """
        super().__init__()
        if task_name not in TASK_NUM_LABELS:
            rank_zero_warn(f"Invalid task_name {task_name!r}. Proceeding with the default task: {DEFAULT_TASK!r}")
            task_name = DEFAULT_TASK
        self.num_labels = TASK_NUM_LABELS[task_name]
        self.model_cfg = model_cfg or {}
        conf = AutoConfig.from_pretrained(model_name_or_path, num_labels=self.num_labels, local_files_only=False)
        self.model = AutoModelForSequenceClassification.from_pretrained(model_name_or_path, config=conf)
        self.model.config.update(self.model_cfg)  # apply model config overrides
        self.init_hparams = {
            "optimizer_init": optimizer_init,
            "lr_scheduler_init": lr_scheduler_init,
            "model_config": self.model.config,
            "model_name_or_path": model_name_or_path,
            "task_name": task_name,
            # timestamp prefix keeps experiment ids distinct between runs that share a tag
            "experiment_id": f"{datetime.now().strftime('%Y%m%d_%H%M%S')}_{experiment_tag}",
        }
        self.save_hyperparameters(self.init_hparams)
        self.metric = evaluate.load("super_glue", self.hparams.task_name, experiment_id=self.hparams.experiment_id)
        # substrings of parameter names that are excluded from weight decay (see ``_init_param_groups``)
        self.no_decay = ["bias", "LayerNorm.weight"]

    @property
    def finetuningscheduler_callback(self) -> Optional[fts.FinetuningScheduler]:
        """The first ``FinetuningScheduler`` among the trainer's callbacks, or ``None`` if there is none."""
        return next((c for c in self.trainer.callbacks if isinstance(c, fts.FinetuningScheduler)), None)

    def forward(self, **inputs):
        """Pass the keyword inputs straight through to the wrapped Hugging Face model."""
        return self.model(**inputs)

    def training_step(self, batch, batch_idx):
        """Run the model on ``batch``, log the first model output as ``train_loss`` and return it."""
        outputs = self(**batch)
        loss = outputs[0]
        self.log("train_loss", loss)
        return loss

    def training_epoch_end(self, outputs: List[Any]) -> None:
        """Log the current fine-tuning depth when a ``FinetuningScheduler`` callback is attached."""
        if self.finetuningscheduler_callback:
            self.log("finetuning_schedule_depth", float(self.finetuningscheduler_callback.curr_depth))

    def validation_step(self, batch, batch_idx, dataloader_idx=0):
        """Log ``val_loss`` and the task metric(s) computed by ``self.metric`` for one validation batch."""
        outputs = self(**batch)
        val_loss, logits = outputs[:2]
        if self.num_labels > 1:
            # multi-class: take the highest scoring class
            preds = torch.argmax(logits, dim=1)
        else:
            # single output: use the raw value (this branch was unreachable behind the previous ``>= 1`` test)
            preds = logits.squeeze()
        labels = batch["labels"]
        self.log("val_loss", val_loss, prog_bar=True)
        metric_dict = self.metric.compute(predictions=preds, references=labels)
        self.log_dict(metric_dict, prog_bar=True)

    def _init_param_groups(self) -> List[Dict]:
        """Initialize the parameter groups. Used to ensure weight_decay is not applied to our specified bias
        parameters when we initialize the optimizer.

        Only parameters that currently require gradients are included in either group.

        Returns:
            List[Dict]: A list of parameter group dictionaries.
        """
        return [
            {
                "params": [
                    p
                    for n, p in self.model.named_parameters()
                    if not any(nd in n for nd in self.no_decay) and p.requires_grad
                ],
                "weight_decay": self.hparams.optimizer_init["weight_decay"],
            },
            {
                "params": [
                    p
                    for n, p in self.model.named_parameters()
                    if any(nd in n for nd in self.no_decay) and p.requires_grad
                ],
                "weight_decay": 0.0,
            },
        ]

    def configure_optimizers(self):
        """Build the ``AdamW`` optimizer and an epoch-interval ``CosineAnnealingWarmRestarts`` scheduler.

        Returns:
            A ``([optimizer], [scheduler_config])`` pair.
        """
        # the phase 0 parameters will have been set to require gradients during setup
        # you can initialize the optimizer with a simple requires.grad filter as is often done,
        # but in this case we pass a list of parameter groups to ensure weight_decay is
        # not applied to the bias parameter (for completeness, in this case it won't make much
        # performance difference)
        optimizer = AdamW(params=self._init_param_groups(), **self.hparams.optimizer_init)
        scheduler = {
            "scheduler": CosineAnnealingWarmRestarts(optimizer, **self.hparams.lr_scheduler_init),
            "interval": "epoch",
        }
        return [optimizer], [scheduler]


# %% [markdown]
# ### Our Training Sessions
#
# We'll be comparing three different fine-tuning training configurations. Every configuration in this example depends
# upon a shared set of defaults, only differing in their respective fine-tuning schedules.
+# +# | Experiment Tag | Training Scenario Description | +# |:-----------------:| ---------------------------------------------------------------------- | +# | ``fts_explicit`` | Training with a fine-tuning schedule explicitly provided by the user | +# | ``nofts_baseline``| A baseline fine-tuning training session (without scheduled fine-tuning) | +# | ``fts_implicit`` | Training with an implicitly generated fine-tuning schedule (the default) | +# +# Let's begin by configuring the ``fts_explicit`` scenario. We'll subsequently run the other two scenarios for +# comparison. + +# %% +# Let's create a fine-tuning schedule for our model and run an explicitly scheduled fine-tuning training scenario with it +# Please see the [FinetuningScheduler documentation](https://finetuning-scheduler.readthedocs.io/en/stable/index.html) for a full description of the schedule format + + +ft_schedule_yaml = """ +0: + params: + - model.classifier.bias + - model.classifier.weight + - model.pooler.dense.bias + - model.pooler.dense.weight + - model.deberta.encoder.LayerNorm.bias + - model.deberta.encoder.LayerNorm.weight + - model.deberta.encoder.rel_embeddings.weight + - model.deberta.encoder.layer.{0,11}.(output|attention|intermediate).* +1: + params: + - model.deberta.embeddings.LayerNorm.bias + - model.deberta.embeddings.LayerNorm.weight +2: + params: + - model.deberta.embeddings.word_embeddings.weight +""" +ft_schedule_name = "RteBoolqModule_ft_schedule_deberta_base.yaml" +# Let's write the schedule to a file so we can simulate loading an explicitly defined fine-tuning +# schedule. +with open(ft_schedule_name, "w") as f: + f.write(ft_schedule_yaml) + +# %% +datasets.logging.disable_progress_bar() +pl.seed_everything(42) +dm = RteBoolqDataModule(model_name_or_path="microsoft/deberta-v3-base", tokenizers_parallelism=True) + +# %% [markdown] +# ### Optimizer Configuration +# +#
+# +# Though other optimizers can arguably yield some marginal advantage contingent on the context, +# the Adam optimizer (and the [AdamW version](https://pytorch.org/docs/stable/_modules/torch/optim/adamw.html#AdamW) which +# implements decoupled weight decay) remains robust to hyperparameter choices and is commonly used for fine-tuning +# foundation language models. See [(Sivaprasad et al., 2020)](#f2) and [(Mosbach, Andriushchenko & Klakow, 2020)](#f3) for theoretical and systematic empirical justifications of Adam and its use in fine-tuning +# large transformer-based language models. The values used here have some justification +# in the referenced literature but have been largely empirically determined and, while a good +# starting point, could be further tuned. +# +#
+ +# %% +optimizer_init = {"weight_decay": 1e-05, "eps": 1e-07, "lr": 1e-05} + +# %% [markdown] +# ### LR Scheduler Configuration +# +#
+# +# The [CosineAnnealingWarmRestarts scheduler](https://pytorch.org/docs/stable/generated/torch.optim.lr_scheduler.CosineAnnealingWarmRestarts.html?highlight=cosineannealingwarm#torch.optim.lr_scheduler.CosineAnnealingWarmRestarts) nicely fits with our iterative fine-tuning since it does not depend upon a global max_epoch +# value. The importance of initial warmup is reduced due to the innate warmup effect of Adam bias correction [[5]](#f3) +# and the gradual thawing we are performing. Note that commonly used LR schedulers that depend on providing +# max_iterations/epochs (e.g. the +# [CosineWarmupScheduler](https://github.com/Lightning-AI/tutorials/blob/0c325829101d5a6ebf32ed99bbf5b09badf04a59/course_UvA-DL/05-transformers-and-MH-attention/Transformers_MHAttention.py#L688) +# used in other pytorch-lightning tutorials) also work with FinetuningScheduler. Though the LR scheduler is theoretically +# justified [(Loshchilov & Hutter, 2016)](#f4), the particular values provided here are primarily empirically driven. +# +# [FinetuningScheduler](https://finetuning-scheduler.readthedocs.io/en/stable/api/finetuning_scheduler.fts.html#finetuning_scheduler.fts.FinetuningScheduler) also supports LR scheduler +# reinitialization in both explicit and implicit finetuning schedule modes. See the [advanced usage documentation](https://finetuning-scheduler.readthedocs.io/en/stable/advanced/lr_scheduler_reinitialization.html) for explanations and demonstration of the extension's support for more complex requirements. +#
+ + +# %% +lr_scheduler_init = {"T_0": 1, "T_mult": 2, "eta_min": 1e-07} + +# %% +# Load our lightning module... +lightning_module_kwargs = { + "model_name_or_path": "microsoft/deberta-v3-base", + "optimizer_init": optimizer_init, + "lr_scheduler_init": lr_scheduler_init, +} +model = RteBoolqModule(**lightning_module_kwargs, experiment_tag="fts_explicit") + +# %% [markdown] +# ### Callback Configuration +# +# The only callback required to invoke the [FinetuningScheduler](https://finetuning-scheduler.readthedocs.io/en/stable/api/finetuning_scheduler.fts.html#finetuning_scheduler.fts.FinetuningScheduler) is the [FinetuningScheduler](https://finetuning-scheduler.readthedocs.io/en/stable/api/finetuning_scheduler.fts.html#finetuning_scheduler.fts.FinetuningScheduler) callback itself. +# Default versions of [FTSCheckpoint](https://finetuning-scheduler.readthedocs.io/en/stable/api/finetuning_scheduler.fts_supporters.html#finetuning_scheduler.fts_supporters.FTSCheckpoint) and [FTSEarlyStopping](https://finetuning-scheduler.readthedocs.io/en/stable/api/finetuning_scheduler.fts_supporters.html#finetuning_scheduler.fts_supporters.FTSEarlyStopping) +# (if not specifying ``epoch_only_transitions``) will be included ([as discussed above](#basic_usage)) if not provided +# in the callbacks list. For demonstration purposes I'm including example configurations of all three callbacks below. 
# %%
# let's save our callback configurations for the explicit scenario since we'll be reusing the same
# configurations for the implicit and nofts_baseline scenarios (except the config for the
# FinetuningScheduler callback itself of course in the case of nofts_baseline)
earlystopping_kwargs = {"monitor": "val_loss", "min_delta": 0.001, "patience": 2}
checkpoint_kwargs = {"monitor": "val_loss", "save_top_k": 1}
fts_kwargs = {"max_depth": 1}
callbacks = [
    fts.FinetuningScheduler(ft_schedule=ft_schedule_name, **fts_kwargs),
    fts.FTSEarlyStopping(**earlystopping_kwargs),
    fts.FTSCheckpoint(**checkpoint_kwargs),
]

# %%
logger = TensorBoardLogger("lightning_logs", name="fts_explicit")
# optionally start tensorboard and monitor progress graphically while viewing multi-phase fine-tuning specific training
# logs in the cell output below by uncommenting the next 2 lines
# # %load_ext tensorboard
# # %tensorboard --logdir lightning_logs
# disable progress bar by default to focus on multi-phase training logs. Set to True to re-enable if desired
enable_progress_bar = False

# %%


def train() -> None:
    """Fit the current module-level ``model`` on ``dm`` with a freshly built ``Trainer``.

    The trainer is configured from the module-level ``enable_progress_bar``, ``callbacks`` and ``logger`` values as
    they are at call time, so rebinding those names before calling changes the scenario that is trained.
    """
    # request a single device when CUDA is available, otherwise leave the device choice unset
    device_count = 1 if is_cuda_available() else None
    trainer_kwargs = {
        "enable_progress_bar": enable_progress_bar,
        "max_epochs": 100,
        "precision": 16,
        "accelerator": "auto",
        "devices": device_count,
        "callbacks": callbacks,
        "logger": logger,
    }
    pl.Trainer(**trainer_kwargs).fit(model, datamodule=dm)


print(
    "Note given the computation associated w/ the multiple phases of fine-tuning demonstrated, this notebook is best used with an accelerator"
)
train()

# %% [markdown]
# ### Running the Baseline and Implicit Fine-Tuning Scenarios
#
# Let's now compare our ``nofts_baseline`` and ``fts_implicit`` scenarios with the ``fts_explicit`` one we just ran.
#
# We'll need to update our callbacks list, using the core PL ``EarlyStopping`` and ``ModelCheckpoint`` callbacks for the
# ``nofts_baseline`` (which operate identically to their FTS analogs apart from the recursive training support).
+# For both core PyTorch Lightning and user-registered callbacks, we can define our callbacks using a dictionary as we do +# with the LightningCLI. This allows us to avoid managing imports and support more complex configuration separated from +# code. +# +# Note that we'll be using identical callback configurations to the ``fts_explicit`` scenario. Keeping [max_depth](https://finetuning-scheduler.readthedocs.io/en/stable/api/finetuning_scheduler.fts.html?highlight=max_depth#finetuning_scheduler.fts.FinetuningScheduler.params.max_depth) for +# the implicit schedule will limit fine-tuning to just the last 4 parameters of the model, which is only a small fraction +# of the parameters you'd want to tune for maximum performance. Since the implicit schedule is quite computationally +# intensive and most useful for exploring model behavior, leaving [max_depth](https://finetuning-scheduler.readthedocs.io/en/stable/api/finetuning_scheduler.fts.html?highlight=max_depth#finetuning_scheduler.fts.FinetuningScheduler.params.max_depth) at 1 allows us to demo implicit mode +# behavior while keeping the computational cost and runtime of this notebook reasonable. To review how a full implicit +# mode run compares to the ``nofts_baseline`` and ``fts_explicit`` scenarios, please see the following +# [tensorboard experiment summary](https://tensorboard.dev/experiment/n7U8XhrzRbmvVzC4SQSpWw/).
# %%
nofts_callbacks = [EarlyStopping(**earlystopping_kwargs), ModelCheckpoint(**checkpoint_kwargs)]
fts_implicit_callbacks = [
    fts.FinetuningScheduler(**fts_kwargs),
    fts.FTSEarlyStopping(**earlystopping_kwargs),
    fts.FTSCheckpoint(**checkpoint_kwargs),
]
scenario_callbacks = {"nofts_baseline": nofts_callbacks, "fts_implicit": fts_implicit_callbacks}

# %%
# ``train()`` reads the module-level ``model``, ``logger`` and ``callbacks`` names, so each iteration rebinds them.
# The loop target is ``callbacks`` itself rather than ``scenario_callbacks``: reusing the dict's own name as the loop
# variable would replace the dict with a list and make this cell fail if it were executed a second time.
for scenario_name, callbacks in scenario_callbacks.items():
    model = RteBoolqModule(**lightning_module_kwargs, experiment_tag=scenario_name)
    logger = TensorBoardLogger("lightning_logs", name=scenario_name)
    print(f"Beginning training the '{scenario_name}' scenario")
    train()

# %% [markdown]
# ### Reviewing the Training Results
#
# See the [tensorboard experiment summaries](https://tensorboard.dev/experiment/n7U8XhrzRbmvVzC4SQSpWw/) to get a sense
# of the relative computational and performance tradeoffs associated with these [FinetuningScheduler](https://finetuning-scheduler.readthedocs.io/en/stable/api/finetuning_scheduler.fts.html#finetuning_scheduler.fts.FinetuningScheduler) configurations.
# The summary compares a full ``fts_implicit`` execution to ``fts_explicit`` and ``nofts_baseline`` scenarios using DDP
# training with 2 GPUs. The full logs/schedules and detailed system configuration used for all three scenarios are available
# [here](https://drive.google.com/file/d/1LrUcisRLHeJgh_BDOOD_GUBPp5iHAkoR/view?usp=sharing) and the checkpoints
# produced in the scenarios [here](https://drive.google.com/file/d/1t7myBgcqcZ9ax_IT9QVk-vFH_l_o5UXB/view?usp=sharing)
# (caution, ~3.5GB).
+# +# [![fts_explicit_accuracy](fts_explicit_accuracy.png){height="315px" width="492px"}](https://tensorboard.dev/experiment/n7U8XhrzRbmvVzC4SQSpWw/#scalars&_smoothingWeight=0&runSelectionState=eyJmdHNfZXhwbGljaXQiOnRydWUsIm5vZnRzX2Jhc2VsaW5lIjpmYWxzZSwiZnRzX2ltcGxpY2l0IjpmYWxzZX0%3D) +# [![nofts_baseline](nofts_baseline_accuracy.png){height="316px" width="505px"}](https://tensorboard.dev/experiment/n7U8XhrzRbmvVzC4SQSpWw/#scalars&_smoothingWeight=0&runSelectionState=eyJmdHNfZXhwbGljaXQiOmZhbHNlLCJub2Z0c19iYXNlbGluZSI6dHJ1ZSwiZnRzX2ltcGxpY2l0IjpmYWxzZX0%3D) +# +# Note that the results above may vary to a small degree from the tensorboard summaries generated by this notebook +# which used DP, 1 GPU and likely when you're running this, different versions of certain software components (e.g. pytorch, transformers). +# +# [FinetuningScheduler](https://finetuning-scheduler.readthedocs.io/en/stable/api/finetuning_scheduler.fts.html#finetuning_scheduler.fts.FinetuningScheduler) expands the space of possible fine-tuning schedules and the composition of more sophisticated schedules can +# yield marginal fine-tuning performance gains. That stated, it should be emphasized the primary utility of [FinetuningScheduler](https://finetuning-scheduler.readthedocs.io/en/stable/api/finetuning_scheduler.fts.html#finetuning_scheduler.fts.FinetuningScheduler) is to grant +# greater fine-tuning flexibility for model exploration in research. For example, glancing at DeBERTa-v3's implicit training +# run, a critical tuning transition point is immediately apparent: +# +# [![implicit_training_transition](implicit_training_transition.png){height="272px" width="494px"}](https://tensorboard.dev/experiment/n7U8XhrzRbmvVzC4SQSpWw/#scalars&_smoothingWeight=0&runSelectionState=eyJmdHNfZXhwbGljaXQiOmZhbHNlLCJub2Z0c19iYXNlbGluZSI6ZmFsc2UsImZ0c19pbXBsaWNpdCI6dHJ1ZX0%3D) +# +# Our `val_loss` begins a precipitous decline at step 3119 which corresponds to phase 17 in the schedule. 
Referring to our +# schedule, in phase 17 we're beginning tuning the attention parameters of our 10th encoder layer (of 11). Interesting! +# Though beyond the scope of this tutorial, it might be worth investigating these dynamics further and +# [FinetuningScheduler](https://finetuning-scheduler.readthedocs.io/en/stable/api/finetuning_scheduler.fts.html#finetuning_scheduler.fts.FinetuningScheduler) allows one to do just that quite easily. +# +# %% [markdown] +# +# Note that though this example is intended to capture a common usage scenario, substantial variation is expected +# among use cases and models. +# In summary, [FinetuningScheduler](https://finetuning-scheduler.readthedocs.io/en/stable/api/finetuning_scheduler.fts.html#finetuning_scheduler.fts.FinetuningScheduler) provides increased fine-tuning flexibility that can be useful in a variety of +# contexts from exploring model tuning behavior to maximizing performance. +# %% [markdown] +# ## Footnotes +# +#
    +#
  1. +# +# [Howard, J., & Ruder, S. (2018)](https://arxiv.org/pdf/1801.06146.pdf). Fine-tuned Language +# Models for Text Classification. ArXiv, abs/1801.06146. [↩](#a1) +# +#
  2. +#
  3. +# +# [Chronopoulou, A., Baziotis, C., & Potamianos, A. (2019)](https://arxiv.org/pdf/1902.10547.pdf). +# An embarrassingly simple approach for transfer learning from pretrained language models. arXiv +# preprint arXiv:1902.10547. [↩](#a1) +# +#
  4. +#
  5. +# +# [Peters, M. E., Ruder, S., & Smith, N. A. (2019)](https://arxiv.org/pdf/1903.05987.pdf). To tune or not to +# tune? adapting pretrained representations to diverse tasks. arXiv preprint arXiv:1903.05987. [↩](#a1) +# +#
  6. +#
  7. +# +# [Sivaprasad, P. T., Mai, F., Vogels, T., Jaggi, M., & Fleuret, F. (2020)](https://arxiv.org/pdf/1910.11758.pdf). +# Optimizer benchmarking needs to account for hyperparameter tuning. In International Conference on Machine Learning +# (pp. 9036-9045). PMLR. [↩](#a2) +# +#
  8. +#
  9. +# +# [Mosbach, M., Andriushchenko, M., & Klakow, D. (2020)](https://arxiv.org/pdf/2006.04884.pdf). On the stability of +# fine-tuning bert: Misconceptions, explanations, and strong baselines. arXiv preprint arXiv:2006.04884. [↩](#a2) +# +#
  10. +#
  11. +# +# [Loshchilov, I., & Hutter, F. (2016)](https://arxiv.org/pdf/1608.03983.pdf). Sgdr: Stochastic gradient descent with +# warm restarts. arXiv preprint arXiv:1608.03983. [↩](#a3) +# +#
  12. +# +#
+ +# %% [markdown] +# diff --git a/_notebooks/lightning_examples/finetuning-scheduler/fts_explicit_accuracy.png b/_notebooks/lightning_examples/finetuning-scheduler/fts_explicit_accuracy.png new file mode 100644 index 0000000..b5d8f55 Binary files /dev/null and b/_notebooks/lightning_examples/finetuning-scheduler/fts_explicit_accuracy.png differ diff --git a/_notebooks/lightning_examples/finetuning-scheduler/fts_explicit_loss_anim.gif b/_notebooks/lightning_examples/finetuning-scheduler/fts_explicit_loss_anim.gif new file mode 100644 index 0000000..7451f65 Binary files /dev/null and b/_notebooks/lightning_examples/finetuning-scheduler/fts_explicit_loss_anim.gif differ diff --git a/_notebooks/lightning_examples/finetuning-scheduler/implicit_training_transition.png b/_notebooks/lightning_examples/finetuning-scheduler/implicit_training_transition.png new file mode 100644 index 0000000..6854dbf Binary files /dev/null and b/_notebooks/lightning_examples/finetuning-scheduler/implicit_training_transition.png differ diff --git a/_notebooks/lightning_examples/finetuning-scheduler/logo_fts.png b/_notebooks/lightning_examples/finetuning-scheduler/logo_fts.png new file mode 100644 index 0000000..02e14a3 Binary files /dev/null and b/_notebooks/lightning_examples/finetuning-scheduler/logo_fts.png differ diff --git a/_notebooks/lightning_examples/finetuning-scheduler/nofts_baseline_accuracy.png b/_notebooks/lightning_examples/finetuning-scheduler/nofts_baseline_accuracy.png new file mode 100644 index 0000000..b78f8c6 Binary files /dev/null and b/_notebooks/lightning_examples/finetuning-scheduler/nofts_baseline_accuracy.png differ diff --git a/_notebooks/lightning_examples/finetuning-scheduler/side_by_side_yaml.png b/_notebooks/lightning_examples/finetuning-scheduler/side_by_side_yaml.png new file mode 100644 index 0000000..3a32a1f Binary files /dev/null and b/_notebooks/lightning_examples/finetuning-scheduler/side_by_side_yaml.png differ diff --git 
a/_notebooks/lightning_examples/mnist-hello-world/.meta.yml b/_notebooks/lightning_examples/mnist-hello-world/.meta.yml new file mode 100644 index 0000000..ae9f221 --- /dev/null +++ b/_notebooks/lightning_examples/mnist-hello-world/.meta.yml @@ -0,0 +1,19 @@ +title: Introduction to PyTorch Lightning +author: PL team +created: 2020-12-21 +updated: 2023-05-15 +license: CC BY-SA +build: 0 +tags: + - Image +description: In this notebook, we'll go over the basics of lightning by preparing + models to train on the [MNIST Handwritten Digits dataset](https://en.wikipedia.org/wiki/MNIST_database). +requirements: + - torchvision + - torchmetrics >=0.11.0 + - pandas + - seaborn + - lightning>=2.0.0rc0 +accelerator: + - CPU + - GPU diff --git a/_notebooks/lightning_examples/mnist-hello-world/hello-world.py b/_notebooks/lightning_examples/mnist-hello-world/hello-world.py new file mode 100644 index 0000000..cd6c6ef --- /dev/null +++ b/_notebooks/lightning_examples/mnist-hello-world/hello-world.py @@ -0,0 +1,238 @@ +# %% +import os + +import lightning as L +import pandas as pd +import seaborn as sn +import torch +from IPython.display import display +from lightning.pytorch.loggers import CSVLogger +from torch import nn +from torch.nn import functional as F +from torch.utils.data import DataLoader, random_split +from torchmetrics import Accuracy +from torchvision import transforms +from torchvision.datasets import MNIST + +PATH_DATASETS = os.environ.get("PATH_DATASETS", ".") +BATCH_SIZE = 256 if torch.cuda.is_available() else 64 + +# %% [markdown] +# ## Simplest example +# +# Here's the simplest most minimal example with just a training loop (no validation, no testing). +# +# **Keep in Mind** - A `LightningModule` *is* a PyTorch `nn.Module` - it just has a few more helpful features. 
# %%
class MNISTModel(L.LightningModule):
    """Single linear layer MNIST classifier with only a training loop defined."""

    def __init__(self):
        super().__init__()
        # 28 * 28 flattened pixel inputs mapped to 10 outputs
        self.l1 = torch.nn.Linear(28 * 28, 10)

    def forward(self, x):
        """Flatten each sample in ``x`` and return the ReLU of the linear layer's output."""
        flattened = x.view(x.size(0), -1)
        return torch.relu(self.l1(flattened))

    def training_step(self, batch, batch_nb):
        """Return the cross-entropy between the model output for the batch inputs and the batch targets."""
        inputs, targets = batch
        return F.cross_entropy(self(inputs), targets)

    def configure_optimizers(self):
        """Return an Adam optimizer over all parameters with a learning rate of 0.02."""
        return torch.optim.Adam(self.parameters(), lr=0.02)


# %% [markdown]
# By using the `Trainer` you automatically get:
# 1. Tensorboard logging
# 2. Model checkpointing
# 3. Training and validation loop
# 4. early-stopping

# %%
# Init our model
mnist_model = MNISTModel()

# Init DataLoader from MNIST Dataset
train_ds = MNIST(PATH_DATASETS, train=True, download=True, transform=transforms.ToTensor())
train_loader = DataLoader(train_ds, batch_size=BATCH_SIZE)

# Initialize a trainer
trainer = L.Trainer(accelerator="auto", devices=1, max_epochs=3)

# Train the model ⚡
trainer.fit(mnist_model, train_loader)

# %% [markdown]
# ## A more complete MNIST Lightning Module Example
#
# That wasn't so hard was it?
#
# Now that we've got our feet wet, let's dive in a bit deeper and write a more complete `LightningModule` for MNIST...
#
# This time, we'll bake in all the dataset specific pieces directly in the `LightningModule`.
# This way, we can avoid writing extra code at the beginning of our script every time we want to run it.
#
# ---
#
# ### Note what the following built-in functions are doing:
#
# 1. [prepare_data()](https://lightning.ai/docs/pytorch/stable/common/lightning_module.html#prepare-data) 💾
#     - This is where we can download the dataset. We point to our desired dataset and ask torchvision's `MNIST` dataset class to download if the dataset isn't found there.
#     - **Note we do not make any state assignments in this function** (i.e. `self.something = ...`)
#
# 2.
class LitMNIST(L.LightningModule):
    """MNIST classifier that bundles the model, its metrics and the data hooks."""

    def __init__(self, data_dir=PATH_DATASETS, hidden_size=64, learning_rate=2e-4):
        super().__init__()

        # Keep the constructor arguments around as plain attributes.
        self.data_dir = data_dir
        self.hidden_size = hidden_size
        self.learning_rate = learning_rate

        # Dataset-specific constants.
        self.num_classes = 10
        self.dims = (1, 28, 28)
        channels, width, height = self.dims
        to_tensor = transforms.ToTensor()
        normalize = transforms.Normalize((0.1307,), (0.3081,))
        self.transform = transforms.Compose([to_tensor, normalize])

        # MLP over the flattened image; layers are listed in application order.
        flat_features = channels * width * height
        layers = [
            nn.Flatten(),
            nn.Linear(flat_features, hidden_size),
            nn.ReLU(),
            nn.Dropout(0.1),
            nn.Linear(hidden_size, hidden_size),
            nn.ReLU(),
            nn.Dropout(0.1),
            nn.Linear(hidden_size, self.num_classes),
        ]
        self.model = nn.Sequential(*layers)

        # Separate metric objects for the validation and test loops.
        self.val_accuracy = Accuracy(task="multiclass", num_classes=self.num_classes)
        self.test_accuracy = Accuracy(task="multiclass", num_classes=self.num_classes)

    def forward(self, x):
        """Return log-probabilities over the classes for the batch ``x``."""
        scores = self.model(x)
        return F.log_softmax(scores, dim=1)

    def training_step(self, batch, batch_idx):
        """Return the negative log-likelihood loss for one batch."""
        inputs, targets = batch
        log_probs = self(inputs)
        return F.nll_loss(log_probs, targets)

    def validation_step(self, batch, batch_idx):
        """Update the validation accuracy and log ``val_loss`` / ``val_acc``."""
        inputs, targets = batch
        log_probs = self(inputs)
        step_loss = F.nll_loss(log_probs, targets)
        predicted = log_probs.argmax(dim=1)
        self.val_accuracy.update(predicted, targets)

        # Both values are logged and also shown in the progress bar.
        self.log("val_loss", step_loss, prog_bar=True)
        self.log("val_acc", self.val_accuracy, prog_bar=True)

    def test_step(self, batch, batch_idx):
        """Update the test accuracy and log ``test_loss`` / ``test_acc``."""
        inputs, targets = batch
        log_probs = self(inputs)
        step_loss = F.nll_loss(log_probs, targets)
        predicted = log_probs.argmax(dim=1)
        self.test_accuracy.update(predicted, targets)

        # Both values are logged and also shown in the progress bar.
        self.log("test_loss", step_loss, prog_bar=True)
        self.log("test_acc", self.test_accuracy, prog_bar=True)

    def configure_optimizers(self):
        """Build an Adam optimizer using the stored learning rate."""
        return torch.optim.Adam(self.parameters(), lr=self.learning_rate)

    ####################
    # DATA RELATED HOOKS
    ####################

    def prepare_data(self):
        """Download the MNIST train and test sets; no state is assigned here."""
        for is_train in (True, False):
            MNIST(self.data_dir, train=is_train, download=True)

    def setup(self, stage=None):
        """Create the datasets needed for ``stage`` (both when ``stage`` is None)."""
        # Train/val split of the 60000-sample training set.
        if stage in ("fit", None):
            full_train = MNIST(self.data_dir, train=True, transform=self.transform)
            train_part, val_part = random_split(full_train, [55000, 5000])
            self.mnist_train = train_part
            self.mnist_val = val_part

        # Held-out test set.
        if stage in ("test", None):
            self.mnist_test = MNIST(self.data_dir, train=False, transform=self.transform)

    def train_dataloader(self):
        """Return the loader over the training split."""
        return DataLoader(dataset=self.mnist_train, batch_size=BATCH_SIZE)

    def val_dataloader(self):
        """Return the loader over the validation split."""
        return DataLoader(dataset=self.mnist_val, batch_size=BATCH_SIZE)

    def test_dataloader(self):
        """Return the loader over the test set."""
        return DataLoader(dataset=self.mnist_test, batch_size=BATCH_SIZE)
accelerator="auto", + devices=1, + max_epochs=3, + logger=CSVLogger(save_dir="logs/"), +) +trainer.fit(model) + +# %% [markdown] +# ### Testing +# +# To test a model, call `trainer.test(model)`. +# +# Or, if you've just trained a model, you can just call `trainer.test()` and Lightning will automatically +# test using the best saved checkpoint (conditioned on val_loss). + +# %% +trainer.test() + +# %% [markdown] +# ### Bonus Tip +# +# You can keep calling `trainer.fit(model)` as many times as you'd like to continue training + +# %% +trainer.fit(model) + +# %% [markdown] +# In Colab, you can use the TensorBoard magic function to view the logs that Lightning has created for you! + +# %% + +metrics = pd.read_csv(f"{trainer.logger.log_dir}/metrics.csv") +del metrics["step"] +metrics.set_index("epoch", inplace=True) +display(metrics.dropna(axis=1, how="all").head()) +sn.relplot(data=metrics, kind="line") diff --git a/_notebooks/lightning_examples/mnist-tpu-training/.meta.yml b/_notebooks/lightning_examples/mnist-tpu-training/.meta.yml new file mode 100644 index 0000000..7c82362 --- /dev/null +++ b/_notebooks/lightning_examples/mnist-tpu-training/.meta.yml @@ -0,0 +1,16 @@ +title: TPU training with PyTorch Lightning +author: PL team +created: 2020-12-21 +updated: 2023-05-15 +license: CC BY-SA +build: 0 +tags: + - Image +description: In this notebook, we'll train a model on TPUs. Updating one Trainer flag is all you need for that. + The most up to documentation related to TPU training can be found + [here](https://lightning.ai/docs/pytorch/stable/accelerators/tpu.html). 
+requirements: + - torchvision + - lightning>=2.0.0rc0 +accelerator: + - TPU diff --git a/_notebooks/lightning_examples/mnist-tpu-training/mnist-tpu.py b/_notebooks/lightning_examples/mnist-tpu-training/mnist-tpu.py new file mode 100644 index 0000000..f0d7427 --- /dev/null +++ b/_notebooks/lightning_examples/mnist-tpu-training/mnist-tpu.py @@ -0,0 +1,174 @@ +# %% [markdown] +# ### Install Colab TPU compatible PyTorch/TPU wheels and dependencies + +# %% +# ! pip install cloud-tpu-client==0.10 https://storage.googleapis.com/tpu-pytorch/wheels/torch_xla-1.8-cp37-cp37m-linux_x86_64.whl + +import lightning as L + +# %% +import torch +import torch.nn.functional as F +from torch import nn +from torch.utils.data import DataLoader, random_split +from torchmetrics.functional import accuracy +from torchvision import transforms + +# Note - you must have torchvision installed for this example +from torchvision.datasets import MNIST + +BATCH_SIZE = 1024 + +# %% [markdown] +# ### Defining The `MNISTDataModule` +# +# Below we define `MNISTDataModule`. You can learn more about datamodules +# in [docs](https://lightning.ai/docs/pytorch/stable/data/datamodule.html). 
class MNISTDataModule(L.LightningDataModule):
    """Data module that downloads MNIST and serves train/val/test loaders."""

    def __init__(self, data_dir: str = "./"):
        super().__init__()
        self.data_dir = data_dir
        to_tensor = transforms.ToTensor()
        normalize = transforms.Normalize((0.1307,), (0.3081,))
        self.transform = transforms.Compose([to_tensor, normalize])

        # Dataset constants that the notebook reads to size the model.
        self.dims = (1, 28, 28)
        self.num_classes = 10

    def prepare_data(self):
        """Download the MNIST train and test sets into ``data_dir``."""
        for is_train in (True, False):
            MNIST(self.data_dir, train=is_train, download=True)

    def setup(self, stage=None):
        """Create the datasets needed for ``stage`` (both when ``stage`` is None)."""
        # Train/val split of the training set.
        if stage in ("fit", None):
            full_train = MNIST(self.data_dir, train=True, transform=self.transform)
            train_part, val_part = random_split(full_train, [55000, 5000])
            self.mnist_train = train_part
            self.mnist_val = val_part

        # Held-out test set.
        if stage in ("test", None):
            self.mnist_test = MNIST(self.data_dir, train=False, transform=self.transform)

    def train_dataloader(self):
        """Return the loader over the training split."""
        return DataLoader(dataset=self.mnist_train, batch_size=BATCH_SIZE)

    def val_dataloader(self):
        """Return the loader over the validation split."""
        return DataLoader(dataset=self.mnist_val, batch_size=BATCH_SIZE)

    def test_dataloader(self):
        """Return the loader over the test set."""
        return DataLoader(dataset=self.mnist_test, batch_size=BATCH_SIZE)
class LitModel(L.LightningModule):
    """MLP classifier over flattened images, trained with NLL loss.

    Args:
        channels: number of input channels.
        width: input width in pixels.
        height: input height in pixels.
        num_classes: number of output classes.
        hidden_size: width of the two hidden layers.
        learning_rate: learning rate passed to Adam.
    """

    def __init__(self, channels, width, height, num_classes, hidden_size=64, learning_rate=2e-4):
        super().__init__()

        # Stores every constructor argument under ``self.hparams``.
        self.save_hyperparameters()

        self.model = nn.Sequential(
            nn.Flatten(),
            nn.Linear(channels * width * height, hidden_size),
            nn.ReLU(),
            nn.Dropout(0.1),
            nn.Linear(hidden_size, hidden_size),
            nn.ReLU(),
            nn.Dropout(0.1),
            nn.Linear(hidden_size, num_classes),
        )

    def forward(self, x):
        """Return log-probabilities over the classes for the batch ``x``."""
        x = self.model(x)
        return F.log_softmax(x, dim=1)

    def training_step(self, batch, batch_idx):
        """Compute, log (``train_loss``) and return the NLL loss for one batch."""
        x, y = batch
        logits = self(x)
        loss = F.nll_loss(logits, y)
        self.log("train_loss", loss)
        return loss

    def validation_step(self, batch, batch_idx):
        """Log ``val_loss`` and ``val_acc`` for one validation batch."""
        x, y = batch
        logits = self(x)
        loss = F.nll_loss(logits, y)
        preds = torch.argmax(logits, dim=1)
        # torchmetrics >= 0.11 requires the task to be stated explicitly;
        # calling ``accuracy(preds, y)`` alone raises a TypeError there.
        acc = accuracy(preds, y, task="multiclass", num_classes=self.hparams.num_classes)
        self.log("val_loss", loss, prog_bar=True)
        self.log("val_acc", acc, prog_bar=True)

    def configure_optimizers(self):
        """Build an Adam optimizer using the saved ``learning_rate`` hyperparameter."""
        optimizer = torch.optim.Adam(self.parameters(), lr=self.hparams.learning_rate)
        return optimizer
+ +# %% +# Init DataModule +dm = MNISTDataModule() +# Init model from datamodule's attributes +model = LitModel(*dm.dims, dm.num_classes) +# Init trainer +trainer = L.Trainer( + max_epochs=3, + accelerator="tpu", + devices=1, +) +# Train +trainer.fit(model, dm) + +# %% [markdown] +# Train on 8 TPU cores with `accelerator='tpu'` and `devices=8`. +# You might have to restart the notebook to run it on 8 TPU cores after training on single TPU core. + +# %% +# Init DataModule +dm = MNISTDataModule() +# Init model from datamodule's attributes +model = LitModel(*dm.dims, dm.num_classes) +# Init trainer +trainer = L.Trainer( + max_epochs=3, + accelerator="tpu", + devices=8, +) +# Train +trainer.fit(model, dm) diff --git a/_notebooks/lightning_examples/reinforce-learning-DQN/.meta.yml b/_notebooks/lightning_examples/reinforce-learning-DQN/.meta.yml new file mode 100644 index 0000000..abf466a --- /dev/null +++ b/_notebooks/lightning_examples/reinforce-learning-DQN/.meta.yml @@ -0,0 +1,23 @@ +title: How to train a Deep Q Network +author: PL team +created: 2021-01-31 +updated: 2021-12-03 +license: CC BY-SA +build: 2 +tags: + - RL +description: | + Main takeaways: + + 1. RL has the same flow as previous models we have seen, with a few additions + 2. Handle unsupervised learning by using an IterableDataset where the dataset itself is constantly updated during training + 3. 
class ReplayBuffer:
    """Replay Buffer for storing past experiences allowing the agent to learn from them.

    The buffer is a bounded deque: once ``capacity`` items are stored, appending
    a new experience drops the oldest one.

    Args:
        capacity: size of the buffer
    """

    def __init__(self, capacity: int) -> None:
        self.buffer = deque(maxlen=capacity)

    def __len__(self) -> int:
        """Return the number of experiences currently stored."""
        return len(self.buffer)

    def append(self, experience: "Experience") -> None:
        """Add experience to the buffer.

        Args:
            experience: tuple (state, action, reward, done, new_state)
        """
        self.buffer.append(experience)

    def sample(self, batch_size: int) -> Tuple:
        """Draw ``batch_size`` distinct experiences uniformly at random.

        Args:
            batch_size: number of experiences to draw (without replacement)

        Returns:
            Tuple of arrays ``(states, actions, rewards, dones, next_states)``;
            rewards are cast to ``float32`` and dones to ``bool``.

        Raises:
            ValueError: if ``batch_size`` exceeds the number of stored experiences.
        """
        available = len(self.buffer)
        if batch_size > available:
            # Sampling without replacement cannot return more items than exist;
            # fail with a message that names the buffer instead of NumPy internals.
            raise ValueError(
                f"Cannot sample {batch_size} experiences from a buffer holding only {available}"
            )

        indices = np.random.choice(available, batch_size, replace=False)
        # Transpose the list of experience tuples into one sequence per field.
        states, actions, rewards, dones, next_states = zip(*(self.buffer[idx] for idx in indices))

        return (
            np.array(states),
            np.array(actions),
            np.array(rewards, dtype=np.float32),
            np.array(dones, dtype=bool),
            np.array(next_states),
        )
class DQNLightning(LightningModule):
    """Basic DQN Model.

    Owns the gym environment, the online and target Q-networks, the replay
    buffer and the agent, and fills the buffer with random steps on construction.
    """

    def __init__(
        self,
        batch_size: int = 16,
        lr: float = 1e-2,
        env: str = "CartPole-v0",
        gamma: float = 0.99,
        sync_rate: int = 10,
        replay_size: int = 1000,
        warm_start_size: int = 1000,
        eps_last_frame: int = 1000,
        eps_start: float = 1.0,
        eps_end: float = 0.01,
        episode_length: int = 200,
        warm_start_steps: int = 1000,
    ) -> None:
        """
        Args:
            batch_size: size of the batches
            lr: learning rate
            env: gym environment tag
            gamma: discount factor
            sync_rate: how many frames do we update the target network
            replay_size: capacity of the replay buffer
            warm_start_size: saved as a hyperparameter but not read anywhere in this class
            eps_last_frame: what frame should epsilon stop decaying
            eps_start: starting value of epsilon
            eps_end: final value of epsilon
            episode_length: number of experiences the dataset samples per iteration
            warm_start_steps: number of random steps used to pre-fill the replay buffer
        """
        super().__init__()
        self.save_hyperparameters()

        self.env = gym.make(self.hparams.env)
        obs_size = self.env.observation_space.shape[0]
        n_actions = self.env.action_space.n

        # Online network (trained) and target network (periodically overwritten).
        self.net = DQN(obs_size, n_actions)
        self.target_net = DQN(obs_size, n_actions)

        self.buffer = ReplayBuffer(self.hparams.replay_size)
        self.agent = Agent(self.env, self.buffer)
        self.total_reward = 0
        self.episode_reward = 0
        # Pre-fill the buffer so the first training batches have data to sample.
        self.populate(self.hparams.warm_start_steps)

    def populate(self, steps: int = 1000) -> None:
        """Carries out several random steps through the environment to initially fill up the replay buffer with
        experiences.

        Args:
            steps: number of random steps to populate the buffer with
        """
        for _ in range(steps):
            # epsilon=1.0 makes every action a random one.
            self.agent.play_step(self.net, epsilon=1.0)

    def forward(self, x: Tensor) -> Tensor:
        """Passes in a state x through the network and gets the q_values of each action as an output.

        Args:
            x: environment state

        Returns:
            q values
        """
        output = self.net(x)
        return output

    def dqn_mse_loss(self, batch: Tuple[Tensor, ...]) -> Tensor:
        """Calculates the mse loss using a mini batch from the replay buffer.

        Args:
            batch: current mini batch of replay data, unpacked as
                (states, actions, rewards, dones, next_states)

        Returns:
            loss
        """
        states, actions, rewards, dones, next_states = batch

        # Q-value of the action that was actually taken in each state.
        state_action_values = self.net(states).gather(1, actions.long().unsqueeze(-1)).squeeze(-1)

        with torch.no_grad():
            next_state_values = self.target_net(next_states).max(1)[0]
            # Terminal transitions have no future value.
            next_state_values[dones] = 0.0
            next_state_values = next_state_values.detach()

        expected_state_action_values = next_state_values * self.hparams.gamma + rewards

        return nn.MSELoss()(state_action_values, expected_state_action_values)

    def get_epsilon(self, start: float, end: float, frames: int) -> float:
        """Linearly interpolate epsilon from ``start`` to ``end`` over ``frames`` global steps.

        Returns ``end`` once ``global_step`` exceeds ``frames``.
        """
        if self.global_step > frames:
            return end
        return start - (self.global_step / frames) * (start - end)

    def training_step(self, batch: Tuple[Tensor, ...], nb_batch) -> Tensor:
        """Carries out a single step through the environment to update the replay buffer. Then calculates loss
        based on the minibatch received.

        Args:
            batch: current mini batch of replay data
            nb_batch: batch number

        Returns:
            Training loss
        """
        device = self.get_device(batch)
        epsilon = self.get_epsilon(self.hparams.eps_start, self.hparams.eps_end, self.hparams.eps_last_frame)
        self.log("epsilon", epsilon)

        # step through environment with agent
        reward, done = self.agent.play_step(self.net, epsilon, device)
        self.episode_reward += reward
        self.log("episode reward", self.episode_reward)

        # calculates training loss
        loss = self.dqn_mse_loss(batch)

        if done:
            # Episode finished: publish its return and start counting afresh.
            self.total_reward = self.episode_reward
            self.episode_reward = 0

        # Hard update: copy the online network's weights into the target network
        if self.global_step % self.hparams.sync_rate == 0:
            self.target_net.load_state_dict(self.net.state_dict())

        self.log_dict(
            {
                "reward": reward,
                "train_loss": loss,
            }
        )
        self.log("total_reward", self.total_reward, prog_bar=True)
        self.log("steps", self.global_step, logger=False, prog_bar=True)

        return loss

    def configure_optimizers(self) -> Optimizer:
        """Initialize Adam optimizer over the online network's parameters."""
        optimizer = Adam(self.net.parameters(), lr=self.hparams.lr)
        return optimizer

    def __dataloader(self) -> DataLoader:
        """Initialize the Replay Buffer dataset used for retrieving experiences."""
        # ``episode_length`` is handed to RLDataset as its sample size.
        dataset = RLDataset(self.buffer, self.hparams.episode_length)
        dataloader = DataLoader(
            dataset=dataset,
            batch_size=self.hparams.batch_size,
        )
        return dataloader

    def train_dataloader(self) -> DataLoader:
        """Get train loader."""
        return self.__dataloader()

    def get_device(self, batch) -> str:
        """Retrieve device currently being used by minibatch.

        Returns the device index of the first batch element when ``self.on_gpu``
        is true, otherwise the string "cpu".
        """
        # NOTE(review): the GPU branch returns ``device.index`` (not a str) - confirm callers accept it.
        return batch[0].device.index if self.on_gpu else "cpu"
+ (We just show CoLA and MRPC due to constraint on compute/disk) +requirements: + - transformers + - datasets + - scipy + - scikit-learn + - torchtext>=0.9 + - lightning>=2.0.0rc0 +accelerator: + - GPU diff --git a/_notebooks/lightning_examples/text-transformers/text-transformers.py b/_notebooks/lightning_examples/text-transformers/text-transformers.py new file mode 100644 index 0000000..cc04b7f --- /dev/null +++ b/_notebooks/lightning_examples/text-transformers/text-transformers.py @@ -0,0 +1,322 @@ +# %% +from datetime import datetime +from typing import Optional + +import datasets +import torch +from pytorch_lightning import LightningDataModule, LightningModule, Trainer, seed_everything +from torch.utils.data import DataLoader +from transformers import ( + AdamW, + AutoConfig, + AutoModelForSequenceClassification, + AutoTokenizer, + get_linear_schedule_with_warmup, +) + +# %% [markdown] +# ## Training BERT with Lightning + +# %% [markdown] +# ### Lightning DataModule for GLUE + + +# %% +class GLUEDataModule(LightningDataModule): + task_text_field_map = { + "cola": ["sentence"], + "sst2": ["sentence"], + "mrpc": ["sentence1", "sentence2"], + "qqp": ["question1", "question2"], + "stsb": ["sentence1", "sentence2"], + "mnli": ["premise", "hypothesis"], + "qnli": ["question", "sentence"], + "rte": ["sentence1", "sentence2"], + "wnli": ["sentence1", "sentence2"], + "ax": ["premise", "hypothesis"], + } + + glue_task_num_labels = { + "cola": 2, + "sst2": 2, + "mrpc": 2, + "qqp": 2, + "stsb": 1, + "mnli": 3, + "qnli": 2, + "rte": 2, + "wnli": 2, + "ax": 3, + } + + loader_columns = [ + "datasets_idx", + "input_ids", + "token_type_ids", + "attention_mask", + "start_positions", + "end_positions", + "labels", + ] + + def __init__( + self, + model_name_or_path: str, + task_name: str = "mrpc", + max_seq_length: int = 128, + train_batch_size: int = 32, + eval_batch_size: int = 32, + **kwargs, + ): + super().__init__() + self.model_name_or_path = model_name_or_path + 
self.task_name = task_name + self.max_seq_length = max_seq_length + self.train_batch_size = train_batch_size + self.eval_batch_size = eval_batch_size + + self.text_fields = self.task_text_field_map[task_name] + self.num_labels = self.glue_task_num_labels[task_name] + self.tokenizer = AutoTokenizer.from_pretrained(self.model_name_or_path, use_fast=True) + + def setup(self, stage: str): + self.dataset = datasets.load_dataset("glue", self.task_name) + + for split in self.dataset.keys(): + self.dataset[split] = self.dataset[split].map( + self.convert_to_features, + batched=True, + remove_columns=["label"], + ) + self.columns = [c for c in self.dataset[split].column_names if c in self.loader_columns] + self.dataset[split].set_format(type="torch", columns=self.columns) + + self.eval_splits = [x for x in self.dataset.keys() if "validation" in x] + + def prepare_data(self): + datasets.load_dataset("glue", self.task_name) + AutoTokenizer.from_pretrained(self.model_name_or_path, use_fast=True) + + def train_dataloader(self): + return DataLoader(self.dataset["train"], batch_size=self.train_batch_size, shuffle=True) + + def val_dataloader(self): + if len(self.eval_splits) == 1: + return DataLoader(self.dataset["validation"], batch_size=self.eval_batch_size) + elif len(self.eval_splits) > 1: + return [DataLoader(self.dataset[x], batch_size=self.eval_batch_size) for x in self.eval_splits] + + def test_dataloader(self): + if len(self.eval_splits) == 1: + return DataLoader(self.dataset["test"], batch_size=self.eval_batch_size) + elif len(self.eval_splits) > 1: + return [DataLoader(self.dataset[x], batch_size=self.eval_batch_size) for x in self.eval_splits] + + def convert_to_features(self, example_batch, indices=None): + # Either encode single sentence or sentence pairs + if len(self.text_fields) > 1: + texts_or_text_pairs = list(zip(example_batch[self.text_fields[0]], example_batch[self.text_fields[1]])) + else: + texts_or_text_pairs = example_batch[self.text_fields[0]] + + # 
class GLUETransformer(LightningModule):
    """Sequence-classification transformer fine-tuned and evaluated on a GLUE task.

    Validation outputs are collected per dataloader in ``validation_step`` and
    reduced in ``on_validation_epoch_end``. The older ``validation_epoch_end(outputs)``
    hook is not supported by Lightning 2.0, which this notebook requires.

    Args:
        model_name_or_path: identifier passed to the ``from_pretrained`` loaders.
        num_labels: number of target labels (1 is treated as a single-output task).
        task_name: GLUE task name, also used to load the metric.
        learning_rate: learning rate for AdamW.
        adam_epsilon: epsilon for AdamW.
        warmup_steps: number of warmup steps for the linear schedule.
        weight_decay: weight decay applied to all parameters except biases and
            ``LayerNorm.weight``.
        train_batch_size: stored as a hyperparameter only.
        eval_batch_size: stored as a hyperparameter only.
        eval_splits: names of the evaluation splits, indexed by dataloader index
            (read for the "mnli" task).
    """

    def __init__(
        self,
        model_name_or_path: str,
        num_labels: int,
        task_name: str,
        learning_rate: float = 2e-5,
        adam_epsilon: float = 1e-8,
        warmup_steps: int = 0,
        weight_decay: float = 0.0,
        train_batch_size: int = 32,
        eval_batch_size: int = 32,
        eval_splits: Optional[list] = None,
        **kwargs,
    ):
        super().__init__()

        self.save_hyperparameters()

        self.config = AutoConfig.from_pretrained(model_name_or_path, num_labels=num_labels)
        self.model = AutoModelForSequenceClassification.from_pretrained(model_name_or_path, config=self.config)
        self.metric = datasets.load_metric(
            "glue", self.hparams.task_name, experiment_id=datetime.now().strftime("%d-%m-%Y_%H-%M-%S")
        )
        # Per-dataloader validation outputs, filled in ``validation_step`` and
        # consumed (then cleared) in ``on_validation_epoch_end``.
        self._val_outputs = {}

    def forward(self, **inputs):
        """Forward all keyword inputs to the wrapped transformer model."""
        return self.model(**inputs)

    def training_step(self, batch, batch_idx):
        """Return the training loss, i.e. the first element of the model output."""
        outputs = self(**batch)
        loss = outputs[0]
        return loss

    def validation_step(self, batch, batch_idx, dataloader_idx=0):
        """Compute loss and predictions for one batch and stash them for epoch end.

        Returns:
            Dict with keys ``loss``, ``preds`` and ``labels`` (also stored internally).

        Raises:
            ValueError: if ``num_labels`` is smaller than 1.
        """
        outputs = self(**batch)
        val_loss, logits = outputs[:2]

        if self.hparams.num_labels > 1:
            preds = torch.argmax(logits, dim=1)
        elif self.hparams.num_labels == 1:
            # Squeeze only the label axis so a batch of one keeps its batch
            # dimension and can still be concatenated at epoch end.
            preds = logits.squeeze(-1)
        else:
            raise ValueError(f"num_labels must be >= 1, got {self.hparams.num_labels}")

        labels = batch["labels"]

        step_output = {"loss": val_loss, "preds": preds, "labels": labels}
        self._val_outputs.setdefault(dataloader_idx, []).append(step_output)
        return step_output

    def _log_validation_metrics(self, outputs, suffix=""):
        """Reduce one list of step outputs and log its loss and GLUE metrics."""
        preds = torch.cat([x["preds"] for x in outputs]).detach().cpu().numpy()
        labels = torch.cat([x["labels"] for x in outputs]).detach().cpu().numpy()
        loss = torch.stack([x["loss"] for x in outputs]).mean()
        self.log(f"val_loss{suffix}", loss, prog_bar=True)
        metrics = self.metric.compute(predictions=preds, references=labels)
        self.log_dict({f"{k}{suffix}": v for k, v in metrics.items()}, prog_bar=True)

    def on_validation_epoch_end(self):
        """Aggregate the stored validation outputs, log metrics, and reset the store."""
        if not self._val_outputs:
            # No validation batch was seen; nothing to aggregate.
            return

        if self.hparams.task_name == "mnli":
            # One set of metrics per evaluation split (matched or mismatched).
            for loader_idx, outputs in self._val_outputs.items():
                split = self.hparams.eval_splits[loader_idx].split("_")[-1]
                self._log_validation_metrics(outputs, suffix=f"_{split}")
        else:
            flat_outputs = [x for per_loader in self._val_outputs.values() for x in per_loader]
            self._log_validation_metrics(flat_outputs)

        # Free the stored tensors so the next validation run starts empty.
        self._val_outputs.clear()

    def configure_optimizers(self):
        """Prepare optimizer and schedule (linear warmup and decay)"""
        model = self.model
        # Parameters whose names contain one of these get no weight decay.
        no_decay = ["bias", "LayerNorm.weight"]
        optimizer_grouped_parameters = [
            {
                "params": [p for n, p in model.named_parameters() if not any(nd in n for nd in no_decay)],
                "weight_decay": self.hparams.weight_decay,
            },
            {
                "params": [p for n, p in model.named_parameters() if any(nd in n for nd in no_decay)],
                "weight_decay": 0.0,
            },
        ]
        optimizer = AdamW(optimizer_grouped_parameters, lr=self.hparams.learning_rate, eps=self.hparams.adam_epsilon)

        scheduler = get_linear_schedule_with_warmup(
            optimizer,
            num_warmup_steps=self.hparams.warmup_steps,
            num_training_steps=self.trainer.estimated_stepping_batches,
        )
        # Step the scheduler after every optimizer step rather than every epoch.
        scheduler = {"scheduler": scheduler, "interval": "step", "frequency": 1}
        return [optimizer], [scheduler]
GLUEDataModule(model_name_or_path="albert-base-v2", task_name="cola") +dm.setup("fit") +model = GLUETransformer( + model_name_or_path="albert-base-v2", + num_labels=dm.num_labels, + eval_splits=dm.eval_splits, + task_name=dm.task_name, +) + +trainer = Trainer( + max_epochs=1, + accelerator="auto", + devices=1 if torch.cuda.is_available() else None, # limiting got iPython runs +) +trainer.fit(model, datamodule=dm) + +# %% [markdown] +# ### MRPC +# +# See an interactive view of the +# MRPC dataset in [NLP Viewer](https://huggingface.co/nlp/viewer/?dataset=glue&config=mrpc) + +# %% +seed_everything(42) + +dm = GLUEDataModule( + model_name_or_path="distilbert-base-cased", + task_name="mrpc", +) +dm.setup("fit") +model = GLUETransformer( + model_name_or_path="distilbert-base-cased", + num_labels=dm.num_labels, + eval_splits=dm.eval_splits, + task_name=dm.task_name, +) + +trainer = Trainer( + max_epochs=3, + accelerator="auto", + devices=1 if torch.cuda.is_available() else None, # limiting got iPython runs +) +trainer.fit(model, datamodule=dm) + +# %% [markdown] +# ### MNLI +# +# - The MNLI dataset is huge, so we aren't going to bother trying to train on it here. +# - We will skip over training and go straight to validation. 
+# +# See an interactive view of the +# MNLI dataset in [NLP Viewer](https://huggingface.co/nlp/viewer/?dataset=glue&config=mnli) + +# %% +dm = GLUEDataModule( + model_name_or_path="distilbert-base-cased", + task_name="mnli", +) +dm.setup("fit") +model = GLUETransformer( + model_name_or_path="distilbert-base-cased", + num_labels=dm.num_labels, + eval_splits=dm.eval_splits, + task_name=dm.task_name, +) + +trainer = Trainer( + max_epochs=3, + accelerator="auto", + devices=1 if torch.cuda.is_available() else None, # limiting got iPython runs +) +trainer.validate(model, dm) diff --git a/_notebooks/lightning_examples/warp-drive/.meta.yml b/_notebooks/lightning_examples/warp-drive/.meta.yml new file mode 100644 index 0000000..adf93f0 --- /dev/null +++ b/_notebooks/lightning_examples/warp-drive/.meta.yml @@ -0,0 +1,30 @@ +title: Multi-agent Reinforcement Learning With WarpDrive +author: Sunil Srinivasa (sunil.srinivasa@salesforce.com), Tian Lan (tian.lan@salesforce.com), Huan Wang (huan.wang@salesforce.com) and Stephan Zheng(stephan.zheng@salesforce.com) +created: 2022-03-01 +license: BSD 3-Clause "New" or "Revised" License +tags: + - Reinforcement Learning + - Multi-agent + - GPU +description: This notebook introduces multi-agent reinforcement learning (MARL) with WarpDrive (Lan et al. https://arxiv.org/abs/2108.13976). + WarpDrive is a flexible, lightweight, and easy-to-use open-source framework that implements end-to-end deep MARL on GPUs. + WarpDrive enables orders-of-magnitude speedups compared to CPU-GPU implementations, using the parallelization capability + of GPUs and several design choices to minimize communication overhead. WarpDrive also prioritizes user-friendliness - + it has utility functions to easily build MARL environments in CUDA and quality-of-life tools to run end-to-end MARL + using just a few lines of code, and is compatible with PyTorch. + + WarpDrive includes the following resources.
+ code - https://github.com/salesforce/warp-drive + documentation - http://opensource.salesforce.com/warp-drive/, and + white paper - https://arxiv.org/abs/2108.13976. + +requirements: + - rl-warp-drive==2.1 + - ffmpeg-python + # todo: after merging #155 we will relax this just to `torch<=1.10` and drop TV, TT, etc. + - torch==1.10.* + - torchvision==0.11.* + - torchtext==0.11.* + - lightning>=2.0.0rc0 +accelerator: + - GPU diff --git a/_notebooks/lightning_examples/warp-drive/multi_agent_rl.py b/_notebooks/lightning_examples/warp-drive/multi_agent_rl.py new file mode 100644 index 0000000..33efbe2 --- /dev/null +++ b/_notebooks/lightning_examples/warp-drive/multi_agent_rl.py @@ -0,0 +1,261 @@ +# %% [markdown] +# **⚠️ PLEASE NOTE:** +# This notebook runs on a GPU runtime. If running on Colab, choose Runtime > Change runtime type from the menu, then select `GPU` in the 'Hardware accelerator' dropdown menu. + +# %% [markdown] +# ## Introduction + +# %% [markdown] +# This tutorial provides a demonstration of a multi-agent Reinforcement Learning (RL) training loop with [WarpDrive](https://github.com/salesforce/warp-drive). WarpDrive is a flexible, lightweight, and easy-to-use RL framework that implements end-to-end deep multi-agent RL on a GPU (Graphics Processing Unit). Using the extreme parallelization capability of GPUs, it enables [orders-of-magnitude faster RL](https://arxiv.org/abs/2108.13976) compared to common implementations that blend CPU simulations and GPU models. WarpDrive is extremely efficient as it runs simulations across multiple agents and multiple environment replicas all in parallel and completely eliminates the back-and-forth data copying between the CPU and the GPU during every step. As such, WarpDrive +# - Can simulate 1000s of agents in each environment and thousands of environments in parallel, harnessing the extreme parallelism capability of GPUs. 
+# - Eliminates communication between CPU and GPU, and also within the GPU, as read and write operations occur in-place. +# - Is fully compatible with PyTorch, a highly flexible and very fast deep learning framework. +# - Implements parallel action sampling on CUDA C, which is ~3x faster than using PyTorch’s sampling methods. +# - Allows for large-scale distributed training on multiple GPUs. +# +# Below is an overview of WarpDrive’s layout of computational and data structures on a single GPU. +# ![](https://blog.salesforceairesearch.com/content/images/2021/08/warpdrive_framework_overview.png) +# Computations are organized into blocks, with multiple threads in each block. Each block runs a simulation environment and each thread +# simulates an agent in an environment. Blocks can access the shared GPU memory that stores simulation data and neural network policy models. A DataManager and FunctionManager enable defining multi-agent RL GPU-workflows with Python APIs. For more details, please read our white [paper](https://arxiv.org/abs/2108.13976). +# +# The WarpDrive framework comprises several utility functions that help easily implement any (OpenAI-)*gym-style* RL environment, and furthermore, provides quality-of-life tools to train it end-to-end using just a few lines of code. You may familiarize yourself with WarpDrive with the help of these [tutorials](https://github.com/salesforce/warp-drive/tree/master/tutorials). +# +# We invite everyone to **contribute to WarpDrive**, including adding new multi-agent environments, proposing new features and reporting issues on our open source [repository](https://github.com/salesforce/warp-drive). +# +# We have integrated WarpDrive with the [PyTorch Lightning](https://www.lightning.ai/) framework, which greatly reduces the trainer boilerplate code, and improves training modularity and flexibility.
It abstracts away most of the engineering pieces of code, so users can focus on research and building models, and iterate on experiments really fast. PyTorch Lightning also provides support for easily running the model on any hardware, performing distributed training, model checkpointing, performance profiling, logging and visualization. +# +# Below, we demonstrate how to use WarpDrive and PyTorch Lightning together to train a game of [Tag](https://github.com/salesforce/warp-drive/blob/master/example_envs/tag_continuous/tag_continuous.py) where multiple *tagger* agents are trying to run after and tag multiple other *runner* agents. Here's a sample depiction of the game of Tag with $100$ runners and $5$ taggers. +# ![](https://blog.salesforceairesearch.com/content/images/2021/08/same_speed_50fps-1.gif) + +# %% [markdown] +# ## Dependencies + +# %% +import logging + +import torch +from example_envs.tag_continuous.tag_continuous import TagContinuous +from pytorch_lightning import Trainer +from warp_drive.env_wrapper import EnvWrapper +from warp_drive.training.pytorch_lightning import CUDACallback, PerfStatsCallback, WarpDriveModule + +# Uncomment below for enabling animation visualizations. +# from example_envs.utils.generate_rollout_animation import generate_tag_env_rollout_animation +# from IPython.display import HTML + + +# %% +assert torch.cuda.device_count() > 0, "This notebook only runs on a GPU!" + +# %% +# Set logger level e.g., DEBUG, INFO, WARNING, ERROR. +logging.getLogger().setLevel(logging.ERROR) + +# %% [markdown] +# ## Specify a set of run configurations for your experiments +# +# The run configuration is a dictionary comprising the environment parameters, the trainer and the policy network settings, as well as configurations for saving. 
+# +# For our experiment, we consider an environment wherein $5$ taggers and $100$ runners play the game of [Tag](https://github.com/salesforce/warp-drive/blob/master/example_envs/tag_continuous/tag_continuous.py) on a $20 \times 20$ plane. The game lasts $200$ timesteps. Each agent chooses its own acceleration and turn actions at every timestep, and we use mechanics to determine how the agents move over the grid. When a tagger gets close to a runner, the runner is tagged, and is eliminated from the game. For the configuration below, the runners and taggers have the same unit skill levels, or top speeds. +# +# We train the agents using $50$ environments or simulations running in parallel. With WarpDrive, each simulation runs on separate GPU blocks. +# +# There are two separate policy networks used for the tagger and runner agents. Each network is a fully-connected model with two layers each of $256$ dimensions. We use the Advantage Actor Critic (A2C) algorithm for training. WarpDrive also currently provides the option to use the Proximal Policy Optimization (PPO) algorithm instead. + +# %% +run_config = dict( + name="tag_continuous", + # Environment settings.
+ env=dict( + # number of taggers in the environment + num_taggers=5, + # number of runners in the environment + num_runners=100, + # length of the (square) grid on which the game is played + grid_length=20.0, + # episode length in timesteps + episode_length=200, + # maximum acceleration + max_acceleration=0.1, + # minimum acceleration + min_acceleration=-0.1, + # maximum turn (in radians) + max_turn=2.35, # 3pi/4 radians + # minimum turn (in radians) + min_turn=-2.35, # -3pi/4 radians + # number of discretized accelerate actions + num_acceleration_levels=10, + # number of discretized turn actions + num_turn_levels=10, + # skill level for the tagger + skill_level_tagger=1.0, + # skill level for the runner + skill_level_runner=1.0, + # each agent sees the full (or partial) information of the world + use_full_observation=False, + # flag to indicate if a runner exits the game after getting tagged + runner_exits_game_after_tagged=True, + # number of other agents each agent can see + # used in the case use_full_observation is False + num_other_agents_observed=10, + # positive reward for a tagger upon tagging a runner + tag_reward_for_tagger=10.0, + # negative reward for a runner upon getting tagged + tag_penalty_for_runner=-10.0, + # reward at the end of the game for a runner that isn't tagged + end_of_game_reward_for_runner=1.0, + # distance margin between a tagger and runner + # to consider the runner as being 'tagged' + tagging_distance=0.02, + ), + # Trainer settings. + trainer=dict( + # number of environment replicas (number of GPU blocks used) + num_envs=50, + # total batch size used for training per iteration (across all the environments) + train_batch_size=10000, + # total number of episodes to run the training for + # This can be set arbitrarily high! + num_episodes=500, + ), + # Policy network settings.
+ policy=dict( + runner=dict( + # flag indicating whether the model needs to be trained + to_train=True, + # algorithm used to train the policy + algorithm="A2C", + # discount rate + gamma=0.98, + # learning rate + lr=0.005, + # policy model settings + model=dict(type="fully_connected", fc_dims=[256, 256], model_ckpt_filepath=""), + ), + tagger=dict( + to_train=True, + algorithm="A2C", + gamma=0.98, + lr=0.002, + model=dict(type="fully_connected", fc_dims=[256, 256], model_ckpt_filepath=""), + ), + ), + # Checkpoint saving setting. + saving=dict( + # how often (in iterations) to print the metrics + metrics_log_freq=10, + # how often (in iterations) to save the model parameters + model_params_save_freq=5000, + # base folder used for saving + basedir="/tmp", + # experiment name + name="continuous_tag", + # experiment tag + tag="example", + ), +) + +# %% [markdown] +# ## Instantiate the WarpDrive Module +# +# In order to instantiate the WarpDrive module, we first use an environment wrapper to specify that the environment needs to be run on the GPU (via the `env_backend` argument). Also, agents in the environment can share policy models; so we specify a dictionary to map each policy network model to the list of agent ids using that model. + +# %% +# Create a wrapped environment object via the EnvWrapper +# Ensure that env_backend is set to be "pycuda" or "numba" (in order to run on the GPU) +# WarpDrive v2 supports JIT compiled Numba backend now! +env_wrapper = EnvWrapper( + TagContinuous(**run_config["env"]), + num_envs=run_config["trainer"]["num_envs"], + env_backend="pycuda", +) + +# Agents can share policy models: this dictionary maps policy model names to agent ids.
+policy_tag_to_agent_id_map = { + "tagger": list(env_wrapper.env.taggers), + "runner": list(env_wrapper.env.runners), +} + +wd_module = WarpDriveModule( + env_wrapper=env_wrapper, + config=run_config, + policy_tag_to_agent_id_map=policy_tag_to_agent_id_map, + verbose=True, +) + + +# %% [markdown] +# ## Visualizing an episode roll-out before training +# +# We have created a helper function (see below) to visualize an episode rollout. Internally, this function uses the WarpDrive module's `fetch_episode_states` API to fetch the data arrays on the GPU for the duration of an entire episode. Specifically, we fetch the state arrays pertaining to agents' x and y locations on the plane and indicators on which agents are still active in the game. Note that this function may be invoked at any time during training, and it will use the state of the policy models at that time to sample actions and generate the visualization. + +# %% [markdown] +# The animation below shows a sample realization of the game episode before training, i.e., with randomly chosen agent actions. The $5$ taggers are marked in pink, while the $100$ blue agents are the runners. Both the taggers and runners move around randomly and about half the runners remain at the end of the episode. + +# %% +# Uncomment below for enabling animation visualizations. +# anim = generate_tag_env_rollout_animation(wd_module, fps=25) +# HTML(anim.to_html5_video()) + +# %% [markdown] +# ## Create the Lightning Trainer +# +# Next, we create the trainer for training the WarpDrive model. We add the `performance stats` callbacks to the trainer to view the throughput performance of WarpDrive. + +# %% +log_freq = run_config["saving"]["metrics_log_freq"] + +# Define callbacks. +cuda_callback = CUDACallback(module=wd_module) +perf_stats_callback = PerfStatsCallback( + batch_size=wd_module.training_batch_size, + num_iters=wd_module.num_iters, + log_freq=log_freq, +) + +# Instantiate the PyTorch Lightning trainer with the callbacks. 
+# Also, set the number of gpus to 1, since this notebook uses just a single GPU. +num_gpus = 1 +num_episodes = run_config["trainer"]["num_episodes"] +episode_length = run_config["env"]["episode_length"] +training_batch_size = run_config["trainer"]["train_batch_size"] +num_epochs = int(num_episodes * episode_length / training_batch_size) + +trainer = Trainer( + accelerator="gpu", + devices=num_gpus, + callbacks=[cuda_callback, perf_stats_callback], + max_epochs=num_epochs, + log_every_n_steps=1, + reload_dataloaders_every_n_epochs=1, +) + +# %% +# Start tensorboard. +# %load_ext tensorboard +# %tensorboard --logdir lightning_logs/ + +# %% [markdown] +# ## Train the WarpDrive Module +# +# Finally, we invoke training. +# +# Note: please scroll up to the tensorboard cell to visualize the curves during training. + +# %% +trainer.fit(wd_module) + +# %% [markdown] +# ## Visualize an episode-rollout after training + +# %% +# Uncomment below for enabling animation visualizations. +# anim = generate_tag_env_rollout_animation(wd_module, fps=25) +# HTML(anim.to_html5_video()) + +# %% [markdown] +# Note: In the configuration above, we have set the trainer to only train on $500$ rollout episodes, but you can increase the `num_episodes` configuration parameter to train further. As more training happens, the runners learn to escape the taggers, and the taggers learn to chase after the runner. Sometimes, the taggers also collaborate to team-tag runners. A good number of episodes to train on (for the configuration we have used) is $2$M or higher. 
+ +# %% +# Finally, close the WarpDrive module to clear up the CUDA memory heap +wd_module.graceful_close() diff --git a/_notebooks/pyproject.toml b/_notebooks/pyproject.toml new file mode 100644 index 0000000..8e49741 --- /dev/null +++ b/_notebooks/pyproject.toml @@ -0,0 +1,12 @@ +[tool.black] +# https://github.com/psf/black +line-length = 120 +exclude = "(.eggs|.git|.hg|.venv|_build|buck-out|build)" + +[tool.isort] +skip_glob = [] +profile = "black" +line_length = 120 + +[tool.autopep8] +ignore = ["E731"] diff --git a/_notebooks/requirements.txt b/_notebooks/requirements.txt new file mode 100644 index 0000000..9624fab --- /dev/null +++ b/_notebooks/requirements.txt @@ -0,0 +1,5 @@ +-r _requirements/devel.txt +-r .actions/requires.txt + +# default for all examples +-r _requirements/default.txt diff --git a/_notebooks/setup.cfg b/_notebooks/setup.cfg new file mode 100644 index 0000000..a7ed4be --- /dev/null +++ b/_notebooks/setup.cfg @@ -0,0 +1,49 @@ +[tool:pytest] +norecursedirs = + .git + .github + dist + build +addopts = + --strict + --doctest-modules + --color=yes + +[coverage:report] +exclude_lines = + pragma: no-cover + pass + + +[flake8] +max-line-length = 120 +exclude = + *.egg + build + temp +select = E,W,F +doctests = True +verbose = 2 +# https://pep8.readthedocs.io/en/latest/intro.html#error-codes +format = pylint +# see: https://www.flake8rules.com/ +ignore = + # line too long + E501 + # whitespace before ':' + E203 + + +# setup.cfg or tox.ini +[check-manifest] +ignore = + *.yml + .github + .github/* + + +[metadata] +license_file = LICENSE +description-file = README.md +# long_description = file:README.md +# long_description_content_type = text/markdown diff --git a/_notebooks/templates/img-classify/.meta.yml b/_notebooks/templates/img-classify/.meta.yml new file mode 100644 index 0000000..b26049d --- /dev/null +++ b/_notebooks/templates/img-classify/.meta.yml @@ -0,0 +1,21 @@ +title: Simple image classification with Lightning Flash +author: PL team 
+created: 2022-04-14 +updated: 2021-06-16 +license: CC BY-SA +build: 2 +tags: + - Image +description: | + This is a template to show simple image classification case if for some reason accelerator is required. +requirements: + - lightning-flash[image]>=0.7 + - numpy<1.24 + - pandas>=1.0 + - matplotlib>=3.0 + - seaborn +accelerator: + - GPU +datasets: + web: + - https://pl-flash-data.s3.amazonaws.com/hymenoptera_data.zip diff --git a/_notebooks/templates/img-classify/classify.py b/_notebooks/templates/img-classify/classify.py new file mode 100644 index 0000000..ba0273b --- /dev/null +++ b/_notebooks/templates/img-classify/classify.py @@ -0,0 +1,70 @@ +# %% +import os + +import flash +import matplotlib.pyplot as plt +import pandas as pd +import seaborn as sn +from flash.image import ImageClassificationData, ImageClassifier +from IPython.core.display import display +from pytorch_lightning.loggers import CSVLogger + +PATH_DATASETS = os.environ.get("PATH_DATASETS", ".") +# this dataset is automatically downloaded and extracted based on meta link +# this archive includes the one more level - folder with the same name +DATA_HYMENOPLERA = os.path.join(PATH_DATASETS, "hymenoptera_data", "hymenoptera_data") + +# %% [markdown] +# ## 1. Create the DataModule + +# %% +datamodule = ImageClassificationData.from_folders( + train_folder=f"{DATA_HYMENOPLERA}/train/", + val_folder=f"{DATA_HYMENOPLERA}/val/", + batch_size=1024, +) + +# %% [markdown] +# ## 2. Build the task + +# %% +model = ImageClassifier(backbone="resnet18", labels=datamodule.labels) + +# %% [markdown] +# ## 3. 
Create the trainer and finetune the model + +# %% +logger = CSVLogger(save_dir="logs/") +trainer = flash.Trainer(logger=logger, max_epochs=3, gpus=1) +trainer.finetune(model, datamodule=datamodule, strategy="freeze") + +# %% +metrics = pd.read_csv(f"{trainer.logger.log_dir}/metrics.csv") +del metrics["step"] +metrics.set_index("epoch", inplace=True) +display(metrics.dropna(axis=1, how="all").head()) + +g = sn.relplot(data=metrics, kind="line") +plt.gcf().set_size_inches(12, 4) +plt.grid() + +# %% [markdown] +# ## 4. Predict what's on a few images! ants or bees? + +# %% +datamodule = ImageClassificationData.from_files( + predict_files=[ + f"{DATA_HYMENOPLERA}/val/bees/65038344_52a45d090d.jpg", + f"{DATA_HYMENOPLERA}/val/bees/590318879_68cf112861.jpg", + f"{DATA_HYMENOPLERA}/val/ants/540543309_ddbb193ee5.jpg", + ], + batch_size=3, +) +predictions = trainer.predict(model, datamodule=datamodule, output="labels") +print(predictions) + +# %% [markdown] +# ## 5. Save the model! + +# %% +trainer.save_checkpoint("image_classification_model.pt") diff --git a/_notebooks/templates/simple/.meta.yml b/_notebooks/templates/simple/.meta.yml new file mode 100644 index 0000000..db12f93 --- /dev/null +++ b/_notebooks/templates/simple/.meta.yml @@ -0,0 +1,13 @@ +title: How to write a PyTorch Lightning tutorial +author: PL team +created: 2021-06-15 +updated: 2021-06-17 +license: CC +build: 10 +description: | + This is a template to show how to contribute a tutorial. 
+requirements: + - matplotlib +accelerator: + - CPU + - GPU diff --git a/_notebooks/templates/simple/.thumb.png b/_notebooks/templates/simple/.thumb.png new file mode 100644 index 0000000..e778f65 Binary files /dev/null and b/_notebooks/templates/simple/.thumb.png differ diff --git a/_notebooks/templates/simple/template.py b/_notebooks/templates/simple/template.py new file mode 100644 index 0000000..9f30ea0 --- /dev/null +++ b/_notebooks/templates/simple/template.py @@ -0,0 +1,45 @@ +# %% [markdown] +# ## Create a Markdown cell +# +# `# %% [markdown]` +# +# the content of single cell shall be connected with `# ` at each line, so for example: +# `# Add some text that will be rendered as markdown text.` + +# %% [markdown] +# ## Create a code cell +# +# `# %%` + +# %% +import torch + +print(torch.__version__) + +# %% [markdown] +# ## Add any Python codes +# Easy integration with Python ecosystem libraries component. +# +# For example create a simple plot with `matplotlib` with an image: +# +# ![test image](test.png) +# +# From: https://matplotlib.org/stable/gallery/lines_bars_and_markers/simple_plot.html + +# %% +import matplotlib.pyplot as plt # noqa: E402 +import numpy as np # noqa: E402 + +# Data for plotting +t = np.arange(0.0, 2.0, 0.01) +s = 1 + np.sin(2 * np.pi * t) + +fig, ax = plt.subplots() +ax.plot(t, s) + +ax.set(xlabel="time (s)", ylabel="voltage (mV)", title="About as simple as it gets, folks") +ax.grid() + +fig.savefig("test.png") +# render image to the notebooks +plt.show() diff --git a/_notebooks/templates/titanic/.meta.yml b/_notebooks/templates/titanic/.meta.yml new file mode 100644 index 0000000..dbe94d7 --- /dev/null +++ b/_notebooks/templates/titanic/.meta.yml @@ -0,0 +1,18 @@ +title: Solving Titanic dataset with Lightning Flash +author: PL team +created: 2021-10-15 +updated: 2021-12-10 +license: CC +build: 0 +description: | + This is a template to show how to contribute a tutorial. 
+requirements: + - https://github.com/PyTorchLightning/lightning-flash/archive/refs/tags/0.5.2.zip#egg=lightning-flash[tabular] + - matplotlib + - seaborn +accelerator: + - CPU + - GPU +datasets: + kaggle: + - titanic diff --git a/_notebooks/templates/titanic/tutorial.py b/_notebooks/templates/titanic/tutorial.py new file mode 100644 index 0000000..a82976f --- /dev/null +++ b/_notebooks/templates/titanic/tutorial.py @@ -0,0 +1,101 @@ +import os + +import matplotlib.pyplot as plt +import pandas as pd +import seaborn as sns +import torch +from flash import Trainer +from flash.tabular import TabularClassificationData, TabularClassifier + +# %% [markdown] +# ## 1. Create the DataModule +# +# ### Variable & Definition +# +# - survival: Survival (0 = No, 1 = Yes) +# - pclass: Ticket class (1 = 1st, 2 = 2nd, 3 = 3rd) +# - sex: Sex +# - Age: Age in years +# - sibsp: number of siblings / spouses aboard the Titanic +# - parch: number of parents / children aboard the Titanic +# - ticket: Ticket number +# - fare: Passenger fare +# - cabin: Cabin number +# - embarked: Port of Embarkation + +# %% +data_path = os.environ.get("PATH_DATASETS", "_datasets") +path_titanic = os.path.join(data_path, "titanic") +csv_train = os.path.join(path_titanic, "train.csv") +csv_test = os.path.join(path_titanic, "test.csv") + +df_train = pd.read_csv(csv_train) +df_train["Survived"].hist(bins=2) + +# %% +datamodule = TabularClassificationData.from_csv( + categorical_fields=["Sex", "Embarked", "Cabin"], + numerical_fields=["Fare", "Age", "Pclass", "SibSp", "Parch"], + target_fields="Survived", + train_file=csv_train, + val_split=0.1, + batch_size=8, +) + +# %% [markdown] +# ## 2. Build the task + +# %% +model = TabularClassifier.from_data( + datamodule, + learning_rate=0.1, + optimizer="Adam", + n_a=8, + gamma=0.3, +) + +# %% [markdown] +# ## 3. 
Create the trainer and train the model + +# %% +from pytorch_lightning.loggers import CSVLogger # noqa: E402 + +logger = CSVLogger(save_dir="logs/") +trainer = Trainer( + max_epochs=10, + gpus=torch.cuda.device_count(), + logger=logger, + accumulate_grad_batches=12, + gradient_clip_val=0.1, +) + +# %% + +trainer.fit(model, datamodule=datamodule) + +# %% + +metrics = pd.read_csv(f"{trainer.logger.log_dir}/metrics.csv") +metrics.set_index("step", inplace=True) +del metrics["epoch"] +sns.relplot(data=metrics, kind="line") +plt.gca().set_ylim([0, 1.25]) +plt.gcf().set_size_inches(10, 5) + +# %% [markdown] +# ## 4. Generate predictions from a CSV + +# %% +df_test = pd.read_csv(csv_test) + +predictions = model.predict(csv_test) +print(predictions[0]) + +# %% +import numpy as np # noqa: E402 + +assert len(df_test) == len(predictions) + +df_test["Survived"] = np.argmax(predictions, axis=-1) +df_test.set_index("PassengerId", inplace=True) +df_test["Survived"].hist(bins=5) diff --git a/docs/.buildinfo b/docs/.buildinfo deleted file mode 100644 index 1767b18..0000000 --- a/docs/.buildinfo +++ /dev/null @@ -1,4 +0,0 @@ -# Sphinx build info version 1 -# This file hashes the configuration used when building these files. When it is not found, a full rebuild will be done. -config: 9f51b0822c0fcb09f5289c381438e1cc -tags: 645f666f9bcd5a90fca523b33c5a78b7 diff --git a/docs/CNAME b/docs/CNAME deleted file mode 100644 index ba22efe..0000000 --- a/docs/CNAME +++ /dev/null @@ -1 +0,0 @@ -docs.pytorchlightning.kr diff --git a/docs/README.md b/docs/README.md new file mode 100644 index 0000000..d59458b --- /dev/null +++ b/docs/README.md @@ -0,0 +1,76 @@ +# PyTorch-Lightning Docs + +We are using Sphinx with Napoleon extension. +Moreover, we set Google style to follow with type convention.
+ +- [Napoleon formatting with Google style](https://sphinxcontrib-napoleon.readthedocs.io/en/latest/example_google.html) +- [ReStructured Text (reST)](https://docs.pylonsproject.org/projects/docs-style-guide/) +- [Paragraph-level markup](https://www.sphinx-doc.org/en/master/usage/restructuredtext/basics.html#paragraphs) + +See the following short example of a sample function taking one positional and one optional argument: + +```python +from typing import Optional + + +def my_func(param_a: int, param_b: Optional[float] = None) -> str: + """Sample function. + + Args: + param_a: first parameter + param_b: second parameter + + Return: + sum of both numbers, formatted as a string + + Example:: + + >>> my_func(1, 2) + '3' + + Note: + If you want to add something. + """ + p = param_b if param_b else 0 + return str(param_a + p) +``` + +## Building Docs + +When updating the docs, make sure to build them first locally and visually inspect the html files in your browser for +formatting errors. In certain cases, a missing blank line or a wrong indent can lead to a broken layout. +Run these commands + +```bash +git submodule update --init --recursive +make docs +``` + +and open `docs/build/html/index.html` in your browser. + +When you send a PR the continuous integration will run tests and build the docs. + +Notes: + +- You need to have LaTeX installed for rendering math equations. You can for example install TeXLive with the necessary extras by doing one of the following: + - on Ubuntu (Linux) run `sudo apt-get update && sudo apt-get install -y texlive-latex-extra dvipng texlive-pictures` + - use the [RTD docker image](https://hub.docker.com/r/readthedocs/build) +- You need to have pandoc installed for rendering Jupyter Notebooks. On Ubuntu (Linux), you can run: `sudo apt-get install pandoc` + +## Developing docs + +When developing the docs, building docs can be VERY slow locally because of the notebook tutorials.
+To speed this up, enable this flag in before building docs: + +```bash +# builds notebooks which is slow +export PL_FAST_DOCS_DEV=0 + +# fast notebook build which is fast +export PL_FAST_DOCS_DEV=1 +``` + +## docs CSS/theme + +To change the CSS theme of the docs, go [here](https://github.com/Lightning-AI/lightning_sphinx_theme). +Apologies in advance... this is a bit complex to build and requires basic understanding of javascript/npm. diff --git a/docs/_modules/index.html b/docs/_modules/index.html deleted file mode 100644 index b78bc49..0000000 --- a/docs/_modules/index.html +++ /dev/null @@ -1,689 +0,0 @@ - - - - - - - - - - - - - Overview: module code — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- - - - -
-
- -
- Shortcuts -
-
- -
- - -
-
-
- -
-
-
-
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/_modules/pytorch_lightning/callbacks/base.html b/docs/_modules/pytorch_lightning/callbacks/base.html deleted file mode 100644 index 7c0586e..0000000 --- a/docs/_modules/pytorch_lightning/callbacks/base.html +++ /dev/null @@ -1,1048 +0,0 @@ - - - - - - - - - - - - - pytorch_lightning.callbacks.base — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- - - - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -

Source code for pytorch_lightning.callbacks.base

-# Copyright The PyTorch Lightning team.
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#     http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-r"""
-Base class used to build new callbacks.
-
-"""
-
-from typing import Any, Dict, List, Optional, Type
-
-import torch
-from torch.optim import Optimizer
-
-import pytorch_lightning as pl
-from pytorch_lightning.utilities.types import STEP_OUTPUT
-
-
-class Callback:
-    r"""
-    Abstract base class used to build new callbacks.
-
-    Subclass this class and override any of the relevant hooks
-    """
-
-    @property
-    def state_key(self) -> str:
-        """Identifier for the state of the callback.
-
-        Used to store and retrieve a callback's state from the checkpoint dictionary by
-        ``checkpoint["callbacks"][state_key]``. Implementations of a callback need to provide a unique state key if 1)
-        the callback has state and 2) it is desired to maintain the state of multiple instances of that callback.
-        """
-        return self.__class__.__qualname__
-
-    @property
-    def _legacy_state_key(self) -> Type["Callback"]:
-        """State key for checkpoints saved prior to version 1.5.0."""
-        return type(self)
-
-    def _generate_state_key(self, **kwargs: Any) -> str:
-        """Formats a set of key-value pairs into a state key string with the callback class name prefixed. Useful
-        for defining a :attr:`state_key`.
-
-        Args:
-            **kwargs: A set of key-value pairs. Must be serializable to :class:`str`.
-        """
-        return f"{self.__class__.__qualname__}{repr(kwargs)}"
-
-
[docs] def on_configure_sharded_model(self, trainer: "pl.Trainer", pl_module: "pl.LightningModule") -> None: - r""" - .. deprecated:: v1.6 - This callback hook was deprecated in v1.6 and will be removed in v1.8. Use `setup()` instead. - - Called before configure sharded model. - """
- - def on_before_accelerator_backend_setup(self, trainer: "pl.Trainer", pl_module: "pl.LightningModule") -> None: - r""" - .. deprecated:: v1.6 - This callback hook was deprecated in v1.6 and will be removed in v1.8. Use ``setup()`` instead. - - Called before accelerator is being setup. - """ - -
[docs] def setup(self, trainer: "pl.Trainer", pl_module: "pl.LightningModule", stage: Optional[str] = None) -> None: - """Called when fit, validate, test, predict, or tune begins."""
- -
[docs] def teardown(self, trainer: "pl.Trainer", pl_module: "pl.LightningModule", stage: Optional[str] = None) -> None: - """Called when fit, validate, test, predict, or tune ends."""
- -
[docs] def on_init_start(self, trainer: "pl.Trainer") -> None: - r""" - .. deprecated:: v1.6 - This callback hook was deprecated in v1.6 and will be removed in v1.8. - - Called when the trainer initialization begins, model has not yet been set. - """
- -
[docs] def on_init_end(self, trainer: "pl.Trainer") -> None: - r""" - .. deprecated:: v1.6 - This callback hook was deprecated in v1.6 and will be removed in v1.8. - - Called when the trainer initialization ends, model has not yet been set. - """
- -
[docs] def on_fit_start(self, trainer: "pl.Trainer", pl_module: "pl.LightningModule") -> None: - """Called when fit begins."""
- -
[docs] def on_fit_end(self, trainer: "pl.Trainer", pl_module: "pl.LightningModule") -> None: - """Called when fit ends."""
- -
[docs] def on_sanity_check_start(self, trainer: "pl.Trainer", pl_module: "pl.LightningModule") -> None: - """Called when the validation sanity check starts."""
- -
[docs] def on_sanity_check_end(self, trainer: "pl.Trainer", pl_module: "pl.LightningModule") -> None: - """Called when the validation sanity check ends."""
- -
[docs] def on_train_batch_start( - self, - trainer: "pl.Trainer", - pl_module: "pl.LightningModule", - batch: Any, - batch_idx: int, - unused: int = 0, - ) -> None: - """Called when the train batch begins."""
- -
[docs] def on_train_batch_end( - self, - trainer: "pl.Trainer", - pl_module: "pl.LightningModule", - outputs: STEP_OUTPUT, - batch: Any, - batch_idx: int, - unused: int = 0, - ) -> None: - """Called when the train batch ends."""
- -
[docs] def on_train_epoch_start(self, trainer: "pl.Trainer", pl_module: "pl.LightningModule") -> None: - """Called when the train epoch begins."""
- -
[docs] def on_train_epoch_end(self, trainer: "pl.Trainer", pl_module: "pl.LightningModule") -> None: - """Called when the train epoch ends. - - To access all batch outputs at the end of the epoch, either: - - 1. Implement `training_epoch_end` in the `LightningModule` and access outputs via the module OR - 2. Cache data across train batch hooks inside the callback implementation to post-process in this hook. - """
- -
[docs] def on_validation_epoch_start(self, trainer: "pl.Trainer", pl_module: "pl.LightningModule") -> None: - """Called when the val epoch begins."""
- -
[docs] def on_validation_epoch_end(self, trainer: "pl.Trainer", pl_module: "pl.LightningModule") -> None: - """Called when the val epoch ends."""
- -
[docs] def on_test_epoch_start(self, trainer: "pl.Trainer", pl_module: "pl.LightningModule") -> None: - """Called when the test epoch begins."""
- -
[docs] def on_test_epoch_end(self, trainer: "pl.Trainer", pl_module: "pl.LightningModule") -> None: - """Called when the test epoch ends."""
- -
[docs] def on_predict_epoch_start(self, trainer: "pl.Trainer", pl_module: "pl.LightningModule") -> None: - """Called when the predict epoch begins."""
- -
[docs] def on_predict_epoch_end(self, trainer: "pl.Trainer", pl_module: "pl.LightningModule", outputs: List[Any]) -> None: - """Called when the predict epoch ends."""
- - def on_epoch_start(self, trainer: "pl.Trainer", pl_module: "pl.LightningModule") -> None: - r""" - .. deprecated:: v1.6 - This callback hook was deprecated in v1.6 and will be removed in v1.8. Use - ``on_<train/validation/test>_epoch_start`` instead. - - Called when either of train/val/test epoch begins. - """ - -
[docs] def on_epoch_end(self, trainer: "pl.Trainer", pl_module: "pl.LightningModule") -> None: - r""" - .. deprecated:: v1.6 - This callback hook was deprecated in v1.6 and will be removed in v1.8. Use - ``on_<train/validation/test>_epoch_end`` instead. - - Called when either of train/val/test epoch ends. - """
- - def on_batch_start(self, trainer: "pl.Trainer", pl_module: "pl.LightningModule") -> None: - r""" - .. deprecated:: v1.6 - This callback hook was deprecated in v1.6 and will be removed in v1.8. Use - ``on_train_batch_start`` instead. - - Called when the training batch begins. - """ - - def on_batch_end(self, trainer: "pl.Trainer", pl_module: "pl.LightningModule") -> None: - r""" - .. deprecated:: v1.6 - This callback hook was deprecated in v1.6 and will be removed in v1.8. Use - ``on_train_batch_end`` instead. - - Called when the training batch ends. - """ - -
[docs] def on_validation_batch_start( - self, trainer: "pl.Trainer", pl_module: "pl.LightningModule", batch: Any, batch_idx: int, dataloader_idx: int - ) -> None: - """Called when the validation batch begins."""
- -
[docs] def on_validation_batch_end( - self, - trainer: "pl.Trainer", - pl_module: "pl.LightningModule", - outputs: Optional[STEP_OUTPUT], - batch: Any, - batch_idx: int, - dataloader_idx: int, - ) -> None: - """Called when the validation batch ends."""
- -
[docs] def on_test_batch_start( - self, trainer: "pl.Trainer", pl_module: "pl.LightningModule", batch: Any, batch_idx: int, dataloader_idx: int - ) -> None: - """Called when the test batch begins."""
- -
[docs] def on_test_batch_end( - self, - trainer: "pl.Trainer", - pl_module: "pl.LightningModule", - outputs: Optional[STEP_OUTPUT], - batch: Any, - batch_idx: int, - dataloader_idx: int, - ) -> None: - """Called when the test batch ends."""
- -
[docs] def on_predict_batch_start( - self, trainer: "pl.Trainer", pl_module: "pl.LightningModule", batch: Any, batch_idx: int, dataloader_idx: int - ) -> None: - """Called when the predict batch begins."""
- -
[docs] def on_predict_batch_end( - self, - trainer: "pl.Trainer", - pl_module: "pl.LightningModule", - outputs: Any, - batch: Any, - batch_idx: int, - dataloader_idx: int, - ) -> None: - """Called when the predict batch ends."""
- -
[docs] def on_train_start(self, trainer: "pl.Trainer", pl_module: "pl.LightningModule") -> None: - """Called when the train begins."""
- -
[docs] def on_train_end(self, trainer: "pl.Trainer", pl_module: "pl.LightningModule") -> None: - """Called when the train ends."""
- - def on_pretrain_routine_start(self, trainer: "pl.Trainer", pl_module: "pl.LightningModule") -> None: - r""" - .. deprecated:: v1.6 - - This callback hook was deprecated in v1.6 and will be removed in v1.8. Use ``on_fit_start`` instead. - - Called when the pretrain routine begins. - """ - - def on_pretrain_routine_end(self, trainer: "pl.Trainer", pl_module: "pl.LightningModule") -> None: - r""" - .. deprecated:: v1.6 - - This callback hook was deprecated in v1.6 and will be removed in v1.8. Use ``on_fit_start`` instead. - - Called when the pretrain routine ends. - """ - -
[docs] def on_validation_start(self, trainer: "pl.Trainer", pl_module: "pl.LightningModule") -> None: - """Called when the validation loop begins."""
- -
[docs] def on_validation_end(self, trainer: "pl.Trainer", pl_module: "pl.LightningModule") -> None: - """Called when the validation loop ends."""
- -
[docs] def on_test_start(self, trainer: "pl.Trainer", pl_module: "pl.LightningModule") -> None: - """Called when the test begins."""
- -
[docs] def on_test_end(self, trainer: "pl.Trainer", pl_module: "pl.LightningModule") -> None: - """Called when the test ends."""
- -
[docs] def on_predict_start(self, trainer: "pl.Trainer", pl_module: "pl.LightningModule") -> None: - """Called when the predict begins."""
- -
[docs] def on_predict_end(self, trainer: "pl.Trainer", pl_module: "pl.LightningModule") -> None: - """Called when predict ends."""
- -
[docs] def on_keyboard_interrupt(self, trainer: "pl.Trainer", pl_module: "pl.LightningModule") -> None: - r""" - .. deprecated:: v1.5 - This callback hook was deprecated in v1.5 in favor of `on_exception` and will be removed in v1.7. - - Called when any trainer execution is interrupted by KeyboardInterrupt. - """
- -
[docs] def on_exception(self, trainer: "pl.Trainer", pl_module: "pl.LightningModule", exception: BaseException) -> None: - """Called when any trainer execution is interrupted by an exception."""
- -
[docs] def state_dict(self) -> Dict[str, Any]: - """Called when saving a checkpoint, implement to generate callback's ``state_dict``. - - Returns: - A dictionary containing callback state. - """ - return {}
- -
[docs] def load_state_dict(self, state_dict: Dict[str, Any]) -> None: - """Called when loading a checkpoint, implement to reload callback state given callback's ``state_dict``. - - Args: - state_dict: the callback state returned by ``state_dict``. - """ - pass
- -
[docs] def on_save_checkpoint( - self, trainer: "pl.Trainer", pl_module: "pl.LightningModule", checkpoint: Dict[str, Any] - ) -> Optional[dict]: - r""" - Called when saving a checkpoint to give you a chance to store anything else you might want to save. - - Args: - trainer: the current :class:`~pytorch_lightning.trainer.Trainer` instance. - pl_module: the current :class:`~pytorch_lightning.core.lightning.LightningModule` instance. - checkpoint: the checkpoint dictionary that will be saved. - - Returns: - None or the callback state. Support for returning callback state will be removed in v1.8. - - .. deprecated:: v1.6 - Returning a value from this method was deprecated in v1.6 and will be removed in v1.8. - Implement ``Callback.state_dict`` instead to return state. - In v1.8 ``Callback.on_save_checkpoint`` can only return None. - """
- -
[docs] def on_load_checkpoint( - self, trainer: "pl.Trainer", pl_module: "pl.LightningModule", callback_state: Dict[str, Any] - ) -> None: - r""" - Called when loading a model checkpoint, use to reload state. - - Args: - trainer: the current :class:`~pytorch_lightning.trainer.Trainer` instance. - pl_module: the current :class:`~pytorch_lightning.core.lightning.LightningModule` instance. - callback_state: the callback state returned by ``on_save_checkpoint``. - - Note: - The ``on_load_checkpoint`` won't be called with an undefined state. - If your ``on_load_checkpoint`` hook behavior doesn't rely on a state, - you will still need to override ``on_save_checkpoint`` to return a ``dummy state``. - - .. deprecated:: v1.6 - This callback hook will change its signature and behavior in v1.8. - If you wish to load the state of the callback, use ``Callback.load_state_dict`` instead. - In v1.8 ``Callback.on_load_checkpoint(checkpoint)`` will receive the entire loaded - checkpoint dictionary instead of only the callback state from the checkpoint. - """
- -
[docs] def on_before_backward(self, trainer: "pl.Trainer", pl_module: "pl.LightningModule", loss: torch.Tensor) -> None: - """Called before ``loss.backward()``."""
- -
[docs] def on_after_backward(self, trainer: "pl.Trainer", pl_module: "pl.LightningModule") -> None: - """Called after ``loss.backward()`` and before optimizers are stepped."""
- -
[docs] def on_before_optimizer_step( - self, trainer: "pl.Trainer", pl_module: "pl.LightningModule", optimizer: Optimizer, opt_idx: int - ) -> None: - """Called before ``optimizer.step()``."""
- -
[docs] def on_before_zero_grad(self, trainer: "pl.Trainer", pl_module: "pl.LightningModule", optimizer: Optimizer) -> None: - """Called before ``optimizer.zero_grad()``."""
-
- -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- -
-
-
- -
-
-
-
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/_modules/pytorch_lightning/core/datamodule.html b/docs/_modules/pytorch_lightning/core/datamodule.html deleted file mode 100644 index 4ca3aff..0000000 --- a/docs/_modules/pytorch_lightning/core/datamodule.html +++ /dev/null @@ -1,944 +0,0 @@ - - - - - - - - - - - - - pytorch_lightning.core.datamodule — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- - - - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -

Source code for pytorch_lightning.core.datamodule

-# Copyright The PyTorch Lightning team.
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#     http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-"""LightningDataModule for loading DataLoaders with ease."""
-from argparse import ArgumentParser, Namespace
-from typing import Any, Dict, List, Mapping, Optional, Sequence, Tuple, Union
-
-from torch.utils.data import DataLoader, Dataset, IterableDataset
-
-from pytorch_lightning.core.hooks import CheckpointHooks, DataHooks
-from pytorch_lightning.core.mixins import HyperparametersMixin
-from pytorch_lightning.utilities import rank_zero_deprecation
-from pytorch_lightning.utilities.argparse import add_argparse_args, from_argparse_args, get_init_arguments_and_types
-
-
-class LightningDataModule(CheckpointHooks, DataHooks, HyperparametersMixin):
-    """A DataModule standardizes the training, val, test splits, data preparation and transforms. The main
-    advantage is consistent data splits, data preparation and transforms across models.
-
-    Example::
-
-        class MyDataModule(LightningDataModule):
-            def __init__(self):
-                super().__init__()
-            def prepare_data(self):
-                # download, split, etc...
-                # only called on 1 GPU/TPU in distributed
-            def setup(self, stage):
-                # make assignments here (val/train/test split)
-                # called on every process in DDP
-            def train_dataloader(self):
-                train_split = Dataset(...)
-                return DataLoader(train_split)
-            def val_dataloader(self):
-                val_split = Dataset(...)
-                return DataLoader(val_split)
-            def test_dataloader(self):
-                test_split = Dataset(...)
-                return DataLoader(test_split)
-            def teardown(self):
-                # clean up after fit or test
-                # called on every process in DDP
-    """
-
-    name: str = ...
-
-    def __init__(self, train_transforms=None, val_transforms=None, test_transforms=None, dims=None):
-        super().__init__()
-        if train_transforms is not None:
-            rank_zero_deprecation(
-                "DataModule property `train_transforms` was deprecated in v1.5 and will be removed in v1.7."
-            )
-        if val_transforms is not None:
-            rank_zero_deprecation(
-                "DataModule property `val_transforms` was deprecated in v1.5 and will be removed in v1.7."
-            )
-        if test_transforms is not None:
-            rank_zero_deprecation(
-                "DataModule property `test_transforms` was deprecated in v1.5 and will be removed in v1.7."
-            )
-        if dims is not None:
-            rank_zero_deprecation("DataModule property `dims` was deprecated in v1.5 and will be removed in v1.7.")
-        self._train_transforms = train_transforms
-        self._val_transforms = val_transforms
-        self._test_transforms = test_transforms
-        self._dims = dims if dims is not None else ()
-
-        # Pointer to the trainer object
-        self.trainer = None
-
-    @property
-    def train_transforms(self):
-        """Optional transforms (or collection of transforms) you can apply to train dataset.
-
-        .. deprecated:: v1.5     Will be removed in v1.7.0.
-        """
-
-        rank_zero_deprecation(
-            "DataModule property `train_transforms` was deprecated in v1.5 and will be removed in v1.7."
-        )
-        return self._train_transforms
-
-    @train_transforms.setter
-    def train_transforms(self, t):
-        rank_zero_deprecation(
-            "DataModule property `train_transforms` was deprecated in v1.5 and will be removed in v1.7."
-        )
-        self._train_transforms = t
-
-    @property
-    def val_transforms(self):
-        """Optional transforms (or collection of transforms) you can apply to validation dataset.
-
-        .. deprecated:: v1.5     Will be removed in v1.7.0.
-        """
-
-        rank_zero_deprecation(
-            "DataModule property `val_transforms` was deprecated in v1.5 and will be removed in v1.7."
-        )
-        return self._val_transforms
-
-    @val_transforms.setter
-    def val_transforms(self, t):
-        rank_zero_deprecation(
-            "DataModule property `val_transforms` was deprecated in v1.5 and will be removed in v1.7."
-        )
-        self._val_transforms = t
-
-    @property
-    def test_transforms(self):
-        """Optional transforms (or collection of transforms) you can apply to test dataset.
-
-        .. deprecated:: v1.5     Will be removed in v1.7.0.
-        """
-
-        rank_zero_deprecation(
-            "DataModule property `test_transforms` was deprecated in v1.5 and will be removed in v1.7."
-        )
-        return self._test_transforms
-
-    @test_transforms.setter
-    def test_transforms(self, t):
-        rank_zero_deprecation(
-            "DataModule property `test_transforms` was deprecated in v1.5 and will be removed in v1.7."
-        )
-        self._test_transforms = t
-
-    @property
-    def dims(self):
-        """A tuple describing the shape of your data. Extra functionality exposed in ``size``.
-
-        .. deprecated:: v1.5     Will be removed in v1.7.0.
-        """
-        rank_zero_deprecation("DataModule property `dims` was deprecated in v1.5 and will be removed in v1.7.")
-        return self._dims
-
-    @dims.setter
-    def dims(self, d):
-        rank_zero_deprecation("DataModule property `dims` was deprecated in v1.5 and will be removed in v1.7.")
-        self._dims = d
-
-    def size(self, dim=None) -> Union[Tuple, List[Tuple]]:
-        """Return the dimension of each input either as a tuple or list of tuples. You can index this just as you
-        would with a torch tensor.
-
-        .. deprecated:: v1.5     Will be removed in v1.7.0.
-        """
-        rank_zero_deprecation("DataModule property `size` was deprecated in v1.5 and will be removed in v1.7.")
-
-        if dim is not None:
-            return self.dims[dim]
-
-        return self.dims
-
-    @classmethod
-    def add_argparse_args(cls, parent_parser: ArgumentParser, **kwargs) -> ArgumentParser:
-        """Extends existing argparse by default `LightningDataModule` attributes."""
-        return add_argparse_args(cls, parent_parser, **kwargs)
-
-    @classmethod
-    def from_argparse_args(cls, args: Union[Namespace, ArgumentParser], **kwargs):
-        """Create an instance from CLI arguments.
-
-        Args:
-            args: The parser or namespace to take arguments from. Only known arguments will be
-                parsed and passed to the :class:`~pytorch_lightning.core.datamodule.LightningDataModule`.
-            **kwargs: Additional keyword arguments that may override ones in the parser or namespace.
-                These must be valid DataModule arguments.
-
-        Example::
-
-            parser = ArgumentParser(add_help=False)
-            parser = LightningDataModule.add_argparse_args(parser)
-            module = LightningDataModule.from_argparse_args(args)
-        """
-        return from_argparse_args(cls, args, **kwargs)
-
-    @classmethod
-    def get_init_arguments_and_types(cls) -> List[Tuple[str, Tuple, Any]]:
-        r"""Scans the DataModule signature and returns argument names, types and default values.
-
-        Returns:
-            List with tuples of 3 values:
-            (argument name, set with argument types, argument default value).
-        """
-        return get_init_arguments_and_types(cls)
-
-    @classmethod
-    def from_datasets(
-        cls,
-        train_dataset: Optional[Union[Dataset, Sequence[Dataset], Mapping[str, Dataset]]] = None,
-        val_dataset: Optional[Union[Dataset, Sequence[Dataset]]] = None,
-        test_dataset: Optional[Union[Dataset, Sequence[Dataset]]] = None,
-        batch_size: int = 1,
-        num_workers: int = 0,
-    ):
-        r"""
-        Create an instance from torch.utils.data.Dataset.
-
-        Args:
-            train_dataset: (optional) Dataset to be used for train_dataloader()
-            val_dataset: (optional) Dataset or list of Dataset to be used for val_dataloader()
-            test_dataset: (optional) Dataset or list of Dataset to be used for test_dataloader()
-            batch_size: Batch size to use for each dataloader. Default is 1.
-            num_workers: Number of subprocesses to use for data loading. 0 means that the
-                data will be loaded in the main process. Number of CPUs available.
-
-        """
-
-        def dataloader(ds: Dataset, shuffle: bool = False) -> DataLoader:
-            shuffle &= not isinstance(ds, IterableDataset)
-            return DataLoader(ds, batch_size=batch_size, shuffle=shuffle, num_workers=num_workers, pin_memory=True)
-
-        def train_dataloader():
-            if isinstance(train_dataset, Mapping):
-                return {key: dataloader(ds, shuffle=True) for key, ds in train_dataset.items()}
-            if isinstance(train_dataset, Sequence):
-                return [dataloader(ds, shuffle=True) for ds in train_dataset]
-            return dataloader(train_dataset, shuffle=True)
-
-        def val_dataloader():
-            if isinstance(val_dataset, Sequence):
-                return [dataloader(ds) for ds in val_dataset]
-            return dataloader(val_dataset)
-
-        def test_dataloader():
-            if isinstance(test_dataset, Sequence):
-                return [dataloader(ds) for ds in test_dataset]
-            return dataloader(test_dataset)
-
-        datamodule = cls()
-        if train_dataset is not None:
-            datamodule.train_dataloader = train_dataloader
-        if val_dataset is not None:
-            datamodule.val_dataloader = val_dataloader
-        if test_dataset is not None:
-            datamodule.test_dataloader = test_dataloader
-        return datamodule
-
-
[docs] def state_dict(self) -> Dict[str, Any]: - """Called when saving a checkpoint, implement to generate and save datamodule state. - - Returns: - A dictionary containing datamodule state. - """ - return {}
- -
[docs] def load_state_dict(self, state_dict: Dict[str, Any]) -> None: - """Called when loading a checkpoint, implement to reload datamodule state given datamodule state_dict. - - Args: - state_dict: the datamodule state returned by ``state_dict``. - """ - pass
-
- -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- -
-
-
- -
-
-
-
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/_modules/pytorch_lightning/core/lightning.html b/docs/_modules/pytorch_lightning/core/lightning.html deleted file mode 100644 index e80c879..0000000 --- a/docs/_modules/pytorch_lightning/core/lightning.html +++ /dev/null @@ -1,2729 +0,0 @@ - - - - - - - - - - - - - pytorch_lightning.core.lightning — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- - - - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -

Source code for pytorch_lightning.core.lightning

-# Copyright The PyTorch Lightning team.
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#     http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-"""The LightningModule - an nn.Module with many additional features."""
-
-import collections
-import inspect
-import logging
-import numbers
-import os
-import tempfile
-from contextlib import contextmanager
-from pathlib import Path
-from typing import Any, Callable, Dict, List, Mapping, Optional, overload, Sequence, Tuple, Union
-
-import torch
-from torch import ScriptModule, Tensor
-from torch.nn import Module
-from torch.optim.optimizer import Optimizer
-from torchmetrics import Metric
-from typing_extensions import Literal
-
-import pytorch_lightning as pl
-from pytorch_lightning.callbacks.base import Callback
-from pytorch_lightning.callbacks.progress import base as progress_base
-from pytorch_lightning.core.hooks import CheckpointHooks, DataHooks, ModelHooks
-from pytorch_lightning.core.mixins import DeviceDtypeModuleMixin, HyperparametersMixin
-from pytorch_lightning.core.optimizer import LightningOptimizer
-from pytorch_lightning.core.saving import ModelIO
-from pytorch_lightning.loggers import LightningLoggerBase
-from pytorch_lightning.trainer.connectors.data_connector import _DataHookSelector
-from pytorch_lightning.trainer.connectors.logger_connector.fx_validator import _FxValidator
-from pytorch_lightning.utilities import _IS_WINDOWS, _TORCH_GREATER_EQUAL_1_10, GradClipAlgorithmType
-from pytorch_lightning.utilities.apply_func import apply_to_collection, convert_to_tensors
-from pytorch_lightning.utilities.cloud_io import get_filesystem
-from pytorch_lightning.utilities.distributed import distributed_available, sync_ddp
-from pytorch_lightning.utilities.exceptions import MisconfigurationException
-from pytorch_lightning.utilities.memory import get_model_size_mb
-from pytorch_lightning.utilities.model_summary import ModelSummary, summarize
-from pytorch_lightning.utilities.parsing import collect_init_args
-from pytorch_lightning.utilities.rank_zero import rank_zero_debug, rank_zero_deprecation, rank_zero_warn
-from pytorch_lightning.utilities.signature_utils import is_param_in_hook_signature
-from pytorch_lightning.utilities.types import _METRIC_COLLECTION, EPOCH_OUTPUT, LRSchedulerTypeUnion, STEP_OUTPUT
-from pytorch_lightning.utilities.warnings import WarningCache
-
-warning_cache = WarningCache()
-log = logging.getLogger(__name__)
-
-
-class LightningModule(
-    DeviceDtypeModuleMixin,
-    HyperparametersMixin,
-    ModelIO,
-    ModelHooks,
-    DataHooks,
-    CheckpointHooks,
-    Module,
-):
-    # Below is for property support of JIT
-    # since none of these are important when using JIT, we are going to ignore them.
-    __jit_unused_properties__ = (
-        [
-            "example_input_array",
-            "on_gpu",
-            "current_epoch",
-            "global_step",
-            "global_rank",
-            "local_rank",
-            "logger",
-            "loggers",
-            "model_size",
-            "automatic_optimization",
-            "truncated_bptt_steps",
-            "use_amp",
-        ]
-        + DeviceDtypeModuleMixin.__jit_unused_properties__
-        + HyperparametersMixin.__jit_unused_properties__
-    )
-
-    def __init__(self, *args: Any, **kwargs: Any) -> None:
-        super().__init__(*args, **kwargs)
-
-        # see (https://github.com/pytorch/pytorch/blob/3e6bb5233f9ca2c5aa55d9cda22a7ee85439aa6e/
-        # torch/nn/modules/module.py#L227)
-        torch._C._log_api_usage_once(f"lightning.module.{self.__class__.__name__}")
-
-        # pointer to the trainer object
-        self.trainer: Optional["pl.Trainer"] = None
-
-        self._use_amp: bool = False
-
-        # the precision used
-        self.precision: int = 32
-
-        # optionally can be set by user
-        self._example_input_array = None
-        self._current_fx_name: Optional[str] = None
-        self._automatic_optimization: bool = True
-        self._truncated_bptt_steps: int = 0
-        self._param_requires_grad_state = {}
-        self._metric_attributes: Optional[Dict[int, str]] = None
-        self._should_prevent_trainer_and_dataloaders_deepcopy: bool = False
-        # TODO: remove in 1.8
-        self._running_torchscript = False
-
-        self._register_sharded_tensor_state_dict_hooks_if_available()
-
-    @overload
-    def optimizers(self, use_pl_optimizer: Literal[True] = True) -> Union[LightningOptimizer, List[LightningOptimizer]]:
-        ...
-
-    @overload
-    def optimizers(self, use_pl_optimizer: Literal[False]) -> Union[Optimizer, List[Optimizer]]:
-        ...
-
-    @overload
-    def optimizers(
-        self, use_pl_optimizer: bool
-    ) -> Union[Optimizer, LightningOptimizer, List[Optimizer], List[LightningOptimizer]]:
-        ...
-
-
[docs] def optimizers( - self, use_pl_optimizer: bool = True - ) -> Union[Optimizer, LightningOptimizer, List[Optimizer], List[LightningOptimizer]]: - """Returns the optimizer(s) that are being used during training. Useful for manual optimization. - - Args: - use_pl_optimizer: If ``True``, will wrap the optimizer(s) in a - :class:`~pytorch_lightning.core.optimizer.LightningOptimizer` for automatic handling of precision and - profiling. - - Returns: - A single optimizer, or a list of optimizers in case multiple ones are present. - """ - if use_pl_optimizer: - opts = list(self.trainer.strategy._lightning_optimizers.values()) - else: - opts = self.trainer.optimizers - - # single optimizer - if isinstance(opts, list) and len(opts) == 1 and isinstance(opts[0], (Optimizer, LightningOptimizer)): - return opts[0] - # multiple opts - return opts
- -
[docs] def lr_schedulers(self) -> Optional[Union[LRSchedulerTypeUnion, List[LRSchedulerTypeUnion]]]: - """Returns the learning rate scheduler(s) that are being used during training. Useful for manual - optimization. - - Returns: - A single scheduler, or a list of schedulers in case multiple ones are present, or ``None`` if no - schedulers were returned in :meth:`configure_optimizers`. - """ - if not self.trainer.lr_scheduler_configs: - return None - - # ignore other keys "interval", "frequency", etc. - lr_schedulers = [config.scheduler for config in self.trainer.lr_scheduler_configs] - - # single scheduler - if len(lr_schedulers) == 1: - return lr_schedulers[0] - - # multiple schedulers - return lr_schedulers
- - @property - def example_input_array(self) -> Any: - """The example input array is a specification of what the module can consume in the :meth:`forward` method. - The return type is interpreted as follows: - - - Single tensor: It is assumed the model takes a single argument, i.e., - ``model.forward(model.example_input_array)`` - - Tuple: The input array should be interpreted as a sequence of positional arguments, i.e., - ``model.forward(*model.example_input_array)`` - - Dict: The input array represents named keyword arguments, i.e., - ``model.forward(**model.example_input_array)`` - """ - return self._example_input_array - - @example_input_array.setter - def example_input_array(self, example: Any) -> None: - self._example_input_array = example - - @property - def current_epoch(self) -> int: - """The current epoch in the ``Trainer``, or 0 if not attached.""" - return self.trainer.current_epoch if self.trainer else 0 - - @property - def global_step(self) -> int: - """Total training batches seen across all epochs. - - If no Trainer is attached, this propery is 0. - """ - return self.trainer.global_step if self.trainer else 0 - - @property - def global_rank(self) -> int: - """The index of the current process across all nodes and devices.""" - return self.trainer.global_rank if self.trainer else 0 - - @property - def local_rank(self) -> int: - """The index of the current process within a single node.""" - return self.trainer.local_rank if self.trainer else 0 - - @property - def on_gpu(self): - """Returns ``True`` if this model is currently located on a GPU. - - Useful to set flags around the LightningModule for different CPU vs GPU behavior. 
- """ - return self.device.type == "cuda" - - @property - def automatic_optimization(self) -> bool: - """If set to ``False`` you are responsible for calling ``.backward()``, ``.step()``, ``.zero_grad()``.""" - return self._automatic_optimization - - @automatic_optimization.setter - def automatic_optimization(self, automatic_optimization: bool) -> None: - self._automatic_optimization = automatic_optimization - - @property - def truncated_bptt_steps(self) -> int: - """Enables `Truncated Backpropagation Through Time` in the Trainer when set to a positive integer. - - It represents - the number of times :meth:`training_step` gets called before backpropagation. If this is > 0, the - :meth:`training_step` receives an additional argument ``hiddens`` and is expected to return a hidden state. - """ - return self._truncated_bptt_steps - - @truncated_bptt_steps.setter - def truncated_bptt_steps(self, truncated_bptt_steps: int) -> None: - self._truncated_bptt_steps = truncated_bptt_steps - - @property - def logger(self) -> Optional[LightningLoggerBase]: - """Reference to the logger object in the Trainer.""" - return self.trainer.logger if self.trainer else None - - @property - def loggers(self) -> List[LightningLoggerBase]: - """Reference to the list of loggers in the Trainer.""" - return self.trainer.loggers if self.trainer else [] - - def _apply_batch_transfer_handler( - self, batch: Any, device: Optional[torch.device] = None, dataloader_idx: int = 0 - ) -> Any: - device = device or self.device - datahook_selector = ( - _DataHookSelector(self, None) if self.trainer is None else self.trainer._data_connector._datahook_selector - ) - - hook = datahook_selector.get_hook("on_before_batch_transfer") - batch = hook(batch, dataloader_idx) - hook = datahook_selector.get_hook("transfer_batch_to_device") - batch = hook(batch, device, dataloader_idx) - hook = datahook_selector.get_hook("on_after_batch_transfer") - batch = hook(batch, dataloader_idx) - return batch - -
def print(self, *args, **kwargs) -> None:
    r"""
    Prints only from process 0. Use this in any distributed mode to log only once.

    When the Trainer has an enabled progress bar callback, the output is routed through that
    callback's ``print``; otherwise Python's built-in ``print`` is used.

    Args:
        *args: The thing to print. The same as for Python's built-in print function.
        **kwargs: The same as for Python's built-in print function.

    Example::

        def forward(self, x):
            self.print(x, 'in forward')

    """
    # Every process other than global rank zero stays silent.
    if not self.trainer.is_global_zero:
        return

    bar = self.trainer.progress_bar_callback
    if bar is None or not bar.is_enabled:
        print(*args, **kwargs)
    else:
        bar.print(*args, **kwargs)
- -
def log(
    self,
    name: str,
    value: _METRIC_COLLECTION,
    prog_bar: bool = False,
    logger: bool = True,
    on_step: Optional[bool] = None,
    on_epoch: Optional[bool] = None,
    reduce_fx: Union[str, Callable] = "mean",
    enable_graph: bool = False,
    sync_dist: bool = False,
    sync_dist_group: Optional[Any] = None,
    add_dataloader_idx: bool = True,
    batch_size: Optional[int] = None,
    metric_attribute: Optional[str] = None,
    rank_zero_only: bool = False,
) -> None:
    """Log a key, value pair.

    Example::

        self.log('train_loss', loss)

    The default behavior per hook is documented here: :ref:`extensions/logging:Automatic Logging`.

    If no ``Trainer`` is attached, a warning is emitted and nothing is logged.

    Args:
        name: key to log.
        value: value to log. Can be a ``float``, ``Tensor``, ``Metric``, or a dictionary of the former.
        prog_bar: if ``True`` logs to the progress bar.
        logger: if ``True`` logs to the logger.
        on_step: if ``True`` logs at this step. The default value is determined by the hook.
            See :ref:`extensions/logging:Automatic Logging` for details.
        on_epoch: if ``True`` logs epoch accumulated metrics. The default value is determined by the hook.
            See :ref:`extensions/logging:Automatic Logging` for details.
        reduce_fx: reduction function over step values for end of epoch. :meth:`torch.mean` by default.
        enable_graph: if ``True``, will not auto detach the graph.
        sync_dist: if ``True``, reduces the metric across devices. Use with care as this may lead to a significant
            communication overhead.
        sync_dist_group: the DDP group to sync across.
        add_dataloader_idx: if ``True``, appends the index of the current dataloader to
            the name (when using multiple dataloaders). If False, user needs to give unique names for
            each dataloader to not mix the values.
        batch_size: Current batch_size. This will be directly inferred from the loaded batch,
            but for some data structures you might need to explicitly provide it.
        metric_attribute: To restore the metric state, Lightning requires the reference of the
            :class:`torchmetrics.Metric` in your model. This is found automatically if it is a model attribute.
        rank_zero_only: Whether the value will be logged only on rank 0. This will prevent synchronization which
            would produce a deadlock as not all processes would perform this log call.

    Raises:
        ValueError: If ``value`` is a dictionary containing another dictionary, or (presumably, depending on
            how ``apply_to_collection`` applies ``wrong_dtype``) contains a value of an unsupported type.
        MisconfigurationException: If the Trainer's result collection is ``None``, if no hook is currently
            being run (``self._current_fx_name`` is ``None``), if ``name`` contains ``"/dataloader_idx_"``,
            if a logged ``Metric`` cannot be matched to an attribute of this module, or if ``batch_size`` is
            missing while training with a ``training_step`` that explicitly takes ``dataloader_iter``.
    """
    # check for invalid values
    # first pass: dictionaries are handed to ``__check_not_nested``, which rejects nested dictionaries
    apply_to_collection(value, dict, self.__check_not_nested, name)
    # second pass: ``__check_allowed`` unconditionally raises; ``wrong_dtype`` lists the types exempt from it
    # NOTE(review): relies on ``apply_to_collection`` skipping ``wrong_dtype`` instances - confirm in the helper
    apply_to_collection(
        value, object, self.__check_allowed, name, value, wrong_dtype=(numbers.Number, Metric, Tensor, dict)
    )

    if self.trainer is None:
        # not an error to support testing the `*_step` methods without a `Trainer` reference
        rank_zero_warn(
            "You are trying to `self.log()` but the `self.trainer` reference is not registered on the model yet."
            " This is most likely because the model hasn't been passed to the `Trainer`"
        )
        return
    results = self.trainer._results
    if results is None:
        raise MisconfigurationException(
            "You are trying to `self.log()` but the loop's result collection is not registered"
            " yet. This is most likely because you are trying to log in a `predict` hook,"
            " but it doesn't support logging"
        )
    if self._current_fx_name is None:
        raise MisconfigurationException(
            "You are trying to `self.log()` but it is not managed by the `Trainer` control flow"
        )

    # resolve ``None`` for on_step/on_epoch into the defaults of the hook that is currently running
    on_step, on_epoch = _FxValidator.check_logging_and_get_default_levels(
        self._current_fx_name, on_step=on_step, on_epoch=on_epoch
    )

    # make sure user doesn't introduce logic for multi-dataloaders
    if "/dataloader_idx_" in name:
        raise MisconfigurationException(
            f"You called `self.log` with the key `{name}`"
            " but it should not contain information about `dataloader_idx`"
        )

    # plain Python numbers become tensors on this module's device (see ``__to_tensor``)
    value = apply_to_collection(value, numbers.Number, self.__to_tensor)

    if self.trainer._logger_connector.should_reset_tensors(self._current_fx_name):
        # if we started a new epoch (running its first batch) the hook name has changed
        # reset any tensors for the new hook name
        results.reset(metrics=False, fx=self._current_fx_name)

    # a ``Metric`` logged without an explicit ``metric_attribute`` is looked up among this module's submodules
    if metric_attribute is None and isinstance(value, Metric):
        if self._metric_attributes is None:
            # compute once
            # maps ``id(metric)`` -> attribute name; the comprehension's ``name`` does not leak into the
            # enclosing scope, so the ``name`` parameter is untouched
            self._metric_attributes = {
                id(module): name for name, module in self.named_modules() if isinstance(module, Metric)
            }
            if not self._metric_attributes:
                raise MisconfigurationException(
                    "Could not find the `LightningModule` attribute for the `torchmetrics.Metric` logged."
                    " You can fix this by setting an attribute for the metric in your `LightningModule`."
                )
        # try to find the passed metric in the LightningModule
        metric_attribute = self._metric_attributes.get(id(value), None)
        if metric_attribute is None:
            raise MisconfigurationException(
                "Could not find the `LightningModule` attribute for the `torchmetrics.Metric` logged."
                f" You can fix this by calling `self.log({name}, ..., metric_attribute=name)` where `name` is one"
                f" of {list(self._metric_attributes.values())}"
            )

    # when ``training_step`` explicitly takes ``dataloader_iter``, the caller must pass ``batch_size``
    if (
        self.trainer.training
        and is_param_in_hook_signature(self.training_step, "dataloader_iter", explicit=True)
        and batch_size is None
    ):
        raise MisconfigurationException(
            "With `def training_step(self, dataloader_iter)`, `self.log(..., batch_size=...)` should be provided."
        )

    results.log(
        self._current_fx_name,
        name,
        value,
        prog_bar=prog_bar,
        logger=logger,
        on_step=on_step,
        on_epoch=on_epoch,
        reduce_fx=reduce_fx,
        enable_graph=enable_graph,
        add_dataloader_idx=add_dataloader_idx,
        batch_size=batch_size,
        # syncing is only requested when ``distributed_available()`` is truthy
        sync_dist=sync_dist and distributed_available(),
        # falls back to ``sync_ddp`` when the strategy's ``reduce`` is falsy
        sync_dist_fn=self.trainer.strategy.reduce or sync_ddp,
        sync_dist_group=sync_dist_group,
        metric_attribute=metric_attribute,
        rank_zero_only=rank_zero_only,
    )

    # record on the logger connector which hook performed the most recent log call
    self.trainer._logger_connector._current_fx = self._current_fx_name
- -
def log_dict(
    self,
    dictionary: Mapping[str, _METRIC_COLLECTION],
    prog_bar: bool = False,
    logger: bool = True,
    on_step: Optional[bool] = None,
    on_epoch: Optional[bool] = None,
    reduce_fx: Union[str, Callable] = "mean",
    enable_graph: bool = False,
    sync_dist: bool = False,
    sync_dist_group: Optional[Any] = None,
    add_dataloader_idx: bool = True,
    batch_size: Optional[int] = None,
    rank_zero_only: bool = False,
) -> None:
    """Log a dictionary of values at once.

    Every ``(key, value)`` pair is forwarded to :meth:`log` with the same options.

    Example::

        values = {'loss': loss, 'acc': acc, ..., 'metric_n': metric_n}
        self.log_dict(values)

    Args:
        dictionary: key value pairs.
            The values can be a ``float``, ``Tensor``, ``Metric``, or a dictionary of the former.
        prog_bar: if ``True`` logs to the progress bar.
        logger: if ``True`` logs to the logger.
        on_step: if ``True`` logs at this step.
            ``None`` auto-logs for training_step but not validation/test_step.
            The default value is determined by the hook.
            See :ref:`extensions/logging:Automatic Logging` for details.
        on_epoch: if ``True`` logs epoch accumulated metrics.
            ``None`` auto-logs for val/test step but not ``training_step``.
            The default value is determined by the hook.
            See :ref:`extensions/logging:Automatic Logging` for details.
        reduce_fx: reduction function over step values for end of epoch. :meth:`torch.mean` by default.
        enable_graph: if ``True``, will not auto-detach the graph
        sync_dist: if ``True``, reduces the metric across GPUs/TPUs. Use with care as this may lead to a significant
            communication overhead.
        sync_dist_group: the ddp group to sync across.
        add_dataloader_idx: if ``True``, appends the index of the current dataloader to
            the name (when using multiple). If ``False``, user needs to give unique names for
            each dataloader to not mix values.
        batch_size: Current batch size. This will be directly inferred from the loaded batch,
            but some data structures might need to explicitly provide it.
        rank_zero_only: Whether the value will be logged only on rank 0. This will prevent synchronization which
            would produce a deadlock as not all processes would perform this log call.
    """
    # Options that are identical for every entry are collected once and reused for each call.
    shared_options = dict(
        prog_bar=prog_bar,
        logger=logger,
        on_step=on_step,
        on_epoch=on_epoch,
        reduce_fx=reduce_fx,
        enable_graph=enable_graph,
        sync_dist=sync_dist,
        sync_dist_group=sync_dist_group,
        add_dataloader_idx=add_dataloader_idx,
        batch_size=batch_size,
        rank_zero_only=rank_zero_only,
    )
    for metric_name, metric_value in dictionary.items():
        self.log(name=metric_name, value=metric_value, **shared_options)
@staticmethod
def __check_not_nested(value: dict, name: str) -> dict:
    """Return ``value`` unchanged, raising ``ValueError`` if any of its values is itself a dictionary."""
    # self-imposed restriction. for simplicity
    for entry in value.values():
        if isinstance(entry, dict):
            raise ValueError(f"`self.log({name}, {value})` was called, but nested dictionaries cannot be logged")
    return value


@staticmethod
def __check_allowed(v: Any, name: str, value: Any) -> None:
    """Always raise ``ValueError`` naming the type of ``v``; callers only route unsupported values here."""
    message = f"`self.log({name}, {value})` was called, but `{type(v).__name__}` values cannot be logged"
    raise ValueError(message)


def __to_tensor(self, value: numbers.Number) -> torch.Tensor:
    """Wrap a Python number in a tensor created on this module's device."""
    target_device = self.device
    return torch.tensor(value, device=target_device)


def log_grad_norm(self, grad_norm_dict: Dict[str, float]) -> None:
    """Override this method to change the default behaviour of ``log_grad_norm``.

    If clipping gradients, the gradients will not have been clipped yet.

    Args:
        grad_norm_dict: Dictionary containing current grad norm metrics

    Example::

        # DEFAULT
        def log_grad_norm(self, grad_norm_dict):
            self.log_dict(grad_norm_dict, on_step=True, on_epoch=True, prog_bar=False, logger=True)
    """
    # Default: log per step and per epoch, to the logger only (not the progress bar).
    default_options = {"on_step": True, "on_epoch": True, "prog_bar": False, "logger": True}
    self.log_dict(grad_norm_dict, **default_options)
def all_gather(
    self, data: Union[torch.Tensor, Dict, List, Tuple], group: Optional[Any] = None, sync_grads: bool = False
):
    r"""
    Allows users to call ``self.all_gather()`` from the LightningModule, thus making the ``all_gather`` operation
    accelerator agnostic. ``all_gather`` is a function provided by accelerators to gather a tensor from several
    distributed processes.

    Args:
        data: int, float, tensor of shape (batch, ...), or a (possibly nested) collection thereof.
        group: the process group to gather results from. Defaults to all processes (world)
        sync_grads: flag that allows users to synchronize gradients for the all_gather operation

    Return:
        A tensor of shape (world_size, batch, ...), or if the input was a collection
        the output will also be a collection with tensors of this shape.
    """
    # The world group is only looked up when the caller did not pass a group.
    if group is None:
        group = torch.distributed.group.WORLD

    gather_fn = self.trainer.strategy.all_gather
    tensors = convert_to_tensors(data, device=self.device)
    # The strategy's gather is applied to every tensor found in the (possibly nested) collection.
    return apply_to_collection(tensors, torch.Tensor, gather_fn, group=group, sync_grads=sync_grads)
- -
def forward(self, *args, **kwargs) -> Any:
    r"""
    Same as :meth:`torch.nn.Module.forward()`.

    This implementation only delegates to the parent class' ``forward``.

    Args:
        *args: Whatever you decide to pass into the forward method.
        **kwargs: Keyword arguments are also possible.

    Return:
        Your model's output
    """
    parent_forward = super().forward
    return parent_forward(*args, **kwargs)
- -
def training_step(self, *args, **kwargs) -> STEP_OUTPUT:
    r"""
    Here you compute and return the training loss and some additional metrics for e.g.
    the progress bar or logger.

    This base implementation only emits a warning that the hook must be implemented.

    Args:
        batch (:class:`~torch.Tensor` | (:class:`~torch.Tensor`, ...) | [:class:`~torch.Tensor`, ...]):
            The output of your :class:`~torch.utils.data.DataLoader`. A tensor, tuple or list.
        batch_idx (``int``): Integer displaying index of this batch
        optimizer_idx (``int``): When using multiple optimizers, this argument will also be present.
        hiddens (``Any``): Passed in if
            :paramref:`~pytorch_lightning.core.lightning.LightningModule.truncated_bptt_steps` > 0.

    Return:
        Any of.

        - :class:`~torch.Tensor` - The loss tensor
        - ``dict`` - A dictionary. Can include any keys, but must include the key ``'loss'``
        - ``None`` - Training will skip to the next batch. This is only for automatic optimization.
            This is not supported for multi-GPU, TPU, IPU, or DeepSpeed.

    In this step you'd normally do the forward pass and calculate the loss for a batch.
    You can also do fancier things like multiple forward passes or something model specific.

    Example::

        def training_step(self, batch, batch_idx):
            x, y, z = batch
            out = self.encoder(x)
            loss = self.loss(out, x)
            return loss

    If you define multiple optimizers, this step will be called with an additional
    ``optimizer_idx`` parameter.

    .. code-block:: python

        # Multiple optimizers (e.g.: GANs)
        def training_step(self, batch, batch_idx, optimizer_idx):
            if optimizer_idx == 0:
                # do training_step with encoder
                ...
            if optimizer_idx == 1:
                # do training_step with decoder
                ...


    If you add truncated back propagation through time you will also get an additional
    argument with the hidden states of the previous step.

    .. code-block:: python

        # Truncated back-propagation through time
        def training_step(self, batch, batch_idx, hiddens):
            # hiddens are the hidden states from the previous truncated backprop step
            out, hiddens = self.lstm(batch, hiddens)
            loss = ...
            return {"loss": loss, "hiddens": hiddens}

    Note:
        The loss value shown in the progress bar is smoothed (averaged) over the last values,
        so it differs from the actual loss returned in train/validation step.
    """
    # Nothing is computed here; the warning tells the user that an override is required.
    message = "`training_step` must be implemented to be used with the Lightning Trainer"
    rank_zero_warn(message)
- -
def training_step_end(self, step_output: STEP_OUTPUT) -> STEP_OUTPUT:
    """Use this when training with dp or ddp2 because :meth:`training_step` will operate on only part of the
    batch. However, this is still optional and only needed for things like softmax or NCE loss.

    The base implementation is empty.

    Note:
        If you later switch to ddp or some other mode, this will still be called
        so that you don't have to change your code

    .. code-block:: python

        # pseudocode
        sub_batches = split_batches_for_dp(batch)
        step_output = [training_step(sub_batch) for sub_batch in sub_batches]
        training_step_end(step_output)

    Args:
        step_output: What you return in :meth:`training_step` for each batch part.

    Return:
        Anything

    When using dp/ddp2 distributed backends, only a portion of the batch is inside the training_step:

    .. code-block:: python

        def training_step(self, batch, batch_idx):
            # batch is 1/num_gpus big
            x, y = batch

            out = self(x)

            # softmax uses only a portion of the batch in the denominator
            loss = self.softmax(out)
            loss = nce_loss(loss)
            return loss

    If you wish to do something with all the parts of the batch, then use this method to do it:

    .. code-block:: python

        def training_step(self, batch, batch_idx):
            # batch is 1/num_gpus big
            x, y = batch

            out = self.encoder(x)
            return {"pred": out}


        def training_step_end(self, training_step_outputs):
            gpu_0_pred = training_step_outputs[0]["pred"]
            gpu_1_pred = training_step_outputs[1]["pred"]
            gpu_n_pred = training_step_outputs[n]["pred"]

            # this softmax now uses the full batch
            loss = nce_loss([gpu_0_pred, gpu_1_pred, gpu_n_pred])
            return loss

    See Also:
        See the :ref:`accelerators/gpu:Multi GPU Training` guide for more details.
    """
- -
def training_epoch_end(self, outputs: EPOCH_OUTPUT) -> None:
    """Called at the end of the training epoch with the outputs of all training steps. Use this in case you
    need to do something with all the outputs returned by :meth:`training_step`.

    The base implementation is empty.

    .. code-block:: python

        # the pseudocode for these calls
        train_outs = []
        for train_batch in train_data:
            out = training_step(train_batch)
            train_outs.append(out)
        training_epoch_end(train_outs)

    Args:
        outputs: List of outputs you defined in :meth:`training_step`. If there are multiple optimizers or when
            using ``truncated_bptt_steps > 0``, the lists have the dimensions
            (n_batches, tbptt_steps, n_optimizers). Dimensions of length 1 are squeezed.

    Return:
        None

    Note:
        If this method is not overridden, this won't be called.

    .. code-block:: python

        def training_epoch_end(self, training_step_outputs):
            # do something with all training_step outputs
            for out in training_step_outputs:
                ...
    """
- -
def validation_step(self, *args, **kwargs) -> Optional[STEP_OUTPUT]:
    r"""
    Operates on a single batch of data from the validation set.
    In this step you might generate examples or calculate anything of interest like accuracy.

    The base implementation is empty.

    .. code-block:: python

        # the pseudocode for these calls
        val_outs = []
        for val_batch in val_data:
            out = validation_step(val_batch)
            val_outs.append(out)
        validation_epoch_end(val_outs)

    Args:
        batch: The output of your :class:`~torch.utils.data.DataLoader`.
        batch_idx: The index of this batch.
        dataloader_idx: The index of the dataloader that produced this batch.
            (only if multiple val dataloaders used)

    Return:
        - Any object or value
        - ``None`` - Validation will skip to the next batch

    .. code-block:: python

        # pseudocode of order
        val_outs = []
        for val_batch in val_data:
            out = validation_step(val_batch)
            if defined("validation_step_end"):
                out = validation_step_end(out)
            val_outs.append(out)
        validation_epoch_end(val_outs)


    .. code-block:: python

        # if you have one val dataloader:
        def validation_step(self, batch, batch_idx):
            ...


        # if you have multiple val dataloaders:
        def validation_step(self, batch, batch_idx, dataloader_idx=0):
            ...

    Examples::

        # CASE 1: A single validation dataset
        def validation_step(self, batch, batch_idx):
            x, y = batch

            # implement your own
            out = self(x)
            loss = self.loss(out, y)

            # log 6 example images
            # or generated text... or whatever
            sample_imgs = x[:6]
            grid = torchvision.utils.make_grid(sample_imgs)
            self.logger.experiment.add_image('example_images', grid, 0)

            # calculate acc
            labels_hat = torch.argmax(out, dim=1)
            val_acc = torch.sum(y == labels_hat).item() / (len(y) * 1.0)

            # log the outputs!
            self.log_dict({'val_loss': loss, 'val_acc': val_acc})

    If you pass in multiple val dataloaders, :meth:`validation_step` will have an additional argument. We recommend
    setting the default value of 0 so that you can quickly switch between single and multiple dataloaders.

    .. code-block:: python

        # CASE 2: multiple validation dataloaders
        def validation_step(self, batch, batch_idx, dataloader_idx=0):
            # dataloader_idx tells you which dataset this is.
            ...

    Note:
        If you don't need to validate you don't need to implement this method.

    Note:
        When the :meth:`validation_step` is called, the model has been put in eval mode
        and PyTorch gradients have been disabled. At the end of validation,
        the model goes back to training mode and gradients are enabled.
    """
- -
def validation_step_end(self, *args, **kwargs) -> Optional[STEP_OUTPUT]:
    """Use this when validating with dp or ddp2 because :meth:`validation_step` will operate on only part of
    the batch. However, this is still optional and only needed for things like softmax or NCE loss.

    The base implementation is empty.

    Note:
        If you later switch to ddp or some other mode, this will still be called
        so that you don't have to change your code.

    .. code-block:: python

        # pseudocode
        sub_batches = split_batches_for_dp(batch)
        step_output = [validation_step(sub_batch) for sub_batch in sub_batches]
        validation_step_end(step_output)

    Args:
        step_output: What you return in :meth:`validation_step` for each batch part.

    Return:
        None or anything

    .. code-block:: python

        # WITHOUT validation_step_end
        # if used in DP or DDP2, this batch is 1/num_gpus large
        def validation_step(self, batch, batch_idx):
            # batch is 1/num_gpus big
            x, y = batch

            out = self.encoder(x)
            loss = self.softmax(out)
            loss = nce_loss(loss)
            self.log("val_loss", loss)


        # --------------
        # with validation_step_end to do softmax over the full batch
        def validation_step(self, batch, batch_idx):
            # batch is 1/num_gpus big
            x, y = batch

            out = self(x)
            return out


        def validation_step_end(self, val_step_outputs):
            for out in val_step_outputs:
                ...

    See Also:
        See the :ref:`accelerators/gpu:Multi GPU Training` guide for more details.
    """
- -
def validation_epoch_end(self, outputs: Union[EPOCH_OUTPUT, List[EPOCH_OUTPUT]]) -> None:
    """Called at the end of the validation epoch with the outputs of all validation steps.

    The base implementation is empty.

    .. code-block:: python

        # the pseudocode for these calls
        val_outs = []
        for val_batch in val_data:
            out = validation_step(val_batch)
            val_outs.append(out)
        validation_epoch_end(val_outs)

    Args:
        outputs: List of outputs you defined in :meth:`validation_step`, or if there
            are multiple dataloaders, a list containing a list of outputs for each dataloader.

    Return:
        None

    Note:
        If you didn't define a :meth:`validation_step`, this won't be called.

    Examples:
        With a single dataloader:

        .. code-block:: python

            def validation_epoch_end(self, val_step_outputs):
                for out in val_step_outputs:
                    ...

        With multiple dataloaders, `outputs` will be a list of lists. The outer list contains
        one entry per dataloader, while the inner list contains the individual outputs of
        each validation step for that dataloader.

        .. code-block:: python

            def validation_epoch_end(self, outputs):
                final_value = 0
                for dataloader_outputs in outputs:
                    for val_step_out in dataloader_outputs:
                        # do something
                        final_value += val_step_out

                self.log("final_metric", final_value)
    """
- -
def test_step(self, *args, **kwargs) -> Optional[STEP_OUTPUT]:
    r"""
    Operates on a single batch of data from the test set.
    In this step you'd normally generate examples or calculate anything of interest
    such as accuracy.

    The base implementation is empty.

    .. code-block:: python

        # the pseudocode for these calls
        test_outs = []
        for test_batch in test_data:
            out = test_step(test_batch)
            test_outs.append(out)
        test_epoch_end(test_outs)

    Args:
        batch: The output of your :class:`~torch.utils.data.DataLoader`.
        batch_idx: The index of this batch.
        dataloader_idx: The index of the dataloader that produced this batch.
            (only if multiple test dataloaders used).

    Return:
       Any of.

        - Any object or value
        - ``None`` - Testing will skip to the next batch

    .. code-block:: python

        # if you have one test dataloader:
        def test_step(self, batch, batch_idx):
            ...


        # if you have multiple test dataloaders:
        def test_step(self, batch, batch_idx, dataloader_idx=0):
            ...

    Examples::

        # CASE 1: A single test dataset
        def test_step(self, batch, batch_idx):
            x, y = batch

            # implement your own
            out = self(x)
            loss = self.loss(out, y)

            # log 6 example images
            # or generated text... or whatever
            sample_imgs = x[:6]
            grid = torchvision.utils.make_grid(sample_imgs)
            self.logger.experiment.add_image('example_images', grid, 0)

            # calculate acc
            labels_hat = torch.argmax(out, dim=1)
            test_acc = torch.sum(y == labels_hat).item() / (len(y) * 1.0)

            # log the outputs!
            self.log_dict({'test_loss': loss, 'test_acc': test_acc})

    If you pass in multiple test dataloaders, :meth:`test_step` will have an additional argument. We recommend
    setting the default value of 0 so that you can quickly switch between single and multiple dataloaders.

    .. code-block:: python

        # CASE 2: multiple test dataloaders
        def test_step(self, batch, batch_idx, dataloader_idx=0):
            # dataloader_idx tells you which dataset this is.
            ...

    Note:
        If you don't need to test you don't need to implement this method.

    Note:
        When the :meth:`test_step` is called, the model has been put in eval mode and
        PyTorch gradients have been disabled. At the end of the test epoch, the model goes back
        to training mode and gradients are enabled.
    """
- -
def test_step_end(self, *args, **kwargs) -> Optional[STEP_OUTPUT]:
    """Use this when testing with dp or ddp2 because :meth:`test_step` will operate on only part of the batch.
    However, this is still optional and only needed for things like softmax or NCE loss.

    The base implementation is empty.

    Note:
        If you later switch to ddp or some other mode, this will still be called
        so that you don't have to change your code.

    .. code-block:: python

        # pseudocode
        sub_batches = split_batches_for_dp(batch)
        step_output = [test_step(sub_batch) for sub_batch in sub_batches]
        test_step_end(step_output)

    Args:
        step_output: What you return in :meth:`test_step` for each batch part.

    Return:
        None or anything

    .. code-block:: python

        # WITHOUT test_step_end
        # if used in DP or DDP2, this batch is 1/num_gpus large
        def test_step(self, batch, batch_idx):
            # batch is 1/num_gpus big
            x, y = batch

            out = self(x)
            loss = self.softmax(out)
            self.log("test_loss", loss)


        # --------------
        # with test_step_end to do softmax over the full batch
        def test_step(self, batch, batch_idx):
            # batch is 1/num_gpus big
            x, y = batch

            out = self.encoder(x)
            return out


        def test_step_end(self, output_results):
            # this out is now the full size of the batch
            all_test_step_outs = output_results.out
            loss = nce_loss(all_test_step_outs)
            self.log("test_loss", loss)

    See Also:
        See the :ref:`accelerators/gpu:Multi GPU Training` guide for more details.
    """
- -
def test_epoch_end(self, outputs: Union[EPOCH_OUTPUT, List[EPOCH_OUTPUT]]) -> None:
    """Called at the end of a test epoch with the output of all test steps.

    The base implementation is empty.

    .. code-block:: python

        # the pseudocode for these calls
        test_outs = []
        for test_batch in test_data:
            out = test_step(test_batch)
            test_outs.append(out)
        test_epoch_end(test_outs)

    Args:
        outputs: List of outputs you defined in :meth:`test_step_end`, or if there
            are multiple dataloaders, a list containing a list of outputs for each dataloader

    Return:
        None

    Note:
        If you didn't define a :meth:`test_step`, this won't be called.

    Examples:
        With a single dataloader:

        .. code-block:: python

            def test_epoch_end(self, outputs):
                # do something with the outputs of all test batches
                some_result = calc_all_results(outputs)
                self.log("some_result", some_result)

        With multiple dataloaders, `outputs` will be a list of lists. The outer list contains
        one entry per dataloader, while the inner list contains the individual outputs of
        each test step for that dataloader.

        .. code-block:: python

            def test_epoch_end(self, outputs):
                final_value = 0
                for dataloader_outputs in outputs:
                    for test_step_out in dataloader_outputs:
                        # do something
                        final_value += test_step_out

                self.log("final_metric", final_value)
    """
- -
def predict_step(self, batch: Any, batch_idx: int, dataloader_idx: int = 0) -> Any:
    """Step function called during :meth:`~pytorch_lightning.trainer.trainer.Trainer.predict`. By default, it
    calls :meth:`~pytorch_lightning.core.lightning.LightningModule.forward`. Override to add any processing
    logic.

    The :meth:`~pytorch_lightning.core.lightning.LightningModule.predict_step` is used
    to scale inference on multi-devices.

    To prevent an OOM error, it is possible to use :class:`~pytorch_lightning.callbacks.BasePredictionWriter`
    callback to write the predictions to disk or database after each batch or on epoch end.

    The :class:`~pytorch_lightning.callbacks.BasePredictionWriter` should be used while using a spawn
    based accelerator. This happens for ``Trainer(strategy="ddp_spawn")``
    or training on 8 TPU cores with ``Trainer(accelerator="tpu", devices=8)`` as predictions won't be returned.

    Example ::

        class MyModel(LightningModule):

            def predict_step(self, batch, batch_idx, dataloader_idx=0):
                return self(batch)

        dm = ...
        model = MyModel()
        trainer = Trainer(accelerator="gpu", devices=2)
        predictions = trainer.predict(model, dm)


    Args:
        batch: Current batch.
        batch_idx: Index of current batch.
        dataloader_idx: Index of the current dataloader.

    Return:
        Predicted output
    """
    # The default ignores both indices and simply calls the module on the batch.
    prediction = self(batch)
    return prediction
- -
def configure_callbacks(self) -> Union[Sequence[Callback], Callback]:
    """Configure model-specific callbacks. When the model gets attached, e.g., when ``.fit()`` or ``.test()``
    gets called, the list or a callback returned here will be merged with the list of callbacks passed to the
    Trainer's ``callbacks`` argument. If a callback returned here has the same type as one or several callbacks
    already present in the Trainer's callbacks list, it will take priority and replace them. In addition,
    Lightning will make sure :class:`~pytorch_lightning.callbacks.model_checkpoint.ModelCheckpoint` callbacks
    run last.

    Return:
        A callback or a list of callbacks which will extend the list of callbacks in the Trainer.
        The base implementation returns an empty list.

    Example::

        def configure_callbacks(self):
            early_stop = EarlyStopping(monitor="val_acc", mode="max")
            checkpoint = ModelCheckpoint(monitor="val_loss")
            return [early_stop, checkpoint]

    Note:
        Certain callback methods like :meth:`~pytorch_lightning.callbacks.base.Callback.on_init_start`
        will never be invoked on the new callbacks returned here.
    """
    # A new list is created on every call, so callers never share a mutable default.
    model_callbacks = []
    return model_callbacks
- -
[docs] def configure_optimizers(self): - r""" - Choose what optimizers and learning-rate schedulers to use in your optimization. - Normally you'd need one. But in the case of GANs or similar you might have multiple. - - Return: - Any of these 6 options. - - - **Single optimizer**. - - **List or Tuple** of optimizers. - - **Two lists** - The first list has multiple optimizers, and the second has multiple LR schedulers - (or multiple ``lr_scheduler_config``). - - **Dictionary**, with an ``"optimizer"`` key, and (optionally) a ``"lr_scheduler"`` - key whose value is a single LR scheduler or ``lr_scheduler_config``. - - **Tuple of dictionaries** as described above, with an optional ``"frequency"`` key. - - **None** - Fit will run without any optimizer. - - The ``lr_scheduler_config`` is a dictionary which contains the scheduler and its associated configuration. - The default configuration is shown below. - - .. code-block:: python - - lr_scheduler_config = { - # REQUIRED: The scheduler instance - "scheduler": lr_scheduler, - # The unit of the scheduler's step size, could also be 'step'. - # 'epoch' updates the scheduler on epoch end whereas 'step' - # updates it after a optimizer update. - "interval": "epoch", - # How many epochs/steps should pass between calls to - # `scheduler.step()`. 1 corresponds to updating the learning - # rate after every epoch/step. - "frequency": 1, - # Metric to to monitor for schedulers like `ReduceLROnPlateau` - "monitor": "val_loss", - # If set to `True`, will enforce that the value specified 'monitor' - # is available when the scheduler is updated, thus stopping - # training if not found. 
If set to `False`, it will only produce a warning - "strict": True, - # If using the `LearningRateMonitor` callback to monitor the - # learning rate progress, this keyword can be used to specify - # a custom logged name - "name": None, - } - - When there are schedulers in which the ``.step()`` method is conditioned on a value, such as the - :class:`torch.optim.lr_scheduler.ReduceLROnPlateau` scheduler, Lightning requires that the - ``lr_scheduler_config`` contains the keyword ``"monitor"`` set to the metric name that the scheduler - should be conditioned on. - - .. testcode:: - - # The ReduceLROnPlateau scheduler requires a monitor - def configure_optimizers(self): - optimizer = Adam(...) - return { - "optimizer": optimizer, - "lr_scheduler": { - "scheduler": ReduceLROnPlateau(optimizer, ...), - "monitor": "metric_to_track", - "frequency": "indicates how often the metric is updated" - # If "monitor" references validation metrics, then "frequency" should be set to a - # multiple of "trainer.check_val_every_n_epoch". - }, - } - - - # In the case of two optimizers, only one using the ReduceLROnPlateau scheduler - def configure_optimizers(self): - optimizer1 = Adam(...) - optimizer2 = SGD(...) - scheduler1 = ReduceLROnPlateau(optimizer1, ...) - scheduler2 = LambdaLR(optimizer2, ...) - return ( - { - "optimizer": optimizer1, - "lr_scheduler": { - "scheduler": scheduler1, - "monitor": "metric_to_track", - }, - }, - {"optimizer": optimizer2, "lr_scheduler": scheduler2}, - ) - - Metrics can be made available to monitor by simply logging it using - ``self.log('metric_to_track', metric_val)`` in your :class:`~pytorch_lightning.core.lightning.LightningModule`. - - Note: - The ``frequency`` value specified in a dict along with the ``optimizer`` key is an int corresponding - to the number of sequential batches optimized with the specific optimizer. - It should be given to none or to all of the optimizers. 
- There is a difference between passing multiple optimizers in a list, - and passing multiple optimizers in dictionaries with a frequency of 1: - - - In the former case, all optimizers will operate on the given batch in each optimization step. - - In the latter, only one optimizer will operate on the given batch at every step. - - This is different from the ``frequency`` value specified in the ``lr_scheduler_config`` mentioned above. - - .. code-block:: python - - def configure_optimizers(self): - optimizer_one = torch.optim.SGD(self.model.parameters(), lr=0.01) - optimizer_two = torch.optim.SGD(self.model.parameters(), lr=0.01) - return [ - {"optimizer": optimizer_one, "frequency": 5}, - {"optimizer": optimizer_two, "frequency": 10}, - ] - - In this example, the first optimizer will be used for the first 5 steps, - the second optimizer for the next 10 steps and that cycle will continue. - If an LR scheduler is specified for an optimizer using the ``lr_scheduler`` key in the above dict, - the scheduler will only be updated when its optimizer is being used. - - Examples:: - - # most cases. 
no learning rate scheduler - def configure_optimizers(self): - return Adam(self.parameters(), lr=1e-3) - - # multiple optimizer case (e.g.: GAN) - def configure_optimizers(self): - gen_opt = Adam(self.model_gen.parameters(), lr=0.01) - dis_opt = Adam(self.model_dis.parameters(), lr=0.02) - return gen_opt, dis_opt - - # example with learning rate schedulers - def configure_optimizers(self): - gen_opt = Adam(self.model_gen.parameters(), lr=0.01) - dis_opt = Adam(self.model_dis.parameters(), lr=0.02) - dis_sch = CosineAnnealing(dis_opt, T_max=10) - return [gen_opt, dis_opt], [dis_sch] - - # example with step-based learning rate schedulers - # each optimizer has its own scheduler - def configure_optimizers(self): - gen_opt = Adam(self.model_gen.parameters(), lr=0.01) - dis_opt = Adam(self.model_dis.parameters(), lr=0.02) - gen_sch = { - 'scheduler': ExponentialLR(gen_opt, 0.99), - 'interval': 'step' # called after each training step - } - dis_sch = CosineAnnealing(dis_opt, T_max=10) # called every epoch - return [gen_opt, dis_opt], [gen_sch, dis_sch] - - # example with optimizer frequencies - # see training procedure in `Improved Training of Wasserstein GANs`, Algorithm 1 - # https://arxiv.org/abs/1704.00028 - def configure_optimizers(self): - gen_opt = Adam(self.model_gen.parameters(), lr=0.01) - dis_opt = Adam(self.model_dis.parameters(), lr=0.02) - n_critic = 5 - return ( - {'optimizer': dis_opt, 'frequency': n_critic}, - {'optimizer': gen_opt, 'frequency': 1} - ) - - Note: - Some things to know: - - - Lightning calls ``.backward()`` and ``.step()`` on each optimizer and learning rate scheduler as needed. - - If you use 16-bit precision (``precision=16``), Lightning will automatically handle the optimizers. - - If you use multiple optimizers, :meth:`training_step` will have an additional ``optimizer_idx`` parameter. - - If you use :class:`torch.optim.LBFGS`, Lightning handles the closure function automatically for you. 
- - If you use multiple optimizers, gradients will be calculated only for the parameters of current optimizer - at each training step. - - If you need to control how often those optimizers step or override the default ``.step()`` schedule, - override the :meth:`optimizer_step` hook. - """ - rank_zero_warn("`configure_optimizers` must be implemented to be used with the Lightning Trainer")
- -
[docs] def manual_backward(self, loss: Tensor, *args, **kwargs) -> None: - """Call this directly from your :meth:`training_step` when doing optimizations manually. By using this, - Lightning can ensure that all the proper scaling gets applied when using mixed precision. - - See :ref:`manual optimization<common/optimization:Manual optimization>` for more examples. - - Example:: - - def training_step(...): - opt = self.optimizers() - loss = ... - opt.zero_grad() - # automatically applies scaling, etc... - self.manual_backward(loss) - opt.step() - - Args: - loss: The tensor on which to compute gradients. Must have a graph attached. - *args: Additional positional arguments to be forwarded to :meth:`~torch.Tensor.backward` - **kwargs: Additional keyword arguments to be forwarded to :meth:`~torch.Tensor.backward` - """ - self._verify_is_manual_optimization("manual_backward") - self.trainer.strategy.backward(loss, None, None, *args, **kwargs)
- -
[docs] def backward( - self, loss: Tensor, optimizer: Optional[Optimizer], optimizer_idx: Optional[int], *args, **kwargs - ) -> None: - """Called to perform backward on the loss returned in :meth:`training_step`. Override this hook with your - own implementation if you need to. - - Args: - loss: The loss tensor returned by :meth:`training_step`. If gradient accumulation is used, the loss here - holds the normalized value (scaled by 1 / accumulation steps). - optimizer: Current optimizer being used. ``None`` if using manual optimization. - optimizer_idx: Index of the current optimizer being used. ``None`` if using manual optimization. - - Example:: - - def backward(self, loss, optimizer, optimizer_idx): - loss.backward() - """ - loss.backward(*args, **kwargs)
- -
[docs] def toggle_optimizer(self, optimizer: Union[Optimizer, LightningOptimizer], optimizer_idx: int) -> None: - """Makes sure only the gradients of the current optimizer's parameters are calculated in the training step - to prevent dangling gradients in multiple-optimizer setup. - - This is only called automatically when automatic optimization is enabled and multiple optimizers are used. - It works with :meth:`untoggle_optimizer` to make sure ``param_requires_grad_state`` is properly reset. - - Args: - optimizer: The optimizer to toggle. - optimizer_idx: The index of the optimizer to toggle. - """ - # Iterate over all optimizer parameters to preserve their `requires_grad` information - # in case these are pre-defined during `configure_optimizers` - param_requires_grad_state = {} - for opt in self.trainer.optimizers: - for group in opt.param_groups: - for param in group["params"]: - # If a param already appear in param_requires_grad_state, continue - if param in param_requires_grad_state: - continue - param_requires_grad_state[param] = param.requires_grad - param.requires_grad = False - - # Then iterate over the current optimizer's parameters and set its `requires_grad` - # properties accordingly - for group in optimizer.param_groups: - for param in group["params"]: - param.requires_grad = param_requires_grad_state[param] - self._param_requires_grad_state = param_requires_grad_state
- -
[docs] def untoggle_optimizer(self, optimizer_idx: int) -> None: - """Resets the state of required gradients that were toggled with :meth:`toggle_optimizer`. - - This is only called automatically when automatic optimization is enabled and multiple optimizers are used. - - Args: - optimizer_idx: The index of the optimizer to untoggle. - """ - for opt_idx, opt in enumerate(self.trainer.optimizers): - if optimizer_idx != opt_idx: - for group in opt.param_groups: - for param in group["params"]: - if param in self._param_requires_grad_state: - param.requires_grad = self._param_requires_grad_state[param] - # save memory - self._param_requires_grad_state = {}
- - def clip_gradients( - self, - optimizer: Optimizer, - gradient_clip_val: Optional[Union[int, float]] = None, - gradient_clip_algorithm: Optional[str] = None, - ): - """Handles gradient clipping internally. - - Note: - Do not override this method. If you want to customize gradient clipping, consider - using :meth:`configure_gradient_clipping` method. - - Args: - optimizer: Current optimizer being used. - gradient_clip_val: The value at which to clip gradients. - gradient_clip_algorithm: The gradient clipping algorithm to use. Pass ``gradient_clip_algorithm="value"`` - to clip by value, and ``gradient_clip_algorithm="norm"`` to clip by norm. - """ - if gradient_clip_val is None: - gradient_clip_val = self.trainer.gradient_clip_val or 0.0 - elif self.trainer.gradient_clip_val is not None and self.trainer.gradient_clip_val != gradient_clip_val: - raise MisconfigurationException( - f"You have set `Trainer(gradient_clip_val={self.trainer.gradient_clip_val!r})`" - f" and have passed `clip_gradients(gradient_clip_val={gradient_clip_val!r})`." - " Please use only one of them." - ) - - if gradient_clip_algorithm is None: - gradient_clip_algorithm = self.trainer.gradient_clip_algorithm or "norm" - else: - gradient_clip_algorithm = gradient_clip_algorithm.lower() - if ( - self.trainer.gradient_clip_algorithm is not None - and self.trainer.gradient_clip_algorithm != gradient_clip_algorithm - ): - raise MisconfigurationException( - f"You have set `Trainer(gradient_clip_algorithm={self.trainer.gradient_clip_algorithm.value!r})`" - f" and have passed `clip_gradients(gradient_clip_algorithm={gradient_clip_algorithm!r})" - " Please use only one of them." - ) - - if not isinstance(gradient_clip_val, (int, float)): - raise TypeError(f"`gradient_clip_val` should be an int or a float. 
Got {gradient_clip_val}.") - - if not GradClipAlgorithmType.supported_type(gradient_clip_algorithm.lower()): - raise MisconfigurationException( - f"`gradient_clip_algorithm` {gradient_clip_algorithm} is invalid." - f" Allowed algorithms: {GradClipAlgorithmType.supported_types()}." - ) - - gradient_clip_algorithm = GradClipAlgorithmType(gradient_clip_algorithm) - self.trainer.precision_plugin.clip_gradients(optimizer, gradient_clip_val, gradient_clip_algorithm) - -
[docs] def configure_gradient_clipping( - self, - optimizer: Optimizer, - optimizer_idx: int, - gradient_clip_val: Optional[Union[int, float]] = None, - gradient_clip_algorithm: Optional[str] = None, - ): - """Perform gradient clipping for the optimizer parameters. Called before :meth:`optimizer_step`. - - Args: - optimizer: Current optimizer being used. - optimizer_idx: Index of the current optimizer being used. - gradient_clip_val: The value at which to clip gradients. By default value passed in Trainer - will be available here. - gradient_clip_algorithm: The gradient clipping algorithm to use. By default value - passed in Trainer will be available here. - - Example:: - - # Perform gradient clipping on gradients associated with discriminator (optimizer_idx=1) in GAN - def configure_gradient_clipping(self, optimizer, optimizer_idx, gradient_clip_val, gradient_clip_algorithm): - if optimizer_idx == 1: - # Lightning will handle the gradient clipping - self.clip_gradients( - optimizer, - gradient_clip_val=gradient_clip_val, - gradient_clip_algorithm=gradient_clip_algorithm - ) - else: - # implement your own custom logic to clip gradients for generator (optimizer_idx=0) - """ - self.clip_gradients( - optimizer, gradient_clip_val=gradient_clip_val, gradient_clip_algorithm=gradient_clip_algorithm - )
- - def lr_scheduler_step( - self, - scheduler: LRSchedulerTypeUnion, - optimizer_idx: int, - metric: Optional[Any], - ) -> None: - r""" - Override this method to adjust the default way the - :class:`~pytorch_lightning.trainer.trainer.Trainer` calls each scheduler. - By default, Lightning calls ``step()`` and as shown in the example - for each scheduler based on its ``interval``. - - Args: - scheduler: Learning rate scheduler. - optimizer_idx: Index of the optimizer associated with this scheduler. - metric: Value of the monitor used for schedulers like ``ReduceLROnPlateau``. - - Examples:: - - # DEFAULT - def lr_scheduler_step(self, scheduler, optimizer_idx, metric): - if metric is None: - scheduler.step() - else: - scheduler.step(metric) - - # Alternative way to update schedulers if it requires an epoch value - def lr_scheduler_step(self, scheduler, optimizer_idx, metric): - scheduler.step(epoch=self.current_epoch) - - """ - if metric is None: - scheduler.step() - else: - scheduler.step(metric) - -
[docs] def optimizer_step( - self, - epoch: int, - batch_idx: int, - optimizer: Union[Optimizer, LightningOptimizer], - optimizer_idx: int = 0, - optimizer_closure: Optional[Callable[[], Any]] = None, - on_tpu: bool = False, - using_native_amp: bool = False, - using_lbfgs: bool = False, - ) -> None: - r""" - Override this method to adjust the default way the :class:`~pytorch_lightning.trainer.trainer.Trainer` calls - each optimizer. - - By default, Lightning calls ``step()`` and ``zero_grad()`` as shown in the example once per optimizer. - This method (and ``zero_grad()``) won't be called during the accumulation phase when - ``Trainer(accumulate_grad_batches != 1)``. Overriding this hook has no benefit with manual optimization. - - Args: - epoch: Current epoch - batch_idx: Index of current batch - optimizer: A PyTorch optimizer - optimizer_idx: If you used multiple optimizers, this indexes into that list. - optimizer_closure: The optimizer closure. This closure must be executed as it includes the - calls to ``training_step()``, ``optimizer.zero_grad()``, and ``backward()``. 
- on_tpu: ``True`` if TPU backward is required - using_native_amp: ``True`` if using native amp - using_lbfgs: True if the matching optimizer is :class:`torch.optim.LBFGS` - - Examples:: - - # DEFAULT - def optimizer_step(self, epoch, batch_idx, optimizer, optimizer_idx, - optimizer_closure, on_tpu, using_native_amp, using_lbfgs): - optimizer.step(closure=optimizer_closure) - - # Alternating schedule for optimizer steps (i.e.: GANs) - def optimizer_step(self, epoch, batch_idx, optimizer, optimizer_idx, - optimizer_closure, on_tpu, using_native_amp, using_lbfgs): - # update generator opt every step - if optimizer_idx == 0: - optimizer.step(closure=optimizer_closure) - - # update discriminator opt every 2 steps - if optimizer_idx == 1: - if (batch_idx + 1) % 2 == 0 : - optimizer.step(closure=optimizer_closure) - else: - # call the closure by itself to run `training_step` + `backward` without an optimizer step - optimizer_closure() - - # ... - # add as many optimizers as you want - - Here's another example showing how to use this for more advanced things such as - learning rate warm-up: - - .. code-block:: python - - # learning rate warm-up - def optimizer_step( - self, - epoch, - batch_idx, - optimizer, - optimizer_idx, - optimizer_closure, - on_tpu, - using_native_amp, - using_lbfgs, - ): - # update params - optimizer.step(closure=optimizer_closure) - - # manually warm up lr without a scheduler - if self.trainer.global_step < 500: - lr_scale = min(1.0, float(self.trainer.global_step + 1) / 500.0) - for pg in optimizer.param_groups: - pg["lr"] = lr_scale * self.learning_rate - - """ - optimizer.step(closure=optimizer_closure)
- -
[docs] def optimizer_zero_grad(self, epoch: int, batch_idx: int, optimizer: Optimizer, optimizer_idx: int): - """Override this method to change the default behaviour of ``optimizer.zero_grad()``. - - Args: - epoch: Current epoch - batch_idx: Index of current batch - optimizer: A PyTorch optimizer - optimizer_idx: If you used multiple optimizers this indexes into that list. - - Examples:: - - # DEFAULT - def optimizer_zero_grad(self, epoch, batch_idx, optimizer, optimizer_idx): - optimizer.zero_grad() - - # Set gradients to `None` instead of zero to improve performance. - def optimizer_zero_grad(self, epoch, batch_idx, optimizer, optimizer_idx): - optimizer.zero_grad(set_to_none=True) - - See :meth:`torch.optim.Optimizer.zero_grad` for the explanation of the above example. - """ - optimizer.zero_grad()
- -
[docs] def tbptt_split_batch(self, batch: Any, split_size: int) -> List[Any]: - r""" - When using truncated backpropagation through time, each batch must be split along the - time dimension. Lightning handles this by default, but for custom behavior override - this function. - - Args: - batch: Current batch - split_size: The size of the split - - Return: - List of batch splits. Each split will be passed to :meth:`training_step` to enable truncated - back propagation through time. The default implementation splits root level Tensors and - Sequences at dim=1 (i.e. time dim). It assumes that each time dim is the same length. - - Examples:: - - def tbptt_split_batch(self, batch, split_size): - splits = [] - for t in range(0, time_dims[0], split_size): - batch_split = [] - for i, x in enumerate(batch): - if isinstance(x, torch.Tensor): - split_x = x[:, t:t + split_size] - elif isinstance(x, collections.Sequence): - split_x = [None] * len(x) - for batch_idx in range(len(x)): - split_x[batch_idx] = x[batch_idx][t:t + split_size] - batch_split.append(split_x) - splits.append(batch_split) - return splits - - Note: - Called in the training loop after - :meth:`~pytorch_lightning.callbacks.base.Callback.on_train_batch_start` - if :paramref:`~pytorch_lightning.core.lightning.LightningModule.truncated_bptt_steps` > 0. - Each returned batch split is passed separately to :meth:`training_step`. 
- """ - time_dims = [len(x[0]) for x in batch if isinstance(x, (torch.Tensor, collections.Sequence))] - assert len(time_dims) >= 1, "Unable to determine batch time dimension" - assert all(x == time_dims[0] for x in time_dims), "Batch time dimension length is ambiguous" - - splits = [] - for t in range(0, time_dims[0], split_size): - batch_split = [] - for i, x in enumerate(batch): - if isinstance(x, torch.Tensor): - split_x = x[:, t : t + split_size] - elif isinstance(x, collections.Sequence): - split_x = [None] * len(x) - for batch_idx in range(len(x)): - split_x[batch_idx] = x[batch_idx][t : t + split_size] - - batch_split.append(split_x) - - splits.append(batch_split) - - return splits
- - def summarize(self, max_depth: int = 1) -> ModelSummary: - """Summarize this LightningModule. - - .. deprecated:: v1.5 - This method was deprecated in v1.5 in favor of `pytorch_lightning.utilities.model_summary.summarize` - and will be removed in v1.7. - - Args: - max_depth: The maximum depth of layer nesting that the summary will include. A value of 0 turns the - layer summary off. Default: 1. - - Return: - The model summary object - """ - rank_zero_deprecation( - "The `LightningModule.summarize` method is deprecated in v1.5 and will be removed in v1.7. " - "Use `pytorch_lightning.utilities.model_summary.summarize` instead.", - stacklevel=6, - ) - - return summarize(self, max_depth) - -
[docs] def freeze(self) -> None: - r""" - Freeze all params for inference. - - Example:: - - model = MyLightningModule(...) - model.freeze() - - """ - for param in self.parameters(): - param.requires_grad = False - - self.eval()
- -
[docs] def unfreeze(self) -> None: - """Unfreeze all parameters for training. - - .. code-block:: python - - model = MyLightningModule(...) - model.unfreeze() - """ - for param in self.parameters(): - param.requires_grad = True - - self.train()
- - def get_progress_bar_dict(self) -> Dict[str, Union[int, str]]: - r""" - .. deprecated:: v1.5 - This method was deprecated in v1.5 in favor of - `pytorch_lightning.callbacks.progress.base.get_metrics` and will be removed in v1.7. - - Implement this to override the default items displayed in the progress bar. - By default it includes the average loss value, split index of BPTT (if used) - and the version of the experiment when using a logger. - - .. code-block:: - - Epoch 1: 4%|▎ | 40/1095 [00:03<01:37, 10.84it/s, loss=4.501, v_num=10] - - Here is an example how to override the defaults: - - .. code-block:: python - - def get_progress_bar_dict(self): - # don't show the version number - items = super().get_progress_bar_dict() - items.pop("v_num", None) - return items - - Return: - Dictionary with the items to be displayed in the progress bar. - """ - return progress_base.get_standard_metrics(self.trainer, self) - - def _verify_is_manual_optimization(self, fn_name): - if self.automatic_optimization: - raise MisconfigurationException( - f"to use {fn_name}, please disable automatic optimization:" - " set model property `automatic_optimization` as False" - ) - - @classmethod - def _auto_collect_arguments(cls, frame=None) -> Tuple[Dict, Dict]: - """Collect all module arguments in the current constructor and all child constructors. The child - constructors are all the ``__init__`` methods that reach the current class through (chained) - ``super().__init__()`` calls. 
- - Args: - frame: instance frame - - Returns: - self_arguments: arguments dictionary of the first instance - parents_arguments: arguments dictionary of the parent's instances - """ - if not frame: - frame = inspect.currentframe() - - frame_args = collect_init_args(frame.f_back, []) - self_arguments = frame_args[-1] - - # set hyper_parameters in child - self_arguments = self_arguments - parents_arguments = {} - - # add all arguments from parents - for args in frame_args[:-1]: - parents_arguments.update(args) - return self_arguments, parents_arguments - -
[docs] @torch.no_grad() - def to_onnx(self, file_path: Union[str, Path], input_sample: Optional[Any] = None, **kwargs): - """Saves the model in ONNX format. - - Args: - file_path: The path of the file the onnx model should be saved to. - input_sample: An input for tracing. Default: None (Use self.example_input_array) - **kwargs: Will be passed to torch.onnx.export function. - - Example: - >>> class SimpleModel(LightningModule): - ... def __init__(self): - ... super().__init__() - ... self.l1 = torch.nn.Linear(in_features=64, out_features=4) - ... - ... def forward(self, x): - ... return torch.relu(self.l1(x.view(x.size(0), -1))) - - >>> with tempfile.NamedTemporaryFile(suffix='.onnx', delete=False) as tmpfile: - ... model = SimpleModel() - ... input_sample = torch.randn((1, 64)) - ... model.to_onnx(tmpfile.name, input_sample, export_params=True) - ... os.path.isfile(tmpfile.name) - True - """ - mode = self.training - - if input_sample is None: - if self.example_input_array is None: - raise ValueError( - "Could not export to ONNX since neither `input_sample` nor" - " `model.example_input_array` attribute is set." - ) - input_sample = self.example_input_array - - input_sample = self._apply_batch_transfer_handler(input_sample) - - if not _TORCH_GREATER_EQUAL_1_10 and "example_outputs" not in kwargs: - self.eval() - if isinstance(input_sample, Tuple): - kwargs["example_outputs"] = self(*input_sample) - else: - kwargs["example_outputs"] = self(input_sample) - - torch.onnx.export(self, input_sample, file_path, **kwargs) - self.train(mode)
- -
[docs] @torch.no_grad() - def to_torchscript( - self, - file_path: Optional[Union[str, Path]] = None, - method: Optional[str] = "script", - example_inputs: Optional[Any] = None, - **kwargs, - ) -> Union[ScriptModule, Dict[str, ScriptModule]]: - """By default compiles the whole model to a :class:`~torch.jit.ScriptModule`. If you want to use tracing, - please provided the argument ``method='trace'`` and make sure that either the `example_inputs` argument is - provided, or the model has :attr:`example_input_array` set. If you would like to customize the modules that - are scripted you should override this method. In case you want to return multiple modules, we recommend - using a dictionary. - - Args: - file_path: Path where to save the torchscript. Default: None (no file saved). - method: Whether to use TorchScript's script or trace method. Default: 'script' - example_inputs: An input to be used to do tracing when method is set to 'trace'. - Default: None (uses :attr:`example_input_array`) - **kwargs: Additional arguments that will be passed to the :func:`torch.jit.script` or - :func:`torch.jit.trace` function. - - Note: - - Requires the implementation of the - :meth:`~pytorch_lightning.core.lightning.LightningModule.forward` method. - - The exported script will be set to evaluation mode. - - It is recommended that you install the latest supported version of PyTorch - to use this feature without limitations. See also the :mod:`torch.jit` - documentation for supported features. - - Example: - >>> class SimpleModel(LightningModule): - ... def __init__(self): - ... super().__init__() - ... self.l1 = torch.nn.Linear(in_features=64, out_features=4) - ... - ... def forward(self, x): - ... return torch.relu(self.l1(x.view(x.size(0), -1))) - ... 
- >>> model = SimpleModel() - >>> model.to_torchscript(file_path="model.pt") # doctest: +SKIP - >>> os.path.isfile("model.pt") # doctest: +SKIP - >>> torch.jit.save(model.to_torchscript(file_path="model_trace.pt", method='trace', # doctest: +SKIP - ... example_inputs=torch.randn(1, 64))) # doctest: +SKIP - >>> os.path.isfile("model_trace.pt") # doctest: +SKIP - True - - Return: - This LightningModule as a torchscript, regardless of whether `file_path` is - defined or not. - """ - mode = self.training - - self._running_torchscript = True - - if method == "script": - torchscript_module = torch.jit.script(self.eval(), **kwargs) - elif method == "trace": - # if no example inputs are provided, try to see if model has example_input_array set - if example_inputs is None: - if self.example_input_array is None: - raise ValueError( - "Choosing method=`trace` requires either `example_inputs`" - " or `model.example_input_array` to be defined." - ) - example_inputs = self.example_input_array - - # automatically send example inputs to the right device and use trace - example_inputs = self._apply_batch_transfer_handler(example_inputs) - torchscript_module = torch.jit.trace(func=self.eval(), example_inputs=example_inputs, **kwargs) - else: - raise ValueError(f"The 'method' parameter only supports 'script' or 'trace', but value given was: {method}") - - self.train(mode) - - if file_path is not None: - fs = get_filesystem(file_path) - with fs.open(file_path, "wb") as f: - torch.jit.save(torchscript_module, f) - - self._running_torchscript = False - - return torchscript_module
- - @property - def model_size(self) -> float: - """Returns the model size in MegaBytes (MB) - - Note: - This property will not return correct value for Deepspeed (stage 3) and fully-sharded training. - """ - if not self._running_torchscript: # remove with the deprecation removal - rank_zero_deprecation( - "The `LightningModule.model_size` property was deprecated in v1.5 and will be removed in v1.7." - " Please use the `pytorch_lightning.utilities.memory.get_model_size_mb`.", - stacklevel=5, - ) - return get_model_size_mb(self) - - @property - def use_amp(self) -> bool: - r""" - .. deprecated:: v1.6. - - This property was deprecated in v1.6 and will be removed in v1.8. - """ - if not self._running_torchscript: # remove with the deprecation removal - rank_zero_deprecation( - "`LightningModule.use_amp` was deprecated in v1.6 and will be removed in v1.8." - " Please use `Trainer.amp_backend`.", - stacklevel=5, - ) - return self._use_amp - - @use_amp.setter - def use_amp(self, use_amp: bool) -> None: - r""" - .. deprecated:: v1.6. - - This property was deprecated in v1.6 and will be removed in v1.8. - """ - if not self._running_torchscript: # remove with the deprecation removal - rank_zero_deprecation( - "`LightningModule.use_amp` was deprecated in v1.6 and will be removed in v1.8." - " Please use `Trainer.amp_backend`.", - stacklevel=5, - ) - self._use_amp = use_amp - -
[docs] def add_to_queue(self, queue: pl.strategies.launchers.spawn._FakeQueue) -> None: - """Appends the :attr:`trainer.callback_metrics` dictionary to the given queue. To avoid issues with memory - sharing, we cast the data to numpy. - - Args: - queue: the instance of the queue to append the data. - - .. deprecated:: v1.5 - This method was deprecated in v1.5 and will be removed in v1.7. - """
- -
[docs] def get_from_queue(self, queue: pl.strategies.launchers.spawn._FakeQueue) -> None: - """Retrieve the :attr:`trainer.callback_metrics` dictionary from the given queue. To preserve consistency, - we cast back the data to ``torch.Tensor``. - - Args: - queue: the instance of the queue from where to get the data. - - .. deprecated:: v1.5 - This method was deprecated in v1.5 and will be removed in v1.7. - """
- - @contextmanager - def _prevent_trainer_and_dataloaders_deepcopy(self) -> None: - self._should_prevent_trainer_and_dataloaders_deepcopy = True - yield - self._should_prevent_trainer_and_dataloaders_deepcopy = False - - def __getstate__(self) -> Dict[str, Any]: - state = dict(self.__dict__) - if self._should_prevent_trainer_and_dataloaders_deepcopy: - state["trainer"] = None - state.pop("train_dataloader", None) - state.pop("val_dataloader", None) - state.pop("test_dataloader", None) - state.pop("predict_dataloader", None) - return state - - def _register_sharded_tensor_state_dict_hooks_if_available(self) -> None: - """Adds ShardedTensor state dict hooks if ShardedTensors are supported. - - These hooks ensure that ShardedTensors are included when saving, and are loaded the LightningModule correctly. - """ - if not _TORCH_GREATER_EQUAL_1_10 or _IS_WINDOWS or not torch.distributed.is_available(): - rank_zero_debug("Could not register sharded tensor state dict hooks") - return - - from torch.distributed._sharded_tensor import pre_load_state_dict_hook, state_dict_hook - - self._register_state_dict_hook(state_dict_hook) - self._register_load_state_dict_pre_hook(pre_load_state_dict_hook, True) -
- -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- -
-
-
- -
-
-
-
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/_modules/pytorch_lightning/loggers/comet.html b/docs/_modules/pytorch_lightning/loggers/comet.html deleted file mode 100644 index c13671c..0000000 --- a/docs/_modules/pytorch_lightning/loggers/comet.html +++ /dev/null @@ -1,1026 +0,0 @@ - - - - - - - - - - - - - pytorch_lightning.loggers.comet — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- - - - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -

Source code for pytorch_lightning.loggers.comet

-# Copyright The PyTorch Lightning team.
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#     http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-"""
-Comet Logger
-------------
-"""
-
-import logging
-import os
-from argparse import Namespace
-from typing import Any, Callable, Dict, Mapping, Optional, Sequence, Union
-
-import torch
-from torch import is_tensor
-
-import pytorch_lightning as pl
-from pytorch_lightning.loggers.base import LightningLoggerBase, rank_zero_experiment
-from pytorch_lightning.utilities.exceptions import MisconfigurationException
-from pytorch_lightning.utilities.imports import _module_available
-from pytorch_lightning.utilities.logger import _add_prefix, _convert_params, _flatten_dict
-from pytorch_lightning.utilities.rank_zero import rank_zero_only
-
-log = logging.getLogger(__name__)
-_COMET_AVAILABLE = _module_available("comet_ml")
-
-if _COMET_AVAILABLE:
-    import comet_ml
-    from comet_ml import ExistingExperiment as CometExistingExperiment
-    from comet_ml import Experiment as CometExperiment
-    from comet_ml import OfflineExperiment as CometOfflineExperiment
-
-    try:
-        from comet_ml.api import API
-    except ModuleNotFoundError:  # pragma: no-cover
-        # For more information, see: https://www.comet.ml/docs/python-sdk/releases/#release-300
-        from comet_ml.papi import API  # pragma: no-cover
-else:
-    # needed for test mocks, these tests shall be updated
-    comet_ml = None
-    CometExperiment, CometExistingExperiment, CometOfflineExperiment = None, None, None
-    API = None
-
-
-
[docs]class CometLogger(LightningLoggerBase): - r""" - Log using `Comet.ml <https://www.comet.ml>`_. - - Install it with pip: - - .. code-block:: bash - - pip install comet-ml - - Comet requires either an API Key (online mode) or a local directory path (offline mode). - - **ONLINE MODE** - - .. code-block:: python - - import os - from pytorch_lightning import Trainer - from pytorch_lightning.loggers import CometLogger - - # arguments made to CometLogger are passed on to the comet_ml.Experiment class - comet_logger = CometLogger( - api_key=os.environ.get("COMET_API_KEY"), - workspace=os.environ.get("COMET_WORKSPACE"), # Optional - save_dir=".", # Optional - project_name="default_project", # Optional - rest_api_key=os.environ.get("COMET_REST_API_KEY"), # Optional - experiment_key=os.environ.get("COMET_EXPERIMENT_KEY"), # Optional - experiment_name="lightning_logs", # Optional - ) - trainer = Trainer(logger=comet_logger) - - **OFFLINE MODE** - - .. code-block:: python - - from pytorch_lightning.loggers import CometLogger - - # arguments made to CometLogger are passed on to the comet_ml.Experiment class - comet_logger = CometLogger( - save_dir=".", - workspace=os.environ.get("COMET_WORKSPACE"), # Optional - project_name="default_project", # Optional - rest_api_key=os.environ.get("COMET_REST_API_KEY"), # Optional - experiment_name="lightning_logs", # Optional - ) - trainer = Trainer(logger=comet_logger) - - Args: - api_key: Required in online mode. API key, found on Comet.ml. If not given, this - will be loaded from the environment variable COMET_API_KEY or ~/.comet.config - if either exists. - save_dir: Required in offline mode. The path for the directory to save local - comet logs. If given, this also sets the directory for saving checkpoints. - project_name: Optional. Send your experiment to a specific project. - Otherwise will be sent to Uncategorized Experiments. - If the project name does not already exist, Comet.ml will create a new project. 
- rest_api_key: Optional. Rest API key found in Comet.ml settings. - This is used to determine version number - experiment_name: Optional. String representing the name for this particular experiment on Comet.ml. - experiment_key: Optional. If set, restores from existing experiment. - offline: If api_key and save_dir are both given, this determines whether - the experiment will be in online or offline mode. This is useful if you use - save_dir to control the checkpoints directory and have a ~/.comet.config - file but still want to run offline experiments. - prefix: A string to put at the beginning of metric keys. - \**kwargs: Additional arguments like `workspace`, `log_code`, etc. used by - :class:`CometExperiment` can be passed as keyword arguments in this logger. - - Raises: - ModuleNotFoundError: - If required Comet package is not installed on the device. - MisconfigurationException: - If neither ``api_key`` nor ``save_dir`` are passed as arguments. - """ - - LOGGER_JOIN_CHAR = "-" - - def __init__( - self, - api_key: Optional[str] = None, - save_dir: Optional[str] = None, - project_name: Optional[str] = None, - rest_api_key: Optional[str] = None, - experiment_name: Optional[str] = None, - experiment_key: Optional[str] = None, - offline: bool = False, - prefix: str = "", - agg_key_funcs: Optional[Mapping[str, Callable[[Sequence[float]], float]]] = None, - agg_default_func: Optional[Callable[[Sequence[float]], float]] = None, - **kwargs, - ): - if comet_ml is None: - raise ModuleNotFoundError( - "You want to use `comet_ml` logger which is not installed yet, install it with `pip install comet-ml`." 
- ) - super().__init__(agg_key_funcs=agg_key_funcs, agg_default_func=agg_default_func) - self._experiment = None - - # Determine online or offline mode based on which arguments were passed to CometLogger - api_key = api_key or comet_ml.config.get_api_key(None, comet_ml.config.get_config()) - - if api_key is not None and save_dir is not None: - self.mode = "offline" if offline else "online" - self.api_key = api_key - self._save_dir = save_dir - elif api_key is not None: - self.mode = "online" - self.api_key = api_key - self._save_dir = None - elif save_dir is not None: - self.mode = "offline" - self._save_dir = save_dir - else: - # If neither api_key nor save_dir are passed as arguments, raise an exception - raise MisconfigurationException("CometLogger requires either api_key or save_dir during initialization.") - - log.info(f"CometLogger will be initialized in {self.mode} mode") - - self._project_name = project_name - self._experiment_key = experiment_key - self._experiment_name = experiment_name - self._prefix = prefix - self._kwargs = kwargs - self._future_experiment_key = None - - if rest_api_key is not None: - # Comet.ml rest API, used to determine version number - self.rest_api_key = rest_api_key - self.comet_api = API(self.rest_api_key) - else: - self.rest_api_key = None - self.comet_api = None - - self._kwargs = kwargs - - @property - @rank_zero_experiment - def experiment(self) -> Union[CometExperiment, CometExistingExperiment, CometOfflineExperiment]: - r""" - Actual Comet object. To use Comet features in your - :class:`~pytorch_lightning.core.lightning.LightningModule` do the following. 
- - Example:: - - self.logger.experiment.some_comet_function() - - """ - if self._experiment is not None: - return self._experiment - - if self._future_experiment_key is not None: - os.environ["COMET_EXPERIMENT_KEY"] = self._future_experiment_key - - try: - if self.mode == "online": - if self._experiment_key is None: - self._experiment = CometExperiment( - api_key=self.api_key, project_name=self._project_name, **self._kwargs - ) - self._experiment_key = self._experiment.get_key() - else: - self._experiment = CometExistingExperiment( - api_key=self.api_key, - project_name=self._project_name, - previous_experiment=self._experiment_key, - **self._kwargs, - ) - else: - self._experiment = CometOfflineExperiment( - offline_directory=self.save_dir, project_name=self._project_name, **self._kwargs - ) - finally: - if self._future_experiment_key is not None: - os.environ.pop("COMET_EXPERIMENT_KEY") - self._future_experiment_key = None - - if self._experiment_name: - self._experiment.set_name(self._experiment_name) - - return self._experiment - -
[docs] @rank_zero_only - def log_hyperparams(self, params: Union[Dict[str, Any], Namespace]) -> None: - params = _convert_params(params) - params = _flatten_dict(params) - self.experiment.log_parameters(params)
- -
[docs] @rank_zero_only - def log_metrics(self, metrics: Dict[str, Union[torch.Tensor, float]], step: Optional[int] = None) -> None: - assert rank_zero_only.rank == 0, "experiment tried to log from global_rank != 0" - # Comet.ml expects metrics to be a dictionary of detached tensors on CPU - metrics_without_epoch = metrics.copy() - for key, val in metrics_without_epoch.items(): - if is_tensor(val): - metrics_without_epoch[key] = val.cpu().detach() - - epoch = metrics_without_epoch.pop("epoch", None) - metrics_without_epoch = _add_prefix(metrics_without_epoch, self._prefix, self.LOGGER_JOIN_CHAR) - self.experiment.log_metrics(metrics_without_epoch, step=step, epoch=epoch)
- - def reset_experiment(self): - self._experiment = None - -
[docs] @rank_zero_only - def finalize(self, status: str) -> None: - r""" - When calling ``self.experiment.end()``, that experiment won't log any more data to Comet. - That's why, if you need to log any more data, you need to create an ExistingCometExperiment. - For example, to log data when testing your model after training, because when training is - finalized :meth:`CometLogger.finalize` is called. - - This happens automatically in the :meth:`~CometLogger.experiment` property, when - ``self._experiment`` is set to ``None``, i.e. ``self.reset_experiment()``. - """ - self.experiment.end() - self.reset_experiment()
- - @property - def save_dir(self) -> Optional[str]: - """Gets the save directory. - - Returns: - The path to the save directory. - """ - return self._save_dir - - @property - def name(self) -> str: - """Gets the project name. - - Returns: - The project name if it is specified, else "comet-default". - """ - # Don't create an experiment if we don't have one - if self._experiment is not None and self._experiment.project_name is not None: - return self._experiment.project_name - - if self._project_name is not None: - return self._project_name - - return "comet-default" - - @property - def version(self) -> str: - """Gets the version. - - Returns: - The first one of the following that is set in the following order - - 1. experiment id. - 2. experiment key. - 3. "COMET_EXPERIMENT_KEY" environment variable. - 4. future experiment key. - - If none are present generates a new guid. - """ - # Don't create an experiment if we don't have one - if self._experiment is not None: - return self._experiment.id - - if self._experiment_key is not None: - return self._experiment_key - - if "COMET_EXPERIMENT_KEY" in os.environ: - return os.environ["COMET_EXPERIMENT_KEY"] - - if self._future_experiment_key is not None: - return self._future_experiment_key - - # Pre-generate an experiment key - self._future_experiment_key = comet_ml.generate_guid() - - return self._future_experiment_key - - def __getstate__(self): - state = self.__dict__.copy() - - # Save the experiment id in case an experiment object already exists, - # this way we could create an ExistingExperiment pointing to the same - # experiment - state["_experiment_key"] = self._experiment.id if self._experiment is not None else None - - # Remove the experiment object as it contains hard to pickle objects - # (like network connections), the experiment object will be recreated if - # needed later - state["_experiment"] = None - return state - -
[docs] def log_graph(self, model: "pl.LightningModule", input_array=None) -> None: - if self._experiment is not None: - self._experiment.set_model_graph(model)
-
- -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- -
-
-
- -
-
-
-
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/_modules/pytorch_lightning/loggers/csv_logs.html b/docs/_modules/pytorch_lightning/loggers/csv_logs.html deleted file mode 100644 index 8d742fa..0000000 --- a/docs/_modules/pytorch_lightning/loggers/csv_logs.html +++ /dev/null @@ -1,928 +0,0 @@ - - - - - - - - - - - - - pytorch_lightning.loggers.csv_logs — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- - - - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -

Source code for pytorch_lightning.loggers.csv_logs

-# Copyright The PyTorch Lightning team.
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#     http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-"""
-CSV logger
-----------
-
-CSV logger for basic experiment logging that does not require opening ports
-
-"""
-import csv
-import logging
-import os
-from argparse import Namespace
-from typing import Any, Dict, Optional, Union
-
-import torch
-
-from pytorch_lightning.core.saving import save_hparams_to_yaml
-from pytorch_lightning.loggers.base import LightningLoggerBase, rank_zero_experiment
-from pytorch_lightning.utilities.logger import _add_prefix, _convert_params
-from pytorch_lightning.utilities.rank_zero import rank_zero_only, rank_zero_warn
-
-log = logging.getLogger(__name__)
-
-
-class ExperimentWriter:
-    r"""
-    Experiment writer for CSVLogger.
-
-    Currently supports to log hyperparameters and metrics in YAML and CSV
-    format, respectively.
-
-    Args:
-        log_dir: Directory for the experiment logs
-    """
-
-    NAME_HPARAMS_FILE = "hparams.yaml"
-    NAME_METRICS_FILE = "metrics.csv"
-
-    def __init__(self, log_dir: str) -> None:
-        self.hparams = {}
-        self.metrics = []
-
-        self.log_dir = log_dir
-        if os.path.exists(self.log_dir) and os.listdir(self.log_dir):
-            rank_zero_warn(
-                f"Experiment logs directory {self.log_dir} exists and is not empty."
-                " Previous log files in this directory will be deleted when the new ones are saved!"
-            )
-        os.makedirs(self.log_dir, exist_ok=True)
-
-        self.metrics_file_path = os.path.join(self.log_dir, self.NAME_METRICS_FILE)
-
-    def log_hparams(self, params: Dict[str, Any]) -> None:
-        """Record hparams."""
-        self.hparams.update(params)
-
-    def log_metrics(self, metrics_dict: Dict[str, float], step: Optional[int] = None) -> None:
-        """Record metrics."""
-
-        def _handle_value(value):
-            if isinstance(value, torch.Tensor):
-                return value.item()
-            return value
-
-        if step is None:
-            step = len(self.metrics)
-
-        metrics = {k: _handle_value(v) for k, v in metrics_dict.items()}
-        metrics["step"] = step
-        self.metrics.append(metrics)
-
-    def save(self) -> None:
-        """Save recorded hparams and metrics into files."""
-        hparams_file = os.path.join(self.log_dir, self.NAME_HPARAMS_FILE)
-        save_hparams_to_yaml(hparams_file, self.hparams)
-
-        if not self.metrics:
-            return
-
-        last_m = {}
-        for m in self.metrics:
-            last_m.update(m)
-        metrics_keys = list(last_m.keys())
-
-        with open(self.metrics_file_path, "w", newline="") as f:
-            writer = csv.DictWriter(f, fieldnames=metrics_keys)
-            writer.writeheader()
-            writer.writerows(self.metrics)
-
-
-
[docs]class CSVLogger(LightningLoggerBase): - r""" - Log to local file system in yaml and CSV format. - - Logs are saved to ``os.path.join(save_dir, name, version)``. - - Example: - >>> from pytorch_lightning import Trainer - >>> from pytorch_lightning.loggers import CSVLogger - >>> logger = CSVLogger("logs", name="my_exp_name") - >>> trainer = Trainer(logger=logger) - - Args: - save_dir: Save directory - name: Experiment name. Defaults to ``'default'``. - version: Experiment version. If version is not specified the logger inspects the save - directory for existing versions, then automatically assigns the next available version. - prefix: A string to put at the beginning of metric keys. - flush_logs_every_n_steps: How often to flush logs to disk (defaults to every 100 steps). - """ - - LOGGER_JOIN_CHAR = "-" - - def __init__( - self, - save_dir: str, - name: Optional[str] = "lightning_logs", - version: Optional[Union[int, str]] = None, - prefix: str = "", - flush_logs_every_n_steps: int = 100, - ): - super().__init__() - self._save_dir = save_dir - self._name = name or "" - self._version = version - self._prefix = prefix - self._experiment = None - self._flush_logs_every_n_steps = flush_logs_every_n_steps - - @property - def root_dir(self) -> str: - """Parent directory for all checkpoint subdirectories. - - If the experiment name parameter is an empty string, no experiment subdirectory is used and the checkpoint will - be saved in "save_dir/version" - """ - return os.path.join(self.save_dir, self.name) - - @property - def log_dir(self) -> str: - """The log directory for this run. - - By default, it is named ``'version_${self.version}'`` but it can be overridden by passing a string value for the - constructor's version parameter instead of ``None`` or an int. 
- """ - # create a pseudo standard path - version = self.version if isinstance(self.version, str) else f"version_{self.version}" - log_dir = os.path.join(self.root_dir, version) - return log_dir - - @property - def save_dir(self) -> Optional[str]: - """The current directory where logs are saved. - - Returns: - The path to current directory where logs are saved. - """ - return self._save_dir - - @property - @rank_zero_experiment - def experiment(self) -> ExperimentWriter: - r""" - - Actual ExperimentWriter object. To use ExperimentWriter features in your - :class:`~pytorch_lightning.core.lightning.LightningModule` do the following. - - Example:: - - self.logger.experiment.some_experiment_writer_function() - - """ - if self._experiment: - return self._experiment - - os.makedirs(self.root_dir, exist_ok=True) - self._experiment = ExperimentWriter(log_dir=self.log_dir) - return self._experiment - -
[docs] @rank_zero_only - def log_hyperparams(self, params: Union[Dict[str, Any], Namespace]) -> None: - params = _convert_params(params) - self.experiment.log_hparams(params)
- -
[docs] @rank_zero_only - def log_metrics(self, metrics: Dict[str, float], step: Optional[int] = None) -> None: - metrics = _add_prefix(metrics, self._prefix, self.LOGGER_JOIN_CHAR) - self.experiment.log_metrics(metrics, step) - if step is not None and (step + 1) % self._flush_logs_every_n_steps == 0: - self.save()
- -
[docs] @rank_zero_only - def save(self) -> None: - super().save() - self.experiment.save()
- -
[docs] @rank_zero_only - def finalize(self, status: str) -> None: - self.save()
- - @property - def name(self) -> str: - """Gets the name of the experiment. - - Returns: - The name of the experiment. - """ - return self._name - - @property - def version(self) -> int: - """Gets the version of the experiment. - - Returns: - The version of the experiment if it is specified, else the next version. - """ - if self._version is None: - self._version = self._get_next_version() - return self._version - - def _get_next_version(self): - root_dir = self.root_dir - - if not os.path.isdir(root_dir): - log.warning("Missing logger folder: %s", root_dir) - return 0 - - existing_versions = [] - for d in os.listdir(root_dir): - if os.path.isdir(os.path.join(root_dir, d)) and d.startswith("version_"): - existing_versions.append(int(d.split("_")[1])) - - if len(existing_versions) == 0: - return 0 - - return max(existing_versions) + 1
-
- -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- -
-
-
- -
-
-
-
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/_modules/pytorch_lightning/loggers/mlflow.html b/docs/_modules/pytorch_lightning/loggers/mlflow.html deleted file mode 100644 index d22932b..0000000 --- a/docs/_modules/pytorch_lightning/loggers/mlflow.html +++ /dev/null @@ -1,959 +0,0 @@ - - - - - - - - - - - - - pytorch_lightning.loggers.mlflow — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- - - - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -

Source code for pytorch_lightning.loggers.mlflow

-# Copyright The PyTorch Lightning team.
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#     http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-"""
-MLflow Logger
--------------
-"""
-import logging
-import os
-import re
-from argparse import Namespace
-from time import time
-from typing import Any, Dict, Optional, Union
-
-from pytorch_lightning.loggers.base import LightningLoggerBase, rank_zero_experiment
-from pytorch_lightning.utilities.imports import _module_available
-from pytorch_lightning.utilities.logger import _add_prefix, _convert_params, _flatten_dict
-from pytorch_lightning.utilities.rank_zero import rank_zero_only, rank_zero_warn
-
-log = logging.getLogger(__name__)
-LOCAL_FILE_URI_PREFIX = "file:"
-_MLFLOW_AVAILABLE = _module_available("mlflow")
-try:
-    import mlflow
-    from mlflow.tracking import context, MlflowClient
-    from mlflow.utils.mlflow_tags import MLFLOW_RUN_NAME
-# todo: there seems to be still some remaining import error with Conda env
-except ModuleNotFoundError:
-    _MLFLOW_AVAILABLE = False
-    mlflow, MlflowClient, context = None, None, None
-    MLFLOW_RUN_NAME = "mlflow.runName"
-
-# before v1.1.0
-if hasattr(context, "resolve_tags"):
-    from mlflow.tracking.context import resolve_tags
-
-
-# since v1.1.0
-elif hasattr(context, "registry"):
-    from mlflow.tracking.context.registry import resolve_tags
-else:
-
-    def resolve_tags(tags=None):
-        return tags
-
-
-
[docs]class MLFlowLogger(LightningLoggerBase): - """Log using `MLflow <https://mlflow.org>`_. - - Install it with pip: - - .. code-block:: bash - - pip install mlflow - - .. code-block:: python - - from pytorch_lightning import Trainer - from pytorch_lightning.loggers import MLFlowLogger - - mlf_logger = MLFlowLogger(experiment_name="lightning_logs", tracking_uri="file:./ml-runs") - trainer = Trainer(logger=mlf_logger) - - Use the logger anywhere in your :class:`~pytorch_lightning.core.lightning.LightningModule` as follows: - - .. code-block:: python - - from pytorch_lightning import LightningModule - - - class LitModel(LightningModule): - def training_step(self, batch, batch_idx): - # example - self.logger.experiment.whatever_ml_flow_supports(...) - - def any_lightning_module_function_or_hook(self): - self.logger.experiment.whatever_ml_flow_supports(...) - - Args: - experiment_name: The name of the experiment. - run_name: Name of the new run. The `run_name` is internally stored as a ``mlflow.runName`` tag. - If the ``mlflow.runName`` tag has already been set in `tags`, the value is overridden by the `run_name`. - tracking_uri: Address of local or remote tracking server. - If not provided, defaults to `MLFLOW_TRACKING_URI` environment variable if set, otherwise it falls - back to `file:<save_dir>`. - tags: A dictionary tags for the experiment. - save_dir: A path to a local directory where the MLflow runs get saved. - Defaults to `./mlflow` if `tracking_uri` is not provided. - Has no effect if `tracking_uri` is provided. - prefix: A string to put at the beginning of metric keys. - artifact_location: The location to store run artifacts. If not provided, the server picks an appropriate - default. - run_id: The run identifier of the experiment. If not provided, a new run is started. - - Raises: - ModuleNotFoundError: - If required MLFlow package is not installed on the device. 
- """ - - LOGGER_JOIN_CHAR = "-" - - def __init__( - self, - experiment_name: str = "lightning_logs", - run_name: Optional[str] = None, - tracking_uri: Optional[str] = os.getenv("MLFLOW_TRACKING_URI"), - tags: Optional[Dict[str, Any]] = None, - save_dir: Optional[str] = "./mlruns", - prefix: str = "", - artifact_location: Optional[str] = None, - run_id: Optional[str] = None, - ): - if mlflow is None: - raise ModuleNotFoundError( - "You want to use `mlflow` logger which is not installed yet, install it with `pip install mlflow`." - ) - super().__init__() - if not tracking_uri: - tracking_uri = f"{LOCAL_FILE_URI_PREFIX}{save_dir}" - - self._experiment_name = experiment_name - self._experiment_id = None - self._tracking_uri = tracking_uri - self._run_name = run_name - self._run_id = run_id - self.tags = tags - self._prefix = prefix - self._artifact_location = artifact_location - - self._initialized = False - - self._mlflow_client = MlflowClient(tracking_uri) - - @property - @rank_zero_experiment - def experiment(self) -> MlflowClient: - r""" - Actual MLflow object. To use MLflow features in your - :class:`~pytorch_lightning.core.lightning.LightningModule` do the following. - - Example:: - - self.logger.experiment.some_mlflow_function() - - """ - - if self._initialized: - return self._mlflow_client - - if self._run_id is not None: - run = self._mlflow_client.get_run(self._run_id) - self._experiment_id = run.info.experiment_id - self._initialized = True - return self._mlflow_client - - if self._experiment_id is None: - expt = self._mlflow_client.get_experiment_by_name(self._experiment_name) - if expt is not None: - self._experiment_id = expt.experiment_id - else: - log.warning(f"Experiment with name {self._experiment_name} not found. 
Creating it.") - self._experiment_id = self._mlflow_client.create_experiment( - name=self._experiment_name, artifact_location=self._artifact_location - ) - - if self._run_id is None: - if self._run_name is not None: - self.tags = self.tags or {} - if MLFLOW_RUN_NAME in self.tags: - log.warning( - f"The tag {MLFLOW_RUN_NAME} is found in tags. The value will be overridden by {self._run_name}." - ) - self.tags[MLFLOW_RUN_NAME] = self._run_name - run = self._mlflow_client.create_run(experiment_id=self._experiment_id, tags=resolve_tags(self.tags)) - self._run_id = run.info.run_id - self._initialized = True - return self._mlflow_client - - @property - def run_id(self) -> str: - """Create the experiment if it does not exist to get the run id. - - Returns: - The run id. - """ - _ = self.experiment - return self._run_id - - @property - def experiment_id(self) -> str: - """Create the experiment if it does not exist to get the experiment id. - - Returns: - The experiment id. - """ - _ = self.experiment - return self._experiment_id - -
[docs] @rank_zero_only - def log_hyperparams(self, params: Union[Dict[str, Any], Namespace]) -> None: - params = _convert_params(params) - params = _flatten_dict(params) - for k, v in params.items(): - if len(str(v)) > 250: - rank_zero_warn( - f"Mlflow only allows parameters with up to 250 characters. Discard {k}={v}", category=RuntimeWarning - ) - continue - - self.experiment.log_param(self.run_id, k, v)
- -
[docs] @rank_zero_only - def log_metrics(self, metrics: Dict[str, float], step: Optional[int] = None) -> None: - assert rank_zero_only.rank == 0, "experiment tried to log from global_rank != 0" - - metrics = _add_prefix(metrics, self._prefix, self.LOGGER_JOIN_CHAR) - - timestamp_ms = int(time() * 1000) - for k, v in metrics.items(): - if isinstance(v, str): - log.warning(f"Discarding metric with string value {k}={v}.") - continue - - new_k = re.sub("[^a-zA-Z0-9_/. -]+", "", k) - if k != new_k: - rank_zero_warn( - "MLFlow only allows '_', '/', '.' and ' ' special characters in metric name." - f" Replacing {k} with {new_k}.", - category=RuntimeWarning, - ) - k = new_k - - self.experiment.log_metric(self.run_id, k, v, timestamp_ms, step)
- -
[docs] @rank_zero_only - def finalize(self, status: str = "FINISHED") -> None: - super().finalize(status) - status = "FINISHED" if status == "success" else status - if self.experiment.get_run(self.run_id): - self.experiment.set_terminated(self.run_id, status)
- - @property - def save_dir(self) -> Optional[str]: - """The root file directory in which MLflow experiments are saved. - - Return: - Local path to the root experiment directory if the tracking uri is local. - Otherwise returns `None`. - """ - if self._tracking_uri.startswith(LOCAL_FILE_URI_PREFIX): - return self._tracking_uri.lstrip(LOCAL_FILE_URI_PREFIX) - - @property - def name(self) -> str: - """Get the experiment id. - - Returns: - The experiment id. - """ - return self.experiment_id - - @property - def version(self) -> str: - """Get the run id. - - Returns: - The run id. - """ - return self.run_id
-
- -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- -
-
-
- -
-
-
-
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/_modules/pytorch_lightning/loggers/neptune.html b/docs/_modules/pytorch_lightning/loggers/neptune.html deleted file mode 100644 index 3e9bd1a..0000000 --- a/docs/_modules/pytorch_lightning/loggers/neptune.html +++ /dev/null @@ -1,1360 +0,0 @@ - - - - - - - - - - - - - pytorch_lightning.loggers.neptune — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- - - - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -

Source code for pytorch_lightning.loggers.neptune

-# Copyright The PyTorch Lightning team.
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#     http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-"""
-Neptune Logger
---------------
-"""
-__all__ = [
-    "NeptuneLogger",
-]
-
-import logging
-import os
-import warnings
-from argparse import Namespace
-from functools import reduce
-from typing import Any, Callable, Dict, Generator, Mapping, Optional, Sequence, Set, Union
-from weakref import ReferenceType
-
-import torch
-
-from pytorch_lightning import __version__
-from pytorch_lightning.callbacks.model_checkpoint import ModelCheckpoint
-from pytorch_lightning.loggers.base import LightningLoggerBase, rank_zero_experiment
-from pytorch_lightning.utilities.imports import _NEPTUNE_AVAILABLE, _NEPTUNE_GREATER_EQUAL_0_9
-from pytorch_lightning.utilities.logger import _add_prefix, _convert_params, _sanitize_callable_params
-from pytorch_lightning.utilities.model_summary import ModelSummary
-from pytorch_lightning.utilities.rank_zero import rank_zero_only
-
-if _NEPTUNE_AVAILABLE and _NEPTUNE_GREATER_EQUAL_0_9:
-    try:
-        from neptune import new as neptune
-        from neptune.new.exceptions import NeptuneLegacyProjectException, NeptuneOfflineModeFetchException
-        from neptune.new.run import Run
-        from neptune.new.types import File as NeptuneFile
-    except ModuleNotFoundError:
-        import neptune
-        from neptune.exceptions import NeptuneLegacyProjectException, NeptuneOfflineModeFetchException
-        from neptune.run import Run
-        from neptune.types import File as NeptuneFile
-else:
-    # needed for test mocks, and function signatures
-    neptune, Run, NeptuneFile = None, None, None
-
-log = logging.getLogger(__name__)
-
-_INTEGRATION_VERSION_KEY = "source_code/integrations/pytorch-lightning"
-
-# kwargs used in previous NeptuneLogger version, now deprecated
-_LEGACY_NEPTUNE_INIT_KWARGS = [
-    "project_name",
-    "offline_mode",
-    "experiment_name",
-    "experiment_id",
-    "params",
-    "properties",
-    "upload_source_files",
-    "abort_callback",
-    "logger",
-    "upload_stdout",
-    "upload_stderr",
-    "send_hardware_metrics",
-    "run_monitoring_thread",
-    "handle_uncaught_exceptions",
-    "git_info",
-    "hostname",
-    "notebook_id",
-    "notebook_path",
-]
-
-# kwargs used in legacy NeptuneLogger from neptune-pytorch-lightning package
-_LEGACY_NEPTUNE_LOGGER_KWARGS = [
-    "base_namespace",
-    "close_after_fit",
-]
-
-
-
[docs]class NeptuneLogger(LightningLoggerBase): - r""" - Log using `Neptune <https://neptune.ai>`_. - - Install it with pip: - - .. code-block:: bash - - pip install neptune-client - - or conda: - - .. code-block:: bash - - conda install -c conda-forge neptune-client - - **Quickstart** - - Pass NeptuneLogger instance to the Trainer to log metadata with Neptune: - - .. code-block:: python - - - from pytorch_lightning import Trainer - from pytorch_lightning.loggers import NeptuneLogger - - neptune_logger = NeptuneLogger( - api_key="ANONYMOUS", # replace with your own - project="common/pytorch-lightning-integration", # format "<WORKSPACE/PROJECT>" - tags=["training", "resnet"], # optional - ) - trainer = Trainer(max_epochs=10, logger=neptune_logger) - - **How to use NeptuneLogger?** - - Use the logger anywhere in your :class:`~pytorch_lightning.core.lightning.LightningModule` as follows: - - .. code-block:: python - - from neptune.new.types import File - from pytorch_lightning import LightningModule - - - class LitModel(LightningModule): - def training_step(self, batch, batch_idx): - # log metrics - acc = ... - self.log("train/loss", loss) - - def any_lightning_module_function_or_hook(self): - # log images - img = ... - self.logger.experiment["train/misclassified_images"].log(File.as_image(img)) - - # generic recipe - metadata = ... - self.logger.experiment["your/metadata/structure"].log(metadata) - - Note that syntax: ``self.logger.experiment["your/metadata/structure"].log(metadata)`` is specific to Neptune - and it extends logger capabilities. Specifically, it allows you to log various types of metadata - like scores, files, images, interactive visuals, CSVs, etc. - Refer to the `Neptune docs <https://docs.neptune.ai/you-should-know/logging-metadata#essential-logging-methods>`_ - for more detailed explanations. - You can also use regular logger methods ``log_metrics()``, and ``log_hyperparams()`` with NeptuneLogger - as these are also supported. 
- - **Log after fitting or testing is finished** - - You can log objects after the fitting or testing methods are finished: - - .. code-block:: python - - neptune_logger = NeptuneLogger(project="common/pytorch-lightning-integration") - - trainer = pl.Trainer(logger=neptune_logger) - model = ... - datamodule = ... - trainer.fit(model, datamodule=datamodule) - trainer.test(model, datamodule=datamodule) - - # Log objects after `fit` or `test` methods - # model summary - neptune_logger.log_model_summary(model=model, max_depth=-1) - - # generic recipe - metadata = ... - neptune_logger.experiment["your/metadata/structure"].log(metadata) - - **Log model checkpoints** - - If you have :class:`~pytorch_lightning.callbacks.ModelCheckpoint` configured, - Neptune logger automatically logs model checkpoints. - Model weights will be uploaded to the: "model/checkpoints" namespace in the Neptune Run. - You can disable this option: - - .. code-block:: python - - neptune_logger = NeptuneLogger(project="common/pytorch-lightning-integration", log_model_checkpoints=False) - - **Pass additional parameters to the Neptune run** - - You can also pass ``neptune_run_kwargs`` to specify the run in the greater detail, like ``tags`` or ``description``: - - .. testcode:: - - from pytorch_lightning import Trainer - from pytorch_lightning.loggers import NeptuneLogger - - neptune_logger = NeptuneLogger( - project="common/pytorch-lightning-integration", - name="lightning-run", - description="mlp quick run with pytorch-lightning", - tags=["mlp", "quick-run"], - ) - trainer = Trainer(max_epochs=3, logger=neptune_logger) - - Check `run documentation <https://docs.neptune.ai/essentials/api-reference/run>`_ - for more info about additional run parameters. - - **Details about Neptune run structure** - - Runs can be viewed as nested dictionary-like structures that you can define in your code. - Thanks to this you can easily organize your metadata in a way that is most convenient for you. 
- - The hierarchical structure that you apply to your metadata will be reflected later in the UI. - - You can organize this way any type of metadata - images, parameters, metrics, model checkpoint, CSV files, etc. - - See Also: - - Read about - `what object you can log to Neptune <https://docs.neptune.ai/you-should-know/what-can-you-log-and-display>`_. - - Check `example run <https://app.neptune.ai/o/common/org/pytorch-lightning-integration/e/PTL-1/all>`_ - with multiple types of metadata logged. - - For more detailed info check - `user guide <https://docs.neptune.ai/integrations-and-supported-tools/model-training/pytorch-lightning>`_. - - Args: - api_key: Optional. - Neptune API token, found on https://neptune.ai upon registration. - Read: `how to find and set Neptune API token <https://docs.neptune.ai/administration/security-and-privacy/ - how-to-find-and-set-neptune-api-token>`_. - It is recommended to keep it in the `NEPTUNE_API_TOKEN` - environment variable and then you can drop ``api_key=None``. - project: Optional. - Name of a project in a form of "my_workspace/my_project" for example "tom/mask-rcnn". - If ``None``, the value of `NEPTUNE_PROJECT` environment variable will be taken. - You need to create the project in https://neptune.ai first. - name: Optional. Editable name of the run. - Run name appears in the "all metadata/sys" section in Neptune UI. - run: Optional. Default is ``None``. The Neptune ``Run`` object. - If specified, this `Run`` will be used for logging, instead of a new Run. - When run object is passed you can't specify other neptune properties. - log_model_checkpoints: Optional. Default is ``True``. Log model checkpoint to Neptune. - Works only if ``ModelCheckpoint`` is passed to the ``Trainer``. - prefix: Optional. Default is ``"training"``. Root namespace for all metadata logging. - \**neptune_run_kwargs: Additional arguments like ``tags``, ``description``, ``capture_stdout``, etc. - used when run is created. 
- - Raises: - ModuleNotFoundError: - If required Neptune package in version >=0.9 is not installed on the device. - TypeError: - If configured project has not been migrated to new structure yet. - ValueError: - If argument passed to the logger's constructor is incorrect. - """ - - LOGGER_JOIN_CHAR = "/" - PARAMETERS_KEY = "hyperparams" - ARTIFACTS_KEY = "artifacts" - - def __init__( - self, - *, # force users to call `NeptuneLogger` initializer with `kwargs` - api_key: Optional[str] = None, - project: Optional[str] = None, - name: Optional[str] = None, - run: Optional["Run"] = None, - log_model_checkpoints: Optional[bool] = True, - prefix: str = "training", - agg_key_funcs: Optional[Mapping[str, Callable[[Sequence[float]], float]]] = None, - agg_default_func: Optional[Callable[[Sequence[float]], float]] = None, - **neptune_run_kwargs, - ): - # verify if user passed proper init arguments - self._verify_input_arguments(api_key, project, name, run, neptune_run_kwargs) - if neptune is None: - raise ModuleNotFoundError( - "You want to use the `Neptune` logger which is not installed yet, install it with" - " `pip install neptune-client`." 
- ) - - super().__init__(agg_key_funcs=agg_key_funcs, agg_default_func=agg_default_func) - self._log_model_checkpoints = log_model_checkpoints - self._prefix = prefix - self._run_name = name - self._project_name = project - self._api_key = api_key - self._run_instance = run - self._neptune_run_kwargs = neptune_run_kwargs - self._run_short_id = None - - if self._run_instance is not None: - self._retrieve_run_data() - - # make sure that we've log integration version for outside `Run` instances - self._run_instance[_INTEGRATION_VERSION_KEY] = __version__ - - def _retrieve_run_data(self): - try: - self._run_instance.wait() - self._run_short_id = self._run_instance["sys/id"].fetch() - self._run_name = self._run_instance["sys/name"].fetch() - except NeptuneOfflineModeFetchException: - self._run_short_id = "OFFLINE" - self._run_name = "offline-name" - - @property - def _neptune_init_args(self): - args = {} - # Backward compatibility in case of previous version retrieval - try: - args = self._neptune_run_kwargs - except AttributeError: - pass - - if self._project_name is not None: - args["project"] = self._project_name - - if self._api_key is not None: - args["api_token"] = self._api_key - - if self._run_short_id is not None: - args["run"] = self._run_short_id - - # Backward compatibility in case of previous version retrieval - try: - if self._run_name is not None: - args["name"] = self._run_name - except AttributeError: - pass - - return args - - def _construct_path_with_prefix(self, *keys) -> str: - """Return sequence of keys joined by `LOGGER_JOIN_CHAR`, started with `_prefix` if defined.""" - if self._prefix: - return self.LOGGER_JOIN_CHAR.join([self._prefix, *keys]) - return self.LOGGER_JOIN_CHAR.join(keys) - - @staticmethod - def _verify_input_arguments( - api_key: Optional[str], - project: Optional[str], - name: Optional[str], - run: Optional["Run"], - neptune_run_kwargs: dict, - ): - legacy_kwargs_msg = ( - "Following kwargs are deprecated: {legacy_kwargs}.\n" - 
"If you are looking for the Neptune logger using legacy Python API," - " it's still available as part of neptune-contrib package:\n" - " - https://docs-legacy.neptune.ai/integrations/pytorch_lightning.html\n" - "The NeptuneLogger was re-written to use the neptune.new Python API\n" - " - https://neptune.ai/blog/neptune-new\n" - " - https://docs.neptune.ai/integrations-and-supported-tools/model-training/pytorch-lightning\n" - "You should use arguments accepted by either NeptuneLogger.init() or neptune.init()" - ) - - # check if user used legacy kwargs expected in `NeptuneLegacyLogger` - used_legacy_kwargs = [ - legacy_kwarg for legacy_kwarg in neptune_run_kwargs if legacy_kwarg in _LEGACY_NEPTUNE_INIT_KWARGS - ] - if used_legacy_kwargs: - raise ValueError(legacy_kwargs_msg.format(legacy_kwargs=used_legacy_kwargs)) - - # check if user used legacy kwargs expected in `NeptuneLogger` from neptune-pytorch-lightning package - used_legacy_neptune_kwargs = [ - legacy_kwarg for legacy_kwarg in neptune_run_kwargs if legacy_kwarg in _LEGACY_NEPTUNE_LOGGER_KWARGS - ] - if used_legacy_neptune_kwargs: - raise ValueError(legacy_kwargs_msg.format(legacy_kwargs=used_legacy_neptune_kwargs)) - - # check if user passed new client `Run` object - if run is not None and not isinstance(run, Run): - raise ValueError( - "Run parameter expected to be of type `neptune.new.Run`.\n" - "If you are looking for the Neptune logger using legacy Python API," - " it's still available as part of neptune-contrib package:\n" - " - https://docs-legacy.neptune.ai/integrations/pytorch_lightning.html\n" - "The NeptuneLogger was re-written to use the neptune.new Python API\n" - " - https://neptune.ai/blog/neptune-new\n" - " - https://docs.neptune.ai/integrations-and-supported-tools/model-training/pytorch-lightning\n" - ) - - # check if user passed redundant neptune.init arguments when passed run - any_neptune_init_arg_passed = any(arg is not None for arg in [api_key, project, name]) or neptune_run_kwargs - if 
run is not None and any_neptune_init_arg_passed: - raise ValueError( - "When an already initialized run object is provided" - " you can't provide other neptune.init() parameters.\n" - ) - - def __getstate__(self): - state = self.__dict__.copy() - # Run instance can't be pickled - state["_run_instance"] = None - return state - - def __setstate__(self, state): - self.__dict__ = state - self._run_instance = neptune.init(**self._neptune_init_args) - - @property - @rank_zero_experiment - def experiment(self) -> Run: - r""" - Actual Neptune run object. Allows you to use neptune logging features in your - :class:`~pytorch_lightning.core.lightning.LightningModule`. - - Example:: - - class LitModel(LightningModule): - def training_step(self, batch, batch_idx): - # log metrics - acc = ... - self.logger.experiment["train/acc"].log(acc) - - # log images - img = ... - self.logger.experiment["train/misclassified_images"].log(File.as_image(img)) - - Note that syntax: ``self.logger.experiment["your/metadata/structure"].log(metadata)`` - is specific to Neptune and it extends logger capabilities. - Specifically, it allows you to log various types of metadata like scores, files, - images, interactive visuals, CSVs, etc. Refer to the - `Neptune docs <https://docs.neptune.ai/you-should-know/logging-metadata#essential-logging-methods>`_ - for more detailed explanations. - You can also use regular logger methods ``log_metrics()``, and ``log_hyperparams()`` - with NeptuneLogger as these are also supported. 
- """ - return self.run - - @property - @rank_zero_experiment - def run(self) -> Run: - try: - if not self._run_instance: - self._run_instance = neptune.init(**self._neptune_init_args) - self._retrieve_run_data() - # make sure that we've log integration version for newly created - self._run_instance[_INTEGRATION_VERSION_KEY] = __version__ - - return self._run_instance - except NeptuneLegacyProjectException as e: - raise TypeError( - f"Project {self._project_name} has not been migrated to the new structure." - " You can still integrate it with the Neptune logger using legacy Python API" - " available as part of neptune-contrib package:" - " https://docs-legacy.neptune.ai/integrations/pytorch_lightning.html\n" - ) from e - -
[docs] @rank_zero_only - def log_hyperparams(self, params: Union[Dict[str, Any], Namespace]) -> None: # skipcq: PYL-W0221 - r""" - Log hyper-parameters to the run. - - Hyperparams will be logged under the "<prefix>/hyperparams" namespace. - - Note: - - You can also log parameters by directly using the logger instance: - ``neptune_logger.experiment["model/hyper-parameters"] = params_dict``. - - In this way you can keep hierarchical structure of the parameters. - - Args: - params: `dict`. - Python dictionary structure with parameters. - - Example:: - - from pytorch_lightning.loggers import NeptuneLogger - - PARAMS = { - "batch_size": 64, - "lr": 0.07, - "decay_factor": 0.97 - } - - neptune_logger = NeptuneLogger( - api_key="ANONYMOUS", - project="common/pytorch-lightning-integration" - ) - - neptune_logger.log_hyperparams(PARAMS) - """ - params = _convert_params(params) - params = _sanitize_callable_params(params) - - parameters_key = self.PARAMETERS_KEY - parameters_key = self._construct_path_with_prefix(parameters_key) - - self.run[parameters_key] = params
- -
[docs] @rank_zero_only - def log_metrics(self, metrics: Dict[str, Union[torch.Tensor, float]], step: Optional[int] = None) -> None: - """Log metrics (numeric values) in Neptune runs. - - Args: - metrics: Dictionary with metric names as keys and measured quantities as values. - step: Step number at which the metrics should be recorded, currently ignored. - """ - if rank_zero_only.rank != 0: - raise ValueError("run tried to log from global_rank != 0") - - metrics = _add_prefix(metrics, self._prefix, self.LOGGER_JOIN_CHAR) - - for key, val in metrics.items(): - # `step` is ignored because Neptune expects strictly increasing step values which - # Lightning does not always guarantee. - self.run[key].log(val)
- -
[docs] @rank_zero_only - def finalize(self, status: str) -> None: - if status: - self.run[self._construct_path_with_prefix("status")] = status - - super().finalize(status)
- - @property - def save_dir(self) -> Optional[str]: - """Gets the save directory of the experiment which in this case is ``None`` because Neptune does not save - locally. - - Returns: - the root directory where experiment logs get saved - """ - return os.path.join(os.getcwd(), ".neptune") - - @rank_zero_only - def log_model_summary(self, model, max_depth=-1): - model_str = str(ModelSummary(model=model, max_depth=max_depth)) - self.run[self._construct_path_with_prefix("model/summary")] = neptune.types.File.from_content( - content=model_str, extension="txt" - ) - -
[docs] @rank_zero_only - def after_save_checkpoint(self, checkpoint_callback: "ReferenceType[ModelCheckpoint]") -> None: - """Automatically log checkpointed model. Called after model checkpoint callback saves a new checkpoint. - - Args: - checkpoint_callback: the model checkpoint callback instance - """ - if not self._log_model_checkpoints: - return - - file_names = set() - checkpoints_namespace = self._construct_path_with_prefix("model/checkpoints") - - # save last model - if checkpoint_callback.last_model_path: - model_last_name = self._get_full_model_name(checkpoint_callback.last_model_path, checkpoint_callback) - file_names.add(model_last_name) - self.run[f"{checkpoints_namespace}/{model_last_name}"].upload(checkpoint_callback.last_model_path) - - # save best k models - for key in checkpoint_callback.best_k_models.keys(): - model_name = self._get_full_model_name(key, checkpoint_callback) - file_names.add(model_name) - self.run[f"{checkpoints_namespace}/{model_name}"].upload(key) - - # log best model path and checkpoint - if checkpoint_callback.best_model_path: - self.run[self._construct_path_with_prefix("model/best_model_path")] = checkpoint_callback.best_model_path - - model_name = self._get_full_model_name(checkpoint_callback.best_model_path, checkpoint_callback) - file_names.add(model_name) - self.run[f"{checkpoints_namespace}/{model_name}"].upload(checkpoint_callback.best_model_path) - - # remove old models logged to experiment if they are not part of best k models at this point - if self.run.exists(checkpoints_namespace): - exp_structure = self.run.get_structure() - uploaded_model_names = self._get_full_model_names_from_exp_structure(exp_structure, checkpoints_namespace) - - for file_to_drop in list(uploaded_model_names - file_names): - del self.run[f"{checkpoints_namespace}/{file_to_drop}"] - - # log best model score - if checkpoint_callback.best_model_score: - self.run[self._construct_path_with_prefix("model/best_model_score")] = ( - 
checkpoint_callback.best_model_score.cpu().detach().numpy() - )
- - @staticmethod - def _get_full_model_name(model_path: str, checkpoint_callback: "ReferenceType[ModelCheckpoint]") -> str: - """Returns model name which is string `model_path` appended to `checkpoint_callback.dirpath`.""" - expected_model_path = f"{checkpoint_callback.dirpath}{os.path.sep}" - if not model_path.startswith(expected_model_path): - raise ValueError(f"{model_path} was expected to start with {expected_model_path}.") - # Remove extension from filepath - filepath, _ = os.path.splitext(model_path[len(expected_model_path) :]) - - return filepath - - @classmethod - def _get_full_model_names_from_exp_structure(cls, exp_structure: dict, namespace: str) -> Set[str]: - """Returns all paths to properties which were already logged in `namespace`""" - structure_keys = namespace.split(cls.LOGGER_JOIN_CHAR) - uploaded_models_dict = reduce(lambda d, k: d[k], [exp_structure, *structure_keys]) - return set(cls._dict_paths(uploaded_models_dict)) - - @classmethod - def _dict_paths(cls, d: dict, path_in_build: str = None) -> Generator: - for k, v in d.items(): - path = f"{path_in_build}/{k}" if path_in_build is not None else k - if not isinstance(v, dict): - yield path - else: - yield from cls._dict_paths(v, path) - - @property - def name(self) -> str: - """Return the experiment name or 'offline-name' when exp is run in offline mode.""" - return self._run_name - - @property - def version(self) -> str: - """Return the experiment version. 
- - It's Neptune Run's short_id - """ - return self._run_short_id - - @staticmethod - def _signal_deprecated_api_usage(f_name, sample_code, raise_exception=False): - msg_suffix = ( - f"If you are looking for the Neptune logger using legacy Python API," - f" it's still available as part of neptune-contrib package:\n" - f" - https://docs-legacy.neptune.ai/integrations/pytorch_lightning.html\n" - f"The NeptuneLogger was re-written to use the neptune.new Python API\n" - f" - https://neptune.ai/blog/neptune-new\n" - f" - https://docs.neptune.ai/integrations-and-supported-tools/model-training/pytorch-lightning\n" - f"Instead of `logger.{f_name}` you can use:\n" - f"\t{sample_code}" - ) - - if not raise_exception: - warnings.warn( - "The function you've used is deprecated in v1.5.0 and will be removed in v1.7.0. " + msg_suffix - ) - else: - raise ValueError("The function you've used is deprecated.\n" + msg_suffix) - - @rank_zero_only - def log_metric(self, metric_name: str, metric_value: Union[torch.Tensor, float, str], step: Optional[int] = None): - key = f"{self._prefix}/{metric_name}" - self._signal_deprecated_api_usage("log_metric", f"logger.run['{key}'].log(42)") - if torch.is_tensor(metric_value): - metric_value = metric_value.cpu().detach() - - self.run[key].log(metric_value, step=step) - - @rank_zero_only - def log_text(self, log_name: str, text: str, step: Optional[int] = None) -> None: - key = f"{self._prefix}/{log_name}" - self._signal_deprecated_api_usage("log_text", f"logger.run['{key}].log('text')") - self.run[key].log(str(text), step=step) - - @rank_zero_only - def log_image(self, log_name: str, image: Union[str, Any], step: Optional[int] = None) -> None: - key = f"{self._prefix}/{log_name}" - self._signal_deprecated_api_usage("log_image", f"logger.run['{key}'].log(File('path_to_image'))") - if isinstance(image, str): - # if `img` is path to file, convert it to file object - image = NeptuneFile(image) - self.run[key].log(image, step=step) - - 
@rank_zero_only - def log_artifact(self, artifact: str, destination: Optional[str] = None) -> None: - key = f"{self._prefix}/{self.ARTIFACTS_KEY}/{artifact}" - self._signal_deprecated_api_usage("log_artifact", f"logger.run['{key}].log('path_to_file')") - self.run[key].log(destination) - - def set_property(self, *args, **kwargs): - self._signal_deprecated_api_usage( - "log_artifact", f"logger.run['{self._prefix}/{self.PARAMETERS_KEY}/key'].log(value)", raise_exception=True - ) - - def append_tags(self, *args, **kwargs): - self._signal_deprecated_api_usage( - "append_tags", "logger.run['sys/tags'].add(['foo', 'bar'])", raise_exception=True - )
-
- -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- -
-
-
- -
-
-
-
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/_modules/pytorch_lightning/loggers/tensorboard.html b/docs/_modules/pytorch_lightning/loggers/tensorboard.html deleted file mode 100644 index 328b8eb..0000000 --- a/docs/_modules/pytorch_lightning/loggers/tensorboard.html +++ /dev/null @@ -1,1004 +0,0 @@ - - - - - - - - - - - - - pytorch_lightning.loggers.tensorboard — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- - - - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -

Source code for pytorch_lightning.loggers.tensorboard

-# Copyright The PyTorch Lightning team.
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#     http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-"""
-TensorBoard Logger
-------------------
-"""
-
-import logging
-import os
-from argparse import Namespace
-from typing import Any, Callable, Dict, Mapping, Optional, Sequence, Union
-
-import numpy as np
-import torch
-from torch.utils.tensorboard import SummaryWriter
-from torch.utils.tensorboard.summary import hparams
-
-import pytorch_lightning as pl
-from pytorch_lightning.core.saving import save_hparams_to_yaml
-from pytorch_lightning.loggers.base import LightningLoggerBase, rank_zero_experiment
-from pytorch_lightning.utilities.cloud_io import get_filesystem
-from pytorch_lightning.utilities.imports import _OMEGACONF_AVAILABLE
-from pytorch_lightning.utilities.logger import _add_prefix, _convert_params, _flatten_dict
-from pytorch_lightning.utilities.logger import _sanitize_params as _utils_sanitize_params
-from pytorch_lightning.utilities.rank_zero import rank_zero_only, rank_zero_warn
-
-log = logging.getLogger(__name__)
-
-if _OMEGACONF_AVAILABLE:
-    from omegaconf import Container, OmegaConf
-
-
-
[docs]class TensorBoardLogger(LightningLoggerBase): - r""" - Log to local file system in `TensorBoard <https://www.tensorflow.org/tensorboard>`_ format. - - Implemented using :class:`~torch.utils.tensorboard.SummaryWriter`. Logs are saved to - ``os.path.join(save_dir, name, version)``. This is the default logger in Lightning, it comes - preinstalled. - - Example: - - .. testcode:: - - from pytorch_lightning import Trainer - from pytorch_lightning.loggers import TensorBoardLogger - - logger = TensorBoardLogger("tb_logs", name="my_model") - trainer = Trainer(logger=logger) - - Args: - save_dir: Save directory - name: Experiment name. Defaults to ``'default'``. If it is the empty string then no per-experiment - subdirectory is used. - version: Experiment version. If version is not specified the logger inspects the save - directory for existing versions, then automatically assigns the next available version. - If it is a string then it is used as the run-specific subdirectory name, - otherwise ``'version_${version}'`` is used. - log_graph: Adds the computational graph to tensorboard. This requires that - the user has defined the `self.example_input_array` attribute in their - model. - default_hp_metric: Enables a placeholder metric with key `hp_metric` when `log_hyperparams` is - called without a metric (otherwise calls to log_hyperparams without a metric are ignored). - prefix: A string to put at the beginning of metric keys. - sub_dir: Sub-directory to group TensorBoard logs. If a sub_dir argument is passed - then logs are saved in ``/save_dir/name/version/sub_dir/``. Defaults to ``None`` in which - logs are saved in ``/save_dir/name/version/``. - \**kwargs: Additional arguments used by :class:`SummaryWriter` can be passed as keyword - arguments in this logger. To automatically flush to disk, `max_queue` sets the size - of the queue for pending logs before flushing. `flush_secs` determines how many seconds - elapses before flushing. 
- - """ - NAME_HPARAMS_FILE = "hparams.yaml" - LOGGER_JOIN_CHAR = "-" - - def __init__( - self, - save_dir: str, - name: Optional[str] = "lightning_logs", - version: Optional[Union[int, str]] = None, - log_graph: bool = False, - default_hp_metric: bool = True, - prefix: str = "", - sub_dir: Optional[str] = None, - agg_key_funcs: Optional[Mapping[str, Callable[[Sequence[float]], float]]] = None, - agg_default_func: Optional[Callable[[Sequence[float]], float]] = None, - **kwargs, - ): - super().__init__(agg_key_funcs=agg_key_funcs, agg_default_func=agg_default_func) - self._save_dir = save_dir - self._name = name or "" - self._version = version - self._sub_dir = sub_dir - self._log_graph = log_graph - self._default_hp_metric = default_hp_metric - self._prefix = prefix - self._fs = get_filesystem(save_dir) - - self._experiment = None - self.hparams = {} - self._kwargs = kwargs - - @property - def root_dir(self) -> str: - """Parent directory for all tensorboard checkpoint subdirectories. - - If the experiment name parameter is an empty string, no experiment subdirectory is used and the checkpoint will - be saved in "save_dir/version" - """ - return os.path.join(self.save_dir, self.name) - - @property - def log_dir(self) -> str: - """The directory for this run's tensorboard checkpoint. - - By default, it is named ``'version_${self.version}'`` but it can be overridden by passing a string value for the - constructor's version parameter instead of ``None`` or an int. - """ - # create a pseudo standard path ala test-tube - version = self.version if isinstance(self.version, str) else f"version_{self.version}" - log_dir = os.path.join(self.root_dir, version) - if isinstance(self.sub_dir, str): - log_dir = os.path.join(log_dir, self.sub_dir) - log_dir = os.path.expandvars(log_dir) - log_dir = os.path.expanduser(log_dir) - return log_dir - - @property - def save_dir(self) -> Optional[str]: - """Gets the save directory where the TensorBoard experiments are saved. 
- - Returns: - The local path to the save directory where the TensorBoard experiments are saved. - """ - return self._save_dir - - @property - def sub_dir(self) -> Optional[str]: - """Gets the sub directory where the TensorBoard experiments are saved. - - Returns: - The local path to the sub directory where the TensorBoard experiments are saved. - """ - return self._sub_dir - - @property - @rank_zero_experiment - def experiment(self) -> SummaryWriter: - r""" - Actual tensorboard object. To use TensorBoard features in your - :class:`~pytorch_lightning.core.lightning.LightningModule` do the following. - - Example:: - - self.logger.experiment.some_tensorboard_function() - - """ - if self._experiment is not None: - return self._experiment - - assert rank_zero_only.rank == 0, "tried to init log dirs in non global_rank=0" - if self.root_dir: - self._fs.makedirs(self.root_dir, exist_ok=True) - self._experiment = SummaryWriter(log_dir=self.log_dir, **self._kwargs) - return self._experiment - -
[docs] @rank_zero_only - def log_hyperparams( - self, params: Union[Dict[str, Any], Namespace], metrics: Optional[Dict[str, Any]] = None - ) -> None: - """Record hyperparameters. TensorBoard logs with and without saved hyperparameters are incompatible, the - hyperparameters are then not displayed in the TensorBoard. Please delete or move the previously saved logs - to display the new ones with hyperparameters. - - Args: - params: a dictionary-like container with the hyperparameters - metrics: Dictionary with metric names as keys and measured quantities as values - """ - - params = _convert_params(params) - - # store params to output - if _OMEGACONF_AVAILABLE and isinstance(params, Container): - self.hparams = OmegaConf.merge(self.hparams, params) - else: - self.hparams.update(params) - - # format params into the suitable for tensorboard - params = _flatten_dict(params) - params = self._sanitize_params(params) - - if metrics is None: - if self._default_hp_metric: - metrics = {"hp_metric": -1} - elif not isinstance(metrics, dict): - metrics = {"hp_metric": metrics} - - if metrics: - self.log_metrics(metrics, 0) - exp, ssi, sei = hparams(params, metrics) - writer = self.experiment._get_file_writer() - writer.add_summary(exp) - writer.add_summary(ssi) - writer.add_summary(sei)
- -
[docs] @rank_zero_only - def log_metrics(self, metrics: Dict[str, float], step: Optional[int] = None) -> None: - assert rank_zero_only.rank == 0, "experiment tried to log from global_rank != 0" - - metrics = _add_prefix(metrics, self._prefix, self.LOGGER_JOIN_CHAR) - - for k, v in metrics.items(): - if isinstance(v, torch.Tensor): - v = v.item() - - if isinstance(v, dict): - self.experiment.add_scalars(k, v, step) - else: - try: - self.experiment.add_scalar(k, v, step) - # todo: specify the possible exception - except Exception as ex: - m = f"\n you tried to log {v} which is currently not supported. Try a dict or a scalar/tensor." - raise ValueError(m) from ex
- -
[docs] @rank_zero_only - def log_graph(self, model: "pl.LightningModule", input_array=None): - if self._log_graph: - if input_array is None: - input_array = model.example_input_array - - if input_array is not None: - input_array = model._apply_batch_transfer_handler(input_array) - model._running_torchscript = True - self.experiment.add_graph(model, input_array) - model._running_torchscript = False - else: - rank_zero_warn( - "Could not log computational graph since the" - " `model.example_input_array` attribute is not set" - " or `input_array` was not given", - )
- -
[docs] @rank_zero_only - def save(self) -> None: - super().save() - dir_path = self.log_dir - - # prepare the file path - hparams_file = os.path.join(dir_path, self.NAME_HPARAMS_FILE) - - # save the metatags file if it doesn't exist and the log directory exists - if self._fs.isdir(dir_path) and not self._fs.isfile(hparams_file): - save_hparams_to_yaml(hparams_file, self.hparams)
- -
[docs] @rank_zero_only - def finalize(self, status: str) -> None: - self.experiment.flush() - self.experiment.close() - self.save()
- - @property - def name(self) -> str: - """Get the name of the experiment. - - Returns: - The name of the experiment. - """ - return self._name - - @property - def version(self) -> int: - """Get the experiment version. - - Returns: - The experiment version if specified else the next version. - """ - if self._version is None: - self._version = self._get_next_version() - return self._version - - def _get_next_version(self): - root_dir = self.root_dir - - try: - listdir_info = self._fs.listdir(root_dir) - except OSError: - log.warning("Missing logger folder: %s", root_dir) - return 0 - - existing_versions = [] - for listing in listdir_info: - d = listing["name"] - bn = os.path.basename(d) - if self._fs.isdir(d) and bn.startswith("version_"): - dir_ver = bn.split("_")[1].replace("/", "") - existing_versions.append(int(dir_ver)) - if len(existing_versions) == 0: - return 0 - - return max(existing_versions) + 1 - - @staticmethod - def _sanitize_params(params: Dict[str, Any]) -> Dict[str, Any]: - params = _utils_sanitize_params(params) - # logging of arrays with dimension > 1 is not supported, sanitize as string - return {k: str(v) if isinstance(v, (torch.Tensor, np.ndarray)) and v.ndim > 1 else v for k, v in params.items()} - - def __getstate__(self): - state = self.__dict__.copy() - state["_experiment"] = None - return state
-
- -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- -
-
-
- -
-
-
-
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/_modules/pytorch_lightning/loggers/wandb.html b/docs/_modules/pytorch_lightning/loggers/wandb.html deleted file mode 100644 index ed249ab..0000000 --- a/docs/_modules/pytorch_lightning/loggers/wandb.html +++ /dev/null @@ -1,1197 +0,0 @@ - - - - - - - - - - - - - pytorch_lightning.loggers.wandb — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- - - - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -

Source code for pytorch_lightning.loggers.wandb

-# Copyright The PyTorch Lightning team.
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#     http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-"""
-Weights and Biases Logger
--------------------------
-"""
-import os
-from argparse import Namespace
-from pathlib import Path
-from typing import Any, Callable, Dict, List, Mapping, Optional, Sequence, Union
-from weakref import ReferenceType
-
-import torch.nn as nn
-
-from pytorch_lightning.callbacks.model_checkpoint import ModelCheckpoint
-from pytorch_lightning.loggers.base import LightningLoggerBase, rank_zero_experiment
-from pytorch_lightning.utilities.exceptions import MisconfigurationException
-from pytorch_lightning.utilities.imports import _WANDB_GREATER_EQUAL_0_10_22, _WANDB_GREATER_EQUAL_0_12_10
-from pytorch_lightning.utilities.logger import _add_prefix, _convert_params, _flatten_dict, _sanitize_callable_params
-from pytorch_lightning.utilities.rank_zero import rank_zero_only, rank_zero_warn
-
-try:
-    import wandb
-    from wandb.wandb_run import Run
-except ModuleNotFoundError:
-    # needed for test mocks, these tests shall be updated
-    wandb, Run = None, None
-
-
-
[docs]class WandbLogger(LightningLoggerBase): - r""" - Log using `Weights and Biases <https://docs.wandb.ai/integrations/lightning>`_. - - **Installation and set-up** - - Install with pip: - - .. code-block:: bash - - pip install wandb - - Create a `WandbLogger` instance: - - .. code-block:: python - - from pytorch_lightning.loggers import WandbLogger - - wandb_logger = WandbLogger(project="MNIST") - - Pass the logger instance to the `Trainer`: - - .. code-block:: python - - trainer = Trainer(logger=wandb_logger) - - A new W&B run will be created when training starts if you have not created one manually before with `wandb.init()`. - - **Log metrics** - - Log from :class:`~pytorch_lightning.core.lightning.LightningModule`: - - .. code-block:: python - - class LitModule(LightningModule): - def training_step(self, batch, batch_idx): - self.log("train/loss", loss) - - Use directly wandb module: - - .. code-block:: python - - wandb.log({"train/loss": loss}) - - **Log hyper-parameters** - - Save :class:`~pytorch_lightning.core.lightning.LightningModule` parameters: - - .. code-block:: python - - class LitModule(LightningModule): - def __init__(self, *args, **kwarg): - self.save_hyperparameters() - - Add other config parameters: - - .. code-block:: python - - # add one parameter - wandb_logger.experiment.config["key"] = value - - # add multiple parameters - wandb_logger.experiment.config.update({key1: val1, key2: val2}) - - # use directly wandb module - wandb.config["key"] = value - wandb.config.update() - - **Log gradients, parameters and model topology** - - Call the `watch` method for automatically tracking gradients: - - .. 
code-block:: python - - # log gradients and model topology - wandb_logger.watch(model) - - # log gradients, parameter histogram and model topology - wandb_logger.watch(model, log="all") - - # change log frequency of gradients and parameters (100 steps by default) - wandb_logger.watch(model, log_freq=500) - - # do not log graph (in case of errors) - wandb_logger.watch(model, log_graph=False) - - The `watch` method adds hooks to the model which can be removed at the end of training: - - .. code-block:: python - - wandb_logger.unwatch(model) - - **Log model checkpoints** - - Log model checkpoints at the end of training: - - .. code-block:: python - - wandb_logger = WandbLogger(log_model=True) - - Log model checkpoints as they get created during training: - - .. code-block:: python - - wandb_logger = WandbLogger(log_model="all") - - Custom checkpointing can be set up through :class:`~pytorch_lightning.callbacks.ModelCheckpoint`: - - .. code-block:: python - - # log model only if `val_accuracy` increases - wandb_logger = WandbLogger(log_model="all") - checkpoint_callback = ModelCheckpoint(monitor="val_accuracy", mode="max") - trainer = Trainer(logger=wandb_logger, callbacks=[checkpoint_callback]) - - `latest` and `best` aliases are automatically set to easily retrieve a model checkpoint: - - .. code-block:: python - - # reference can be retrieved in artifacts panel - # "VERSION" can be a version (ex: "v2") or an alias ("latest or "best") - checkpoint_reference = "USER/PROJECT/MODEL-RUN_ID:VERSION" - - # download checkpoint locally (if not already cached) - run = wandb.init(project="MNIST") - artifact = run.use_artifact(checkpoint_reference, type="model") - artifact_dir = artifact.download() - - # load checkpoint - model = LitModule.load_from_checkpoint(Path(artifact_dir) / "model.ckpt") - - **Log media** - - Log text with: - - .. 
code-block:: python - - # using columns and data - columns = ["input", "label", "prediction"] - data = [["cheese", "english", "english"], ["fromage", "french", "spanish"]] - wandb_logger.log_text(key="samples", columns=columns, data=data) - - # using a pandas DataFrame - wandb_logger.log_text(key="samples", dataframe=my_dataframe) - - Log images with: - - .. code-block:: python - - # using tensors, numpy arrays or PIL images - wandb_logger.log_image(key="samples", images=[img1, img2]) - - # adding captions - wandb_logger.log_image(key="samples", images=[img1, img2], caption=["tree", "person"]) - - # using file path - wandb_logger.log_image(key="samples", images=["img_1.jpg", "img_2.jpg"]) - - More arguments can be passed for logging segmentation masks and bounding boxes. Refer to - `Image Overlays documentation <https://docs.wandb.ai/guides/track/log/media#image-overlays>`_. - - **Log Tables** - - `W&B Tables <https://docs.wandb.ai/guides/data-vis>`_ can be used to log, query and analyze tabular data. - - They support any type of media (text, image, video, audio, molecule, html, etc) and are great for storing, - understanding and sharing any form of data, from datasets to model predictions. - - .. code-block:: python - - columns = ["caption", "image", "sound"] - data = [["cheese", wandb.Image(img_1), wandb.Audio(snd_1)], ["wine", wandb.Image(img_2), wandb.Audio(snd_2)]] - wandb_logger.log_table(key="samples", columns=columns, data=data) - - See Also: - - `Demo in Google Colab <http://wandb.me/lightning>`__ with hyperparameter search and model logging - - `W&B Documentation <https://docs.wandb.ai/integrations/lightning>`__ - - Args: - name: Display name for the run. - save_dir: Path where data is saved (wandb dir by default). - offline: Run offline (data can be streamed later to wandb servers). - id: Sets the version, mainly used to resume a previous run. - version: Same as id. - anonymous: Enables or explicitly disables anonymous logging. 
- project: The name of the project to which this run will belong. - log_model: Log checkpoints created by :class:`~pytorch_lightning.callbacks.model_checkpoint.ModelCheckpoint` - as W&B artifacts. `latest` and `best` aliases are automatically set. - - * if ``log_model == 'all'``, checkpoints are logged during training. - * if ``log_model == True``, checkpoints are logged at the end of training, except when - :paramref:`~pytorch_lightning.callbacks.model_checkpoint.ModelCheckpoint.save_top_k` ``== -1`` - which also logs every checkpoint during training. - * if ``log_model == False`` (default), no checkpoint is logged. - - prefix: A string to put at the beginning of metric keys. - experiment: WandB experiment object. Automatically set when creating a run. - \**kwargs: Arguments passed to :func:`wandb.init` like `entity`, `group`, `tags`, etc. - - Raises: - ModuleNotFoundError: - If required WandB package is not installed on the device. - MisconfigurationException: - If both ``log_model`` and ``offline`` is set to ``True``. - - """ - - LOGGER_JOIN_CHAR = "-" - - def __init__( - self, - name: Optional[str] = None, - save_dir: Optional[str] = None, - offline: Optional[bool] = False, - id: Optional[str] = None, - anonymous: Optional[bool] = None, - version: Optional[str] = None, - project: Optional[str] = None, - log_model: Union[str, bool] = False, - experiment=None, - prefix: Optional[str] = "", - agg_key_funcs: Optional[Mapping[str, Callable[[Sequence[float]], float]]] = None, - agg_default_func: Optional[Callable[[Sequence[float]], float]] = None, - **kwargs, - ): - if wandb is None: - raise ModuleNotFoundError( - "You want to use `wandb` logger which is not installed yet," - " install it with `pip install wandb`." 
# pragma: no-cover - ) - - if offline and log_model: - raise MisconfigurationException( - f"Providing log_model={log_model} and offline={offline} is an invalid configuration" - " since model checkpoints cannot be uploaded in offline mode.\n" - "Hint: Set `offline=False` to log your model." - ) - - if log_model and not _WANDB_GREATER_EQUAL_0_10_22: - rank_zero_warn( - f"Providing log_model={log_model} requires wandb version >= 0.10.22" - " for logging associated model metadata.\n" - "Hint: Upgrade with `pip install --upgrade wandb`." - ) - - super().__init__(agg_key_funcs=agg_key_funcs, agg_default_func=agg_default_func) - self._offline = offline - self._log_model = log_model - self._prefix = prefix - self._experiment = experiment - self._logged_model_time = {} - self._checkpoint_callback = None - # set wandb init arguments - anonymous_lut = {True: "allow", False: None} - self._wandb_init = dict( - name=name, - project=project, - id=version or id, - dir=save_dir, - resume="allow", - anonymous=anonymous_lut.get(anonymous, anonymous), - ) - self._wandb_init.update(**kwargs) - # extract parameters - self._save_dir = self._wandb_init.get("dir") - self._name = self._wandb_init.get("name") - self._id = self._wandb_init.get("id") - # start wandb run (to create an attach_id for distributed modes) - if _WANDB_GREATER_EQUAL_0_12_10: - wandb.require("service") - _ = self.experiment - - def __getstate__(self): - state = self.__dict__.copy() - # args needed to reload correct experiment - if self._experiment is not None: - state["_id"] = getattr(self._experiment, "id", None) - state["_attach_id"] = getattr(self._experiment, "_attach_id", None) - state["_name"] = self._experiment.project_name() - - # cannot be pickled - state["_experiment"] = None - return state - - @property - @rank_zero_experiment - def experiment(self) -> Run: - r""" - - Actual wandb object. To use wandb features in your - :class:`~pytorch_lightning.core.lightning.LightningModule` do the following. 
- - Example:: - - .. code-block:: python - - self.logger.experiment.some_wandb_function() - - """ - if self._experiment is None: - if self._offline: - os.environ["WANDB_MODE"] = "dryrun" - - attach_id = getattr(self, "_attach_id", None) - if wandb.run is not None: - # wandb process already created in this instance - rank_zero_warn( - "There is a wandb run already in progress and newly created instances of `WandbLogger` will reuse" - " this run. If this is not desired, call `wandb.finish()` before instantiating `WandbLogger`." - ) - self._experiment = wandb.run - elif attach_id is not None and hasattr(wandb, "_attach"): - # attach to wandb process referenced - self._experiment = wandb._attach(attach_id) - else: - # create new wandb process - self._experiment = wandb.init(**self._wandb_init) - - # define default x-axis - if getattr(self._experiment, "define_metric", None): - self._experiment.define_metric("trainer/global_step") - self._experiment.define_metric("*", step_metric="trainer/global_step", step_sync=True) - - return self._experiment - - def watch(self, model: nn.Module, log: str = "gradients", log_freq: int = 100, log_graph: bool = True): - self.experiment.watch(model, log=log, log_freq=log_freq, log_graph=log_graph) - -
[docs] @rank_zero_only - def log_hyperparams(self, params: Union[Dict[str, Any], Namespace]) -> None: - params = _convert_params(params) - params = _flatten_dict(params) - params = _sanitize_callable_params(params) - self.experiment.config.update(params, allow_val_change=True)
- -
[docs] @rank_zero_only - def log_metrics(self, metrics: Dict[str, float], step: Optional[int] = None) -> None: - assert rank_zero_only.rank == 0, "experiment tried to log from global_rank != 0" - - metrics = _add_prefix(metrics, self._prefix, self.LOGGER_JOIN_CHAR) - if step is not None: - self.experiment.log({**metrics, "trainer/global_step": step}) - else: - self.experiment.log(metrics)
- -
[docs] @rank_zero_only - def log_table( - self, - key: str, - columns: List[str] = None, - data: List[List[Any]] = None, - dataframe: Any = None, - step: Optional[int] = None, - ) -> None: - """Log a Table containing any object type (text, image, audio, video, molecule, html, etc). - - Can be defined either with `columns` and `data` or with `dataframe`. - """ - - metrics = {key: wandb.Table(columns=columns, data=data, dataframe=dataframe)} - self.log_metrics(metrics, step)
- -
[docs] @rank_zero_only - def log_text( - self, - key: str, - columns: List[str] = None, - data: List[List[str]] = None, - dataframe: Any = None, - step: Optional[int] = None, - ) -> None: - """Log text as a Table. - - Can be defined either with `columns` and `data` or with `dataframe`. - """ - - self.log_table(key, columns, data, dataframe, step)
- -
[docs] @rank_zero_only - def log_image(self, key: str, images: List[Any], step: Optional[int] = None, **kwargs: str) -> None: - """Log images (tensors, numpy arrays, PIL Images or file paths). - - Optional kwargs are lists passed to each image (ex: caption, masks, boxes). - """ - if not isinstance(images, list): - raise TypeError(f'Expected a list as "images", found {type(images)}') - n = len(images) - for k, v in kwargs.items(): - if len(v) != n: - raise ValueError(f"Expected {n} items but only found {len(v)} for {k}") - kwarg_list = [{k: kwargs[k][i] for k in kwargs.keys()} for i in range(n)] - metrics = {key: [wandb.Image(img, **kwarg) for img, kwarg in zip(images, kwarg_list)]} - self.log_metrics(metrics, step)
- - @property - def save_dir(self) -> Optional[str]: - """Gets the save directory. - - Returns: - The path to the save directory. - """ - return self._save_dir - - @property - def name(self) -> Optional[str]: - """Gets the name of the experiment. - - Returns: - The name of the experiment if the experiment exists else the name given to the constructor. - """ - # don't create an experiment if we don't have one - return self._experiment.project_name() if self._experiment else self._name - - @property - def version(self) -> Optional[str]: - """Gets the id of the experiment. - - Returns: - The id of the experiment if the experiment exists else the id given to the constructor. - """ - # don't create an experiment if we don't have one - return self._experiment.id if self._experiment else self._id - -
[docs] def after_save_checkpoint(self, checkpoint_callback: "ReferenceType[ModelCheckpoint]") -> None: - # log checkpoints as artifacts - if self._log_model == "all" or self._log_model is True and checkpoint_callback.save_top_k == -1: - self._scan_and_log_checkpoints(checkpoint_callback) - elif self._log_model is True: - self._checkpoint_callback = checkpoint_callback
- -
[docs] @rank_zero_only - def finalize(self, status: str) -> None: - # log checkpoints as artifacts - if self._checkpoint_callback: - self._scan_and_log_checkpoints(self._checkpoint_callback)
- - def _scan_and_log_checkpoints(self, checkpoint_callback: "ReferenceType[ModelCheckpoint]") -> None: - # get checkpoints to be saved with associated score - checkpoints = { - checkpoint_callback.last_model_path: checkpoint_callback.current_score, - checkpoint_callback.best_model_path: checkpoint_callback.best_model_score, - **checkpoint_callback.best_k_models, - } - checkpoints = sorted((Path(p).stat().st_mtime, p, s) for p, s in checkpoints.items() if Path(p).is_file()) - checkpoints = [ - c for c in checkpoints if c[1] not in self._logged_model_time.keys() or self._logged_model_time[c[1]] < c[0] - ] - - # log iteratively all new checkpoints - for t, p, s in checkpoints: - metadata = ( - { - "score": s, - "original_filename": Path(p).name, - "ModelCheckpoint": { - k: getattr(checkpoint_callback, k) - for k in [ - "monitor", - "mode", - "save_last", - "save_top_k", - "save_weights_only", - "_every_n_train_steps", - ] - # ensure it does not break if `ModelCheckpoint` args change - if hasattr(checkpoint_callback, k) - }, - } - if _WANDB_GREATER_EQUAL_0_10_22 - else None - ) - artifact = wandb.Artifact(name=f"model-{self.experiment.id}", type="model", metadata=metadata) - artifact.add_file(p, name="model.ckpt") - aliases = ["latest", "best"] if p == checkpoint_callback.best_model_path else ["latest"] - self.experiment.log_artifact(artifact, aliases=aliases) - # remember logged models - timestamp needed in case filename didn't change (lastkckpt or custom name) - self._logged_model_time[p] = t
-
- -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- -
-
-
- -
-
-
-
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/_modules/pytorch_lightning/loops/base.html b/docs/_modules/pytorch_lightning/loops/base.html deleted file mode 100644 index b2f5283..0000000 --- a/docs/_modules/pytorch_lightning/loops/base.html +++ /dev/null @@ -1,1033 +0,0 @@ - - - - - - - - - - - - - pytorch_lightning.loops.base — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- - - - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -

Source code for pytorch_lightning.loops.base

-# Copyright The PyTorch Lightning team.
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#     http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-import inspect
-from abc import ABC, abstractmethod
-from typing import Any, Dict, Generic, Optional, Type, TypeVar, Union
-
-from deprecate import void
-from torchmetrics import Metric
-
-import pytorch_lightning as pl
-from pytorch_lightning.trainer.connectors.logger_connector.result import _ResultCollection
-from pytorch_lightning.trainer.progress import BaseProgress
-from pytorch_lightning.utilities.exceptions import MisconfigurationException
-from pytorch_lightning.utilities.imports import _fault_tolerant_training
-
-T = TypeVar("T")  # the output type of `run`
-
-
-class Loop(ABC, Generic[T]):
-    """Basic Loops interface. All classes derived from this must implement the following properties and methods:
-
-        * :attr:`done` (property): Condition to break the loop
-        * :attr:`reset` (method): Resets the internal state between multiple calls of :attr:`run`
-        * :attr:`advance` (method): Implements one step of the loop
-
-    This class implements the following loop structure:
-
-    .. code-block:: python
-
-        on_run_start()
-
-        while not done:
-            on_advance_start()
-            advance()
-            on_advance_end()
-
-        on_run_end()
-    """
-
-    def __init__(self) -> None:
-        self._restarting = False
-        self._trainer: Optional["pl.Trainer"] = None
-
-    @property
-    def trainer(self) -> "pl.Trainer":
-        if self._trainer is None:
-            raise RuntimeError("The loop is not attached to a Trainer.")
-        return self._trainer
-
-    @trainer.setter
-    def trainer(self, trainer: "pl.Trainer") -> None:
-        """Connects this loop's trainer and its children."""
-        if not isinstance(trainer, pl.Trainer):
-            raise MisconfigurationException(
-                f"Loop {self.__class__.__name__} should be connected to a `Trainer`, found: {trainer}."
-            )
-        self._trainer = trainer
-        for v in self.__dict__.values():
-            if isinstance(v, Loop):
-                v.trainer = trainer
-
-    @property
-    def restarting(self) -> bool:
-        """Whether the state of this loop was reloaded and it needs to restart."""
-        return self._restarting
-
-    @restarting.setter
-    def restarting(self, restarting: bool) -> None:
-        """Connects this loop's restarting value and its children."""
-        self._restarting = restarting
-        for loop in vars(self).values():
-            if isinstance(loop, Loop):
-                loop.restarting = restarting
-
-    @property
-    @abstractmethod
-    def done(self) -> bool:
-        """Property indicating when the loop is finished.
-
-        Example::
-
-            @property
-            def done(self):
-                return self.trainer.global_step >= self.trainer.max_steps
-        """
-
-    @property
-    def skip(self) -> bool:
-        """Determine whether to return immediately from the call to :meth:`run`.
-
-        Example::
-
-            @property
-            def skip(self):
-                return len(self.trainer.train_dataloader) == 0
-        """
-        return False
-
-    def connect(self, **kwargs: "Loop") -> None:
-        """Optionally connect one or multiple loops to this one.
-
-        Linked loops should form a tree.
-        """
-
-    def replace(self, **loops: Union["Loop", Type["Loop"]]) -> None:
-        """Optionally replace one or multiple of this loop's sub-loops.
-
-        This methods takes care of instantiating the class (if necessary) with all existing arguments, connecting all
-        sub-loops of the old loop to the new instance, setting the ``Trainer`` reference, and connecting the new loop to
-        the parent.
-
-        Args:
-            **loops: ``Loop`` subclasses or instances. The name used should match the loop attribute name you want to
-                replace.
-
-        Raises:
-            MisconfigurationException: When passing a ``Loop`` class, if the ``__init__`` arguments do not match those
-                of the Loop class it replaces.
-        """
-        new_loops = {}
-
-        for name, type_or_object in loops.items():
-            old_loop = getattr(self, name)
-
-            if isinstance(type_or_object, type):
-                # compare the signatures
-                old_parameters = inspect.signature(old_loop.__class__.__init__).parameters
-                current_parameters = inspect.signature(type_or_object.__init__).parameters
-                if old_parameters != current_parameters:
-                    raise MisconfigurationException(
-                        f"`{self.__class__.__name__}.replace({type_or_object.__name__})` can only be used if the"
-                        f" `__init__` signatures match but `{old_loop.__class__.__name__}` does not."
-                    )
-                # instantiate the loop
-                kwargs = {p: getattr(old_loop, p) for p in old_parameters if p != "self"}
-                loop = type_or_object(**kwargs)
-            else:
-                loop = type_or_object
-
-            # connect sub-loops
-            kwargs = {n: l for n, l in old_loop.__dict__.items() if isinstance(l, Loop)}
-            loop.connect(**kwargs)
-            # set the trainer reference
-            loop.trainer = self.trainer
-
-            new_loops[name] = loop
-        # connect to self
-        self.connect(**new_loops)
-
-    def on_skip(self) -> T:
-        """The function to run when :meth:`run` should be skipped, determined by the condition in :attr:`skip`.
-
-        Returns:
-            the default output value of :meth:`on_run_end`
-        """
-
-
[docs] def run(self, *args: Any, **kwargs: Any) -> T: - """The main entry point to the loop. - - Will frequently check the :attr:`done` condition and calls :attr:`advance` - until :attr:`done` evaluates to ``True``. - - Override this if you wish to change the default behavior. The default implementation is: - - Example:: - - def run(self, *args, **kwargs): - if self.skip: - return self.on_skip() - - self.reset() - self.on_run_start(*args, **kwargs) - - while not self.done: - self.advance(*args, **kwargs) - - output = self.on_run_end() - return output - - Returns: - The output of :attr:`on_run_end` (often outputs collected from each step of the loop) - """ - if self.skip: - return self.on_skip() - - self.reset() - - self.on_run_start(*args, **kwargs) - - while not self.done: - try: - self.on_advance_start(*args, **kwargs) - self.advance(*args, **kwargs) - self.on_advance_end() - self._restarting = False - except StopIteration: - break - self._restarting = False - - output = self.on_run_end() - return output
- -
[docs] @abstractmethod - def reset(self) -> None: - """Resets the internal state of the loop at the beginning of each call to :attr:`run`. - - Example:: - - def reset(self): - # reset your internal state or add custom logic - # if you expect run() to be called multiple times - self.current_iteration = 0 - self.outputs = [] - """
- - def on_run_start(self, *args: Any, **kwargs: Any) -> None: - """Hook to be called as the first thing after entering :attr:`run` (except the state reset). - - Accepts all arguments passed to :attr:`run`. - """ - void(*args, **kwargs) - - def on_advance_start(self, *args: Any, **kwargs: Any) -> None: - """Hook to be called each time before :attr:`advance` is called. - - Accepts all arguments passed to :attr`run`. - """ - void(*args, **kwargs) - -
[docs] @abstractmethod - def advance(self, *args: Any, **kwargs: Any) -> None: - """Performs a single step. - - Accepts all arguments passed to :attr:`run`. - - Example:: - - def advance(self, iterator): - batch = next(iterator) - loss = self.trainer.lightning_module.training_step(batch, batch_idx) - ... - """
- - def on_advance_end(self) -> None: - """Hook to be called each time after :attr:`advance` is called.""" - - def on_run_end(self) -> T: - """Hook to be called at the end of the run. - - Its return argument is returned from :attr:`run`. - """ - - def teardown(self) -> None: - """Use to release memory etc.""" - - def on_save_checkpoint(self) -> Dict: - """Called when saving a model checkpoint, use to persist loop state. - - Returns: - The current loop state. - """ - return {} - - def on_load_checkpoint(self, state_dict: Dict) -> None: - """Called when loading a model checkpoint, use to reload loop state.""" - - def state_dict(self, destination: Optional[Dict] = None, prefix: str = "") -> Dict: - """The state dict is determined by the state and progress of this loop and all its children. - - Args: - destination: An existing dictionary to update with this loop's state. By default a new dictionary - is returned. - prefix: A prefix for each key in the state dictionary - """ - if destination is None: - destination = {} - - destination[prefix + "state_dict"] = self.on_save_checkpoint() - - # do not get the mode from `self.trainer` because it might not have been attached yet - ft_enabled = _fault_tolerant_training() - for k, v in self.__dict__.items(): - key = prefix + k - if isinstance(v, BaseProgress): - destination[key] = v.state_dict() - elif isinstance(v, Loop): - v.state_dict(destination, key + ".") - elif ft_enabled and isinstance(v, _ResultCollection): - # sync / unsync metrics - v.sync() - destination[key] = v.state_dict() - v.unsync() - - return destination - - def load_state_dict( - self, - state_dict: Dict, - prefix: str = "", - metrics: Optional[Dict[str, Metric]] = None, - ) -> None: - """Loads the state of this loop and all its children.""" - self._load_from_state_dict(state_dict.copy(), prefix, metrics) - for k, v in self.__dict__.items(): - if isinstance(v, Loop): - v.load_state_dict(state_dict.copy(), prefix + k + ".") - self.restarting = True - - def 
_load_from_state_dict(self, state_dict: Dict, prefix: str, metrics: Optional[Dict[str, Metric]] = None) -> None: - for k, v in self.__dict__.items(): - key = prefix + k - if key not in state_dict: - # compatibility with old checkpoints - continue - - if isinstance(v, BaseProgress): - v.load_state_dict(state_dict[key]) - elif ( - isinstance(v, _ResultCollection) - and self.trainer is not None - and self.trainer.lightning_module is not None - ): - metric_attributes = { - name: module - for name, module in self.trainer.lightning_module.named_modules() - if isinstance(module, Metric) - } - if metrics: - metric_attributes.update(metrics) - - # The `_ResultCollection` objects have 2 types of metrics: `Tensor` and `torchmetrics.Metric`. - # When creating a checkpoint, the `Metric`s are dropped from the loop `state_dict` to serialize only - # Python primitives. However, their states are saved with the model's `state_dict`. - # On reload, we need to re-attach the `Metric`s back to the `_ResultCollection`. - # The references are provided through the `metric_attributes` dictionary. - v.load_state_dict(state_dict[key], metrics=metric_attributes, sync_fn=self.trainer.strategy.reduce) - - if not self.trainer.is_global_zero: - v.reset(metrics=False) - - if prefix + "state_dict" in state_dict: # compatibility with old checkpoints - self.on_load_checkpoint(state_dict[prefix + "state_dict"]) -
- -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- -
-
-
- -
-
-
-
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/_modules/pytorch_lightning/trainer/trainer.html b/docs/_modules/pytorch_lightning/trainer/trainer.html deleted file mode 100644 index a83010b..0000000 --- a/docs/_modules/pytorch_lightning/trainer/trainer.html +++ /dev/null @@ -1,3544 +0,0 @@ - - - - - - - - - - - - - pytorch_lightning.trainer.trainer — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- - - - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -

Source code for pytorch_lightning.trainer.trainer

-# Copyright The PyTorch Lightning team.
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#     http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-"""Trainer to automate the training."""
-import inspect
-import logging
-import math
-import os
-import traceback
-import warnings
-from argparse import ArgumentParser, Namespace
-from copy import deepcopy
-from datetime import timedelta
-from pathlib import Path
-from typing import Any, Callable, cast, Dict, Iterable, List, Optional, Type, Union
-from weakref import proxy
-
-import torch
-from packaging.version import Version
-from torch.optim import Optimizer
-from torch.utils.data import DataLoader
-
-import pytorch_lightning as pl
-from pytorch_lightning.accelerators import Accelerator, GPUAccelerator, HPUAccelerator, IPUAccelerator, TPUAccelerator
-from pytorch_lightning.callbacks import Callback, EarlyStopping, ModelCheckpoint, ProgressBarBase
-from pytorch_lightning.callbacks.prediction_writer import BasePredictionWriter
-from pytorch_lightning.core.datamodule import LightningDataModule
-from pytorch_lightning.core.optimizer import LightningOptimizer
-from pytorch_lightning.loggers import LightningLoggerBase
-from pytorch_lightning.loggers.base import DummyLogger, LoggerCollection
-from pytorch_lightning.loggers.tensorboard import TensorBoardLogger
-from pytorch_lightning.loops import PredictionLoop, TrainingEpochLoop
-from pytorch_lightning.loops.dataloader.evaluation_loop import EvaluationLoop
-from pytorch_lightning.loops.fit_loop import FitLoop
-from pytorch_lightning.loops.utilities import _parse_loop_limits, _reset_progress
-from pytorch_lightning.plugins import (
-    ApexMixedPrecisionPlugin,
-    NativeMixedPrecisionPlugin,
-    PLUGIN_INPUT,
-    PrecisionPlugin,
-)
-from pytorch_lightning.plugins.environments.slurm_environment import SLURMEnvironment
-from pytorch_lightning.profiler import (
-    AdvancedProfiler,
-    BaseProfiler,
-    PassThroughProfiler,
-    Profiler,
-    PyTorchProfiler,
-    SimpleProfiler,
-    XLAProfiler,
-)
-from pytorch_lightning.strategies import ParallelStrategy, Strategy
-from pytorch_lightning.strategies.ddp_spawn import DDPSpawnStrategy
-from pytorch_lightning.trainer.callback_hook import TrainerCallbackHookMixin
-from pytorch_lightning.trainer.configuration_validator import verify_loop_configurations
-from pytorch_lightning.trainer.connectors.accelerator_connector import AcceleratorConnector
-from pytorch_lightning.trainer.connectors.callback_connector import CallbackConnector
-from pytorch_lightning.trainer.connectors.checkpoint_connector import CheckpointConnector
-from pytorch_lightning.trainer.connectors.data_connector import DataConnector
-from pytorch_lightning.trainer.connectors.logger_connector import LoggerConnector
-from pytorch_lightning.trainer.connectors.logger_connector.result import _ResultCollection
-from pytorch_lightning.trainer.connectors.signal_connector import SignalConnector
-from pytorch_lightning.trainer.data_loading import TrainerDataLoadingMixin
-from pytorch_lightning.trainer.optimizers import TrainerOptimizersMixin
-from pytorch_lightning.trainer.states import RunningStage, TrainerFn, TrainerState, TrainerStatus
-from pytorch_lightning.trainer.supporters import CombinedLoader
-from pytorch_lightning.tuner.lr_finder import _LRFinder
-from pytorch_lightning.tuner.tuning import Tuner
-from pytorch_lightning.utilities import (
-    _HPU_AVAILABLE,
-    _IPU_AVAILABLE,
-    _TPU_AVAILABLE,
-    AMPType,
-    GradClipAlgorithmType,
-    parsing,
-)
-from pytorch_lightning.utilities.apply_func import apply_to_collection
-from pytorch_lightning.utilities.argparse import (
-    _defaults_from_env_vars,
-    add_argparse_args,
-    from_argparse_args,
-    parse_argparser,
-    parse_env_variables,
-)
-from pytorch_lightning.utilities.auto_restart import _add_capture_metadata_collate
-from pytorch_lightning.utilities.cloud_io import get_filesystem
-from pytorch_lightning.utilities.data import _auto_add_worker_init_fn, has_len_all_ranks
-from pytorch_lightning.utilities.distributed import distributed_available
-from pytorch_lightning.utilities.exceptions import ExitGracefullyException, MisconfigurationException
-from pytorch_lightning.utilities.imports import _fault_tolerant_training
-from pytorch_lightning.utilities.meta import is_on_meta_device, materialize_module
-from pytorch_lightning.utilities.model_helpers import is_overridden
-from pytorch_lightning.utilities.rank_zero import rank_zero_deprecation, rank_zero_info, rank_zero_warn
-from pytorch_lightning.utilities.seed import isolate_rng
-from pytorch_lightning.utilities.signature_utils import is_param_in_hook_signature
-from pytorch_lightning.utilities.types import (
-    _EVALUATE_OUTPUT,
-    _PATH,
-    _PREDICT_OUTPUT,
-    EVAL_DATALOADERS,
-    LRSchedulerConfig,
-    STEP_OUTPUT,
-    TRAIN_DATALOADERS,
-)
-from pytorch_lightning.utilities.warnings import PossibleUserWarning
-
-log = logging.getLogger(__name__)
-# warnings to ignore in trainer
-warnings.filterwarnings(
-    "ignore", message="torch.distributed.reduce_op is deprecated, please use torch.distributed.ReduceOp instead"
-)
-
-
-class Trainer(
-    TrainerCallbackHookMixin,  # TODO: Remove in v1.8
-    TrainerOptimizersMixin,  # TODO: Remove in v1.8
-    TrainerDataLoadingMixin,  # TODO: Remove in v1.8
-):
-
[docs] @_defaults_from_env_vars - def __init__( - self, - logger: Union[LightningLoggerBase, Iterable[LightningLoggerBase], bool] = True, - checkpoint_callback: Optional[bool] = None, - enable_checkpointing: bool = True, - callbacks: Optional[Union[List[Callback], Callback]] = None, - default_root_dir: Optional[str] = None, - gradient_clip_val: Optional[Union[int, float]] = None, - gradient_clip_algorithm: Optional[str] = None, - process_position: int = 0, - num_nodes: int = 1, - num_processes: Optional[int] = None, - devices: Optional[Union[List[int], str, int]] = None, - gpus: Optional[Union[List[int], str, int]] = None, - auto_select_gpus: bool = False, - tpu_cores: Optional[Union[List[int], str, int]] = None, - ipus: Optional[int] = None, - log_gpu_memory: Optional[str] = None, # TODO: Remove in 1.7 - progress_bar_refresh_rate: Optional[int] = None, # TODO: remove in v1.7 - enable_progress_bar: bool = True, - overfit_batches: Union[int, float] = 0.0, - track_grad_norm: Union[int, float, str] = -1, - check_val_every_n_epoch: int = 1, - fast_dev_run: Union[int, bool] = False, - accumulate_grad_batches: Optional[Union[int, Dict[int, int]]] = None, - max_epochs: Optional[int] = None, - min_epochs: Optional[int] = None, - max_steps: int = -1, - min_steps: Optional[int] = None, - max_time: Optional[Union[str, timedelta, Dict[str, int]]] = None, - limit_train_batches: Optional[Union[int, float]] = None, - limit_val_batches: Optional[Union[int, float]] = None, - limit_test_batches: Optional[Union[int, float]] = None, - limit_predict_batches: Optional[Union[int, float]] = None, - val_check_interval: Optional[Union[int, float]] = None, - flush_logs_every_n_steps: Optional[int] = None, - log_every_n_steps: int = 50, - accelerator: Optional[Union[str, Accelerator]] = None, - strategy: Optional[Union[str, Strategy]] = None, - sync_batchnorm: bool = False, - precision: Union[int, str] = 32, - enable_model_summary: bool = True, - weights_summary: Optional[str] = "top", - 
weights_save_path: Optional[str] = None, # TODO: Remove in 1.8 - num_sanity_val_steps: int = 2, - resume_from_checkpoint: Optional[Union[Path, str]] = None, - profiler: Optional[Union[BaseProfiler, str]] = None, - benchmark: Optional[bool] = None, - deterministic: bool = False, - reload_dataloaders_every_n_epochs: int = 0, - auto_lr_find: Union[bool, str] = False, - replace_sampler_ddp: bool = True, - detect_anomaly: bool = False, - auto_scale_batch_size: Union[str, bool] = False, - prepare_data_per_node: Optional[bool] = None, - plugins: Optional[Union[PLUGIN_INPUT, List[PLUGIN_INPUT]]] = None, - amp_backend: str = "native", - amp_level: Optional[str] = None, - move_metrics_to_cpu: bool = False, - multiple_trainloader_mode: str = "max_size_cycle", - stochastic_weight_avg: bool = False, - terminate_on_nan: Optional[bool] = None, - ) -> None: - r""" - Customize every aspect of training via flags. - - Args: - - accelerator: Supports passing different accelerator types ("cpu", "gpu", "tpu", "ipu", "hpu", "auto") - as well as custom accelerator instances. - - .. deprecated:: v1.5 - Passing training strategies (e.g., 'ddp') to ``accelerator`` has been deprecated in v1.5.0 - and will be removed in v1.7.0. Please use the ``strategy`` argument instead. - - accumulate_grad_batches: Accumulates grads every k batches or as set up in the dict. - Default: ``None``. - - amp_backend: The mixed precision backend to use ("native" or "apex"). - Default: ``'native''``. - - amp_level: The optimization level to use (O1, O2, etc...). By default it will be set to "O2" - if ``amp_backend`` is set to "apex". - - auto_lr_find: If set to True, will make trainer.tune() run a learning rate finder, - trying to optimize initial learning for faster convergence. trainer.tune() method will - set the suggested learning rate in self.lr or self.learning_rate in the LightningModule. - To use a different key set a string instead of True with the key name. - Default: ``False``. 
- - auto_scale_batch_size: If set to True, will `initially` run a batch size - finder trying to find the largest batch size that fits into memory. - The result will be stored in self.batch_size in the LightningModule. - Additionally, can be set to either `power` that estimates the batch size through - a power search or `binsearch` that estimates the batch size through a binary search. - Default: ``False``. - - auto_select_gpus: If enabled and ``gpus`` or ``devices`` is an integer, pick available - gpus automatically. This is especially useful when - GPUs are configured to be in "exclusive mode", such - that only one process at a time can access them. - Default: ``False``. - - benchmark: Sets ``torch.backends.cudnn.benchmark``. - Defaults to ``True`` if :paramref:`~pytorch_lightning.trainer.trainer.Trainer.deterministic` - is ``False``. Overwrite to manually set a different value. Default: ``None``. - - callbacks: Add a callback or list of callbacks. - Default: ``None``. - - checkpoint_callback: If ``True``, enable checkpointing. - Default: ``None``. - - .. deprecated:: v1.5 - ``checkpoint_callback`` has been deprecated in v1.5 and will be removed in v1.7. - Please consider using ``enable_checkpointing`` instead. - - enable_checkpointing: If ``True``, enable checkpointing. - It will configure a default ModelCheckpoint callback if there is no user-defined ModelCheckpoint in - :paramref:`~pytorch_lightning.trainer.trainer.Trainer.callbacks`. - Default: ``True``. - - check_val_every_n_epoch: Check val every n train epochs. - Default: ``1``. - - - default_root_dir: Default path for logs and weights when no logger/ckpt_callback passed. - Default: ``os.getcwd()``. - Can be remote file paths such as `s3://mybucket/path` or 'hdfs://path/' - - detect_anomaly: Enable anomaly detection for the autograd engine. - Default: ``False``. - - deterministic: If ``True``, sets whether PyTorch operations must use deterministic algorithms. - Default: ``False``. 
- - devices: Will be mapped to either `gpus`, `tpu_cores`, `num_processes` or `ipus`, - based on the accelerator type. - - fast_dev_run: Runs n if set to ``n`` (int) else 1 if set to ``True`` batch(es) - of train, val and test to find any bugs (ie: a sort of unit test). - Default: ``False``. - - flush_logs_every_n_steps: How often to flush logs to disk (defaults to every 100 steps). - - .. deprecated:: v1.5 - ``flush_logs_every_n_steps`` has been deprecated in v1.5 and will be removed in v1.7. - Please configure flushing directly in the logger instead. - - gpus: Number of GPUs to train on (int) or which GPUs to train on (list or str) applied per node - Default: ``None``. - - gradient_clip_val: The value at which to clip gradients. Passing ``gradient_clip_val=None`` disables - gradient clipping. If using Automatic Mixed Precision (AMP), the gradients will be unscaled before. - Default: ``None``. - - gradient_clip_algorithm: The gradient clipping algorithm to use. Pass ``gradient_clip_algorithm="value"`` - to clip by value, and ``gradient_clip_algorithm="norm"`` to clip by norm. By default it will - be set to ``"norm"``. - - limit_train_batches: How much of training dataset to check (float = fraction, int = num_batches). - Default: ``1.0``. - - limit_val_batches: How much of validation dataset to check (float = fraction, int = num_batches). - Default: ``1.0``. - - limit_test_batches: How much of test dataset to check (float = fraction, int = num_batches). - Default: ``1.0``. - - limit_predict_batches: How much of prediction dataset to check (float = fraction, int = num_batches). - Default: ``1.0``. - - logger: Logger (or iterable collection of loggers) for experiment tracking. A ``True`` value uses - the default ``TensorBoardLogger``. ``False`` will disable logging. If multiple loggers are - provided and the `save_dir` property of that logger is not set, local files (checkpoints, - profiler traces, etc.) 
are saved in ``default_root_dir`` rather than in the ``log_dir`` of any - of the individual loggers. - Default: ``True``. - - log_gpu_memory: None, 'min_max', 'all'. Might slow performance. - - .. deprecated:: v1.5 - Deprecated in v1.5.0 and will be removed in v1.7.0 - Please use the ``DeviceStatsMonitor`` callback directly instead. - - log_every_n_steps: How often to log within steps. - Default: ``50``. - - prepare_data_per_node: If True, each LOCAL_RANK=0 will call prepare data. - Otherwise only NODE_RANK=0, LOCAL_RANK=0 will prepare data - - .. deprecated:: v1.5 - Deprecated in v1.5.0 and will be removed in v1.7.0 - Please set ``prepare_data_per_node`` in ``LightningDataModule`` and/or - ``LightningModule`` directly instead. - - process_position: Orders the progress bar when running multiple models on same machine. - - .. deprecated:: v1.5 - ``process_position`` has been deprecated in v1.5 and will be removed in v1.7. - Please pass :class:`~pytorch_lightning.callbacks.progress.TQDMProgressBar` with ``process_position`` - directly to the Trainer's ``callbacks`` argument instead. - - progress_bar_refresh_rate: How often to refresh progress bar (in steps). Value ``0`` disables progress bar. - Ignored when a custom progress bar is passed to :paramref:`~Trainer.callbacks`. Default: None, means - a suitable value will be chosen based on the environment (terminal, Google COLAB, etc.). - - .. deprecated:: v1.5 - ``progress_bar_refresh_rate`` has been deprecated in v1.5 and will be removed in v1.7. - Please pass :class:`~pytorch_lightning.callbacks.progress.TQDMProgressBar` with ``refresh_rate`` - directly to the Trainer's ``callbacks`` argument instead. To disable the progress bar, - pass ``enable_progress_bar = False`` to the Trainer. - - enable_progress_bar: Whether to enable to progress bar by default. - Default: ``False``. - - profiler: To profile individual steps during training and assist in identifying bottlenecks. - Default: ``None``. 
- - overfit_batches: Overfit a fraction of training data (float) or a set number of batches (int). - Default: ``0.0``. - - plugins: Plugins allow modification of core behavior like ddp and amp, and enable custom lightning plugins. - Default: ``None``. - - precision: Double precision (64), full precision (32), half precision (16) or bfloat16 precision (bf16). - Can be used on CPU, GPU, TPUs, HPUs or IPUs. - Default: ``32``. - - max_epochs: Stop training once this number of epochs is reached. Disabled by default (None). - If both max_epochs and max_steps are not specified, defaults to ``max_epochs = 1000``. - To enable infinite training, set ``max_epochs = -1``. - - min_epochs: Force training for at least these many epochs. Disabled by default (None). - - max_steps: Stop training after this number of steps. Disabled by default (-1). If ``max_steps = -1`` - and ``max_epochs = None``, will default to ``max_epochs = 1000``. To enable infinite training, set - ``max_epochs`` to ``-1``. - - min_steps: Force training for at least these number of steps. Disabled by default (``None``). - - max_time: Stop training after this amount of time has passed. Disabled by default (``None``). - The time duration can be specified in the format DD:HH:MM:SS (days, hours, minutes seconds), as a - :class:`datetime.timedelta`, or a dictionary with keys that will be passed to - :class:`datetime.timedelta`. - - num_nodes: Number of GPU nodes for distributed training. - Default: ``1``. - - num_processes: Number of processes for distributed training with ``accelerator="cpu"``. - Default: ``1``. - - num_sanity_val_steps: Sanity check runs n validation batches before starting the training routine. - Set it to `-1` to run all batches in all validation dataloaders. - Default: ``2``. - - reload_dataloaders_every_n_epochs: Set to a non-negative integer to reload dataloaders every n epochs. - Default: ``0``. - - replace_sampler_ddp: Explicitly enables or disables sampler replacement. 
If not specified this - will toggled automatically when DDP is used. By default it will add ``shuffle=True`` for - train sampler and ``shuffle=False`` for val/test sampler. If you want to customize it, - you can set ``replace_sampler_ddp=False`` and add your own distributed sampler. - - resume_from_checkpoint: Path/URL of the checkpoint from which training is resumed. If there is - no checkpoint file at the path, an exception is raised. If resuming from mid-epoch checkpoint, - training will start from the beginning of the next epoch. - - .. deprecated:: v1.5 - ``resume_from_checkpoint`` is deprecated in v1.5 and will be removed in v2.0. - Please pass the path to ``Trainer.fit(..., ckpt_path=...)`` instead. - - strategy: Supports different training strategies with aliases - as well custom strategies. - Default: ``None``. - - sync_batchnorm: Synchronize batch norm layers between process groups/whole world. - Default: ``False``. - - terminate_on_nan: If set to True, will terminate training (by raising a `ValueError`) at the - end of each training batch, if any of the parameters or the loss are NaN or +/-inf. - - .. deprecated:: v1.5 - Trainer argument ``terminate_on_nan`` was deprecated in v1.5 and will be removed in 1.7. - Please use ``detect_anomaly`` instead. - - detect_anomaly: Enable anomaly detection for the autograd engine. - Default: ``False``. - - tpu_cores: How many TPU cores to train on (1 or 8) / Single TPU to train on (1) - Default: ``None``. - - ipus: How many IPUs to train on. - Default: ``None``. - - track_grad_norm: -1 no tracking. Otherwise tracks that p-norm. May be set to 'inf' infinity-norm. If using - Automatic Mixed Precision (AMP), the gradients will be unscaled before logging them. - Default: ``-1``. - - val_check_interval: How often to check the validation set. Pass a ``float`` in the range [0.0, 1.0] to check - after a fraction of the training epoch. Pass an ``int`` to check after a fixed number of training - batches. - Default: ``1.0``. 
- - enable_model_summary: Whether to enable model summarization by default. - Default: ``True``. - - weights_summary: Prints a summary of the weights when training begins. - - .. deprecated:: v1.5 - ``weights_summary`` has been deprecated in v1.5 and will be removed in v1.7. - To disable the summary, pass ``enable_model_summary = False`` to the Trainer. - To customize the summary, pass :class:`~pytorch_lightning.callbacks.model_summary.ModelSummary` - directly to the Trainer's ``callbacks`` argument. - - weights_save_path: Where to save weights if specified. Will override default_root_dir - for checkpoints only. Use this if for whatever reason you need the checkpoints - stored in a different place than the logs written in `default_root_dir`. - Can be remote file paths such as `s3://mybucket/path` or 'hdfs://path/' - Defaults to `default_root_dir`. - - .. deprecated:: v1.6 - ``weights_save_path`` has been deprecated in v1.6 and will be removed in v1.8. Please pass - ``dirpath`` directly to the :class:`~pytorch_lightning.callbacks.model_checkpoint.ModelCheckpoint` - callback. - - move_metrics_to_cpu: Whether to force internal logged metrics to be moved to cpu. - This can save some gpu memory, but can make training slower. Use with attention. - Default: ``False``. - - multiple_trainloader_mode: How to loop over the datasets when there are multiple train loaders. - In 'max_size_cycle' mode, the trainer ends one epoch when the largest dataset is traversed, - and smaller datasets reload when running out of their data. In 'min_size' mode, all the datasets - reload when reaching the minimum length of datasets. - Default: ``"max_size_cycle"``. - - stochastic_weight_avg: Whether to use `Stochastic Weight Averaging (SWA) - <https://pytorch.org/blog/pytorch-1.6-now-includes-stochastic-weight-averaging/>`_. - Default: ``False``. - - .. deprecated:: v1.5 - ``stochastic_weight_avg`` has been deprecated in v1.5 and will be removed in v1.7. 
- Please pass :class:`~pytorch_lightning.callbacks.stochastic_weight_avg.StochasticWeightAveraging` - directly to the Trainer's ``callbacks`` argument instead. - """ - super().__init__() - Trainer._log_api_event("init") - log.detail(f"{self.__class__.__name__}: Initializing trainer with parameters: {locals()}") - self.state = TrainerState() - - # init connectors - self._data_connector = DataConnector(self, multiple_trainloader_mode) - - self._accelerator_connector = AcceleratorConnector( - num_processes=num_processes, - devices=devices, - tpu_cores=tpu_cores, - ipus=ipus, - accelerator=accelerator, - strategy=strategy, - gpus=gpus, - num_nodes=num_nodes, - sync_batchnorm=sync_batchnorm, - benchmark=benchmark, - replace_sampler_ddp=replace_sampler_ddp, - deterministic=deterministic, - auto_select_gpus=auto_select_gpus, - precision=precision, - amp_type=amp_backend, - amp_level=amp_level, - plugins=plugins, - ) - self._logger_connector = LoggerConnector(self, log_gpu_memory) - self._callback_connector = CallbackConnector(self) - self._checkpoint_connector = CheckpointConnector(self, resume_from_checkpoint) - self._signal_connector = SignalConnector(self) - self.tuner = Tuner(self) - - min_steps, max_steps, min_epochs, max_epochs, max_time = _parse_loop_limits( - min_steps, max_steps, min_epochs, max_epochs, max_time - ) - fit_loop = FitLoop(min_epochs=min_epochs, max_epochs=max_epochs) - training_epoch_loop = TrainingEpochLoop(min_steps=min_steps, max_steps=max_steps) - fit_loop.connect(epoch_loop=training_epoch_loop) - - # default .fit() loop - self.fit_loop = fit_loop - - # default .validate() loop - self.validate_loop = EvaluationLoop() - - # default .test() loop - self.test_loop = EvaluationLoop() - - # default .predict() loop - self.predict_loop = PredictionLoop() - - # set when a checkpoint is loaded via `Trainer.{fit,validate,test,predict}`. - self._ckpt_path: Optional[str] = None - - # .validate(), predict() and .test() set these when they load a checkpoint. 
They will be removed in favor of - # the unified read-only `Trainer.ckpt_path` attribute in v1.8 - self._validated_ckpt_path: Optional[str] = None # TODO: remove in v1.8 - self._tested_ckpt_path: Optional[str] = None # TODO: remove in v1.8 - self._predicted_ckpt_path: Optional[str] = None # TODO: remove in v1.8 - - # todo: remove in v1.7 - self._weights_summary: Optional[str] = None - - # init callbacks - # Declare attributes to be set in _callback_connector on_trainer_init - self._callback_connector.on_trainer_init( - callbacks, - checkpoint_callback, - enable_checkpointing, - enable_progress_bar, - progress_bar_refresh_rate, - process_position, - default_root_dir, - weights_save_path, - enable_model_summary, - weights_summary, - stochastic_weight_avg, - max_time, - accumulate_grad_batches, - ) - - # hook - self._call_callback_hooks("on_init_start") - - # init data flags - self.check_val_every_n_epoch: int - self._data_connector.on_trainer_init( - check_val_every_n_epoch, - reload_dataloaders_every_n_epochs, - prepare_data_per_node, - ) - - if terminate_on_nan is not None: - rank_zero_deprecation( - "Trainer argument `terminate_on_nan` was deprecated in v1.5 and will be removed in 1.7." - " Please use `Trainer(detect_anomaly=True)` instead." - ) - if not isinstance(terminate_on_nan, bool): - raise TypeError(f"`terminate_on_nan` should be a bool, got {terminate_on_nan}.") - - # gradient clipping - if gradient_clip_val is not None and not isinstance(gradient_clip_val, (int, float)): - raise TypeError(f"`gradient_clip_val` should be an int or a float. Got {gradient_clip_val}.") - - if gradient_clip_algorithm is not None and not GradClipAlgorithmType.supported_type( - gradient_clip_algorithm.lower() - ): - raise MisconfigurationException( - f"`gradient_clip_algorithm` {gradient_clip_algorithm} is invalid. " - f"Allowed algorithms: {GradClipAlgorithmType.supported_types()}." 
- ) - - # gradient norm tracking - if track_grad_norm != -1 and not ( - (isinstance(track_grad_norm, (int, float)) or track_grad_norm == "inf") and float(track_grad_norm) > 0 - ): - raise MisconfigurationException( - f"`track_grad_norm` must be a positive number or 'inf' (infinity norm). Got {track_grad_norm}." - ) - - self._terminate_on_nan = terminate_on_nan - self.gradient_clip_val: Union[int, float] = gradient_clip_val - self.gradient_clip_algorithm: Optional[GradClipAlgorithmType] = ( - GradClipAlgorithmType(gradient_clip_algorithm.lower()) if gradient_clip_algorithm is not None else None - ) - self.track_grad_norm: float = float(track_grad_norm) - - self._detect_anomaly: bool = detect_anomaly - self._setup_on_init(num_sanity_val_steps) - - # configure tuner - self.tuner.on_trainer_init(auto_lr_find, auto_scale_batch_size) - - # configure profiler - self.__init_profiler(profiler) - - # init logger flags - self._loggers: List[LightningLoggerBase] - self._logger_connector.on_trainer_init(logger, flush_logs_every_n_steps, log_every_n_steps, move_metrics_to_cpu) - - # init debugging flags - self.val_check_interval: Union[int, float] - self._init_debugging_flags( - limit_train_batches, - limit_val_batches, - limit_test_batches, - limit_predict_batches, - val_check_interval, - overfit_batches, - fast_dev_run, - ) - - # Callback system - self._call_callback_hooks("on_init_end")
def _init_debugging_flags(
    self,
    limit_train_batches: Optional[Union[int, float]],
    limit_val_batches: Optional[Union[int, float]],
    limit_test_batches: Optional[Union[int, float]],
    limit_predict_batches: Optional[Union[int, float]],
    val_check_interval: Optional[Union[int, float]],
    overfit_batches: Union[int, float],
    fast_dev_run: Union[int, bool],
) -> None:
    """Store the batch-limiting / debugging options on the trainer.

    Args:
        limit_train_batches: requested limit for the training batches.
        limit_val_batches: requested limit for the validation batches.
        limit_test_batches: requested limit for the test batches.
        limit_predict_batches: requested limit for the prediction batches.
        val_check_interval: requested validation check interval.
        overfit_batches: requested amount of data to overfit on.
        fast_dev_run: ``True``/``False`` or a non-negative number of batches. When truthy it overrides
            every ``limit_*`` argument and ``val_check_interval``.

    Raises:
        MisconfigurationException: If ``fast_dev_run`` is a negative integer.
    """
    if isinstance(fast_dev_run, int) and fast_dev_run < 0:
        raise MisconfigurationException(
            f"fast_dev_run={fast_dev_run} is not a valid configuration. It should be >= 0."
        )

    # a value equal to 1 is stored as ``True``, used while logging
    self.fast_dev_run = True if fast_dev_run == 1 else fast_dev_run

    if fast_dev_run:
        num_batches = int(fast_dev_run)
        # every stage is capped to the same number of batches
        limit_train_batches = limit_val_batches = limit_test_batches = limit_predict_batches = num_batches
        self.fit_loop.max_steps = num_batches
        self.num_sanity_val_steps = 0
        self.fit_loop.max_epochs = 1
        val_check_interval = 1.0
        self.check_val_every_n_epoch = 1
        # configured loggers are swapped for a single dummy logger
        self.loggers = [DummyLogger()] if self.loggers else []

        rank_zero_info(
            "Running in fast_dev_run mode: will run a full train,"
            f" val, test and prediction loop using {num_batches} batch(es)."
        )

    # each value is passed through `_determine_batch_limits` under its own name, in this order
    requested = {
        "limit_train_batches": limit_train_batches,
        "limit_val_batches": limit_val_batches,
        "limit_test_batches": limit_test_batches,
        "limit_predict_batches": limit_predict_batches,
        "val_check_interval": val_check_interval,
        "overfit_batches": overfit_batches,
    }
    for flag_name, flag_value in requested.items():
        setattr(self, flag_name, _determine_batch_limits(flag_value, flag_name))
    self._determine_data_use_amount(self.overfit_batches)


def _determine_data_use_amount(self, overfit_batches: float) -> None:
    """Use less data for debugging purposes.

    When ``overfit_batches`` is positive it becomes the training batch limit and the validation
    batch limit is set to ``0``; otherwise nothing is changed.
    """
    if not overfit_batches > 0:
        return
    self.limit_train_batches = overfit_batches
    self.limit_val_batches = 0


def _setup_on_init(self, num_sanity_val_steps: int) -> None:
    """Reset the trainer's run state and dataloader bookkeeping attributes.

    Args:
        num_sanity_val_steps: number of sanity-check validation steps; ``-1`` is stored as infinity.
    """
    self._log_device_info()

    self.should_stop = False
    self.state = TrainerState()
    self.num_training_batches = float("inf")
    self.train_dataloader = None

    # ``-1`` is mapped to infinity, any other value is stored unchanged
    self.num_sanity_val_steps = float("inf") if num_sanity_val_steps == -1 else num_sanity_val_steps

    self.num_sanity_val_batches = []
    self.num_test_batches = []
    self.num_val_batches = []
    self.test_dataloaders = None
    self.val_dataloaders = None
    self._last_train_dl_reload_epoch = float("-inf")
    self._last_val_dl_reload_epoch = float("-inf")

    self.num_predict_batches = []


def _call_and_handle_interrupt(self, trainer_fn: Callable, *args: Any, **kwargs: Any) -> Any:
    r"""
    Run a trainer entry point with the shared error handling.

    Intended to be used only for the main trainer function entry points (fit, validate, test, predict),
    as all errors should funnel through them.

    Args:
        trainer_fn: one of (fit, validate, test, predict)
        *args: positional arguments to be passed to the `trainer_fn`
        **kwargs: keyword arguments to be passed to `trainer_fn`

    Returns:
        Whatever ``trainer_fn`` (or the strategy launcher wrapping it) returns. ``None`` when a
        ``KeyboardInterrupt`` was handled here; any other exception is re-raised after cleanup.
    """
    try:
        launcher = self.strategy.launcher
        if launcher is None:
            return trainer_fn(*args, **kwargs)
        # the launcher additionally receives the trainer as a keyword argument
        return launcher.launch(trainer_fn, *args, trainer=self, **kwargs)
    # TODO: treat KeyboardInterrupt as BaseException (delete the code below) in v1.7
    except KeyboardInterrupt as err:
        rank_zero_warn("Detected KeyboardInterrupt, attempting graceful shutdown...")
        # user could press Ctrl+c many times... only shutdown once
        if self.interrupted:
            return None
        self.state.status = TrainerStatus.INTERRUPTED
        self._call_callback_hooks("on_keyboard_interrupt")
        self._call_callback_hooks("on_exception", err)
    except BaseException as err:
        self.state.status = TrainerStatus.INTERRUPTED
        multi_process = distributed_available() and self.world_size > 1
        if multi_process:
            # try syncing remaining processes, kill otherwise
            self.strategy.reconciliate_processes(traceback.format_exc())
        self._call_callback_hooks("on_exception", err)
        self._teardown()
        # teardown might access the stage so we reset it after
        self.state.stage = None
        raise
def fit(
    self,
    model: "pl.LightningModule",
    train_dataloaders: Optional[Union[TRAIN_DATALOADERS, LightningDataModule]] = None,
    val_dataloaders: Optional[EVAL_DATALOADERS] = None,
    datamodule: Optional[LightningDataModule] = None,
    ckpt_path: Optional[str] = None,
) -> None:
    r"""
    Run the complete optimization routine for ``model``.

    Args:
        model: Model to fit.

        train_dataloaders: A collection of :class:`torch.utils.data.DataLoader` or a
            :class:`~pytorch_lightning.core.datamodule.LightningDataModule` specifying training samples.
            In the case of multiple dataloaders, please see this :ref:`section <multiple-dataloaders>`.

        val_dataloaders: A :class:`torch.utils.data.DataLoader` or a sequence of them specifying validation samples.

        ckpt_path: Path/URL of the checkpoint from which training is resumed. If there is
            no checkpoint file at the path, an exception is raised. If resuming from mid-epoch checkpoint,
            training will start from the beginning of the next epoch.

        datamodule: An instance of :class:`~pytorch_lightning.core.datamodule.LightningDataModule`.
    """
    # the strategy gets the model before the guarded entry point is invoked
    self.strategy.model = model
    impl_args = (model, train_dataloaders, val_dataloaders, datamodule, ckpt_path)
    self._call_and_handle_interrupt(self._fit_impl, *impl_args)
def _fit_impl(
    self,
    model: "pl.LightningModule",
    train_dataloaders: Optional[Union[TRAIN_DATALOADERS, LightningDataModule]] = None,
    val_dataloaders: Optional[EVAL_DATALOADERS] = None,
    datamodule: Optional[LightningDataModule] = None,
    ckpt_path: Optional[str] = None,
) -> None:
    """Set the trainer into the fitting state, attach the data, resolve the checkpoint and run.

    Takes the same arguments as :meth:`fit`, which passes it to ``_call_and_handle_interrupt``.

    Raises:
        MisconfigurationException: If dataloaders are passed together with a datamodule.
    """
    Trainer._log_api_event("fit")
    log.detail(f"{self.__class__.__name__}: trainer fit stage")

    self.state.fn = TrainerFn.FITTING
    self.state.status = TrainerStatus.RUNNING
    self.training = True
    # forget when the train/val dataloaders were last reloaded
    never_reloaded = float("-inf")
    self._last_train_dl_reload_epoch = never_reloaded
    self._last_val_dl_reload_epoch = never_reloaded

    # if a datamodule comes in as the second arg, then fix it for the user
    if isinstance(train_dataloaders, LightningDataModule):
        datamodule, train_dataloaders = train_dataloaders, None
    # If you supply a datamodule you can't supply train_dataloader or val_dataloaders
    loaders_given = train_dataloaders is not None or val_dataloaders is not None
    if loaders_given and datamodule is not None:
        raise MisconfigurationException(
            "You cannot pass `train_dataloader` or `val_dataloaders` to `trainer.fit(datamodule=...)`"
        )

    # links data to the trainer
    self._data_connector.attach_data(
        model,
        train_dataloaders=train_dataloaders,
        val_dataloaders=val_dataloaders,
        datamodule=datamodule,
    )

    # TODO: ckpt_path only in v2.0
    ckpt_path = ckpt_path or self.resume_from_checkpoint
    self._ckpt_path = self.__set_ckpt_path(
        ckpt_path,
        model_provided=True,
        model_connected=self.lightning_module is not None,
    )
    fit_results = self._run(model, ckpt_path=self.ckpt_path)

    assert self.state.stopped
    self.training = False
    return fit_results
def validate(
    self,
    model: Optional["pl.LightningModule"] = None,
    dataloaders: Optional[Union[EVAL_DATALOADERS, LightningDataModule]] = None,
    ckpt_path: Optional[str] = None,
    verbose: bool = True,
    datamodule: Optional[LightningDataModule] = None,
) -> _EVALUATE_OUTPUT:
    r"""
    Perform one evaluation epoch over the validation set.

    Args:
        model: The model to validate.

        dataloaders: A :class:`torch.utils.data.DataLoader` or a sequence of them,
            or a :class:`~pytorch_lightning.core.datamodule.LightningDataModule` specifying validation samples.

        ckpt_path: Either ``best`` or path to the checkpoint you wish to validate.
            If ``None`` and the model instance was passed, use the current weights.
            Otherwise, the best model checkpoint from the previous ``trainer.fit`` call will be loaded
            if a checkpoint callback is configured.

        verbose: If True, prints the validation results.

        datamodule: An instance of :class:`~pytorch_lightning.core.datamodule.LightningDataModule`.

    Returns:
        List of dictionaries with metrics logged during the validation phase, e.g., in model- or callback hooks
        like :meth:`~pytorch_lightning.core.lightning.LightningModule.validation_step`,
        :meth:`~pytorch_lightning.core.lightning.LightningModule.validation_epoch_end`, etc.
        The length of the list corresponds to the number of validation dataloaders used.
    """
    # Only fall back to the previously connected module when no model was passed at all.
    # A truthiness test (`model or ...`) would discard a passed model that evaluates to False,
    # e.g. one that defines `__len__` and is currently empty.
    self.strategy.model = model if model is not None else self.lightning_module
    return self._call_and_handle_interrupt(self._validate_impl, model, dataloaders, ckpt_path, verbose, datamodule)
def _validate_impl(
    self,
    model: Optional["pl.LightningModule"] = None,
    dataloaders: Optional[Union[EVAL_DATALOADERS, LightningDataModule]] = None,
    ckpt_path: Optional[str] = None,
    verbose: bool = True,
    datamodule: Optional[LightningDataModule] = None,
) -> _EVALUATE_OUTPUT:
    """Set the trainer into the validating state, attach the data, resolve the checkpoint and run.

    Takes the same arguments as :meth:`validate`, which passes it to ``_call_and_handle_interrupt``.

    Returns:
        The value returned by ``self._run``.

    Raises:
        MisconfigurationException: If both ``dataloaders`` and ``datamodule`` are given, or if no model
            was passed and none is connected to the trainer.
    """
    # --------------------
    # SETUP HOOK
    # --------------------
    Trainer._log_api_event("validate")
    log.detail(f"{self.__class__.__name__}: trainer validate stage")

    self.state.fn = TrainerFn.VALIDATING
    self.state.status = TrainerStatus.RUNNING
    self.validating = True

    # if a datamodule comes in as the second arg, then fix it for the user
    if isinstance(dataloaders, LightningDataModule):
        datamodule = dataloaders
        dataloaders = None
    # If you supply a datamodule you can't supply val_dataloaders.
    # Explicit `is not None` (as in `_fit_impl`) so the check does not depend on the datamodule's truth value.
    if dataloaders is not None and datamodule is not None:
        raise MisconfigurationException("You cannot pass both `trainer.validate(dataloaders=..., datamodule=...)`")

    model_provided = model is not None
    if not model_provided:
        # fall back to the connected module only when nothing was passed; a passed model that
        # evaluates to False must not be replaced while `model_provided` is True
        model = self.lightning_module
    if model is None:
        raise MisconfigurationException(
            "`model` must be provided to `trainer.validate()` when it hasn't been passed in a previous run"
        )

    self.validate_loop.verbose = verbose

    # links data to the trainer
    self._data_connector.attach_data(model, val_dataloaders=dataloaders, datamodule=datamodule)

    self._ckpt_path = self.__set_ckpt_path(
        ckpt_path, model_provided=model_provided, model_connected=self.lightning_module is not None
    )

    self._validated_ckpt_path = self.ckpt_path  # TODO: remove in v1.8

    # run validate
    results = self._run(model, ckpt_path=self.ckpt_path)

    assert self.state.stopped
    self.validating = False

    return results
def test(
    self,
    model: Optional["pl.LightningModule"] = None,
    dataloaders: Optional[Union[EVAL_DATALOADERS, LightningDataModule]] = None,
    ckpt_path: Optional[str] = None,
    verbose: bool = True,
    datamodule: Optional[LightningDataModule] = None,
) -> _EVALUATE_OUTPUT:
    r"""
    Perform one evaluation epoch over the test set.
    It's separated from fit to make sure you never run on your test set until you want to.

    Args:
        model: The model to test.

        dataloaders: A :class:`torch.utils.data.DataLoader` or a sequence of them,
            or a :class:`~pytorch_lightning.core.datamodule.LightningDataModule` specifying test samples.

        ckpt_path: Either ``best`` or path to the checkpoint you wish to test.
            If ``None`` and the model instance was passed, use the current weights.
            Otherwise, the best model checkpoint from the previous ``trainer.fit`` call will be loaded
            if a checkpoint callback is configured.

        verbose: If True, prints the test results.

        datamodule: An instance of :class:`~pytorch_lightning.core.datamodule.LightningDataModule`.

    Returns:
        List of dictionaries with metrics logged during the test phase, e.g., in model- or callback hooks
        like :meth:`~pytorch_lightning.core.lightning.LightningModule.test_step`,
        :meth:`~pytorch_lightning.core.lightning.LightningModule.test_epoch_end`, etc.
        The length of the list corresponds to the number of test dataloaders used.
    """
    # Only fall back to the previously connected module when no model was passed at all.
    # A truthiness test (`model or ...`) would discard a passed model that evaluates to False,
    # e.g. one that defines `__len__` and is currently empty.
    self.strategy.model = model if model is not None else self.lightning_module
    return self._call_and_handle_interrupt(self._test_impl, model, dataloaders, ckpt_path, verbose, datamodule)
def _test_impl(
    self,
    model: Optional["pl.LightningModule"] = None,
    dataloaders: Optional[Union[EVAL_DATALOADERS, LightningDataModule]] = None,
    ckpt_path: Optional[str] = None,
    verbose: bool = True,
    datamodule: Optional[LightningDataModule] = None,
) -> _EVALUATE_OUTPUT:
    """Set the trainer into the testing state, attach the data, resolve the checkpoint and run.

    Takes the same arguments as :meth:`test`, which passes it to ``_call_and_handle_interrupt``.

    Returns:
        The value returned by ``self._run``.

    Raises:
        MisconfigurationException: If both ``dataloaders`` and ``datamodule`` are given, or if no model
            was passed and none is connected to the trainer.
    """
    # --------------------
    # SETUP HOOK
    # --------------------
    Trainer._log_api_event("test")
    log.detail(f"{self.__class__.__name__}: trainer test stage")

    self.state.fn = TrainerFn.TESTING
    self.state.status = TrainerStatus.RUNNING
    self.testing = True

    # if a datamodule comes in as the second arg, then fix it for the user
    if isinstance(dataloaders, LightningDataModule):
        datamodule = dataloaders
        dataloaders = None
    # If you supply a datamodule you can't supply test_dataloaders.
    # Explicit `is not None` (as in `_fit_impl`) so the check does not depend on the datamodule's truth value.
    if dataloaders is not None and datamodule is not None:
        raise MisconfigurationException("You cannot pass both `trainer.test(dataloaders=..., datamodule=...)`")

    model_provided = model is not None
    if not model_provided:
        # fall back to the connected module only when nothing was passed; a passed model that
        # evaluates to False must not be replaced while `model_provided` is True
        model = self.lightning_module
    if model is None:
        raise MisconfigurationException(
            "`model` must be provided to `trainer.test()` when it hasn't been passed in a previous run"
        )

    self.test_loop.verbose = verbose

    # links data to the trainer
    self._data_connector.attach_data(model, test_dataloaders=dataloaders, datamodule=datamodule)

    self._ckpt_path = self.__set_ckpt_path(
        ckpt_path, model_provided=model_provided, model_connected=self.lightning_module is not None
    )

    self._tested_ckpt_path = self.ckpt_path  # TODO: remove in v1.8

    # run test
    results = self._run(model, ckpt_path=self.ckpt_path)

    assert self.state.stopped
    self.testing = False

    return results
def predict(
    self,
    model: Optional["pl.LightningModule"] = None,
    dataloaders: Optional[Union[EVAL_DATALOADERS, LightningDataModule]] = None,
    datamodule: Optional[LightningDataModule] = None,
    return_predictions: Optional[bool] = None,
    ckpt_path: Optional[str] = None,
) -> Optional[_PREDICT_OUTPUT]:
    r"""
    Run inference on your data.
    This will call the model forward function to compute predictions. Useful to perform distributed
    and batched predictions. Logging is disabled in the predict hooks.

    Args:
        model: The model to predict with.

        dataloaders: A :class:`torch.utils.data.DataLoader` or a sequence of them,
            or a :class:`~pytorch_lightning.core.datamodule.LightningDataModule` specifying prediction samples.

        datamodule: The datamodule with a predict_dataloader method that returns one or more dataloaders.

        return_predictions: Whether to return predictions.
            ``True`` by default except when an accelerator that spawns processes is used (not supported).

        ckpt_path: Either ``best`` or path to the checkpoint you wish to predict.
            If ``None`` and the model instance was passed, use the current weights.
            Otherwise, the best model checkpoint from the previous ``trainer.fit`` call will be loaded
            if a checkpoint callback is configured.

    Returns:
        Returns a list of dictionaries, one for each provided dataloader containing their respective predictions.
    """
    # Only fall back to the previously connected module when no model was passed at all.
    # A truthiness test (`model or ...`) would discard a passed model that evaluates to False,
    # e.g. one that defines `__len__` and is currently empty.
    self.strategy.model = model if model is not None else self.lightning_module
    return self._call_and_handle_interrupt(
        self._predict_impl, model, dataloaders, datamodule, return_predictions, ckpt_path
    )
def _predict_impl(
    self,
    model: Optional["pl.LightningModule"] = None,
    dataloaders: Optional[Union[EVAL_DATALOADERS, LightningDataModule]] = None,
    datamodule: Optional[LightningDataModule] = None,
    return_predictions: Optional[bool] = None,
    ckpt_path: Optional[str] = None,
) -> Optional[_PREDICT_OUTPUT]:
    """Set the trainer into the predicting state, attach the data, resolve the checkpoint and run.

    Takes the same arguments as :meth:`predict`, which passes it to ``_call_and_handle_interrupt``.

    Returns:
        The value returned by ``self._run``.

    Raises:
        MisconfigurationException: If both ``dataloaders`` and ``datamodule`` are given, or if no model
            was passed and none is connected to the trainer.
    """
    # --------------------
    # SETUP HOOK
    # --------------------
    Trainer._log_api_event("predict")
    log.detail(f"{self.__class__.__name__}: trainer predict stage")

    self.state.fn = TrainerFn.PREDICTING
    self.state.status = TrainerStatus.RUNNING
    self.predicting = True

    self.predict_loop.return_predictions = return_predictions

    # if a datamodule comes in as the second arg, then fix it for the user
    if isinstance(dataloaders, LightningDataModule):
        datamodule = dataloaders
        dataloaders = None
    # Explicit `is not None` (as in `_fit_impl`) so the check does not depend on the datamodule's truth value.
    if dataloaders is not None and datamodule is not None:
        raise MisconfigurationException("You cannot pass both `trainer.predict(dataloaders=..., datamodule=...)`")

    model_provided = model is not None
    if not model_provided:
        # fall back to the connected module only when nothing was passed; a passed model that
        # evaluates to False must not be replaced while `model_provided` is True
        model = self.lightning_module
    if model is None:
        raise MisconfigurationException(
            "`model` must be provided to `trainer.predict()` when it hasn't been passed in a previous run"
        )

    # links data to the trainer
    self._data_connector.attach_data(model, predict_dataloaders=dataloaders, datamodule=datamodule)

    self._ckpt_path = self.__set_ckpt_path(
        ckpt_path, model_provided=model_provided, model_connected=self.lightning_module is not None
    )

    self._predicted_ckpt_path = self.ckpt_path  # TODO: remove in v1.8

    results = self._run(model, ckpt_path=self.ckpt_path)

    assert self.state.stopped
    self.predicting = False

    return results
def tune(
    self,
    model: "pl.LightningModule",
    train_dataloaders: Optional[Union[TRAIN_DATALOADERS, LightningDataModule]] = None,
    val_dataloaders: Optional[EVAL_DATALOADERS] = None,
    datamodule: Optional[LightningDataModule] = None,
    scale_batch_size_kwargs: Optional[Dict[str, Any]] = None,
    lr_find_kwargs: Optional[Dict[str, Any]] = None,
) -> Dict[str, Optional[Union[int, _LRFinder]]]:
    r"""
    Run the hyperparameter tuning routines that precede training.

    Args:
        model: Model to tune.

        train_dataloaders: A collection of :class:`torch.utils.data.DataLoader` or a
            :class:`~pytorch_lightning.core.datamodule.LightningDataModule` specifying training samples.
            In the case of multiple dataloaders, please see this :ref:`section <multiple-dataloaders>`.

        val_dataloaders: A :class:`torch.utils.data.DataLoader` or a sequence of them specifying validation samples.

        datamodule: An instance of :class:`~pytorch_lightning.core.datamodule.LightningDataModule`.

        scale_batch_size_kwargs: Arguments for :func:`~pytorch_lightning.tuner.batch_size_scaling.scale_batch_size`

        lr_find_kwargs: Arguments for :func:`~pytorch_lightning.tuner.lr_finder.lr_find`

    Returns:
        The value returned by ``self.tuner._tune``.

    Raises:
        MisconfigurationException: If dataloaders are passed together with a datamodule.
    """
    Trainer._log_api_event("tune")

    self.state.fn = TrainerFn.TUNING
    self.state.status = TrainerStatus.RUNNING
    self.tuning = True

    # if a datamodule comes in as the second arg, then fix it for the user
    if isinstance(train_dataloaders, LightningDataModule):
        datamodule, train_dataloaders = train_dataloaders, None
    # If you supply a datamodule you can't supply train_dataloader or val_dataloaders
    loaders_given = train_dataloaders is not None or val_dataloaders is not None
    if loaders_given and datamodule is not None:
        raise MisconfigurationException(
            "You cannot pass `train_dataloader` or `val_dataloaders` to `trainer.tune(datamodule=...)`"
        )

    # links data to the trainer
    self._data_connector.attach_data(
        model,
        train_dataloaders=train_dataloaders,
        val_dataloaders=val_dataloaders,
        datamodule=datamodule,
    )

    # the tuner runs inside the `isolate_rng` context manager
    with isolate_rng():
        tuning_result = self.tuner._tune(
            model,
            scale_batch_size_kwargs=scale_batch_size_kwargs,
            lr_find_kwargs=lr_find_kwargs,
        )

    assert self.state.stopped
    self.tuning = False

    return tuning_result
- - def _restore_modules_and_callbacks(self, checkpoint_path: Optional[_PATH] = None) -> None: - # restore modules after setup - self._checkpoint_connector.resume_start(checkpoint_path) - self._checkpoint_connector._restore_quantization_callbacks() - self._checkpoint_connector.restore_model() - self._checkpoint_connector.restore_datamodule() - if self.state.fn == TrainerFn.FITTING: - # restore callback states - self._checkpoint_connector.restore_callbacks() - - def _run( - self, model: "pl.LightningModule", ckpt_path: Optional[str] = None - ) -> Optional[Union[_EVALUATE_OUTPUT, _PREDICT_OUTPUT]]: - # clean hparams - if hasattr(model, "hparams"): - parsing.clean_namespace(model.hparams) - - # attach model to the strategy - self.strategy.connect(model) - - self._callback_connector._attach_model_callbacks() - self._callback_connector._attach_model_logging_functions() - - verify_loop_configurations(self) - - # hook - log.detail(f"{self.__class__.__name__}: preparing data") - self._data_connector.prepare_data() - - # ---------------------------- - # SET UP TRAINING - # ---------------------------- - self._call_callback_hooks("on_before_accelerator_backend_setup") - log.detail(f"{self.__class__.__name__}: setting up strategy environment") - self.strategy.setup_environment() - self.__setup_profiler() - - self._call_setup_hook() # allow user to setup lightning_module in accelerator environment - - # check if we should delay restoring checkpoint till later - if not self.strategy.restore_checkpoint_after_setup: - log.detail(f"{self.__class__.__name__}: restoring module and callbacks from checkpoint path: {ckpt_path}") - self._restore_modules_and_callbacks(ckpt_path) - - log.detail(f"{self.__class__.__name__}: configuring sharded model") - self._call_configure_sharded_model() # allow user to setup in model sharded environment - - # ---------------------------- - # INSPECT THE CORE LOOPS - # ---------------------------- - rf""" - Lightning internal flow looks like this: - 
{Trainer.fit} or {Trainer.test} or {Trainer.predict} || - | || - spawn processes || - {self.strategy.setup_environment} || - | || - setup accelerator || - and strategy || LIGHTNING - | || - {self._run_stage} || FLOW - | || - {self._run_train} || DIRECTION - or {self._run_evaluate} || - or {self._run_predict} || - | || - results \/ - This is used to guide readers to the core loops: train, test, predict. - {self._run_predict} is the simplest to understand, use `Go to Definition` to read it :) - """ - - # ---------------------------- - # TRAIN - # ---------------------------- - - # reset logger connector - self._logger_connector.reset_results() - self._logger_connector.reset_metrics() - - # strategy will configure model and move it to the device - self.strategy.setup(self) - - # hook - if self.state.fn == TrainerFn.FITTING: - self._call_callback_hooks("on_fit_start") - self._call_lightning_module_hook("on_fit_start") - - self._log_hyperparams() - - if self.strategy.restore_checkpoint_after_setup: - log.detail(f"{self.__class__.__name__}: restoring module and callbacks from checkpoint path: {ckpt_path}") - self._restore_modules_and_callbacks(ckpt_path) - - # restore optimizers, etc. 
- log.detail(f"{self.__class__.__name__}: restoring training state") - self._checkpoint_connector.restore_training_state() - - self._checkpoint_connector.resume_end() - - results = self._run_stage() - - log.detail(f"{self.__class__.__name__}: trainer tearing down") - self._teardown() - - # ---------------------------- - # POST-Training CLEAN UP - # ---------------------------- - # hook - if self.state.fn == TrainerFn.FITTING: - self._call_callback_hooks("on_fit_end") - self._call_lightning_module_hook("on_fit_end") - - log.detail(f"{self.__class__.__name__}: calling teardown hooks") - self._call_teardown_hook() - - self.state.status = TrainerStatus.FINISHED - self.state.stage = None - - return results - - def _log_hyperparams(self) -> None: - if not self.loggers: - return - # log hyper-parameters - hparams_initial = None - - # save exp to get started (this is where the first experiment logs are written) - datamodule_log_hyperparams = self.datamodule._log_hyperparams if self.datamodule is not None else False - - if self.lightning_module._log_hyperparams and datamodule_log_hyperparams: - datamodule_hparams = self.datamodule.hparams_initial - lightning_hparams = self.lightning_module.hparams_initial - inconsistent_keys = [] - for key in lightning_hparams.keys() & datamodule_hparams.keys(): - lm_val, dm_val = lightning_hparams[key], datamodule_hparams[key] - if type(lm_val) != type(dm_val): - inconsistent_keys.append(key) - elif isinstance(lm_val, torch.Tensor) and id(lm_val) != id(dm_val): - inconsistent_keys.append(key) - elif lm_val != dm_val: - inconsistent_keys.append(key) - if inconsistent_keys: - raise MisconfigurationException( - f"Error while merging hparams: the keys {inconsistent_keys} are present " - "in both the LightningModule's and LightningDataModule's hparams " - "but have different values." 
- ) - hparams_initial = {**lightning_hparams, **datamodule_hparams} - elif self.lightning_module._log_hyperparams: - hparams_initial = self.lightning_module.hparams_initial - elif datamodule_log_hyperparams: - hparams_initial = self.datamodule.hparams_initial - - for logger in self.loggers: - if hparams_initial is not None: - logger.log_hyperparams(hparams_initial) - logger.log_graph(self.lightning_module) - logger.save() - - def _teardown(self): - """This is the Trainer's internal teardown, unrelated to the `teardown` hooks in LightningModule and - Callback; those are handled by :meth:`_call_teardown_hook`.""" - self.strategy.post_dispatch(self) - self.strategy.teardown() - loop = self._active_loop - # loop should never be `None` here but it can because we don't know the trainer stage with `ddp_spawn` - if loop is not None: - loop.teardown() - self._logger_connector.teardown() - self._signal_connector.teardown() - - def run_stage(self) -> None: - rank_zero_deprecation( - "`Trainer.run_stage` is deprecated in v1.6 and will be removed in v1.8. Use" - " `Trainer.{fit,validate,test,predict}` instead." 
- ) - return self._run_stage() - - def _run_stage(self): - self.strategy.barrier("run-stage") - self.strategy.dispatch(self) - - if self.evaluating: - return self._run_evaluate() - if self.predicting: - return self._run_predict() - return self._run_train() - - def _pre_training_routine(self): - # wait for all to join if on distributed - self.strategy.barrier("setup_training") - - # register signals - self._signal_connector.register_signal_handlers() - - # -------------------------- - # Pre-train - # -------------------------- - self._call_callback_hooks("on_pretrain_routine_start") - self._call_lightning_module_hook("on_pretrain_routine_start") - - self._call_callback_hooks("on_pretrain_routine_end") - self._call_lightning_module_hook("on_pretrain_routine_end") - - def _run_train(self) -> None: - self._pre_training_routine() - - with isolate_rng(): - self._run_sanity_check() - - # enable train mode - self.model.train() - torch.set_grad_enabled(True) - - self.fit_loop.trainer = self - with torch.autograd.set_detect_anomaly(self._detect_anomaly): - self.fit_loop.run() - - def _run_evaluate(self) -> _EVALUATE_OUTPUT: - assert self.evaluating - - # reload dataloaders - self._evaluation_loop._reload_evaluation_dataloaders() - - # reset trainer on this loop and all child loops in case user connected a custom loop - self._evaluation_loop.trainer = self - - with self.profiler.profile(f"run_{self.state.stage}_evaluation"), torch.no_grad(): - eval_loop_results = self._evaluation_loop.run() - - # remove the tensors from the eval results - for result in eval_loop_results: - if isinstance(result, dict): - for k, v in result.items(): - if isinstance(v, torch.Tensor): - result[k] = v.cpu().item() - - return eval_loop_results - - def _run_predict(self) -> Optional[_PREDICT_OUTPUT]: - self.reset_predict_dataloader(self.lightning_module) - # reset trainer on this loop and all child loops in case user connected a custom loop - self.predict_loop.trainer = self - with torch.no_grad(): 
- return self.predict_loop.run() - - def _run_sanity_check(self) -> None: - val_loop = self.fit_loop.epoch_loop.val_loop - - should_sanity_check = ( - self.enable_validation - and self.num_sanity_val_steps > 0 - # do not sanity check if restarting because it would mess up the loaded state - and not val_loop.restarting - ) - - # run tiny validation (if validation defined) - # to make sure program won't crash during val - if should_sanity_check: - stage = self.state.stage - self.sanity_checking = True - - # reset logger connector - self._logger_connector.reset_results() - self._logger_connector.reset_metrics() - - self._call_callback_hooks("on_sanity_check_start") - - # reload dataloaders - val_loop._reload_evaluation_dataloaders() - self.num_sanity_val_batches = [ - min(self.num_sanity_val_steps, val_batches) for val_batches in self.num_val_batches - ] - - # run eval step - with torch.no_grad(): - val_loop.run() - - self._call_callback_hooks("on_sanity_check_end") - - # reset logger connector - self._logger_connector.reset_results() - self._logger_connector.reset_metrics() - - # reset the progress tracking state after sanity checking. 
we don't need to set the state before - # because sanity check only runs when we are not restarting - _reset_progress(val_loop) - - # restore the previous stage when the sanity check if finished - self.state.stage = stage - - def __set_ckpt_path(self, ckpt_path: Optional[str], model_provided: bool, model_connected: bool) -> Optional[str]: - # fault-tolerance takes precedence - from pytorch_lightning.callbacks.fault_tolerance import _FaultToleranceCheckpoint - - ft_checkpoints = [cb for cb in self.callbacks if isinstance(cb, _FaultToleranceCheckpoint)] - if ft_checkpoints: - ft_ckpt_path = ft_checkpoints[0].ckpt_path - fs = get_filesystem(ft_ckpt_path) - if fs.exists(ft_ckpt_path): - return ft_ckpt_path - - if model_provided and ckpt_path is None: - # use passed model to function without loading weights - return - - fn = self.state.fn.value - - if model_connected and ckpt_path is None: - rank_zero_warn( - f"`.{fn}(ckpt_path=None)` was called without a model." - " The best model of the previous `fit` call will be used." - f" You can pass `{fn}(ckpt_path='best')` to use and best model" - " checkpoint and avoid this warning or" - " `ckpt_path=trainer.checkpoint_callback.last_model_path` to use the last model." - ) - ckpt_path = "best" - - if ckpt_path == "best": - if len(self.checkpoint_callbacks) > 1: - rank_zero_warn( - f'`.{fn}(ckpt_path="best")` is called with Trainer configured with multiple `ModelCheckpoint`' - " callbacks. It will use the best checkpoint path from first checkpoint callback." - ) - - if not self.checkpoint_callback: - raise MisconfigurationException( - f'`.{fn}(ckpt_path="best")` is set but `ModelCheckpoint` is not configured.' - ) - - if not self.checkpoint_callback.best_model_path: - if self.fast_dev_run: - raise MisconfigurationException( - f'You cannot execute `.{fn}(ckpt_path="best")` with `fast_dev_run=True`.' 
- f" Please pass an exact checkpoint path to `.{fn}(ckpt_path=...)`" - ) - raise MisconfigurationException( - f'`.{fn}(ckpt_path="best")` is set but `ModelCheckpoint` is not configured to save the best model.' - ) - # load best weights - ckpt_path = self.checkpoint_callback.best_model_path - - if not ckpt_path: - raise MisconfigurationException( - f"`.{fn}()` found no path for the best weights: {ckpt_path!r}. Please" - f" specify a path for a checkpoint `.{fn}(ckpt_path=PATH)`" - ) - return ckpt_path - - def _call_setup_hook(self) -> None: - fn = self.state.fn._setup_fn - - self.strategy.barrier("pre_setup") - - if self.datamodule is not None: - self.datamodule.setup(stage=fn) - self._call_callback_hooks("setup", stage=fn) - self._call_lightning_module_hook("setup", stage=fn) - - self.strategy.barrier("post_setup") - - def _call_configure_sharded_model(self) -> None: - with self.strategy.model_sharded_context(): - self._handle_meta_model() - self._call_lightning_module_hook("configure_sharded_model") - self._call_callback_hooks("on_configure_sharded_model") - - def _handle_meta_model(self) -> None: - if not is_on_meta_device(self.lightning_module): - return - - if isinstance(self.strategy, DDPSpawnStrategy): - raise MisconfigurationException("LightningModule on meta device isn't supported with spawn.") - - materialize_module(self.lightning_module) - # the trainer reference is lost during materialization - self.lightning_module.trainer = proxy(self) - - def _call_teardown_hook(self) -> None: - fn = self.state.fn._setup_fn - - if self.datamodule is not None: - self.datamodule.teardown(stage=fn) - - self._call_callback_hooks("teardown", stage=fn) - self._call_lightning_module_hook("teardown", stage=fn) - - self.lightning_module._current_fx_name = None - # these could have become stale if metrics are defined in `setup` - self.lightning_module._metric_attributes = None - - # todo: TPU 8 cores hangs in flush with TensorBoard. Might do for all loggers. 
- # It might be related to xla tensors blocked when moving the cpu kill loggers. - for logger in self.loggers: - logger.finalize("success") - - # summarize profile results - self.profiler.describe() - - def call_hook( - self, hook_name: str, *args: Any, pl_module: Optional["pl.LightningModule"] = None, **kwargs: Any - ) -> Any: - r""" - .. deprecated:: v1.6 - The Trainer's `call_hook` method was deprecated in v1.6 and will be removed in v1.8. - """ - rank_zero_deprecation("The Trainer's `call_hook` method was deprecated in v1.6 and will be removed in v1.8.") - pl_module = self.lightning_module or pl_module - if pl_module: - prev_fx_name = pl_module._current_fx_name - pl_module._current_fx_name = hook_name - - # always profile hooks - with self.profiler.profile(hook_name): - - # first call trainer hook - callback_fx = getattr(self, hook_name, None) - if callable(callback_fx): - callback_fx(*args, **kwargs) - - # next call hook in lightningModule - output = None - model_fx = getattr(pl_module, hook_name, None) - if callable(model_fx): - output = model_fx(*args, **kwargs) - - # call the strategy hook - if hook_name not in ("setup", "teardown", "on_train_start") and hasattr(self.strategy, hook_name): - strategy_hook = getattr(self.strategy, hook_name) - strategy_output = strategy_hook(*args, **kwargs) - output = strategy_output if output is None else output - - if pl_module: - # restore current_fx when nested context - pl_module._current_fx_name = prev_fx_name - - return output - - def _call_lightning_module_hook( - self, - hook_name: str, - *args: Any, - pl_module: Optional["pl.LightningModule"] = None, - **kwargs: Any, - ) -> Any: - pl_module = pl_module or self.lightning_module - - if pl_module is None: - raise TypeError("No Lightning Module is available to call hooks on") - - fn = getattr(pl_module, hook_name) - if not callable(fn): - return - - prev_fx_name = pl_module._current_fx_name - pl_module._current_fx_name = hook_name - - with 
self.profiler.profile(f"[LightningModule]{pl_module.__class__.__name__}.{hook_name}"): - output = fn(*args, **kwargs) - - # restore current_fx when nested context - pl_module._current_fx_name = prev_fx_name - - return output - - def _call_callback_hooks( - self, - hook_name: str, - *args: Any, - **kwargs: Any, - ) -> None: - log.debug(f"{self.__class__.__name__}: calling callback hook: {hook_name}") - # TODO: remove if block in v1.8 - if hook_name in ("on_init_start", "on_init_end"): - # these `Callback` hooks are the only ones that do not take a lightning module. - # we also don't profile bc profiler hasn't been set yet - for callback in self.callbacks: - fn = getattr(callback, hook_name) - if callable(fn): - fn(self, *args, **kwargs) - return - - pl_module = self.lightning_module - if pl_module: - prev_fx_name = pl_module._current_fx_name - pl_module._current_fx_name = hook_name - - # TODO: remove if block in v1.7 - if hook_name == "on_train_batch_start": - with self.profiler.profile(hook_name): - self._on_train_batch_start(*args, **kwargs) - elif hook_name == "on_train_batch_end": - with self.profiler.profile(hook_name): - self._on_train_batch_end(*args, **kwargs) - else: - for callback in self.callbacks: - fn = getattr(callback, hook_name) - if callable(fn): - with self.profiler.profile(f"[Callback]{callback.state_key}.{hook_name}"): - fn(self, self.lightning_module, *args, **kwargs) - - if pl_module: - # restore current_fx when nested context - pl_module._current_fx_name = prev_fx_name - - # TODO: Delete this in v1.7 (deprecations: #9816 and #11148) - def _on_train_batch_start(self, batch, batch_idx, dataloader_idx=0): - r"""Called when the training batch begins. This function is needed because of two different deprecations affecting - the original function in TrainerCallbackHookMixin: #9816 and #11148. 
- """ - for callback in self.callbacks: - if is_param_in_hook_signature(callback.on_train_batch_start, "dataloader_idx", explicit=True): - callback.on_train_batch_start(self, self.lightning_module, batch, batch_idx, 0) - else: - callback.on_train_batch_start(self, self.lightning_module, batch, batch_idx) - - # TODO: Delete this in v1.7 (deprecations: #9816 and #11148) - def _on_train_batch_end(self, outputs: STEP_OUTPUT, batch, batch_idx, dataloader_idx=0): - r"""Called when the training batch ends. This function is needed because of two different deprecations affecting - the original function in TrainerCallbackHookMixin: #9816 and #11148. - """ - for callback in self.callbacks: - if is_param_in_hook_signature(callback.on_train_batch_end, "dataloader_idx", explicit=True): - callback.on_train_batch_end(self, self.lightning_module, outputs, batch, batch_idx, 0) - else: - callback.on_train_batch_end(self, self.lightning_module, outputs, batch, batch_idx) - - def _call_callbacks_state_dict(self) -> Dict[str, dict]: - """Called when saving a model checkpoint, calls and returns every callback's `state_dict`, keyed by - `Callback.state_key`.""" - callback_state_dicts = {} - for callback in self.callbacks: - state_dict = callback.state_dict() - if state_dict: - callback_state_dicts[callback.state_key] = state_dict - return callback_state_dicts - - def _call_callbacks_on_save_checkpoint(self, checkpoint: Dict[str, Any]) -> None: - """Called when saving a model checkpoint, calls every callback's `on_save_checkpoint` hook. - - Will be removed in v1.8: If state is returned, we insert the callback state into - ``checkpoint["callbacks"][Callback.state_key]``. It overrides ``state_dict`` if already present. 
- """ - pl_module = self.lightning_module - if pl_module: - prev_fx_name = pl_module._current_fx_name - pl_module._current_fx_name = "on_save_checkpoint" - - for callback in self.callbacks: - with self.profiler.profile(f"[Callback]{callback.state_key}.on_save_checkpoint"): - state = callback.on_save_checkpoint(self, self.lightning_module, checkpoint) - if state: - rank_zero_deprecation( - f"Returning a value from `{callback.__class__.__name__}.on_save_checkpoint` is deprecated in v1.6" - " and will be removed in v1.8. Please override `Callback.state_dict`" - " to return state to be saved." - ) - checkpoint["callbacks"][callback.state_key] = state - - if pl_module: - # restore current_fx when nested context - pl_module._current_fx_name = prev_fx_name - - def _call_callbacks_on_load_checkpoint(self, checkpoint: Dict[str, Any]) -> None: - """Called when loading a model checkpoint. - - Calls every callback's `on_load_checkpoint` hook. We have a dedicated function for this rather than using - `_call_callback_hooks` because we have special logic for getting callback_states. - """ - pl_module = self.lightning_module - if pl_module: - prev_fx_name = pl_module._current_fx_name - pl_module._current_fx_name = "on_load_checkpoint" - - callback_states: Dict[Union[Type, str], Dict] = checkpoint.get("callbacks") - - if callback_states is None: - return - - is_legacy_ckpt = Version(checkpoint["pytorch-lightning_version"]) < Version("1.5.0dev") - current_callbacks_keys = {cb._legacy_state_key if is_legacy_ckpt else cb.state_key for cb in self.callbacks} - difference = callback_states.keys() - current_callbacks_keys - if difference: - rank_zero_warn( - "Be aware that when using `ckpt_path`," - " callbacks used to create the checkpoint need to be provided during `Trainer` instantiation." 
- f" Please add the following callbacks: {list(difference)}.", - ) - - for callback in self.callbacks: - state = callback_states.get(callback.state_key, callback_states.get(callback._legacy_state_key)) - if state: - state = deepcopy(state) - with self.profiler.profile(f"[Callback]{callback.state_key}.on_load_checkpoint"): - callback.on_load_checkpoint(self, self.lightning_module, state) - - if pl_module: - # restore current_fx when nested context - pl_module._current_fx_name = prev_fx_name - - def _call_callbacks_load_state_dict(self, checkpoint: Dict[str, Any]) -> None: - """Called when loading a model checkpoint, calls every callback's `load_state_dict`.""" - callback_states: Dict[Union[Type, str], Dict] = checkpoint.get("callbacks") - - if callback_states is None: - return - - for callback in self.callbacks: - state = callback_states.get(callback.state_key, callback_states.get(callback._legacy_state_key)) - if state: - state = deepcopy(state) - callback.load_state_dict(state) - - def _call_strategy_hook( - self, - hook_name: str, - *args: Any, - **kwargs: Any, - ) -> Any: - pl_module = self.lightning_module - prev_fx_name = pl_module._current_fx_name - pl_module._current_fx_name = hook_name - - fn = getattr(self.strategy, hook_name) - if not callable(fn): - return - - with self.profiler.profile(f"[Strategy]{self.strategy.__class__.__name__}.{hook_name}"): - output = fn(*args, **kwargs) - - # restore current_fx when nested context - pl_module._current_fx_name = prev_fx_name - - return output - - @staticmethod - def _log_api_event(event: str) -> None: - torch._C._log_api_usage_once("lightning.trainer." 
+ event) - - def __init_profiler(self, profiler: Optional[Union[Profiler, str]]) -> None: - if isinstance(profiler, str): - PROFILERS = { - "simple": SimpleProfiler, - "advanced": AdvancedProfiler, - "pytorch": PyTorchProfiler, - "xla": XLAProfiler, - } - profiler = profiler.lower() - if profiler not in PROFILERS: - raise MisconfigurationException( - "When passing string value for the `profiler` parameter of `Trainer`," - f" it can only be one of {list(PROFILERS.keys())}" - ) - profiler_class = PROFILERS[profiler] - profiler = profiler_class() - self.profiler: Profiler = profiler or PassThroughProfiler() - - def __setup_profiler(self) -> None: - local_rank = self.local_rank if self.world_size > 1 else None - self.profiler._lightning_module = proxy(self.lightning_module) - self.profiler.setup(stage=self.state.fn._setup_fn, local_rank=local_rank, log_dir=self.log_dir) - - def _log_device_info(self) -> None: - rank_zero_info( - f"GPU available: {torch.cuda.is_available()}, used: {isinstance(self.accelerator, GPUAccelerator)}" - ) - - num_tpu_cores = self.num_devices if isinstance(self.accelerator, TPUAccelerator) else 0 - rank_zero_info(f"TPU available: {_TPU_AVAILABLE}, using: {num_tpu_cores} TPU cores") - - num_ipus = self.num_devices if isinstance(self.accelerator, IPUAccelerator) else 0 - rank_zero_info(f"IPU available: {_IPU_AVAILABLE}, using: {num_ipus} IPUs") - - num_hpus = self.num_devices if isinstance(self.accelerator, HPUAccelerator) else 0 - rank_zero_info(f"HPU available: {_HPU_AVAILABLE}, using: {num_hpus} HPUs") - - if torch.cuda.is_available() and not isinstance(self.accelerator, GPUAccelerator): - rank_zero_warn( - "GPU available but not used. Set `accelerator` and `devices` using" - f" `Trainer(accelerator='gpu', devices={GPUAccelerator.auto_device_count()})`.", - category=PossibleUserWarning, - ) - - if _TPU_AVAILABLE and not isinstance(self.accelerator, TPUAccelerator): - rank_zero_warn( - "TPU available but not used. 
Set `accelerator` and `devices` using" - f" `Trainer(accelerator='tpu', devices={TPUAccelerator.auto_device_count()})`." - ) - - if _IPU_AVAILABLE and not isinstance(self.accelerator, IPUAccelerator): - rank_zero_warn( - "IPU available but not used. Set `accelerator` and `devices` using" - f" `Trainer(accelerator='ipu', devices={IPUAccelerator.auto_device_count()})`." - ) - - if _HPU_AVAILABLE and not isinstance(self.accelerator, HPUAccelerator): - rank_zero_warn( - "HPU available but not used. Set `accelerator` and `devices` using" - f" `Trainer(accelerator='hpu', devices={HPUAccelerator.auto_device_count()})`." - ) - - """ - Data loading methods - """ - - def reset_train_dataloader(self, model: Optional["pl.LightningModule"] = None) -> None: - """Resets the train dataloader and initialises required variables (number of batches, when to validate, - etc.). - - Args: - model: The ``LightningModule`` if calling this outside of the trainer scope. - """ - source = self._data_connector._train_dataloader_source - pl_module = self.lightning_module or model - has_step = is_overridden("training_step", pl_module) - enable_training = self.limit_train_batches > 0 - if not (source.is_defined() and has_step and enable_training): - return - - self.train_dataloader = self._data_connector._request_dataloader(RunningStage.TRAINING, model=model) - - if self.overfit_batches > 0: - self.train_dataloader = self._data_connector._resolve_overfit_batches(self.train_dataloader) - - # automatically add samplers - self.train_dataloader = apply_to_collection( - self.train_dataloader, - (DataLoader, CombinedLoader), - self._data_connector._prepare_dataloader, - mode=RunningStage.TRAINING, - ) - loaders = ( - self.train_dataloader.loaders - if isinstance(self.train_dataloader, CombinedLoader) - else self.train_dataloader - ) - - # check the workers recursively - apply_to_collection(loaders, DataLoader, self._data_connector._worker_check, "train_dataloader") - - # add worker_init_fn for correct 
seeding in worker processes - apply_to_collection(loaders, DataLoader, _auto_add_worker_init_fn, rank=self.global_rank) - - # add collate_fn to collect metadata for fault tolerant training - if _fault_tolerant_training(): - apply_to_collection(loaders, DataLoader, _add_capture_metadata_collate) - - # wrap the sequence of train loaders to a CombinedLoader object for computing the num_training_batches - if not isinstance(self.train_dataloader, CombinedLoader): - self.train_dataloader = CombinedLoader(loaders, self._data_connector.multiple_trainloader_mode) - - module = model or self.lightning_module or self.datamodule - self.num_training_batches = ( - len(self.train_dataloader) - if has_len_all_ranks(self.train_dataloader, self.strategy, module) - else float("inf") - ) - - if isinstance(self.limit_train_batches, int): - self.num_training_batches = min(self.num_training_batches, int(self.limit_train_batches)) - elif self.num_training_batches != float("inf"): - self.num_training_batches = int(self.num_training_batches * self.limit_train_batches) - elif self.limit_train_batches != 1.0: - raise MisconfigurationException( - "When using an IterableDataset for `limit_train_batches`," - " `Trainer(limit_train_batches)` must be `1.0` or an int. An int k specifies" - " `num_training_batches` to use." - ) - - if isinstance(self.val_check_interval, int): - self.val_check_batch = self.val_check_interval - if self.val_check_batch > self.num_training_batches: - raise ValueError( - f"`val_check_interval` ({self.val_check_interval}) must be less than or equal " - f"to the number of the training batches ({self.num_training_batches}). " - "If you want to disable validation set `limit_val_batches` to 0.0 instead." 
- ) - else: - if not has_len_all_ranks(self.train_dataloader, self.strategy, module): - if self.val_check_interval == 1.0: - self.val_check_batch = float("inf") - else: - raise MisconfigurationException( - "When using an IterableDataset for `train_dataloader`," - " `Trainer(val_check_interval)` must be `1.0` or an int. An int k specifies" - " checking validation every k training batches." - ) - else: - self.val_check_batch = int(self.num_training_batches * self.val_check_interval) - self.val_check_batch = max(1, self.val_check_batch) - - if self.loggers and self.num_training_batches < self.log_every_n_steps: - rank_zero_warn( - f"The number of training batches ({self.num_training_batches}) is smaller than the logging interval" - f" Trainer(log_every_n_steps={self.log_every_n_steps}). Set a lower value for log_every_n_steps if" - " you want to see logs for the training epoch.", - category=PossibleUserWarning, - ) - - # store epoch of dataloader reset for reload_dataloaders_every_n_epochs - self._last_train_dl_reload_epoch = self.current_epoch - - def reset_val_dataloader(self, model: Optional["pl.LightningModule"] = None) -> None: - """Resets the validation dataloader and determines the number of batches. - - Args: - model: The ``LightningModule`` if called outside of the trainer scope. 
- """ - source = self._data_connector._val_dataloader_source - pl_module = self.lightning_module or model - has_step = is_overridden("validation_step", pl_module) - enable_validation = self.limit_val_batches > 0 - if source.is_defined() and has_step and enable_validation: - self.num_val_batches, self.val_dataloaders = self._data_connector._reset_eval_dataloader( - RunningStage.VALIDATING, model=pl_module - ) - - # store epoch of dataloader reset for reload_dataloaders_every_n_epochs - self._last_val_dl_reload_epoch = self.current_epoch - - def reset_test_dataloader(self, model: Optional["pl.LightningModule"] = None) -> None: - """Resets the test dataloader and determines the number of batches. - - Args: - model: The ``LightningModule`` if called outside of the trainer scope. - """ - source = self._data_connector._test_dataloader_source - pl_module = self.lightning_module or model - has_step = is_overridden("test_step", pl_module) - enable_testing = self.limit_test_batches > 0 - if source.is_defined() and has_step and enable_testing: - self.num_test_batches, self.test_dataloaders = self._data_connector._reset_eval_dataloader( - RunningStage.TESTING, model=pl_module - ) - - def reset_predict_dataloader(self, model: Optional["pl.LightningModule"] = None) -> None: - """Resets the predict dataloader and determines the number of batches. - - Args: - model: The ``LightningModule`` if called outside of the trainer scope. - """ - source = self._data_connector._predict_dataloader_source - pl_module = self.lightning_module or model - enable_prediction = self.limit_predict_batches > 0 - if source.is_defined() and enable_prediction: - self.num_predict_batches, self.predict_dataloaders = self._data_connector._reset_eval_dataloader( - RunningStage.PREDICTING, model=pl_module - ) - - def reset_train_val_dataloaders(self, model: Optional["pl.LightningModule"] = None) -> None: - """Resets train and val dataloaders if none are attached to the trainer. 
- - The val dataloader must be initialized before training loop starts, as the training loop - inspects the val dataloader to determine whether to run the evaluation loop. - Args: - model: The ``LightningModule`` if called outside of the trainer scope. - """ - if self.train_dataloader is None: - self.reset_train_dataloader(model=model) - if self.val_dataloaders is None: - self.reset_val_dataloader(model=model) - - """ - Accelerator properties - """ - - @property - def accelerator(self) -> Accelerator: - return self.strategy.accelerator - - @property - def strategy(self) -> Strategy: - return self._accelerator_connector.strategy - - @property - def training_type_plugin(self) -> Strategy: - rank_zero_deprecation( - "`Trainer.training_type_plugin` is deprecated in v1.6 and will be removed in v1.8. Use" - " `Trainer.strategy` instead." - ) - return self.strategy - - @property - def precision_plugin(self) -> PrecisionPlugin: - return self.strategy.precision_plugin - - @property - def global_rank(self) -> int: - return self.strategy.global_rank - - @property - def local_rank(self) -> int: - # some strategies define a local rank - return getattr(self.strategy, "local_rank", 0) - - @property - def node_rank(self) -> int: - # some strategies define a node rank - return getattr(self.strategy, "node_rank", 0) - - @property - def world_size(self) -> int: - # some strategies define a world size - return getattr(self.strategy, "world_size", 1) - - @property - def should_rank_save_checkpoint(self) -> bool: - rank_zero_deprecation( - "`Trainer.should_rank_save_checkpoint` is deprecated in v1.6 and will be removed in v1.8.", stacklevel=5 - ) - strategy = self.strategy - return ( - isinstance(strategy, pl.strategies.TPUSpawnStrategy) and strategy.local_rank == 0 or strategy.is_global_zero - ) - - @property - def num_nodes(self) -> int: - return getattr(self.strategy, "num_nodes", 1) - - @property - def device_ids(self) -> List[int]: - """List of device indexes per node.""" - devices 
= ( - self.strategy.parallel_devices - if isinstance(self.strategy, ParallelStrategy) - else [self.strategy.root_device] - ) - device_ids = [] - for idx, device in enumerate(devices): - if isinstance(device, torch.device): - device_ids.append(device.index or idx) - elif isinstance(device, int): - device_ids.append(device) - return device_ids - - @property - def num_devices(self) -> int: - """Number of devices the trainer uses per node.""" - return len(self.device_ids) - - @property - def num_processes(self) -> int: - rank_zero_deprecation( - "`Trainer.num_processes` is deprecated in v1.6 and will be removed in v1.8. " - "Please use `Trainer.num_devices` instead." - ) - return self.num_devices - - @property - def root_gpu(self) -> Optional[int]: - rank_zero_deprecation( - "`Trainer.root_gpu` is deprecated in v1.6 and will be removed in v1.8. " - "Please use `Trainer.strategy.root_device.index` instead." - ) - return self.strategy.root_device.index if isinstance(self.accelerator, GPUAccelerator) else None - - @property - def tpu_cores(self) -> int: - rank_zero_deprecation( - "`Trainer.tpu_cores` is deprecated in v1.6 and will be removed in v1.8. " - "Please use `Trainer.num_devices` instead." - ) - return self.num_devices if isinstance(self.accelerator, TPUAccelerator) else 0 - - @property - def ipus(self) -> int: - rank_zero_deprecation( - "`Trainer.ipus` was deprecated in v1.6 and will be removed in v1.8." - " Please use `Trainer.num_devices` instead." - ) - return self.num_devices if isinstance(self.accelerator, IPUAccelerator) else 0 - - @property - def num_gpus(self) -> int: - rank_zero_deprecation( - "`Trainer.num_gpus` was deprecated in v1.6 and will be removed in v1.8." - " Please use `Trainer.num_devices` instead." - ) - return self.num_devices if isinstance(self.accelerator, GPUAccelerator) else 0 - - @property - def devices(self) -> int: - rank_zero_deprecation( - "`Trainer.devices` was deprecated in v1.6 and will be removed in v1.8." 
- " Please use `Trainer.num_devices` or `Trainer.device_ids` to get device information instead." - ) - return self.num_devices - - @property - def data_parallel_device_ids(self) -> Optional[List[int]]: - rank_zero_deprecation( - "`Trainer.data_parallel_device_ids` was deprecated in v1.6 and will be removed in v1.8." - " Please use `Trainer.device_ids` instead." - ) - return self.device_ids if isinstance(self.accelerator, GPUAccelerator) else None - - @property - def lightning_module(self) -> "pl.LightningModule": - # TODO: this is actually an optional return - return self.strategy.lightning_module - - @property - def optimizers(self) -> List[Optimizer]: - return self.strategy.optimizers - - @optimizers.setter - def optimizers(self, new_optims: Optional[List[Optimizer]]) -> None: - self.strategy.optimizers = new_optims - - @property - def lightning_optimizers(self) -> Dict[int, LightningOptimizer]: - rank_zero_deprecation( - "`Trainer.lightning_optimizers` is deprecated in v1.6 and will be removed in v1.8", stacklevel=5 - ) - return self.strategy._lightning_optimizers - - @property - def lr_scheduler_configs(self) -> List[LRSchedulerConfig]: - return self.strategy.lr_scheduler_configs - - @property - def lr_schedulers(self) -> List[Dict[str, Any]]: - rank_zero_deprecation( - "`Trainer.lr_schedulers` is deprecated in v1.6 and will be removed in v1.8." 
- " You can use `trainer.lr_scheduler_configs` instead which contains dataclasses instead of dictionaries.", - stacklevel=5, - ) - from dataclasses import asdict - - return [asdict(config) for config in self.strategy.lr_scheduler_configs] - - @property - def optimizer_frequencies(self) -> List[int]: - return self.strategy.optimizer_frequencies - - @optimizer_frequencies.setter - def optimizer_frequencies(self, new_freqs: List[int]) -> None: - self.strategy.optimizer_frequencies = new_freqs - - @property - def amp_backend(self) -> Optional[AMPType]: - if isinstance(self.precision_plugin, ApexMixedPrecisionPlugin): - return AMPType.APEX - if isinstance(self.precision_plugin, NativeMixedPrecisionPlugin): - return AMPType.NATIVE - return None - - @property - def precision(self) -> Union[str, int]: - return self.strategy.precision_plugin.precision - - @property - def scaler(self) -> Optional[Any]: - return getattr(self.precision_plugin, "scaler", None) - - @property - def gpus(self) -> Optional[Union[List[int], str, int]]: - rank_zero_deprecation( - "`Trainer.gpus` was deprecated in v1.6 and will be removed in v1.8." - " Please use `Trainer.num_devices` or `Trainer.device_ids` to get device information instead." - ) - return self._accelerator_connector.gpus - - @property - def model(self) -> torch.nn.Module: - """The LightningModule, but possibly wrapped into DataParallel or DistributedDataParallel. - - To access the pure LightningModule, use - :meth:`~pytorch_lightning.trainer.trainer.Trainer.lightning_module` instead. - """ - return self.strategy.model - - @model.setter - def model(self, model: torch.nn.Module) -> None: - """Setter for the model, pass-through to accelerator and plugin where the model reference is stored. Used - by the Tuner to reset the state of Trainer and Accelerator. - - Args: - model: The LightningModule, possibly wrapped into DataParallel or DistributedDataParallel, depending - on the backend. 
- """ - self.strategy.model = model - - """ - General properties - """ - - @property - def log_dir(self) -> Optional[str]: - if len(self.loggers) == 1: - if isinstance(self.logger, TensorBoardLogger): - dirpath = self.logger.log_dir - else: - dirpath = self.logger.save_dir - else: - dirpath = self.default_root_dir - - dirpath = self.strategy.broadcast(dirpath) - return dirpath - - @property - def use_amp(self) -> bool: - rank_zero_deprecation( - "`Trainer.use_amp` is deprecated in v1.6.0 and will be removed in v1.8.0." - " Please use `Trainer.amp_backend` instead." - ) - return self.precision == 16 - - @property - def is_global_zero(self) -> bool: - return self.strategy.is_global_zero - - @property - def slurm_job_id(self) -> Optional[int]: - rank_zero_deprecation("Method `slurm_job_id` is deprecated in v1.6.0 and will be removed in v1.7.0.") - return SLURMEnvironment.job_id() - - @property - def distributed_sampler_kwargs(self) -> Optional[dict]: - if isinstance(self.strategy, ParallelStrategy): - return self.strategy.distributed_sampler_kwargs - - @property - def data_parallel(self) -> bool: - return isinstance(self.strategy, ParallelStrategy) - - @property - def progress_bar_dict(self) -> dict: - """Read-only for progress bar metrics.""" - rank_zero_deprecation( - "`trainer.progress_bar_dict` is deprecated in v1.5 and will be removed in v1.7." - " Use `ProgressBarBase.get_metrics` instead." 
- ) - ref_model = self.lightning_module - ref_model = cast(pl.LightningModule, ref_model) - if self.progress_bar_callback: - return self.progress_bar_callback.get_metrics(self, ref_model) - return self.progress_bar_metrics - - @property - def enable_validation(self) -> bool: - """Check if we should run validation during training.""" - return ( - self._data_connector._val_dataloader_source.is_defined() - and is_overridden("validation_step", self.lightning_module) - and self.limit_val_batches > 0 - ) - - @property - def default_root_dir(self) -> str: - """The default location to save artifacts of loggers, checkpoints etc. - - It is used as a fallback if logger or checkpoint callback do not define specific save paths. - """ - if get_filesystem(self._default_root_dir).protocol == "file": - return os.path.normpath(self._default_root_dir) - return self._default_root_dir - - @property - def weights_save_path(self) -> str: - """ - The default root location to save weights (checkpoints), e.g., when the - :class:`~pytorch_lightning.callbacks.model_checkpoint.ModelCheckpoint` does not define a file path. - - .. deprecated:: v1.6 - `Trainer.weights_save_path` has been deprecated in v1.6 and will be removed in v1.8. - """ - rank_zero_deprecation("`Trainer.weights_save_path` has been deprecated in v1.6 and will be removed in v1.8.") - return self._weights_save_path_internal - - # TODO: Remove _weights_save_path_internal in v1.8 - @property - def _weights_save_path_internal(self) -> str: - """This is an internal implementation of weights_save_path which allows weights_save_path to be used - internally by the framework without emitting a deprecation warning. - - To be removed in v1.8. 
- """ - if get_filesystem(self._weights_save_path).protocol == "file": - return os.path.normpath(self._weights_save_path) - return self._weights_save_path - - @property - def early_stopping_callback(self) -> Optional[EarlyStopping]: - """The first :class:`~pytorch_lightning.callbacks.early_stopping.EarlyStopping` callback in the - Trainer.callbacks list, or ``None`` if it doesn't exist.""" - callbacks = self.early_stopping_callbacks - return callbacks[0] if len(callbacks) > 0 else None - - @property - def early_stopping_callbacks(self) -> List[EarlyStopping]: - """A list of all instances of :class:`~pytorch_lightning.callbacks.early_stopping.EarlyStopping` found in - the Trainer.callbacks list.""" - return [c for c in self.callbacks if isinstance(c, EarlyStopping)] - - @property - def prediction_writer_callbacks(self) -> List[BasePredictionWriter]: - """A list of all instances of :class:`~pytorch_lightning.callbacks.prediction_writer.BasePredictionWriter` - found in the Trainer.callbacks list.""" - return [cb for cb in self.callbacks if isinstance(cb, BasePredictionWriter)] - - @property - def checkpoint_callback(self) -> Optional[ModelCheckpoint]: - """The first :class:`~pytorch_lightning.callbacks.model_checkpoint.ModelCheckpoint` callback in the - Trainer.callbacks list, or ``None`` if it doesn't exist.""" - callbacks = self.checkpoint_callbacks - return callbacks[0] if len(callbacks) > 0 else None - - @property - def checkpoint_callbacks(self) -> List[ModelCheckpoint]: - """A list of all instances of :class:`~pytorch_lightning.callbacks.model_checkpoint.ModelCheckpoint` found - in the Trainer.callbacks list.""" - return [c for c in self.callbacks if isinstance(c, ModelCheckpoint)] - - @property - def progress_bar_callback(self) -> Optional[ProgressBarBase]: - """An instance of :class:`~pytorch_lightning.callbacks.progress.base.ProgressBarBase` found in the - Trainer.callbacks list, or ``None`` if one doesn't exist.""" - for c in self.callbacks: - if 
isinstance(c, ProgressBarBase): - return c - return None - - @property - def resume_from_checkpoint(self) -> Optional[Union[str, Path]]: - resume_from_checkpoint = self._checkpoint_connector.resume_from_checkpoint_fit_path - if resume_from_checkpoint is not None: - rank_zero_deprecation( - "`trainer.resume_from_checkpoint` is deprecated in v1.5 and will be removed in v2.0." - " Specify the fit checkpoint path with `trainer.fit(ckpt_path=)` instead.", - stacklevel=5, - ) - - return resume_from_checkpoint - - @property - def ckpt_path(self) -> Optional[str]: - """Set to the path/URL of a checkpoint loaded via :meth:`~pytorch_lightning.trainer.trainer.Trainer.fit`, - :meth:`~pytorch_lightning.trainer.trainer.Trainer.validate`, - :meth:`~pytorch_lightning.trainer.trainer.Trainer.test`, or - :meth:`~pytorch_lightning.trainer.trainer.Trainer.predict`. ``None`` otherwise.""" - return self._ckpt_path - - @property - def validated_ckpt_path(self) -> Optional[str]: - rank_zero_deprecation( - "The `Trainer.validated_ckpt_path` attribute was deprecated in v1.6 and will be removed in v1.8. The" - " path of a checkpoint loaded via `Trainer.{fit,validate,test,predict}` should be accessed via" - " `Trainer.ckpt_path` instead.", - stacklevel=5, - ) - return self._validated_ckpt_path - - @validated_ckpt_path.setter - def validated_ckpt_path(self, ckpt_path: Optional[str]) -> None: - rank_zero_deprecation( - "The `Trainer.validated_ckpt_path` attribute was deprecated in v1.6 and will be removed in v1.8. The" - " path of a checkpoint loaded via `Trainer.{fit,validate,test,predict}` should be accessed via the" - " read-only `Trainer.ckpt_path`.", - stacklevel=5, - ) - self._validated_ckpt_path = ckpt_path - - @property - def tested_ckpt_path(self) -> Optional[str]: - rank_zero_deprecation( - "The `Trainer.tested_ckpt_path` attribute was deprecated in v1.6 and will be removed in v1.8. 
The" - " path of a checkpoint loaded via `Trainer.{fit,validate,test,predict}` should be accessed via" - " `Trainer.ckpt_path` instead.", - stacklevel=5, - ) - return self._tested_ckpt_path - - @tested_ckpt_path.setter - def tested_ckpt_path(self, ckpt_path: Optional[str]) -> None: - rank_zero_deprecation( - "The `Trainer.tested_ckpt_path` attribute was deprecated in v1.6 and will be removed in v1.8. The" - " path of a checkpoint loaded via `Trainer.{fit,validate,test,predict}` should be accessed via the" - " read-only `Trainer.ckpt_path` instead.", - stacklevel=5, - ) - self._tested_ckpt_path = ckpt_path - - @property - def predicted_ckpt_path(self) -> Optional[str]: - rank_zero_deprecation( - "The `Trainer.predicted_ckpt_path` attribute was deprecated in v1.6 and will be removed in v1.8. The" - " path of a checkpoint loaded via `Trainer.{fit,validate,test,predict}` should be accessed via" - " `Trainer.ckpt_path` instead.", - stacklevel=5, - ) - return self._predicted_ckpt_path - - @predicted_ckpt_path.setter - def predicted_ckpt_path(self, ckpt_path: Optional[str]) -> None: - rank_zero_deprecation( - "The `Trainer.predicted_ckpt_path` attribute was deprecated in v1.6 and will be removed in v1.8. The" - " path of a checkpoint loaded via `Trainer.{fit,validate,test,predict}` should be accessed via the" - " read-only `Trainer.ckpt_path` instead.", - stacklevel=5, - ) - self._predicted_ckpt_path = ckpt_path - - def save_checkpoint( - self, filepath: _PATH, weights_only: bool = False, storage_options: Optional[Any] = None - ) -> None: - r""" - Runs routine to create a checkpoint. - - Args: - filepath: Path where checkpoint is saved. - weights_only: If ``True``, will only save the model weights. 
- storage_options: parameter for how to save to storage, passed to ``CheckpointIO`` plugin - - """ - self._checkpoint_connector.save_checkpoint(filepath, weights_only=weights_only, storage_options=storage_options) - - """ - Parsing properties - """ - - @classmethod - def default_attributes(cls) -> dict: - init_signature = inspect.signature(cls) - return {k: v.default for k, v in init_signature.parameters.items()} - - @classmethod - def get_deprecated_arg_names(cls) -> List: - """Returns a list with deprecated Trainer arguments.""" - depr_arg_names = [] - for name, val in cls.__dict__.items(): - if name.startswith("DEPRECATED") and isinstance(val, (tuple, list)): - depr_arg_names.extend(val) - return depr_arg_names - - @classmethod - def from_argparse_args(cls: Any, args: Union[Namespace, ArgumentParser], **kwargs) -> Any: - return from_argparse_args(cls, args, **kwargs) - - @classmethod - def parse_argparser(cls, arg_parser: Union[ArgumentParser, Namespace]) -> Namespace: - return parse_argparser(cls, arg_parser) - - @classmethod - def match_env_arguments(cls) -> Namespace: - return parse_env_variables(cls) - - @classmethod - def add_argparse_args(cls, parent_parser: ArgumentParser, **kwargs) -> ArgumentParser: - return add_argparse_args(cls, parent_parser, **kwargs) - - """ - State properties - """ - - @property - def interrupted(self) -> bool: - return self.state.status == TrainerStatus.INTERRUPTED - - @property - def training(self) -> bool: - return self.state.stage == RunningStage.TRAINING - - @training.setter - def training(self, val: bool) -> None: - if val: - self.state.stage = RunningStage.TRAINING - elif self.training: - self.state.stage = None - - @property - def testing(self) -> bool: - return self.state.stage == RunningStage.TESTING - - @testing.setter - def testing(self, val: bool) -> None: - if val: - self.state.stage = RunningStage.TESTING - elif self.testing: - self.state.stage = None - - @property - def predicting(self) -> bool: - return 
self.state.stage == RunningStage.PREDICTING - - @predicting.setter - def predicting(self, val: bool) -> None: - if val: - self.state.stage = RunningStage.PREDICTING - elif self.predicting: - self.state.stage = None - - @property - def tuning(self) -> bool: - return self.state.stage == RunningStage.TUNING - - @tuning.setter - def tuning(self, val: bool) -> None: - if val: - self.state.stage = RunningStage.TUNING - elif self.tuning: - self.state.stage = None - - @property - def validating(self) -> bool: - return self.state.stage == RunningStage.VALIDATING - - @validating.setter - def validating(self, val: bool) -> None: - if val: - self.state.stage = RunningStage.VALIDATING - elif self.validating: - self.state.stage = None - - @property - def evaluating(self) -> bool: - return self.state.stage and self.state.stage.evaluating - - @property - def sanity_checking(self) -> bool: - return self.state.stage == RunningStage.SANITY_CHECKING - - @sanity_checking.setter - def sanity_checking(self, val: bool) -> None: - if val: - self.state.stage = RunningStage.SANITY_CHECKING - elif self.sanity_checking: - self.state.stage = None - - """ - Loop properties - """ - - @property - def global_step(self) -> int: - """The number of optimizer steps taken (does not reset each epoch). - - This includes multiple optimizers and TBPTT steps (if enabled). 
- """ - return self.fit_loop.epoch_loop.global_step - - @property - def current_epoch(self) -> int: - """The current epoch, updated after the epoch end hooks are run.""" - return self.fit_loop.epoch_progress.current.completed - - @property - def max_epochs(self) -> int: - return self.fit_loop.max_epochs - - @property - def min_epochs(self) -> int: - return self.fit_loop.min_epochs - - @property - def max_steps(self) -> int: - return self.fit_loop.max_steps - - @property - def min_steps(self) -> Optional[int]: - return self.fit_loop.min_steps - - @property - def is_last_batch(self) -> bool: - return self.fit_loop.epoch_loop.batch_progress.is_last_batch - - @property - def fit_loop(self) -> FitLoop: - return self._fit_loop - - @fit_loop.setter - def fit_loop(self, loop: FitLoop): - """Attach a custom fit loop to this Trainer. - - It will run with - :meth:`~pytorch_lightning.trainer.trainer.Trainer.fit`. - """ - loop.trainer = self - self._fit_loop = loop - - @property - def validate_loop(self) -> EvaluationLoop: - return self._validate_loop - - @validate_loop.setter - def validate_loop(self, loop: EvaluationLoop): - """Attach a custom validation loop to this Trainer. - - It will run with - :meth:`~pytorch_lightning.trainer.trainer.Trainer.validate`. Note that this loop is different from the one - running during training inside the :meth:`pytorch_lightning.trainer.trainer.Trainer.fit` call. - """ - loop.trainer = self - self._validate_loop = loop - - @property - def test_loop(self) -> EvaluationLoop: - return self._test_loop - - @test_loop.setter - def test_loop(self, loop: EvaluationLoop): - """Attach a custom test loop to this Trainer. - - It will run with - :meth:`~pytorch_lightning.trainer.trainer.Trainer.test`. 
- """ - loop.trainer = self - self._test_loop = loop - - @property - def predict_loop(self) -> PredictionLoop: - return self._predict_loop - - @predict_loop.setter - def predict_loop(self, loop: PredictionLoop): - """Attach a custom prediction loop to this Trainer. - - It will run with - :meth:`~pytorch_lightning.trainer.trainer.Trainer.predict`. - """ - loop.trainer = self - self._predict_loop = loop - - @property - def verbose_evaluate(self) -> bool: - rank_zero_deprecation( - "The `Trainer.verbose_evaluate` property has been deprecated and will be removed in v1.8. The current value" - " returned is the union of the validate and test loop values. You can choose which one to access with" - " `trainer.{validate,test}_loop.verbose`.", - stacklevel=5, - ) - return self.validate_loop.verbose or self.test_loop.verbose - - @verbose_evaluate.setter - def verbose_evaluate(self, verbose: bool) -> None: - rank_zero_deprecation( - "The `Trainer.verbose_evaluate` property has been deprecated and will be removed in v1.8. This will set" - " the value for both trainer.{validate,test}_loop.verbose`.", - stacklevel=5, - ) - self.validate_loop.verbose = verbose - self.test_loop.verbose = verbose - - @property - def _evaluation_loop(self) -> EvaluationLoop: - if self.state.fn in (TrainerFn.FITTING, TrainerFn.TUNING): - return self.fit_loop.epoch_loop.val_loop - if self.state.fn == TrainerFn.VALIDATING: - return self.validate_loop - if self.state.fn == TrainerFn.TESTING: - return self.test_loop - raise RuntimeError("The `Trainer._evaluation_loop` property isn't defined. 
Accessed outside of scope") - - @property - def _active_loop(self) -> Optional[Union[FitLoop, EvaluationLoop, PredictionLoop]]: - if self.training: - return self.fit_loop - if self.sanity_checking or self.evaluating: - return self._evaluation_loop - if self.predicting: - return self.predict_loop - - """ - Logging properties - """ - - @property - def logger(self) -> Optional[LightningLoggerBase]: - if len(self.loggers) == 0: - return None - if len(self.loggers) == 1: - return self.loggers[0] - else: - rank_zero_warn( - "Using trainer.logger when Trainer is configured to use multiple loggers." - " This behavior will change in v1.8 when LoggerCollection is removed, and" - " trainer.logger will return the first logger in trainer.loggers" - ) - with warnings.catch_warnings(): - warnings.simplefilter("ignore") - return LoggerCollection(self.loggers) - - @logger.setter - def logger(self, logger: Optional[LightningLoggerBase]) -> None: - if not logger: - self.loggers = [] - elif isinstance(logger, LoggerCollection): - self.loggers = list(logger) - else: - self.loggers = [logger] - - @property - def loggers(self) -> List[LightningLoggerBase]: - return self._loggers - - @loggers.setter - def loggers(self, loggers: Optional[List[LightningLoggerBase]]) -> None: - self._loggers = loggers if loggers else [] - - @property - def callback_metrics(self) -> dict: - return self._logger_connector.callback_metrics - - @property - def logged_metrics(self) -> dict: - return self._logger_connector.logged_metrics - - @property - def progress_bar_metrics(self) -> dict: - return self._logger_connector.progress_bar_metrics - - @property - def _results(self) -> Optional[_ResultCollection]: - active_loop = self._active_loop - if active_loop is not None: - return active_loop._results - - def _exit_gracefully_on_signal(self) -> None: - if not _fault_tolerant_training() or not self._should_terminate_gracefully(): - return - raise ExitGracefullyException(0) - - def _should_terminate_gracefully(self) 
-> bool: - value = torch.tensor(int(self._terminate_gracefully), device=self.strategy.root_device) - return self.strategy.reduce(value, reduce_op="sum") > 0 - - @property - def weights_summary(self) -> Optional[str]: - rank_zero_deprecation("`Trainer.weights_summary` is deprecated in v1.5 and will be removed in v1.7.") - return self._weights_summary - - @weights_summary.setter - def weights_summary(self, val: Optional[str]) -> None: - rank_zero_deprecation("Setting `Trainer.weights_summary` is deprecated in v1.5 and will be removed in v1.7.") - self._weights_summary = val - - """ - Other - """ - - @property - def estimated_stepping_batches(self) -> Union[int, float]: - r""" - Estimated stepping batches for the complete training inferred from DataLoaders, gradient - accumulation factor and distributed setup. - - Examples:: - - def configure_optimizers(self): - optimizer = ... - scheduler = torch.optim.lr_scheduler.OneCycleLR( - optimizer, max_lr=1e-3, total_steps=self.trainer.estimated_stepping_batches - ) - return [optimizer], [scheduler] - - """ - accumulation_scheduler = self.accumulation_scheduler - - if accumulation_scheduler.epochs != [0]: - raise MisconfigurationException( - "Estimated stepping batches cannot be computed with different" - " `accumulate_grad_batches` at different epochs." 
- ) - - # infinite training - if self.max_epochs == -1 and self.max_steps == -1: - return float("inf") - - if self.train_dataloader is None: - rank_zero_info("Loading `train_dataloader` to estimate number of stepping batches.") - self.reset_train_dataloader() - - total_batches = self.num_training_batches - - # iterable dataset - if total_batches == float("inf"): - return self.max_steps - - self.accumulate_grad_batches = accumulation_scheduler.get_accumulate_grad_batches(self.current_epoch) - effective_batch_size = self.accumulate_grad_batches - max_estimated_steps = math.ceil(total_batches / effective_batch_size) * max(self.max_epochs, 1) - - max_estimated_steps = min(max_estimated_steps, self.max_steps) if self.max_steps != -1 else max_estimated_steps - return max_estimated_steps - - @property - def terminate_on_nan(self) -> bool: - rank_zero_deprecation("`Trainer.terminate_on_nan` is deprecated in v1.5 and will be removed in 1.7.") - return self._terminate_on_nan - - @terminate_on_nan.setter - def terminate_on_nan(self, val: bool) -> None: - rank_zero_deprecation( - f"Setting `Trainer.terminate_on_nan = {val}` is deprecated in v1.5 and will be removed in 1.7." - f" Please set `Trainer(detect_anomaly={val})` instead." - ) - self._terminate_on_nan = val # : 212 - - -def _determine_batch_limits(batches: Optional[Union[int, float]], name: str) -> Union[int, float]: - if batches is None: - # batches is optional to know if the user passed a value so that we can show the above info messages only to the - # users that set a value explicitly - return 1.0 - - # differentiating based on the type can be error-prone for users. show a message describing the chosen behaviour - if isinstance(batches, int) and batches == 1: - if name == "limit_train_batches": - message = "1 batch per epoch will be used." - elif name == "val_check_interval": - message = "validation will run after every batch." - else: - message = "1 batch will be used." 
- rank_zero_info(f"`Trainer({name}=1)` was configured so {message}") - elif isinstance(batches, float) and batches == 1.0: - if name == "limit_train_batches": - message = "100% of the batches per epoch will be used." - elif name == "val_check_interval": - message = "validation will run at the end of the training epoch." - else: - message = "100% of the batches will be used." - rank_zero_info(f"`Trainer({name}=1.0)` was configured so {message}.") - - if 0 <= batches <= 1: - return batches - if batches > 1 and batches % 1.0 == 0: - return int(batches) - raise MisconfigurationException( - f"You have passed invalid value {batches} for {name}, it has to be in [0.0, 1.0] or an int." - ) -
- -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- -
-
-
- -
-
-
-
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/_sources/accelerators/accelerator_prepare.rst.txt b/docs/_sources/accelerators/accelerator_prepare.rst.txt deleted file mode 100644 index 38921f4..0000000 --- a/docs/_sources/accelerators/accelerator_prepare.rst.txt +++ /dev/null @@ -1,165 +0,0 @@ -:orphan: - -.. _gpu_prepare: - -######################################## -Hardware agnostic training (preparation) -######################################## - -To train on CPU/GPU/TPU without changing your code, we need to build a few good habits :) - ----- - -***************************** -Delete .cuda() or .to() calls -***************************** - -Delete any calls to .cuda() or .to(device). - -.. testcode:: - - # before lightning - def forward(self, x): - x = x.cuda(0) - layer_1.cuda(0) - x_hat = layer_1(x) - - - # after lightning - def forward(self, x): - x_hat = layer_1(x) - ----- - -********************************************** -Init tensors using type_as and register_buffer -********************************************** -When you need to create a new tensor, use ``type_as``. -This will make your code scale to any arbitrary number of GPUs or TPUs with Lightning. - -.. testcode:: - - # before lightning - def forward(self, x): - z = torch.Tensor(2, 3) - z = z.cuda(0) - - - # with lightning - def forward(self, x): - z = torch.Tensor(2, 3) - z = z.type_as(x) - -The :class:`~pytorch_lightning.core.lightning.LightningModule` knows what device it is on. You can access the reference via ``self.device``. -Sometimes it is necessary to store tensors as module attributes. However, if they are not parameters they will -remain on the CPU even if the module gets moved to a new device. To prevent that and remain device agnostic, -register the tensor as a buffer in your modules' ``__init__`` method with :meth:`~torch.nn.Module.register_buffer`. - -.. testcode:: - - class LitModel(LightningModule): - def __init__(self): - ... 
- self.register_buffer("sigma", torch.eye(3)) - # you can now access self.sigma anywhere in your module - ----- - -*************** -Remove samplers -*************** - -:class:`~torch.utils.data.distributed.DistributedSampler` is automatically handled by Lightning. - -See :ref:`replace-sampler-ddp` for more information. - ----- - -*************************************** -Synchronize validation and test logging -*************************************** - -When running in distributed mode, we have to ensure that the validation and test step logging calls are synchronized across processes. -This is done by adding ``sync_dist=True`` to all ``self.log`` calls in the validation and test step. -This ensures that each GPU worker has the same behaviour when tracking model checkpoints, which is important for later downstream tasks such as testing the best checkpoint across all workers. -The ``sync_dist`` option can also be used in logging calls during the step methods, but be aware that this can lead to significant communication overhead and slow down your training. - -Note if you use any built in metrics or custom metrics that use `TorchMetrics `_, these do not need to be updated and are automatically handled for you. - -.. testcode:: - - def validation_step(self, batch, batch_idx): - x, y = batch - logits = self(x) - loss = self.loss(logits, y) - # Add sync_dist=True to sync logging across all GPU workers (may have performance impact) - self.log("validation_loss", loss, on_step=True, on_epoch=True, sync_dist=True) - - - def test_step(self, batch, batch_idx): - x, y = batch - logits = self(x) - loss = self.loss(logits, y) - # Add sync_dist=True to sync logging across all GPU workers (may have performance impact) - self.log("test_loss", loss, on_step=True, on_epoch=True, sync_dist=True) - -It is possible to perform some computation manually and log the reduced result on rank 0 as follows: - -.. 
testcode:: - - def test_step(self, batch, batch_idx): - x, y = batch - tensors = self(x) - return tensors - - - def test_epoch_end(self, outputs): - mean = torch.mean(self.all_gather(outputs)) - - # When logging only on rank 0, don't forget to add - # ``rank_zero_only=True`` to avoid deadlocks on synchronization. - if self.trainer.is_global_zero: - self.log("my_reduced_metric", mean, rank_zero_only=True) - ----- - -********************** -Make models pickleable -********************** -It's very likely your code is already `pickleable `_, -in that case no change is necessary. -However, if you run a distributed model and get the following error: - -.. code-block:: - - self._launch(process_obj) - File "/net/software/local/python/3.6.5/lib/python3.6/multiprocessing/popen_spawn_posix.py", line 47, - in _launch reduction.dump(process_obj, fp) - File "/net/software/local/python/3.6.5/lib/python3.6/multiprocessing/reduction.py", line 60, in dump - ForkingPickler(file, protocol).dump(obj) - _pickle.PicklingError: Can't pickle <function <lambda> at 0x2b599e088ae8>: - attribute lookup on __main__ failed - -This means something in your model definition, transforms, optimizer, dataloader or callbacks cannot be pickled, and the following code will fail: - -.. code-block:: python - - import pickle - - pickle.dump(some_object) - -This is a limitation of using multiple processes for distributed training within PyTorch. -To fix this issue, find your piece of code that cannot be pickled. The end of the stacktrace -is usually helpful. -ie: in the stacktrace example here, there seems to be a lambda function somewhere in the code -which cannot be pickled. - -..
code-block:: - - self._launch(process_obj) - File "/net/software/local/python/3.6.5/lib/python3.6/multiprocessing/popen_spawn_posix.py", line 47, - in _launch reduction.dump(process_obj, fp) - File "/net/software/local/python/3.6.5/lib/python3.6/multiprocessing/reduction.py", line 60, in dump - ForkingPickler(file, protocol).dump(obj) - _pickle.PicklingError: Can't pickle [THIS IS THE THING TO FIND AND DELETE]: - attribute lookup on __main__ failed diff --git a/docs/_sources/accelerators/gpu.rst.txt b/docs/_sources/accelerators/gpu.rst.txt deleted file mode 100644 index dff7646..0000000 --- a/docs/_sources/accelerators/gpu.rst.txt +++ /dev/null @@ -1,63 +0,0 @@ -.. _gpu: - -Accelerator: GPU training -========================= - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Prepare your code (Optional) - :description: Prepare your code to run on any hardware - :col_css: col-md-4 - :button_link: accelerator_prepare.html - :height: 150 - :tag: basic - -.. displayitem:: - :header: Basic - :description: Learn the basics of single and multi-GPU training. - :col_css: col-md-4 - :button_link: gpu_basic.html - :height: 150 - :tag: basic - -.. displayitem:: - :header: Intermediate - :description: Learn about different distributed strategies, torchelastic and how to optimize communication layers. - :col_css: col-md-4 - :button_link: gpu_intermediate.html - :height: 150 - :tag: intermediate - -.. displayitem:: - :header: Advanced - :description: Train 1 trillion+ parameter models with these techniques. - :col_css: col-md-4 - :button_link: gpu_advanced.html - :height: 150 - :tag: advanced - -.. displayitem:: - :header: Expert - :description: Develop new strategies for training and deploying larger and larger models. - :col_css: col-md-4 - :button_link: gpu_expert.html - :height: 150 - :tag: expert - -.. displayitem:: - :header: FAQ - :description: Frequently asked questions about GPU training. - :col_css: col-md-4 - :button_link: gpu_faq.html - :height: 150 - -.. raw:: html - -
-
diff --git a/docs/_sources/accelerators/gpu_advanced.rst.txt b/docs/_sources/accelerators/gpu_advanced.rst.txt deleted file mode 100644 index eadeb03..0000000 --- a/docs/_sources/accelerators/gpu_advanced.rst.txt +++ /dev/null @@ -1,16 +0,0 @@ -:orphan: - -.. _gpu_advanced: - -GPU training (Advanced) -======================= -**Audience:** Users looking to scale massive models (ie: 1 Trillion parameters). - ----- - -For experts pushing the state-of-the-art in model development, Lightning offers various techniques to enable Trillion+ parameter-scale models. - ----- - -.. - .. include:: ../advanced/model_parallel.rst diff --git a/docs/_sources/accelerators/gpu_basic.rst.txt b/docs/_sources/accelerators/gpu_basic.rst.txt deleted file mode 100644 index 43be718..0000000 --- a/docs/_sources/accelerators/gpu_basic.rst.txt +++ /dev/null @@ -1,97 +0,0 @@ -:orphan: - -.. _gpu_basic: - -GPU training (Basic) -==================== -**Audience:** Users looking to save money and run large models faster using single or multiple GPUs. - ----- - -What is a GPU? --------------- -A Graphics Processing Unit (GPU) is a specialized hardware accelerator designed to speed up mathematical computations used in gaming and deep learning. - ----- - -Train on 1 GPU --------------- - -Make sure you're running on a machine with at least one GPU. There's no need to specify any NVIDIA flags -as Lightning will do it for you. - -.. testcode:: - :skipif: torch.cuda.device_count() < 1 - - trainer = Trainer(accelerator="gpu", devices=1) - ----------------- - - -.. _multi_gpu: - -Train on multiple GPUs ----------------------- - -To use multiple GPUs, set the number of devices in the Trainer or the index of the GPUs. - -.. code:: - - trainer = Trainer(accelerator="gpu", devices=4) - -Choosing GPU devices -^^^^^^^^^^^^^^^^^^^^ - -You can select the GPU devices using ranges, a list of indices or a string containing -a comma separated list of GPU ids: - -.. testsetup:: - - k = 1 - -..
testcode:: - :skipif: torch.cuda.device_count() < 2 - - # DEFAULT (int) specifies how many GPUs to use per node - Trainer(accelerator="gpu", devices=k) - - # Above is equivalent to - Trainer(accelerator="gpu", devices=list(range(k))) - - # Specify which GPUs to use (don't use when running on cluster) - Trainer(accelerator="gpu", devices=[0, 1]) - - # Equivalent using a string - Trainer(accelerator="gpu", devices="0, 1") - - # To use all available GPUs put -1 or '-1' - # equivalent to list(range(torch.cuda.device_count())) - Trainer(accelerator="gpu", devices=-1) - -The table below lists examples of possible input formats and how they are interpreted by Lightning. - -+------------------+-----------+---------------------+---------------------------------+ -| `devices` | Type | Parsed | Meaning | -+==================+===========+=====================+=================================+ -| 3 | int | [0, 1, 2] | first 3 GPUs | -+------------------+-----------+---------------------+---------------------------------+ -| -1 | int | [0, 1, 2, ...] | all available GPUs | -+------------------+-----------+---------------------+---------------------------------+ -| [0] | list | [0] | GPU 0 | -+------------------+-----------+---------------------+---------------------------------+ -| [1, 3] | list | [1, 3] | GPUs 1 and 3 | -+------------------+-----------+---------------------+---------------------------------+ -| "3" | str | [0, 1, 2] | first 3 GPUs | -+------------------+-----------+---------------------+---------------------------------+ -| "1, 3" | str | [1, 3] | GPUs 1 and 3 | -+------------------+-----------+---------------------+---------------------------------+ -| "-1" | str | [0, 1, 2, ...] | all available GPUs | -+------------------+-----------+---------------------+---------------------------------+ - -.. 
note:: - - When specifying number of ``devices`` as an integer ``devices=k``, setting the trainer flag - ``auto_select_gpus=True`` will automatically help you find ``k`` GPUs that are not - occupied by other processes. This is especially useful when GPUs are configured - to be in "exclusive mode", such that only one process at a time can access them. - For more details see the :doc:`trainer guide <../common/trainer>`. diff --git a/docs/_sources/accelerators/gpu_expert.rst.txt b/docs/_sources/accelerators/gpu_expert.rst.txt deleted file mode 100644 index a2178a3..0000000 --- a/docs/_sources/accelerators/gpu_expert.rst.txt +++ /dev/null @@ -1,21 +0,0 @@ -:orphan: - -.. _gpu_expert: - -GPU training (Expert) -===================== -**Audience:** Experts creating new scaling techniques such as Deepspeed or FSDP - ----- - -Lightning enables experts focused on researching new ways of optimizing distributed training/inference strategies to create new strategies and plug them into Lightning. - -For example, Lightning worked closely with the Microsoft team to develop a Deepspeed integration and with the Facebook(Meta) team to develop a FSDP integration. - ----- - -.. include:: ../advanced/strategy_registry.rst - ----- - -.. include:: ../extensions/strategy.rst diff --git a/docs/_sources/accelerators/gpu_faq.rst.txt b/docs/_sources/accelerators/gpu_faq.rst.txt deleted file mode 100644 index c697b2c..0000000 --- a/docs/_sources/accelerators/gpu_faq.rst.txt +++ /dev/null @@ -1,97 +0,0 @@ -:orphan: - -.. _gpu_faq: - -GPU training (FAQ) -================== - -****************************************************************** -How should I adjust the learning rate when using multiple devices? -****************************************************************** - -When using distributed training make sure to modify your learning rate according to your effective -batch size. - -Let's say you have a batch size of 7 in your dataloader. - -.. 
testcode:: - - class LitModel(LightningModule): - def train_dataloader(self): - return Dataset(..., batch_size=7) - -In DDP, DDP_SPAWN, Deepspeed, DDP_SHARDED, or Horovod your effective batch size will be 7 * devices * num_nodes. - -.. code-block:: python - - # effective batch size = 7 * 8 - Trainer(accelerator="gpu", devices=8, strategy="ddp") - Trainer(accelerator="gpu", devices=8, strategy="ddp_spawn") - Trainer(accelerator="gpu", devices=8, strategy="ddp_sharded") - Trainer(accelerator="gpu", devices=8, strategy="horovod") - - # effective batch size = 7 * 8 * 10 - Trainer(accelerator="gpu", devices=8, num_nodes=10, strategy="ddp") - Trainer(accelerator="gpu", devices=8, num_nodes=10, strategy="ddp_spawn") - Trainer(accelerator="gpu", devices=8, num_nodes=10, strategy="ddp_sharded") - Trainer(accelerator="gpu", devices=8, num_nodes=10, strategy="horovod") - -In DDP2 or DP, your effective batch size will be 7 * num_nodes. -The reason is that the full batch is visible to all GPUs on the node when using DDP2. - -.. code-block:: python - - # effective batch size = 7 - Trainer(accelerator="gpu", devices=8, strategy="ddp2") - Trainer(accelerator="gpu", devices=8, strategy="dp") - - # effective batch size = 7 * 10 - Trainer(accelerator="gpu", devices=8, num_nodes=10, strategy="ddp2") - Trainer(accelerator="gpu", devices=8, strategy="dp") - - -.. note:: Huge batch sizes are actually really bad for convergence. Check out: - `Accurate, Large Minibatch SGD: Training ImageNet in 1 Hour `_ - ----- - -********************************************************* -How do I use multiple GPUs on Jupyter or Colab notebooks? -********************************************************* - -To use multiple GPUs on notebooks, use the *DP* mode. - -.. code-block:: python - - Trainer(accelerator="gpu", devices=4, strategy="dp") - -If you want to use other modes, please launch your training via the command-shell. - -..
note:: Learn how to :ref:`access a cloud machine with multiple GPUs ` in this guide. - ----- - -***************************************************** -I'm getting errors related to Pickling. What do I do? -***************************************************** - -Pickle is Python's mechanism for serializing and unserializing data. A majority of distributed modes require that your code is fully pickle compliant. If you run into an issue with pickling, try the following to figure out the issue: - -.. code-block:: python - - import pickle - - model = YourModel() - pickle.dumps(model) - -If you use `ddp`, your code doesn't need to be pickled. - -.. code-block:: python - - Trainer(accelerator="gpu", devices=4, strategy="ddp") - -If you use `ddp_spawn` the pickling requirement remains. This is a limitation of Python. - -.. code-block:: python - - Trainer(accelerator="gpu", devices=4, strategy="ddp_spawn") diff --git a/docs/_sources/accelerators/gpu_intermediate.rst.txt b/docs/_sources/accelerators/gpu_intermediate.rst.txt deleted file mode 100644 index c4d9ad8..0000000 --- a/docs/_sources/accelerators/gpu_intermediate.rst.txt +++ /dev/null @@ -1,533 +0,0 @@ -:orphan: - -.. _gpu_intermediate: - -GPU training (Intermediate) -=========================== -**Audience:** Users looking to train across machines or experiment with different scaling techniques. - ----- - -Distributed Training strategies -------------------------------- -Lightning supports multiple ways of doing distributed training. - -.. raw:: html - - - -| - -- Data Parallel (``strategy='dp'``) (multiple-gpus, 1 machine) -- DistributedDataParallel (``strategy='ddp'``) (multiple-gpus across many machines (python script based)). -- DistributedDataParallel (``strategy='ddp_spawn'``) (multiple-gpus across many machines (spawn based)). -- DistributedDataParallel 2 (``strategy='ddp2'``) (DP in a machine, DDP across machines).
-- Horovod (``strategy='horovod'``) (multi-machine, multi-gpu, configured at runtime) -- Bagua (``strategy='bagua'``) (multiple-gpus across many machines with advanced training algorithms) - -.. note:: - If you request multiple GPUs or nodes without setting a mode, DDP Spawn will be automatically used. - -For a deeper understanding of what Lightning is doing, feel free to read this -`guide `_. - - -Data Parallel -^^^^^^^^^^^^^ -:class:`~torch.nn.DataParallel` (DP) splits a batch across k GPUs. -That is, if you have a batch of 32 and use DP with 2 GPUs, each GPU will process 16 samples, -after which the root node will aggregate the results. - -.. warning:: DP use is discouraged by PyTorch and Lightning. State is not maintained on the replicas created by the - :class:`~torch.nn.DataParallel` wrapper and you may see errors or misbehavior if you assign state to the module - in the ``forward()`` or ``*_step()`` methods. For the same reason we cannot fully support - :doc:`Manual Optimization <../model/manual_optimization>` with DP. Use DDP which is more stable and at least 3x faster. - -.. warning:: DP only supports scattering and gathering primitive collections of tensors like lists, dicts, etc. - Therefore the :meth:`~pytorch_lightning.core.hooks.ModelHooks.transfer_batch_to_device` hook does not apply in - this mode and if you have overridden it, it will not be called. - -.. testcode:: - :skipif: torch.cuda.device_count() < 2 - - # train on 2 GPUs (using DP mode) - trainer = Trainer(accelerator="gpu", devices=2, strategy="dp") - -Distributed Data Parallel -^^^^^^^^^^^^^^^^^^^^^^^^^ -:class:`~torch.nn.parallel.DistributedDataParallel` (DDP) works as follows: - -1. Each GPU across each node gets its own process. - -2. Each GPU gets visibility into a subset of the overall dataset. It will only ever see that subset. - -3. Each process inits the model. - -4. Each process performs a full forward and backward pass in parallel. - -5. 
The gradients are synced and averaged across all processes. - -6. Each process updates its optimizer. - -.. code-block:: python - - # train on 8 GPUs (same machine (ie: node)) - trainer = Trainer(accelerator="gpu", devices=8, strategy="ddp") - - # train on 32 GPUs (4 nodes) - trainer = Trainer(accelerator="gpu", devices=8, strategy="ddp", num_nodes=4) - -This Lightning implementation of DDP calls your script under the hood multiple times with the correct environment -variables: - -.. code-block:: bash - - # example for 3 GPUs DDP - MASTER_ADDR=localhost MASTER_PORT=random() WORLD_SIZE=3 NODE_RANK=0 LOCAL_RANK=0 python my_file.py --accelerator 'gpu' --devices 3 --etc - MASTER_ADDR=localhost MASTER_PORT=random() WORLD_SIZE=3 NODE_RANK=1 LOCAL_RANK=0 python my_file.py --accelerator 'gpu' --devices 3 --etc - MASTER_ADDR=localhost MASTER_PORT=random() WORLD_SIZE=3 NODE_RANK=2 LOCAL_RANK=0 python my_file.py --accelerator 'gpu' --devices 3 --etc - -We use DDP this way because `ddp_spawn` has a few limitations (due to Python and PyTorch): - -1. Since `.spawn()` trains the model in subprocesses, the model on the main process does not get updated. -2. Dataloader(num_workers=N), where N is large, bottlenecks training with DDP... ie: it will be VERY slow or won't work at all. This is a PyTorch limitation. -3. Forces everything to be picklable. - -There are cases in which it is NOT possible to use DDP. Examples are: - -- Jupyter Notebook, Google COLAB, Kaggle, etc. -- You have a nested script without a root package - -In these situations you should use `dp` or `ddp_spawn` instead. - -Distributed Data Parallel 2 -^^^^^^^^^^^^^^^^^^^^^^^^^^^ -In certain cases, it's advantageous to use all batches on the same machine instead of a subset. -For instance, you might want to compute a NCE loss where it pays to have more negative samples. - -In this case, we can use DDP2 which behaves like DP in a machine and DDP across nodes. DDP2 does the following: - -1. 
Copies a subset of the data to each node. - -2. Inits a model on each node. - -3. Runs a forward and backward pass using DP. - -4. Syncs gradients across nodes. - -5. Applies the optimizer updates. - -.. code-block:: python - - # train on 32 GPUs (4 nodes) - trainer = Trainer(accelerator="gpu", devices=8, strategy="ddp2", num_nodes=4) - -Distributed Data Parallel Spawn -^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ -`ddp_spawn` is exactly like `ddp` except that it uses .spawn to start the training processes. - -.. warning:: It is STRONGLY recommended to use `DDP` for speed and performance. - -.. code-block:: python - - mp.spawn(self.ddp_train, nprocs=self.num_processes, args=(model,)) - -If your script does not support being called from the command line (ie: it is nested without a root -project module) you can use the following method: - -.. code-block:: python - - # train on 8 GPUs (same machine (ie: node)) - trainer = Trainer(accelerator="gpu", devices=8, strategy="ddp_spawn") - -We STRONGLY discourage this use because it has limitations (due to Python and PyTorch): - -1. The model you pass in will not update. Please save a checkpoint and restore from there. -2. Set Dataloader(num_workers=0) or it will bottleneck training. - -`ddp` is MUCH faster than `ddp_spawn`. We recommend you - -1. Install a top-level module for your project using setup.py - -.. code-block:: python - - # setup.py - #!/usr/bin/env python - - from setuptools import setup, find_packages - - setup( - name="src", - version="0.0.1", - description="Describe Your Cool Project", - author="", - author_email="", - url="https://github.com/YourSeed", # REPLACE WITH YOUR OWN GITHUB PROJECT LINK - install_requires=["pytorch-lightning"], - packages=find_packages(), - ) - -2. Setup your project like so: - -.. code-block:: bash - - /project - /src - some_file.py - /or_a_folder - setup.py - -3. Install as a root-level package - -.. code-block:: bash - - cd /project - pip install -e . 
- -You can then call your scripts anywhere - -.. code-block:: bash - - cd /project/src - python some_file.py --accelerator 'gpu' --devices 8 --strategy 'ddp' - - -Horovod -^^^^^^^ -`Horovod `_ allows the same training script to be used for single-GPU, -multi-GPU, and multi-node training. - -Like Distributed Data Parallel, every process in Horovod operates on a single GPU with a fixed -subset of the data. Gradients are averaged across all GPUs in parallel during the backward pass, -then synchronously applied before beginning the next step. - -The number of worker processes is configured by a driver application (`horovodrun` or `mpirun`). In -the training script, Horovod will detect the number of workers from the environment, and automatically -scale the learning rate to compensate for the increased total batch size. - -Horovod can be configured in the training script to run with any number of GPUs / processes as follows: - -.. code-block:: python - - # train Horovod on GPU (number of GPUs / machines provided on command-line) - trainer = Trainer(strategy="horovod", accelerator="gpu", devices=1) - - # train Horovod on CPU (number of processes / machines provided on command-line) - trainer = Trainer(strategy="horovod") - -When starting the training job, the driver application will then be used to specify the total -number of worker processes: - -.. code-block:: bash - - # run training with 4 GPUs on a single machine - horovodrun -np 4 python train.py - - # run training with 8 GPUs on two machines (4 GPUs each) - horovodrun -np 8 -H hostname1:4,hostname2:4 python train.py - -See the official `Horovod documentation `_ for details -on installation and performance tuning. - - -Bagua -^^^^^ -`Bagua `_ is a deep learning training acceleration framework which supports -multiple advanced distributed training algorithms including: - -- `Gradient AllReduce `_ for centralized synchronous communication, where gradients are averaged among all workers. 
-- `Decentralized SGD `_ for decentralized synchronous communication, where each worker exchanges data with one or a few specific workers. -- `ByteGrad `_ and `QAdam `_ for low precision communication, where data is compressed into low precision before communication. -- `Asynchronous Model Average `_ for asynchronous communication, where workers are not required to be synchronized in the same iteration in a lock-step style. - -By default, Bagua uses *Gradient AllReduce* algorithm, which is also the algorithm implemented in Distributed Data Parallel and Horovod, -but Bagua can usually produce a higher training throughput due to its backend written in Rust. - -.. code-block:: python - - # train on 4 GPUs (using Bagua mode) - trainer = Trainer(strategy="bagua", accelerator="gpu", devices=4) - - -By specifying the ``algorithm`` in the ``BaguaStrategy``, you can select more advanced training algorithms featured by Bagua: - - -.. code-block:: python - - # train on 4 GPUs, using Bagua Gradient AllReduce algorithm - trainer = Trainer( - strategy=BaguaStrategy(algorithm="gradient_allreduce"), - accelerator="gpu", - devices=4, - ) - - # train on 4 GPUs, using Bagua ByteGrad algorithm - trainer = Trainer( - strategy=BaguaStrategy(algorithm="bytegrad"), - accelerator="gpu", - devices=4, - ) - - # train on 4 GPUs, using Bagua Decentralized SGD - trainer = Trainer( - strategy=BaguaStrategy(algorithm="decentralized"), - accelerator="gpu", - devices=4, - ) - - # train on 4 GPUs, using Bagua Low Precision Decentralized SGD - trainer = Trainer( - strategy=BaguaStrategy(algorithm="low_precision_decentralized"), - accelerator="gpu", - devices=4, - ) - - # train on 4 GPUs, using Asynchronous Model Average algorithm, with a synchronization interval of 100ms - trainer = Trainer( - strategy=BaguaStrategy(algorithm="async", sync_interval_ms=100), - accelerator="gpu", - devices=4, - ) - -To use *QAdam*, we need to initialize -`QAdamOptimizer `_ first: - -.. 
code-block:: python - - from pytorch_lightning.strategies import BaguaStrategy - from bagua.torch_api.algorithms.q_adam import QAdamOptimizer - - - class MyModel(pl.LightningModule): - ... - - def configure_optimizers(self): - # initialize QAdam Optimizer - return QAdamOptimizer(self.parameters(), lr=0.05, warmup_steps=100) - - - model = MyModel() - trainer = Trainer( - accelerator="gpu", - devices=4, - strategy=BaguaStrategy(algorithm="qadam"), - ) - trainer.fit(model) - -Bagua relies on its own `launcher `_ to schedule jobs. -Below, find examples using ``bagua.distributed.launch`` which follows ``torch.distributed.launch`` API: - -.. code-block:: bash - - # start training with 8 GPUs on a single node - python -m bagua.distributed.launch --nproc_per_node=8 train.py - -If the ssh service is available with passwordless login on each node, you can launch the distributed job on a -single node with ``baguarun`` which has a similar syntax as ``mpirun``. When starting the job, ``baguarun`` will -automatically spawn new processes on each of your training nodes provided by the ``--host_list`` option, and each node in it -is described as an IP address followed by an SSH port. - -.. code-block:: bash - - # Run on node1 (or node2) to start training on two nodes (node1 and node2), 8 GPUs per node - baguarun --host_list hostname1:ssh_port1,hostname2:ssh_port2 --nproc_per_node=8 --master_port=port1 train.py - - -.. note:: You can also start training in the same way as Distributed Data Parallel. However, system optimizations like - `Bagua-Net `_ and - `Performance autotuning `_ can only be enabled through bagua - launcher. It is worth noting that with ``Bagua-Net``, Distributed Data Parallel can also achieve - better performance without modifying the training script. - - -See `Bagua Tutorials `_ for more details on installation and advanced features. - - -DP/DDP2 caveats -^^^^^^^^^^^^^^^ -In DP and DDP2 each GPU within a machine sees a portion of a batch. 
-DP and ddp2 roughly do the following: - -.. testcode:: - - def distributed_forward(batch, model): - batch = torch.Tensor(32, 8) - gpu_0_batch = batch[:8] - gpu_1_batch = batch[8:16] - gpu_2_batch = batch[16:24] - gpu_3_batch = batch[24:] - - y_0 = model_copy_gpu_0(gpu_0_batch) - y_1 = model_copy_gpu_1(gpu_1_batch) - y_2 = model_copy_gpu_2(gpu_2_batch) - y_3 = model_copy_gpu_3(gpu_3_batch) - - return [y_0, y_1, y_2, y_3] - -So, when Lightning calls any of the `training_step`, `validation_step`, `test_step` -you will only be operating on one of those pieces. - -.. testcode:: - - # the batch here is a portion of the FULL batch - def training_step(self, batch, batch_idx): - y_0 = batch - -For most metrics, this doesn't really matter. However, if you want -to add something to your computational graph (like softmax) -using all batch parts you can use the `training_step_end` step. - -.. testcode:: - - def training_step_end(self, outputs): - # only use when on dp - outputs = torch.cat(outputs, dim=1) - softmax = softmax(outputs, dim=1) - out = softmax.mean() - return out - -In pseudocode, the full sequence is: - -.. code-block:: python - - # get data - batch = next(dataloader) - - # copy model and data to each gpu - batch_splits = split_batch(batch, num_gpus) - models = copy_model_to_gpus(model) - - # in parallel, operate on each batch chunk - all_results = [] - for gpu_num in gpus: - batch_split = batch_splits[gpu_num] - gpu_model = models[gpu_num] - out = gpu_model(batch_split) - all_results.append(out) - - # use the full batch for something like softmax - full_out = model.training_step_end(all_results) - -To illustrate why this is needed, let's look at DataParallel - -.. 
testcode:: - - def training_step(self, batch, batch_idx): - x, y = batch - y_hat = self(batch) - - # on dp or ddp2 if we did softmax now it would be wrong - # because batch is actually a piece of the full batch - return y_hat - - - def training_step_end(self, step_output): - # step_output has outputs of each part of the batch - - # do softmax here - outputs = torch.cat(outputs, dim=1) - softmax = softmax(outputs, dim=1) - out = softmax.mean() - - return out - -If `training_step_end` is defined it will be called regardless of TPU, DP, DDP, etc... which means -it will behave the same regardless of the backend. - -Validation and test step have the same option when using DP. - -.. testcode:: - - def validation_step_end(self, step_output): - ... - - - def test_step_end(self, step_output): - ... - - -Distributed and 16-bit precision -^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ - -Due to an issue with Apex and DataParallel (PyTorch and NVIDIA issue), Lightning does -not allow 16-bit and DP training. We tried to get this to work, but it's an issue on their end. - -Below are the possible configurations we support. 
- -+-------+---------+-----+-----+--------+-----------------------------------------------------------------------+ -| 1 GPU | 1+ GPUs | DP | DDP | 16-bit | command | -+=======+=========+=====+=====+========+=======================================================================+ -| Y | | | | | `Trainer(accelerator="gpu", devices=1)` | -+-------+---------+-----+-----+--------+-----------------------------------------------------------------------+ -| Y | | | | Y | `Trainer(accelerator="gpu", devices=1, precision=16)` | -+-------+---------+-----+-----+--------+-----------------------------------------------------------------------+ -| | Y | Y | | | `Trainer(accelerator="gpu", devices=k, strategy='dp')` | -+-------+---------+-----+-----+--------+-----------------------------------------------------------------------+ -| | Y | | Y | | `Trainer(accelerator="gpu", devices=k, strategy='ddp')` | -+-------+---------+-----+-----+--------+-----------------------------------------------------------------------+ -| | Y | | Y | Y | `Trainer(accelerator="gpu", devices=k, strategy='ddp', precision=16)` | -+-------+---------+-----+-----+--------+-----------------------------------------------------------------------+ - - -Implement Your Own Distributed (DDP) training -^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ -If you need your own way to init PyTorch DDP you can override :meth:`pytorch_lightning.strategies.ddp.DDPStrategy.init_dist_connection`. - -If you also need to use your own DDP implementation, override :meth:`pytorch_lightning.strategies.ddp.DDPStrategy.configure_ddp`. - ----------- - -Torch Distributed Elastic -------------------------- -Lightning supports the use of Torch Distributed Elastic to enable fault-tolerant and elastic distributed job scheduling. To use it, specify the 'ddp' or 'ddp2' backend and the number of GPUs you want to use in the trainer. - -.. 
code-block:: python - - Trainer(accelerator="gpu", devices=8, strategy="ddp") - -To launch a fault-tolerant job, run the following on all nodes. - -.. code-block:: bash - - python -m torch.distributed.run - --nnodes=NUM_NODES - --nproc_per_node=TRAINERS_PER_NODE - --rdzv_id=JOB_ID - --rdzv_backend=c10d - --rdzv_endpoint=HOST_NODE_ADDR - YOUR_LIGHTNING_TRAINING_SCRIPT.py (--arg1 ... train script args...) - -To launch an elastic job, run the following on at least ``MIN_SIZE`` nodes and at most ``MAX_SIZE`` nodes. - -.. code-block:: bash - - python -m torch.distributed.run - --nnodes=MIN_SIZE:MAX_SIZE - --nproc_per_node=TRAINERS_PER_NODE - --rdzv_id=JOB_ID - --rdzv_backend=c10d - --rdzv_endpoint=HOST_NODE_ADDR - YOUR_LIGHTNING_TRAINING_SCRIPT.py (--arg1 ... train script args...) - -See the official `Torch Distributed Elastic documentation `_ for details -on installation and more use cases. - -Optimize multi-machine communication ------------------------------------- - -By default, Lightning will select the ``nccl`` backend over ``gloo`` when running on GPUs. -Find more information about PyTorch's supported backends `here `__. - -Lightning allows explicitly specifying the backend via the `process_group_backend` constructor argument on the relevant Strategy classes. By default, Lightning will select the appropriate process group backend based on the hardware used. - -.. code-block:: python - - from pytorch_lightning.strategies import DDPStrategy - - # Explicitly specify the process group backend if you choose to - ddp = DDPStrategy(process_group_backend="nccl") - - # Configure the strategy on the Trainer - trainer = Trainer(strategy=ddp, accelerator="gpu", devices=8) diff --git a/docs/_sources/accelerators/hpu.rst.txt b/docs/_sources/accelerators/hpu.rst.txt deleted file mode 100644 index 13eeab8..0000000 --- a/docs/_sources/accelerators/hpu.rst.txt +++ /dev/null @@ -1,40 +0,0 @@ -.. _hpu: - -Accelerator: HPU training -========================= - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Prepare your code (Optional) - :description: Prepare your code to run on any hardware - :col_css: col-md-4 - :button_link: accelerator_prepare.html - :height: 150 - :tag: basic - -.. displayitem:: - :header: Basic - :description: Learn the basics of single and multi-HPU core training. - :col_css: col-md-4 - :button_link: hpu_basic.html - :height: 150 - :tag: basic - -.. displayitem:: - :header: Intermediate - :description: Enable state-of-the-art scaling with advanced mix-precision settings. - :col_css: col-md-4 - :button_link: hpu_intermediate.html - :height: 150 - :tag: intermediate - -.. raw:: html - -
-
diff --git a/docs/_sources/accelerators/hpu_basic.rst.txt b/docs/_sources/accelerators/hpu_basic.rst.txt deleted file mode 100644 index e07e153..0000000 --- a/docs/_sources/accelerators/hpu_basic.rst.txt +++ /dev/null @@ -1,83 +0,0 @@ -:orphan: - -.. _hpu_basics: - -Accelerator: HPU training -========================= -**Audience:** Users looking to save money and run large models faster using single or multiple Gaudi devices. - ----- - -What is an HPU? ---------------- - -`Habana® Gaudi® AI Processor (HPU) `__ training processors are built on a heterogeneous architecture with a cluster of fully programmable Tensor Processing Cores (TPC) along with its associated development tools and libraries, and a configurable Matrix Math engine. - -The TPC core is a VLIW SIMD processor with an instruction set and hardware tailored to serve training workloads efficiently. -The Gaudi memory architecture includes on-die SRAM and local memories in each TPC, and -Gaudi is the first DL training processor that has integrated RDMA over Converged Ethernet (RoCE v2) engines on-chip. - -On the software side, the PyTorch Habana bridge interfaces between the framework and the SynapseAI software stack to enable the execution of deep learning models on the Habana Gaudi device. - -Gaudi offers a substantial price/performance advantage -- so you get to do more deep learning training while spending less. - -For more information, check out `Gaudi Architecture `__ and `Gaudi Developer Docs `__. - ----- - -Run on 1 Gaudi --------------- - -To enable PyTorch Lightning to utilize the HPU accelerator, simply provide the ``accelerator="hpu"`` parameter to the Trainer class. - -.. code-block:: python - - trainer = Trainer(accelerator="hpu", devices=1) - ----- - -Run on multiple Gaudis ----------------------- -The ``devices=8`` and ``accelerator="hpu"`` parameters to the Trainer class enable the Habana accelerator for distributed training with 8 Gaudis. 
-It uses :class:`~pytorch_lightning.strategies.hpu_parallel.HPUParallelStrategy` internally which is based on DDP strategy with the addition of Habana's collective communication library (HCCL) to support scale-up within a node and scale-out across multiple nodes. - -.. code-block:: python - - trainer = Trainer(devices=8, accelerator="hpu") - ----- - -Select Gaudis automatically ---------------------------- - -Lightning can automatically detect the number of Gaudi devices to run on. This setting is enabled by default if the devices argument is missing. - -.. code-block:: python - - # equivalent - trainer = Trainer(accelerator="hpu") - trainer = Trainer(accelerator="hpu", devices="auto") - ----- - -How to access HPUs ------------------- - -To use HPUs, you must have access to a system with HPU devices. - -AWS -^^^ -You can either use `Gaudi-based AWS EC2 DL1 instances `__ or `Supermicro X12 Gaudi server `__ to get access to HPUs. - -Check out the `Get Started Guide with AWS and Habana `__. - ----- - -.. _known-limitations_hpu: - -Known limitations ------------------ - -* Multiple optimizers are not supported. -* `Habana dataloader `__ is not supported. -* :class:`~pytorch_lightning.callbacks.device_stats_monitor.DeviceStatsMonitor` is not supported. diff --git a/docs/_sources/accelerators/hpu_intermediate.rst.txt b/docs/_sources/accelerators/hpu_intermediate.rst.txt deleted file mode 100644 index 65dca85..0000000 --- a/docs/_sources/accelerators/hpu_intermediate.rst.txt +++ /dev/null @@ -1,68 +0,0 @@ -:orphan: - -.. _hpu_intermediate: - -Accelerator: HPU training -========================= -**Audience:** Gaudi chip users looking to save memory and scale models with mixed-precision training. - ----- - -Enable Mixed Precision ----------------------- - -Lightning also allows mixed precision training with HPUs. -By default, HPU training will use 32-bit precision. To enable mixed precision, set the ``precision`` flag. - -.. 
code-block:: python - - trainer = Trainer(devices=1, accelerator="hpu", precision=16) - ----- - -Customize Mixed Precision -------------------------- - -Internally, :class:`~pytorch_lightning.plugins.precision.hpu.HPUPrecisionPlugin` uses the Habana Mixed Precision (HMP) package to enable mixed precision training. - -You can execute the ops in FP32 or BF16 precision. The HMP package modifies the Python operators to add the appropriate cast operations for the arguments before execution. -The default settings let users enable mixed precision training easily with minimal code. - -In addition to the default settings in HMP, users also have the option of overriding these defaults and providing their -BF16 and FP32 operator lists by passing them as parameters to :class:`~pytorch_lightning.plugins.precision.hpu.HPUPrecisionPlugin`. - -The below snippet shows an example model using MNIST with a single Habana Gaudi device and making use of HMP by overriding the default parameters. -This enables advanced users to provide their own BF16 and FP32 operator lists instead of using the HMP defaults. - -.. code-block:: python - - import pytorch_lightning as pl - from pytorch_lightning.plugins import HPUPrecisionPlugin - - # Initialize a trainer with HPU accelerator for HPU strategy for single device, - # with mixed precision using overridden HMP settings - trainer = pl.Trainer( - accelerator="hpu", - devices=1, - # Optional Habana mixed precision params to be set - # Checkout `pl_examples/hpu_examples/simple_mnist/ops_bf16_mnist.txt` for the format - plugins=[ - HPUPrecisionPlugin( - precision=16, - opt_level="O1", - verbose=False, - bf16_file_path="ops_bf16_mnist.txt", - fp32_file_path="ops_fp32_mnist.txt", - ) - ], - ) - - # Init our model - model = LitClassifier() - # Init the data - dm = MNISTDataModule(batch_size=batch_size) - - # Train the model ⚡ - trainer.fit(model, datamodule=dm) - -For more details, please refer to `PyTorch Mixed Precision Training on Gaudi `__. 
diff --git a/docs/_sources/accelerators/ipu.rst.txt b/docs/_sources/accelerators/ipu.rst.txt deleted file mode 100644 index 138814f..0000000 --- a/docs/_sources/accelerators/ipu.rst.txt +++ /dev/null @@ -1,48 +0,0 @@ -.. _ipu: - -Accelerator: IPU training -========================= - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Prepare your code (Optional) - :description: Prepare your code to run on any hardware - :col_css: col-md-6 - :button_link: accelerator_prepare.html - :height: 150 - :tag: basic - -.. displayitem:: - :header: Basic - :description: Learn the basics of single and multi-IPU training. - :col_css: col-md-6 - :button_link: ipu_basic.html - :height: 150 - :tag: basic - -.. displayitem:: - :header: Intermediate - :description: Tune model performance with mix-precision settings and the performance analyser. - :col_css: col-md-6 - :button_link: ipu_intermediate.html - :height: 150 - :tag: intermediate - -.. displayitem:: - :header: Advanced - :description: Learn advanced techniques to customize IPU training for massive models. - :col_css: col-md-6 - :button_link: ipu_advanced.html - :height: 150 - :tag: advanced - -.. raw:: html - -
-
diff --git a/docs/_sources/accelerators/ipu_advanced.rst.txt b/docs/_sources/accelerators/ipu_advanced.rst.txt deleted file mode 100644 index 1dc4e71..0000000 --- a/docs/_sources/accelerators/ipu_advanced.rst.txt +++ /dev/null @@ -1,143 +0,0 @@ -:orphan: - -.. _ipu_advanced: - -Accelerator: IPU training -========================= -**Audience:** Users looking to customize IPU training for massive models. - ----- - -Advanced IPU options --------------------- - -IPUs provide further optimizations to speed up training. By using the ``IPUStrategy`` we can set the ``device_iterations``, which controls the number of iterations run directly on the IPU devices before returning to the host. Increasing the number of on-device iterations will improve throughput, as there is less device to host communication required. - -.. note:: - - When using model parallelism, it is a hard requirement to increase the number of device iterations to ensure we fully saturate the devices via micro-batching. see :ref:`ipu-model-parallelism` for more information. - -.. code-block:: python - - import pytorch_lightning as pl - from pytorch_lightning.strategies import IPUStrategy - - model = MyLightningModule() - trainer = pl.Trainer(accelerator="ipu", devices=8, strategy=IPUStrategy(device_iterations=32)) - trainer.fit(model) - -Note that by default we return the last device iteration loss. You can override this by passing in your own ``poptorch.Options`` and setting the AnchorMode as described in the `PopTorch documentation `__. - -.. 
code-block:: python - - import poptorch - import pytorch_lightning as pl - from pytorch_lightning.strategies import IPUStrategy - - model = MyLightningModule() - inference_opts = poptorch.Options() - inference_opts.deviceIterations(32) - - training_opts = poptorch.Options() - training_opts.anchorMode(poptorch.AnchorMode.All) - training_opts.deviceIterations(32) - - trainer = Trainer( - accelerator="ipu", devices=8, strategy=IPUStrategy(inference_opts=inference_opts, training_opts=training_opts) - ) - trainer.fit(model) - -You can also override all options by passing the ``poptorch.Options`` to the plugin. See `PopTorch options documentation `__ for more information. - ----- - -.. _ipu-model-parallelism: - -Model parallelism ------------------ - -Due to the IPU architecture, larger models should be parallelized across IPUs by design. Currently PopTorch provides the capabilities via annotations as described in `parallel execution strategies `__. - -Below is an example using the block annotation in a LightningModule. - -.. note:: - - Currently, when using model parallelism we do not infer the number of IPUs required for you. This is done via the annotations themselves. If you specify 4 different IDs when defining Blocks, this means your model will be split onto 4 different IPUs. - - This is also mutually exclusive with the Trainer flag. In other words, if your model is split onto 2 IPUs and you set ``Trainer(accelerator="ipu", devices=4)`` this will require 8 IPUs in total: data parallelism will be used to replicate the two-IPU model 4 times. - - When pipelining the model you must also increase the `device_iterations` to ensure full data saturation of the devices data, i.e whilst one device in the model pipeline processes a batch of data, the other device can start on the next batch. For example if the model is split onto 4 IPUs, we require `device_iterations` to be at-least 4. - - -.. 
code-block:: python - - import pytorch_lightning as pl - import poptorch - - - class MyLightningModule(pl.LightningModule): - def __init__(self): - super().__init__() - # This will place layer1, layer2+layer3, layer4, softmax on different IPUs at runtime. - # BeginBlock will start a new id for all layers within this block - self.layer1 = poptorch.BeginBlock(torch.nn.Linear(5, 10), ipu_id=0) - - # This layer starts a new block, - # adding subsequent layers to this current block at runtime - # till the next block has been declared - self.layer2 = poptorch.BeginBlock(torch.nn.Linear(10, 5), ipu_id=1) - self.layer3 = torch.nn.Linear(5, 5) - - # Create new blocks - self.layer4 = poptorch.BeginBlock(torch.nn.Linear(5, 5), ipu_id=2) - self.softmax = poptorch.BeginBlock(torch.nn.Softmax(dim=1), ipu_id=3) - - ... - - - model = MyLightningModule() - trainer = pl.Trainer(accelerator="ipu", devices=8, strategy=IPUStrategy(device_iterations=20)) - trainer.fit(model) - - -You can also use the block context manager within the forward function, or any of the step functions. - -.. code-block:: python - - import pytorch_lightning as pl - import poptorch - - - class MyLightningModule(pl.LightningModule): - def __init__(self): - super().__init__() - self.layer1 = torch.nn.Linear(5, 10) - self.layer2 = torch.nn.Linear(10, 5) - self.layer3 = torch.nn.Linear(5, 5) - self.layer4 = torch.nn.Linear(5, 5) - - self.act = torch.nn.ReLU() - self.softmax = torch.nn.Softmax(dim=1) - - def forward(self, x): - - with poptorch.Block(ipu_id=0): - x = self.act(self.layer1(x)) - - with poptorch.Block(ipu_id=1): - x = self.act(self.layer2(x)) - - with poptorch.Block(ipu_id=2): - x = self.act(self.layer3(x)) - x = self.act(self.layer4(x)) - - with poptorch.Block(ipu_id=3): - x = self.softmax(x) - return x - - ... 
- - - model = MyLightningModule() - trainer = pl.Trainer(accelerator="ipu", devices=8, strategy=IPUStrategy(device_iterations=20)) - trainer.fit(model) diff --git a/docs/_sources/accelerators/ipu_basic.rst.txt b/docs/_sources/accelerators/ipu_basic.rst.txt deleted file mode 100644 index 492c7bf..0000000 --- a/docs/_sources/accelerators/ipu_basic.rst.txt +++ /dev/null @@ -1,68 +0,0 @@ -:orphan: - -.. _ipu_basic: - -Accelerator: IPU training -========================= -**Audience:** Users looking to save money and run large models faster using single or multiple IPU devices. - ----- - -What is an IPU? ---------------- - -The Graphcore `Intelligence Processing Unit (IPU) `__, built for Artificial Intelligence and Machine Learning, consists of many individual cores, called *tiles*, allowing highly parallel computation. Due to the high bandwidth between tiles, IPUs facilitate machine learning loads where parallelization is essential. - -Because computation is heavily parallelized, IPUs operate in a different way to conventional accelerators such as CPU/GPUs. IPUs do not require large batch sizes for maximum parallelization, can provide optimizations across the compiled graph and rely on model parallelism to fully utilize tiles for larger models. - -IPUs are used to build IPU-PODs, rack-based systems of IPU-Machines for larger workloads. See the `IPU Architecture `__ for more information. - -See the `Graphcore Glossary `__ for the definitions of other IPU-specific terminology. - -.. note:: - IPU support is experimental and a work in progress (see :ref:`known-limitations`). If you run into any problems, please leave an issue. - ----- - -Run on 1 IPU ------------- -To use a single IPU, set the accelerator and devices arguments. - -.. code-block:: python - - trainer = pl.Trainer(accelerator="ipu", devices=1) - ----- - -Run on multiple IPUs --------------------- -To use multiple IPUs, set the devices to a number that is a power of 2 (e.g., 2, 4, 8, 16, ...) - -.. 
code-block:: python - - trainer = pl.Trainer(accelerator="ipu", devices=8) - ----- - -How to access IPUs ------------------- - -To use IPUs you must have access to a system with IPU devices. To get access see `get started `__. - -You must ensure that the IPU system has enabled the PopART and Poplar packages from the SDK. Instructions are in the Get Started guide for your IPU system, on the Graphcore `documents portal `__. - ----- - -.. _known-limitations: - -Known limitations ------------------ - -Currently there are some known limitations that are being addressed in the near future to make the experience seamless when moving from different devices. - -Please see the `MNIST example `__ which displays most of the limitations and how to overcome them till they are resolved. - -* ``self.log`` is not supported in the ``training_step``, ``validation_step``, ``test_step`` or ``predict_step``. This is due to the step function being traced and sent to the IPU devices. We're actively working on fixing this -* Multiple optimizers are not supported. ``training_step`` only supports returning one loss from the ``training_step`` function as a result -* Since the step functions are traced, branching logic or any form of primitive values are traced into constants. Be mindful as this could lead to errors in your custom code -* Clipping gradients is not supported diff --git a/docs/_sources/accelerators/ipu_intermediate.rst.txt b/docs/_sources/accelerators/ipu_intermediate.rst.txt deleted file mode 100644 index 68c866e..0000000 --- a/docs/_sources/accelerators/ipu_intermediate.rst.txt +++ /dev/null @@ -1,63 +0,0 @@ -:orphan: - -.. _ipu_intermediate: - -Accelerator: IPU training -========================= -**Audience:** IPU users looking to increase performance via mixed precision and analysis tools. - ----- - -Mixed precision & 16 bit precision ----------------------------------- - -Lightning also supports training in mixed precision with IPUs. 
-By default, IPU training will use 32-bit precision. To enable mixed precision, -set the precision flag. - -.. note:: - Currently there is no dynamic scaling of the loss with mixed precision training. - -.. code-block:: python - - import pytorch_lightning as pl - - model = MyLightningModule() - trainer = pl.Trainer(accelerator="ipu", devices=8, precision=16) - trainer.fit(model) - -You can also use pure 16-bit training, where the weights are also in 16-bit precision. - -.. code-block:: python - - import pytorch_lightning as pl - from pytorch_lightning.strategies import IPUStrategy - - model = MyLightningModule() - model = model.half() - trainer = pl.Trainer(accelerator="ipu", devices=8, precision=16) - trainer.fit(model) - ----- - -PopVision Graph Analyser ------------------------- - -.. figure:: ../_static/images/accelerator/ipus/profiler.png - :alt: PopVision Graph Analyser - :width: 500 - -Lightning supports integration with the `PopVision Graph Analyser Tool `__. This helps to look at utilization of IPU devices and provides helpful metrics during the lifecycle of your trainer. Once you have gained access, the PopVision Graph Analyser Tool can be downloaded via the `Graphcore download website `__. - -Lightning supports dumping all reports to a directory to open using the tool. - -.. code-block:: python - - import pytorch_lightning as pl - from pytorch_lightning.strategies import IPUStrategy - - model = MyLightningModule() - trainer = pl.Trainer(accelerator="ipu", devices=8, strategy=IPUStrategy(autoreport_dir="report_dir/")) - trainer.fit(model) - -This will dump all reports to ``report_dir/`` which can then be opened using the Graph Analyser Tool; see `Opening Reports `__. diff --git a/docs/_sources/accelerators/tpu.rst.txt b/docs/_sources/accelerators/tpu.rst.txt deleted file mode 100644 index 6809277..0000000 --- a/docs/_sources/accelerators/tpu.rst.txt +++ /dev/null @@ -1,55 +0,0 @@ -.. _tpu: - -Accelerator: TPU training -========================= - -.. 
raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Prepare your code (Optional) - :description: Prepare your code to run on any hardware - :col_css: col-md-4 - :button_link: accelerator_prepare.html - :height: 150 - :tag: basic - -.. displayitem:: - :header: Basic - :description: Learn the basics of single and multi-TPU core training. - :col_css: col-md-4 - :button_link: tpu_basic.html - :height: 150 - :tag: basic - -.. displayitem:: - :header: Intermediate - :description: Scale massive models using cloud TPUs. - :col_css: col-md-4 - :button_link: tpu_intermediate.html - :height: 150 - :tag: intermediate - -.. displayitem:: - :header: Advanced - :description: Dive into XLA and advanced techniques to optimize TPU-powered models. - :col_css: col-md-4 - :button_link: tpu_advanced.html - :height: 150 - :tag: advanced - -.. displayitem:: - :header: FAQ - :description: Frequently asked questions about TPU training. - :col_css: col-md-4 - :button_link: tpu_faq.html - :height: 150 - -.. raw:: html - -
-
diff --git a/docs/_sources/accelerators/tpu_advanced.rst.txt b/docs/_sources/accelerators/tpu_advanced.rst.txt deleted file mode 100644 index 0aa490e..0000000 --- a/docs/_sources/accelerators/tpu_advanced.rst.txt +++ /dev/null @@ -1,68 +0,0 @@ -:orphan: - -TPU training (Advanced) -======================= -**Audience:** Users looking to apply advanced performance techniques to TPU training. - ----- - -Weight Sharing/Tying --------------------- -Weight Tying/Sharing is a technique wherein the module weights are shared among two or more layers. -This is a common method to reduce memory consumption and is utilized in many State of the Art -architectures today. - -PyTorch XLA requires these weights to be tied/shared after moving the model -to the TPU device. To support this requirement Lightning provides a model hook which is -called after the model is moved to the device. Any weights that need to be tied should -be tied in the `on_post_move_to_device` model hook. This will ensure that the weights -among the modules are shared and not copied. - -PyTorch Lightning has an inbuilt check which verifies that the model parameter lengths -match once the model is moved to the device. If the lengths do not match, Lightning -throws a warning message. - -Example: - -.. code-block:: python - - from pytorch_lightning.core.lightning import LightningModule - from torch import nn - from pytorch_lightning.trainer.trainer import Trainer - - - class WeightSharingModule(LightningModule): - def __init__(self): - super().__init__() - self.layer_1 = nn.Linear(32, 10, bias=False) - self.layer_2 = nn.Linear(10, 32, bias=False) - self.layer_3 = nn.Linear(32, 10, bias=False) - # TPU shared weights are copied independently - # on the XLA device and this line won't have any effect. - # However, it works fine for CPU and GPU. 
- self.layer_3.weight = self.layer_1.weight - - def forward(self, x): - x = self.layer_1(x) - x = self.layer_2(x) - x = self.layer_3(x) - return x - - def on_post_move_to_device(self): - # Weights shared after the model has been moved to TPU Device - self.layer_3.weight = self.layer_1.weight - - - model = WeightSharingModule() - trainer = Trainer(max_epochs=1, accelerator="tpu", devices=8) - -See `XLA Documentation `_ - ----- - -XLA ---- -XLA is the library that interfaces PyTorch with the TPUs. -For more information check out `XLA `_. - -Guide for `troubleshooting XLA `_ diff --git a/docs/_sources/accelerators/tpu_basic.rst.txt b/docs/_sources/accelerators/tpu_basic.rst.txt deleted file mode 100644 index af7c45f..0000000 --- a/docs/_sources/accelerators/tpu_basic.rst.txt +++ /dev/null @@ -1,255 +0,0 @@ -:orphan: - -TPU training (Basic) -==================== -**Audience:** Users looking to train on single or multiple TPU cores. - ----- - -.. raw:: html - - - -| - -Lightning supports running on TPUs. At this moment, TPUs are available -on Google Cloud (GCP), Google Colab and Kaggle Environments. For more information on TPUs -`watch this video `_. - ----------------- - -What is a TPU? --------------- -Tensor Processing Unit (TPU) is an AI accelerator application-specific integrated circuit (ASIC) developed by Google specifically for neural networks. - -A TPU has 8 cores where each core is optimized for 128x128 matrix multiplies. In general, a single TPU is about as fast as 5 V100 GPUs! - -A TPU pod hosts many TPUs on it. Currently, TPU v3 Pod has up to 2048 TPU cores and 32 TiB of memory! -You can request a full pod from Google cloud or a "slice" which gives you -some subset of those 2048 cores. - ----- - -Run on 1 TPU core ------------------ -Enable the following Trainer arguments to run on 1 TPU. - -.. 
code:: - - trainer = Trainer(accelerator="tpu", devices=1) - ----- - -Run on multiple TPU cores -------------------------- -For multiple TPU cores, change the value of the devices flag. - -.. code:: - - trainer = Trainer(accelerator="tpu", devices=8) - ----- - -Run on a specific TPU core --------------------------- - -To run on a specific core, specify the index of the TPU core. - -.. code-block:: python - - trainer = pl.Trainer(accelerator="tpu", devices=[5]) - -This example runs on the 5th core, not on five cores. - ----- - -How to access TPUs ------------------- -To access TPUs, there are three main ways. - -Google Colab -^^^^^^^^^^^^ -Colab is like a jupyter notebook with a free GPU or TPU -hosted on GCP. - -To get a TPU on colab, follow these steps: - -1. Go to `https://colab.research.google.com/ `_. - -2. Click "new notebook" (bottom right of pop-up). - -3. Click runtime > change runtime settings. Select Python 3, and hardware accelerator "TPU". - This will give you a TPU with 8 cores. - -4. Next, insert this code into the first cell and execute. - This will install the xla library that interfaces between PyTorch and the TPU. - - .. code-block:: - - !pip install cloud-tpu-client==0.10 https://storage.googleapis.com/tpu-pytorch/wheels/torch_xla-1.9-cp37-cp37m-linux_x86_64.whl - -5. Once the above is done, install PyTorch Lightning. - - .. code-block:: - - !pip install pytorch-lightning - -6. Then set up your LightningModule as normal. - -Google Cloud (GCP) -^^^^^^^^^^^^^^^^^^ -? - -Kaggle -^^^^^^ -For starting Kaggle projects with TPUs, refer to this `kernel `_. - ----- - -Optimize Performance --------------------- - -The TPU was designed for specific workloads and operations to carry out large volumes of matrix multiplication, -convolution operations and other commonly used ops in applied deep learning. -The specialization makes it a strong choice for NLP tasks, sequential convolutional networks, and under low precision operation. 
-There are cases in which training on TPUs is slower when compared with GPUs, for possible reasons listed: - -- Too small batch size. -- Explicit evaluation of tensors during training, e.g. ``tensor.item()`` -- Tensor shapes (e.g. model inputs) change often during training. -- Limited resources when using TPU's with PyTorch `Link `_ -- XLA Graph compilation during the initial steps `Reference `_ -- Some tensor ops are not fully supported on TPU, or not supported at all. These operations will be performed on CPU (context switch). -- PyTorch integration is still experimental. Some performance bottlenecks may simply be the result of unfinished implementation. - -The official PyTorch XLA `performance guide `_ -has more detailed information on how PyTorch code can be optimized for TPU. In particular, the -`metrics report `_ allows -one to identify operations that lead to context switching. - ----- - -FAQ ---- - -**XLA configuration is missing** - -.. code-block:: - - File "/usr/local/lib/python3.8/dist-packages/torch_xla/core/xla_model.py", line 18, in - _DEVICES = xu.LazyProperty(lambda: torch_xla._XLAC._xla_get_devices()) - RuntimeError: tensorflow/compiler/xla/xla_client/computation_client.cc:273 : Missing XLA configuration - Traceback (most recent call last): - ... - File "/home/kaushikbokka/pytorch-lightning/pytorch_lightning/utilities/device_parser.py", line 125, in parse_tpu_cores - raise MisconfigurationException('No TPU devices were found.') - pytorch_lightning.utilities.exceptions.MisconfigurationException: No TPU devices were found. - -This means the system is missing XLA configuration. You would need to set up XRT TPU device configuration. - -For TPUVM architecture, you could set it in your terminal by: - -.. code-block:: bash - - export XRT_TPU_CONFIG="localservice;0;localhost:51011" - -And for the old TPU + 2VM architecture, you could set it by: - -.. 
code-block:: bash - - export TPU_IP_ADDRESS=10.39.209.42 # You could get the IP Address in the GCP TPUs section - export XRT_TPU_CONFIG="tpu_worker;0;$TPU_IP_ADDRESS:8470" - ----- - -**How to clear up the programs using TPUs in the background** - -.. code-block:: bash - - lsof -w /lib/libtpu.so | grep "python" | awk '{print $2}' | xargs -r kill -9 - -Sometimes, there can still be old programs running on the TPUs, which would make the TPUs unavailable to use. You could use the above command in the terminal to kill the running processes. - ----- - -**Replication issue** - -.. code-block:: - - File "/usr/local/lib/python3.6/dist-packages/torch_xla/core/xla_model.py", line 200, in set_replication - replication_devices = xla_replication_devices(devices) - File "/usr/local/lib/python3.6/dist-packages/torch_xla/core/xla_model.py", line 187, in xla_replication_devices - .format(len(local_devices), len(kind_devices))) - RuntimeError: Cannot replicate if number of devices (1) is different from 8 - -This error is raised when the XLA device is called outside the spawn process. Internally in `TPUSpawn` Strategy for training on multiple tpu cores, we use XLA's `xmp.spawn`. -Don't use ``xm.xla_device()`` while working on Lightning + TPUs! - ----- - -**Unsupported datatype transfer to TPU** - -.. code-block:: - - File "/usr/local/lib/python3.8/dist-packages/torch_xla/utils/utils.py", line 205, in _for_each_instance_rewrite - v = _for_each_instance_rewrite(result.__dict__[k], select_fn, fn, rwmap) - File "/usr/local/lib/python3.8/dist-packages/torch_xla/utils/utils.py", line 206, in _for_each_instance_rewrite - result.__dict__[k] = v - TypeError: 'mappingproxy' object does not support item assignment - -PyTorch XLA only supports Tensor objects for CPU to TPU data transfer. Might cause issues if the User is trying to send some non-tensor objects through the DataLoader or during saving states. - ----- - -**Using `tpu_spawn_debug` Strategy alias** - -.. 
code-block:: python - - import pytorch_lightning as pl - - my_model = MyLightningModule() - trainer = pl.Trainer(accelerator="tpu", devices=8, strategy="tpu_spawn_debug") - trainer.fit(my_model) - -Example Metrics report: - -.. code-block:: - - Metric: CompileTime - TotalSamples: 202 - Counter: 06m09s401ms746.001us - ValueRate: 778ms572.062us / second - Rate: 0.425201 / second - Percentiles: 1%=001ms32.778us; 5%=001ms61.283us; 10%=001ms79.236us; 20%=001ms110.973us; 50%=001ms228.773us; 80%=001ms339.183us; 90%=001ms434.305us; 95%=002ms921.063us; 99%=21s102ms853.173us - - -A lot of PyTorch operations aren't lowered to XLA, which could lead to significant slowdown of the training process. -These operations are moved to the CPU memory and evaluated, and then the results are transferred back to the XLA device(s). -By using the `tpu_spawn_debug` Strategy, users could create a metrics report to diagnose issues. - -The report includes things like (`XLA Reference `_): - -* how many times we issue XLA compilations and time spent on issuing. -* how many times we execute and time spent on execution -* how many device data handles we create/destroy etc. - ----- - -**TPU Pod Training Startup script** - -All TPU VMs in a Pod setup are required to access the model code and data. -One easy way to achieve this is to use the following startup script when creating the TPU VM pod. -It will perform the data downloading on all TPU VMs. Note that you need to export the corresponding environment variables following the instruction in Create TPU Node. - -.. code-block:: bash - - gcloud alpha compute tpus tpu-vm create ${TPU_NAME} --zone ${ZONE} --project ${PROJECT_ID} --accelerator-type v3-32 --version ${RUNTIME_VERSION} --metadata startup-script=setup.py - -Then users could ssh to any TPU worker, e.g. worker 0, check if data/model downloading is finished and -start the training after generating the ssh-keys to ssh between VM workers on a pod: - -.. 
code-block:: bash - - python3 -m torch_xla.distributed.xla_dist --tpu=$TPU_NAME -- python3 train.py --max_epochs=5 --batch_size=32 diff --git a/docs/_sources/accelerators/tpu_faq.rst.txt b/docs/_sources/accelerators/tpu_faq.rst.txt deleted file mode 100644 index af7c45f..0000000 --- a/docs/_sources/accelerators/tpu_faq.rst.txt +++ /dev/null @@ -1,255 +0,0 @@ -:orphan: - -TPU training (Basic) -==================== -**Audience:** Users looking to train on single or multiple TPU cores. - ----- - -.. raw:: html - - - -| - -Lightning supports running on TPUs. At this moment, TPUs are available -on Google Cloud (GCP), Google Colab and Kaggle Environments. For more information on TPUs -`watch this video `_. - ----------------- - -What is a TPU? --------------- -Tensor Processing Unit (TPU) is an AI accelerator application-specific integrated circuit (ASIC) developed by Google specifically for neural networks. - -A TPU has 8 cores where each core is optimized for 128x128 matrix multiplies. In general, a single TPU is about as fast as 5 V100 GPUs! - -A TPU pod hosts many TPUs on it. Currently, TPU v3 Pod has up to 2048 TPU cores and 32 TiB of memory! -You can request a full pod from Google cloud or a "slice" which gives you -some subset of those 2048 cores. - ----- - -Run on 1 TPU core ------------------ -Enable the following Trainer arguments to run on 1 TPU. - -.. code:: - - trainer = Trainer(accelerator="tpu", devices=1) - ----- - -Run on multiple TPU cores -------------------------- -For multiple TPU cores, change the value of the devices flag. - -.. code:: - - trainer = Trainer(accelerator="tpu", devices=8) - ----- - -Run on a specific TPU core --------------------------- - -To run on a specific core, specify the index of the TPU core. - -.. code-block:: python - - trainer = pl.Trainer(accelerator="tpu", devices=[5]) - -This example runs on the 5th core, not on five cores. - ----- - -How to access TPUs ------------------- -To access TPUs, there are three main ways. 
- -Google Colab -^^^^^^^^^^^^ -Colab is like a jupyter notebook with a free GPU or TPU -hosted on GCP. - -To get a TPU on colab, follow these steps: - -1. Go to `https://colab.research.google.com/ `_. - -2. Click "new notebook" (bottom right of pop-up). - -3. Click runtime > change runtime settings. Select Python 3, and hardware accelerator "TPU". - This will give you a TPU with 8 cores. - -4. Next, insert this code into the first cell and execute. - This will install the xla library that interfaces between PyTorch and the TPU. - - .. code-block:: - - !pip install cloud-tpu-client==0.10 https://storage.googleapis.com/tpu-pytorch/wheels/torch_xla-1.9-cp37-cp37m-linux_x86_64.whl - -5. Once the above is done, install PyTorch Lightning. - - .. code-block:: - - !pip install pytorch-lightning - -6. Then set up your LightningModule as normal. - -Google Cloud (GCP) -^^^^^^^^^^^^^^^^^^ -? - -Kaggle -^^^^^^ -For starting Kaggle projects with TPUs, refer to this `kernel `_. - ----- - -Optimize Performance --------------------- - -The TPU was designed for specific workloads and operations to carry out large volumes of matrix multiplication, -convolution operations and other commonly used ops in applied deep learning. -The specialization makes it a strong choice for NLP tasks, sequential convolutional networks, and under low precision operation. -There are cases in which training on TPUs is slower when compared with GPUs, for possible reasons listed: - -- Too small batch size. -- Explicit evaluation of tensors during training, e.g. ``tensor.item()`` -- Tensor shapes (e.g. model inputs) change often during training. -- Limited resources when using TPU's with PyTorch `Link `_ -- XLA Graph compilation during the initial steps `Reference `_ -- Some tensor ops are not fully supported on TPU, or not supported at all. These operations will be performed on CPU (context switch). -- PyTorch integration is still experimental. 
Some performance bottlenecks may simply be the result of unfinished implementation. - -The official PyTorch XLA `performance guide `_ -has more detailed information on how PyTorch code can be optimized for TPU. In particular, the -`metrics report `_ allows -one to identify operations that lead to context switching. - ----- - -FAQ ---- - -**XLA configuration is missing** - -.. code-block:: - - File "/usr/local/lib/python3.8/dist-packages/torch_xla/core/xla_model.py", line 18, in - _DEVICES = xu.LazyProperty(lambda: torch_xla._XLAC._xla_get_devices()) - RuntimeError: tensorflow/compiler/xla/xla_client/computation_client.cc:273 : Missing XLA configuration - Traceback (most recent call last): - ... - File "/home/kaushikbokka/pytorch-lightning/pytorch_lightning/utilities/device_parser.py", line 125, in parse_tpu_cores - raise MisconfigurationException('No TPU devices were found.') - pytorch_lightning.utilities.exceptions.MisconfigurationException: No TPU devices were found. - -This means the system is missing XLA configuration. You would need to set up XRT TPU device configuration. - -For TPUVM architecture, you could set it in your terminal by: - -.. code-block:: bash - - export XRT_TPU_CONFIG="localservice;0;localhost:51011" - -And for the old TPU + 2VM architecture, you could set it by: - -.. code-block:: bash - - export TPU_IP_ADDRESS=10.39.209.42 # You could get the IP Address in the GCP TPUs section - export XRT_TPU_CONFIG="tpu_worker;0;$TPU_IP_ADDRESS:8470" - ----- - -**How to clear up the programs using TPUs in the background** - -.. code-block:: bash - - lsof -w /lib/libtpu.so | grep "python" | awk '{print $2}' | xargs -r kill -9 - -Sometimes, there can still be old programs running on the TPUs, which would make the TPUs unavailable to use. You could use the above command in the terminal to kill the running processes. - ----- - -**Replication issue** - -.. 
code-block:: - - File "/usr/local/lib/python3.6/dist-packages/torch_xla/core/xla_model.py", line 200, in set_replication - replication_devices = xla_replication_devices(devices) - File "/usr/local/lib/python3.6/dist-packages/torch_xla/core/xla_model.py", line 187, in xla_replication_devices - .format(len(local_devices), len(kind_devices))) - RuntimeError: Cannot replicate if number of devices (1) is different from 8 - -This error is raised when the XLA device is called outside the spawn process. Internally in `TPUSpawn` Strategy for training on multiple tpu cores, we use XLA's `xmp.spawn`. -Don't use ``xm.xla_device()`` while working on Lightning + TPUs! - ----- - -**Unsupported datatype transfer to TPU** - -.. code-block:: - - File "/usr/local/lib/python3.8/dist-packages/torch_xla/utils/utils.py", line 205, in _for_each_instance_rewrite - v = _for_each_instance_rewrite(result.__dict__[k], select_fn, fn, rwmap) - File "/usr/local/lib/python3.8/dist-packages/torch_xla/utils/utils.py", line 206, in _for_each_instance_rewrite - result.__dict__[k] = v - TypeError: 'mappingproxy' object does not support item assignment - -PyTorch XLA only supports Tensor objects for CPU to TPU data transfer. Might cause issues if the User is trying to send some non-tensor objects through the DataLoader or during saving states. - ----- - -**Using `tpu_spawn_debug` Strategy alias** - -.. code-block:: python - - import pytorch_lightning as pl - - my_model = MyLightningModule() - trainer = pl.Trainer(accelerator="tpu", devices=8, strategy="tpu_spawn_debug") - trainer.fit(my_model) - -Example Metrics report: - -.. 
code-block:: - - Metric: CompileTime - TotalSamples: 202 - Counter: 06m09s401ms746.001us - ValueRate: 778ms572.062us / second - Rate: 0.425201 / second - Percentiles: 1%=001ms32.778us; 5%=001ms61.283us; 10%=001ms79.236us; 20%=001ms110.973us; 50%=001ms228.773us; 80%=001ms339.183us; 90%=001ms434.305us; 95%=002ms921.063us; 99%=21s102ms853.173us - - -A lot of PyTorch operations aren't lowered to XLA, which could lead to significant slowdown of the training process. -These operations are moved to the CPU memory and evaluated, and then the results are transferred back to the XLA device(s). -By using the `tpu_spawn_debug` Strategy, users could create a metrics report to diagnose issues. - -The report includes things like (`XLA Reference `_): - -* how many times we issue XLA compilations and time spent on issuing. -* how many times we execute and time spent on execution -* how many device data handles we create/destroy etc. - ----- - -**TPU Pod Training Startup script** - -All TPU VMs in a Pod setup are required to access the model code and data. -One easy way to achieve this is to use the following startup script when creating the TPU VM pod. -It will perform the data downloading on all TPU VMs. Note that you need to export the corresponding environment variables following the instruction in Create TPU Node. - -.. code-block:: bash - - gcloud alpha compute tpus tpu-vm create ${TPU_NAME} --zone ${ZONE} --project ${PROJECT_ID} --accelerator-type v3-32 --version ${RUNTIME_VERSION} --metadata startup-script=setup.py - -Then users could ssh to any TPU worker, e.g. worker 0, check if data/model downloading is finished and -start the training after generating the ssh-keys to ssh between VM workers on a pod: - -.. 
code-block:: bash - - python3 -m torch_xla.distributed.xla_dist --tpu=$TPU_NAME -- python3 train.py --max_epochs=5 --batch_size=32 diff --git a/docs/_sources/accelerators/tpu_intermediate.rst.txt b/docs/_sources/accelerators/tpu_intermediate.rst.txt deleted file mode 100644 index 826f568..0000000 --- a/docs/_sources/accelerators/tpu_intermediate.rst.txt +++ /dev/null @@ -1,113 +0,0 @@ -:orphan: - -TPU training (Intermediate) -=========================== -**Audience:** Users looking to use cloud TPUs. - ----- - -DistributedSamplers -------------------- -Lightning automatically inserts the correct samplers - no need to do this yourself! - -Usually, with TPUs (and DDP), you would need to define a DistributedSampler to move the right -chunk of data to the appropriate TPU. As mentioned, this is not needed in Lightning - -.. note:: Don't add distributedSamplers. Lightning does this automatically - -If for some reason you still need to, this is how to construct the sampler -for TPU use - -.. code-block:: python - - import torch_xla.core.xla_model as xm - - - def train_dataloader(self): - dataset = MNIST(os.getcwd(), train=True, download=True, transform=transforms.ToTensor()) - - # required for TPU support - sampler = None - if use_tpu: - sampler = torch.utils.data.distributed.DistributedSampler( - dataset, num_replicas=xm.xrt_world_size(), rank=xm.get_ordinal(), shuffle=True - ) - - loader = DataLoader(dataset, sampler=sampler, batch_size=32) - - return loader - -Configure the number of TPU cores in the trainer. You can only choose 1 or 8. -To use a full TPU pod skip to the TPU pod section. - -.. code-block:: python - - import pytorch_lightning as pl - - my_model = MyLightningModule() - trainer = pl.Trainer(accelerator="tpu", devices=8) - trainer.fit(my_model) - -That's it! Your model will train on all 8 TPU cores. - ----------------- - -Distributed Backend with TPU ----------------------------- -The ``accelerator`` option used for GPUs does not apply to TPUs. 
-TPUs work in DDP mode by default (distributing over each core) - ----------------- - -TPU VM ------- -Lightning supports training on the new Cloud TPU VMs. -Previously, we needed separate VMs to connect to the TPU machines, but as -Cloud TPU VMs run on the TPU Host machines, it allows direct SSH access -for the users. Hence, this architecture upgrade leads to cheaper and significantly -better performance and usability while working with TPUs. - -The TPUVMs come pre-installed with latest versions of PyTorch and PyTorch XLA. -After connecting to the VM and before running your Lightning code, you would need -to set the XRT TPU device configuration. - -.. code-block:: bash - - $ export XRT_TPU_CONFIG="localservice;0;localhost:51011" - -You could learn more about the Cloud TPU VM architecture `here `_ - ----------------- - -TPU Pod -------- -To train on more than 8 cores, your code actually doesn't change! -All you need to do is submit the following command: - -.. code-block:: bash - - $ python -m torch_xla.distributed.xla_dist - --tpu=$TPU_POD_NAME - --conda-env=torch-xla-nightly - -- python /usr/share/torch-xla-1.8.1/pytorch/xla/test/test_train_imagenet.py --fake_data - -See `this guide `_ -on how to set up the instance groups and VMs needed to run TPU Pods. - ----------------- - -16 bit precision ----------------- -Lightning also supports training in 16-bit precision with TPUs. -By default, TPU training will use 32-bit precision. To enable 16-bit, -set the 16-bit flag. - -.. code-block:: python - - import pytorch_lightning as pl - - my_model = MyLightningModule() - trainer = pl.Trainer(accelerator="tpu", devices=8, precision=16) - trainer.fit(my_model) - -Under the hood the xla library will use the `bfloat16 type `_. diff --git a/docs/_sources/advanced/model_parallel.rst.txt b/docs/_sources/advanced/model_parallel.rst.txt deleted file mode 100644 index 811bc57..0000000 --- a/docs/_sources/advanced/model_parallel.rst.txt +++ /dev/null @@ -1,905 +0,0 @@ -.. 
_model-parallel: - -Train 1 trillion+ parameter models -================================== - -When training large models, fitting larger batch sizes, or trying to increase throughput using multi-GPU compute, Lightning provides advanced optimized distributed training strategies to support these cases and offer substantial improvements in memory usage. - -In many cases these strategies are some flavour of model parallelism however we only introduce concepts at a high level to get you started. Refer to the `FairScale documentation `_ for more information about model parallelism. - -Note that some of the extreme memory saving configurations will affect the speed of training. This Speed/Memory trade-off in most cases can be adjusted. - -Some of these memory-efficient strategies rely on offloading onto other forms of memory, such as CPU RAM or NVMe. This means you can even see memory benefits on a **single GPU**, using a strategy such as :ref:`deepspeed-zero-stage-3-offload`. - -Check out this amazing video explaining model parallelism and how it works behind the scenes: - -.. raw:: html - - - - -Choosing an Advanced Distributed GPU Strategy -^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ - -If you would like to stick with PyTorch DDP, see :ref:`ddp-optimizations`. - -Unlike :class:`~torch.nn.parallel.DistributedDataParallel` (DDP) where the maximum trainable model size and batch size do not change with respect to the number of GPUs, memory-optimized strategies can accommodate bigger models and larger batches as more GPUs are used. This means as you scale up the number of GPUs, you can reach the number of model parameters you'd like to train. - -There are many considerations when choosing a strategy as described below. In addition, check out the visualization of various strategy benchmarks using `minGPT `__ `here `__. - -Pre-training vs Fine-tuning -""""""""""""""""""""""""""" - -When fine-tuning, we often use a magnitude less data compared to pre-training a model. 
This is important when choosing a distributed strategy as usually for pre-training, **we are compute-bound**. -This means we cannot sacrifice throughput as much as if we were fine-tuning, because in fine-tuning the data requirement is smaller. - -Overall: - -* When **fine-tuning** a model, use advanced memory efficient strategies such as :ref:`deepspeed-zero-stage-3` or :ref:`deepspeed-zero-stage-3-offload`, allowing you to fine-tune larger models if you are limited on compute -* When **pre-training** a model, use simpler optimizations such as :ref:`sharded-training`, :ref:`deepspeed-zero-stage-2` or :ref:`fully-sharded-training`, scaling the number of GPUs to reach larger parameter sizes -* For both fine-tuning and pre-training, use :ref:`deepspeed-activation-checkpointing` or :ref:`fairscale-activation-checkpointing` as the throughput degradation is not significant - -For example when using 128 GPUs, you can **pre-train** large 10 to 20 Billion parameter models using :ref:`deepspeed-zero-stage-2` without having to take a performance hit with a more advanced optimized multi-GPU strategy. - -But for **fine-tuning** a model, you can reach 10 to 20 Billion parameter models using :ref:`deepspeed-zero-stage-3-offload` on a **single GPU**. This does come with a significant throughput hit, which needs to be weighed accordingly. - -When Shouldn't I use an Optimized Distributed Strategy? -""""""""""""""""""""""""""""""""""""""""""""""""""""""" - -Sharding techniques help when model sizes are fairly large; roughly 500M+ parameters is where we've seen benefits. However, in the following cases, we recommend sticking to ordinary distributed strategies: -* When your model is small (ResNet50 of around 80M Parameters), unless you are using unusually large batch sizes or inputs. -* Due to high distributed communication between devices, if running on a slow network/interconnect, the training might be much slower than expected and then it's up to you to determine the tradeoff here. 
- ----------- - -.. _sharded-training: - -Sharded Training -^^^^^^^^^^^^^^^^ -Lightning integration of optimizer sharded training provided by `FairScale `_. -The technique can be found within `DeepSpeed ZeRO `_ and -`ZeRO-2 `_, -however the implementation is built from the ground up to be PyTorch compatible and standalone. -Sharded Training allows you to maintain GPU scaling efficiency, whilst reducing memory overhead drastically. In short, expect near-normal linear scaling (if your network allows), and significantly reduced memory usage when training large models. - -Sharded Training still utilizes Data Parallel Training under the hood, except optimizer states and gradients are sharded across GPUs. -This means the memory overhead per GPU is lower, as each GPU only has to maintain a partition of your optimizer state and gradients. - -The benefits vary by model and parameter sizes, but we've recorded up to a 63% memory reduction per GPU allowing us to double our model sizes. Because of efficient communication, -these benefits in multi-GPU setups are almost free and throughput scales well with multi-node setups. - -It is highly recommended to use Sharded Training in multi-GPU environments where memory is limited, or where training larger models is beneficial (500M+ parameter models). -A technical note: as batch size scales, storing activations for the backwards pass becomes the bottleneck in training. As a result, sharding optimizer state and gradients becomes less impactful. -Use :ref:`fairscale-activation-checkpointing` to see even more benefit at the cost of some throughput. - -To use Sharded Training, you need to first install FairScale using the command below. - -.. code-block:: bash - - pip install fairscale - - -.. 
code-block:: python - - # train using Sharded DDP - trainer = Trainer(strategy="ddp_sharded") - -Sharded Training can work across all DDP variants by adding the additional ``--strategy ddp_sharded`` flag via command line using a PyTorch Lightning script. - -Internally we re-initialize your optimizers and shard them across your machines and processes. We handle all communication using PyTorch distributed, so no code changes are required. - ----------- - -.. _fully-sharded-training: - -Fully Sharded Training -^^^^^^^^^^^^^^^^^^^^^^ - -.. warning:: - Fully Sharded Training is in beta and the API is subject to change. Please create an `issue `_ if you run into any issues. - -`Fully Sharded `__ shards optimizer state, gradients and parameters across data parallel workers. This allows you to fit much larger models onto multiple GPUs into memory. - -Fully Sharded Training alleviates the need to worry about balancing layers onto specific devices using some form of pipe parallelism, and optimizes for distributed communication with minimal effort. - -Shard Parameters to Reach 10+ Billion Parameters -"""""""""""""""""""""""""""""""""""""""""""""""" - -To reach larger parameter sizes and be memory efficient, we have to shard parameters. There are various ways to enable this. - -.. note:: - Currently Fully Sharded Training relies on the user to wrap the model with Fully Sharded within the ``LightningModule``. - This means you must create a single model that is treated as a ``torch.nn.Module`` within the ``LightningModule``. - This is a limitation of Fully Sharded Training that will be resolved in the future. - -Enabling Module Sharding for Maximum Memory Efficiency -"""""""""""""""""""""""""""""""""""""""""""""""""""""" - -To activate parameter sharding, you must wrap your model using provided ``wrap`` or ``auto_wrap`` functions as described below. 
Internally in Lightning, we enable a context manager around the ``configure_sharded_model`` function to make sure the ``wrap`` and ``auto_wrap`` parameters are passed correctly. - -When not using Fully Sharded these wrap functions are a no-op. This means once the changes have been made, there is no need to remove the changes for other strategies. - -``auto_wrap`` will recursively wrap :class:`~torch.nn.Module` within the ``LightningModule`` with nested Fully Sharded Wrappers, -signalling that we'd like to partition these modules across data parallel devices, discarding the full weights when not required (information :class:`here `). - -``auto_wrap`` can have varying level of success based on the complexity of your model. **Auto Wrap does not support models with shared parameters**. - -``wrap`` will simply wrap the module with a Fully Sharded Parallel class with the correct parameters from the Lightning context manager. - -Below is an example of using both ``wrap`` and ``auto_wrap`` to create your model. - -.. code-block:: python - - import torch - import torch.nn as nn - import pytorch_lightning as pl - from pytorch_lightning import Trainer - from fairscale.nn import checkpoint_wrapper, auto_wrap, wrap - - - class MyModel(pl.LightningModule): - def __init__(self): - super().__init__() - self.linear_layer = nn.Linear(32, 32) - self.block = nn.Sequential(nn.Linear(32, 32), nn.ReLU()) - self.final_block = nn.Sequential(nn.Linear(32, 32), nn.ReLU()) - - def configure_sharded_model(self): - # modules are sharded across processes - # as soon as they are wrapped with ``wrap`` or ``auto_wrap``. - # During the forward/backward passes, weights get synced across processes - # and de-allocated once computation is complete, saving memory. 
- - # Wraps the layer in a Fully Sharded Wrapper automatically - linear_layer = wrap(self.linear_layer) - - # Wraps the module recursively - # based on a minimum number of parameters (default 100M parameters) - block = auto_wrap(self.block) - - # For best memory efficiency, - # add FairScale activation checkpointing - final_block = auto_wrap(checkpoint_wrapper(self.final_block)) - self.model = nn.Sequential(linear_layer, nn.ReLU(), block, final_block) - - def configure_optimizers(self): - return torch.optim.AdamW(self.model.parameters()) - - - model = MyModel() - trainer = Trainer(accelerator="gpu", devices=4, strategy="fsdp", precision=16) - trainer.fit(model) - - trainer.test() - trainer.predict() - - ----------- - -.. _fairscale-activation-checkpointing: - -FairScale Activation Checkpointing -^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ - -Activation checkpointing frees activations from memory as soon as they are not needed during the forward pass. They are then re-computed for the backwards pass as needed. Activation checkpointing is very useful when you have intermediate layers that produce large activations. - -FairScale's checkpointing wrapper also handles batch norm layers correctly, unlike the PyTorch implementation, ensuring stats are tracked correctly despite the multiple forward passes. - -This saves memory when training larger models, but requires wrapping the modules you'd like to use activation checkpointing on. See :class:`here ` for more information. - -.. warning:: - - Make sure not to wrap the entire model with activation checkpointing. This is not the intended usage of activation checkpointing, and will lead to failures as seen in `this discussion `__. - -.. 
code-block:: python - - from pytorch_lightning import Trainer - from fairscale.nn import checkpoint_wrapper - - - class MyModel(pl.LightningModule): - def __init__(self): - super().__init__() - # Wrap layers using checkpoint_wrapper - self.block_1 = checkpoint_wrapper(nn.Sequential(nn.Linear(32, 32), nn.ReLU())) - self.block_2 = nn.Linear(32, 2) - - -.. _deepspeed_advanced: - -DeepSpeed -^^^^^^^^^ - -.. note:: - The DeepSpeed strategy is in beta and the API is subject to change. Please create an `issue `_ if you run into any issues. - -`DeepSpeed `__ is a deep learning training optimization library, providing the means to train massive billion parameter models at scale. -Using the DeepSpeed strategy, we were able to **train model sizes of 10 Billion parameters and above**, with a lot of useful information in this `benchmark `_ and the `DeepSpeed docs `__. -DeepSpeed also offers lower level training optimizations, and efficient optimizers such as `1-bit Adam `_. We recommend using DeepSpeed in environments where speed and memory optimizations are important (such as training large billion parameter models). - -Below is a summary of all the configurations of DeepSpeed. - -* :ref:`deepspeed-zero-stage-1` - **Shard optimizer states**, remains at speed parity with DDP whilst providing memory improvement - -* :ref:`deepspeed-zero-stage-2` - **Shard optimizer states and gradients**, remains at speed parity with DDP whilst providing even more memory improvement - -* :ref:`deepspeed-zero-stage-2-offload` - **Offload optimizer states and gradients to CPU**. Increases distributed communication volume and GPU-CPU device transfer, but provides significant memory improvement - -* :ref:`deepspeed-zero-stage-3` - **Shard optimizer states, gradients, parameters and optionally activations**. 
Increases distributed communication volume, but provides even more memory improvement - -* :ref:`deepspeed-zero-stage-3-offload` - **Offload optimizer states, gradients, parameters and optionally activations to CPU**. Increases distributed communication volume and GPU-CPU device transfer, but even more significant memory improvement. - -* :ref:`deepspeed-activation-checkpointing` - **Free activations after forward pass**. Increases computation, but provides memory improvement for all stages. - -To use DeepSpeed, you first need to install DeepSpeed using the commands below. - -.. code-block:: bash - - pip install deepspeed - -If you run into an issue with the install or later in training, ensure that the CUDA version of the PyTorch you've installed matches your locally installed CUDA (you can see which one has been recognized by running ``nvcc --version``). - -.. note:: - - DeepSpeed currently only supports single optimizer, single scheduler within the training loop. - - When saving a checkpoint we rely on DeepSpeed which saves a directory containing the model and various components. - - -.. _deepspeed-zero-stage-1: - -DeepSpeed ZeRO Stage 1 -"""""""""""""""""""""" - -`DeepSpeed ZeRO Stage 1 `_ partitions your optimizer states (Stage 1) across your GPUs to reduce memory. - -It is recommended to skip Stage 1 and use Stage 2, which comes with larger memory improvements and still remains efficient. Stage 1 is useful to pair with certain optimizations such as `Torch ORT `__. - -.. code-block:: python - - from pytorch_lightning import Trainer - - model = MyModel() - trainer = Trainer(accelerator="gpu", devices=4, strategy="deepspeed_stage_1", precision=16) - trainer.fit(model) - - -.. _deepspeed-zero-stage-2: - -DeepSpeed ZeRO Stage 2 -"""""""""""""""""""""" - -`DeepSpeed ZeRO Stage 2 `_ partitions your optimizer states (Stage 1) and your gradients (Stage 2) across your GPUs to reduce memory. 
In most cases, this is more efficient or at parity with DDP, primarily due to the optimized custom communications written by the DeepSpeed team. -As a result, benefits can also be seen on a single GPU. Do note that the default bucket sizes allocate around ``3.6GB`` of VRAM to use during distributed communications, which can be tweaked when instantiating the strategy described in a few sections below. - -.. code-block:: python - - from pytorch_lightning import Trainer - - model = MyModel() - trainer = Trainer(accelerator="gpu", devices=4, strategy="deepspeed_stage_2", precision=16) - trainer.fit(model) - -.. code-block:: bash - - python train.py --strategy deepspeed_stage_2 --precision 16 --accelerator 'gpu' --devices 4 - - -.. _deepspeed-zero-stage-2-offload: - -DeepSpeed ZeRO Stage 2 Offload -"""""""""""""""""""""""""""""" - -Below we show an example of running `ZeRO-Offload `_. ZeRO-Offload leverages the host CPU to offload optimizer memory/computation, reducing the overall memory consumption. - -.. code-block:: python - - from pytorch_lightning import Trainer - - model = MyModel() - trainer = Trainer(accelerator="gpu", devices=4, strategy="deepspeed_stage_2_offload", precision=16) - trainer.fit(model) - - -This can also be done via the command line using a PyTorch Lightning script: - -.. code-block:: bash - - python train.py --strategy deepspeed_stage_2_offload --precision 16 --accelerator 'gpu' --devices 4 - - -You can also modify the ZeRO-Offload parameters via the strategy as below. - -.. code-block:: python - - from pytorch_lightning import Trainer - from pytorch_lightning.strategies import DeepSpeedStrategy - - model = MyModel() - trainer = Trainer( - accelerator="gpu", - devices=4, - strategy=DeepSpeedStrategy(offload_optimizer=True, allgather_bucket_size=5e8, reduce_bucket_size=5e8), - precision=16, - ) - trainer.fit(model) - - -.. 
note:: - We suggest tuning the ``allgather_bucket_size`` parameter and ``reduce_bucket_size`` parameter to find optimum parameters based on your model size. - These control how large a buffer we limit the model to using when reducing gradients/gathering updated parameters. Smaller values will result in less memory, but tradeoff with speed. - - DeepSpeed allocates a reduce buffer size `multiplied by 1.5x `_ so take that into consideration when tweaking the parameters. - - The strategy sets a reasonable default of ``2e8``, which should work for most low VRAM GPUs (less than ``7GB``), allocating roughly ``3.6GB`` of VRAM as buffer. Higher VRAM GPUs should aim for values around ``5e8``. - -For even more speed benefit, DeepSpeed offers an optimized CPU version of ADAM called `DeepSpeedCPUAdam `_ to run the offloaded computation, which is faster than the standard PyTorch implementation. - -.. code-block:: python - - import pytorch_lightning - from pytorch_lightning import Trainer - from deepspeed.ops.adam import DeepSpeedCPUAdam - - - class MyModel(pl.LightningModule): - ... - - def configure_optimizers(self): - # DeepSpeedCPUAdam provides 5x to 7x speedup over torch.optim.adam(w) - return DeepSpeedCPUAdam(self.parameters()) - - - model = MyModel() - trainer = Trainer(accelerator="gpu", devices=4, strategy="deepspeed_stage_2_offload", precision=16) - trainer.fit(model) - - -.. _deepspeed-zero-stage-3: - -DeepSpeed ZeRO Stage 3 -"""""""""""""""""""""" - -DeepSpeed ZeRO Stage 3 shards the optimizer states, gradients and the model parameters (also optionally activations). Sharding model parameters and activations comes with an increase in distributed communication, however allows you to scale your models massively from one GPU to multiple GPUs. 
-**The DeepSpeed team report the ability to fine-tune models with over 40B parameters on a single GPU and over 2 Trillion parameters on 512 GPUs.** For more information we suggest checking the `DeepSpeed ZeRO-3 Offload documentation `__. - -We've run benchmarks for all these features and provided a simple example of how all these features work in Lightning, which you can see at `minGPT `_. - -To reach the highest memory efficiency or model size, you must: - -1. Use the DeepSpeed strategy with the stage 3 parameter -2. Use CPU Offloading to offload weights to CPU, plus have a reasonable amount of CPU RAM to offload onto -3. Use DeepSpeed Activation Checkpointing to shard activations - -Below we describe how to enable all of these to see benefit. **With all these improvements we reached 45 Billion parameters training a GPT model on 8 GPUs with ~1TB of CPU RAM available**. - -Also please have a look at our :ref:`deepspeed-zero-stage-3-tips` which contains a lot of helpful information when configuring your own models. - -.. note:: - - When saving a model using DeepSpeed and Stage 3, model states and optimizer states will be saved in separate sharded states (based on the world size). See :ref:`deepspeed-zero-stage-3-single-file` to obtain a single checkpoint file. - -.. code-block:: python - - from pytorch_lightning import Trainer - from deepspeed.ops.adam import FusedAdam - - - class MyModel(pl.LightningModule): - ... - - def configure_optimizers(self): - return FusedAdam(self.parameters()) - - - model = MyModel() - trainer = Trainer(accelerator="gpu", devices=4, strategy="deepspeed_stage_3", precision=16) - trainer.fit(model) - - trainer.test() - trainer.predict() - - -You can also use the Lightning Trainer to run predict or evaluate with DeepSpeed once the model has been trained. - -.. code-block:: python - - from pytorch_lightning import Trainer - - - class MyModel(pl.LightningModule): - ... 
- - - model = MyModel() - trainer = Trainer(accelerator="gpu", devices=4, strategy="deepspeed_stage_3", precision=16) - trainer.test(ckpt_path="my_saved_deepspeed_checkpoint.ckpt") - - -Shard Model Instantly to Reduce Initialization Time/Memory -"""""""""""""""""""""""""""""""""""""""""""""""""""""""""" - -When instantiating really large models, it is sometimes necessary to shard the model layers instantly. - -This is the case if layers may not fit in a single machine's CPU or GPU memory, but would fit once sharded across multiple machines. -We expose a hook in which initialized layers are sharded instantly on a per-layer basis, allowing you to instantly shard models. - -This reduces the time taken to initialize very large models, and ensures we do not run out of memory when instantiating larger models. For more information you can refer to the DeepSpeed docs for `Constructing Massive Models `_. - -.. code-block:: python - - import torch.nn as nn - from pytorch_lightning import Trainer - from deepspeed.ops.adam import FusedAdam - - - class MyModel(pl.LightningModule): - ... - - def configure_sharded_model(self): - # Created within sharded model context, modules are instantly sharded across processes - # as soon as they are made. - self.block = nn.Sequential(nn.Linear(32, 32), nn.ReLU()) - - def configure_optimizers(self): - return FusedAdam(self.parameters()) - - - model = MyModel() - trainer = Trainer(accelerator="gpu", devices=4, strategy="deepspeed_stage_3", precision=16) - trainer.fit(model) - - trainer.test() - trainer.predict() - - -.. _deepspeed-zero-stage-3-offload: - -DeepSpeed ZeRO Stage 3 Offload -"""""""""""""""""""""""""""""" - -DeepSpeed ZeRO Stage 3 Offload offloads optimizer state and gradients to the host CPU to reduce memory usage as ZeRO Stage 2 does, and additionally allows you to offload the parameters for even more memory savings. - -.. 
note:: - - When saving a model using DeepSpeed and Stage 3, model states and optimizer states will be saved in separate sharded states (based on the world size). See :ref:`deepspeed-zero-stage-3-single-file` to obtain a single checkpoint file. - -.. code-block:: python - - from pytorch_lightning import Trainer - from pytorch_lightning.strategies import DeepSpeedStrategy - - # Enable CPU Offloading - model = MyModel() - trainer = Trainer(accelerator="gpu", devices=4, strategy="deepspeed_stage_3_offload", precision=16) - trainer.fit(model) - - # Enable CPU Offloading, and offload parameters to CPU - model = MyModel() - trainer = Trainer( - accelerator="gpu", - devices=4, - strategy=DeepSpeedStrategy( - stage=3, - offload_optimizer=True, - offload_parameters=True, - ), - precision=16, - ) - trainer.fit(model) - - -DeepSpeed Infinity (NVMe Offloading) -"""""""""""""""""""""""""""""""""""" - -Additionally, DeepSpeed supports offloading to NVMe drives for even larger models, utilizing the large memory space found in NVMes. DeepSpeed `reports `__ the ability to fine-tune 1 Trillion+ parameters using NVMe Offloading on one 8 GPU machine. Below shows how to enable this, assuming the NVMe drive is mounted in a directory called ``/local_nvme``. - -.. 
code-block:: python - - from pytorch_lightning import Trainer - from pytorch_lightning.strategies import DeepSpeedStrategy - - # Enable CPU Offloading - model = MyModel() - trainer = Trainer(accelerator="gpu", devices=4, strategy="deepspeed_stage_3_offload", precision=16) - trainer.fit(model) - - # Enable CPU Offloading, and offload parameters to CPU - model = MyModel() - trainer = Trainer( - accelerator="gpu", - devices=4, - strategy=DeepSpeedStrategy( - stage=3, - offload_optimizer=True, - offload_parameters=True, - remote_device="nvme", - offload_params_device="nvme", - offload_optimizer_device="nvme", - nvme_path="/local_nvme", - ), - precision=16, - ) - trainer.fit(model) - -When offloading to NVMe you may notice that the speed is slow. There are parameters that need to be tuned based on the drives that you are using. Running the `aio_bench_perf_sweep.py `__ script can help you to find optimum parameters. See the `issue `__ for more information on how to parse the information. - -.. _deepspeed-activation-checkpointing: - -DeepSpeed Activation Checkpointing -"""""""""""""""""""""""""""""""""" - -Activation checkpointing frees activations from memory as soon as they are not needed during the forward pass. -They are then re-computed for the backwards pass as needed. - -Activation checkpointing is very useful when you have intermediate layers that produce large activations. - -This saves memory when training larger models, however requires using a checkpoint function to run modules as shown below. - -.. warning:: - - Ensure to not wrap the entire model with activation checkpointing. This is not the intended usage of activation checkpointing, and will lead to failures as seen in `this discussion `__. - -.. code-block:: python - - from pytorch_lightning import Trainer - import deepspeed - - - class MyModel(LightningModule): - ... 
- - def __init__(self): - super().__init__() - self.block_1 = nn.Sequential(nn.Linear(32, 32), nn.ReLU()) - self.block_2 = torch.nn.Linear(32, 2) - - def forward(self, x): - # Use the DeepSpeed checkpointing function instead of calling the module directly - # checkpointing self.block_1 means the activations are deleted after use, - # and re-calculated during the backward passes - x = deepspeed.checkpointing.checkpoint(self.block_1, x) - return self.block_2(x) - - -.. code-block:: python - - from pytorch_lightning import Trainer - from pytorch_lightning.strategies import DeepSpeedStrategy - import deepspeed - - - class MyModel(pl.LightningModule): - ... - - def configure_sharded_model(self): - self.block_1 = nn.Sequential(nn.Linear(32, 32), nn.ReLU()) - self.block_2 = torch.nn.Linear(32, 2) - - def forward(self, x): - # Use the DeepSpeed checkpointing function instead of calling the module directly - x = deepspeed.checkpointing.checkpoint(self.block_1, x) - return self.block_2(x) - - - model = MyModel() - - trainer = Trainer(accelerator="gpu", devices=4, strategy="deepspeed_stage_3_offload", precision=16) - - # Enable CPU Activation Checkpointing - trainer = Trainer( - accelerator="gpu", - devices=4, - strategy=DeepSpeedStrategy( - stage=3, - offload_optimizer=True, # Enable CPU Offloading - cpu_checkpointing=True, # (Optional) offload activations to CPU - ), - precision=16, - ) - trainer.fit(model) - - -.. _deepspeed-zero-stage-3-tips: - -DeepSpeed ZeRO Stage 3 Tips -""""""""""""""""""""""""""" - -Here is some helpful information when setting up DeepSpeed ZeRO Stage 3 with Lightning. - -* If you're using Adam or AdamW, ensure to use FusedAdam or DeepSpeedCPUAdam (for CPU Offloading) rather than the default torch optimizers as they come with large speed benefits -* Treat your GPU/CPU memory as one large pool. 
In some cases, you may not want to offload certain things (like activations) to provide even more space to offload model parameters -* When offloading to the CPU, make sure to bump up the batch size as GPU memory will be freed -* We also support sharded checkpointing. By passing ``save_full_weights=False`` to the ``DeepSpeedStrategy``, we'll save shards of the model which allows you to save extremely large models. However to load the model and run test/validation/predict you must use the Trainer object. - -.. _deepspeed-zero-stage-3-single-file: - -Collating Single File Checkpoint for DeepSpeed ZeRO Stage 3 -""""""""""""""""""""""""""""""""""""""""""""""""""""""""""" - -After training using ZeRO Stage 3, you'll notice that your checkpoints are a directory of sharded model and optimizer states. If you'd like to collate a single file from the checkpoint directory please use the below command, which handles all the Lightning states additionally when collating the file. - -.. code-block:: python - - from pytorch_lightning.utilities.deepspeed import convert_zero_checkpoint_to_fp32_state_dict - - # lightning deepspeed has saved a directory instead of a file - save_path = "lightning_logs/version_0/checkpoints/epoch=0-step=0.ckpt/" - output_path = "lightning_model.pt" - convert_zero_checkpoint_to_fp32_state_dict(save_path, output_path) - - -.. warning:: - - This single file checkpoint does not include the optimizer/lr-scheduler states. This means we cannot restore training via the ``trainer.fit(ckpt_path=)`` call. Ensure to keep the sharded checkpoint directory if this is required. - -Custom DeepSpeed Config -""""""""""""""""""""""" - -In some cases you may want to define your own DeepSpeed Config, to access all parameters defined. We've exposed most of the important parameters, however, there may be debugging parameters to enable. Also, DeepSpeed allows the use of custom DeepSpeed optimizers and schedulers defined within a config file that is supported. - -.. 
note:: - All strategy default parameters will be ignored when a config object is passed. - All compatible arguments can be seen in the `DeepSpeed docs `_. - -.. code-block:: python - - from pytorch_lightning import Trainer - from pytorch_lightning.strategies import DeepSpeedStrategy - - deepspeed_config = { - "zero_allow_untested_optimizer": True, - "optimizer": { - "type": "OneBitAdam", - "params": { - "lr": 3e-5, - "betas": [0.998, 0.999], - "eps": 1e-5, - "weight_decay": 1e-9, - "cuda_aware": True, - }, - }, - "scheduler": { - "type": "WarmupLR", - "params": { - "last_batch_iteration": -1, - "warmup_min_lr": 0, - "warmup_max_lr": 3e-5, - "warmup_num_steps": 100, - }, - }, - "zero_optimization": { - "stage": 2, # Enable Stage 2 ZeRO (Optimizer/Gradient state partitioning) - "offload_optimizer": True, # Enable Offloading optimizer state/calculation to the host CPU - "contiguous_gradients": True, # Reduce gradient fragmentation. - "overlap_comm": True, # Overlap reduce/backward operation of gradients for speed. - "allgather_bucket_size": 2e8, # Number of elements to all gather at once. - "reduce_bucket_size": 2e8, # Number of elements we reduce/allreduce at once. - }, - } - - model = MyModel() - trainer = Trainer(accelerator="gpu", devices=4, strategy=DeepSpeedStrategy(config=deepspeed_config), precision=16) - trainer.fit(model) - - -We support taking the config as a json formatted file: - -.. code-block:: python - - from pytorch_lightning import Trainer - from pytorch_lightning.strategies import DeepSpeedStrategy - - model = MyModel() - trainer = Trainer( - accelerator="gpu", devices=4, strategy=DeepSpeedStrategy(config="/path/to/deepspeed_config.json"), precision=16 - ) - trainer.fit(model) - - -You can also use an environment variable via your PyTorch Lightning script: - -.. code-block:: bash - - PL_DEEPSPEED_CONFIG_PATH=/path/to/deepspeed_config.json python train.py --strategy deepspeed - ----------- - -.. 
_ddp-optimizations: - -DDP Optimizations -^^^^^^^^^^^^^^^^^ - - -When Using DDP Strategies, Set find_unused_parameters=False -""""""""""""""""""""""""""""""""""""""""""""""""""""""""""" - -By default, we have set ``find_unused_parameters=True`` for compatibility reasons that have been observed in the past (refer to the `discussion `_ for more details). -When enabled, it can result in a performance hit and can be disabled in most cases. Read more about it `here `_. - -.. tip:: - It applies to all DDP strategies that support ``find_unused_parameters`` as input. - -.. code-block:: python - - from pytorch_lightning.strategies import DDPStrategy - - trainer = pl.Trainer( - accelerator="gpu", - devices=2, - strategy=DDPStrategy(find_unused_parameters=False), - ) - -.. code-block:: python - - from pytorch_lightning.strategies import DDPSpawnStrategy - - trainer = pl.Trainer( - accelerator="gpu", - devices=2, - strategy=DDPSpawnStrategy(find_unused_parameters=False), - ) - - -DDP Static Graph -"""""""""""""""" - -`DDP static graph `__ assumes that your model -employs the same set of used/unused parameters in every iteration, so that it can deterministically know the flow of -training and apply special optimizations during runtime. - -.. note:: - DDP static graph support requires PyTorch>=1.11.0 - -.. code-block:: python - - from pytorch_lightning import Trainer - from pytorch_lightning.strategies import DDPStrategy - - trainer = Trainer(devices=4, strategy=DDPStrategy(static_graph=True)) - - -When Using DDP on a Multi-node Cluster, Set NCCL Parameters -""""""""""""""""""""""""""""""""""""""""""""""""""""""""""" - -`NCCL `__ is the NVIDIA Collective Communications Library that is used by PyTorch to handle communication across nodes and GPUs. There are reported benefits in terms of speedups when adjusting NCCL parameters as seen in this `issue `__. 
In the issue, we see a 30% speed improvement when training the Transformer XLM-RoBERTa and a 15% improvement in training with Detectron2. - -NCCL parameters can be adjusted via environment variables. - -.. note:: - - AWS and GCP already set default values for these on their clusters. This is typically useful for custom cluster setups. - -* `NCCL_NSOCKS_PERTHREAD `__ -* `NCCL_SOCKET_NTHREADS `__ -* `NCCL_MIN_NCHANNELS `__ - -.. code-block:: bash - - export NCCL_NSOCKS_PERTHREAD=4 - export NCCL_SOCKET_NTHREADS=2 - - -Gradients as Bucket View -"""""""""""""""""""""""" - -Enabling ``gradient_as_bucket_view=True`` in the ``DDPStrategy`` will make gradients views that point to different offsets of the ``allreduce`` communication buckets. See :class:`~torch.nn.parallel.DistributedDataParallel` for more information. - -This can reduce peak memory usage and improve throughput: the saved memory will be equal to the total gradient memory, and it removes the need to copy gradients to the ``allreduce`` communication buckets. - -.. note:: - - When ``gradient_as_bucket_view=True`` you cannot call ``detach_()`` on gradients. If hitting such errors, please fix it by referring to the :meth:`~torch.optim.Optimizer.zero_grad` function in ``torch/optim/optimizer.py`` as a solution (`source `__). - -.. code-block:: python - - from pytorch_lightning import Trainer - from pytorch_lightning.strategies import DDPStrategy - - model = MyModel() - trainer = Trainer(accelerator="gpu", devices=4, strategy=DDPStrategy(gradient_as_bucket_view=True)) - trainer.fit(model) - -DDP Communication Hooks -""""""""""""""""""""""" - -DDP Communication hooks is an interface to control how gradients are communicated across workers, overriding the standard allreduce in DistributedDataParallel. This allows you to enable performance improving communication hooks when using multiple nodes. - -Enable `FP16 Compress Hook for multi-node throughput improvement `__: - -.. 
code-block:: python - - from pytorch_lightning import Trainer - from pytorch_lightning.strategies import DDPStrategy - from torch.distributed.algorithms.ddp_comm_hooks import default_hooks as default - - model = MyModel() - trainer = Trainer(accelerator="gpu", devices=4, strategy=DDPStrategy(ddp_comm_hook=default.fp16_compress_hook)) - trainer.fit(model) - -Enable `PowerSGD for multi-node throughput improvement `__: - -.. note:: - - PowerSGD typically requires extra memory of the same size as the model’s gradients to enable error feedback, which can compensate for biased compressed communication and improve accuracy (`source `__). - -.. code-block:: python - - from pytorch_lightning import Trainer - from pytorch_lightning.strategies import DDPStrategy - from torch.distributed.algorithms.ddp_comm_hooks import powerSGD_hook as powerSGD - - model = MyModel() - trainer = Trainer( - accelerator="gpu", - devices=4, - strategy=DDPStrategy( - ddp_comm_state=powerSGD.PowerSGDState( - process_group=None, - matrix_approximation_rank=1, - start_powerSGD_iter=5000, - ), - ddp_comm_hook=powerSGD.powerSGD_hook, - ), - ) - trainer.fit(model) - - -Combine hooks for accumulated benefit: - -.. note:: - DDP communication wrappers support requires PyTorch>=1.9.0 - -.. code-block:: python - - from pytorch_lightning import Trainer - from pytorch_lightning.strategies import DDPStrategy - from torch.distributed.algorithms.ddp_comm_hooks import ( - default_hooks as default, - powerSGD_hook as powerSGD, - ) - - model = MyModel() - trainer = Trainer( - accelerator="gpu", - devices=4, - strategy=DDPStrategy( - ddp_comm_state=powerSGD.PowerSGDState( - process_group=None, - matrix_approximation_rank=1, - start_powerSGD_iter=5000, - ), - ddp_comm_hook=powerSGD.powerSGD_hook, - ddp_comm_wrapper=default.fp16_compress_wrapper, - ), - ) - trainer.fit(model) - - -When using Post-localSGD, you must also pass ``model_averaging_period`` to allow for model parameter averaging: - -.. 
note:: - Post-localSGD support requires PyTorch>=1.10.0 - -.. code-block:: python - - from pytorch_lightning import Trainer - from pytorch_lightning.strategies import DDPStrategy - from torch.distributed.algorithms.ddp_comm_hooks import post_localSGD_hook as post_localSGD - - model = MyModel() - trainer = Trainer( - accelerator="gpu", - devices=4, - strategy=DDPStrategy( - ddp_comm_state=post_localSGD.PostLocalSGDState( - process_group=None, - subgroup=None, - start_localSGD_iter=8, - ), - ddp_comm_hook=post_localSGD.post_localSGD_hook, - model_averaging_period=4, - ), - ) - trainer.fit(model) diff --git a/docs/_sources/advanced/pruning_quantization.rst.txt b/docs/_sources/advanced/pruning_quantization.rst.txt deleted file mode 100644 index 552a96d..0000000 --- a/docs/_sources/advanced/pruning_quantization.rst.txt +++ /dev/null @@ -1,115 +0,0 @@ -.. _pruning_quantization: - -######################## -Pruning and Quantization -######################## - -Pruning and Quantization are techniques to compress model size for deployment, allowing inference speed up and energy saving without significant accuracy losses. - -******* -Pruning -******* - -.. warning:: - - Pruning is in beta and subject to change. - -Pruning is a technique which focuses on eliminating some of the model weights to reduce the model size and decrease inference requirements. - -Pruning has been shown to achieve significant efficiency improvements while minimizing the drop in model performance (prediction quality). Model pruning is recommended for cloud endpoints, deploying models on edge devices, or mobile inference (among others). - -To enable pruning during training in Lightning, simply pass in the :class:`~pytorch_lightning.callbacks.ModelPruning` callback to the Lightning Trainer. PyTorch's native pruning implementation is used under the hood. 
- -This callback supports multiple pruning functions: pass any `torch.nn.utils.prune `_ function as a string to select which weights to prune (`random_unstructured `_, `RandomStructured `_, etc) or implement your own by subclassing `BasePruningMethod `_. - -.. code-block:: python - - from pytorch_lightning.callbacks import ModelPruning - - # set the amount to be the fraction of parameters to prune - trainer = Trainer(callbacks=[ModelPruning("l1_unstructured", amount=0.5)]) - -You can also perform iterative pruning, apply the `lottery ticket hypothesis `__, and more! - -.. code-block:: python - - def compute_amount(epoch): - # the sum of all returned values need to be smaller than 1 - if epoch == 10: - return 0.5 - - elif epoch == 50: - return 0.25 - - elif 75 < epoch < 99: - return 0.01 - - - # the amount can be also be a callable - trainer = Trainer(callbacks=[ModelPruning("l1_unstructured", amount=compute_amount)]) - - -************ -Quantization -************ - -.. warning :: - Quantization is in beta and subject to change. - -Model quantization is another performance optimization technique that allows speeding up inference and decreasing memory requirements by performing computations and storing tensors at lower bitwidths (such as INT8 or FLOAT16) than floating-point precision. This is particularly beneficial during model deployment. - -Quantization Aware Training (QAT) mimics the effects of quantization during training: The computations are carried-out in floating-point precision but the subsequent quantization effect is taken into account. The weights and activations are quantized into lower precision only for inference, when training is completed. - -Quantization is useful when it is required to serve large models on machines with limited memory, or when there's a need to switch between models and reducing the I/O time is important. For example, switching between monolingual speech recognition models across multiple languages. 
- -Lightning includes :class:`~pytorch_lightning.callbacks.QuantizationAwareTraining` callback (using PyTorch's native quantization, read more `here `__), which allows creating fully quantized models (compatible with torchscript). - -.. code-block:: python - - from pytorch_lightning.callbacks import QuantizationAwareTraining - - - class RegressionModel(LightningModule): - def __init__(self): - super().__init__() - self.layer_0 = nn.Linear(16, 64) - self.layer_0a = torch.nn.ReLU() - self.layer_1 = nn.Linear(64, 64) - self.layer_1a = torch.nn.ReLU() - self.layer_end = nn.Linear(64, 1) - - def forward(self, x): - x = self.layer_0(x) - x = self.layer_0a(x) - x = self.layer_1(x) - x = self.layer_1a(x) - x = self.layer_end(x) - return x - - - trainer = Trainer(callbacks=[QuantizationAwareTraining()]) - qmodel = RegressionModel() - trainer.fit(qmodel, ...) - - batch = iter(my_dataloader()).next() - qmodel(qmodel.quant(batch[0])) - - tsmodel = qmodel.to_torchscript() - tsmodel(tsmodel.quant(batch[0])) - -You can further customize the callback: - -.. code-block:: python - - - qcb = QuantizationAwareTraining( - # specification of quant estimation quality - observer_type="histogram", - # specify which layers shall be merged together to increase efficiency - modules_to_fuse=[(f"layer_{i}", f"layer_{i}a") for i in range(2)], - # make your model compatible with all original input/outputs, in such case the model is wrapped in a shell with entry/exit layers. - input_compatible=True, - ) - - batch = iter(my_dataloader()).next() - qmodel(batch[0]) diff --git a/docs/_sources/advanced/strategy_registry.rst.txt b/docs/_sources/advanced/strategy_registry.rst.txt deleted file mode 100644 index d92069a..0000000 --- a/docs/_sources/advanced/strategy_registry.rst.txt +++ /dev/null @@ -1,49 +0,0 @@ -Strategy Registry -================= - -.. warning:: The Strategy Registry is experimental and subject to change. 
- -Lightning includes a registry that holds information about Training strategies and allows for the registration of new custom strategies. - -The Strategies are assigned strings that identify them, such as "ddp", "deepspeed_stage_2_offload", and so on. -It also returns the optional description and parameters for initialising the Strategy that were defined during registration. - - -.. code-block:: python - - # Training with the DDP Strategy with `find_unused_parameters` as False - trainer = Trainer(strategy="ddp_find_unused_parameters_false", accelerator="gpu", devices=4) - - # Training with DeepSpeed ZeRO Stage 3 and CPU Offload - trainer = Trainer(strategy="deepspeed_stage_3_offload", accelerator="gpu", devices=3) - - # Training with the TPU Spawn Strategy with `debug` as True - trainer = Trainer(strategy="tpu_spawn_debug", accelerator="tpu", devices=8) - - -Additionally, you can pass your custom registered training strategies to the ``strategy`` argument. - -.. code-block:: python - - from pytorch_lightning.strategies import DDPStrategy, StrategyRegistry, CheckpointIO - - - class CustomCheckpointIO(CheckpointIO): - def save_checkpoint(self, checkpoint: Dict[str, Any], path: Union[str, Path]) -> None: - ... - - def load_checkpoint(self, path: Union[str, Path]) -> Dict[str, Any]: - ... - - - custom_checkpoint_io = CustomCheckpointIO() - - # Register the DDP Strategy with your custom CheckpointIO plugin - StrategyRegistry.register( - "ddp_custom_checkpoint_io", - DDPStrategy, - description="DDP Strategy with custom checkpoint io plugin", - checkpoint_io=custom_checkpoint_io, - ) - - trainer = Trainer(strategy="ddp_custom_checkpoint_io", accelerator="gpu", devices=2) diff --git a/docs/_sources/advanced/training_tricks.rst.txt b/docs/_sources/advanced/training_tricks.rst.txt deleted file mode 100644 index a8d5c2d..0000000 --- a/docs/_sources/advanced/training_tricks.rst.txt +++ /dev/null @@ -1,356 +0,0 @@ -.. 
testsetup:: * - - from pytorch_lightning.callbacks import StochasticWeightAveraging - -.. _training_tricks: - -############################# -Effective Training Techniques -############################# - -Lightning implements various techniques to help during training that can help make the training smoother. - ----------- - -******************** -Accumulate Gradients -******************** - -.. include:: ../common/gradient_accumulation.rst - ----------- - -***************** -Gradient Clipping -***************** - -Gradient clipping can be enabled to avoid exploding gradients. By default, this will clip the gradient norm by calling -:func:`torch.nn.utils.clip_grad_norm_` computed over all model parameters together. -If the Trainer's ``gradient_clip_algorithm`` is set to ``'value'`` (``'norm'`` by default), this will use instead -:func:`torch.nn.utils.clip_grad_value_` for each parameter instead. - -.. note:: - If using mixed precision, the ``gradient_clip_val`` does not need to be changed as the gradients are unscaled - before applying the clipping function. - -.. seealso:: :class:`~pytorch_lightning.trainer.trainer.Trainer` - -.. testcode:: - - # DEFAULT (ie: don't clip) - trainer = Trainer(gradient_clip_val=0) - - # clip gradients' global norm to <=0.5 using gradient_clip_algorithm='norm' by default - trainer = Trainer(gradient_clip_val=0.5) - - # clip gradients' maximum magnitude to <=0.5 - trainer = Trainer(gradient_clip_val=0.5, gradient_clip_algorithm="value") - -Read more about :ref:`Configuring Gradient Clipping ` for advanced use-cases. - ----------- - -*************************** -Stochastic Weight Averaging -*************************** - -Stochastic Weight Averaging (SWA) can make your models generalize better at virtually no additional cost. -This can be used with both non-trained and trained models. The SWA procedure smooths the loss landscape thus making -it harder to end up in a local minimum during optimization. 
- -For a more detailed explanation of SWA and how it works, -read `this post `__ by the PyTorch team. - -.. seealso:: The :class:`~pytorch_lightning.callbacks.StochasticWeightAveraging` callback - -.. testcode:: - - # Enable Stochastic Weight Averaging using the callback - trainer = Trainer(callbacks=[StochasticWeightAveraging(swa_lrs=1e-2)]) - ----------- - -***************** -Batch Size Finder -***************** - -Auto-scaling of batch size can be enabled to find the largest batch size that fits into -memory. Large batch size often yields a better estimation of the gradients, but may also result in -longer training time. Inspired by https://github.com/BlackHC/toma. - -.. seealso:: :class:`~pytorch_lightning.trainer.trainer.Trainer` - -.. code-block:: python - - # DEFAULT (ie: don't scale batch size automatically) - trainer = Trainer(auto_scale_batch_size=None) - - # Autoscale batch size - trainer = Trainer(auto_scale_batch_size=None | "power" | "binsearch") - - # Find the batch size - trainer.tune(model) - -Currently, this feature supports two modes ``'power'`` scaling and ``'binsearch'`` -scaling. In ``'power'`` scaling, starting from a batch size of 1 keeps doubling -the batch size until an out-of-memory (OOM) error is encountered. Setting the -argument to ``'binsearch'`` will initially also try doubling the batch size until -it encounters an OOM, after which it will do a binary search that will finetune the -batch size. Additionally, it should be noted that the batch size scaler cannot -search for batch sizes larger than the size of the training dataset. - - -.. note:: - - This feature expects that a ``batch_size`` field is either located as a model attribute - i.e. ``model.batch_size`` or as a field in your ``hparams`` i.e. ``model.hparams.batch_size``. - Similarly it can work with datamodules too. The field should exist and will be updated by - the results of this algorithm. 
Additionally, your ``train_dataloader()`` method should depend - on this field for this feature to work i.e. - - .. code-block:: python - - # using LightningModule - class LitModel(LightningModule): - def __init__(self, batch_size): - super().__init__() - self.save_hyperparameters() - # or - self.batch_size = batch_size - - def train_dataloader(self): - return DataLoader(train_dataset, batch_size=self.batch_size | self.hparams.batch_size) - - - trainer = Trainer(...) - model = LitModel(batch_size=32) - trainer.tune(model) - - # using LightningDataModule - class LitDataModule(LightningDataModule): - def __init__(self, batch_size): - super().__init__() - self.save_hyperparameters() - # or - self.batch_size = batch_size - - def train_dataloader(self): - return DataLoader(train_dataset, batch_size=self.batch_size | self.hparams.batch_size) - - - trainer = Trainer(...) - model = MyModel() - datamodule = LitDataModule(batch_size=32) - trainer.tune(model, datamodule=datamodule) - -.. warning:: - - Due to the constraints listed above, this feature does *NOT* work when passing dataloaders directly - to ``.fit()``. - -The scaling algorithm has a number of parameters that the user can control by -invoking the :meth:`~pytorch_lightning.tuner.tuning.Tuner.scale_batch_size` method: - -.. code-block:: python - - # Use default in trainer construction - trainer = Trainer() - tuner = Tuner(trainer) - - # Invoke method - new_batch_size = tuner.scale_batch_size(model, *extra_parameters_here) - - # Override old batch size (this is done automatically) - model.hparams.batch_size = new_batch_size - - # Fit as normal - trainer.fit(model) - -The algorithm in short works by: - 1. Dumping the current state of the model and trainer - 2. Iteratively until convergence or maximum number of tries ``max_trials`` (default 25) has been reached: - - Call ``fit()`` method of trainer. This evaluates ``steps_per_trial`` (default 3) number of - optimization steps.
Each training step can trigger an OOM error if the tensors - (training batch, weights, gradients, etc.) allocated during the steps have a - too large memory footprint. - - If an OOM error is encountered, decrease batch size else increase it. - How much the batch size is increased/decreased is determined by the chosen - strategy. - 3. The found batch size is saved to either ``model.batch_size`` or ``model.hparams.batch_size`` - 4. Restore the initial state of model and trainer - -.. warning:: Batch size finder is not yet supported for DDP or any of its variations, it is coming soon. - ----------- - -.. _learning_rate_finder: - -******************** -Learning Rate Finder -******************** - -.. raw:: html - - - -| - -For training deep neural networks, selecting a good learning rate is essential -for both better performance and faster convergence. Even optimizers such as -:class:`~torch.optim.Adam` that are self-adjusting the learning rate can benefit from more optimal -choices. - -To reduce the amount of guesswork concerning choosing a good initial learning -rate, a `learning rate finder` can be used. As described in `this paper `_ -a learning rate finder does a small run where the learning rate is increased -after each processed batch and the corresponding loss is logged. The result of -this is a ``lr`` vs. ``loss`` plot that can be used as guidance for choosing an optimal -initial learning rate. - -.. warning:: - - For the moment, this feature only works with models having a single optimizer. - LR Finder support for DDP and any of its variations is not implemented yet. It is coming soon. - - -Using Lightning's built-in LR finder -==================================== - -To enable the learning rate finder, your :doc:`lightning module <../common/lightning_module>` needs to -have a ``learning_rate`` or ``lr`` attribute (or as a field in your ``hparams`` i.e. -``hparams.learning_rate`` or ``hparams.lr``). 
Then, set ``Trainer(auto_lr_find=True)`` -during trainer construction, and then call ``trainer.tune(model)`` to run the LR finder. -The suggested ``learning_rate`` will be written to the console and will be automatically -set to your :doc:`lightning module <../common/lightning_module>`, which can be accessed -via ``self.learning_rate`` or ``self.lr``. - -.. seealso:: :ref:`trainer.tune `. - -.. code-block:: python - - class LitModel(LightningModule): - def __init__(self, learning_rate): - super().__init__() - self.learning_rate = learning_rate - self.model = Model(...) - - def configure_optimizers(self): - return Adam(self.parameters(), lr=(self.lr or self.learning_rate)) - - - model = LitModel() - - # finds learning rate automatically - # sets hparams.lr or hparams.learning_rate to that learning rate - trainer = Trainer(auto_lr_find=True) - - trainer.tune(model) - -If your model is using an arbitrary value instead of ``self.lr`` or ``self.learning_rate``, set that value as ``auto_lr_find``: - -.. code-block:: python - - model = LitModel() - - # to set to your own hparams.my_value - trainer = Trainer(auto_lr_find="my_value") - - trainer.tune(model) - -You can also inspect the results of the learning rate finder or just play around -with the parameters of the algorithm. This can be done by invoking the -:meth:`~pytorch_lightning.tuner.tuning.Tuner.lr_find` method. A typical example of this would look like: - -.. code-block:: python - - model = MyModelClass(hparams) - trainer = Trainer() - - # Run learning rate finder - lr_finder = trainer.tuner.lr_find(model) - - # Results can be found in - print(lr_finder.results) - - # Plot with - fig = lr_finder.plot(suggest=True) - fig.show() - - # Pick point based on plot, or get suggestion - new_lr = lr_finder.suggestion() - - # update hparams of the model - model.hparams.lr = new_lr - - # Fit model - trainer.fit(model) - -The figure produced by ``lr_finder.plot()`` should look something like the figure -below. 
It is recommended to not pick the learning rate that achieves the lowest -loss, but instead something in the middle of the sharpest downward slope (red point). -This is the point returned by ``lr_finder.suggestion()``. - -.. figure:: ../_static/images/trainer/lr_finder.png - ----------- - -************************** -Advanced GPU Optimizations -************************** - -When training on single or multiple GPU machines, Lightning offers a host of advanced optimizations to improve throughput, memory efficiency, and model scaling. -Refer to :doc:`Advanced GPU Optimized Training <../advanced/model_parallel>` for more details. - ----------- - - -.. _ddp_spawn_shared_memory: - -****************************************** -Sharing Datasets Across Process Boundaries -****************************************** - -The :class:`~pytorch_lightning.core.datamodule.LightningDataModule` class provides an organized way to decouple data loading from training logic, with :meth:`~pytorch_lightning.core.hooks.DataHooks.prepare_data` being used for downloading and pre-processing the dataset on a single process, and :meth:`~pytorch_lightning.core.hooks.DataHooks.setup` loading the pre-processed data for each process individually: - -.. code-block:: python - - class MNISTDataModule(pl.LightningDataModule): - def prepare_data(self): - MNIST(self.data_dir, download=True) - - def setup(self, stage: Optional[str] = None): - self.mnist = MNIST(self.data_dir) - - def train_loader(self): - return DataLoader(self.mnist, batch_size=128) - -However, for in-memory datasets, that means that each process will hold a (redundant) replica of the dataset in memory, which may be impractical when using many processes while utilizing datasets that nearly fit into CPU memory, as the memory consumption will scale up linearly with the number of processes.
-For example, when training Graph Neural Networks, a common strategy is to load the entire graph into CPU memory for fast access to the entire graph structure and its features, and to then perform neighbor sampling to obtain mini-batches that fit onto the GPU. - -A simple way to prevent redundant dataset replicas is to rely on :obj:`torch.multiprocessing` to share the `data automatically between spawned processes via shared memory `_. -For this, all data pre-loading should be done on the main process inside :meth:`DataModule.__init__`. As a result, all tensor-data will get automatically shared when using the :class:`~pytorch_lightning.plugins.strategies.ddp_spawn.DDPSpawnStrategy` strategy. - -.. warning:: - - :obj:`torch.multiprocessing` will send a handle of each individual tensor to other processes. - In order to prevent any errors due to too many open file handles, try to reduce the number of tensors to share, *e.g.*, by stacking your data into a single tensor. - -.. code-block:: python - - class MNISTDataModule(pl.LightningDataModule): - def __init__(self, data_dir: str): - self.mnist = MNIST(data_dir, download=True, transform=T.ToTensor()) - - def train_loader(self): - return DataLoader(self.mnist, batch_size=128) - - - model = Model(...) - datamodule = MNISTDataModule("data/MNIST") - - trainer = Trainer(accelerator="gpu", devices=2, strategy="ddp_spawn") - trainer.fit(model, datamodule) - -See the `graph-level `_ and `node-level `_ prediction examples in PyTorch Geometric for practical use-cases. diff --git a/docs/_sources/advanced/transfer_learning.rst.txt b/docs/_sources/advanced/transfer_learning.rst.txt deleted file mode 100644 index caa739b..0000000 --- a/docs/_sources/advanced/transfer_learning.rst.txt +++ /dev/null @@ -1,128 +0,0 @@ -################# -Transfer Learning -################# -**Audience**: Users looking to use pretrained models with Lightning. 
- ----- - -************************* -Use any PyTorch nn.Module -************************* -Any model that is a PyTorch nn.Module can be used with Lightning (because LightningModules are nn.Modules also). - ----- - -******************************** -Use a pretrained LightningModule -******************************** -Let's use the `AutoEncoder` as a feature extractor in a separate model. - -.. testcode:: - - class Encoder(torch.nn.Module): - ... - - - class AutoEncoder(LightningModule): - def __init__(self): - self.encoder = Encoder() - self.decoder = Decoder() - - - class CIFAR10Classifier(LightningModule): - def __init__(self): - # init the pretrained LightningModule - self.feature_extractor = AutoEncoder.load_from_checkpoint(PATH) - self.feature_extractor.freeze() - - # the autoencoder outputs a 100-dim representation and CIFAR-10 has 10 classes - self.classifier = nn.Linear(100, 10) - - def forward(self, x): - representations = self.feature_extractor(x) - x = self.classifier(representations) - ... - -We used our pretrained Autoencoder (a LightningModule) for transfer learning! - ----- - -*********************************** -Example: Imagenet (Computer Vision) -*********************************** - -.. testcode:: - :skipif: not _TORCHVISION_AVAILABLE - - import torchvision.models as models - - - class ImagenetTransferLearning(LightningModule): - def __init__(self): - super().__init__() - - # init a pretrained resnet - backbone = models.resnet50(pretrained=True) - num_filters = backbone.fc.in_features - layers = list(backbone.children())[:-1] - self.feature_extractor = nn.Sequential(*layers) - - # use the pretrained model to classify cifar-10 (10 image classes) - num_target_classes = 10 - self.classifier = nn.Linear(num_filters, num_target_classes) - - def forward(self, x): - self.feature_extractor.eval() - with torch.no_grad(): - representations = self.feature_extractor(x).flatten(1) - x = self.classifier(representations) - ... - -Finetune - -.. 
code-block:: python - - model = ImagenetTransferLearning() - trainer = Trainer() - trainer.fit(model) - -And use it to predict your data of interest - -.. code-block:: python - - model = ImagenetTransferLearning.load_from_checkpoint(PATH) - model.freeze() - - x = some_images_from_cifar10() - predictions = model(x) - -We used a pretrained model on imagenet, finetuned on CIFAR-10 to predict on CIFAR-10. -In the non-academic world we would finetune on a tiny dataset you have and predict on your dataset. - ----- - -******************* -Example: BERT (NLP) -******************* -Lightning is completely agnostic to what's used for transfer learning so long -as it is a `torch.nn.Module` subclass. - -Here's a model that uses `Huggingface transformers `_. - -.. testcode:: - - class BertMNLIFinetuner(LightningModule): - def __init__(self): - super().__init__() - - self.bert = BertModel.from_pretrained("bert-base-cased", output_attentions=True) - self.W = nn.Linear(bert.config.hidden_size, 3) - self.num_classes = 3 - - def forward(self, input_ids, attention_mask, token_type_ids): - - h, _, attn = self.bert(input_ids=input_ids, attention_mask=attention_mask, token_type_ids=token_type_ids) - - h_cls = h[:, 0] - logits = self.W(h_cls) - return logits, attn diff --git a/docs/_sources/benchmarking/benchmarks.rst.txt b/docs/_sources/benchmarking/benchmarks.rst.txt deleted file mode 100644 index af9715f..0000000 --- a/docs/_sources/benchmarking/benchmarks.rst.txt +++ /dev/null @@ -1,19 +0,0 @@ -:orphan: - -Benchmark with vanilla PyTorch -============================== - -In this section we set grounds for comparison between vanilla PyTorch and PT Lightning for most common scenarios. - -Time comparison ---------------- - -We have set up regular benchmarking against the vanilla PyTorch training loop with an RNN and a simple MNIST classifier as part of our CI. -On average, for the simple MNIST CNN classifier we are only about 0.06s slower per epoch; see the detailed chart below. - -..
figure:: ../_static/images/benchmarks/figure-parity-times.png - :alt: Speed parity to vanilla PT, created on 2020-12-16 - :width: 500 - - -Learn more about reproducible benchmarking from the `PyTorch Reproducibility Guide `__. diff --git a/docs/_sources/cli/lightning_cli.rst.txt b/docs/_sources/cli/lightning_cli.rst.txt deleted file mode 100644 index 76f3f12..0000000 --- a/docs/_sources/cli/lightning_cli.rst.txt +++ /dev/null @@ -1,94 +0,0 @@ -:orphan: - -.. _lightning-cli: - -############################ -Eliminate config boilerplate -############################ - -********* -Basic use -********* - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: 1: Control it all from the CLI - :description: Learn to control a LightningModule and LightningDataModule from the CLI - :col_css: col-md-4 - :button_link: lightning_cli_intermediate.html - :height: 150 - :tag: intermediate - -.. displayitem:: - :header: 2: Mix models and datasets - :description: Register models, datasets, optimizers and learning rate schedulers - :col_css: col-md-4 - :button_link: lightning_cli_intermediate_2.html - :height: 150 - :tag: intermediate - -.. displayitem:: - :header: 3: Control it all via YAML - :description: Enable composable YAMLs - :col_css: col-md-4 - :button_link: lightning_cli_advanced.html - :height: 150 - :tag: advanced - -.. raw:: html - -
-
- ----- - -************ -Advanced use -************ - -.. raw:: html - -
-
- -.. displayitem:: - :header: YAML for production - :description: Use the Lightning CLI with YAMLs for production environments - :col_css: col-md-6 - :button_link: lightning_cli_advanced_2.html - :height: 150 - :tag: advanced - -.. displayitem:: - :header: Customize configs for complex projects - :description: Learn how to connect complex projects with each Registry. - :col_css: col-md-6 - :button_link: lightning_cli_advanced_3.html - :height: 150 - :tag: expert - -.. displayitem:: - :header: Extend the Lightning CLI - :description: Customize the Lightning CLI - :col_css: col-md-6 - :button_link: lightning_cli_expert.html - :height: 150 - :tag: expert - -.. displayitem:: - :header: FAQ - :description: Frequently asked questions about working with the Lightning CLI and YAML files - :col_css: col-md-6 - :button_link: lightning_cli_faq.html - :height: 150 - -.. raw:: html - -
-
diff --git a/docs/_sources/cli/lightning_cli_advanced.rst.txt b/docs/_sources/cli/lightning_cli_advanced.rst.txt deleted file mode 100644 index 2d4f330..0000000 --- a/docs/_sources/cli/lightning_cli_advanced.rst.txt +++ /dev/null @@ -1,113 +0,0 @@ -:orphan: - -####################################### -Eliminate config boilerplate (Advanced) -####################################### -**Audience:** Users looking to modularize their code for a professional project. - -**Pre-reqs:** You must have read :doc:`(Control it all from the CLI) `. - ----- - -*************************** -What is a yaml config file? -*************************** -A yaml is a standard configuration file that describes parameters for sections of a program. It is a common tool in engineering, and it has recently started to gain popularity in machine learning. - -.. code:: yaml - - # file.yaml - car: - max_speed:100 - max_passengers:2 - plane: - fuel_capacity: 50 - class_3: - option_1: 'x' - option_2: 'y' - ----- - - -********************* -Print the config used -********************* -Before or after you run a training routine, you can print the full training spec in yaml format using ``--print_config``: - -.. code:: bash - - python main.py fit --print_config - -which generates the following config: - -.. code:: bash - - seed_everything: null - trainer: - logger: true - ... - terminate_on_nan: null - model: - out_dim: 10 - learning_rate: 0.02 - data: - data_dir: ./ - ckpt_path: null - ----- - -******************************** -Write a config yaml from the CLI -******************************** -To have a copy of the configuration that produced this model, save a *yaml* file from the *--print_config* outputs: - -.. code:: bash - - python main.py fit --model.learning_rate 0.001 --print_config > config.yaml - ----- - -********************** -Run from a single yaml -********************** -To run from a yaml, pass a yaml produced with ``--print_config`` to the ``--config`` argument: - -.. 
code:: bash - - python main.py fit --config config.yaml - -when using a yaml to run, you can still pass in inline arguments - -.. code:: bash - - python main.py fit --config config.yaml --trainer.max_epochs 100 - ----- - -****************** -Compose yaml files -****************** -For production or complex research projects it's advisable to have each object in its own config file. To compose all the configs, pass them all inline: - -.. code-block:: bash - - $ python trainer.py fit --config trainer.yaml --config datamodules.yaml --config models.yaml ... - -The configs will be parsed sequentially. Let's say we have two configs with the same args: - -.. code:: yaml - - # trainer.yaml - trainer: - num_epochs: 10 - - - # trainer_2.yaml - trainer: - num_epochs: 20 - -the ones from the last config will be used (num_epochs = 20) in this case: - -.. code-block:: bash - - $ python trainer.py fit --config trainer.yaml --config trainer_2.yaml diff --git a/docs/_sources/cli/lightning_cli_advanced_2.rst.txt b/docs/_sources/cli/lightning_cli_advanced_2.rst.txt deleted file mode 100644 index 0474699..0000000 --- a/docs/_sources/cli/lightning_cli_advanced_2.rst.txt +++ /dev/null @@ -1,207 +0,0 @@ -:orphan: - -.. 
testsetup:: * - :skipif: not _JSONARGPARSE_AVAILABLE - - import torch - from unittest import mock - from typing import List - import pytorch_lightning as pl - from pytorch_lightning import LightningModule, LightningDataModule, Trainer, Callback - - - class NoFitTrainer(Trainer): - def fit(self, *_, **__): - pass - - - class LightningCLI(pl.utilities.cli.LightningCLI): - def __init__(self, *args, trainer_class=NoFitTrainer, run=False, **kwargs): - super().__init__(*args, trainer_class=trainer_class, run=run, **kwargs) - - - class MyModel(LightningModule): - def __init__( - self, - encoder_layers: int = 12, - decoder_layers: List[int] = [2, 4], - batch_size: int = 8, - ): - pass - - - class MyDataModule(LightningDataModule): - def __init__(self, batch_size: int = 8): - self.num_classes = 5 - - - mock_argv = mock.patch("sys.argv", ["any.py"]) - mock_argv.start() - -.. testcleanup:: * - - mock_argv.stop() - -####################################### -Eliminate config boilerplate (Advanced) -####################################### - -****************************** -Customize arguments by command -****************************** -To customize arguments by subcommand, pass the config *before* the subcommand: - -.. code-block:: bash - - $ python main.py [before] [subcommand] [after] - $ python main.py ... fit ... - -For example, here we set the Trainer argument [max_steps = 100] for the full training routine and [max_epochs = 10] for testing: - -.. code-block:: bash - - # config1.yaml - fit: - trainer: - max_steps: 100 - test: - trainer: - max_epochs: 10 - -now you can toggle this behavior by subcommand: - -.. code-block:: bash - - # full routine with max_steps = 100 - $ python main.py --config config1.yaml fit - - # test only with max_epochs = 10 - $ python main.py --config config1.yaml test - ----- - -********************* -Use groups of options -********************* -Groups of options can also be given as independent config files: - -..
code-block:: bash - - $ python trainer.py fit --trainer trainer.yaml --model model.yaml --data data.yaml [...] - ----- - -*************************** -Run from cloud yaml configs -*************************** -For certain enterprise workloads, Lightning CLI supports running from hosted configs: - -.. code-block:: bash - - $ python trainer.py [subcommand] --config s3://bucket/config.yaml - -For more options, refer to :doc:`Remote filesystems <../common/remote_fs>`. - ----- - -************************************** -Use a config via environment variables -************************************** -For certain CI/CD systems, it's useful to pass in config files as environment variables: - -.. code-block:: bash - - $ python trainer.py fit --trainer "$TRAINER_CONFIG" --model "$MODEL_CONFIG" [...] - ----- - -*************************************** -Run from environment variables directly -*************************************** -The Lightning CLI can convert every possible CLI flag into an environment variable. To enable this, set the *env_parse* argument: - -.. code:: python - - LightningCLI(env_parse=True) - -now use the ``--help`` CLI flag with any subcommand: - -.. code:: bash - - $ python main.py fit --help - -which will show you ALL possible environment variables you can now set: - -.. code:: bash - - usage: main.py [options] fit [-h] [-c CONFIG] - [--trainer.max_epochs MAX_EPOCHS] [--trainer.min_epochs MIN_EPOCHS] - [--trainer.max_steps MAX_STEPS] [--trainer.min_steps MIN_STEPS] - ... - [--ckpt_path CKPT_PATH] - - optional arguments: - ... - --model CONFIG Path to a configuration file. - --model.out_dim OUT_DIM - (type: int, default: 10) - --model.learning_rate LEARNING_RATE - (type: float, default: 0.02) - -now you can customize the behavior via environment variables: - -.. 
code:: bash - - # set the options via env vars - $ export LEARNING_RATE=0.01 - $ export OUT_DIM=5 - - $ python main.py fit - ----- - -************************ -Set default config files -************************ -To set a path to a config file of defaults, use the ``default_config_files`` argument: - -.. testcode:: - - cli = LightningCLI(MyModel, MyDataModule, parser_kwargs={"default_config_files": ["my_cli_defaults.yaml"]}) - -or if you want defaults per subcommand: - -.. testcode:: - - cli = LightningCLI(MyModel, MyDataModule, parser_kwargs={"fit": {"default_config_files": ["my_fit_defaults.yaml"]}}) - -For more configuration options, refer to the `ArgumentParser API -`_ documentation. - ----- - -***************************** -Enable variable interpolation -***************************** -In certain cases where multiple configs need to share variables, consider using variable interpolation. Variable interpolation -allows you to add variables to your yaml configs like so: - -.. code-block:: yaml - - model: - encoder_layers: 12 - decoder_layers: - - ${model.encoder_layers} - - 4 - -To enable variable interpolation, first install omegaconf: - -.. code:: bash - - pip install omegaconf - -Once this is installed, the Lightning CLI will automatically handle variables in yaml files: - -.. code:: bash - - python main.py --model.encoder_layers=12 diff --git a/docs/_sources/cli/lightning_cli_advanced_3.rst.txt b/docs/_sources/cli/lightning_cli_advanced_3.rst.txt deleted file mode 100644 index 2eeae17..0000000 --- a/docs/_sources/cli/lightning_cli_advanced_3.rst.txt +++ /dev/null @@ -1,415 +0,0 @@ -:orphan: - -..
testsetup:: * - :skipif: not _JSONARGPARSE_AVAILABLE - - import torch - from unittest import mock - from typing import List - import pytorch_lightning as pl - from pytorch_lightning import LightningModule, LightningDataModule, Trainer, Callback - - - class NoFitTrainer(Trainer): - def fit(self, *_, **__): - pass - - - class LightningCLI(pl.utilities.cli.LightningCLI): - def __init__(self, *args, trainer_class=NoFitTrainer, run=False, **kwargs): - super().__init__(*args, trainer_class=trainer_class, run=run, **kwargs) - - - class MyModel(LightningModule): - def __init__( - self, - encoder_layers: int = 12, - decoder_layers: List[int] = [2, 4], - batch_size: int = 8, - ): - pass - - - class MyDataModule(LightningDataModule): - def __init__(self, batch_size: int = 8): - self.num_classes = 5 - - - MyModelBaseClass = MyModel - MyDataModuleBaseClass = MyDataModule - - mock_argv = mock.patch("sys.argv", ["any.py"]) - mock_argv.start() - -.. testcleanup:: * - - mock_argv.stop() - -Instantiation only mode -^^^^^^^^^^^^^^^^^^^^^^^ - -The CLI is designed to start fitting with minimal code changes. On class instantiation, the CLI will automatically -call the trainer function associated with the subcommand provided so you don't have to do it. -To avoid this, you can set the following argument: - -.. testcode:: - - cli = LightningCLI(MyModel, run=False) # True by default - # you'll have to call fit yourself: - cli.trainer.fit(cli.model) - -In this mode, subcommands are **not** added to the parser. -This can be useful to implement custom logic without having to subclass the CLI, but still using the CLI's instantiation -and argument parsing capabilities. - - -Subclass registration -^^^^^^^^^^^^^^^^^^^^^ - -To use shorthand notation, the options need to be registered beforehand. This can be easily done with: - -.. 
code-block:: - - LightningCLI(auto_registry=True) # False by default - -which will register all subclasses of :class:`torch.optim.Optimizer`, :class:`torch.optim.lr_scheduler._LRScheduler`, -:class:`~pytorch_lightning.core.lightning.LightningModule`, -:class:`~pytorch_lightning.core.datamodule.LightningDataModule`, :class:`~pytorch_lightning.callbacks.Callback`, and -:class:`~pytorch_lightning.loggers.LightningLoggerBase` across all imported modules. This includes those in your own -code. - -Alternatively, if this is left unset, only the subclasses defined in PyTorch's :class:`torch.optim.Optimizer`, -:class:`torch.optim.lr_scheduler._LRScheduler` and Lightning's :class:`~pytorch_lightning.callbacks.Callback` and -:class:`~pytorch_lightning.loggers.LightningLoggerBase` subclasses will be registered. - -In subsequent sections, we will go over adding specific classes to specific registries as well as how to use -shorthand notation. - - -Trainer Callbacks and arguments with class type -^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ - -A very important argument of the :class:`~pytorch_lightning.trainer.trainer.Trainer` class is the :code:`callbacks`. In -contrast to other, simpler arguments which just require numbers or strings, :code:`callbacks` expects a list of -instances of subclasses of :class:`~pytorch_lightning.callbacks.Callback`. To specify this kind of argument in a config -file, each callback must be given as a dictionary including a :code:`class_path` entry with an import path of the class, -and optionally an :code:`init_args` entry with arguments required to instantiate it. Therefore, a simple configuration -file example that defines a couple of callbacks is the following: - -.. code-block:: yaml - - trainer: - callbacks: - - class_path: pytorch_lightning.callbacks.EarlyStopping - init_args: - patience: 5 - - class_path: pytorch_lightning.callbacks.LearningRateMonitor - init_args: - ... 
- -Similar to the callbacks, any arguments in :class:`~pytorch_lightning.trainer.trainer.Trainer` and user extended -:class:`~pytorch_lightning.core.lightning.LightningModule` and -:class:`~pytorch_lightning.core.datamodule.LightningDataModule` classes that have as type hint a class can be configured -the same way using :code:`class_path` and :code:`init_args`. - -For callbacks in particular, Lightning simplifies the command line so that only -the :class:`~pytorch_lightning.callbacks.Callback` name is required. -The argument's order matters and the user needs to pass the arguments in the following way. - -.. code-block:: bash - - $ python ... \ - --trainer.callbacks={CALLBACK_1_NAME} \ - --trainer.callbacks.{CALLBACK_1_ARGS_1}=... \ - --trainer.callbacks.{CALLBACK_1_ARGS_2}=... \ - ... - --trainer.callbacks={CALLBACK_N_NAME} \ - --trainer.callbacks.{CALLBACK_N_ARGS_1}=... \ - ... - -Here is an example: - -.. code-block:: bash - - $ python ... \ - --trainer.callbacks=EarlyStopping \ - --trainer.callbacks.patience=5 \ - --trainer.callbacks=LearningRateMonitor \ - --trainer.callbacks.logging_interval=epoch - -Lightning provides a mechanism for you to add your own callbacks and benefit from the command line simplification -as described above: - -.. code-block:: python - - from pytorch_lightning.utilities.cli import CALLBACK_REGISTRY - - - @CALLBACK_REGISTRY - class CustomCallback(Callback): - ... - - - cli = LightningCLI(...) - -.. code-block:: bash - - $ python ... --trainer.callbacks=CustomCallback ... - -.. note:: - - This shorthand notation is only supported in the shell and not inside a configuration file. The configuration file - generated by calling the previous command with ``--print_config`` will have the ``class_path`` notation. - - .. code-block:: yaml - - trainer: - callbacks: - - class_path: your_class_path.CustomCallback - init_args: - ... - - -.. 
tip:: - - ``--trainer.logger`` also supports shorthand notation and a ``LOGGER_REGISTRY`` is available to register custom - Loggers. - - -Multiple models and/or datasets -^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ - -Additionally, the tool can be configured such that a model and/or a datamodule is -specified by an import path and init arguments. For example, with a tool implemented as: - -.. code-block:: python - - cli = LightningCLI(MyModelBaseClass, MyDataModuleBaseClass, subclass_mode_model=True, subclass_mode_data=True) - -A possible config file could be as follows: - -.. code-block:: yaml - - model: - class_path: mycode.mymodels.MyModel - init_args: - decoder_layers: - - 2 - - 4 - encoder_layers: 12 - data: - class_path: mycode.mydatamodules.MyDataModule - init_args: - ... - trainer: - callbacks: - - class_path: pytorch_lightning.callbacks.EarlyStopping - init_args: - patience: 5 - ... - -Only model classes that are a subclass of :code:`MyModelBaseClass` would be allowed, and similarly only subclasses of -:code:`MyDataModuleBaseClass`. If as base classes :class:`~pytorch_lightning.core.lightning.LightningModule` and -:class:`~pytorch_lightning.core.datamodule.LightningDataModule` are given, then the tool would allow any lightning -module and data module. - -.. tip:: - - Note that with the subclass modes the :code:`--help` option does not show information for a specific subclass. To - get help for a subclass the options :code:`--model.help` and :code:`--data.help` can be used, followed by the - desired class path. Similarly :code:`--print_config` does not include the settings for a particular subclass. To - include them the class path should be given before the :code:`--print_config` option. Examples for both help and - print config are: - - .. 
code-block:: bash - - $ python trainer.py fit --model.help mycode.mymodels.MyModel - $ python trainer.py fit --model mycode.mymodels.MyModel --print_config - - -Models with multiple submodules -^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ - -Many use cases require to have several modules each with its own configurable options. One possible way to handle this -with LightningCLI is to implement a single module having as init parameters each of the submodules. Since the init -parameters have as type a class, then in the configuration these would be specified with :code:`class_path` and -:code:`init_args` entries. For instance a model could be implemented as: - -.. testcode:: - - class MyMainModel(LightningModule): - def __init__(self, encoder: nn.Module, decoder: nn.Module): - """Example encoder-decoder submodules model - - Args: - encoder: Instance of a module for encoding - decoder: Instance of a module for decoding - """ - super().__init__() - self.encoder = encoder - self.decoder = decoder - -If the CLI is implemented as :code:`LightningCLI(MyMainModel)` the configuration would be as follows: - -.. code-block:: yaml - - model: - encoder: - class_path: mycode.myencoders.MyEncoder - init_args: - ... - decoder: - class_path: mycode.mydecoders.MyDecoder - init_args: - ... - -It is also possible to combine :code:`subclass_mode_model=True` and submodules, thereby having two levels of -:code:`class_path`. - - -Class type defaults -^^^^^^^^^^^^^^^^^^^ - -The support for classes as type hints allows to try many possibilities with the same CLI. This is a useful feature, but -it can make it tempting to use an instance of a class as a default. For example: - -.. code-block:: - - class MyMainModel(LightningModule): - def __init__( - self, - backbone: torch.nn.Module = MyModel(encoder_layers=24), # BAD PRACTICE! - ): - super().__init__() - self.backbone = backbone - -Normally classes are mutable as it is in this case. 
The instance of :code:`MyModel` would be created the moment that the -module that defines :code:`MyMainModel` is first imported. This means that the default of :code:`backbone` will be -initialized before the CLI class runs :code:`seed_everything` making it non-reproducible. Furthermore, if -:code:`MyMainModel` is used more than once in the same Python process and the :code:`backbone` parameter is not -overridden, the same instance would be used in multiple places which very likely is not what the developer intended. -Having an instance as default also makes it impossible to generate the complete config file since for arbitrary classes -it is not known which arguments were used to instantiate it. - -A good solution to these problems is to not have a default or set the default to a special value (e.g. a -string) which would be checked in the init and instantiated accordingly. If a class parameter has no default and the CLI -is subclassed then a default can be set as follows: - -.. testcode:: - - default_backbone = { - "class_path": "import.path.of.MyModel", - "init_args": { - "encoder_layers": 24, - }, - } - - - class MyLightningCLI(LightningCLI): - def add_arguments_to_parser(self, parser): - parser.set_defaults({"model.backbone": default_backbone}) - -A more compact version that avoids writing a dictionary would be: - -.. testcode:: - - from jsonargparse import lazy_instance - - - class MyLightningCLI(LightningCLI): - def add_arguments_to_parser(self, parser): - parser.set_defaults({"model.backbone": lazy_instance(MyModel, encoder_layers=24)}) - -Optimizers -^^^^^^^^^^ - -If you will not be changing the class, you can manually add the arguments for specific optimizers and/or -learning rate schedulers by subclassing the CLI. This has the advantage of providing the proper help message for those -classes. The following code snippet shows how to implement it: - -.. 
testcode:: - - class MyLightningCLI(LightningCLI): - def add_arguments_to_parser(self, parser): - parser.add_optimizer_args(torch.optim.Adam) - parser.add_lr_scheduler_args(torch.optim.lr_scheduler.ExponentialLR) - -With this, in the config the :code:`optimizer` and :code:`lr_scheduler` groups would accept all of the options for the -given classes, in this example :code:`Adam` and :code:`ExponentialLR`. -Therefore, the config file would be structured like: - -.. code-block:: yaml - - optimizer: - lr: 0.01 - lr_scheduler: - gamma: 0.2 - model: - ... - trainer: - ... - -Where the arguments can be passed directly through command line without specifying the class. For example: - -.. code-block:: bash - - $ python trainer.py fit --optimizer.lr=0.01 --lr_scheduler.gamma=0.2 - -The automatic implementation of :code:`configure_optimizers` can be disabled by linking the configuration group. An -example can be when one wants to add support for multiple optimizers: - -.. code-block:: python - - from pytorch_lightning.utilities.cli import instantiate_class - - - class MyModel(LightningModule): - def __init__(self, optimizer1_init: dict, optimizer2_init: dict): - super().__init__() - self.optimizer1_init = optimizer1_init - self.optimizer2_init = optimizer2_init - - def configure_optimizers(self): - optimizer1 = instantiate_class(self.parameters(), self.optimizer1_init) - optimizer2 = instantiate_class(self.parameters(), self.optimizer2_init) - return [optimizer1, optimizer2] - - - class MyLightningCLI(LightningCLI): - def add_arguments_to_parser(self, parser): - parser.add_optimizer_args( - OPTIMIZER_REGISTRY.classes, nested_key="gen_optimizer", link_to="model.optimizer1_init" - ) - parser.add_optimizer_args( - OPTIMIZER_REGISTRY.classes, nested_key="gen_discriminator", link_to="model.optimizer2_init" - ) - - - cli = MyLightningCLI(MyModel) - -The value given to :code:`optimizer*_init` will always be a dictionary including :code:`class_path` and -:code:`init_args` entries. 
The function :func:`~pytorch_lightning.utilities.cli.instantiate_class` -takes care of importing the class defined in :code:`class_path` and instantiating it using some positional arguments, -in this case :code:`self.parameters()`, and the :code:`init_args`. -Any number of optimizers and learning rate schedulers can be added when using :code:`link_to`. - -With shorthand notation: - -.. code-block:: bash - - $ python trainer.py fit \ - --gen_optimizer=Adam \ - --gen_optimizer.lr=0.01 \ - --gen_discriminator=AdamW \ - --gen_discriminator.lr=0.0001 - -You can also pass the class path directly, for example, if the optimizer hasn't been registered to the -``OPTIMIZER_REGISTRY``: - -.. code-block:: bash - - $ python trainer.py fit \ - --gen_optimizer.class_path=torch.optim.Adam \ - --gen_optimizer.init_args.lr=0.01 \ - --gen_discriminator.class_path=torch.optim.AdamW \ - --gen_discriminator.init_args.lr=0.0001 diff --git a/docs/_sources/cli/lightning_cli_expert.rst.txt b/docs/_sources/cli/lightning_cli_expert.rst.txt deleted file mode 100644 index dbd6061..0000000 --- a/docs/_sources/cli/lightning_cli_expert.rst.txt +++ /dev/null @@ -1,266 +0,0 @@ -:orphan: - -.. 
testsetup:: * - :skipif: not _JSONARGPARSE_AVAILABLE - - import torch - from unittest import mock - from typing import List - import pytorch_lightning as pl - from pytorch_lightning import LightningModule, LightningDataModule, Trainer, Callback - - - class NoFitTrainer(Trainer): - def fit(self, *_, **__): - pass - - - class LightningCLI(pl.utilities.cli.LightningCLI): - def __init__(self, *args, trainer_class=NoFitTrainer, run=False, **kwargs): - super().__init__(*args, trainer_class=trainer_class, run=run, **kwargs) - - - class MyModel(LightningModule): - def __init__( - self, - encoder_layers: int = 12, - decoder_layers: List[int] = [2, 4], - batch_size: int = 8, - ): - pass - - - class MyClassModel(LightningModule): - def __init__(self, num_classes: int): - pass - - - class MyDataModule(LightningDataModule): - def __init__(self, batch_size: int = 8): - self.num_classes = 5 - - - def send_email(address, message): - pass - - - mock_argv = mock.patch("sys.argv", ["any.py"]) - mock_argv.start() - -.. testcleanup:: * - - mock_argv.stop() - -####################################### -Eliminate config boilerplate (Advanced) -####################################### -**Audience:** Users who already understand the LightningCLI and want to customize it. - ----- - -************************** -Customize the LightningCLI -************************** - -The init parameters of the :class:`~pytorch_lightning.utilities.cli.LightningCLI` class can be used to customize some -things, namely: the description of the tool, enabling parsing of environment variables and additional arguments to -instantiate the trainer and configuration parser. - -Nevertheless the init arguments are not enough for many use cases. For this reason the class is designed so that it can be -extended to customize different parts of the command line tool. 
The argument parser class used by -:class:`~pytorch_lightning.utilities.cli.LightningCLI` is -:class:`~pytorch_lightning.utilities.cli.LightningArgumentParser` which is an extension of Python's argparse, thus -adding arguments can be done using the :func:`add_argument` method. In contrast to argparse it has additional methods to -add arguments, for example :func:`add_class_arguments` adds all arguments from the init of a class, though requiring -parameters to have type hints. For more details about this please refer to the `respective documentation -`_. - -The :class:`~pytorch_lightning.utilities.cli.LightningCLI` class has the -:meth:`~pytorch_lightning.utilities.cli.LightningCLI.add_arguments_to_parser` method which can be implemented to include -more arguments. After parsing, the configuration is stored in the :code:`config` attribute of the class instance. The -:class:`~pytorch_lightning.utilities.cli.LightningCLI` class also has two methods that can be used to run code before -and after the trainer runs: :code:`before_<subcommand>` and :code:`after_<subcommand>`. -A realistic example for these would be to send an email before and after the execution. -The code for the :code:`fit` subcommand would be something like: - -.. testcode:: - - class MyLightningCLI(LightningCLI): - def add_arguments_to_parser(self, parser): - parser.add_argument("--notification_email", default="will@email.com") - - def before_fit(self): - send_email(address=self.config["notification_email"], message="trainer.fit starting") - - def after_fit(self): - send_email(address=self.config["notification_email"], message="trainer.fit finished") - - - cli = MyLightningCLI(MyModel) - -Note that the config object :code:`self.config` is a dictionary whose keys are global options or groups of options. It -has the same structure as the yaml format described previously. This means for instance that the parameters used for -instantiating the trainer class can be found in :code:`self.config['fit']['trainer']`. - -.. 
tip:: - - Have a look at the :class:`~pytorch_lightning.utilities.cli.LightningCLI` class API reference to learn about other - methods that can be extended to customize a CLI. - ----- - -************************** -Configure forced callbacks -************************** -As explained previously, any Lightning callback can be added by passing it through command line or -including it in the config via :code:`class_path` and :code:`init_args` entries. - -However, certain callbacks MUST be coupled with a model so they are always present and configurable. -This can be implemented as follows: - -.. testcode:: - - from pytorch_lightning.callbacks import EarlyStopping - - - class MyLightningCLI(LightningCLI): - def add_arguments_to_parser(self, parser): - parser.add_lightning_class_args(EarlyStopping, "my_early_stopping") - parser.set_defaults({"my_early_stopping.monitor": "val_loss", "my_early_stopping.patience": 5}) - - - cli = MyLightningCLI(MyModel) - -To change the configuration of the :code:`EarlyStopping` in the config it would be: - -.. code-block:: yaml - - model: - ... - trainer: - ... - my_early_stopping: - patience: 5 - -.. note:: - - The example above overrides a default in :code:`add_arguments_to_parser`. This is included to show that defaults can - be changed if needed. However, note that overriding of defaults in the source code is not intended to be used to - store the best hyperparameters for a task after experimentation. To ease reproducibility the source code should be - stable. It is better practice to store the best hyperparameters for a task in a configuration file independent from - the source code. - ----- - -******************* -Class type defaults -******************* - -The support for classes as type hints allows to try many possibilities with the same CLI. This is a useful feature, but -it can make it tempting to use an instance of a class as a default. For example: - -.. 
testcode:: - - class MyMainModel(LightningModule): - def __init__( - self, - backbone: torch.nn.Module = MyModel(encoder_layers=24), # BAD PRACTICE! - ): - super().__init__() - self.backbone = backbone - -Normally classes are mutable as it is in this case. The instance of :code:`MyModel` would be created the moment that the -module that defines :code:`MyMainModel` is first imported. This means that the default of :code:`backbone` will be -initialized before the CLI class runs :code:`seed_everything` making it non-reproducible. Furthermore, if -:code:`MyMainModel` is used more than once in the same Python process and the :code:`backbone` parameter is not -overridden, the same instance would be used in multiple places which very likely is not what the developer intended. -Having an instance as default also makes it impossible to generate the complete config file since for arbitrary classes -it is not known which arguments were used to instantiate it. - -A good solution to these problems is to not have a default or set the default to a special value (e.g. a -string) which would be checked in the init and instantiated accordingly. If a class parameter has no default and the CLI -is subclassed then a default can be set as follows: - -.. testcode:: - - default_backbone = { - "class_path": "import.path.of.MyModel", - "init_args": { - "encoder_layers": 24, - }, - } - - - class MyLightningCLI(LightningCLI): - def add_arguments_to_parser(self, parser): - parser.set_defaults({"model.backbone": default_backbone}) - -A more compact version that avoids writing a dictionary would be: - -.. 
testcode:: - - from jsonargparse import lazy_instance - - - class MyLightningCLI(LightningCLI): - def add_arguments_to_parser(self, parser): - parser.set_defaults({"model.backbone": lazy_instance(MyModel, encoder_layers=24)}) - ----- - -************************ -Connect two config files -************************ -Another case in which it might be desired to extend :class:`~pytorch_lightning.utilities.cli.LightningCLI` is that the -model and data module depend on a common parameter. For example in some cases both classes require to know the -:code:`batch_size`. It is a burden and error prone giving the same value twice in a config file. To avoid this the -parser can be configured so that a value is only given once and then propagated accordingly. With a tool implemented -like shown below, the :code:`batch_size` only has to be provided in the :code:`data` section of the config. - -.. testcode:: - - class MyLightningCLI(LightningCLI): - def add_arguments_to_parser(self, parser): - parser.link_arguments("data.batch_size", "model.batch_size") - - - cli = MyLightningCLI(MyModel, MyDataModule) - -The linking of arguments is observed in the help of the tool, which for this example would look like: - -.. code-block:: bash - - $ python trainer.py fit --help - ... - --data.batch_size BATCH_SIZE - Number of samples in a batch (type: int, default: 8) - - Linked arguments: - model.batch_size <-- data.batch_size - Number of samples in a batch (type: int) - -Sometimes a parameter value is only available after class instantiation. An example could be that your model requires -the number of classes to instantiate its fully connected layer (for a classification task) but the value is not -available until the data module has been instantiated. The code below illustrates how to address this. - -.. 
testcode:: - - class MyLightningCLI(LightningCLI): - def add_arguments_to_parser(self, parser): - parser.link_arguments("data.num_classes", "model.num_classes", apply_on="instantiate") - - - cli = MyLightningCLI(MyClassModel, MyDataModule) - -Instantiation links are used to automatically determine the order of instantiation, in this case data first. - -.. tip:: - - The linking of arguments can be used for more complex cases. For example to derive a value via a function that takes - multiple settings as input. For more details have a look at the API of `link_arguments - `_. - - -The linking of arguments is intended for things that are meant to be non-configurable. This improves the CLI user -experience since it avoids the need for providing more parameters. A related concept is -variable interpolation which in contrast keeps things being configurable. diff --git a/docs/_sources/cli/lightning_cli_faq.rst.txt b/docs/_sources/cli/lightning_cli_faq.rst.txt deleted file mode 100644 index ca1be71..0000000 --- a/docs/_sources/cli/lightning_cli_faq.rst.txt +++ /dev/null @@ -1,136 +0,0 @@ -:orphan: - -.. testsetup:: * - :skipif: not _JSONARGPARSE_AVAILABLE - - import torch - from unittest import mock - from typing import List - import pytorch_lightning as pl - from pytorch_lightning import LightningModule, LightningDataModule, Trainer, Callback - - - class NoFitTrainer(Trainer): - def fit(self, *_, **__): - pass - - - class LightningCLI(pl.utilities.cli.LightningCLI): - def __init__(self, *args, trainer_class=NoFitTrainer, run=False, **kwargs): - super().__init__(*args, trainer_class=trainer_class, run=run, **kwargs) - - - class MyModel(LightningModule): - def __init__( - self, - encoder_layers: int = 12, - decoder_layers: List[int] = [2, 4], - batch_size: int = 8, - ): - pass - - - mock_argv = mock.patch("sys.argv", ["any.py"]) - mock_argv.start() - -.. 
testcleanup:: * - - mock_argv.stop() - -##################################### -Eliminate config boilerplate (expert) -##################################### - -*************** -Troubleshooting -*************** -The standard behavior for CLIs, when they fail, is to terminate the process with a non-zero exit code and a short message -to hint the user about the cause. This is problematic while developing the CLI since there is no information to track -down the root of the problem. A simple change in the instantiation of the ``LightningCLI`` can be used such that when -there is a failure an exception is raised and the full stack trace printed. - -.. testcode:: - - cli = LightningCLI(MyModel, parser_kwargs={"error_handler": None}) - -.. note:: - - When asking about problems and reporting issues please set the ``error_handler`` to ``None`` and include the stack - trace in your description. With this, it is more likely for people to help out identifying the cause without needing - to create a reproducible script. - ----- - -************************************* -Reproducibility with the LightningCLI -************************************* -The topic of reproducibility is complex and it is impossible to guarantee reproducibility by just providing a class that -people can use in unexpected ways. Nevertheless, the :class:`~pytorch_lightning.utilities.cli.LightningCLI` tries to -give a framework and recommendations to make reproducibility simpler. - -When an experiment is run, it is good practice to use a stable version of the source code, either being a released -package or at least a commit of some version controlled repository. For each run of a CLI the config file is -automatically saved including all settings. This is useful to figure out what was done for a particular run without -requiring to look at the source code. 
If by mistake the exact version of the source code is lost or some defaults -changed, having the full config means that most of the information is preserved. - -The class is targeted at implementing CLIs because running a command from a shell provides a separation with the Python -source code. Ideally the CLI would be placed in your path as part of the installation of a stable package, instead of -running from a clone of a repository that could have uncommitted local modifications. Creating installable packages that -include CLIs is out of the scope of this document. This is mentioned only as a teaser for people who would strive for -the best practices possible. - - -For every CLI implemented, users are encouraged to learn how to run it by reading the documentation printed with the -:code:`--help` option and use the :code:`--print_config` option to guide the writing of config files. A few more details -that might not be clear by only reading the help are the following. - -:class:`~pytorch_lightning.utilities.cli.LightningCLI` is based on argparse and as such follows the same arguments style -as many POSIX command line tools. Long options are prefixed with two dashes and their corresponding values should be -provided after a space or an equal sign, as :code:`--option value` or :code:`--option=value`. Command line options -are parsed from left to right, therefore if a setting appears multiple times the rightmost value will override -the previous ones. If a class has an init parameter that is required (i.e. no default value), it is given as -:code:`--option` which makes it explicit and more readable instead of relying on positional arguments. - ----- - -********************* -What is a subcommand? -********************* -A subcommand is the action the LightningCLI applies to the script: - -.. code:: bash - - python main.py [subcommand] - -See the available subcommands with: - -.. code:: bash - - python main.py --help - -which prints: - -.. 
code:: bash - - ... - - fit Runs the full optimization routine. - validate Perform one evaluation epoch over the validation set. - test Perform one evaluation epoch over the test set. - predict Run inference on your data. - tune Runs routines to tune hyperparameters before training. - -use a subcommand as follows: - -.. code:: bash - - python main.py fit - python main.py test - ----- - -**************** -What is the CLI? -**************** -CLI is short for commandline interface. Use your terminal to enter these commands. diff --git a/docs/_sources/cli/lightning_cli_intermediate.rst.txt b/docs/_sources/cli/lightning_cli_intermediate.rst.txt deleted file mode 100644 index 36c6adb..0000000 --- a/docs/_sources/cli/lightning_cli_intermediate.rst.txt +++ /dev/null @@ -1,204 +0,0 @@ -:orphan: - -########################################### -Eliminate config boilerplate (Intermediate) -########################################### -**Audience:** Users who want advanced modularity via the commandline interface (CLI). - -**Pre-reqs:** You must already understand how to use a commandline and :doc:`LightningDataModule <../data/datamodule>`. - ----- - -*************************** -What is config boilerplate? -*************************** -As Lightning projects grow in complexity it becomes desirable to enable full customizability from the commandline (CLI) so you can -change any hyperparameters without changing your code: - -.. code:: bash - - # Mix and match anything - $ python main.py --command fit --model.learning_rate 0.02 - $ python main.py --command fit --model.learning_rate 0.01 --trainer.fast_dev_run True - -This is what the Lightning CLI enables. Without the Lightning CLI, you usually end up with a TON of boilerplate that looks like this: - -.. 
code:: python - - from argparse import ArgumentParser - - if __name__ == "__main__": - parser = ArgumentParser() - parser.add_argument("--learning_rate_1", default=0.02) - parser.add_argument("--learning_rate_2", default=0.03) - parser.add_argument("--model", default="cnn") - parser.add_argument("--command", default="fit") - parser.add_argument("--run_fast", default=True) - ... - # add 100 more of these - ... - - args = parser.parse_args() - - if args.model == "cnn": - model = ConvNet(learning_rate=args.learning_rate_1) - elif args.model == "transformer": - model = Transformer(learning_rate=args.learning_rate_2) - trainer = Trainer(fast_dev_run=args.run_fast) - ... - - if args.command == "fit": - trainer.fit() - elif args.command == "test": - ... - -This kind of boilerplate is unsustainable as projects grow in complexity. - ----- - -************************ -Enable the Lightning CLI -************************ -To enable the Lightning CLI install the extras: - -.. code:: bash - - pip install pytorch-lightning[extra] - -if the above fails, only install jsonargparse: - -.. code:: bash - - pip install -U jsonargparse[signatures] - ----- - -************************** -Connect a model to the CLI -************************** -The simplest way to control a model with the CLI is to wrap it in the LightningCLI object: - -.. 
code:: python - - # main.py - - import torch - from pytorch_lightning.utilities.cli import LightningCLI - from pytorch_lightning import LightningModule, demos - - - class DemoModel(LightningModule): - def __init__(self, out_dim: int = 10, learning_rate: float = 0.02): - super().__init__() - self.l1 = torch.nn.Linear(32, out_dim) - self.learning_rate = learning_rate - - def forward(self, x): - return torch.relu(self.l1(x.view(x.size(0), -1))) - - def training_step(self, batch, batch_nb): - x = batch - x = self(x) - loss = x.sum() - return loss - - def configure_optimizers(self): - return torch.optim.Adam(self.parameters(), lr=self.learning_rate) - - - cli = LightningCLI(DemoModel, demos.BoringDataModule) - # don't call fit!! - -Now your model can be managed via the CLI. To see the available commands type: - -.. code:: bash - - $ python main.py --help - -Which prints out: - -.. code:: bash - - usage: a.py [-h] [-c CONFIG] [--print_config [={comments,skip_null,skip_default}+]] - {fit,validate,test,predict,tune} ... - - pytorch-lightning trainer command line tool - - optional arguments: - -h, --help Show this help message and exit. - -c CONFIG, --config CONFIG - Path to a configuration file in json or yaml format. - --print_config [={comments,skip_null,skip_default}+] - Print configuration and exit. - - subcommands: - For more details of each subcommand add it as argument followed by --help. - - {fit,validate,test,predict,tune} - fit Runs the full optimization routine. - validate Perform one evaluation epoch over the validation set. - test Perform one evaluation epoch over the test set. - predict Run inference on your data. - tune Runs routines to tune hyperparameters before training. - - -the message tells us that we have a few available subcommands: - -.. code:: bash - - python main.py [subcommand] - -which you can use depending on your use case: - -.. 
code:: bash - - $ python main.py fit - $ python main.py validate - $ python main.py test - $ python main.py predict - $ python main.py tune - ----- - -************************** -Train a model with the CLI -************************** -To run the full training routine (train, val, test), use the subcommand ``fit``: - -.. code:: bash - - python main.py fit - -View all available options with the ``--help`` command: - -.. code:: bash - - usage: main.py [options] fit [-h] [-c CONFIG] - [--seed_everything SEED_EVERYTHING] [--trainer CONFIG] - ... - [--ckpt_path CKPT_PATH] - --trainer.logger LOGGER - - optional arguments: - : - --model.out_dim OUT_DIM - (type: int, default: 10) - --model.learning_rate LEARNING_RATE - (type: float, default: 0.02) - : - --data CONFIG Path to a configuration file. - --data.data_dir DATA_DIR - (type: str, default: ./) - -With the Lightning CLI enabled, you can now change the parameters without touching your code: - -.. code:: bash - - # change the out dimensions - python main.py fit --model.out_dim 30 - - # change the learning_rate also - python main.py fit --model.out_dim 10 --model.learning_rate 0.1 - - # change trainer and data arguments too - python main.py fit --model.out_dim 2 --model.learning_rate 0.1 --data.data_dir '~/' --trainer.logger False diff --git a/docs/_sources/cli/lightning_cli_intermediate_2.rst.txt b/docs/_sources/cli/lightning_cli_intermediate_2.rst.txt deleted file mode 100644 index 493d536..0000000 --- a/docs/_sources/cli/lightning_cli_intermediate_2.rst.txt +++ /dev/null @@ -1,251 +0,0 @@ -:orphan: - -########################################### -Eliminate config boilerplate (intermediate) -########################################### -**Audience:** Users who have multiple models and datasets per project. - -**Pre-reqs:** You must have read :doc:`(Control it all from the CLI) `.
- ----- - -**************************************** -Why do I want to mix models and datasets -**************************************** -Lightning projects usually begin with one model and one dataset. As the project grows in complexity and you introduce more models and more datasets, it becomes desirable -to mix any model with any dataset directly from the commandline without changing your code. - - -.. code:: bash - - # Mix and match anything - $ python main.py fit --model=GAN --data=MNIST - $ python main.py fit --model=Transformer --data=MNIST - -This is what the Lightning CLI enables. Otherwise, this kind of configuration requires a significant amount of boilerplate that often looks like this: - -.. code:: python - - # choose model - if args.model == "gan": - model = GAN(args.feat_dim) - elif args.model == "transformer": - model = Transformer(args.feat_dim) - ... - - # choose datamodule - if args.data == "MNIST": - datamodule = MNIST() - elif args.data == "imagenet": - datamodule = Imagenet() - ... - - # mix them! - trainer.fit(model, datamodule) - ----- - -************************* -Register LightningModules -************************* -Connect models across different files with the ``MODEL_REGISTRY`` to make them available from the CLI: - -.. code:: python - - # main.py - - from pytorch_lightning import demos - from pytorch_lightning.utilities import cli as pl_cli - - - @pl_cli.MODEL_REGISTRY - class Model1(demos.DemoModel): - def configure_optimizers(self): - print("⚡", "using Model1", "⚡") - return super().configure_optimizers() - - - @pl_cli.MODEL_REGISTRY - class Model2(demos.DemoModel): - def configure_optimizers(self): - print("⚡", "using Model2", "⚡") - return super().configure_optimizers() - - - cli = pl_cli.LightningCLI(datamodule_class=demos.BoringDataModule) - -Now you can choose between any model from the CLI: - -.. 
code:: bash - - # use Model1 - python main.py fit --model Model1 - - # use Model2 - python main.py fit --model Model2 - ----- - -******************** -Register DataModules -******************** -Connect DataModules across different files with the ``DATAMODULE_REGISTRY`` to make them available from the CLI: - -.. code:: python - - # main.py - import torch - from pytorch_lightning.utilities import cli as pl_cli - from pytorch_lightning import demos - - - @pl_cli.DATAMODULE_REGISTRY - class FakeDataset1(demos.BoringDataModule): - def train_dataloader(self): - print("⚡", "using FakeDataset1", "⚡") - return torch.utils.data.DataLoader(self.random_train) - - - @pl_cli.DATAMODULE_REGISTRY - class FakeDataset2(demos.BoringDataModule): - def train_dataloader(self): - print("⚡", "using FakeDataset2", "⚡") - return torch.utils.data.DataLoader(self.random_train) - - - cli = pl_cli.LightningCLI(demos.DemoModel) - -Now you can choose between any dataset at runtime: - -.. code:: bash - - # use FakeDataset1 - python main.py fit --data FakeDataset1 - - # use FakeDataset2 - python main.py fit --data FakeDataset2 - ----- - -******************* -Register optimizers -******************* -Connect optimizers with the ``OPTIMIZER_REGISTRY`` to make them available from the CLI: - -.. code:: python - - # main.py - import torch - from pytorch_lightning.utilities import cli as pl_cli - from pytorch_lightning import demos - - - @pl_cli.OPTIMIZER_REGISTRY - class LitAdam(torch.optim.Adam): - def step(self, closure): - print("⚡", "using LitAdam", "⚡") - super().step(closure) - - - @pl_cli.OPTIMIZER_REGISTRY - class FancyAdam(torch.optim.Adam): - def step(self, closure): - print("⚡", "using FancyAdam", "⚡") - super().step(closure) - - - cli = pl_cli.LightningCLI(demos.DemoModel, demos.BoringDataModule) - -Now you can choose between any optimizer at runtime: - -..
code:: bash - - # use LitAdam - python main.py fit --optimizer LitAdam - - # use FancyAdam - python main.py fit --optimizer FancyAdam - -Bonus: If you need only 1 optimizer, the Lightning CLI already works out of the box with any Optimizer from ``torch.optim``: - -.. code:: bash - - python main.py fit --optimizer AdamW - -If the optimizer you want needs other arguments, add them via the CLI (no need to change your code)! - -.. code:: bash - - python main.py fit --optimizer SGD --optimizer.lr=0.01 - ----- - -********************** -Register LR schedulers -********************** -Connect learning rate schedulers with the ``LR_SCHEDULER_REGISTRY`` to make them available from the CLI: - -.. code:: python - - # main.py - import torch - from pytorch_lightning.utilities import cli as pl_cli - from pytorch_lightning import demos - - - @pl_cli.LR_SCHEDULER_REGISTRY - class LitLRScheduler(torch.optim.lr_scheduler.CosineAnnealingLR): - def step(self): - print("⚡", "using LitLRScheduler", "⚡") - super().step() - - - cli = pl_cli.LightningCLI(demos.DemoModel, demos.BoringDataModule) - -Now you can choose between any learning rate scheduler at runtime: - -.. code:: bash - - # use LitLRScheduler - python main.py fit --lr_scheduler LitLRScheduler - - -Bonus: If you need only 1 LRScheduler, the Lightning CLI already works out of the box with any LRScheduler from ``torch.optim.lr_scheduler``: - -.. code:: bash - - python main.py fit --lr_scheduler CosineAnnealingLR - python main.py fit --lr_scheduler LinearLR - ... - -If the scheduler you want needs other arguments, add them via the CLI (no need to change your code)! - -.. code:: bash - - python main.py fit --lr_scheduler=ReduceLROnPlateau --lr_scheduler.monitor=epoch - ----- - -************************* -Register from any package -************************* -A shortcut to register many classes from a package is to use the ``register_classes`` method. Here we register all optimizers from the ``torch.optim`` library: - -..
code:: python - - import torch - from pytorch_lightning.utilities import cli as pl_cli - from pytorch_lightning import demos - - # add all PyTorch optimizers! - pl_cli.OPTIMIZER_REGISTRY.register_classes(module=torch.optim, base_cls=torch.optim.Optimizer) - - cli = pl_cli.LightningCLI(demos.DemoModel, demos.BoringDataModule) - -Now use any of the optimizers in the ``torch.optim`` library: - -.. code:: bash - - python main.py fit --optimizer AdamW - -This method is supported by all the registry classes. diff --git a/docs/_sources/clouds/cloud_training.rst.txt b/docs/_sources/clouds/cloud_training.rst.txt deleted file mode 100644 index 1bd57b1..0000000 --- a/docs/_sources/clouds/cloud_training.rst.txt +++ /dev/null @@ -1,86 +0,0 @@ -.. _grid: - -################## -Train on the cloud -################## -**Audience:** Users who want to develop and train models on the cloud (public cloud, private cloud or onprem clusters). - ----- - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: 1: Access a GPU machine on the cloud - :description: Learn to train models using an interactive cloud machine. - :col_css: col-md-4 - :button_link: session_basic.html - :height: 200 - :tag: basic - -.. displayitem:: - :header: 2: Run a model in the background on the cloud - :description: Learn to run a model in the background on a cloud machine. - :col_css: col-md-4 - :button_link: run_basic.html - :height: 200 - :tag: intermediate - -.. displayitem:: - :header: 3: Save up to 80% on cloud costs with fault-tolerant training - :description: Run on the cloud for 1/10th the price with fault-tolerant training. - :col_css: col-md-4 - :button_link: fault_tolerant_training_basic.html - :height: 200 - :tag: intermediate - -.. displayitem:: - :header: 4: Run many models at once - :description: Run many models at once (sweep) to find the best performing model. - :col_css: col-md-4 - :button_link: run_intermediate.html - :height: 200 - :tag: intermediate - -.. displayitem:: - :header: 5: Run on your own cloud - :description: Learn how to run on your Company or University private clouds. - :col_css: col-md-4 - :button_link: run_expert.html - :height: 200 - :tag: expert - -.. raw:: html - -
-
- ----- - -.. raw:: html - -
-
- -.. raw:: html - - - - -.. raw:: html - -
-
- -`Grid.ai `_ is the official cloud training solution for PyTorch Lightning. Grid is designed to support researcher workloads at both academic labs and major companies. - -.. raw:: html - -
-
diff --git a/docs/_sources/clouds/cloud_training_intermediate.rst.txt b/docs/_sources/clouds/cloud_training_intermediate.rst.txt deleted file mode 100644 index c5a65d7..0000000 --- a/docs/_sources/clouds/cloud_training_intermediate.rst.txt +++ /dev/null @@ -1,7 +0,0 @@ -:orphan: - -.. _grid_cloud_intermediate: - -################################# -Train on the cloud (intermediate) -################################# diff --git a/docs/_sources/clouds/cluster.rst.txt b/docs/_sources/clouds/cluster.rst.txt deleted file mode 100644 index 59a252a..0000000 --- a/docs/_sources/clouds/cluster.rst.txt +++ /dev/null @@ -1,48 +0,0 @@ -######################### -Run on an on-prem cluster -######################### - - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Run on an on-prem cluster - :description: Learn to train models on a general compute cluster. - :col_css: col-md-6 - :button_link: cluster_intermediate_1.html - :height: 150 - :tag: intermediate - -.. displayitem:: - :header: Run with Torch Distributed - :description: Run models on a cluster with torch distributed. - :col_css: col-md-6 - :button_link: cluster_intermediate_2.html - :height: 150 - :tag: intermediate - -.. displayitem:: - :header: Run on a SLURM cluster - :description: Run models on a SLURM-managed cluster - :col_css: col-md-6 - :button_link: cluster_advanced.html - :height: 150 - :tag: intermediate - -.. displayitem:: - :header: Integrate your own cluster - :description: Learn how to integrate your own cluster - :col_css: col-md-6 - :button_link: cluster_expert.html - :height: 150 - :tag: expert - -.. raw:: html - -
-
diff --git a/docs/_sources/clouds/cluster_advanced.rst.txt b/docs/_sources/clouds/cluster_advanced.rst.txt deleted file mode 100644 index 918bf06..0000000 --- a/docs/_sources/clouds/cluster_advanced.rst.txt +++ /dev/null @@ -1,213 +0,0 @@ -#################################### -Run on an on-prem cluster (advanced) -#################################### - -.. _slurm: - ----- - -****************************** -Run on a SLURM managed cluster -****************************** -Lightning automates the details behind training on a SLURM-powered cluster. In contrast to the general purpose -cluster above, the user does not start the jobs manually on each node and instead submits it to SLURM which -schedules the resources and time for which the job is allowed to run. - ----- - -*************************** -Design your training script -*************************** - -To train a model using multiple nodes, do the following: - -1. Design your :ref:`lightning_module` (no need to add anything specific here). - -2. Enable DDP in the trainer - - .. code-block:: python - - # train on 32 GPUs across 4 nodes - trainer = Trainer(accelerator="gpu", devices=8, num_nodes=4, strategy="ddp") - -3. It's a good idea to structure your training script like this: - - .. testcode:: - - # train.py - def main(hparams): - model = LightningTemplateModel(hparams) - - trainer = Trainer(accelerator="gpu", devices=8, num_nodes=4, strategy="ddp") - - trainer.fit(model) - - - if __name__ == "__main__": - root_dir = os.path.dirname(os.path.realpath(__file__)) - parser = ArgumentParser(add_help=False) - hyperparams = parser.parse_args() - - # TRAIN - main(hyperparams) - -4. Create the appropriate SLURM job: - - ..
code-block:: bash - - # (submit.sh) - #!/bin/bash -l - - # SLURM SUBMIT SCRIPT - #SBATCH --nodes=4 - #SBATCH --gres=gpu:8 - #SBATCH --ntasks-per-node=8 - #SBATCH --mem=0 - #SBATCH --time=0-02:00:00 - - # activate conda env - source activate $1 - - # debugging flags (optional) - export NCCL_DEBUG=INFO - export PYTHONFAULTHANDLER=1 - - # on your cluster you might need these: - # set the network interface - # export NCCL_SOCKET_IFNAME=^docker0,lo - - # might need the latest CUDA - # module load NCCL/2.4.7-1-cuda.10.0 - - # run script from above - srun python3 train.py - -5. If you want auto-resubmit (read below), add this line to the submit.sh script - - .. code-block:: bash - - #SBATCH --signal=SIGUSR1@90 - -6. Submit the SLURM job - - .. code-block:: bash - - sbatch submit.sh - ----- - -*********************************** -Enable auto wall-time resubmissions -*********************************** -When you use Lightning in a SLURM cluster, it automatically detects when it is about -to run into the wall time and does the following: - -1. Saves a temporary checkpoint. -2. Requeues the job. -3. When the job starts, it loads the temporary checkpoint. - -To get this behavior make sure to add the correct signal to your SLURM script - -.. code-block:: bash - - # 90 seconds before training ends - #SBATCH --signal=SIGUSR1@90 - -If auto-resubmit is not desired, it can be turned off in the :class:`~pytorch_lightning.plugins.environments.slurm_environment.SLURMEnvironment` plugin: - -.. code-block:: python - - from pytorch_lightning.plugins.environments import SLURMEnvironment - - trainer = Trainer(plugins=[SLURMEnvironment(auto_requeue=False)]) - ----- - -*********************** -Build your SLURM script -*********************** -Instead of manually building SLURM scripts, you can use the -`SlurmCluster object `_ -to do this for you. The SlurmCluster can also run a grid search if you pass -in a `HyperOptArgumentParser -`_.
- -Here is an example where you run a grid search of 9 combinations of hyperparameters. -See also the multi-node examples -`here `__. - -.. code-block:: python - - # grid search 3 values of learning rate and 3 values of number of layers for your net - # this generates 9 experiments (lr=1e-3, layers=16), (lr=1e-3, layers=32), - # (lr=1e-3, layers=64), ... (lr=1e-1, layers=64) - parser = HyperOptArgumentParser(strategy="grid_search", add_help=False) - parser.opt_list("--learning_rate", default=0.001, type=float, options=[1e-3, 1e-2, 1e-1], tunable=True) - parser.opt_list("--layers", default=1, type=float, options=[16, 32, 64], tunable=True) - hyperparams = parser.parse_args() - - # Slurm cluster submits 9 jobs, each with a set of hyperparams - cluster = SlurmCluster( - hyperparam_optimizer=hyperparams, - log_path="/some/path/to/save", - ) - - # OPTIONAL FLAGS WHICH MAY BE CLUSTER DEPENDENT - # which interface your nodes use for communication - cluster.add_command("export NCCL_SOCKET_IFNAME=^docker0,lo") - - # see the output of the NCCL connection process - # NCCL is how the nodes talk to each other - cluster.add_command("export NCCL_DEBUG=INFO") - - # setting a main port here is a good idea. - cluster.add_command("export MASTER_PORT=%r" % PORT) - - # ************** DON'T FORGET THIS *************** - # MUST load the latest NCCL version - cluster.load_modules(["NCCL/2.4.7-1-cuda.10.0"]) - - # configure cluster - cluster.per_experiment_nb_nodes = 12 - cluster.per_experiment_nb_gpus = 8 - - cluster.add_slurm_cmd(cmd="ntasks-per-node", value=8, comment="1 task per gpu") - - # submit a script with 9 combinations of hyper params - # (lr=1e-3, layers=16), (lr=1e-3, layers=32), (lr=1e-3, layers=64), ... 
(lr=1e-1, layers=64) - cluster.optimize_parallel_cluster_gpu( - main, nb_trials=9, job_name="name_for_squeue" # how many permutations of the grid search to run - ) - - -The other option is that you generate scripts on your own via a bash command or use our -:doc:`native solution <../clouds/cloud_training>`. - ----- - -******** -Get help -******** -Setting up a cluster for distributed training is not trivial. Lightning offers lightning-grid which allows you to configure a cluster easily and run experiments via the CLI and web UI. - -Try it out for free today: - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Train models on the cloud - :description: Learn to run a model in the background on a cloud machine. - :col_css: col-md-6 - :button_link: cloud_training.html - :height: 150 - :tag: intermediate - -.. raw:: html - -
-
bool: - """Return True if the cluster is managed (you don't launch processes yourself)""" - return True - - def world_size(self) -> int: - return int(os.environ["WORLD_SIZE"]) - - def global_rank(self) -> int: - return int(os.environ["RANK"]) - - def local_rank(self) -> int: - return int(os.environ["LOCAL_RANK"]) - - def node_rank(self) -> int: - return int(os.environ["NODE_RANK"]) - - def main_address(self) -> str: - return os.environ["MASTER_ADDRESS"] - - def main_port(self) -> int: - return int(os.environ["MASTER_PORT"]) - - - trainer = Trainer(plugins=[MyClusterEnvironment()]) - ----- - -******** -Get help -******** -Setting up a cluster for distributed training is not trivial. Lightning offers lightning-grid which allows you to configure a cluster easily and run experiments via the CLI and web UI. - -Try it out for free today: - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Train models on the cloud - :description: Learn to run a model in the background on a cloud machine. - :col_css: col-md-6 - :button_link: cloud_training.html - :height: 150 - :tag: intermediate - -.. raw:: html - -
-
`_. and requires the following environment variables to be defined on each node: - -- *MASTER_PORT* - required; has to be a free port on machine with NODE_RANK 0 -- *MASTER_ADDR* - required (except for NODE_RANK 0); address of NODE_RANK 0 node -- *WORLD_SIZE* - required; how many nodes are in the cluster -- *NODE_RANK* - required; id of the node in the cluster - -.. _training_script_setup: - ----- - -************************* -Setup the training script -************************* -To train a model using multiple nodes, do the following: - -1. Design your :ref:`lightning_module` (no need to add anything specific here). - -2. Enable DDP in the trainer - - .. code-block:: python - - # train on 32 GPUs across 4 nodes - trainer = Trainer(accelerator="gpu", devices=8, num_nodes=4, strategy="ddp") - ----- - -*************************** -Submit a job to the cluster -*************************** -To submit a training job to the cluster you need to run the same training script on each node of the cluster. -This means that you need to: - -1. Copy all third-party libraries to each node (usually means - distribute requirements.txt file and install it). -2. Copy all your import dependencies and the script itself to each node. -3. Run the script on each node. - ----- - -****************** -Debug on a cluster -****************** -When running in DDP mode, some errors in your code can show up as an NCCL issue. -Set the ``NCCL_DEBUG=INFO`` environment variable to see the ACTUAL error. - -.. code-block:: bash - - NCCL_DEBUG=INFO python train.py ... - ----- - -******** -Get help -******** -Setting up a cluster for distributed training is not trivial. Lightning offers lightning-grid which allows you to configure a cluster easily and run experiments via the CLI and web UI. - -Try it out for free today: - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Train models on the cloud - :description: Learn to run a model in the background on a cloud machine. - :col_css: col-md-6 - :button_link: cloud_training.html - :height: 150 - :tag: intermediate - -.. raw:: html - -
-
`__ provides helper functions to set up distributed environment variables from the `PyTorch distributed communication package `__ that need to be defined on each node. - -Once the script is set up as described in :ref:`Training Script Setup <training_script_setup>`, you can run the below command across your nodes to start multi-node training. - -Like a custom cluster, you have to ensure that there is network connectivity between the nodes with firewall rules that allow traffic flow on a specified *MASTER_PORT*. - -Finally, you'll need to decide which node you'd like to be the main node (*MASTER_ADDR*), and the ranks of each node (*NODE_RANK*). - -For example: - -* *MASTER_ADDR* 10.10.10.16 -* *MASTER_PORT* 29500 -* *NODE_RANK* 0 for the first node, 1 for the second node - -Run the below command with the appropriate variables set on each node. - -.. code-block:: bash - - python -m torch.distributed.run - --nnodes=2 # number of nodes you'd like to run with - --master_addr - --master_port - --node_rank - train.py (--arg1 ... train script args...) - -.. note:: - - ``torch.distributed.run`` assumes that you'd like to spawn a process per GPU if GPU devices are found on the node. This can be adjusted with ``--nproc_per_node``. - ----- - -******** -Get help -******** -Setting up a cluster for distributed training is not trivial. Lightning offers lightning-grid which allows you to configure a cluster easily and run experiments via the CLI and web UI. - -Try it out for free today: - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Train models on the cloud - :description: Learn to run a model in the background on a cloud machine. - :col_css: col-md-6 - :button_link: cloud_training.html - :height: 150 - :tag: intermediate - -.. raw:: html - -
-
`. - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Basic - :description: Save money with fault-tolerant training on the cloud - :col_css: col-md-4 - :button_link: fault_tolerant_training_basic.html - :height: 150 - :tag: basic - -.. displayitem:: - :header: Expert - :description: Learn how to enable fault tolerance on any cloud or cluster environment - :col_css: col-md-4 - :button_link: fault_tolerant_training_expert.html - :height: 150 - :tag: expert - -.. displayitem:: - :header: FAQ - :description: Frequently asked questions about fault-tolerant training. - :col_css: col-md-4 - :button_link: fault_tolerant_training_faq.html - :height: 150 - -.. raw:: html - -
-
diff --git a/docs/_sources/clouds/fault_tolerant_training_basic.rst.txt b/docs/_sources/clouds/fault_tolerant_training_basic.rst.txt deleted file mode 100644 index d5af9ed..0000000 --- a/docs/_sources/clouds/fault_tolerant_training_basic.rst.txt +++ /dev/null @@ -1,43 +0,0 @@ -:orphan: - -############################### -Fault-tolerant Training (basic) -############################### -**Audience:** Users who want to run on the cloud or a cluster environment. - -**Pre-requisites**: Users must have first read :doc:`Run on the cloud (basic) ` - ----- - -******************************** -What is fault-tolerant training? -******************************** -When developing models on the cloud or cluster environments, you may be forced to restart from scratch in the event of a software or hardware failure (i.e., a *fault*). Lightning models can run fault-proof. - -With Fault Tolerant Training, when ``Trainer.fit()`` fails in the middle of an epoch during training or validation, -Lightning will restart exactly where it failed, and everything will be restored (down to the batch it was on even if the dataset was shuffled). - -.. warning:: Fault-tolerant Training is currently an experimental feature within Lightning. - ----- - -*************************************************** -Use fault-tolerance to save money on cloud training -*************************************************** -Cloud providers offer pre-emptible machines which can be priced as low as 1/10th the cost but can be shut down automatically at any time. -Because fault-tolerant training can automatically recover from an interruption, you can train models for many weeks/months at a time for the pre-emptible prices. - -To easily run on the cloud with fault-tolerance with lightning-grid, use the following arguments: - -.. code-block:: bash - - grid run --use_spot --auto_resume lightning_script.py - -The ``--use_spot`` argument enables cheap preemptible pricing (but the machines can be interrupted).
-If the machine is interrupted, the ``--auto_resume`` argument automatically restarts the machine. - -As long as you are running a script that runs a lightning model, the model will restore itself and handle all the details of fault tolerance. - ----- - -.. include:: grid_costs.rst diff --git a/docs/_sources/clouds/fault_tolerant_training_expert.rst.txt b/docs/_sources/clouds/fault_tolerant_training_expert.rst.txt deleted file mode 100644 index f0051f7..0000000 --- a/docs/_sources/clouds/fault_tolerant_training_expert.rst.txt +++ /dev/null @@ -1,34 +0,0 @@ -:orphan: - -################################ -Fault-tolerant Training (expert) -################################ -**Audience**: Experts looking to enable and handle their own fault-tolerance. - -**Pre-requisites**: Users must have first read :doc:`Fault-tolerant Training (basic) ` - ----- - -*************************************** -Enable fault-tolerant behavior anywhere -*************************************** -To enable fault tolerance on your own cloud or cluster environment enable the *PL_FAULT_TOLERANT_TRAINING* environment variable: - -.. code-block:: bash - - PL_FAULT_TOLERANT_TRAINING=1 python script.py - -Although Lightning will now be fault-tolerant, you'll have to handle all the nuances of making sure the models are automatically restarted. - -.. note:: This complexity is already handled for you if you use **lightning-grid**. - ----- - -************************************************** -Enable fault-tolerant behavior on your own cluster -************************************************** -The simplest way to enable fault-tolerant behavior is to enable lightning-grid to work on your on-prem cluster or cloud environment which will handle all the nuances of fault-tolerant training at scale.
- -Email us to connect with your own cloud account: - -``_ diff --git a/docs/_sources/clouds/fault_tolerant_training_faq.rst.txt b/docs/_sources/clouds/fault_tolerant_training_faq.rst.txt deleted file mode 100644 index 4f2bdf4..0000000 --- a/docs/_sources/clouds/fault_tolerant_training_faq.rst.txt +++ /dev/null @@ -1,144 +0,0 @@ -:orphan: - -############################# -Fault-tolerant Training (FAQ) -############################# - -******************************* -How do I use iterable datasets? -******************************* -To support fault-tolerance, you will need to use and expose a sampler within your dataset. - -For example, the following implementation for an iterable dataset sub-classing :class:`~torch.utils.data.IterableDataset` won't be supported. - -.. code-block:: python - - from torch.utils.data import IterableDataset, DataLoader - - - # does not support fault tolerance training! - class RandomIterableDataset(IterableDataset): - def __init__(self, size: int, count: int): - self.count = count - self.size = size - - def __iter__(self): - for _ in range(self.count): - yield torch.randn(self.size) - - -There are two primary reasons why Lightning can't support the previous implementation. - -* Lightning cannot infer what you are iterating over, making it difficult to restart training. Lightning Fault Tolerant Training requires a :class:`~torch.utils.data.distributed.Sampler` to be used to encapsulate the fetching logic, requiring both the sampler and an iterator to be made available as attributes within the dataset, so Lightning can access them to track progress. -* Implementing the ``__next__`` method is required as it separates iterator creation from its consumption, which is essential for Lightning to wrap the iterator before its consumption. - -If your iterable dataset is implemented in the following way, everything should work as expected. - -..
code-block:: python - - import torch - from torch.utils.data import IterableDataset, DataLoader - - - class RandomIterableDataset(IterableDataset): - def __init__(self, size: int, length: int): - self.data = torch.randn(length, size) - - # expose the sampler as an attribute - self.sampler = RandomSampler(range(length)) - - def __iter__(self) -> "RandomIterableDataset": - # expose the generator from the sampler as an attribute - # the ``sampler_iter`` will be wrapped by Lightning to ensure - # we can capture random seeds and iteration count for fast-forward samplers - # while restarting. - self.sampler_iter = iter(self.sampler) - return self - - def __next__(self) -> torch.Tensor: - # call next on the iterator and get the associated data. - # the logic here can become more complex but the sampler - # should be the central piece for fetching the next sample - index = next(self.sampler_iter) - return self.data[index] - ----- - -********************************** -How do I use multiple dataloaders? -********************************** -If you are using multiple training dataloaders, Lightning won't be able to restore the random state properly. - -.. testcode:: - - class LitModel(LightningModule): - def train_dataloader(self): - loader_a = torch.utils.data.DataLoader(range(8), batch_size=4) - loader_b = torch.utils.data.DataLoader(range(16), batch_size=4) - return {"loader_a": loader_a, "loader_b": loader_b} - - def training_step(self, batch, batch_idx): - # access the data in the same format as the collection of dataloaders. - # dict, list are supported. - loader_a = batch["loader_a"] - loader_b = batch["loader_b"] - - -If you believe this to be useful, please open a `feature request `_. - - ----- - -********************************* -What are the performance impacts? -********************************* -Fault-tolerant Training was tested on common and worst-case scenarios in order to measure the impact of the internal state tracking on the total training time. 
-On tiny models like the `BoringModel and RandomDataset `_ -which has virtually no data loading and processing overhead, we noticed up to 50% longer training time with fault tolerance enabled. -In this worst-case scenario, fault-tolerant adds an overhead that is noticeable in comparison to the compute time for dataloading itself. -However, for more realistic training workloads where data loading and preprocessing is more expensive, the constant overhead that fault tolerance adds becomes less noticeable or not noticeable at all. -For example, when training with ResNet50 on CIFAR 10 we have observed a 0.5% to 1% increase in training time depending on ``batch size`` or ``number of workers``. - -More detailed benchmarks will be shared in the future. - -.. note:: - - The extra time is coming from several parts: - - - Capturing the iteration count + random states for each sample within each DataLoader workers and pass it through the data_queue - - Extra logic to handle / store the dataloader's states from each batch. - ----- - -************************************ -What happens to my shuffled dataset? -************************************ -If you are using a single map-based dataset by sub-classing :class:`~torch.utils.data.Dataset`, everything should work as expected. - -.. code-block:: python - - from torch.utils.data import Dataset, DataLoader - - - class RandomDataset(Dataset): - def __init__(self, size: int, length: int): - self.len = length - self.data = torch.randn(length, size) - - def __getitem__(self, index): - return self.data[index] - - def __len__(self): - return self.len - ----- - -****************************** -What parts are fault-tolerant? -****************************** -Lightning keeps track of the following state updates during training: - -* Samplers indices and random states across multiple processes and workers: This enables restoring random transforms and batch fetching to the exact state as it was right before the failure. 
-* Optimizers, learning rate schedulers, callbacks, etc.. -* Loop progression -* Logging internal states such that metric reductions on epoch end are not getting affected by the failure and model selection can continue as expected. diff --git a/docs/_sources/clouds/grid_costs.rst.txt b/docs/_sources/clouds/grid_costs.rst.txt deleted file mode 100644 index 04b1864..0000000 --- a/docs/_sources/clouds/grid_costs.rst.txt +++ /dev/null @@ -1,6 +0,0 @@ -**** -Cost -**** -Lightning (via `lightning-grid `_) provides access to cloud machines to the community for free. However, you must buy credits on `lightning-grid `_ which are used to pay the cloud providers on your behalf. - -If you want to run on your own AWS account and pay the cloud provider directly, please contact our onprem team: ``_ diff --git a/docs/_sources/clouds/run_advanced.rst.txt b/docs/_sources/clouds/run_advanced.rst.txt deleted file mode 100644 index 3418dee..0000000 --- a/docs/_sources/clouds/run_advanced.rst.txt +++ /dev/null @@ -1,130 +0,0 @@ -:orphan: - -.. _grid_cloud_advanced: - -############################# -Train on the cloud (advanced) -############################# -**Audience**: Anyone looking to train a model on the cloud in the background - ----- - -**************************** -What is background training? -**************************** -Background training lets you train models in the background without you needing to interact with the machine. As the model trains you can monitor its progress via Tensorboard or an experiment manager of your choice. - ----- - -************************* -0: Install lightning-grid -************************* -First Navigate to https://platform.grid.ai to create a free account. - -Next, install lightning-grid and login - -.. code:: bash - - pip install lightning-grid - grid login - ----- - -******************* -1: Create a dataset -******************* -Create a datastore which optimizes your datasets for training at scale on the cloud. 
- -First, let's download a dummy dataset we created. - -.. code:: bash - - # download - curl https://pl-flash-data.s3.amazonaws.com/cifar5.zip -o cifar5.zip - - # unzip - unzip cifar5.zip - -Now create the datastore - -.. code:: bash - - grid datastore create cifar5/ --name cifar5 - -Now your dataset is ready to be used for training on the cloud! - -.. note:: In some *research* workflows, your model script ALSO downloads the dataset. If the dataset is only a few GBs this is fine. Otherwise we recommend you create a Datastore. - ----- - -************************** -2: Choose the model to run -************************** -You can run any python script in the background. For this example, we'll use a simple classifier: - -Clone the code to your machine: - -.. code:: bash - - git clone https://github.com/williamFalcon/cifar5-simple.git - - -.. note:: Code repositories can be as complicated as needed. This is just a simple demo. - ----- - -******************* -3: Run on the cloud -******************* -To run this model on the cloud, use the **grid run** command which has two parts: - -.. code:: bash - - grid run [run args] file.py [file args] - -To attach the datastore **cifar5** to the **cifar5.py** file use the following command: - -.. code:: bash - - # command | the datastore to use | the model | argument to the model - grid run --datastore_name cifar5 cifar5.py --data_dir /datastores/cifar5 - ----- - -********************* -4: Monitor and manage -********************* -Now that your model is running in the background you can monitor and manage it `here `_. - -You can also monitor its progress on the commandline: - -.. code:: bash - - grid status - ----- - -********** -Next Steps -********** -Here are the recommended next steps depending on your workflow. - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Run many models at once - :description: Learn how to run many models at once using sweeps. - :col_css: col-md-12 - :button_link: session_intermediate.html - :height: 150 - :tag: basic - -.. raw:: html - -
-
`_. - -You can also monitor its progress on the commandline: - -.. code:: bash - - grid status - ----- - -.. include:: grid_costs.rst - ----- - -********** -Next Steps -********** -Here are the recommended next steps depending on your workflow. - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Run many models at once - :description: Learn how to find the best performing model by running multiple models at once using a sweep. - :col_css: col-md-4 - :button_link: run_intermediate.html - :height: 150 - :tag: basic - -.. raw:: html - -
-
` for more information. - ----- - -*********************************** -Run on your own cloud (hassle free) -*********************************** -Cluster training can get complicated once you start doing multi-node training, fault-tolerant training or sweeps. -If you'd prefer to not deal with any of the hassles of running on your own cloud environments, lightning-grid enables University and Enterprise customers to run on the cloud with their own credentials or even onprem. - -These are some of the benefits of running via lightning-grid: - -- create datasets optimized for scale -- fully configurable on-prem deployment -- SOC-2 compliance (in-progress) (ETA Q3 2022) -- micro cost optimizations everywhere (which add up) -- built-in fault tolerance -- enabled collaboration for teams and enterprises - -Contact our sales support engineering team so we can help you set up Grid with your own cloud credentials. - -Email us to connect with your own cloud account: - -``_. diff --git a/docs/_sources/clouds/run_intermediate.rst.txt b/docs/_sources/clouds/run_intermediate.rst.txt deleted file mode 100644 index dad2edf..0000000 --- a/docs/_sources/clouds/run_intermediate.rst.txt +++ /dev/null @@ -1,229 +0,0 @@ -:orphan: - -.. _grid_cloud_run_intermediate: - -################################# -Train on the cloud (intermediate) -################################# -**Audience**: User looking to run many models at once - ----- - -**************** -What is a sweep? -**************** -A sweep is the term giving to running the same model multiple times with different hyperparameters to find the one that performs the best (according to your definition of performance). - -Let's say I have a python script that trains a Lighting model to classify images. We run this file like so: - -.. code:: bash - - grid run file.py --batch_size 8 - -with such a model, I would be interested in knowing how it performs with different batch size. In this case, I'm going to train many versions of this model. 
- -.. code:: bash - - # run 4 models in parallel - grid run file.py --batch_size 8 - grid run file.py --batch_size 16 - grid run file.py --batch_size 32 - grid run file.py --batch_size 64 - -Now I can see how my model performs according to the layers and based on time and cost I can pick my "best" model: - -.. list-table:: Training speed vs cost - :widths: 10 40 15 15 - :header-rows: 1 - - * - Batch size - - classification accuracy (%) - - training time - - cost - * - 8 - - 0.80 - - 5 minutes - - $0.15 - * - 16 - - 0.85 - - 10 minutes - - $0.30 - * - 32 - - 0.90 - - 30 minutes - - $0.50 - * - 64 - - 0.95 - - 60 minutes - - $1.01 - ----- - -************* -Start a Sweep -************* -First, recall that in the `previous tutorial `_ we ran a single model using this command: - -.. code:: bash - - grid run --datastore_name cifar5 cifar5.py --data_dir /datastores/cifar5 - -Now we're going to run that same model 4 different times each with a different number of layers: - -.. code:: bash - - grid run --datastore_name cifar5 cifar5.py --data_dir /datastores/cifar5 --batch_size 8 - grid run --datastore_name cifar5 cifar5.py --data_dir /datastores/cifar5 --batch_size 16 - grid run --datastore_name cifar5 cifar5.py --data_dir /datastores/cifar5 --batch_size 32 - grid run --datastore_name cifar5 cifar5.py --data_dir /datastores/cifar5 --batch_size 64 - -Grid has a special syntax based on python that gives you shortcuts for sweeps. The shortcut for the above commands is: - -.. code:: bash - - grid run --datastore_name cifar5 cifar5.py --data_dir /datastores/cifar5 --batch_size "[8, 16, 32, 64]" - ----- - -**************** -Syntax Shortcuts -**************** - -List -==== - -.. code:: bash - - grid run file.py --batch_size "[8, 16, 32, 64]" - -equivalent to: - -.. code:: bash - - grid run file.py --batch_size 8 - grid run file.py --batch_size 16 - grid run file.py --batch_size 32 - grid run file.py --batch_size 64 - ----- - -Range -===== - -.. 
code:: bash - - grid run file.py --batch_size "range(1, 10, 2)" - -equivalent to: - -.. code:: bash - - grid run file.py --batch_size 1 - grid run file.py --batch_size 3 - grid run file.py --batch_size 5 - grid run file.py --batch_size 7 - grid run file.py --batch_size 9 - ----- - -String list -=========== - -.. code:: bash - - grid run file.py --model_backbone "['resnet18', 'transformer', 'resnet50']" - -equivalent to: - -.. code:: bash - - grid run file.py --model_backbone 'resnet18' - grid run file.py --model_backbone 'transformer' - grid run file.py --model_backbone 'resnet50' - ----- - -Sampling -======== - -.. code:: bash - - grid run file.py --learning_rate "uniform(1e-5, 1e-1, 3)" - -equivalent to: - -.. code:: bash - - grid run file.py --learning_rate 0.03977392 - grid run file.py --learning_rate 0.04835479 - grid run file.py --learning_rate 0.05200016 - ----- - -**************** -Sweep strategies -**************** -Models often have dozens of hyperparameters. We usually don't run all combinations because it would be too prohibitive. Grid supports two strategies: - ----- - -Grid search -=========== -Grid search is a common approach that tries all combinations of hyperparameters. Grid will automatically compute combinations when it detects special syntax: - -.. code:: bash - - grid run file.py --batch_size "[1, 2]" --layers "[3, 5]" - -is equivalent to: - -.. code:: bash - - grid run file.py --batch_size 1 --layers 3 - grid run file.py --batch_size 2 --layers 3 - grid run file.py --batch_size 1 --layers 5 - grid run file.py --batch_size 2 --layers 5 - ----- - -Random search -============= -With random search, we choose only a subset of hyperparameters. The larger the number of trials (*num_trials*) the more probable we'll find a great performing model without needing to try all possible combinations. - -..
code:: bash - - grid run --strategy random_search --num_trials 2 file.py --batch_size "[1, 2]" --layers "[3, 5]" - -the above command generates the 4 combinations and runs only 2 at random - -.. code:: bash - - grid run file.py --batch_size 2 --layers 3 - grid run file.py --batch_size 1 --layers 5 - ----- - -********** -Next Steps -********** -Here are the recommended next steps depending on your workflow. - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Run with your own cloud credentials - :description: Learn how to use Grid products with your Company or University cloud account. - :col_css: col-md-4 - :button_link: run_expert.html - :height: 180 - :tag: expert - -.. raw:: html - -
-
`_ to create a free account, then start a new Grid Session. - -A Grid Session is an interactive machine with 1-16 GPUs per machine. - -.. image:: https://docs.grid.ai/assets/images/new-session-3c58be3fd64ffabcdeb7b52516e0782e.gif - :alt: Start a Grid Session in a few seconds - ----- - -************************* -Open the Jupyter Notebook -************************* -Once the Session starts, open a Jupyter notebook. - -.. raw:: html - - - ----- - -************************ -Clone and run your model -************************ -On the Jupyter page you can use a Notebook, or to clone your code and run via the CLI. - -.. raw:: html - - - ----- - -.. include:: grid_costs.rst - ----- - -********** -Next Steps -********** -Here are the recommended next steps depending on your workflow. - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Run a model in the background - :description: Learn to run a model in the background - :col_css: col-md-6 - :button_link: run_basic.html - :height: 180 - :tag: basic - -.. displayitem:: - :header: Run with your own cloud credentials - :description: Learn how to use Grid products on your Company or University private cloud account. - :col_css: col-md-6 - :button_link: run_expert.html - :height: 180 - :tag: expert - -.. raw:: html - -
-
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Basic - :description: Learn to save and load checkpoints - :col_css: col-md-3 - :button_link: checkpointing_basic.html - :height: 150 - :tag: basic - -.. displayitem:: - :header: Intermediate - :description: Customize checkpointing behavior - :col_css: col-md-3 - :button_link: checkpointing_intermediate.html - :height: 150 - :tag: intermediate - -.. displayitem:: - :header: Advanced - :description: Enable cloud-based checkpointing and composable checkpoints. - :col_css: col-md-3 - :button_link: checkpointing_advanced.html - :height: 150 - :tag: advanced - -.. displayitem:: - :header: Expert - :description: Customize checkpointing for custom distributed strategies and accelerators. - :col_css: col-md-3 - :button_link: checkpointing_expert.html - :height: 150 - :tag: expert - -.. raw:: html - -
- - ----- - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: ModelCheckpoint API - :description: Dig into the ModelCheckpoint API - :col_css: col-md-4 - :button_link: ../api/pytorch_lightning.callbacks.ModelCheckpoint.html - :height: 150 - -.. raw:: html - -
-
diff --git a/docs/_sources/common/checkpointing_advanced.rst.txt b/docs/_sources/common/checkpointing_advanced.rst.txt deleted file mode 100644 index 561ca95..0000000 --- a/docs/_sources/common/checkpointing_advanced.rst.txt +++ /dev/null @@ -1,75 +0,0 @@ -.. _checkpointing_advanced: - -######################## -Checkpointing (advanced) -######################## - - -***************** -Cloud checkpoints -***************** -Lightning is integrated with the major remote file systems including local filesystems and several cloud storage providers such as -`S3 `_ on `AWS `_, `GCS `_ on `Google Cloud `_, -or `ADL `_ on `Azure `_. - -PyTorch Lightning uses `fsspec `_ internally to handle all filesystem operations. - ----- - -Save a cloud checkpoint -======================= - -To save to a remote filesystem, prepend a protocol like "s3:/" to the root_dir used for writing and reading model data. - -.. code-block:: python - - # `default_root_dir` is the default path used for logs and checkpoints - trainer = Trainer(default_root_dir="s3://my_bucket/data/") - trainer.fit(model) - ----- - -Resume training from a cloud checkpoint -======================================= -To resume training from a cloud checkpoint use a cloud url. - -.. code-block:: python - - trainer = Trainer(default_root_dir=tmpdir, max_steps=3) - trainer.fit(model, ckpt_path="s3://my_bucket/ckpts/classifier.ckpt") - -PyTorch Lightning uses `fsspec `_ internally to handle all filesystem operations. - ----- - -*************************** -Modularize your checkpoints -*************************** -Checkpoints can also save the state of :doc:`datamodules <../extensions/datamodules_state>` and :doc:`callbacks <../extensions/callbacks_state>`. 
- ----- - -**************************** -Modify a checkpoint anywhere -**************************** -When you need to change the components of a checkpoint before saving or loading, use the :meth:`~pytorch_lightning.core.hooks.CheckpointHooks.on_save_checkpoint` and :meth:`~pytorch_lightning.core.hooks.CheckpointHooks.on_load_checkpoint` of your ``LightningModule``. - -.. code:: python - - class LitModel(pl.LightningModule): - def on_save_checkpoint(self, checkpoint): - checkpoint["something_cool_i_want_to_save"] = my_cool_pickable_object - - def on_load_checkpoint(self, checkpoint): - my_cool_pickable_object = checkpoint["something_cool_i_want_to_save"] - -Use the above approach when you need to couple this behavior to your LightningModule for reproducibility reasons. Otherwise, Callbacks also have the :meth:`~pytorch_lightning.callbacks.base.Callback.on_save_checkpoint` and :meth:`~pytorch_lightning.callbacks.base.Callback.on_load_checkpoint` which you should use instead: - -.. code:: python - - class LitCallback(pl.Callback): - def on_save_checkpoint(self, checkpoint): - checkpoint["something_cool_i_want_to_save"] = my_cool_pickable_object - - def on_load_checkpoint(self, checkpoint): - my_cool_pickable_object = checkpoint["something_cool_i_want_to_save"] diff --git a/docs/_sources/common/checkpointing_basic.rst.txt b/docs/_sources/common/checkpointing_basic.rst.txt deleted file mode 100644 index 899de91..0000000 --- a/docs/_sources/common/checkpointing_basic.rst.txt +++ /dev/null @@ -1,189 +0,0 @@ -:orphan: - -.. _checkpointing_basic: - -##################### -Checkpointing (basic) -##################### -**Audience:** All users - ----- - -********************* -What is a checkpoint? -********************* -When a model is training, the performance changes as it continues to see more data. It is a best practice to save the state of a model throughout the training process. 
This gives you a version of the model, *a checkpoint*, at each key point during the development of the model. Once training has completed, use the checkpoint that corresponds to the best performance you found during the training process. - -Checkpoints also enable your training to resume from where it was in case the training process is interrupted. - -PyTorch Lightning checkpoints are fully usable in plain PyTorch. - ----- - -************************ -Contents of a checkpoint -************************ -A Lightning checkpoint contains a dump of the model's entire internal state. Unlike plain PyTorch, Lightning saves *everything* you need to restore a model even in the most complex distributed training environments. - -Inside a Lightning checkpoint you'll find: - -- 16-bit scaling factor (if using 16-bit precision training) -- Current epoch -- Global step -- LightningModule's state_dict -- State of all optimizers -- State of all learning rate schedulers -- State of all callbacks (for stateful callbacks) -- State of datamodule (for stateful datamodules) -- The hyperparameters used for that model if passed in as hparams (Argparse.Namespace) -- State of Loops (if using Fault-Tolerant training) - ----- - -***************** -Save a checkpoint -***************** -Lightning automatically saves a checkpoint for you in your current working directory, with the state of your last training epoch. This makes sure you can resume training in case it was interrupted. - -.. code-block:: python - - # simply by using the Trainer you get automatic checkpointing - trainer = Trainer() - -To change the checkpoint path use the `default_root_dir` argument: - -.. 
code-block:: python - - # saves checkpoints to 'some/path/' at every epoch end - trainer = Trainer(default_root_dir="some/path/") - ----- - -******************************* -LightningModule from checkpoint -******************************* - -To load a LightningModule along with its weights and hyperparameters use the following method: - -.. code-block:: python - - model = MyLightningModule.load_from_checkpoint("/path/to/checkpoint.ckpt") - - # disable randomness, dropout, etc... - model.eval() - - # predict with the model - y_hat = model(x) - ----- - -Save hyperparameters -==================== -The LightningModule allows you to automatically save all the hyperparameters passed to *init* simply by calling *self.save_hyperparameters()*. - -.. code-block:: python - - class MyLightningModule(LightningModule): - def __init__(self, learning_rate, another_parameter, *args, **kwargs): - super().__init__() - self.save_hyperparameters() - -The hyperparameters are saved to the "hyper_parameters" key in the checkpoint - -.. code-block:: python - - checkpoint = torch.load(checkpoint, map_location=lambda storage, loc: storage) - print(checkpoint["hyper_parameters"]) - # {"learning_rate": the_value, "another_parameter": the_other_value} - -The LightningModule also has access to the Hyperparameters - -.. code-block:: python - - model = MyLightningModule.load_from_checkpoint("/path/to/checkpoint.ckpt") - print(model.learning_rate) - ----- - -Initalize with other parameters -=============================== -If you used the *self.save_hyperparameters()* method in the init of the LightningModule, you can initialize the model with different hyperparameters. - -.. code-block:: python - - # if you train and save the model like this it will use these values when loading - # the weights. 
But you can overwrite this - LitModel(in_dim=32, out_dim=10) - - # uses in_dim=32, out_dim=10 - model = LitModel.load_from_checkpoint(PATH) - - # uses in_dim=128, out_dim=10 - model = LitModel.load_from_checkpoint(PATH, in_dim=128, out_dim=10) - ----- - -************************* -nn.Module from checkpoint -************************* -Lightning checkpoints are fully compatible with plain torch nn.Modules. - -.. code-block:: python - - checkpoint = torch.load(CKPT_PATH) - print(checkpoint.keys()) - -For example, let's pretend we created a LightningModule like so: - -.. code-block:: python - - class Encoder(nn.Module): - ... - - - class Decoder(nn.Module): - ... - - - class Autoencoder(pl.LightningModule): - def __init__(self, encoder, decoder, *args, **kwargs): - ... - - - autoencoder = Autoencoder(Encoder(), Decoder()) - -Once the autoencoder has trained, pull out the relevant weights for your torch nn.Module: - -.. code-block:: python - - checkpoint = torch.load(CKPT_PATH) - encoder_weights = checkpoint["encoder"] - decoder_weights = checkpoint["decoder"] - ----- - -********************* -Disable checkpointing -********************* - -You can disable checkpointing by passing: - -.. testcode:: - - trainer = Trainer(enable_checkpointing=False) - ----- - -********************* -Resume training state -********************* - -If you don't just want to load weights, but instead restore the full training, do the following: - -.. code-block:: python - - model = LitModel() - trainer = Trainer() - - # automatically restores model, epoch, step, LR schedulers, apex, etc... - trainer.fit(model, ckpt_path="some/path/to/my_checkpoint.ckpt") diff --git a/docs/_sources/common/checkpointing_expert.rst.txt b/docs/_sources/common/checkpointing_expert.rst.txt deleted file mode 100644 index c1859d6..0000000 --- a/docs/_sources/common/checkpointing_expert.rst.txt +++ /dev/null @@ -1,89 +0,0 @@ -:orphan: - -.. 
_checkpointing_expert: - -###################### -Checkpointing (expert) -###################### - -TODO: I don't understand this... - -*********************** -Customize Checkpointing -*********************** - -.. warning:: - - The Checkpoint IO API is experimental and subject to change. - - -Lightning supports modifying the checkpointing save/load functionality through the ``CheckpointIO``. This encapsulates the save/load logic -that is managed by the ``Strategy``. ``CheckpointIO`` is different from :meth:`~pytorch_lightning.core.hooks.CheckpointHooks.on_save_checkpoint` -and :meth:`~pytorch_lightning.core.hooks.CheckpointHooks.on_load_checkpoint` methods as it determines how the checkpoint is saved/loaded to storage rather than -what's saved in the checkpoint. - - -****************************** -Built-in Checkpoint IO Plugins -****************************** - -.. list-table:: Built-in Checkpoint IO Plugins - :widths: 25 75 - :header-rows: 1 - - * - Plugin - - Description - * - :class:`~pytorch_lightning.plugins.io.TorchCheckpointIO` - - CheckpointIO that utilizes :func:`torch.save` and :func:`torch.load` to save and load checkpoints - respectively, common for most use cases. - * - :class:`~pytorch_lightning.plugins.io.XLACheckpointIO` - - CheckpointIO that utilizes :func:`xm.save` to save checkpoints for TPU training strategies. - - -*************************** -Custom Checkpoint IO Plugin -*************************** - -``CheckpointIO`` can be extended to include your custom save/load functionality to and from a path. The ``CheckpointIO`` object can be passed to either a ``Trainer`` directly or a ``Strategy`` as shown below: - -.. 
code-block:: python - - from pytorch_lightning import Trainer - from pytorch_lightning.callbacks import ModelCheckpoint - from pytorch_lightning.plugins import CheckpointIO - from pytorch_lightning.strategies import SingleDeviceStrategy - - - class CustomCheckpointIO(CheckpointIO): - def save_checkpoint(self, checkpoint, path, storage_options=None): - ... - - def load_checkpoint(self, path, storage_options=None): - ... - - def remove_checkpoint(self, path): - ... - - - custom_checkpoint_io = CustomCheckpointIO() - - # Either pass into the Trainer object - model = MyModel() - trainer = Trainer( - plugins=[custom_checkpoint_io], - callbacks=ModelCheckpoint(save_last=True), - ) - trainer.fit(model) - - # or pass into Strategy - model = MyModel() - device = torch.device("cpu") - trainer = Trainer( - strategy=SingleDeviceStrategy(device, checkpoint_io=custom_checkpoint_io), - callbacks=ModelCheckpoint(save_last=True), - ) - trainer.fit(model) - -.. note:: - - Some ``TrainingTypePlugins`` like ``DeepSpeedStrategy`` do not support custom ``CheckpointIO`` as checkpointing logic is not modifiable. diff --git a/docs/_sources/common/checkpointing_intermediate.rst.txt b/docs/_sources/common/checkpointing_intermediate.rst.txt deleted file mode 100644 index 7796575..0000000 --- a/docs/_sources/common/checkpointing_intermediate.rst.txt +++ /dev/null @@ -1,175 +0,0 @@ -:orphan: - -.. _checkpointing_intermediate: - -############################ -Checkpointing (intermediate) -############################ -**Audience:** Users looking to customize the checkpointing behavior - ----- - -***************************** -Modify checkpointing behavior -***************************** -For fine-grain control over checkpointing behavior, use the :class:`~pytorch_lightning.callbacks.ModelCheckpoint` object - -.. 
code-block:: python - - from pytorch_lightning.callbacks import ModelCheckpoint - - checkpoint_callback = ModelCheckpoint(dirpath="my/path/", save_top_k=2, monitor="val_loss") - trainer = Trainer(callbacks=[checkpoint_callback]) - trainer.fit(model) - checkpoint_callback.best_model_path - -Any value that has been logged via *self.log* in the LightningModule can be monitored. - -.. code-block:: python - - class LitModel(pl.LightningModule): - def training_step(self, batch, batch_idx): - self.log("my_metric", x) - - - # 'my_metric' is now able to be monitored - checkpoint_callback = ModelCheckpoint(monitor="my_metric") - ----- - -***************************** -Save checkpoints by condition -***************************** -To save checkpoints based on a (*when/which/what/where*) condition (for example *when* the validation_loss is lower) modify the :class:`~pytorch_lightning.callbacks.ModelCheckpoint` properties. - -When -==== - -- When using iterative training which doesn't have an epoch, you can checkpoint at every ``N`` training steps by specifying ``every_n_training_steps=N``. -- You can also control the interval of epochs between checkpoints using ``every_n_epochs`` between checkpoints, to avoid slowdowns. -- You can checkpoint at a regular time interval using ``train_time_interval`` argument independent of the steps or epochs. -- In case you are monitoring a training metrics, we'd suggest using ``save_on_train_epoch_end=True`` to ensure the required metric is being accumulated correctly for creating a checkpoint. - - -Which -===== - -- You can save the last checkpoint when training ends using ``save_last`` argument. -- You can save top-K and last-K checkpoints by configuring the ``monitor`` and ``save_top_k`` argument. - -| - - .. 
testcode:: - - from pytorch_lightning.callbacks import ModelCheckpoint - - - # saves top-K checkpoints based on "val_loss" metric - checkpoint_callback = ModelCheckpoint( - save_top_k=10, - monitor="val_loss", - mode="min", - dirpath="my/path/", - filename="sample-mnist-{epoch:02d}-{val_loss:.2f}", - ) - - # saves last-K checkpoints based on "global_step" metric - # make sure you log it inside your LightningModule - checkpoint_callback = ModelCheckpoint( - save_top_k=10, - monitor="global_step", - mode="max", - dirpath="my/path/", - filename="sample-mnist-{epoch:02d}-{global_step}", - ) - -- You can customize the checkpointing behavior to monitor any quantity of your training or validation steps. For example, if you want to update your checkpoints based on your validation loss: - -| - - .. testcode:: - - from pytorch_lightning.callbacks import ModelCheckpoint - - - class LitAutoEncoder(LightningModule): - def validation_step(self, batch, batch_idx): - x, y = batch - y_hat = self.backbone(x) - - # 1. calculate loss - loss = F.cross_entropy(y_hat, y) - - # 2. log val_loss - self.log("val_loss", loss) - - - # 3. Init ModelCheckpoint callback, monitoring "val_loss" - checkpoint_callback = ModelCheckpoint(monitor="val_loss") - - # 4. Add your callback to the callbacks list - trainer = Trainer(callbacks=[checkpoint_callback]) - - -What -==== - -- By default, the ``ModelCheckpoint`` callback saves model weights, optimizer states, etc., but in case you have limited disk space or just need the model weights to be saved you can specify ``save_weights_only=True``. - - -Where -===== - -- It gives you the ability to specify the ``dirpath`` and ``filename`` for your checkpoints. Filename can also be dynamic so you can inject the metrics that are being logged using :meth:`~pytorch_lightning.core.lightning.LightningModule.log`. - -| - - .. 
testcode:: - - from pytorch_lightning.callbacks import ModelCheckpoint - - - # saves a file like: my/path/sample-mnist-epoch=02-val_loss=0.32.ckpt - checkpoint_callback = ModelCheckpoint( - dirpath="my/path/", - filename="sample-mnist-{epoch:02d}-{val_loss:.2f}", - ) - -| - -The :class:`~pytorch_lightning.callbacks.ModelCheckpoint` callback is very robust and should cover 99% of the use-cases. If you find a use-case that is not configured yet, feel free to open an issue with a feature request on GitHub -and the Lightning Team will be happy to integrate/help integrate it. - ----- - -************************* -Save checkpoints manually -************************* - -You can manually save checkpoints and restore your model from the checkpointed state using :meth:`~pytorch_lightning.trainer.trainer.Trainer.save_checkpoint` -and :meth:`~pytorch_lightning.core.saving.ModelIO.load_from_checkpoint`. - -.. code-block:: python - - model = MyLightningModule(hparams) - trainer.fit(model) - trainer.save_checkpoint("example.ckpt") - - # load the checkpoint later as normal - new_model = MyLightningModule.load_from_checkpoint(checkpoint_path="example.ckpt") - -Manual saving with distributed training -======================================= -In distributed training cases where a model is running across many machines, Lightning ensures that only one checkpoint is saved instead of a model per machine. This requires no code changes as seen below: - -.. code-block:: python - - trainer = Trainer(strategy="ddp") - model = MyLightningModule(hparams) - trainer.fit(model) - # Saves only on the main process - trainer.save_checkpoint("example.ckpt") - -Not using :meth:`~pytorch_lightning.trainer.trainer.Trainer.save_checkpoint` can lead to unexpected behavior and potential deadlock. Using other saving functions will result in all devices attempting to save the checkpoint. As a result, we highly recommend using the Trainer's save functionality. 
-If using custom saving functions cannot be avoided, we recommend using the :func:`~pytorch_lightning.utilities.rank_zero.rank_zero_only` decorator to ensure saving occurs only on the main process. Note that this will only work if all ranks hold the exact same state and won't work when using -model parallel distributed strategies such as deepspeed or sharded training. diff --git a/docs/_sources/common/child_modules.rst.txt b/docs/_sources/common/child_modules.rst.txt deleted file mode 100644 index d3c1832..0000000 --- a/docs/_sources/common/child_modules.rst.txt +++ /dev/null @@ -1,70 +0,0 @@ -Research projects tend to test different approaches to the same dataset. -This is very easy to do in Lightning with inheritance. - -For example, imagine we now want to train an ``AutoEncoder`` to use as a feature extractor for images. -The only things that change in the ``LitAutoEncoder`` model are the init, forward, training, validation and test step. - -.. code-block:: python - - class Encoder(torch.nn.Module): - ... - - - class Decoder(torch.nn.Module): - ... 
- - - class AutoEncoder(torch.nn.Module): - def __init__(self): - super().__init__() - self.encoder = Encoder() - self.decoder = Decoder() - - def forward(self, x): - return self.decoder(self.encoder(x)) - - - class LitAutoEncoder(LightningModule): - def __init__(self, auto_encoder): - super().__init__() - self.auto_encoder = auto_encoder - self.metric = torch.nn.MSELoss() - - def forward(self, x): - return self.auto_encoder.encoder(x) - - def training_step(self, batch, batch_idx): - x, _ = batch - x_hat = self.auto_encoder(x) - loss = self.metric(x, x_hat) - return loss - - def validation_step(self, batch, batch_idx): - self._shared_eval(batch, batch_idx, "val") - - def test_step(self, batch, batch_idx): - self._shared_eval(batch, batch_idx, "test") - - def _shared_eval(self, batch, batch_idx, prefix): - x, _ = batch - x_hat = self.auto_encoder(x) - loss = self.metric(x, x_hat) - self.log(f"{prefix}_loss", loss) - - -and we can train this using the ``Trainer``: - -.. code-block:: python - - auto_encoder = AutoEncoder() - lightning_module = LitAutoEncoder(auto_encoder) - trainer = Trainer() - trainer.fit(lightning_module, train_dataloader, val_dataloader) - -And remember that the forward method should define the practical use of a :class:`~pytorch_lightning.core.lightning.LightningModule`. -In this case, we want to use the ``LitAutoEncoder`` to extract image representations: - -.. code-block:: python - - some_images = torch.Tensor(32, 1, 28, 28) - representations = lightning_module(some_images) diff --git a/docs/_sources/common/console_logs.rst.txt b/docs/_sources/common/console_logs.rst.txt deleted file mode 100644 index 6761432..0000000 --- a/docs/_sources/common/console_logs.rst.txt +++ /dev/null @@ -1,26 +0,0 @@ -############### -Console logging -############### -**Audience:** Engineers looking to capture more visible logs. 
- ----- - -******************* -Enable console logs -******************* -Lightning logs useful information about the training process and user warnings to the console. -You can retrieve the Lightning console logger and change it to your liking. For example, adjust the logging level -or redirect output for certain modules to log files: - -.. testcode:: - - import logging - - # configure logging at the root level of Lightning - logging.getLogger("pytorch_lightning").setLevel(logging.ERROR) - - # configure logging on module level, redirect to file - logger = logging.getLogger("pytorch_lightning.core") - logger.addHandler(logging.FileHandler("core.log")) - -Read more about custom Python logging `here <https://docs.python.org/3/library/logging.html>`_. diff --git a/docs/_sources/common/early_stopping.rst.txt b/docs/_sources/common/early_stopping.rst.txt deleted file mode 100644 index 593106f..0000000 --- a/docs/_sources/common/early_stopping.rst.txt +++ /dev/null @@ -1,99 +0,0 @@ -.. testsetup:: * - - from pytorch_lightning.callbacks.early_stopping import EarlyStopping - -.. _early_stopping: - - -############## -Early Stopping -############## - -.. raw:: html - - - - -*********************** -Stopping an Epoch Early -*********************** - -You can stop and skip the rest of the current epoch early by overriding :meth:`~pytorch_lightning.core.hooks.ModelHooks.on_train_batch_start` to return ``-1`` when some condition is met. - -If you do this repeatedly, for every epoch you had originally requested, then this will stop your entire training. - - -********************** -EarlyStopping Callback -********************** - -The :class:`~pytorch_lightning.callbacks.early_stopping.EarlyStopping` callback can be used to monitor a metric and stop the training when no improvement is observed. - -To enable it: - -- Import :class:`~pytorch_lightning.callbacks.early_stopping.EarlyStopping` callback. -- Log the metric you want to monitor using :meth:`~pytorch_lightning.core.lightning.LightningModule.log` method. 
-- Init the callback, and set ``monitor`` to the logged metric of your choice. -- Set the ``mode`` based on the metric that needs to be monitored. -- Pass the :class:`~pytorch_lightning.callbacks.early_stopping.EarlyStopping` callback to the :class:`~pytorch_lightning.trainer.trainer.Trainer` callbacks flag. - -.. code-block:: python - - from pytorch_lightning.callbacks.early_stopping import EarlyStopping - - - class LitModel(LightningModule): - def validation_step(self, batch, batch_idx): - loss = ... - self.log("val_loss", loss) - - - model = LitModel() - trainer = Trainer(callbacks=[EarlyStopping(monitor="val_loss", mode="min")]) - trainer.fit(model) - -You can customize the callback's behaviour by changing its parameters. - -.. testcode:: - - early_stop_callback = EarlyStopping(monitor="val_accuracy", min_delta=0.00, patience=3, verbose=False, mode="max") - trainer = Trainer(callbacks=[early_stop_callback]) - - -Additional parameters that stop training at extreme points: - -- ``stopping_threshold``: Stops training immediately once the monitored quantity reaches this threshold. - It is useful when we know that going beyond a certain optimal value does not further benefit us. -- ``divergence_threshold``: Stops training as soon as the monitored quantity becomes worse than this threshold. - When reaching a value this bad, we believe the model cannot recover anymore and it is better to stop early and run with different initial conditions. -- ``check_finite``: When turned on, it stops training if the monitored metric becomes NaN or infinite. -- ``check_on_train_epoch_end``: When turned on, it checks the metric at the end of a training epoch. Use this only when you are monitoring any metric logged within - training-specific hooks on epoch-level. - - -In case you need early stopping in a different part of training, subclass :class:`~pytorch_lightning.callbacks.early_stopping.EarlyStopping` -and change where it is called: - -.. 
testcode:: - - class MyEarlyStopping(EarlyStopping): - def on_validation_end(self, trainer, pl_module): - # override this to disable early stopping at the end of val loop - pass - - def on_train_end(self, trainer, pl_module): - # instead, do it at the end of training loop - self._run_early_stopping_check(trainer) - -.. note:: - The :class:`~pytorch_lightning.callbacks.early_stopping.EarlyStopping` callback runs - at the end of every validation epoch by default. However, the frequency of validation - can be modified by setting various parameters in the :class:`~pytorch_lightning.trainer.trainer.Trainer`, - for example :paramref:`~pytorch_lightning.trainer.trainer.Trainer.check_val_every_n_epoch` - and :paramref:`~pytorch_lightning.trainer.trainer.Trainer.val_check_interval`. - It must be noted that the ``patience`` parameter counts the number of - validation checks with no improvement, and not the number of training epochs. - Therefore, with parameters ``check_val_every_n_epoch=10`` and ``patience=3``, the trainer - will perform at least 40 training epochs before being stopped. diff --git a/docs/_sources/common/evaluation.rst.txt b/docs/_sources/common/evaluation.rst.txt deleted file mode 100644 index e126a70..0000000 --- a/docs/_sources/common/evaluation.rst.txt +++ /dev/null @@ -1,33 +0,0 @@ -.. _val-test-dataset: - -******************************** -Add validation and test datasets -******************************** - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Basic - :description: Add a validation and test loop to avoid overfitting. - :col_css: col-md-6 - :button_link: evaluation_basic.html - :height: 150 - :tag: basic - -.. displayitem:: - :header: Intermediate - :description: Learn about more complex validation and test workflows - :col_css: col-md-6 - :button_link: evaluation_intermediate.html - :height: 150 - :tag: intermediate - -.. raw:: html - -
-
diff --git a/docs/_sources/common/evaluation_basic.rst.txt b/docs/_sources/common/evaluation_basic.rst.txt deleted file mode 100644 index 5f933ee..0000000 --- a/docs/_sources/common/evaluation_basic.rst.txt +++ /dev/null @@ -1,128 +0,0 @@ -:orphan: - -################################# -Validate and test a model (basic) -################################# -**Audience**: Users who want to add a validation loop to avoid overfitting - ----- - -*************** -Add a test loop -*************** -To make sure a model can generalize to an unseen dataset (ie: to publish a paper or in a production environment) a dataset is normally split into two parts, the *train* split and the *test* split. - -The test set is **NOT** used during training, it is **ONLY** used once the model has been trained to see how the model will do in the real-world. - ----- - -Find the train and test splits -============================== -Datasets come with two splits. Refer to the dataset documentation to find the *train* and *test* splits. - -.. code-block:: python - - import torch.utils.data as data - from torchvision import datasets - - # Load data sets - train_set = datasets.MNIST(root="MNIST", download=True, train=True) - test_set = datasets.MNIST(root="MNIST", download=True, train=False) - ----- - -Define the test loop -==================== -To add a test loop, implement the **test_step** method of the LightningModule - -.. code:: python - - class LitAutoEncoder(pl.LightningModule): - def training_step(self, batch, batch_idx): - ... - - def test_step(self, batch, batch_idx): - # this is the test loop - x, y = batch - x = x.view(x.size(0), -1) - z = self.encoder(x) - x_hat = self.decoder(z) - test_loss = F.mse_loss(x_hat, x) - self.log("test_loss", test_loss) - ----- - -Train with the test loop -======================== -Once the model has finished training, call **.test** - -.. 
code-block:: python - - from torch.utils.data import DataLoader - - # initialize the Trainer - trainer = Trainer() - - # test the model - trainer.test(model, dataloaders=DataLoader(test_set)) - ----- - -********************* -Add a validation loop -********************* -During training, it's common practice to use a small portion of the train split to determine when the model has finished training. - ----- - -Split the training data -======================= -As a rule of thumb, we use 20% of the training set as the **validation set**. This number varies from dataset to dataset. - -.. code-block:: python - - # use 20% of training data for validation - train_set_size = int(len(train_set) * 0.8) - valid_set_size = len(train_set) - train_set_size - - # split the train set into two - seed = torch.Generator().manual_seed(42) - train_set, valid_set = data.random_split(train_set, [train_set_size, valid_set_size], generator=seed) - ----- - -Define the validation loop -========================== -To add a validation loop, implement the **validation_step** method of the LightningModule - -.. code:: python - - class LitAutoEncoder(pl.LightningModule): - def training_step(self, batch, batch_idx): - ... - - def validation_step(self, batch, batch_idx): - # this is the validation loop - x, y = batch - x = x.view(x.size(0), -1) - z = self.encoder(x) - x_hat = self.decoder(z) - test_loss = F.mse_loss(x_hat, x) - self.log("val_loss", test_loss) - ----- - -Train with the validation loop -============================== -To run the validation loop, pass in the validation set to **.fit** - -.. 
code-block:: python - - from torch.utils.data import DataLoader - - train_set = DataLoader(train_set) - val_set = DataLoader(valid_set) - - # train with both splits - trainer = Trainer() - trainer.fit(model, train_set, val_set) diff --git a/docs/_sources/common/evaluation_intermediate.rst.txt b/docs/_sources/common/evaluation_intermediate.rst.txt deleted file mode 100644 index 7c0ca00..0000000 --- a/docs/_sources/common/evaluation_intermediate.rst.txt +++ /dev/null @@ -1,157 +0,0 @@ -.. _test_set: - -:orphan: - -######################################## -Validate and test a model (intermediate) -######################################## - -During and after training we need a way to evaluate our models to make sure they are not overfitting while training and -generalize well on unseen or real-world data. There are generally 2 stages of evaluation: validation and testing. To some -degree they serve the same purpose, to make sure models work on real data, but they have some practical differences. - -Validation is usually done during training, traditionally after each training epoch. It can be used for hyperparameter optimization or tracking model performance during training. -It's a part of the training process. - -Testing is usually done once we are satisfied with the training and only with the best model selected from the validation metrics. - -Let's see how these can be performed with Lightning. - -******* -Testing -******* - -Lightning allows the user to test their models with any compatible test dataloaders. This can be done before/after training -and is completely agnostic to :meth:`~pytorch_lightning.trainer.trainer.Trainer.fit` call. The logic used here is defined under -:meth:`~pytorch_lightning.core.lightning.LightningModule.test_step`. - -Testing is performed using the ``Trainer`` object's ``.test()`` method. - -.. 
automethod:: pytorch_lightning.trainer.Trainer.test - :noindex: - - -Test after Fit -============== - -To run the test set after training completes, use this method. - -.. code-block:: python - - # run full training - trainer.fit(model) - - # (1) load the best checkpoint automatically (lightning tracks this for you) - trainer.test(ckpt_path="best") - - # (2) test using a specific checkpoint - trainer.test(ckpt_path="/path/to/my_checkpoint.ckpt") - - # (3) test with an explicit model (will use this model and not load a checkpoint) - trainer.test(model) - -.. warning:: - - It is recommended to test with ``Trainer(devices=1)`` since distributed strategies such as DDP - use :class:`~torch.utils.data.distributed.DistributedSampler` internally, which replicates some samples to - make sure all devices have same batch size in case of uneven inputs. This is helpful to make sure - benchmarking for research papers is done the right way. - - -Test Multiple Models -==================== - -You can run the test set on multiple models using the same trainer instance. - -.. code-block:: python - - model1 = LitModel() - model2 = GANModel() - - trainer = Trainer() - trainer.test(model1) - trainer.test(model2) - - -Test Pre-Trained Model -====================== - -To run the test set on a pre-trained model, use this method. - -.. code-block:: python - - model = MyLightningModule.load_from_checkpoint( - checkpoint_path="/path/to/pytorch_checkpoint.ckpt", - hparams_file="/path/to/test_tube/experiment/version/hparams.yaml", - map_location=None, - ) - - # init trainer with whatever options - trainer = Trainer(...) - - # test (pass in the model) - trainer.test(model) - -In this case, the options you pass to trainer will be used when -running the test set (ie: 16-bit, dp, ddp, etc...) 
- - -Test with Additional DataLoaders -================================ - -You can still run inference on a test dataset even if the :meth:`~pytorch_lightning.core.hooks.DataHooks.test_dataloader` method hasn't been -defined within your :doc:`lightning module <../common/lightning_module>` instance. This would be the case when your test data -is not available at the time your model was declared. - -.. code-block:: python - - # setup your data loader - test_dataloader = DataLoader(...) - - # test (pass in the loader) - trainer.test(dataloaders=test_dataloader) - -You can either pass in a single dataloader or a list of them. This optional named -parameter can be used in conjunction with any of the above use cases. Additionally, -you can also pass in an :doc:`datamodules <../data/datamodule>` that have overridden the -:ref:`datamodule_test_dataloader_label` method. - -.. code-block:: python - - class MyDataModule(pl.LightningDataModule): - ... - - def test_dataloader(self): - return DataLoader(...) - - - # setup your datamodule - dm = MyDataModule(...) - - # test (pass in datamodule) - trainer.test(datamodule=dm) - ----------- - -********** -Validation -********** - -Lightning allows the user to validate their models with any compatible ``val dataloaders``. This can be done before/after training. -The logic associated to the validation is defined within the :meth:`~pytorch_lightning.core.lightning.LightningModule.validation_step`. - -Apart from this ``.validate`` has same API as ``.test``, but would rely respectively on :meth:`~pytorch_lightning.core.lightning.LightningModule.validation_step` and :meth:`~pytorch_lightning.core.lightning.LightningModule.test_step`. - -.. note:: - ``.validate`` method uses the same validation logic being used under validation happening within - :meth:`~pytorch_lightning.trainer.trainer.Trainer.fit` call. - -.. 
warning:: - - When using ``trainer.validate()``, it is recommended to use ``Trainer(devices=1)`` since distributed strategies such as DDP - use :class:`~torch.utils.data.distributed.DistributedSampler` internally, which replicates some samples to - make sure all devices have the same batch size in case of uneven inputs. This is helpful to make sure - benchmarking for research papers is done the right way. - -.. automethod:: pytorch_lightning.trainer.Trainer.validate - :noindex: diff --git a/docs/_sources/common/gradient_accumulation.rst.txt b/docs/_sources/common/gradient_accumulation.rst.txt deleted file mode 100644 index c65e75e..0000000 --- a/docs/_sources/common/gradient_accumulation.rst.txt +++ /dev/null @@ -1,43 +0,0 @@ -Accumulated gradients run K small batches of size ``N`` before doing a backward pass. The effect is a large effective batch size of size ``KxN``, where ``N`` is the batch size. -Internally, it doesn't stack up the batches and do a forward pass; rather, it accumulates the gradients for K batches and then does an ``optimizer.step`` to make sure the -effective batch size is increased but there is no memory overhead. - -.. warning:: - - When using distributed training, e.g. DDP, with let's say ``P`` devices, each device accumulates independently, i.e. it stores the gradients - after each ``loss.backward()`` and doesn't sync the gradients across the devices until we call ``optimizer.step()``. So for each accumulation - step, the effective batch size on each device will remain ``N*K`` but right before the ``optimizer.step()``, the gradient sync will make the effective - batch size as ``P*N*K``. For DP, since the batch is split across devices, the final effective batch size will be ``N*K``. - -.. seealso:: :class:`~pytorch_lightning.trainer.trainer.Trainer` - -.. 
testcode:: - - # DEFAULT (ie: no accumulated grads) - trainer = Trainer(accumulate_grad_batches=1) - - # Accumulate gradients for 7 batches - trainer = Trainer(accumulate_grad_batches=7) - -You can set different values for it at different epochs by passing a dictionary, where the key represents the epoch at which the value for gradient accumulation -should be updated. - -.. testcode:: - - # till 5th epoch, it will accumulate every 8 batches. From 5th epoch - # till 9th epoch it will accumulate every 4 batches and after that no accumulation - # will happen. Note that you need to use zero-indexed epoch keys here - trainer = Trainer(accumulate_grad_batches={0: 8, 4: 4, 8: 1}) - -Or, you can create custom :class:`~pytorch_lightning.callbacks.gradient_accumulation_scheduler.GradientAccumulationScheduler` - -.. testcode:: - - from pytorch_lightning.callbacks import GradientAccumulationScheduler - - - # till 5th epoch, it will accumulate every 8 batches. From 5th epoch - # till 9th epoch it will accumulate every 4 batches and after that no accumulation - # will happen. Note that you need to use zero-indexed epoch keys here - accumulator = GradientAccumulationScheduler(scheduling={0: 8, 4: 4, 8: 1}) - trainer = Trainer(callbacks=accumulator) diff --git a/docs/_sources/common/hyperparameters.rst.txt b/docs/_sources/common/hyperparameters.rst.txt deleted file mode 100644 index 9103100..0000000 --- a/docs/_sources/common/hyperparameters.rst.txt +++ /dev/null @@ -1,279 +0,0 @@ -.. testsetup:: * - - from argparse import ArgumentParser, Namespace - - sys.argv = ["foo"] - -Configure hyperparameters from the CLI --------------------------------------- - -Lightning has utilities to interact seamlessly with the command line ``ArgumentParser`` -and plays well with the hyperparameter optimization framework of your choice. - ----------- - -ArgumentParser -^^^^^^^^^^^^^^ -Lightning is designed to augment a lot of the functionality of the built-in Python ArgumentParser - -.. 
testcode:: - - from argparse import ArgumentParser - - parser = ArgumentParser() - parser.add_argument("--layer_1_dim", type=int, default=128) - args = parser.parse_args() - -This allows you to call your program like so: - -.. code-block:: bash - - python trainer.py --layer_1_dim 64 - ----------- - -Argparser Best Practices -^^^^^^^^^^^^^^^^^^^^^^^^ -It is best practice to layer your arguments in three sections. - -1. Trainer args (``accelerator``, ``devices``, ``num_nodes``, etc...) -2. Model specific arguments (``layer_dim``, ``num_layers``, ``learning_rate``, etc...) -3. Program arguments (``data_path``, ``cluster_email``, etc...) - -| - -We can do this as follows. First, in your ``LightningModule``, define the arguments -specific to that module. Remember that data splits or data paths may also be specific to -a module (i.e.: if your project has a model that trains on Imagenet and another on CIFAR-10). - -.. testcode:: - - class LitModel(LightningModule): - @staticmethod - def add_model_specific_args(parent_parser): - parser = parent_parser.add_argument_group("LitModel") - parser.add_argument("--encoder_layers", type=int, default=12) - parser.add_argument("--data_path", type=str, default="/some/path") - return parent_parser - -Now in your main trainer file, add the ``Trainer`` args, the program args, and add the model args - -.. testcode:: - - # ---------------- - # trainer_main.py - # ---------------- - from argparse import ArgumentParser - - parser = ArgumentParser() - - # add PROGRAM level args - parser.add_argument("--conda_env", type=str, default="some_name") - parser.add_argument("--notification_email", type=str, default="will@email.com") - - # add model specific args - parser = LitModel.add_model_specific_args(parser) - - # add all the available trainer options to argparse - # ie: now --accelerator --devices --num_nodes ... 
--fast_dev_run all work in the cli - parser = Trainer.add_argparse_args(parser) - - args = parser.parse_args() - -Now you can run your program like so: - -.. code-block:: bash - - python trainer_main.py --accelerator 'gpu' --devices 2 --num_nodes 2 --conda_env 'my_env' --encoder_layers 12 - -Finally, make sure to start the training like so: - -.. code-block:: python - - # init the trainer like this - trainer = Trainer.from_argparse_args(args, early_stopping_callback=...) - - # NOT like this - trainer = Trainer(accelerator=hparams.accelerator, devices=hparams.devices, ...) - - # init the model with Namespace directly - model = LitModel(args) - - # or init the model with all the key-value pairs - dict_args = vars(args) - model = LitModel(**dict_args) - ----------- - -LightningModule hyperparameters -^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ -Oftentimes, we train many versions of a model. You might share that model or come back to it a few months later, -at which point it is very useful to know how that model was trained (i.e.: what learning rate, neural network, etc...). - -Lightning has a standardized way of saving the information for you in checkpoints and YAML files. The goal here is to -improve readability and reproducibility. - -save_hyperparameters -"""""""""""""""""""" - -Use :meth:`~pytorch_lightning.core.lightning.LightningModule.save_hyperparameters` within your -:class:`~pytorch_lightning.core.lightning.LightningModule`'s ``__init__`` method. -It will enable Lightning to store all the provided arguments under the ``self.hparams`` attribute. -These hyperparameters will also be stored within the model checkpoint, which simplifies model re-instantiation after training. - -.. 
code-block:: python - - class LitMNIST(LightningModule): - def __init__(self, layer_1_dim=128, learning_rate=1e-2): - super().__init__() - # call this to save (layer_1_dim=128, learning_rate=1e-2) to the checkpoint - self.save_hyperparameters() - - # equivalent - self.save_hyperparameters("layer_1_dim", "learning_rate") - - # Now possible to access layer_1_dim from hparams - self.hparams.layer_1_dim - - -In addition, loggers that support it will automatically log the contents of ``self.hparams``. - -Excluding hyperparameters -""""""""""""""""""""""""" - -By default, every parameter of the ``__init__`` method will be considered a hyperparameter to the LightningModule. -However, sometimes some parameters need to be excluded from saving, for example when they are not serializable. -Those parameters should be provided back when reloading the LightningModule. -In this case, exclude them explicitly: - -.. code-block:: python - - class LitMNIST(LightningModule): - def __init__(self, loss_fx, generator_network, layer_1_dim=128): - super().__init__() - self.layer_1_dim = layer_1_dim - self.loss_fx = loss_fx - - # call this to save only (layer_1_dim=128) to the checkpoint - self.save_hyperparameters("layer_1_dim") - - # equivalent - self.save_hyperparameters(ignore=["loss_fx", "generator_network"]) - - -load_from_checkpoint -"""""""""""""""""""" - -LightningModules that have hyperparameters automatically saved with :meth:`~pytorch_lightning.core.lightning.LightningModule.save_hyperparameters` -can conveniently be loaded and instantiated directly from a checkpoint with :meth:`~pytorch_lightning.core.lightning.LightningModule.load_from_checkpoint`: - -.. code-block:: python - - # to load specify the other args - model = LitMNIST.load_from_checkpoint(PATH, loss_fx=torch.nn.SomeOtherLoss, generator_network=MyGenerator()) - - -If parameters were excluded, they need to be provided at the time of loading: - -.. 
code-block:: python - - # the excluded parameters were `loss_fx` and `generator_network` - model = LitMNIST.load_from_checkpoint(PATH, loss_fx=torch.nn.SomeOtherLoss, generator_network=MyGenerator()) - - ----------- - -Trainer args -^^^^^^^^^^^^ -To recap, add ALL possible trainer flags to the argparser and init the ``Trainer`` this way - -.. code-block:: python - - parser = ArgumentParser() - parser = Trainer.add_argparse_args(parser) - hparams = parser.parse_args() - - trainer = Trainer.from_argparse_args(hparams) - - # or if you need to pass in callbacks - trainer = Trainer.from_argparse_args(hparams, enable_checkpointing=..., callbacks=[...]) - ----------- - -Multiple Lightning Modules -^^^^^^^^^^^^^^^^^^^^^^^^^^ - -We often have multiple Lightning Modules where each one has different arguments. Instead of -polluting the ``main.py`` file, the ``LightningModule`` lets you define arguments for each one. - -.. testcode:: - - class LitMNIST(LightningModule): - def __init__(self, layer_1_dim, **kwargs): - super().__init__() - self.layer_1 = nn.Linear(28 * 28, layer_1_dim) - - @staticmethod - def add_model_specific_args(parent_parser): - parser = parent_parser.add_argument_group("LitMNIST") - parser.add_argument("--layer_1_dim", type=int, default=128) - return parent_parser - -.. testcode:: - - class GoodGAN(LightningModule): - def __init__(self, encoder_layers, **kwargs): - super().__init__() - self.encoder = Encoder(layers=encoder_layers) - - @staticmethod - def add_model_specific_args(parent_parser): - parser = parent_parser.add_argument_group("GoodGAN") - parser.add_argument("--encoder_layers", type=int, default=12) - return parent_parser - - -Now we can allow each model to inject the arguments it needs in the ``main.py`` - -.. 
code-block:: python - - def main(args): - dict_args = vars(args) - - # pick model - if args.model_name == "gan": - model = GoodGAN(**dict_args) - elif args.model_name == "mnist": - model = LitMNIST(**dict_args) - - trainer = Trainer.from_argparse_args(args) - trainer.fit(model) - - - if __name__ == "__main__": - parser = ArgumentParser() - parser = Trainer.add_argparse_args(parser) - - # figure out which model to use - parser.add_argument("--model_name", type=str, default="gan", help="gan or mnist") - - # THIS LINE IS KEY TO PULL THE MODEL NAME - temp_args, _ = parser.parse_known_args() - - # let the model add what it wants - if temp_args.model_name == "gan": - parser = GoodGAN.add_model_specific_args(parser) - elif temp_args.model_name == "mnist": - parser = LitMNIST.add_model_specific_args(parser) - - args = parser.parse_args() - - # train - main(args) - -and now we can train MNIST or the GAN using the command line interface! - -.. code-block:: bash - - $ python main.py --model_name gan --encoder_layers 24 - $ python main.py --model_name mnist --layer_1_dim 128 diff --git a/docs/_sources/common/lightning_module.rst.txt b/docs/_sources/common/lightning_module.rst.txt deleted file mode 100644 index 19bb9b0..0000000 --- a/docs/_sources/common/lightning_module.rst.txt +++ /dev/null @@ -1,1664 +0,0 @@ -.. role:: hidden - :class: hidden-section - -.. _lightning_module: - -############### -LightningModule -############### - -A :class:`~LightningModule` organizes your PyTorch code into 6 sections: - -- Computations (init). -- Train Loop (training_step) -- Validation Loop (validation_step) -- Test Loop (test_step) -- Prediction Loop (predict_step) -- Optimizers and LR Schedulers (configure_optimizers) - -| - -.. raw:: html - - - -| - -Notice a few things. - -1. It is the SAME code. -2. The PyTorch code IS NOT abstracted - just organized. -3. All the other code that's not in the :class:`~LightningModule` - has been automated for you by the Trainer. - -| - - .. 
code-block:: python - - net = Net() - trainer = Trainer() - trainer.fit(net) - -4. There are no ``.cuda()`` or ``.to(device)`` calls required. Lightning does these for you. - -| - - .. code-block:: python - - # don't do in Lightning - x = torch.Tensor(2, 3) - x = x.cuda() - x = x.to(device) - - # do this instead - x = x # leave it alone! - - # or to init a new tensor - new_x = torch.Tensor(2, 3) - new_x = new_x.type_as(x) - -5. When running under a distributed strategy, Lightning handles the distributed sampler for you by default. - -| - - .. code-block:: python - - # Don't do in Lightning... - data = MNIST(...) - sampler = DistributedSampler(data) - DataLoader(data, sampler=sampler) - - # do this instead - data = MNIST(...) - DataLoader(data) - -6. A :class:`~LightningModule` is a :class:`torch.nn.Module` but with added functionality. Use it as such! - -| - - .. code-block:: python - - net = Net.load_from_checkpoint(PATH) - net.freeze() - out = net(x) - -Thus, to use Lightning, you just need to organize your code which takes about 30 minutes, -(and let's be real, you probably should do anyway). - ------------- - -*************** -Starter Example -*************** - -Here are the only required methods. - -.. code-block:: python - - import pytorch_lightning as pl - import torch.nn as nn - import torch.nn.functional as F - - - class LitModel(pl.LightningModule): - def __init__(self): - super().__init__() - self.l1 = nn.Linear(28 * 28, 10) - - def forward(self, x): - return torch.relu(self.l1(x.view(x.size(0), -1))) - - def training_step(self, batch, batch_idx): - x, y = batch - y_hat = self(x) - loss = F.cross_entropy(y_hat, y) - return loss - - def configure_optimizers(self): - return torch.optim.Adam(self.parameters(), lr=0.02) - -Which you can train by doing: - -.. 
code-block:: python - - train_loader = DataLoader(MNIST(os.getcwd(), download=True, transform=transforms.ToTensor())) - trainer = pl.Trainer(max_epochs=1) - model = LitModel() - - trainer.fit(model, train_dataloaders=train_loader) - -The LightningModule has many convenience methods, but the core ones you need to know about are: - -.. list-table:: - :widths: 50 50 - :header-rows: 1 - - * - Name - - Description - * - init - - Define computations here - * - forward - - Use for inference only (separate from training_step) - * - training_step - - the complete training loop - * - validation_step - - the complete validation loop - * - test_step - - the complete test loop - * - predict_step - - the complete prediction loop - * - configure_optimizers - - define optimizers and LR schedulers - ----------- - -******** -Training -******** - -Training Loop -============= - -To activate the training loop, override the :meth:`~pytorch_lightning.core.lightning.LightningModule.training_step` method. - -.. code-block:: python - - class LitClassifier(pl.LightningModule): - def __init__(self, model): - super().__init__() - self.model = model - - def training_step(self, batch, batch_idx): - x, y = batch - y_hat = self.model(x) - loss = F.cross_entropy(y_hat, y) - return loss - -Under the hood, Lightning does the following (pseudocode): - -.. code-block:: python - - # put model in train mode and enable gradient calculation - model.train() - torch.set_grad_enabled(True) - - outs = [] - for batch_idx, batch in enumerate(train_dataloader): - loss = training_step(batch, batch_idx) - outs.append(loss.detach()) - - # clear gradients - optimizer.zero_grad() - - # backward - loss.backward() - - # update parameters - optimizer.step() - - -Train Epoch-level Metrics -========================= - -If you want to calculate epoch-level metrics and log them, use :meth:`~pytorch_lightning.core.lightning.LightningModule.log`. - -.. 
code-block:: python - - def training_step(self, batch, batch_idx): - x, y = batch - y_hat = self.model(x) - loss = F.cross_entropy(y_hat, y) - - # logs metrics for each training_step, - # and the average across the epoch, to the progress bar and logger - self.log("train_loss", loss, on_step=True, on_epoch=True, prog_bar=True, logger=True) - return loss - -The :meth:`~pytorch_lightning.core.lightning.LightningModule.log` object automatically reduces the -requested metrics across a complete epoch and devices. Here's the pseudocode of what it does under the hood: - -.. code-block:: python - - outs = [] - for batch_idx, batch in enumerate(train_dataloader): - # forward - loss = training_step(batch, batch_idx) - outs.append(loss) - - # clear gradients - optimizer.zero_grad() - - # backward - loss.backward() - - # update parameters - optimizer.step() - - epoch_metric = torch.mean(torch.stack([x for x in outs])) - -Train Epoch-level Operations -============================ - -If you need to do something with all the outputs of each :meth:`~pytorch_lightning.core.lightning.LightningModule.training_step`, -override the :meth:`~pytorch_lightning.core.lightning.LightningModule.training_epoch_end` method. - -.. code-block:: python - - def training_step(self, batch, batch_idx): - x, y = batch - y_hat = self.model(x) - loss = F.cross_entropy(y_hat, y) - preds = ... - return {"loss": loss, "other_stuff": preds} - - - def training_epoch_end(self, training_step_outputs): - all_preds = torch.stack(training_step_outputs) - ... - -The matching pseudocode is: - -.. 
code-block:: python - - outs = [] - for batch_idx, batch in enumerate(train_dataloader): - # forward - loss = training_step(batch, batch_idx) - outs.append(loss) - - # clear gradients - optimizer.zero_grad() - - # backward - loss.backward() - - # update parameters - optimizer.step() - - training_epoch_end(outs) - -Training with DataParallel -========================== - -When training using a ``strategy`` that splits data from each batch across GPUs, sometimes you might -need to aggregate them on the main GPU for processing (DP, or DDP2). - -In this case, implement the :meth:`~pytorch_lightning.core.lightning.LightningModule.training_step_end` -method which will have outputs from all the devices and you can accumulate to get the effective results. - -.. code-block:: python - - def training_step(self, batch, batch_idx): - x, y = batch - y_hat = self.model(x) - loss = F.cross_entropy(y_hat, y) - pred = ... - return {"loss": loss, "pred": pred} - - - def training_step_end(self, batch_parts): - # predictions from each GPU - predictions = batch_parts["pred"] - # losses from each GPU - losses = batch_parts["loss"] - - gpu_0_prediction = predictions[0] - gpu_1_prediction = predictions[1] - - # do something with both outputs - return (losses[0] + losses[1]) / 2 - - - def training_epoch_end(self, training_step_outputs): - for out in training_step_outputs: - ... - -Here is the Lightning training pseudo-code for DP: - -.. 
code-block:: python - - outs = [] - for batch_idx, train_batch in enumerate(train_dataloader): - batches = split_batch(train_batch) - dp_outs = [] - for sub_batch in batches: - # 1 - dp_out = training_step(sub_batch, batch_idx) - dp_outs.append(dp_out) - - # 2 - out = training_step_end(dp_outs) - outs.append(out) - - # do something with the outputs for all batches - # 3 - training_epoch_end(outs) - ------------------- - -********** -Validation -********** - -Validation Loop -=============== - -To activate the validation loop while training, override the :meth:`~pytorch_lightning.core.lightning.LightningModule.validation_step` method. - -.. code-block:: python - - class LitModel(pl.LightningModule): - def validation_step(self, batch, batch_idx): - x, y = batch - y_hat = self.model(x) - loss = F.cross_entropy(y_hat, y) - self.log("val_loss", loss) - -Under the hood, Lightning does the following (pseudocode): - -.. code-block:: python - - # ... - for batch_idx, batch in enumerate(train_dataloader): - loss = model.training_step(batch, batch_idx) - loss.backward() - # ... - - if validate_at_some_point: - # disable grads + batchnorm + dropout - torch.set_grad_enabled(False) - model.eval() - - # ----------------- VAL LOOP --------------- - for val_batch_idx, val_batch in enumerate(val_dataloader): - val_out = model.validation_step(val_batch, val_batch_idx) - # ----------------- VAL LOOP --------------- - - # enable grads + batchnorm + dropout - torch.set_grad_enabled(True) - model.train() - -You can also run just the validation loop on your validation dataloaders by overriding :meth:`~pytorch_lightning.core.lightning.LightningModule.validation_step` -and calling :meth:`~pytorch_lightning.trainer.trainer.Trainer.validate`. - -.. code-block:: python - - model = Model() - trainer = Trainer() - trainer.validate(model) - -.. note:: - - It is recommended to validate on single device to ensure each sample/batch gets evaluated exactly once. 
- This is helpful to make sure benchmarking for research papers is done the right way. Otherwise, in a - multi-device setting, samples could occur duplicated when :class:`~torch.utils.data.distributed.DistributedSampler` - is used, for eg. with ``strategy="ddp"``. It replicates some samples on some devices to make sure all devices have - same batch size in case of uneven inputs. - - -Validation Epoch-level Metrics -============================== - -If you need to do something with all the outputs of each :meth:`~pytorch_lightning.core.lightning.LightningModule.validation_step`, -override the :meth:`~pytorch_lightning.core.lightning.LightningModule.validation_epoch_end` method. Note that this method is called before :meth:`~pytorch_lightning.core.lightning.LightningModule.training_epoch_end`. - -.. code-block:: python - - def validation_step(self, batch, batch_idx): - x, y = batch - y_hat = self.model(x) - loss = F.cross_entropy(y_hat, y) - pred = ... - return pred - - - def validation_epoch_end(self, validation_step_outputs): - all_preds = torch.stack(validation_step_outputs) - ... - -Validating with DataParallel -============================ - -When training using a ``strategy`` that splits data from each batch across GPUs, sometimes you might -need to aggregate them on the main GPU for processing (DP, or DDP2). - -In this case, implement the :meth:`~pytorch_lightning.core.lightning.LightningModule.validation_step_end` -method which will have outputs from all the devices and you can accumulate to get the effective results. - -.. code-block:: python - - def validation_step(self, batch, batch_idx): - x, y = batch - y_hat = self.model(x) - loss = F.cross_entropy(y_hat, y) - pred = ... 
- return {"loss": loss, "pred": pred} - - - def validation_step_end(self, batch_parts): - # predictions from each GPU - predictions = batch_parts["pred"] - # losses from each GPU - losses = batch_parts["loss"] - - gpu_0_prediction = predictions[0] - gpu_1_prediction = predictions[1] - - # do something with both outputs - return (losses[0] + losses[1]) / 2 - - - def validation_epoch_end(self, validation_step_outputs): - for out in validation_step_outputs: - ... - -Here is the Lightning validation pseudo-code for DP: - -.. code-block:: python - - outs = [] - for batch in dataloader: - batches = split_batch(batch) - dp_outs = [] - for sub_batch in batches: - # 1 - dp_out = validation_step(sub_batch) - dp_outs.append(dp_out) - - # 2 - out = validation_step_end(dp_outs) - outs.append(out) - - # do something with the outputs for all batches - # 3 - validation_epoch_end(outs) - ----------------- - -******* -Testing -******* - -Test Loop -========= - -The process for enabling a test loop is the same as the process for enabling a validation loop. Please refer to -the section above for details. For this you need to override the :meth:`~pytorch_lightning.core.lightning.LightningModule.test_step` method. - -The only difference is that the test loop is only called when :meth:`~pytorch_lightning.trainer.trainer.Trainer.test` is used. - -.. code-block:: python - - model = Model() - trainer = Trainer() - trainer.fit(model) - - # automatically loads the best weights for you - trainer.test(model) - -There are two ways to call ``test()``: - -.. code-block:: python - - # call after training - trainer = Trainer() - trainer.fit(model) - - # automatically auto-loads the best weights from the previous run - trainer.test(dataloaders=test_dataloader) - - # or call with pretrained model - model = MyLightningModule.load_from_checkpoint(PATH) - trainer = Trainer() - trainer.test(model, dataloaders=test_dataloader) - -.. 
note:: - - It is recommended to validate on single device to ensure each sample/batch gets evaluated exactly once. - This is helpful to make sure benchmarking for research papers is done the right way. Otherwise, in a - multi-device setting, samples could occur duplicated when :class:`~torch.utils.data.distributed.DistributedSampler` - is used, for eg. with ``strategy="ddp"``. It replicates some samples on some devices to make sure all devices have - same batch size in case of uneven inputs. - - ----------- - -********* -Inference -********* - -Prediction Loop -=============== - -By default, the :meth:`~pytorch_lightning.core.lightning.LightningModule.predict_step` method runs the -:meth:`~pytorch_lightning.core.lightning.LightningModule.forward` method. In order to customize this behaviour, -simply override the :meth:`~pytorch_lightning.core.lightning.LightningModule.predict_step` method. - -For the example let's override ``predict_step`` and try out `Monte Carlo Dropout `_: - -.. code-block:: python - - class LitMCdropoutModel(pl.LightningModule): - def __init__(self, model, mc_iteration): - super().__init__() - self.model = model - self.dropout = nn.Dropout() - self.mc_iteration = mc_iteration - - def predict_step(self, batch, batch_idx): - # enable Monte Carlo Dropout - self.dropout.train() - - # take average of `self.mc_iteration` iterations - pred = torch.vstack([self.dropout(self.model(x)).unsqueeze(0) for _ in range(self.mc_iteration)]).mean(dim=0) - return pred - -Under the hood, Lightning does the following (pseudocode): - -.. code-block:: python - - # disable grads + batchnorm + dropout - torch.set_grad_enabled(False) - model.eval() - all_preds = [] - - for batch_idx, batch in enumerate(predict_dataloader): - pred = model.predict_step(batch, batch_idx) - all_preds.append(pred) - -There are two ways to call ``predict()``: - -.. 
code-block:: python - - # call after training - trainer = Trainer() - trainer.fit(model) - - # automatically auto-loads the best weights from the previous run - predictions = trainer.predict(dataloaders=predict_dataloader) - - # or call with pretrained model - model = MyLightningModule.load_from_checkpoint(PATH) - trainer = Trainer() - predictions = trainer.predict(model, dataloaders=test_dataloader) - -Inference in Research -===================== - -If you want to perform inference with the system, you can add a ``forward`` method to the LightningModule. - -.. note:: When using forward, you are responsible to call :func:`~torch.nn.Module.eval` and use the :func:`~torch.no_grad` context manager. - -.. code-block:: python - - class Autoencoder(pl.LightningModule): - def forward(self, x): - return self.decoder(x) - - - model = Autoencoder() - model.eval() - with torch.no_grad(): - reconstruction = model(embedding) - -The advantage of adding a forward is that in complex systems, you can do a much more involved inference procedure, -such as text generation: - -.. code-block:: python - - class Seq2Seq(pl.LightningModule): - def forward(self, x): - embeddings = self(x) - hidden_states = self.encoder(embeddings) - for h in hidden_states: - # decode - ... - return decoded - -In the case where you want to scale your inference, you should be using -:meth:`~pytorch_lightning.core.lightning.LightningModule.predict_step`. - -.. code-block:: python - - class Autoencoder(pl.LightningModule): - def forward(self, x): - return self.decoder(x) - - def predict_step(self, batch, batch_idx, dataloader_idx=0): - # this calls forward - return self(batch) - - - data_module = ... - model = Autoencoder() - trainer = Trainer(accelerator="gpu", devices=2) - trainer.predict(model, data_module) - -Inference in Production -======================= - -For cases like production, you might want to iterate different models inside a LightningModule. - -.. 
code-block:: python - - from torchmetrics.functional import accuracy - - - class ClassificationTask(pl.LightningModule): - def __init__(self, model): - super().__init__() - self.model = model - - def training_step(self, batch, batch_idx): - x, y = batch - y_hat = self.model(x) - loss = F.cross_entropy(y_hat, y) - return loss - - def validation_step(self, batch, batch_idx): - loss, acc = self._shared_eval_step(batch, batch_idx) - metrics = {"val_acc": acc, "val_loss": loss} - self.log_dict(metrics) - return metrics - - def test_step(self, batch, batch_idx): - loss, acc = self._shared_eval_step(batch, batch_idx) - metrics = {"test_acc": acc, "test_loss": loss} - self.log_dict(metrics) - return metrics - - def _shared_eval_step(self, batch, batch_idx): - x, y = batch - y_hat = self.model(x) - loss = F.cross_entropy(y_hat, y) - acc = accuracy(y_hat, y) - return loss, acc - - def predict_step(self, batch, batch_idx, dataloader_idx=0): - x, y = batch - y_hat = self.model(x) - return y_hat - - def configure_optimizers(self): - return torch.optim.Adam(self.model.parameters(), lr=0.02) - -Then pass in any arbitrary model to be fit with this task - -.. code-block:: python - - for model in [resnet50(), vgg16(), BidirectionalRNN()]: - task = ClassificationTask(model) - - trainer = Trainer(accelerator="gpu", devices=2) - trainer.fit(task, train_dataloaders=train_dataloader, val_dataloaders=val_dataloader) - -Tasks can be arbitrarily complex such as implementing GAN training, self-supervised or even RL. - -.. code-block:: python - - class GANTask(pl.LightningModule): - def __init__(self, generator, discriminator): - super().__init__() - self.generator = generator - self.discriminator = discriminator - - ... - -When used like this, the model can be separated from the Task and thus used in production without needing to keep it in -a ``LightningModule``. - -The following example shows how you can run inference in the Python runtime: - -.. 
code-block:: python - - task = ClassificationTask(model) - trainer = Trainer(accelerator="gpu", devices=2) - trainer.fit(task, train_dataloader, val_dataloader) - trainer.save_checkpoint("best_model.ckpt") - - # use model after training or load weights and drop into the production system - model = ClassificationTask.load_from_checkpoint("best_model.ckpt") - x = ... - model.eval() - with torch.no_grad(): - y_hat = model(x) - -Check out :ref:`Inference in Production ` guide to learn about the possible ways to perform inference in production. - - ------------ - - -************* -Child Modules -************* - -.. include:: ../common/child_modules.rst - ------------ - -******************* -LightningModule API -******************* - - -Methods -======= - -all_gather -~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.all_gather - :noindex: - -configure_callbacks -~~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.configure_callbacks - :noindex: - -configure_optimizers -~~~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.configure_optimizers - :noindex: - -forward -~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.forward - :noindex: - -freeze -~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.freeze - :noindex: - -.. _lm-log: - -log -~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.log - :noindex: - -log_dict -~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.log_dict - :noindex: - -lr_schedulers -~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.lr_schedulers - :noindex: - -manual_backward -~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.manual_backward - :noindex: - -optimizers -~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.optimizers - :noindex: - -print -~~~~~ - -.. 
automethod:: pytorch_lightning.core.lightning.LightningModule.print - :noindex: - -predict_step -~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.predict_step - :noindex: - -save_hyperparameters -~~~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.save_hyperparameters - :noindex: - -toggle_optimizer -~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.toggle_optimizer - :noindex: - -test_step -~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.test_step - :noindex: - -test_step_end -~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.test_step_end - :noindex: - -test_epoch_end -~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.test_epoch_end - :noindex: - -to_onnx -~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.to_onnx - :noindex: - -to_torchscript -~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.to_torchscript - :noindex: - -training_step -~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.training_step - :noindex: - -training_step_end -~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.training_step_end - :noindex: - -training_epoch_end -~~~~~~~~~~~~~~~~~~ -.. automethod:: pytorch_lightning.core.lightning.LightningModule.training_epoch_end - :noindex: - -unfreeze -~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.unfreeze - :noindex: - -untoggle_optimizer -~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.untoggle_optimizer - :noindex: - -validation_step -~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.validation_step - :noindex: - -validation_step_end -~~~~~~~~~~~~~~~~~~~ - -.. 
automethod:: pytorch_lightning.core.lightning.LightningModule.validation_step_end - :noindex: - -validation_epoch_end -~~~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.validation_epoch_end - :noindex: - ------------ - -Properties -========== - -These are properties available in a LightningModule. - -current_epoch -~~~~~~~~~~~~~ - -The number of epochs run. - -.. code-block:: python - - def training_step(self, batch, batch_idx): - if self.current_epoch == 0: - ... - -device -~~~~~~ - -The device the module is on. Use it to keep your code device agnostic. - -.. code-block:: python - - def training_step(self, batch, batch_idx): - z = torch.rand(2, 3, device=self.device) - -global_rank -~~~~~~~~~~~ - -The ``global_rank`` is the index of the current process across all nodes and devices. -Lightning will perform some operations such as logging, weight checkpointing only when ``global_rank=0``. You -usually do not need to use this property, but it is useful to know how to access it if needed. - -.. code-block:: python - - def training_step(self, batch, batch_idx): - if self.global_rank == 0: - # do something only once across all the nodes - ... - -global_step -~~~~~~~~~~~ - -The number of optimizer steps taken (does not reset each epoch). -This includes multiple optimizers and TBPTT steps (if enabled). - -.. code-block:: python - - def training_step(self, batch, batch_idx): - self.logger.experiment.log_image(..., step=self.global_step) - -hparams -~~~~~~~ - -The arguments passed through ``LightningModule.__init__()`` and saved by calling -:meth:`~pytorch_lightning.core.mixins.hparams_mixin.HyperparametersMixin.save_hyperparameters` could be accessed by the ``hparams`` attribute. - -.. 
code-block:: python - - def __init__(self, learning_rate): - self.save_hyperparameters() - - - def configure_optimizers(self): - return Adam(self.parameters(), lr=self.hparams.learning_rate) - -logger -~~~~~~ - -The current logger being used (tensorboard or other supported logger) - -.. code-block:: python - - def training_step(self, batch, batch_idx): - # the generic logger (same no matter if tensorboard or other supported logger) - self.logger - - # the particular logger - tensorboard_logger = self.logger.experiment - -loggers -~~~~~~~ - -The list of loggers currently being used by the Trainer. - -.. code-block:: python - - def training_step(self, batch, batch_idx): - # List of Logger objects - loggers = self.loggers - for logger in loggers: - logger.log_metrics({"foo": 1.0}) - -local_rank -~~~~~~~~~~~ - -The ``local_rank`` is the index of the current process across all the devices for the current node. -You usually do not need to use this property, but it is useful to know how to access it if needed. -For example, if using 10 machines (or nodes), the GPU at index 0 on each machine has local_rank = 0. - -.. code-block:: python - - def training_step(self, batch, batch_idx): - if self.local_rank == 0: - # do something only once across each node - ... - -precision -~~~~~~~~~ - -The type of precision used: - -.. code-block:: python - - def training_step(self, batch, batch_idx): - if self.precision == 16: - ... - -trainer -~~~~~~~ - -Pointer to the trainer - -.. code-block:: python - - def training_step(self, batch, batch_idx): - max_steps = self.trainer.max_steps - any_flag = self.trainer.any_flag - -prepare_data_per_node -~~~~~~~~~~~~~~~~~~~~~ - -If set to ``True`` will call ``prepare_data()`` on LOCAL_RANK=0 for every node. -If set to ``False`` will only call from NODE_RANK=0, LOCAL_RANK=0. - -.. 
testcode:: - - class LitModel(LightningModule): - def __init__(self): - super().__init__() - self.prepare_data_per_node = True - -automatic_optimization -~~~~~~~~~~~~~~~~~~~~~~ - -When set to ``False``, Lightning does not automate the optimization process. This means you are responsible for handling -your optimizers. However, we do take care of precision and any accelerators used. - -See :ref:`manual optimization ` for details. - -.. code-block:: python - - def __init__(self): - self.automatic_optimization = False - - - def training_step(self, batch, batch_idx): - opt = self.optimizers(use_pl_optimizer=True) - - loss = ... - opt.zero_grad() - self.manual_backward(loss) - opt.step() - -This is recommended only if using 2+ optimizers AND if you know how to perform the optimization procedure properly. Note -that automatic optimization can still be used with multiple optimizers by relying on the ``optimizer_idx`` parameter. -Manual optimization is most useful for research topics like reinforcement learning, sparse coding, and GAN research. - -.. code-block:: python - - def __init__(self): - self.automatic_optimization = False - - - def training_step(self, batch, batch_idx): - # access your optimizers with use_pl_optimizer=False. Default is True - opt_a, opt_b = self.optimizers(use_pl_optimizer=True) - - gen_loss = ... - opt_a.zero_grad() - self.manual_backward(gen_loss) - opt_a.step() - - disc_loss = ... - opt_b.zero_grad() - self.manual_backward(disc_loss) - opt_b.step() - -example_input_array -~~~~~~~~~~~~~~~~~~~ - -Set and access example_input_array, which basically represents a single batch. - -.. code-block:: python - - def __init__(self): - self.example_input_array = ... - self.generator = ... 
- - - def on_train_epoch_end(self): - # generate some images using the example_input_array - gen_images = self.generator(self.example_input_array) - -truncated_bptt_steps -~~~~~~~~~~~~~~~~~~~~ - -Truncated Backpropagation Through Time (TBPTT) performs perform backpropogation every k steps of -a much longer sequence. This is made possible by passing training batches -split along the time-dimensions into splits of size k to the -``training_step``. In order to keep the same forward propagation behavior, all -hidden states should be kept in-between each time-dimension split. - - -If this is enabled, your batches will automatically get truncated -and the Trainer will apply Truncated Backprop to it. - -(`Williams et al. "An efficient gradient-based algorithm for on-line training of -recurrent network trajectories." -`_) - -`Tutorial `_ - -.. testcode:: python - - from pytorch_lightning import LightningModule - - - class MyModel(LightningModule): - def __init__(self, input_size, hidden_size, num_layers): - super().__init__() - # batch_first has to be set to True - self.lstm = nn.LSTM( - input_size=input_size, - hidden_size=hidden_size, - num_layers=num_layers, - batch_first=True, - ) - - ... - - # Important: This property activates truncated backpropagation through time - # Setting this value to 2 splits the batch into sequences of size 2 - self.truncated_bptt_steps = 2 - - # Truncated back-propagation through time - def training_step(self, batch, batch_idx, hiddens): - x, y = batch - - # the training step must be updated to accept a ``hiddens`` argument - # hiddens are the hiddens from the previous truncated backprop step - out, hiddens = self.lstm(x, hiddens) - - ... - - return {"loss": ..., "hiddens": hiddens} - -Lightning takes care of splitting your batch along the time-dimension. It is -assumed to be the second dimension of your batches. Therefore, in the -example above, we have set ``batch_first=True``. - -.. 
code-block:: python - - # we use the second as the time dimension - # (batch, time, ...) - sub_batch = batch[0, 0:t, ...] - -To modify how the batch is split, -override the :meth:`pytorch_lightning.core.lightning.LightningModule.tbptt_split_batch` method: - -.. testcode:: python - - class LitMNIST(LightningModule): - def tbptt_split_batch(self, batch, split_size): - # do your own splitting on the batch - return splits - --------------- - -.. _lightning_hooks: - -Hooks -===== - -This is the pseudocode to describe the structure of :meth:`~pytorch_lightning.trainer.Trainer.fit`. -The inputs and outputs of each function are not represented for simplicity. Please check each function's API reference -for more information. - -.. code-block:: python - - def fit(self): - if global_rank == 0: - # prepare data is called on GLOBAL_ZERO only - prepare_data() - - configure_callbacks() - - with parallel(devices): - # devices can be GPUs, TPUs, ... - train_on_device(model) - - - def train_on_device(model): - # called PER DEVICE - on_fit_start() - setup("fit") - configure_optimizers() - - # the sanity check runs here - - on_train_start() - for epoch in epochs: - fit_loop() - on_train_end() - - on_fit_end() - teardown("fit") - - - def fit_loop(): - on_train_epoch_start() - - for batch in train_dataloader(): - on_train_batch_start() - - on_before_batch_transfer() - transfer_batch_to_device() - on_after_batch_transfer() - - training_step() - - on_before_zero_grad() - optimizer_zero_grad() - - on_before_backward() - backward() - on_after_backward() - - on_before_optimizer_step() - configure_gradient_clipping() - optimizer_step() - - on_train_batch_end() - - if should_check_val: - val_loop() - # end training epoch - training_epoch_end() - - on_train_epoch_end() - - - def val_loop(): - on_validation_model_eval() # calls `model.eval()` - torch.set_grad_enabled(False) - - on_validation_start() - on_validation_epoch_start() - - val_outs = [] - for batch_idx, batch in 
enumerate(val_dataloader()): - on_validation_batch_start(batch, batch_idx) - - batch = on_before_batch_transfer(batch) - batch = transfer_batch_to_device(batch) - batch = on_after_batch_transfer(batch) - - out = validation_step(batch, batch_idx) - - on_validation_batch_end(batch, batch_idx) - val_outs.append(out) - - validation_epoch_end(val_outs) - - on_validation_epoch_end() - on_validation_end() - - # set up for train - on_validation_model_train() # calls `model.train()` - torch.set_grad_enabled(True) - -backward -~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.backward - :noindex: - -on_before_backward -~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_before_backward - :noindex: - -on_after_backward -~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_after_backward - :noindex: - -on_before_zero_grad -~~~~~~~~~~~~~~~~~~~ -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_before_zero_grad - :noindex: - -on_fit_start -~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_fit_start - :noindex: - -on_fit_end -~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_fit_end - :noindex: - - -on_load_checkpoint -~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_load_checkpoint - :noindex: - -on_save_checkpoint -~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_save_checkpoint - :noindex: - -load_from_checkpoint -~~~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.load_from_checkpoint - :noindex: - -on_hpc_save -~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_hpc_save - :noindex: - -on_hpc_load -~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_hpc_load - :noindex: - -on_train_start -~~~~~~~~~~~~~~ - -.. 
automethod:: pytorch_lightning.core.lightning.LightningModule.on_train_start - :noindex: - -on_train_end -~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_train_end - :noindex: - -on_validation_start -~~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_validation_start - :noindex: - -on_validation_end -~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_validation_end - :noindex: - -on_test_batch_start -~~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_test_batch_start - :noindex: - -on_test_batch_end -~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_test_batch_end - :noindex: - -on_test_epoch_start -~~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_test_epoch_start - :noindex: - -on_test_epoch_end -~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_test_epoch_end - :noindex: - -on_test_start -~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_test_start - :noindex: - -on_test_end -~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_test_end - :noindex: - -on_predict_batch_start -~~~~~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_predict_batch_start - :noindex: - -on_predict_batch_end -~~~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_predict_batch_end - :noindex: - -on_predict_epoch_start -~~~~~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_predict_epoch_start - :noindex: - -on_predict_epoch_end -~~~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_predict_epoch_end - :noindex: - -on_predict_start -~~~~~~~~~~~~~~~~ - -.. 
automethod:: pytorch_lightning.core.lightning.LightningModule.on_predict_start - :noindex: - -on_predict_end -~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_predict_end - :noindex: - -on_train_batch_start -~~~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_train_batch_start - :noindex: - -on_train_batch_end -~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_train_batch_end - :noindex: - -on_train_epoch_start -~~~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_train_epoch_start - :noindex: - -on_train_epoch_end -~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_train_epoch_end - :noindex: - -on_validation_batch_start -~~~~~~~~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_validation_batch_start - :noindex: - -on_validation_batch_end -~~~~~~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_validation_batch_end - :noindex: - -on_validation_epoch_start -~~~~~~~~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_validation_epoch_start - :noindex: - -on_validation_epoch_end -~~~~~~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_validation_epoch_end - :noindex: - -on_post_move_to_device -~~~~~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_post_move_to_device - :noindex: - -configure_sharded_model -~~~~~~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.configure_sharded_model - :noindex: - -on_validation_model_eval -~~~~~~~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_validation_model_eval - :noindex: - -on_validation_model_train -~~~~~~~~~~~~~~~~~~~~~~~~~ - -.. 
automethod:: pytorch_lightning.core.lightning.LightningModule.on_validation_model_train - :noindex: - -on_test_model_eval -~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_test_model_eval - :noindex: - -on_test_model_train -~~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_test_model_train - :noindex: - -on_before_optimizer_step -~~~~~~~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_before_optimizer_step - :noindex: - -configure_gradient_clipping -~~~~~~~~~~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.configure_gradient_clipping - :noindex: - -optimizer_step -~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.optimizer_step - :noindex: - -optimizer_zero_grad -~~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.optimizer_zero_grad - :noindex: - -prepare_data -~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.prepare_data - :noindex: - -setup -~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.setup - :noindex: - -tbptt_split_batch -~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.tbptt_split_batch - :noindex: - -teardown -~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.teardown - :noindex: - -train_dataloader -~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.train_dataloader - :noindex: - -val_dataloader -~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.val_dataloader - :noindex: - -test_dataloader -~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.test_dataloader - :noindex: - -predict_dataloader -~~~~~~~~~~~~~~~~~~ - -.. 
automethod:: pytorch_lightning.core.lightning.LightningModule.predict_dataloader - :noindex: - -on_train_dataloader -~~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_train_dataloader - :noindex: - -on_val_dataloader -~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_val_dataloader - :noindex: - -on_test_dataloader -~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_test_dataloader - :noindex: - -on_predict_dataloader -~~~~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_predict_dataloader - :noindex: - -transfer_batch_to_device -~~~~~~~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.transfer_batch_to_device - :noindex: - -on_before_batch_transfer -~~~~~~~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_before_batch_transfer - :noindex: - -on_after_batch_transfer -~~~~~~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_after_batch_transfer - :noindex: - -add_to_queue -~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.add_to_queue - :noindex: - -get_from_queue -~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.get_from_queue - :noindex: diff --git a/docs/_sources/common/optimization.rst.txt b/docs/_sources/common/optimization.rst.txt deleted file mode 100644 index e7e9e12..0000000 --- a/docs/_sources/common/optimization.rst.txt +++ /dev/null @@ -1,327 +0,0 @@ -:orphan: - -.. _optimization: - -############ -Optimization -############ - -Lightning offers two modes for managing the optimization process: - -- Manual Optimization -- Automatic Optimization - -For the majority of research cases, **automatic optimization** will do the right thing for you and it is what most -users should use. 
- -For advanced/expert users who want to do esoteric optimization schedules or techniques, use **manual optimization**. - -.. _manual_optimization: - ----- - -.. include:: ../model/manual_optimization.rst - ------ - -********************** -Automatic Optimization -********************** - -With Lightning, most users don't have to think about when to call ``.zero_grad()``, ``.backward()`` and ``.step()`` -since Lightning automates that for you. - -Under the hood, Lightning does the following: - -.. code-block:: python - - for epoch in epochs: - for batch in data: - - def closure(): - loss = model.training_step(batch, batch_idx, ...) - optimizer.zero_grad() - loss.backward() - return loss - - optimizer.step(closure) - - lr_scheduler.step() - -In the case of multiple optimizers, Lightning does the following: - -.. code-block:: python - - for epoch in epochs: - for batch in data: - for opt in optimizers: - - def closure(): - loss = model.training_step(batch, batch_idx, optimizer_idx) - opt.zero_grad() - loss.backward() - return loss - - opt.step(closure) - - for lr_scheduler in lr_schedulers: - lr_scheduler.step() - -As can be seen in the code snippet above, Lightning defines a closure with ``training_step()``, ``optimizer.zero_grad()`` -and ``loss.backward()`` for the optimization. This mechanism is in place to support optimizers which operate on the -output of the closure (e.g. the loss) or need to call the closure several times (e.g. :class:`~torch.optim.LBFGS`). - -.. warning:: - - Before v1.2.2, Lightning internally calls ``backward``, ``step`` and ``zero_grad`` in the order. - From v1.2.2, the order is changed to ``zero_grad``, ``backward`` and ``step``. - - -Gradient Accumulation -===================== - -.. 
include:: ../common/gradient_accumulation.rst - - -Use Multiple Optimizers (like GANs) -=================================== - -To use multiple optimizers (optionally with learning rate schedulers), return two or more optimizers from -:meth:`~pytorch_lightning.core.lightning.LightningModule.configure_optimizers`. - -.. testcode:: python - - # two optimizers, no schedulers - def configure_optimizers(self): - return Adam(...), SGD(...) - - - # two optimizers, one scheduler for adam only - def configure_optimizers(self): - opt1 = Adam(...) - opt2 = SGD(...) - optimizers = [opt1, opt2] - lr_schedulers = {"scheduler": ReduceLROnPlateau(opt1, ...), "monitor": "metric_to_track"} - return optimizers, lr_schedulers - - - # two optimizers, two schedulers - def configure_optimizers(self): - opt1 = Adam(...) - opt2 = SGD(...) - return [opt1, opt2], [StepLR(opt1, ...), OneCycleLR(opt2, ...)] - -Under the hood, Lightning will call each optimizer sequentially: - -.. code-block:: python - - for epoch in epochs: - for batch in data: - for opt in optimizers: - loss = train_step(batch, batch_idx, optimizer_idx) - opt.zero_grad() - loss.backward() - opt.step() - - for lr_scheduler in lr_schedulers: - lr_scheduler.step() - - -Step Optimizers at Arbitrary Intervals -======================================= - -To do more interesting things with your optimizers such as learning rate warm-up or odd scheduling, -override the :meth:`~pytorch_lightning.core.lightning.LightningModule.optimizer_step` function. - -.. warning:: - If you are overriding this method, make sure that you pass the ``optimizer_closure`` parameter to - ``optimizer.step()`` function as shown in the examples because ``training_step()``, ``optimizer.zero_grad()``, - ``loss.backward()`` are called in the closure function. - -For example, here we step optimizer A every batch and optimizer B every 2 batches. - -.. testcode:: python - - # Alternating schedule for optimizer steps (e.g.
GANs) - def optimizer_step( - self, - epoch, - batch_idx, - optimizer, - optimizer_idx, - optimizer_closure, - on_tpu=False, - using_native_amp=False, - using_lbfgs=False, - ): - # update generator every step - if optimizer_idx == 0: - optimizer.step(closure=optimizer_closure) - - # update discriminator every 2 steps - if optimizer_idx == 1: - if (batch_idx + 1) % 2 == 0: - # the closure (which includes the `training_step`) will be executed by `optimizer.step` - optimizer.step(closure=optimizer_closure) - else: - # call the closure by itself to run `training_step` + `backward` without an optimizer step - optimizer_closure() - - # ... - # add as many optimizers as you want - -Here we add a manual learning rate warm-up without an lr scheduler. - -.. testcode:: python - - # learning rate warm-up - def optimizer_step( - self, - epoch, - batch_idx, - optimizer, - optimizer_idx, - optimizer_closure, - on_tpu=False, - using_native_amp=False, - using_lbfgs=False, - ): - # update params - optimizer.step(closure=optimizer_closure) - - # skip the first 500 steps - if self.trainer.global_step < 500: - lr_scale = min(1.0, float(self.trainer.global_step + 1) / 500.0) - for pg in optimizer.param_groups: - pg["lr"] = lr_scale * self.hparams.learning_rate - - -Access your Own Optimizer -========================= - -The provided ``optimizer`` is a :class:`~pytorch_lightning.core.optimizer.LightningOptimizer` object wrapping your own optimizer -configured in your :meth:`~pytorch_lightning.core.lightning.LightningModule.configure_optimizers`. -You can access your own optimizer with ``optimizer.optimizer``. However, if you use your own optimizer -to perform a step, Lightning won't be able to support accelerators, precision and profiling for you. - -.. 
testcode:: python - - # function hook in LightningModule - def optimizer_step( - self, - epoch, - batch_idx, - optimizer, - optimizer_idx, - optimizer_closure, - on_tpu=False, - using_native_amp=False, - using_lbfgs=False, - ): - optimizer.step(closure=optimizer_closure) - - - # `optimizer` is a `LightningOptimizer` wrapping the optimizer. - # To access it, do the following. - # However, it won't work on TPU, AMP, etc... - def optimizer_step( - self, - epoch, - batch_idx, - optimizer, - optimizer_idx, - optimizer_closure, - on_tpu=False, - using_native_amp=False, - using_lbfgs=False, - ): - optimizer = optimizer.optimizer - optimizer.step(closure=optimizer_closure) - ------ - - -Bring your own Custom Learning Rate Schedulers -============================================== - -Lightning allows using custom learning rate schedulers that aren't available in `PyTorch natively `_. -One good example is `Timm Schedulers `_. When using custom learning rate schedulers -relying on a different API from Native PyTorch ones, you should override the :meth:`~pytorch_lightning.core.lightning.LightningModule.lr_scheduler_step` with your desired logic. -If you are using native PyTorch schedulers, there is no need to override this hook since Lightning will handle it automatically by default. - -.. code-block:: python - - from timm.scheduler import TanhLRScheduler - - - def configure_optimizers(self): - optimizer = ... - scheduler = TanhLRScheduler(optimizer, ...) - return [optimizer], [{"scheduler": scheduler, "interval": "epoch"}] - - - def lr_scheduler_step(self, scheduler, optimizer_idx, metric): - scheduler.step(epoch=self.current_epoch) # timm's scheduler need the epoch value - - -.. _configure_gradient_clipping: - -Configure Gradient Clipping -=========================== - -To configure custom gradient clipping, consider overriding -the :meth:`~pytorch_lightning.core.lightning.LightningModule.configure_gradient_clipping` method. 
-Attributes ``gradient_clip_val`` and ``gradient_clip_algorithm`` from Trainer will be passed in the -respective arguments here and Lightning will handle gradient clipping for you. In case you want to set -different values for your arguments of your choice and let Lightning handle the gradient clipping, you can -use the inbuilt :meth:`~pytorch_lightning.core.lightning.LightningModule.clip_gradients` method and pass -the arguments along with your optimizer. - -.. warning:: - Make sure to not override :meth:`~pytorch_lightning.core.lightning.LightningModule.clip_gradients` - method. If you want to customize gradient clipping, consider using - :meth:`~pytorch_lightning.core.lightning.LightningModule.configure_gradient_clipping` method. - -For example, here we will apply gradient clipping only to the gradients associated with optimizer A. - -.. testcode:: python - - def configure_gradient_clipping(self, optimizer, optimizer_idx, gradient_clip_val, gradient_clip_algorithm): - if optimizer_idx == 0: - # Lightning will handle the gradient clipping - self.clip_gradients( - optimizer, gradient_clip_val=gradient_clip_val, gradient_clip_algorithm=gradient_clip_algorithm - ) - -Here we configure gradient clipping differently for optimizer B. - -.. testcode:: python - - def configure_gradient_clipping(self, optimizer, optimizer_idx, gradient_clip_val, gradient_clip_algorithm): - if optimizer_idx == 0: - # Lightning will handle the gradient clipping - self.clip_gradients( - optimizer, gradient_clip_val=gradient_clip_val, gradient_clip_algorithm=gradient_clip_algorithm - ) - elif optimizer_idx == 1: - self.clip_gradients( - optimizer, gradient_clip_val=gradient_clip_val * 2, gradient_clip_algorithm=gradient_clip_algorithm - ) - - -Total Stepping Batches -====================== - -You can use built-in trainer property :paramref:`~pytorch_lightning.trainer.trainer.Trainer.estimated_stepping_batches` to compute -total number of stepping batches for the complete training. 
The property is computed taking the gradient accumulation factor and -distributed setting into consideration so you don't have to derive it manually. One good example where this can be helpful is when using the -:class:`~torch.optim.lr_scheduler.OneCycleLR` scheduler, which requires a pre-computed ``total_steps`` during initialization. - -.. code-block:: python - - def configure_optimizers(self): - optimizer = ... - scheduler = torch.optim.lr_scheduler.OneCycleLR( - optimizer, max_lr=1e-3, total_steps=self.trainer.estimated_stepping_batches - ) - return [optimizer], [scheduler] diff --git a/docs/_sources/common/precision.rst.txt b/docs/_sources/common/precision.rst.txt deleted file mode 100644 index 15fcdf0..0000000 --- a/docs/_sources/common/precision.rst.txt +++ /dev/null @@ -1,43 +0,0 @@ -:orphan: - -.. _precision: - -############### -N-Bit Precision -############### - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Basic - :description: Enable your models to train faster and save memory with different floating-point precision settings. - :col_css: col-md-4 - :button_link: precision_basic.html - :height: 150 - :tag: basic - -.. displayitem:: - :header: Intermediate - :description: Enable state-of-the-art scaling with advanced mix-precision settings. - :col_css: col-md-4 - :button_link: precision_intermediate.html - :height: 150 - :tag: intermediate - -.. displayitem:: - :header: Expert - :description: Create new precision techniques and enable them through Lightning. - :col_css: col-md-4 - :button_link: precision_expert.html - :height: 150 - :tag: expert - -.. raw:: html - -
-
diff --git a/docs/_sources/common/precision_basic.rst.txt b/docs/_sources/common/precision_basic.rst.txt deleted file mode 100644 index 3cc0b3a..0000000 --- a/docs/_sources/common/precision_basic.rst.txt +++ /dev/null @@ -1,92 +0,0 @@ -:orphan: - -.. _precision_basic: - -####################### -N-Bit Precision (Basic) -####################### -**Audience:** Users looking to train models faster and consume less memory. - ----- - -If you're looking to run models faster or consume less memory, consider tweaking the precision settings of your models. - -Lower precision, such as 16-bit floating-point, requires less memory and enables training and deploying larger models. -Higher precision, such as the 64-bit floating-point, can be used for highly sensitive use-cases. - ----- - -**************** -16-bit Precision -**************** - -Use 16-bit precision to cut your memory consumption in half so that you can train and deploy larger models. If your GPUs are [`Tensor Core `_] GPUs, you can also get a ~3x speed improvement. Half precision can sometimes lead to unstable training. - -.. code:: - - Trainer(precision=16) - ----- - -**************** -32-bit Precision -**************** - -32-bit precision is the default used across all models and research. This precision is known to be stable in contrast to lower precision settings. - -.. testcode:: - - Trainer(precision=32) - ----- - -**************** -64-bit Precision -**************** - -For certain scientific computations, 64-bit precision enables more accurate models. However, doubling the precision from 32 to 64 bit also doubles the memory requirements. - -.. testcode:: - - Trainer(precision=64) - -.. note:: - - Since memory is always a bottleneck in deep learning, especially when dealing with a large volume of data and limited resources, - it is recommended to use single precision for better speed. You can still use 64-bit precision if your particular use-case requires it.
- ----- - -******************************** -Precision support by accelerator -******************************** - -.. list-table:: Precision with Accelerators - :widths: 20 20 20 20 20 - :header-rows: 1 - - * - Precision - - CPU - - GPU - - TPU - - IPU - * - 16 - - No - - Yes - - No - - Yes - * - BFloat16 - - Yes - - Yes - - Yes - - No - * - 32 - - Yes - - Yes - - Yes - - Yes - * - 64 - - Yes - - Yes - - No - - No diff --git a/docs/_sources/common/precision_expert.rst.txt b/docs/_sources/common/precision_expert.rst.txt deleted file mode 100644 index 34bc955..0000000 --- a/docs/_sources/common/precision_expert.rst.txt +++ /dev/null @@ -1,28 +0,0 @@ -:orphan: - -.. _precision_expert: - -######################## -N-Bit Precision (Expert) -######################## -**Audience:** Researchers looking to integrate their new precision techniques into Lightning. - - -***************** -Precision Plugins -***************** - -You can also customize and pass your own Precision Plugin by subclassing the :class:`~pytorch_lightning.plugins.precision.precision_plugin.PrecisionPlugin` class. - -- Perform pre and post backward/optimizer step operations such as scaling gradients. -- Provide context managers for forward, training_step, etc. - -.. code-block:: python - - class CustomPrecisionPlugin(PrecisionPlugin): - precision = 16 - - ... - - - trainer = Trainer(plugins=[CustomPrecisionPlugin()]) diff --git a/docs/_sources/common/precision_intermediate.rst.txt b/docs/_sources/common/precision_intermediate.rst.txt deleted file mode 100644 index 9ed4c75..0000000 --- a/docs/_sources/common/precision_intermediate.rst.txt +++ /dev/null @@ -1,143 +0,0 @@ -:orphan: - -.. _precision_intermediate: - -############################## -N-Bit Precision (Intermediate) -############################## -**Audience:** Users looking to scale larger models or take advantage of optimized accelerators. - ----- - -************************ -What is Mixed Precision? 
-************************ - -PyTorch, like most deep learning frameworks, trains on 32-bit floating-point (FP32) arithmetic by default. However, many deep learning models do not require this to reach complete accuracy. By conducting -operations in half-precision format while keeping minimum information in single-precision to maintain as much information as possible in crucial areas of the network, mixed precision training delivers -significant computational speedup. Switching to mixed precision has resulted in considerable training speedups since the introduction of Tensor Cores in the Volta and Turing architectures. It combines -FP32 and lower-bit floating-points (such as FP16) to reduce memory footprint and increase performance during model training and evaluation. It accomplishes this by recognizing the steps that require -complete accuracy and employing a 32-bit floating-point for those steps only, while using a 16-bit floating-point for the rest. When compared to complete precision training, mixed precision training -delivers all of these benefits while ensuring that no task-specific accuracy is lost. [`2 `_]. - -.. note:: - - In some cases, it is essential to remain in FP32 for numerical stability, so keep this in mind when using mixed precision. - For example, when running scatter operations during the forward (such as torchpoint3d), computation must remain in FP32. - -.. warning:: - - Do not cast anything to other dtypes manually using ``torch.autocast`` or ``tensor.half()`` when using native precision because - this can bring instability. - - .. 
code-block:: python - - class LitModel(LightningModule): - def training_step(self, batch, batch_idx): - outs = self(batch) - - a_float32 = torch.rand((8, 8), device=self.device, dtype=self.dtype) - b_float32 = torch.rand((8, 4), device=self.device, dtype=self.dtype) - - # casting to float16 manually - with torch.autocast(device_type=self.device.type): - c_float16 = torch.mm(a_float32, b_float32) - target = self.layer(c_float16.flatten()[None]) - - # here outs is of type float32 and target is of type float16 - loss = torch.mm(target @ outs).float() - return loss - - - trainer = Trainer(accelerator="gpu", devices=1, precision=32) - ----- - -******************** -FP16 Mixed Precision -******************** - -In most cases, mixed precision uses FP16. Supported `PyTorch operations `__ automatically run in FP16, saving memory and improving throughput on the supported accelerators. - - -.. note:: - - When using TPUs, setting ``precision=16`` will enable bfloat16, the only supported half precision type on TPUs. - -.. testcode:: - :skipif: not torch.cuda.is_available() - - Trainer(accelerator="gpu", devices=1, precision=16) - - -PyTorch Native --------------- - -PyTorch 1.6 release introduced mixed precision functionality into their core as the AMP package, `torch.cuda.amp `__. It is more flexible and intuitive compared to `NVIDIA APEX `__. -Since computation happens in FP16, there is a chance of numerical instability during training. This is handled internally by a dynamic grad scaler which skips invalid steps and adjusts the scaler to ensure subsequent steps fall within a finite range. For more information `see the autocast docs `__. -Lightning uses native amp by default with ``precision=16|"bf16"``. You can also set it using: - -.. testcode:: - - Trainer(precision=16, amp_backend="native") - - -NVIDIA APEX ------------ - -.. warning:: - - We strongly recommend using the above native mixed precision rather than NVIDIA APEX unless you require more refined control. 
- -`NVIDIA APEX `__ offers additional flexibility in setting mixed precision. This can be useful when trying out different precision configurations, such as keeping most of your weights in FP16 and running computation in FP16. - -.. testcode:: - :skipif: not _APEX_AVAILABLE or not torch.cuda.is_available() - - Trainer(accelerator="gpu", devices=1, amp_backend="apex", precision=16) - -Set the `NVIDIA optimization level `__ via the trainer. - -.. testcode:: - :skipif: not _APEX_AVAILABLE or not torch.cuda.is_available() - - Trainer(accelerator="gpu", devices=1, amp_backend="apex", amp_level="O2", precision=16) - ----- - -************************ -BFloat16 Mixed Precision -************************ - -.. warning:: - - BFloat16 requires PyTorch 1.10 or later and is only supported with PyTorch Native AMP. - - BFloat16 is also experimental and may not provide significant speedups or memory improvements, but it offers better numerical stability. - - Do note for GPUs, the most significant benefits require `Ampere `__ based GPUs, such as A100s or 3090s. - -BFloat16 Mixed precision is similar to FP16 mixed precision, however, it maintains more of the "dynamic range" that FP32 offers. This means it can provide better numerical stability than FP16 mixed precision. For more information, see `this TPU performance blogpost `__. - -Under the hood, we use `torch.autocast `__ with the dtype set to ``bfloat16``, with no gradient scaling. - -.. testcode:: - :skipif: not _TORCH_GREATER_EQUAL_1_10 or not torch.cuda.is_available() - - Trainer(accelerator="gpu", devices=1, precision="bf16") - -It is also possible to use BFloat16 mixed precision on the CPU, relying on MKLDNN under the hood. - -.. testcode:: - :skipif: not _TORCH_GREATER_EQUAL_1_10 - - Trainer(precision="bf16") - ----- - -*************** -8-bit Optimizer -*************** - -It is possible to further reduce the precision using third-party libraries like `bitsandbytes `_.
Although -Lightning doesn't support it out of the box yet, you can still use it by configuring it in your LightningModule and setting ``Trainer(precision=32)``. diff --git a/docs/_sources/common/progress_bar.rst.txt b/docs/_sources/common/progress_bar.rst.txt deleted file mode 100644 index d00c716..0000000 --- a/docs/_sources/common/progress_bar.rst.txt +++ /dev/null @@ -1,138 +0,0 @@ -.. testsetup:: * - - from pytorch_lightning.trainer.trainer import Trainer - -.. _progress_bar: - - -Customize the progress bar -========================== - -Lightning supports two different types of progress bars (`tqdm `_ and `rich `_). :class:`~pytorch_lightning.callbacks.TQDMProgressBar` is used by default, -but you can override it by passing a custom :class:`~pytorch_lightning.callbacks.TQDMProgressBar` or :class:`~pytorch_lightning.callbacks.RichProgressBar` to the ``callbacks`` argument of the :class:`~pytorch_lightning.trainer.trainer.Trainer`. - -You could also use the :class:`~pytorch_lightning.callbacks.ProgressBarBase` class to implement your own progress bar. - -------------- - -TQDMProgressBar ---------------- - -The :class:`~pytorch_lightning.callbacks.TQDMProgressBar` uses the `tqdm `_ library internally and is the default progress bar used by Lightning. -It prints to ``stdout`` and shows up to four different bars: - -- **sanity check progress:** the progress during the sanity check run -- **main progress:** shows training + validation progress combined. It also accounts for multiple validation runs during training when :paramref:`~pytorch_lightning.trainer.trainer.Trainer.val_check_interval` is used. -- **validation progress:** only visible during validation; shows total progress over all validation datasets. -- **test progress:** only active when testing; shows total progress over all test datasets. - -For infinite datasets, the progress bar never ends.
- -You can update ``refresh_rate`` (rate (number of batches) at which the progress bar gets updated) for :class:`~pytorch_lightning.callbacks.TQDMProgressBar` by: - -.. code-block:: python - - from pytorch_lightning.callbacks import TQDMProgressBar - - trainer = Trainer(callbacks=[TQDMProgressBar(refresh_rate=10)]) - -If you want to customize the default :class:`~pytorch_lightning.callbacks.TQDMProgressBar` used by Lightning, you can override -specific methods of the callback class and pass your custom implementation to the :class:`~pytorch_lightning.trainer.trainer.Trainer`. - -.. code-block:: python - - class LitProgressBar(TQDMProgressBar): - def init_validation_tqdm(self): - bar = super().init_validation_tqdm() - bar.set_description("running validation...") - return bar - - - trainer = Trainer(callbacks=[LitProgressBar()]) - -.. seealso:: - - :class:`~pytorch_lightning.callbacks.TQDMProgressBar` docs. - - `tqdm library `__ - ----------------- - -RichProgressBar ---------------- - -`Rich `_ is a Python library for rich text and beautiful formatting in the terminal. -To use the :class:`~pytorch_lightning.callbacks.RichProgressBar` as your progress bar, first install the package: - -.. code-block:: bash - - pip install rich - -Then configure the callback and pass it to the :class:`~pytorch_lightning.trainer.trainer.Trainer`: - -.. code-block:: python - - from pytorch_lightning.callbacks import RichProgressBar - - trainer = Trainer(callbacks=[RichProgressBar()]) - -Customize the theme for your :class:`~pytorch_lightning.callbacks.RichProgressBar` like this: - -.. code-block:: python - - from pytorch_lightning.callbacks import RichProgressBar - from pytorch_lightning.callbacks.progress.rich_progress import RichProgressBarTheme - - # create your own theme!
- progress_bar = RichProgressBar( - theme=RichProgressBarTheme( - description="green_yellow", - progress_bar="green1", - progress_bar_finished="green1", - progress_bar_pulse="#6206E0", - batch_progress="green_yellow", - time="grey82", - processing_speed="grey82", - metrics="grey82", - ) - ) - - trainer = Trainer(callbacks=progress_bar) - -You can customize the components used within :class:`~pytorch_lightning.callbacks.RichProgressBar` with ease by overriding the -:func:`~pytorch_lightning.callbacks.RichProgressBar.configure_columns` method. - -.. code-block:: python - - from rich.progress import TextColumn - - custom_column = TextColumn("[progress.description]Custom Rich Progress Bar!") - - - class CustomRichProgressBar(RichProgressBar): - def configure_columns(self, trainer): - return [custom_column] - - - progress_bar = CustomRichProgressBar() - -If you wish for a new progress bar to be displayed at the end of every epoch, you should enable -:paramref:`RichProgressBar.leave ` by passing ``True`` - -.. code-block:: python - - from pytorch_lightning.callbacks import RichProgressBar - - trainer = Trainer(callbacks=[RichProgressBar(leave=True)]) - -.. seealso:: - - :class:`~pytorch_lightning.callbacks.RichProgressBar` docs. - - :class:`~pytorch_lightning.callbacks.RichModelSummary` docs to customize the model summary table. - - `Rich library `__. - - -.. note:: - - Progress bar is automatically enabled with the Trainer, and to disable it, one should do this: - - .. code-block:: python - - trainer = Trainer(enable_progress_bar=False) diff --git a/docs/_sources/common/remote_fs.rst.txt b/docs/_sources/common/remote_fs.rst.txt deleted file mode 100644 index 29a4fe7..0000000 --- a/docs/_sources/common/remote_fs.rst.txt +++ /dev/null @@ -1,57 +0,0 @@ -.. 
_remote_fs: - -################## -Remote Filesystems -################## - -PyTorch Lightning enables working with data from a variety of filesystems, including local filesystems and several cloud storage providers such as -`S3 `_ on `AWS `_, `GCS `_ on `Google Cloud `_, -or `ADL `_ on `Azure `_. - -This applies to saving and loading checkpoints, as well as for logging. -Working with different filesystems can be accomplished by prepending a protocol like "s3://" to file paths for writing and reading data. - -.. code-block:: python - - # `default_root_dir` is the default path used for logs and checkpoints - trainer = Trainer(default_root_dir="s3://my_bucket/data/") - trainer.fit(model) - -You could pass custom paths to loggers for logging data. - -.. code-block:: python - - from pytorch_lightning.loggers import TensorBoardLogger - - logger = TensorBoardLogger(save_dir="s3://my_bucket/logs/") - - trainer = Trainer(logger=logger) - trainer.fit(model) - -Additionally, you could also resume training with a checkpoint stored at a remote filesystem. - -.. code-block:: python - - trainer = Trainer(default_root_dir=tmpdir, max_steps=3) - trainer.fit(model, ckpt_path="s3://my_bucket/ckpts/classifier.ckpt") - -PyTorch Lightning uses `fsspec `_ internally to handle all filesystem operations. - -The most common filesystems supported by Lightning are: - -* Local filesystem: ``file://`` - It's the default and doesn't need any protocol to be used. It's installed by default in Lightning. -* Amazon S3: ``s3://`` - Amazon S3 remote binary store, using the library `s3fs `__. Run ``pip install fsspec[s3]`` to install it. -* Google Cloud Storage: ``gcs://`` or ``gs://`` - Google Cloud Storage, using `gcsfs `__. Run ``pip install fsspec[gcs]`` to install it. -* Microsoft Azure Storage: ``adl://``, ``abfs://`` or ``az://`` - Microsoft Azure Storage, using `adlfs `__. Run ``pip install fsspec[adl]`` to install it. -* Hadoop File System: ``hdfs://`` - Hadoop Distributed File System.
This uses `PyArrow `__ as the backend. Run ``pip install fsspec[hdfs]`` to install it. - -You could learn more about the available filesystems with: - -.. code-block:: python - - from fsspec.registry import known_implementations - - print(known_implementations) - - -You could also look into :ref:`CheckpointIO Plugin ` for more details on how to customize saving and loading checkpoints. diff --git a/docs/_sources/common/trainer.rst.txt b/docs/_sources/common/trainer.rst.txt deleted file mode 100644 index 848ac8a..0000000 --- a/docs/_sources/common/trainer.rst.txt +++ /dev/null @@ -1,1832 +0,0 @@ -.. role:: hidden - :class: hidden-section - -.. testsetup:: * - - import os - from pytorch_lightning.trainer.trainer import Trainer - from pytorch_lightning.core.lightning import LightningModule - from pytorch_lightning.utilities.seed import seed_everything - -.. _trainer: - -Trainer -======= - -Once you've organized your PyTorch code into a LightningModule, -the Trainer automates everything else. - -.. raw:: html - - - -| - -This abstraction achieves the following: - -1. You maintain control over all aspects via PyTorch code without an added abstraction. - -2. The trainer uses best practices embedded by contributors and users - from top AI labs such as Facebook AI Research, NYU, MIT, Stanford, etc... - -3. The trainer allows overriding any key part that you don't want automated. - -| - ------------ - -Basic use ---------- - -This is the basic use of the trainer: - -.. 
code-block:: python - - model = MyLightningModule() - - trainer = Trainer() - trainer.fit(model, train_dataloader, val_dataloader) - --------- - -Under the hood --------------- -Under the hood, the Lightning Trainer handles the training loop details for you, some examples include: - -- Automatically enabling/disabling grads -- Running the training, validation and test dataloaders -- Calling the Callbacks at the appropriate times -- Putting batches and computations on the correct devices - -Here's the pseudocode for what the trainer does under the hood (showing the train loop only) - -.. code-block:: python - - # put model in train mode - model.train() - torch.set_grad_enabled(True) - - losses = [] - for batch in train_dataloader: - # calls hooks like this one - on_train_batch_start() - - # train step - loss = training_step(batch) - - # clear gradients - optimizer.zero_grad() - - # backward - loss.backward() - - # update parameters - optimizer.step() - - losses.append(loss) - - --------- - -Trainer in Python scripts -------------------------- -In Python scripts, it's recommended you use a main function to call the Trainer. - -.. code-block:: python - - from argparse import ArgumentParser - - - def main(hparams): - model = LightningModule() - trainer = Trainer(accelerator=hparams.accelerator, devices=hparams.devices) - trainer.fit(model) - - - if __name__ == "__main__": - parser = ArgumentParser() - parser.add_argument("--accelerator", default=None) - parser.add_argument("--devices", default=None) - args = parser.parse_args() - - main(args) - -So you can run it like so: - -.. code-block:: bash - - python main.py --accelerator 'gpu' --devices 2 - -.. note:: - - Pro-tip: You don't need to define all flags manually. Lightning can add them automatically - -.. 
code-block:: python - - from argparse import ArgumentParser - - - def main(args): - model = LightningModule() - trainer = Trainer.from_argparse_args(args) - trainer.fit(model) - - - if __name__ == "__main__": - parser = ArgumentParser() - parser = Trainer.add_argparse_args(parser) - args = parser.parse_args() - - main(args) - -So you can run it like so: - -.. code-block:: bash - - python main.py --accelerator 'gpu' --devices 2 --max_steps 10 --limit_train_batches 10 --any_trainer_arg x - -.. note:: - If you want to stop a training run early, you can press "Ctrl + C" on your keyboard. - The trainer will catch the ``KeyboardInterrupt`` and attempt a graceful shutdown, including - running accelerator callback ``on_train_end`` to clean up memory. The trainer object will also set - an attribute ``interrupted`` to ``True`` in such cases. If you have a callback which shuts down compute - resources, for example, you can conditionally run the shutdown logic for only uninterrupted runs. - ------------- - -Validation ----------- -You can perform an evaluation epoch over the validation set, outside of the training loop, -using :meth:`~pytorch_lightning.trainer.trainer.Trainer.validate`. This might be -useful if you want to collect new metrics from a model right at its initialization -or after it has already been trained. - -.. code-block:: python - - trainer.validate(dataloaders=val_dataloaders) - ------------- - -Testing -------- -Once you're done training, feel free to run the test set! -(Only right before publishing your paper or pushing to production) - -.. code-block:: python - - trainer.test(dataloaders=test_dataloaders) - ------------- - -Reproducibility ---------------- - -To ensure full reproducibility from run to run you need to set seeds for pseudo-random generators, -and set ``deterministic`` flag in ``Trainer``. 
- -Example:: - - from pytorch_lightning import Trainer, seed_everything - - seed_everything(42, workers=True) - # sets seeds for numpy, torch and python.random. - model = Model() - trainer = Trainer(deterministic=True) - - -By setting ``workers=True`` in :func:`~pytorch_lightning.utilities.seed.seed_everything`, Lightning derives -unique seeds across all dataloader workers and processes for :mod:`torch`, :mod:`numpy` and stdlib -:mod:`random` number generators. When turned on, it ensures that e.g. data augmentations are not repeated across workers. - -------- - -.. _trainer_flags: - -Trainer flags -------------- - -accelerator -^^^^^^^^^^^ - -Supports passing different accelerator types (``"cpu", "gpu", "tpu", "ipu", "auto"``) -as well as custom accelerator instances. - -.. code-block:: python - - # CPU accelerator - trainer = Trainer(accelerator="cpu") - - # Training with GPU Accelerator using 2 GPUs - trainer = Trainer(devices=2, accelerator="gpu") - - # Training with TPU Accelerator using 8 tpu cores - trainer = Trainer(devices=8, accelerator="tpu") - - # Training with GPU Accelerator using the DistributedDataParallel strategy - trainer = Trainer(devices=4, accelerator="gpu", strategy="ddp") - -.. note:: The ``"auto"`` option recognizes the machine you are on, and selects the respective ``Accelerator``. - -.. code-block:: python - - # If your machine has GPUs, it will use the GPU Accelerator for training - trainer = Trainer(devices=2, accelerator="auto") - -You can also modify hardware behavior by subclassing an existing accelerator to adjust for your needs. - -Example:: - - class MyOwnAcc(CPUAccelerator): - ... - - Trainer(accelerator=MyOwnAcc()) - -.. note:: - - If the ``devices`` flag is not defined, it will assume ``devices`` to be ``"auto"`` and fetch the ``auto_device_count`` - from the accelerator. - - .. 
code-block:: python - - # This is part of the built-in `GPUAccelerator` - class GPUAccelerator(Accelerator): - """Accelerator for GPU devices.""" - - @staticmethod - def auto_device_count() -> int: - """Get the devices when set to auto.""" - return torch.cuda.device_count() - - - # Training with GPU Accelerator using total number of gpus available on the system - Trainer(accelerator="gpu") - -.. warning:: Passing training strategies (e.g., ``"ddp"``) to ``accelerator`` has been deprecated in v1.5.0 - and will be removed in v1.7.0. Please use the ``strategy`` argument instead. - -accumulate_grad_batches -^^^^^^^^^^^^^^^^^^^^^^^ - -.. raw:: html - - - -| - -Accumulates grads every k batches or as set up in the dict. -Trainer also calls ``optimizer.step()`` for the last indivisible step number. - -.. testcode:: - - # default used by the Trainer (no accumulation) - trainer = Trainer(accumulate_grad_batches=1) - -Example:: - - # accumulate every 4 batches (effective batch size is batch*4) - trainer = Trainer(accumulate_grad_batches=4) - - # no accumulation for epochs 1-4. accumulate 3 for epochs 5-10. accumulate 20 after that - trainer = Trainer(accumulate_grad_batches={5: 3, 10: 20}) - -amp_backend -^^^^^^^^^^^ - -.. raw:: html - - - -| - -Use PyTorch AMP ('native'), or NVIDIA apex ('apex'). - -.. testcode:: - - # using PyTorch built-in AMP, default used by the Trainer - trainer = Trainer(amp_backend="native") - - # using NVIDIA Apex - trainer = Trainer(amp_backend="apex") - -amp_level -^^^^^^^^^ - -.. raw:: html - - - -| - -The optimization level to use (O1, O2, etc...) -for 16-bit GPU precision (using NVIDIA apex under the hood). - -Check `NVIDIA apex docs `_ for level - -Example:: - - # default used by the Trainer - trainer = Trainer(amp_level='O2') - -auto_scale_batch_size -^^^^^^^^^^^^^^^^^^^^^ - -.. raw:: html - - - -| - -Automatically tries to find the largest batch size that fits into memory, -before any training. - -.. 
code-block:: python - - # default used by the Trainer (no scaling of batch size) - trainer = Trainer(auto_scale_batch_size=None) - - # run batch size scaling, result overrides hparams.batch_size - trainer = Trainer(auto_scale_batch_size="binsearch") - - # call tune to find the batch size - trainer.tune(model) - -auto_select_gpus -^^^^^^^^^^^^^^^^ - -.. raw:: html - - - -| - -If enabled and ``devices`` is an integer, pick available GPUs automatically. -This is especially useful when GPUs are configured to be in "exclusive mode", -such that only one process at a time can access them. - -Example:: - - # no auto selection (picks first 2 GPUs on system, may fail if other process is occupying) - trainer = Trainer(accelerator="gpu", devices=2, auto_select_gpus=False) - - # enable auto selection (will find two available GPUs on system) - trainer = Trainer(accelerator="gpu", devices=2, auto_select_gpus=True) - - # specifies all GPUs regardless of its availability - Trainer(accelerator="gpu", devices=-1, auto_select_gpus=False) - - # specifies all available GPUs (if only one GPU is not occupied, uses one gpu) - Trainer(accelerator="gpu", devices=-1, auto_select_gpus=True) - -auto_lr_find -^^^^^^^^^^^^ - -.. raw:: html - - - -| - -Runs a learning rate finder algorithm (see this `paper `_) -when calling trainer.tune(), to find optimal initial learning rate. - -.. code-block:: python - - # default used by the Trainer (no learning rate finder) - trainer = Trainer(auto_lr_find=False) - -Example:: - - # run learning rate finder, results override hparams.learning_rate - trainer = Trainer(auto_lr_find=True) - - # call tune to find the lr - trainer.tune(model) - -Example:: - - # run learning rate finder, results override hparams.my_lr_arg - trainer = Trainer(auto_lr_find='my_lr_arg') - - # call tune to find the lr - trainer.tune(model) - -.. note:: - See the :ref:`learning rate finder guide `. - -benchmark -^^^^^^^^^ - -.. 
raw:: html - - - -| - -Defaults to ``True`` if :paramref:`~pytorch_lightning.trainer.Trainer.deterministic` is not set. -This flag sets the ``torch.backends.cudnn.benchmark`` flag. You can read more about its impact -`here `__ - -This is likely to increase the speed of your system if your input sizes don't change. However, if they do, then it -might make your system slower. The CUDNN auto-tuner will try to find the best algorithm for the hardware when a new -input size is encountered. Read more about it `here `__. - -Example:: - - # defaults to True if not deterministic (which is False by default) - trainer = Trainer() - - # you can overwrite the value - trainer = Trainer(benchmark=False) - -deterministic -^^^^^^^^^^^^^ - -.. raw:: html - - - -| - -This flag sets the ``torch.backends.cudnn.deterministic`` flag. -Might make your system slower, but ensures reproducibility. -Also sets ``$HOROVOD_FUSION_THRESHOLD=0``. - -For more info check `PyTorch docs `_. - -Example:: - - # default used by the Trainer - trainer = Trainer(deterministic=False) - -callbacks -^^^^^^^^^ - -.. raw:: html - - - -| - -Add a list of :class:`~pytorch_lightning.callbacks.Callback`. Callbacks run sequentially in the order defined here -with the exception of :class:`~pytorch_lightning.callbacks.model_checkpoint.ModelCheckpoint` callbacks which run -after all others to ensure all states are saved to the checkpoints. - -.. code-block:: python - - # a list of callbacks - callbacks = [PrintCallback()] - trainer = Trainer(callbacks=callbacks) - -Example:: - - from pytorch_lightning.callbacks import Callback - - class PrintCallback(Callback): - def on_train_start(self, trainer, pl_module): - print("Training is started!") - def on_train_end(self, trainer, pl_module): - print("Training is done.") - - -Model-specific callbacks can also be added inside the ``LightningModule`` through -:meth:`~pytorch_lightning.core.lightning.LightningModule.configure_callbacks`. 
-Callbacks returned in this hook will extend the list initially given to the ``Trainer`` argument, and replace -the trainer callbacks should there be two or more of the same type. -:class:`~pytorch_lightning.callbacks.model_checkpoint.ModelCheckpoint` callbacks always run last. - - -check_val_every_n_epoch -^^^^^^^^^^^^^^^^^^^^^^^ - -.. raw:: html - - - -| - -Check val every n train epochs. - -Example:: - - # default used by the Trainer - trainer = Trainer(check_val_every_n_epoch=1) - - # run val loop every 10 training epochs - trainer = Trainer(check_val_every_n_epoch=10) - -checkpoint_callback -^^^^^^^^^^^^^^^^^^^ - -.. warning:: `checkpoint_callback` has been deprecated in v1.5 and will be removed in v1.7. - To disable checkpointing, pass ``enable_checkpointing = False`` to the Trainer instead. - - -default_root_dir -^^^^^^^^^^^^^^^^ - -.. raw:: html - - - -| - -Default path for logs and weights when no logger or -:class:`pytorch_lightning.callbacks.ModelCheckpoint` callback passed. On -certain clusters you might want to separate where logs and checkpoints are -stored. If you don't then use this argument for convenience. Paths can be local -paths or remote paths such as `s3://bucket/path` or 'hdfs://path/'. Credentials -will need to be set up to use remote filepaths. - -.. testcode:: - - # default used by the Trainer - trainer = Trainer(default_root_dir=os.getcwd()) - -devices -^^^^^^^ - -Number of devices to train on (``int``), which devices to train on (``list`` or ``str``), or ``"auto"``. -It will be mapped to either ``gpus``, ``tpu_cores``, ``num_processes`` or ``ipus``, -based on the accelerator type (``"cpu", "gpu", "tpu", "ipu", "auto"``). - -.. 
code-block:: python - - # Training with CPU Accelerator using 2 processes - trainer = Trainer(devices=2, accelerator="cpu") - - # Training with GPU Accelerator using GPUs 1 and 3 - trainer = Trainer(devices=[1, 3], accelerator="gpu") - - # Training with TPU Accelerator using 8 tpu cores - trainer = Trainer(devices=8, accelerator="tpu") - -.. tip:: The ``"auto"`` option recognizes the devices to train on, depending on the ``Accelerator`` being used. - -.. code-block:: python - - # If your machine has GPUs, it will use all the available GPUs for training - trainer = Trainer(devices="auto", accelerator="auto") - - # Training with CPU Accelerator using 1 process - trainer = Trainer(devices="auto", accelerator="cpu") - - # Training with TPU Accelerator using 8 tpu cores - trainer = Trainer(devices="auto", accelerator="tpu") - - # Training with IPU Accelerator using 4 ipus - trainer = Trainer(devices="auto", accelerator="ipu") - -.. note:: - - If the ``devices`` flag is not defined, it will assume ``devices`` to be ``"auto"`` and fetch the ``auto_device_count`` - from the accelerator. - - .. code-block:: python - - # This is part of the built-in `GPUAccelerator` - class GPUAccelerator(Accelerator): - """Accelerator for GPU devices.""" - - @staticmethod - def auto_device_count() -> int: - """Get the devices when set to auto.""" - return torch.cuda.device_count() - - - # Training with GPU Accelerator using total number of gpus available on the system - Trainer(accelerator="gpu") - -enable_checkpointing -^^^^^^^^^^^^^^^^^^^^ - -.. raw:: html - - - -| - -By default Lightning saves a checkpoint for you in your current working directory, with the state of your last training epoch, -Checkpoints capture the exact value of all parameters used by a model. -To disable automatic checkpointing, set this to `False`. - -.. 
code-block:: python - - # default used by Trainer, saves the most recent model to a single checkpoint after each epoch - trainer = Trainer(enable_checkpointing=True) - - # turn off automatic checkpointing - trainer = Trainer(enable_checkpointing=False) - - -You can override the default behavior by initializing the :class:`~pytorch_lightning.callbacks.ModelCheckpoint` -callback, and adding it to the :paramref:`~pytorch_lightning.trainer.trainer.Trainer.callbacks` list. -See :doc:`Saving and Loading Checkpoints <../common/checkpointing>` for how to customize checkpointing. - -.. testcode:: - - from pytorch_lightning.callbacks import ModelCheckpoint - - # Init ModelCheckpoint callback, monitoring 'val_loss' - checkpoint_callback = ModelCheckpoint(monitor="val_loss") - - # Add your callback to the callbacks list - trainer = Trainer(callbacks=[checkpoint_callback]) - -fast_dev_run -^^^^^^^^^^^^ - -.. raw:: html - - - -| - -Runs n if set to ``n`` (int) else 1 if set to ``True`` batch(es) of train, val and test -to find any bugs (ie: a sort of unit test). - -Under the hood the pseudocode looks like this when running *fast_dev_run* with a single batch: - -.. code-block:: python - - # loading - __init__() - prepare_data - - # test training step - training_batch = next(train_dataloader) - training_step(training_batch) - - # test val step - val_batch = next(val_dataloader) - out = validation_step(val_batch) - validation_epoch_end([out]) - -.. testcode:: - - # default used by the Trainer - trainer = Trainer(fast_dev_run=False) - - # runs 1 train, val, test batch and program ends - trainer = Trainer(fast_dev_run=True) - - # runs 7 train, val, test batches and program ends - trainer = Trainer(fast_dev_run=7) - -.. note:: - - This argument is a bit different from ``limit_train/val/test_batches``. Setting this argument will - disable tuner, checkpoint callbacks, early stopping callbacks, loggers and logger callbacks like - ``LearningRateLogger`` and runs for only 1 epoch. 
This must be used only for debugging purposes. - ``limit_train/val/test_batches`` only limits the number of batches and won't disable anything. - -flush_logs_every_n_steps -^^^^^^^^^^^^^^^^^^^^^^^^ - -.. warning:: ``flush_logs_every_n_steps`` has been deprecated in v1.5 and will be removed in v1.7. - Please configure flushing directly in the logger instead. - -.. raw:: html - - - -| - -Writes logs to disk this often. - -.. testcode:: - - # default used by the Trainer - trainer = Trainer(flush_logs_every_n_steps=100) - -See Also: - - :doc:`logging <../extensions/logging>` - -.. _gpus: - -gpus -^^^^ - -.. warning:: ``gpus=x`` has been deprecated in v1.7 and will be removed in v2.0. - Please use ``accelerator='gpu'`` and ``devices=x`` instead. - -.. raw:: html - - - -| - -- Number of GPUs to train on (int) -- or which GPUs to train on (list) -- can handle strings - -.. testcode:: - - # default used by the Trainer (ie: train on CPU) - trainer = Trainer(gpus=None) - - # equivalent - trainer = Trainer(gpus=0) - -Example:: - - # int: train on 2 gpus - trainer = Trainer(gpus=2) - - # list: train on GPUs 1, 4 (by bus ordering) - trainer = Trainer(gpus=[1, 4]) - trainer = Trainer(gpus='1, 4') # equivalent - - # -1: train on all gpus - trainer = Trainer(gpus=-1) - trainer = Trainer(gpus='-1') # equivalent - - # combine with num_nodes to train on multiple GPUs across nodes - # uses 8 gpus in total - trainer = Trainer(gpus=2, num_nodes=4) - - # train only on GPUs 1 and 4 across nodes - trainer = Trainer(gpus=[1, 4], num_nodes=4) - -See Also: - - :ref:`Multi GPU Training ` - -gradient_clip_val -^^^^^^^^^^^^^^^^^ - -.. raw:: html - - - -| - -Gradient clipping value - -- 0 means don't clip. - -.. testcode:: - - # default used by the Trainer - trainer = Trainer(gradient_clip_val=0.0) - -limit_train_batches -^^^^^^^^^^^^^^^^^^^ - -.. raw:: html - - - -| - -How much of training dataset to check. -Useful when debugging or testing something that happens at the end of an epoch. - -.. 
testcode:: - - # default used by the Trainer - trainer = Trainer(limit_train_batches=1.0) - -Example:: - - # default used by the Trainer - trainer = Trainer(limit_train_batches=1.0) - - # run through only 25% of the training set each epoch - trainer = Trainer(limit_train_batches=0.25) - - # run through only 10 batches of the training set each epoch - trainer = Trainer(limit_train_batches=10) - -limit_test_batches -^^^^^^^^^^^^^^^^^^ - -.. raw:: html - - - -| - -How much of test dataset to check. - -.. testcode:: - - # default used by the Trainer - trainer = Trainer(limit_test_batches=1.0) - - # run through only 25% of the test set each epoch - trainer = Trainer(limit_test_batches=0.25) - - # run for only 10 batches - trainer = Trainer(limit_test_batches=10) - -In the case of multiple test dataloaders, the limit applies to each dataloader individually. - -limit_val_batches -^^^^^^^^^^^^^^^^^ - -.. raw:: html - - - -| - -How much of validation dataset to check. -Useful when debugging or testing something that happens at the end of an epoch. - -.. testcode:: - - # default used by the Trainer - trainer = Trainer(limit_val_batches=1.0) - - # run through only 25% of the validation set each epoch - trainer = Trainer(limit_val_batches=0.25) - - # run for only 10 batches - trainer = Trainer(limit_val_batches=10) - -In the case of multiple validation dataloaders, the limit applies to each dataloader individually. - -log_every_n_steps -^^^^^^^^^^^^^^^^^ - -.. raw:: html - - - -| - - -How often to add logging rows (does not write to disk) - -.. testcode:: - - # default used by the Trainer - trainer = Trainer(log_every_n_steps=50) - -See Also: - - :doc:`logging <../extensions/logging>` - -logger -^^^^^^ - -.. raw:: html - - - -| - -:doc:`Logger <../visualize/loggers>` (or iterable collection of loggers) for experiment tracking. A ``True`` value uses the default ``TensorBoardLogger`` shown below. ``False`` will disable logging. - -.. 
testcode:: - - from pytorch_lightning.loggers import TensorBoardLogger - - # default logger used by trainer - logger = TensorBoardLogger(save_dir=os.getcwd(), version=1, name="lightning_logs") - Trainer(logger=logger) - -max_epochs -^^^^^^^^^^ - -.. raw:: html - - - -| - -Stop training once this number of epochs is reached - -.. testcode:: - - # default used by the Trainer - trainer = Trainer(max_epochs=1000) - -If both ``max_epochs`` and ``max_steps`` aren't specified, ``max_epochs`` will default to ``1000``. -To enable infinite training, set ``max_epochs = -1``. - -min_epochs -^^^^^^^^^^ - -.. raw:: html - - - -| - -Force training for at least this many epochs - -.. testcode:: - - # default used by the Trainer - trainer = Trainer(min_epochs=1) - -max_steps -^^^^^^^^^ - -.. raw:: html - - - -| - -Stop training after this number of :ref:`global steps `. -Training will stop when either ``max_steps`` or ``max_epochs`` is reached, whichever comes first. - -.. testcode:: - - # Default (disabled) - trainer = Trainer(max_steps=None) - - # Stop after 100 steps - trainer = Trainer(max_steps=100) - -If ``max_steps`` is not specified, ``max_epochs`` will be used instead (and ``max_epochs`` defaults to -``1000`` if ``max_epochs`` is not specified). To disable this default, set ``max_steps = -1``. - -min_steps -^^^^^^^^^ - -.. raw:: html - - - -| - -Force training for at least this number of :ref:`global steps `. -The Trainer will train the model for at least ``min_steps`` or ``min_epochs``, whichever is reached later. - -.. testcode:: - - # Default (disabled) - trainer = Trainer(min_steps=None) - - # Run at least for 100 steps (disable min_epochs) - trainer = Trainer(min_steps=100, min_epochs=0) - -max_time -^^^^^^^^ - -Set the maximum amount of time for training. Training will get interrupted mid-epoch. -For customizable options use the :class:`~pytorch_lightning.callbacks.timer.Timer` callback. - -.. 
testcode:: - - # Default (disabled) - trainer = Trainer(max_time=None) - - # Stop after 12 hours of training or when reaching 10 epochs (string) - trainer = Trainer(max_time="00:12:00:00", max_epochs=10) - - # Stop after 1 day and 5 hours (dict) - trainer = Trainer(max_time={"days": 1, "hours": 5}) - -In case ``max_time`` is used together with ``min_steps`` or ``min_epochs``, the ``min_*`` requirement -always has precedence. - -num_nodes -^^^^^^^^^ - -.. raw:: html - - - -| - -Number of GPU nodes for distributed training. - -.. testcode:: - - # default used by the Trainer - trainer = Trainer(num_nodes=1) - - # to train on 8 nodes - trainer = Trainer(num_nodes=8) - -num_processes -^^^^^^^^^^^^^ - -.. warning:: ``num_processes=x`` has been deprecated in v1.7 and will be removed in v2.0. - Please use ``accelerator='cpu'`` and ``devices=x`` instead. - -.. raw:: html - - - -| - -Number of processes to train with. Automatically set to the number of GPUs -when using ``strategy="ddp"``. Set to a number greater than 1 when -using ``accelerator="cpu"`` and ``strategy="ddp"`` to mimic distributed training on a -machine without GPUs. This is useful for debugging, but **will not** provide -any speedup, since single-process Torch already makes efficient use of multiple -CPUs. While it would typically spawn subprocesses for training, setting -``num_nodes > 1`` and keeping ``num_processes = 1`` runs training in the main -process. - -.. testcode:: - - # Simulate DDP for debugging on your GPU-less laptop - trainer = Trainer(accelerator="cpu", strategy="ddp", num_processes=2) - -num_sanity_val_steps -^^^^^^^^^^^^^^^^^^^^ - -.. raw:: html - - - -| - -Sanity check runs n batches of val before starting the training routine. -This catches any bugs in your validation without having to wait for the first validation check. -The Trainer uses 2 steps by default. Turn it off or modify it here. - -.. 
testcode:: - - # default used by the Trainer - trainer = Trainer(num_sanity_val_steps=2) - - # turn it off - trainer = Trainer(num_sanity_val_steps=0) - - # check all validation data - trainer = Trainer(num_sanity_val_steps=-1) - - -This option will reset the validation dataloader unless ``num_sanity_val_steps=0``. - -overfit_batches -^^^^^^^^^^^^^^^ - -.. raw:: html - - - -| - -Uses this much data of the training & validation set. -If the training & validation dataloaders have ``shuffle=True``, Lightning will automatically disable it. - -Useful for quickly debugging or trying to overfit on purpose. - -.. testcode:: - - # default used by the Trainer - trainer = Trainer(overfit_batches=0.0) - - # use only 1% of the train & val set - trainer = Trainer(overfit_batches=0.01) - - # overfit on 10 of the same batches - trainer = Trainer(overfit_batches=10) - -plugins -^^^^^^^ - -.. raw:: html - - - -| - -:ref:`Plugins` allow you to connect arbitrary backends, precision libraries, clusters etc. For example: - -- :ref:`Checkpoint IO ` -- `TorchElastic `_ -- :ref:`Precision Plugins ` - -To define your own behavior, subclass the relevant class and pass it in. Here's an example linking up your own -:class:`~pytorch_lightning.plugins.environments.ClusterEnvironment`. - -.. code-block:: python - - from pytorch_lightning.plugins.environments import ClusterEnvironment - - - class MyCluster(ClusterEnvironment): - def main_address(self): - return your_main_address - - def main_port(self): - return your_main_port - - def world_size(self): - return the_world_size - - - trainer = Trainer(plugins=[MyCluster()], ...) - -precision -^^^^^^^^^ - -.. raw:: html - - - -| - -Lightning supports either double (64), float (32), bfloat16 (bf16), or half (16) precision training. - -Half precision, or mixed precision, is the combined use of 32 and 16 bit floating points to reduce memory footprint during model training. This can result in improved performance, achieving +3X speedups on modern GPUs. 
- -.. testcode:: - :skipif: not torch.cuda.is_available() - - # default used by the Trainer - trainer = Trainer(precision=32) - - # 16-bit precision - trainer = Trainer(precision=16, accelerator="gpu", devices=1) # works only on CUDA - - # bfloat16 precision - trainer = Trainer(precision="bf16") - - # 64-bit precision - trainer = Trainer(precision=64) - - -.. note:: When running on TPUs, torch.bfloat16 will be used but tensor printing will still show torch.float32. - -.. admonition:: If you are interested in using Apex 16-bit training: - :class: dropdown - - NVIDIA Apex and DDP have instability problems. We recommend using the native AMP for 16-bit precision with multiple GPUs. - To use Apex 16-bit training: - - 1. `Install apex. `__ - - 2. Set the ``precision`` trainer flag to 16. You can customize the `Apex optimization level `_ by setting the `amp_level` flag. - - .. testcode:: - :skipif: not _APEX_AVAILABLE or not torch.cuda.is_available() - - # turn on 16-bit - trainer = Trainer(amp_backend="apex", amp_level="O2", precision=16, accelerator="gpu", devices=1) - - -process_position -^^^^^^^^^^^^^^^^ - -.. warning:: ``process_position`` has been deprecated in v1.5 and will be removed in v1.7. - Please pass :class:`~pytorch_lightning.callbacks.progress.TQDMProgressBar` with ``process_position`` - directly to the Trainer's ``callbacks`` argument instead. - -.. raw:: html - - - -| - -Orders the progress bar. Useful when running multiple trainers on the same node. - -.. testcode:: - - # default used by the Trainer - trainer = Trainer(process_position=0) - -.. note:: This argument is ignored if a custom callback is passed to :paramref:`~Trainer.callbacks`. - -profiler -^^^^^^^^ - -.. raw:: html - - - -| - -To profile individual steps during training and assist in identifying bottlenecks. - -See the :doc:`profiler documentation <../tuning/profiler>`. for more details. - -.. 
testcode:: - - from pytorch_lightning.profiler import SimpleProfiler, AdvancedProfiler - - # default used by the Trainer - trainer = Trainer(profiler=None) - - # to profile standard training events, equivalent to `profiler=SimpleProfiler()` - trainer = Trainer(profiler="simple") - - # advanced profiler for function-level stats, equivalent to `profiler=AdvancedProfiler()` - trainer = Trainer(profiler="advanced") - -enable_progress_bar -^^^^^^^^^^^^^^^^^^^ - -Whether to enable or disable the progress bar. Defaults to True. - -.. testcode:: - - # default used by the Trainer - trainer = Trainer(enable_progress_bar=True) - - # disable progress bar - trainer = Trainer(enable_progress_bar=False) - -reload_dataloaders_every_n_epochs -^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ - -.. raw:: html - - - -| - -Set to a positive integer to reload dataloaders every n epochs. - -.. code-block:: python - - # if 0 (default) - train_loader = model.train_dataloader() - for epoch in epochs: - for batch in train_loader: - ... - - # if a positive integer - for epoch in epochs: - if not epoch % reload_dataloaders_every_n_epochs: - train_loader = model.train_dataloader() - for batch in train_loader: - ... - -.. _replace-sampler-ddp: - -replace_sampler_ddp -^^^^^^^^^^^^^^^^^^^ - -.. raw:: html - - - -| - -Enables auto adding of :class:`~torch.utils.data.distributed.DistributedSampler`. In PyTorch, you must use it in -distributed settings such as TPUs or multi-node. The sampler makes sure each GPU sees the appropriate part of your data. -By default it will add ``shuffle=True`` for train sampler and ``shuffle=False`` for val/test sampler. -If you want to customize it, you can set ``replace_sampler_ddp=False`` and add your own distributed sampler. -If ``replace_sampler_ddp=True`` and a distributed sampler was already added, -Lightning will not replace the existing one. - -.. 
testcode:: - - # default used by the Trainer - trainer = Trainer(replace_sampler_ddp=True) - -By setting to False, you have to add your own distributed sampler: - -.. code-block:: python - - # in your LightningModule or LightningDataModule - def train_dataloader(self): - # default used by the Trainer - sampler = torch.utils.data.distributed.DistributedSampler(dataset, shuffle=True) - dataloader = DataLoader(dataset, batch_size=32, sampler=sampler) - return dataloader - -.. note:: For iterable datasets, we don't do this automatically. - -resume_from_checkpoint -^^^^^^^^^^^^^^^^^^^^^^ - -.. warning:: ``resume_from_checkpoint`` is deprecated in v1.5 and will be removed in v2.0. - Please pass ``trainer.fit(ckpt_path="some/path/to/my_checkpoint.ckpt")`` instead. - - -.. raw:: html - - - -| - -To resume training from a specific checkpoint pass in the path here. If resuming from a mid-epoch -checkpoint, training will start from the beginning of the next epoch. - -.. testcode:: - - # default used by the Trainer - trainer = Trainer(resume_from_checkpoint=None) - - # resume from a specific checkpoint - trainer = Trainer(resume_from_checkpoint="some/path/to/my_checkpoint.ckpt") - -strategy -^^^^^^^^ - -Supports passing different training strategies with aliases (ddp, ddp_spawn, etc) as well as custom strategies. - -.. code-block:: python - - # Training with the DistributedDataParallel strategy on 4 GPUs - trainer = Trainer(strategy="ddp", accelerator="gpu", devices=4) - - # Training with the DDP Spawn strategy using 4 cpu processes - trainer = Trainer(strategy="ddp_spawn", accelerator="cpu", devices=4) - -.. note:: Additionally, you can pass your custom strategy to the ``strategy`` argument. - -.. 
code-block:: python - - from pytorch_lightning.strategies import DDPStrategy - - - class CustomDDPStrategy(DDPStrategy): - def configure_ddp(self): - self._model = MyCustomDistributedDataParallel( - self.model, - device_ids=..., - ) - - - trainer = Trainer(strategy=CustomDDPStrategy(), accelerator="gpu", devices=2) - -See Also: - - :ref:`Multi GPU Training `. - - :doc:`Model Parallel GPU training guide <../advanced/model_parallel>`. - - :doc:`TPU training guide <../accelerators/tpu>`. - -sync_batchnorm -^^^^^^^^^^^^^^ - -.. raw:: html - - - -| - -Enable synchronization between batchnorm layers across all GPUs. - -.. testcode:: - - trainer = Trainer(sync_batchnorm=True) - -track_grad_norm -^^^^^^^^^^^^^^^ - -.. raw:: html - - - -| - -- no tracking (-1) -- Otherwise tracks that norm (2 for 2-norm) - -.. testcode:: - - # default used by the Trainer - trainer = Trainer(track_grad_norm=-1) - - # track the 2-norm - trainer = Trainer(track_grad_norm=2) - -.. _tpu_cores: - -tpu_cores -^^^^^^^^^ - -.. warning:: ``tpu_cores=x`` has been deprecated in v1.7 and will be removed in v2.0. - Please use ``accelerator='tpu'`` and ``devices=x`` instead. - -.. raw:: html - - - -| - -- How many TPU cores to train on (1 or 8). -- Which TPU core to train on [1-8] - -A single TPU v2 or v3 has 8 cores. A TPU pod has -up to 2048 cores. A slice of a POD means you get as many cores -as you request. - -Your effective batch size is batch_size * total tpu cores. - -This parameter can be either 1 or 8. - -Example:: - - # your_trainer_file.py - - # default used by the Trainer (ie: train on CPU) - trainer = Trainer(tpu_cores=None) - - # int: train on a single core - trainer = Trainer(tpu_cores=1) - - # list: train on a single selected core - trainer = Trainer(tpu_cores=[2]) - - # int: train on all cores few cores - trainer = Trainer(tpu_cores=8) - - # for 8+ cores must submit via xla script with - # a max of 8 cores specified. 
The XLA script - # will duplicate script onto each TPU in the POD - trainer = Trainer(tpu_cores=8) - -To train on more than 8 cores (ie: a POD), -submit this script using the xla_dist script. - -Example:: - - python -m torch_xla.distributed.xla_dist - --tpu=$TPU_POD_NAME - --conda-env=torch-xla-nightly - --env=XLA_USE_BF16=1 - -- python your_trainer_file.py - - -val_check_interval -^^^^^^^^^^^^^^^^^^ - -.. raw:: html - - - -| - -How often within one training epoch to check the validation set. -Can specify as float or int. - -- pass a ``float`` in the range [0.0, 1.0] to check after a fraction of the training epoch. -- pass an ``int`` to check after a fixed number of training batches. - -.. testcode:: - - # default used by the Trainer - trainer = Trainer(val_check_interval=1.0) - - # check validation set 4 times during a training epoch - trainer = Trainer(val_check_interval=0.25) - - # check validation set every 1000 training batches - # use this when using iterableDataset and your dataset has no length - # (ie: production cases with streaming data) - trainer = Trainer(val_check_interval=1000) - - -.. code-block:: python - - # Here is the computation to estimate the total number of batches seen within an epoch. - - # Find the total number of train batches - total_train_batches = total_train_samples // (train_batch_size * world_size) - - # Compute how many times we will call validation during the training loop - val_check_batch = max(1, int(total_train_batches * val_check_interval)) - val_checks_per_epoch = total_train_batches / val_check_batch - - # Find the total number of validation batches - total_val_batches = total_val_samples // (val_batch_size * world_size) - - # Total number of batches run - total_fit_batches = total_train_batches + total_val_batches - - -weights_save_path -^^^^^^^^^^^^^^^^^ - - -.. warning:: `weights_save_path` has been deprecated in v1.6 and will be removed in v1.8. 
Please pass - ``dirpath`` directly to the :class:`~pytorch_lightning.callbacks.model_checkpoint.ModelCheckpoint` - callback. - - -.. raw:: html - - - -| - -Directory of where to save weights if specified. - -.. testcode:: - - # default used by the Trainer - trainer = Trainer(weights_save_path=os.getcwd()) - - # save to your custom path - trainer = Trainer(weights_save_path="my/path") - -Example:: - - # if checkpoint callback used, then overrides the weights path - # **NOTE: this saves weights to some/path NOT my/path - checkpoint = ModelCheckpoint(dirpath='some/path') - trainer = Trainer( - callbacks=[checkpoint], - weights_save_path='my/path' - ) - -weights_summary -^^^^^^^^^^^^^^^ - -.. warning:: `weights_summary` is deprecated in v1.5 and will be removed in v1.7. Please pass :class:`~pytorch_lightning.callbacks.model_summary.ModelSummary` - directly to the Trainer's ``callbacks`` argument instead. To disable the model summary, - pass ``enable_model_summary = False`` to the Trainer. - - -.. raw:: html - - - -| - -Prints a summary of the weights when training begins. -Options: 'full', 'top', None. - -.. testcode:: - - # default used by the Trainer (ie: print summary of top level modules) - trainer = Trainer(weights_summary="top") - - # print full summary of all modules and submodules - trainer = Trainer(weights_summary="full") - - # don't print a summary - trainer = Trainer(weights_summary=None) - - -enable_model_summary -^^^^^^^^^^^^^^^^^^^^ - -Whether to enable or disable the model summarization. Defaults to True. - -.. testcode:: - - # default used by the Trainer - trainer = Trainer(enable_model_summary=True) - - # disable summarization - trainer = Trainer(enable_model_summary=False) - - # enable custom summarization - from pytorch_lightning.callbacks import ModelSummary - - trainer = Trainer(enable_model_summary=True, callbacks=[ModelSummary(max_depth=-1)]) - ------ - -Trainer class API ------------------ - -Methods -^^^^^^^ - -init -**** - -.. 
automethod:: pytorch_lightning.trainer.Trainer.__init__ - :noindex: - -fit -**** - -.. automethod:: pytorch_lightning.trainer.Trainer.fit - :noindex: - -validate -******** - -.. automethod:: pytorch_lightning.trainer.Trainer.validate - :noindex: - -test -**** - -.. automethod:: pytorch_lightning.trainer.Trainer.test - :noindex: - -predict -******* - -.. automethod:: pytorch_lightning.trainer.Trainer.predict - :noindex: - -tune -**** - -.. automethod:: pytorch_lightning.trainer.Trainer.tune - :noindex: - - -Properties -^^^^^^^^^^ - -callback_metrics -**************** - -The metrics available to callbacks. These are automatically set when you log via `self.log` - -.. code-block:: python - - def training_step(self, batch, batch_idx): - self.log("a_val", 2) - - - callback_metrics = trainer.callback_metrics - assert callback_metrics["a_val"] == 2 - -current_epoch -************* - -The number of epochs run. - -.. code-block:: python - - if trainer.current_epoch >= 10: - ... - -global_step -*********** - -The number of optimizer steps taken (does not reset each epoch). -This includes multiple optimizers and TBPTT steps (if enabled). - -.. code-block:: python - - if trainer.global_step >= 100: - ... - -logger -******* - -The current logger being used. Here's an example using tensorboard - -.. code-block:: python - - logger = trainer.logger - tensorboard = logger.experiment - - -loggers -******** - -The list of loggers currently being used by the Trainer. - -.. code-block:: python - - # List of Logger objects - loggers = trainer.loggers - for logger in loggers: - logger.log_metrics({"foo": 1.0}) - - -logged_metrics -************** - -The metrics sent to the logger (visualizer). - -.. code-block:: python - - def training_step(self, batch, batch_idx): - self.log("a_val", 2, logger=True) - - - logged_metrics = trainer.logged_metrics - assert logged_metrics["a_val"] == 2 - -log_dir -******* -The directory for the current experiment. Use this to save images to, etc... - -.. 
code-block:: python - - def training_step(self, batch, batch_idx): - img = ... - save_img(img, self.trainer.log_dir) - - - -is_global_zero -************** - -Whether this process is the global zero in multi-node training - -.. code-block:: python - - def training_step(self, batch, batch_idx): - if self.trainer.is_global_zero: - print("in node 0, accelerator 0") - -progress_bar_metrics -******************** - -The metrics sent to the progress bar. - -.. code-block:: python - - def training_step(self, batch, batch_idx): - self.log("a_val", 2, prog_bar=True) - - - progress_bar_metrics = trainer.progress_bar_metrics - assert progress_bar_metrics["a_val"] == 2 - - -estimated_stepping_batches -************************** - -Check out :meth:`~pytorch_lightning.trainer.trainer.Trainer.estimated_stepping_batches`. - -state -***** - -The current state of the Trainer, including the current function that is running, the stage of -execution within that function, and the status of the Trainer. - -.. code-block:: python - - # fn in ("fit", "validate", "test", "predict", "tune") - trainer.state.fn - # status in ("initializing", "running", "finished", "interrupted") - trainer.state.status - # stage in ("train", "sanity_check", "validate", "test", "predict", "tune") - trainer.state.stage diff --git a/docs/_sources/common_usecases.rst.txt b/docs/_sources/common_usecases.rst.txt deleted file mode 100644 index 606eea9..0000000 --- a/docs/_sources/common_usecases.rst.txt +++ /dev/null @@ -1,171 +0,0 @@ -:orphan: - -################ -Common Workflows -################ - -Customize and extend Lightning for things like custom hardware or distributed strategies. - -.. join_slack:: - :align: left - ----- - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Avoid overfitting - :description: Add a training and test loop. - :col_css: col-md-12 - :button_link: common/evaluation.html - :height: 100 - -.. displayitem:: - :header: Build a model - :description: Steps to build a model. - :col_css: col-md-12 - :button_link: model/build_model.html - :height: 100 - -.. displayitem:: - :header: Configure hyperparameters from the CLI - :description: Enable basic CLI with Lightning. - :col_css: col-md-12 - :button_link: common/hyperparameters.html - :height: 100 - -.. displayitem:: - :header: Customize the progress bar - :description: Change the progress bar behavior. - :col_css: col-md-12 - :button_link: common/progress_bar.html - :height: 100 - -.. displayitem:: - :header: Deploy models into production - :description: Deploy models with different levels of scale. - :col_css: col-md-12 - :button_link: deploy/production.html - :height: 100 - -.. displayitem:: - :header: Effective Training Techniques - :description: Explore advanced training techniques. - :col_css: col-md-12 - :button_link: advanced/training_tricks.html - :height: 100 - -.. displayitem:: - :header: Eliminate config boilerplate - :description: Control your training via CLI and YAML. - :col_css: col-md-12 - :button_link: cli/lightning_cli.html - :height: 100 - -.. displayitem:: - :header: Find bottlenecks in your code - :description: Learn to find bottlenecks in your code. - :col_css: col-md-12 - :button_link: tuning/profiler.html - :height: 100 - -.. displayitem:: - :header: Finetune a model - :description: Learn to use pretrained models - :col_css: col-md-12 - :button_link: advanced/transfer_learning.html - :height: 100 - -.. displayitem:: - :header: Manage Experiments - :description: Learn to track and visualize experiments - :col_css: col-md-12 - :button_link: visualize/logging_intermediate.html - :height: 100 - -.. 
displayitem:: - :header: Run on an on-prem cluster - :description: Learn to run on your own cluster - :col_css: col-md-12 - :button_link: clouds/cluster.html - :height: 100 - -.. displayitem:: - :header: Save and load model progress - :description: Save and load progress with checkpoints. - :col_css: col-md-12 - :button_link: common/checkpointing_basic.html - :height: 100 - -.. displayitem:: - :header: Save memory with half-precision - :description: Enable half-precision to train faster and save memory. - :col_css: col-md-12 - :button_link: common/precision.html - :height: 100 - -.. displayitem:: - :header: Train 1 trillion+ parameter models - :description: Scale GPU training to 1 trillion + parameter models - :col_css: col-md-12 - :button_link: advanced/model_parallel.html - :height: 100 - -.. displayitem:: - :header: Train on the cloud - :description: Run models on the cloud. - :col_css: col-md-12 - :button_link: clouds/cloud_training.html - :height: 100 - -.. displayitem:: - :header: Train on single or multiple GPUs - :description: Train models faster with GPUs. - :col_css: col-md-12 - :button_link: accelerators/gpu.html - :height: 100 - -.. displayitem:: - :header: Train on single or multiple HPUs - :description: Train models faster with HPUs. - :col_css: col-md-12 - :button_link: accelerators/hpu.html - :height: 100 - -.. displayitem:: - :header: Train on single or multiple IPUs - :description: Train models faster with IPUs. - :col_css: col-md-12 - :button_link: accelerators/ipu.html - :height: 100 - -.. displayitem:: - :header: Train on single or multiple TPUs - :description: Train models faster with TPUs. - :col_css: col-md-12 - :button_link: accelerators/tpu.html - :height: 100 - -.. displayitem:: - :header: Track and Visualize Experiments - :description: Learn to track and visualize experiments - :col_css: col-md-12 - :button_link: visualize/logging_intermediate.html - :height: 100 - -.. 
displayitem:: - :header: Use a pure PyTorch training loop - :description: Run your pure PyTorch loop with Lightning. - :col_css: col-md-12 - :button_link: model/own_your_loop.html - :height: 100 - -.. raw:: html - -
-
diff --git a/docs/_sources/data/datamodule.rst.txt b/docs/_sources/data/datamodule.rst.txt deleted file mode 100644 index bce1877..0000000 --- a/docs/_sources/data/datamodule.rst.txt +++ /dev/null @@ -1,501 +0,0 @@ -.. _datamodules: - -################### -LightningDataModule -################### -A datamodule is a shareable, reusable class that encapsulates all the steps needed to process data: - -.. raw:: html - - - -| - -A datamodule encapsulates the five steps involved in data processing in PyTorch: - -1. Download / tokenize / process. -2. Clean and (maybe) save to disk. -3. Load inside :class:`~torch.utils.data.Dataset`. -4. Apply transforms (rotate, tokenize, etc...). -5. Wrap inside a :class:`~torch.utils.data.DataLoader`. - -| - -This class can then be shared and used anywhere: - -.. code-block:: python - - from pl_bolts.datamodules import CIFAR10DataModule, ImagenetDataModule - - model = LitClassifier() - trainer = Trainer() - - imagenet = ImagenetDataModule() - trainer.fit(model, datamodule=imagenet) - - cifar10 = CIFAR10DataModule() - trainer.fit(model, datamodule=cifar10) - ---------------- - -*************************** -Why do I need a DataModule? -*************************** -In normal PyTorch code, the data cleaning/preparation is usually scattered across many files. This makes -sharing and reusing the exact splits and transforms across projects impossible. - -Datamodules are for you if you ever asked the questions: - -- what splits did you use? -- what transforms did you use? -- what normalization did you use? -- how did you prepare/tokenize the data? - --------------- - -********************* -What is a DataModule? -********************* -A DataModule is simply a collection of a train_dataloader(s), val_dataloader(s), test_dataloader(s) and -predict_dataloader(s) along with the matching transforms and data processing/downloads steps required. - -Here's a simple PyTorch example: - -.. 
code-block:: python - - # regular PyTorch - test_data = MNIST(my_path, train=False, download=True) - predict_data = MNIST(my_path, train=False, download=True) - train_data = MNIST(my_path, train=True, download=True) - train_data, val_data = random_split(train_data, [55000, 5000]) - - train_loader = DataLoader(train_data, batch_size=32) - val_loader = DataLoader(val_data, batch_size=32) - test_loader = DataLoader(test_data, batch_size=32) - predict_loader = DataLoader(predict_data, batch_size=32) - -The equivalent DataModule just organizes the same exact code, but makes it reusable across projects. - -.. code-block:: python - - class MNISTDataModule(pl.LightningDataModule): - def __init__(self, data_dir: str = "path/to/dir", batch_size: int = 32): - super().__init__() - self.data_dir = data_dir - self.batch_size = batch_size - - def setup(self, stage: Optional[str] = None): - self.mnist_test = MNIST(self.data_dir, train=False) - self.mnist_predict = MNIST(self.data_dir, train=False) - mnist_full = MNIST(self.data_dir, train=True) - self.mnist_train, self.mnist_val = random_split(mnist_full, [55000, 5000]) - - def train_dataloader(self): - return DataLoader(self.mnist_train, batch_size=self.batch_size) - - def val_dataloader(self): - return DataLoader(self.mnist_val, batch_size=self.batch_size) - - def test_dataloader(self): - return DataLoader(self.mnist_test, batch_size=self.batch_size) - - def predict_dataloader(self): - return DataLoader(self.mnist_predict, batch_size=self.batch_size) - - def teardown(self, stage: Optional[str] = None): - # Used to clean-up when the run is finished - ... - -But now, as the complexity of your processing grows (transforms, multiple-GPU training), you can -let Lightning handle those details for you while making this dataset reusable so you can share with -colleagues or use in different projects. - -.. 
code-block:: python - - mnist = MNISTDataModule(my_path) - model = LitClassifier() - - trainer = Trainer() - trainer.fit(model, mnist) - -Here's a more realistic, complex DataModule that shows how much more reusable the datamodule is. - -.. code-block:: python - - import pytorch_lightning as pl - from torch.utils.data import random_split, DataLoader - - # Note - you must have torchvision installed for this example - from torchvision.datasets import MNIST - from torchvision import transforms - - - class MNISTDataModule(pl.LightningDataModule): - def __init__(self, data_dir: str = "./"): - super().__init__() - self.data_dir = data_dir - self.transform = transforms.Compose([transforms.ToTensor(), transforms.Normalize((0.1307,), (0.3081,))]) - - def prepare_data(self): - # download - MNIST(self.data_dir, train=True, download=True) - MNIST(self.data_dir, train=False, download=True) - - def setup(self, stage: Optional[str] = None): - - # Assign train/val datasets for use in dataloaders - if stage == "fit" or stage is None: - mnist_full = MNIST(self.data_dir, train=True, transform=self.transform) - self.mnist_train, self.mnist_val = random_split(mnist_full, [55000, 5000]) - - # Assign test dataset for use in dataloader(s) - if stage == "test" or stage is None: - self.mnist_test = MNIST(self.data_dir, train=False, transform=self.transform) - - if stage == "predict" or stage is None: - self.mnist_predict = MNIST(self.data_dir, train=False, transform=self.transform) - - def train_dataloader(self): - return DataLoader(self.mnist_train, batch_size=32) - - def val_dataloader(self): - return DataLoader(self.mnist_val, batch_size=32) - - def test_dataloader(self): - return DataLoader(self.mnist_test, batch_size=32) - - def predict_dataloader(self): - return DataLoader(self.mnist_predict, batch_size=32) - ---------------- - -*********************** -LightningDataModule API -*********************** -To define a DataModule the following methods are used to create 
train/val/test/predict dataloaders: - -- :ref:`prepare_data` (how to download, tokenize, etc...) -- :ref:`setup` (how to split, define dataset, etc...) -- :ref:`train_dataloader` -- :ref:`val_dataloader` -- :ref:`test_dataloader` -- :ref:`predict_dataloader` - - -prepare_data -============ -Downloading and saving data with multiple processes (distributed settings) will result in corrupted data. Lightning -ensures the :meth:`~pytorch_lightning.core.hooks.DataHooks.prepare_data` is called only within a single process on CPU, -so you can safely add your downloading logic within. In case of multi-node training, the execution of this hook -depends upon :ref:`prepare_data_per_node`. :meth:`~pytorch_lightning.core.hooks.DataHooks.setup` is called after -``prepare_data`` and there is a barrier in between which ensures that all the processes proceed to ``setup`` once the data is prepared and available for use. - -- download, i.e. download data only once on the disk from a single process -- tokenize. Since it's a one time process, it is not recommended to do it on all processes -- etc... - -.. code-block:: python - - class MNISTDataModule(pl.LightningDataModule): - def prepare_data(self): - # download - MNIST(os.getcwd(), train=True, download=True, transform=transforms.ToTensor()) - MNIST(os.getcwd(), train=False, download=True, transform=transforms.ToTensor()) - - -.. warning:: - - ``prepare_data`` is called from the main process. It is not recommended to assign state here (e.g. ``self.x = y``) since it is called on a single process and if you assign - states here then they won't be available for other processes. - - -setup -===== -There are also data operations you might want to perform on every GPU. Use :meth:`~pytorch_lightning.core.hooks.DataHooks.setup` to do things like: - -- count number of classes -- build vocabulary -- perform train/val/test splits -- create datasets -- apply transforms (defined explicitly in your datamodule) -- etc... - -.. 
code-block:: python - - import pytorch_lightning as pl - - - class MNISTDataModule(pl.LightningDataModule): - def setup(self, stage: Optional[str] = None): - - # Assign Train/val split(s) for use in Dataloaders - if stage in (None, "fit"): - mnist_full = MNIST(self.data_dir, train=True, download=True, transform=self.transform) - self.mnist_train, self.mnist_val = random_split(mnist_full, [55000, 5000]) - - # Assign Test split(s) for use in Dataloaders - if stage in (None, "test"): - self.mnist_test = MNIST(self.data_dir, train=False, download=True, transform=self.transform) - - -For example, if you are working on an NLP task where you need to tokenize the text before using it, you can do something like the following: - -.. code-block:: python - - class LitDataModule(LightningDataModule): - def prepare_data(self): - dataset = load_Dataset(...) - train_dataset = ... - val_dataset = ... - # tokenize - # save it to disk - - def setup(self, stage): - # load it back here - dataset = load_dataset_from_disk(...) - - -This method expects a ``stage`` argument. -It is used to separate setup logic for ``trainer.{fit,validate,test,predict}``. If ``setup`` is called with ``stage=None``, -we assume all stages have been set-up. - -.. note:: :ref:`setup` is called from every process across all the nodes. Setting state here is recommended. -.. note:: :ref:`teardown` can be used to clean up the state. It is also called from every process across all the nodes. - - -train_dataloader -================ -Use the :meth:`~pytorch_lightning.core.hooks.DataHooks.train_dataloader` method to generate the training dataloader(s). -Usually you just wrap the dataset you defined in :ref:`setup`. This is the dataloader that the Trainer -:meth:`~pytorch_lightning.trainer.trainer.Trainer.fit` method uses. - -.. code-block:: python - - import pytorch_lightning as pl - - - class MNISTDataModule(pl.LightningDataModule): - def train_dataloader(self): - return DataLoader(self.mnist_train, batch_size=64) - -.. 
_datamodule_val_dataloader_label: - -val_dataloader -============== -Use the :meth:`~pytorch_lightning.core.hooks.DataHooks.val_dataloader` method to generate the validation dataloader(s). -Usually you just wrap the dataset you defined in :ref:`setup`. This is the dataloader that the Trainer -:meth:`~pytorch_lightning.trainer.trainer.Trainer.fit` and :meth:`~pytorch_lightning.trainer.trainer.Trainer.validate` methods use. - -.. code-block:: python - - import pytorch_lightning as pl - - - class MNISTDataModule(pl.LightningDataModule): - def val_dataloader(self): - return DataLoader(self.mnist_val, batch_size=64) - - -.. _datamodule_test_dataloader_label: - -test_dataloader -=============== -Use the :meth:`~pytorch_lightning.core.hooks.DataHooks.test_dataloader` method to generate the test dataloader(s). -Usually you just wrap the dataset you defined in :ref:`setup`. This is the dataloader that the Trainer -:meth:`~pytorch_lightning.trainer.trainer.Trainer.test` method uses. - -.. code-block:: python - - import pytorch_lightning as pl - - - class MNISTDataModule(pl.LightningDataModule): - def test_dataloader(self): - return DataLoader(self.mnist_test, batch_size=64) - - -predict_dataloader -================== -Use the :meth:`~pytorch_lightning.core.hooks.DataHooks.predict_dataloader` method to generate the prediction dataloader(s). -Usually you just wrap the dataset you defined in :ref:`setup`. This is the dataloader that the Trainer -:meth:`~pytorch_lightning.trainer.trainer.Trainer.predict` method uses. - -.. code-block:: python - - import pytorch_lightning as pl - - - class MNISTDataModule(pl.LightningDataModule): - def predict_dataloader(self): - return DataLoader(self.mnist_predict, batch_size=64) - - -transfer_batch_to_device -======================== - -.. automethod:: pytorch_lightning.core.datamodule.LightningDataModule.transfer_batch_to_device - :noindex: - -on_before_batch_transfer -======================== - -.. 
automethod:: pytorch_lightning.core.datamodule.LightningDataModule.on_before_batch_transfer - :noindex: - -on_after_batch_transfer -======================= - -.. automethod:: pytorch_lightning.core.datamodule.LightningDataModule.on_after_batch_transfer - :noindex: - -load_state_dict -=============== - -.. automethod:: pytorch_lightning.core.datamodule.LightningDataModule.load_state_dict - :noindex: - -state_dict -========== - -.. automethod:: pytorch_lightning.core.datamodule.LightningDataModule.state_dict - :noindex: - -on_train_dataloader -=================== - -.. automethod:: pytorch_lightning.core.datamodule.LightningDataModule.on_train_dataloader - :noindex: - -on_val_dataloader -================= - -.. automethod:: pytorch_lightning.core.datamodule.LightningDataModule.on_val_dataloader - :noindex: - -on_test_dataloader -================== - -.. automethod:: pytorch_lightning.core.datamodule.LightningDataModule.on_test_dataloader - :noindex: - -on_predict_dataloader -===================== - -.. automethod:: pytorch_lightning.core.datamodule.LightningDataModule.on_predict_dataloader - :noindex: - -teardown -======== - -.. automethod:: pytorch_lightning.core.datamodule.LightningDataModule.teardown - :noindex: - -prepare_data_per_node -===================== -If set to ``True`` will call ``prepare_data()`` on LOCAL_RANK=0 for every node. -If set to ``False`` will only call from NODE_RANK=0, LOCAL_RANK=0. - -.. testcode:: - - class LitDataModule(LightningDataModule): - def __init__(self): - super().__init__() - self.prepare_data_per_node = True - - ------------------- - -****************** -Using a DataModule -****************** - -The recommended way to use a DataModule is simply: - -.. 
code-block:: python - - dm = MNISTDataModule() - model = Model() - trainer.fit(model, datamodule=dm) - trainer.test(datamodule=dm) - trainer.validate(datamodule=dm) - trainer.predict(datamodule=dm) - -If you need information from the dataset to build your model, then run -:ref:`prepare_data` and -:ref:`setup` manually (Lightning ensures -the method runs on the correct devices). - -.. code-block:: python - - dm = MNISTDataModule() - dm.prepare_data() - dm.setup(stage="fit") - - model = Model(num_classes=dm.num_classes, width=dm.width, vocab=dm.vocab) - trainer.fit(model, dm) - - dm.setup(stage="test") - trainer.test(datamodule=dm) - ----------------- - -***************************** -DataModules without Lightning -***************************** -You can of course use DataModules in plain PyTorch code as well. - -.. code-block:: python - - # download, etc... - dm = MNISTDataModule() - dm.prepare_data() - - # splits/transforms - dm.setup(stage="fit") - - # use data - for batch in dm.train_dataloader(): - ... - - for batch in dm.val_dataloader(): - ... - - dm.teardown(stage="fit") - - # lazy load test data - dm.setup(stage="test") - for batch in dm.test_dataloader(): - ... - - dm.teardown(stage="test") - -But overall, DataModules encourage reproducibility by allowing all details of a dataset to be specified in a unified -structure. - ----------------- - -****************************** -Hyperparameters in DataModules -****************************** -Like LightningModules, DataModules support hyperparameters with the same API. - -.. code-block:: python - - import pytorch_lightning as pl - - - class CustomDataModule(pl.LightningDataModule): - def __init__(self, *args, **kwargs): - super().__init__() - self.save_hyperparameters() - - def configure_optimizers(self): - # access the saved hyperparameters - opt = optim.Adam(self.parameters(), lr=self.hparams.lr) - -Refer to ``save_hyperparameters`` in :doc:`lightning module <../common/lightning_module>` for more details. 
- - ----- - -.. include:: ../extensions/datamodules_state.rst diff --git a/docs/_sources/debug/debugging.rst.txt b/docs/_sources/debug/debugging.rst.txt deleted file mode 100644 index 8fd78d6..0000000 --- a/docs/_sources/debug/debugging.rst.txt +++ /dev/null @@ -1,41 +0,0 @@ -.. _debugging: - -################ -Debug your model -################ - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Basic - :description: Learn the basics of model debugging. - :col_css: col-md-4 - :button_link: debugging_basic.html - :height: 150 - :tag: basic - -.. displayitem:: - :header: Intermediate - :description: Learn to debug machine learning operations - :col_css: col-md-4 - :button_link: debugging_intermediate.html - :height: 150 - :tag: intermediate - -.. displayitem:: - :header: Advanced - :description: Learn to debug distributed models - :col_css: col-md-4 - :button_link: debugging_advanced.html - :height: 150 - :tag: advanced - -.. raw:: html - -
-
diff --git a/docs/_sources/debug/debugging_advanced.rst.txt b/docs/_sources/debug/debugging_advanced.rst.txt deleted file mode 100644 index 0c1685a..0000000 --- a/docs/_sources/debug/debugging_advanced.rst.txt +++ /dev/null @@ -1,44 +0,0 @@ -:orphan: - -.. _debugging_advanced: - -########################### -Debug your model (advanced) -########################### -**Audience**: Users who want to debug distributed models. - ----- - -************************ -Debug distributed models -************************ -To debug a distributed model, we recommend you debug it locally by running the distributed version on CPUs: - -.. code-block:: python - - trainer = Trainer(accelerator="cpu", strategy="ddp", devices=2) - -On the CPU, you can use `pdb `_ or `breakpoint() `_ -or use regular print statements. - -.. testcode:: - - class LitModel(LightningModule): - def training_step(self, batch, batch_idx): - - debugging_message = ... - print(f"RANK - {self.trainer.global_rank}: {debugging_message}") - - if self.trainer.global_rank == 0: - import pdb - - pdb.set_trace() - - # to prevent other processes from moving forward until all processes are in sync - self.trainer.strategy.barrier() - -When everything works, switch back to GPU by changing only the accelerator. - -.. code-block:: python - - trainer = Trainer(accelerator="gpu", strategy="ddp", devices=2) diff --git a/docs/_sources/debug/debugging_basic.rst.txt b/docs/_sources/debug/debugging_basic.rst.txt deleted file mode 100644 index 147285f..0000000 --- a/docs/_sources/debug/debugging_basic.rst.txt +++ /dev/null @@ -1,161 +0,0 @@ -:orphan: - -.. _debugging_basic: - -######################## -Debug your model (basic) -######################## -**Audience**: Users who want to learn the basics of debugging models. - -.. raw:: html - - - ----- - -********************************** -How does Lightning help me debug ? 
-********************************** -The Lightning Trainer has *a lot* of arguments devoted to maximizing your debugging productivity. - ----- - -**************** -Set a breakpoint -**************** -A breakpoint stops your code execution so you can inspect variables, etc... and allow your code to execute one line at a time. - -.. code:: python - - def function_to_debug(): - x = 2 - - # set breakpoint - import pdb - - pdb.set_trace() - y = x ** 2 - -In this example, the code will stop before executing the ``y = x**2`` line. - ----- - -************************************ -Run all your model code once quickly -************************************ -If you've ever trained a model for days only to crash during validation or testing then this trainer argument is about to become your best friend. - -The :paramref:`~pytorch_lightning.trainer.trainer.Trainer.fast_dev_run` argument in the trainer runs 1 batch of training, validation, test and prediction data through your trainer to see if there are any bugs: - -.. code:: python - - Trainer(fast_dev_run=True) - -To change how many batches to use, change the argument to an integer. Here we run 7 batches of each: - -.. code:: python - - Trainer(fast_dev_run=7) - - -.. note:: - - This argument will disable tuner, checkpoint callbacks, early stopping callbacks, - loggers and logger callbacks like :class:`~pytorch_lightning.callbacks.lr_monitor.LearningRateMonitor` and - :class:`~pytorch_lightning.callbacks.device_stats_monitor.DeviceStatsMonitor`. - ----- - -************************ -Shorten the epoch length -************************ -Sometimes it's helpful to only use a fraction of your training, val, test, or predict data (or a set number of batches). -For example, you can use 10% of the training set and 1% of the validation set. - -On larger datasets like Imagenet, this can help you debug or test a few things faster than waiting for a full epoch. - -.. 
testcode:: - - # use only 10% of training data and 1% of val data - trainer = Trainer(limit_train_batches=0.1, limit_val_batches=0.01) - - # use 10 batches of train and 5 batches of val - trainer = Trainer(limit_train_batches=10, limit_val_batches=5) - ----- - -****************** -Run a Sanity Check -****************** -Lightning runs **2** steps of validation in the beginning of training. -This avoids crashing in the validation loop sometime deep into a lengthy training loop. - -(See: :paramref:`~pytorch_lightning.trainer.trainer.Trainer.num_sanity_val_steps` -argument of :class:`~pytorch_lightning.trainer.trainer.Trainer`) - -.. testcode:: - - trainer = Trainer(num_sanity_val_steps=2) - ----- - -************************************* -Print LightningModule weights summary -************************************* -Whenever the ``.fit()`` function gets called, the Trainer will print the weights summary for the LightningModule. - -.. code:: python - - trainer.fit(...) - -This generates a table like: - -.. code-block:: text - - | Name | Type | Params - ---------------------------------- - 0 | net | Sequential | 132 K - 1 | net.0 | Linear | 131 K - 2 | net.1 | BatchNorm1d | 1.0 K - -To add the child modules to the summary add a :class:`~pytorch_lightning.callbacks.model_summary.ModelSummary`: - -.. testcode:: - - from pytorch_lightning.callbacks import ModelSummary - - trainer = Trainer(callbacks=[ModelSummary(max_depth=-1)]) - -To turn off the autosummary use: - -.. code:: python - - Trainer(enable_model_summary=False) - ----- - -*********************************** -Print input output layer dimensions -*********************************** -Another debugging tool is to display the intermediate input- and output sizes of all your layers by setting the -``example_input_array`` attribute in your LightningModule. - -..
code-block:: python - - class LitModel(LightningModule): - def __init__(self, *args, **kwargs): - self.example_input_array = torch.Tensor(32, 1, 28, 28) - -With the input array, the summary table will include the input and output layer dimensions: - -.. code-block:: text - - | Name | Type | Params | In sizes | Out sizes - -------------------------------------------------------------- - 0 | net | Sequential | 132 K | [10, 256] | [10, 512] - 1 | net.0 | Linear | 131 K | [10, 256] | [10, 512] - 2 | net.1 | BatchNorm1d | 1.0 K | [10, 512] | [10, 512] - -when you call ``.fit()`` on the Trainer. This can help you find bugs in the composition of your layers. diff --git a/docs/_sources/debug/debugging_intermediate.rst.txt b/docs/_sources/debug/debugging_intermediate.rst.txt deleted file mode 100644 index da8eb59..0000000 --- a/docs/_sources/debug/debugging_intermediate.rst.txt +++ /dev/null @@ -1,79 +0,0 @@ -:orphan: - -.. _debugging_intermediate: - - -############################### -Debug your model (intermediate) -############################### -**Audience**: Users who want to debug their ML code. - ----- - -*************************** -Why should I debug ML code? -*************************** -Machine learning code requires debugging mathematical correctness, which is not something non-ML code has to deal with. Lightning implements a few best-practice techniques to give all users expert-level ML debugging abilities. - ----- - -************************************** -Overfit your model on a Subset of Data -************************************** -A good debugging technique is to take a tiny portion of your data (say 2 samples per class), -and try to get your model to overfit. If it can't, it's a sign it won't work with large datasets. - -(See: :paramref:`~pytorch_lightning.trainer.trainer.Trainer.overfit_batches` -argument of :class:`~pytorch_lightning.trainer.trainer.Trainer`) - -..
testcode:: - - # use only 1% of training data (and turn off validation) - trainer = Trainer(overfit_batches=0.01) - - # similar, but with a fixed 10 batches - trainer = Trainer(overfit_batches=10) - -When using this argument, the validation loop will be disabled. We will also replace the sampler -in the training set to turn off shuffle for you. - ----- - -******************************** -Look-out for exploding gradients -******************************** -One major problem that plagues models is exploding gradients. Gradient norm is one technique that can help keep gradients from exploding. - -.. testcode:: - - # the 2-norm - trainer = Trainer(track_grad_norm=2) - -This will plot the 2-norm to your experiment manager. If you notice the norm is going up, there's a good chance your gradients are exploding or will explode. - -One technique to stop exploding gradients is to clip the gradient: - -.. testcode:: - - # DEFAULT (ie: don't clip) - trainer = Trainer(gradient_clip_val=0) - - # clip gradients' global norm to <=0.5 using gradient_clip_algorithm='norm' by default - trainer = Trainer(gradient_clip_val=0.5) - - # clip gradients' maximum magnitude to <=0.5 - trainer = Trainer(gradient_clip_val=0.5, gradient_clip_algorithm="value") - ----- - -************************* -Detect autograd anomalies -************************* -Lightning helps you detect anomalies in the PyTorch autograd engine via PyTorch's built-in -`Anomaly Detection Context-manager `_. - -Enable it via the **detect_anomaly** trainer argument: - -.. testcode:: - - trainer = Trainer(detect_anomaly=True) diff --git a/docs/_sources/deploy/production.rst.txt b/docs/_sources/deploy/production.rst.txt deleted file mode 100644 index 686fcc5..0000000 --- a/docs/_sources/deploy/production.rst.txt +++ /dev/null @@ -1,79 +0,0 @@ -.. _production_inference: - -############################# -Deploy models into production -############################# - -****** -Basics -****** - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Basic - :description: Learn the basics of predicting with Lightning - :col_css: col-md-6 - :button_link: production_basic.html - :height: 150 - :tag: basic - -.. displayitem:: - :header: Intermediate - :description: Learn to remove the Lightning dependencies and use pure PyTorch for prediction. - :col_css: col-md-6 - :button_link: production_intermediate.html - :height: 150 - :tag: intermediate - -.. raw:: html - -
-
- ----- - -******** -Advanced -******** - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Deploy with ONNX - :description: Optimize models for enterprise-scale production environments with ONNX. - :col_css: col-md-4 - :button_link: production_advanced.html - :height: 180 - :tag: advanced - -.. displayitem:: - :header: Deploy with torchscript - :description: Optimize models for enterprise-scale production environments with torchscript. - :col_css: col-md-4 - :button_link: production_advanced_2.html - :height: 180 - :tag: advanced - -.. displayitem:: - :header: Compress models for fast inference - :description: Compress models for fast inference for deployment with Quantization and Pruning. - :col_css: col-md-4 - :button_link: ../advanced/pruning_quantization.html - :height: 180 - :tag: advanced - -.. raw:: html - -
-
diff --git a/docs/_sources/deploy/production_advanced.rst.txt b/docs/_sources/deploy/production_advanced.rst.txt deleted file mode 100644 index 750355d..0000000 --- a/docs/_sources/deploy/production_advanced.rst.txt +++ /dev/null @@ -1,60 +0,0 @@ -######################################## -Deploy models into production (advanced) -######################################## -**Audience**: Machine learning engineers optimizing models for enterprise-scale production environments. - ----- - -************************** -Compile your model to ONNX -************************** -`ONNX `_ is a package developed by Microsoft to optimize inference. ONNX allows the model to be independent of PyTorch and run on any ONNX Runtime. - -To export your model to ONNX format call the :meth:`~pytorch_lightning.core.lightning.LightningModule.to_onnx` function on your :class:`~pytorch_lightning.core.lightning.LightningModule` with the ``filepath`` and ``input_sample``. - -.. code-block:: python - - class SimpleModel(LightningModule): - def __init__(self): - super().__init__() - self.l1 = torch.nn.Linear(in_features=64, out_features=4) - - def forward(self, x): - return torch.relu(self.l1(x.view(x.size(0), -1))) - - - # create the model - model = SimpleModel() - filepath = "model.onnx" - input_sample = torch.randn((1, 64)) - model.to_onnx(filepath, input_sample, export_params=True) - -You can also skip passing the input sample if the ``example_input_array`` property is specified in your :class:`~pytorch_lightning.core.lightning.LightningModule`. - -.. 
code-block:: python - - class SimpleModel(LightningModule): - def __init__(self): - super().__init__() - self.l1 = torch.nn.Linear(in_features=64, out_features=4) - self.example_input_array = torch.randn(7, 64) - - def forward(self, x): - return torch.relu(self.l1(x.view(x.size(0), -1))) - - - # create the model - model = SimpleModel() - filepath = "model.onnx" - model.to_onnx(filepath, export_params=True) - -Once you have the exported model, you can run it on your ONNX runtime in the following way: - -.. code-block:: python - - import onnxruntime - - ort_session = onnxruntime.InferenceSession(filepath) - input_name = ort_session.get_inputs()[0].name - ort_inputs = {input_name: np.random.randn(1, 64)} - ort_outs = ort_session.run(None, ort_inputs) diff --git a/docs/_sources/deploy/production_advanced_2.rst.txt b/docs/_sources/deploy/production_advanced_2.rst.txt deleted file mode 100644 index e86aee8..0000000 --- a/docs/_sources/deploy/production_advanced_2.rst.txt +++ /dev/null @@ -1,69 +0,0 @@ -:orphan: - -######################################## -Deploy models into production (advanced) -######################################## -**Audience**: Machine learning engineers optimizing models for enterprise-scale production environments. - ----- - -********************************* -Compile your model to TorchScript -********************************* -`TorchScript `_ allows you to serialize your models in a way that it can be loaded in non-Python environments. -The ``LightningModule`` has a handy method :meth:`~pytorch_lightning.core.lightning.LightningModule.to_torchscript` that returns a scripted module which you -can save or directly use. - -.. 
testcode:: python - - class SimpleModel(LightningModule): - def __init__(self): - super().__init__() - self.l1 = torch.nn.Linear(in_features=64, out_features=4) - - def forward(self, x): - return torch.relu(self.l1(x.view(x.size(0), -1))) - - - # create the model - model = SimpleModel() - script = model.to_torchscript() - - # save for use in production environment - torch.jit.save(script, "model.pt") - -It is recommended that you install the latest supported version of PyTorch to use this feature without limitations. - -Once you have the exported model, you can run it in Pytorch or C++ runtime: - -.. code-block:: python - - inp = torch.rand(1, 64) - scripted_module = torch.jit.load("model.pt") - output = scripted_module(inp) - - -If you want to script a different method, you can decorate the method with :func:`torch.jit.export`: - -.. code-block:: python - - class LitMCdropoutModel(pl.LightningModule): - def __init__(self, model, mc_iteration): - super().__init__() - self.model = model - self.dropout = nn.Dropout() - self.mc_iteration = mc_iteration - - @torch.jit.export - def predict_step(self, batch, batch_idx): - # enable Monte Carlo Dropout - self.dropout.train() - - # take average of `self.mc_iteration` iterations - pred = [self.dropout(self.model(x)).unsqueeze(0) for _ in range(self.mc_iteration)] - pred = torch.vstack(pred).mean(dim=0) - return pred - - - model = LitMCdropoutModel(...) - script = model.to_torchscript(file_path="model.pt", method="script") diff --git a/docs/_sources/deploy/production_basic.rst.txt b/docs/_sources/deploy/production_basic.rst.txt deleted file mode 100644 index 00e9caa..0000000 --- a/docs/_sources/deploy/production_basic.rst.txt +++ /dev/null @@ -1,80 +0,0 @@ -##################################### -Deploy models into production (basic) -##################################### -**Audience**: All users. 
- ----- - -***************************** -Load a checkpoint and predict -***************************** -The easiest way to use a model for predictions is to load the weights using **load_from_checkpoint** found in the LightningModule. - -.. code-block:: python - - model = LitModel.load_from_checkpoint("best_model.ckpt") - model.eval() - x = torch.randn(1, 64) - - with torch.no_grad(): - y_hat = model(x) - ----- - -************************************** -Predict step with your LightningModule -************************************** -Loading a checkpoint and predicting still leaves you with a lot of boilerplate around the predict epoch. The **predict step** in the LightningModule removes this boilerplate. - -.. code-block:: python - - class MyModel(LightningModule): - def predict_step(self, batch, batch_idx, dataloader_idx=0): - return self(batch) - -And pass in any dataloader to the Lightning Trainer: - -.. code-block:: python - - data_loader = DataLoader(...) - model = MyModel() - trainer = Trainer() - predictions = trainer.predict(model, data_loader) - ----- - -******************************** -Enable complicated predict logic -******************************** -When you need to add complicated pre-processing or post-processing logic to your data use the predict step. For example here we do `Monte Carlo Dropout `_ for predictions: - -.. 
code-block:: python - - class LitMCdropoutModel(pl.LightningModule): - def __init__(self, model, mc_iteration): - super().__init__() - self.model = model - self.dropout = nn.Dropout() - self.mc_iteration = mc_iteration - - def predict_step(self, batch, batch_idx): - # enable Monte Carlo Dropout - self.dropout.train() - - # take average of `self.mc_iteration` iterations - pred = [self.dropout(self.model(x)).unsqueeze(0) for _ in range(self.mc_iteration)] - pred = torch.vstack(pred).mean(dim=0) - return pred - ----- - -**************************** -Enable distributed inference -**************************** -By using the predict step in Lightning you get free distributed inference - - -.. code-block:: python - - trainer = Trainer(devices=8, accelerator="gpu") - predictions = trainer.predict(model, data_loader) diff --git a/docs/_sources/deploy/production_intermediate.rst.txt b/docs/_sources/deploy/production_intermediate.rst.txt deleted file mode 100644 index eacb03d..0000000 --- a/docs/_sources/deploy/production_intermediate.rst.txt +++ /dev/null @@ -1,99 +0,0 @@ -############################################ -Deploy models into production (intermediate) -############################################ -**Audience**: Researchers and MLEs looking to use their models for predictions without Lightning dependencies. - ----- - -********************* -Use PyTorch as normal -********************* -If you prefer to use PyTorch directly, feel free to use any Lightning checkpoint without Lightning. - -.. code-block:: python - - import torch - - model = torch.load("path/to/lightning/checkpoint.ckpt") - model.eval() - -You can also pull out the specific modules you want out of the checkpoint: - -.. 
code-block:: python - - model = torch.load("path/to/lightning/checkpoint.ckpt") - encoder = model["encoder"] - encoder.eval() - ----- - -******************************************** -Extract nn.Module from Lightning checkpoints -******************************************** -You can also load the saved checkpoint and use it as a regular :class:`torch.nn.Module`. You can extract all your :class:`torch.nn.Module` -and load the weights using the checkpoint saved using LightningModule after training. For this, we recommend copying the exact implementation -from your LightningModule ``init`` and ``forward`` method. - -.. code-block:: python - - class Encoder(nn.Module): - ... - - - class Decoder(nn.Module): - ... - - - class AutoEncoderProd(nn.Module): - def __init__(self): - super().__init__() - self.encoder = Encoder() - self.decoder = Decoder() - - def forward(self, x): - return self.encoder(x) - - - class AutoEncoderSystem(LightningModule): - def __init__(self): - super().__init__() - self.auto_encoder = AutoEncoderProd() - - def forward(self, x): - return self.auto_encoder.encoder(x) - - def training_step(self, batch, batch_idx): - x, y = batch - y_hat = self.auto_encoder.encoder(x) - y_hat = self.auto_encoder.decoder(y_hat) - loss = ... 
- return loss - - - # train it - trainer = Trainer(devices=2, accelerator="gpu", strategy="ddp") - model = AutoEncoderSystem() - trainer.fit(model, train_dataloader, val_dataloader) - trainer.save_checkpoint("best_model.ckpt") - - - # create the PyTorch model and load the checkpoint weights - model = AutoEncoderProd() - checkpoint = torch.load("best_model.ckpt") - hyper_parameters = checkpoint["hyper_parameters"] - - # if you want to restore any hyperparameters, you can pass them too - model = AutoEncoderProd(**hyper_parameters) - - model_weights = checkpoint["state_dict"] - - # update keys by dropping `auto_encoder.` - for key in list(model_weights): - model_weights[key.replace("auto_encoder.", "")] = model_weights.pop(key) - - model.load_state_dict(model_weights) - model.eval() - x = torch.randn(1, 64) - - with torch.no_grad(): - y_hat = model(x) diff --git a/docs/_sources/ecosystem/asr_nlp_tts.rst.txt b/docs/_sources/ecosystem/asr_nlp_tts.rst.txt deleted file mode 100644 index b624696..0000000 --- a/docs/_sources/ecosystem/asr_nlp_tts.rst.txt +++ /dev/null @@ -1,816 +0,0 @@ -:orphan: - -################# -Conversational AI -################# - -These are amazing ecosystems to help with Automatic Speech Recognition (ASR), Natural Language Processing (NLP), and Text-to-Speech (TTS). - ----- - -**** -NeMo -**** - -`NVIDIA NeMo `_ is a toolkit for building new State-of-the-Art -Conversational AI models. NeMo has separate collections for Automatic Speech Recognition (ASR), -Natural Language Processing (NLP), and Text-to-Speech (TTS) models. Each collection consists of -prebuilt modules that include everything needed to train on your data. -Every module can easily be customized, extended, and composed to create new Conversational AI -model architectures. - -Conversational AI architectures are typically very large and require a lot of data and compute -for training. NeMo uses PyTorch Lightning for easy and performant multi-GPU/multi-node -mixed-precision training. - -..
note:: Every NeMo model is a LightningModule that comes equipped with all supporting infrastructure for training and reproducibility. - ----------- - -NeMo Models -=========== - -NeMo Models contain everything needed to train and reproduce state of the art Conversational AI -research and applications, including: - -- neural network architectures -- datasets/data loaders -- data preprocessing/postprocessing -- data augmentors -- optimizers and schedulers -- tokenizers -- language models - -NeMo uses `Hydra `_ for configuring both NeMo models and the PyTorch Lightning Trainer. -Depending on the domain and application, many different AI libraries will have to be configured -to build the application. Hydra makes it easy to bring all of these libraries together -so that each can be configured from .yaml or the Hydra CLI. - -.. note:: Every NeMo model has an example configuration file and a corresponding script that contains all configurations needed for training. - -The end result of using NeMo, Pytorch Lightning, and Hydra is that -NeMo models all have the same look and feel. This makes it easy to do Conversational AI research -across multiple domains. NeMo models are also fully compatible with the PyTorch ecosystem. - -Installing NeMo ---------------- - -Before installing NeMo, please install Cython first. - -.. code-block:: bash - - pip install Cython - -For ASR and TTS models, also install these linux utilities. - -.. code-block:: bash - - apt-get update && apt-get install -y libsndfile1 ffmpeg - -Then installing the latest NeMo release is a simple pip install. - -.. code-block:: bash - - pip install nemo_toolkit[all]==1.0.0b1 - -To install the main branch from GitHub: - -.. code-block:: bash - - python -m pip install git+https://github.com/NVIDIA/NeMo.git@main#egg=nemo_toolkit[all] - -To install from a local clone of NeMo: - -.. code-block:: bash - - ./reinstall.sh # from cloned NeMo's git root - -For Docker users, the NeMo container is available on -`NGC `_. - -.. 
code-block:: bash - - docker pull nvcr.io/nvidia/nemo:v1.0.0b1 - -.. code-block:: bash - - docker run --runtime=nvidia -it --rm -v --shm-size=8g -p 8888:8888 -p 6006:6006 --ulimit memlock=-1 --ulimit stack=67108864 nvcr.io/nvidia/nemo:v1.0.0b1 - -Experiment Manager ------------------- - -NeMo's Experiment Manager leverages PyTorch Lightning for model checkpointing, -TensorBoard Logging, and Weights and Biases logging. The Experiment Manager is included by default -in all NeMo example scripts. - -.. code-block:: python - - exp_manager(trainer, cfg.get("exp_manager", None)) - -And is configurable via .yaml with Hydra. - -.. code-block:: bash - - exp_manager: - exp_dir: null - name: *name - create_tensorboard_logger: True - create_checkpoint_callback: True - -Optionally launch Tensorboard to view training results in ./nemo_experiments (by default). - -.. code-block:: bash - - tensorboard --bind_all --logdir nemo_experiments - --------- - -Automatic Speech Recognition (ASR) -================================== - -Everything needed to train Convolutional ASR models is included with NeMo. -NeMo supports multiple Speech Recognition architectures, including Jasper and QuartzNet. -`NeMo Speech Models `_ -can be trained from scratch on custom datasets or -fine-tuned using pre-trained checkpoints trained on thousands of hours of audio -that can be restored for immediate use. - -Some typical ASR tasks are included with NeMo: - -- `Audio transcription `_ -- `Byte Pair/Word Piece Training `_ -- `Speech Commands `_ -- `Voice Activity Detection `_ -- `Speaker Recognition `_ - -See this `asr notebook `_ -for a full tutorial on doing ASR with NeMo, PyTorch Lightning, and Hydra. - -Specify ASR Model Configurations with YAML File ------------------------------------------------ - -NeMo Models and the PyTorch Lightning Trainer can be fully configured from .yaml files using Hydra. - -See this `asr config `_ -for the entire speech to text .yaml file. - -.. 
code-block:: yaml - - # configure the PyTorch Lightning Trainer - trainer: - gpus: 0 # number of gpus - max_epochs: 5 - max_steps: null # computed at runtime if not set - num_nodes: 1 - accelerator: ddp - ... - # configure the ASR model - model: - ... - encoder: - cls: nemo.collections.asr.modules.ConvASREncoder - params: - feat_in: *n_mels - activation: relu - conv_mask: true - - jasper: - - filters: 128 - repeat: 1 - kernel: [11] - stride: [1] - dilation: [1] - dropout: *dropout - ... - # all other configuration, data, optimizer, preprocessor, etc - ... - -Developing ASR Model From Scratch ---------------------------------- - -`speech_to_text.py `_ - -.. code-block:: python - - # hydra_runner calls hydra.main and is useful for multi-node experiments - @hydra_runner(config_path="conf", config_name="config") - def main(cfg): - trainer = Trainer(**cfg.trainer) - asr_model = EncDecCTCModel(cfg.model, trainer) - trainer.fit(asr_model) - - -Hydra makes every aspect of the NeMo model, -including the PyTorch Lightning Trainer, customizable from the command line. - -.. code-block:: bash - - python NeMo/examples/asr/speech_to_text.py --config-name=quartznet_15x5 \ - trainer.accelerator=gpu \ - trainer.devices=4 \ - trainer.max_epochs=128 \ - +trainer.precision=16 \ - model.train_ds.manifest_filepath=/librispeech-train-all.json \ - model.validation_ds.manifest_filepath=/librispeech-dev-other.json \ - model.train_ds.batch_size=64 \ - +model.validation_ds.num_workers=16 \ - +model.train_ds.num_workers=16 - -.. note:: Training NeMo ASR models can take days/weeks so it is highly recommended to use multiple GPUs and multiple nodes with the PyTorch Lightning Trainer. - - -Using State-Of-The-Art Pre-trained ASR Model --------------------------------------------- - -Transcribe audio with QuartzNet model pretrained on ~3300 hours of audio. - -.. 
code-block:: python - - quartznet = EncDecCTCModel.from_pretrained("QuartzNet15x5Base-En") - - files = ["path/to/my.wav"] # file duration should be less than 25 seconds - - for fname, transcription in zip(files, quartznet.transcribe(paths2audio_files=files)): - print(f"Audio in {fname} was recognized as: {transcription}") - -To see the available pretrained checkpoints: - -.. code-block:: python - - EncDecCTCModel.list_available_models() - -NeMo ASR Model Under the Hood ------------------------------ - -Any aspect of ASR training or model architecture design can easily be customized -with PyTorch Lightning since every NeMo model is a Lightning Module. - -.. code-block:: python - - class EncDecCTCModel(ASRModel): - """Base class for encoder decoder CTC-based models.""" - - ... - - def forward(self, input_signal, input_signal_length): - processed_signal, processed_signal_len = self.preprocessor( - input_signal=input_signal, - length=input_signal_length, - ) - # Spec augment is not applied during evaluation/testing - if self.spec_augmentation is not None and self.training: - processed_signal = self.spec_augmentation(input_spec=processed_signal) - encoded, encoded_len = self.encoder(audio_signal=processed_signal, length=processed_signal_len) - log_probs = self.decoder(encoder_output=encoded) - greedy_predictions = log_probs.argmax(dim=-1, keepdim=False) - return log_probs, encoded_len, greedy_predictions - - # PTL-specific methods - def training_step(self, batch, batch_nb): - audio_signal, audio_signal_len, transcript, transcript_len = batch - log_probs, encoded_len, predictions = self.forward( - input_signal=audio_signal, input_signal_length=audio_signal_len - ) - loss_value = self.loss( - log_probs=log_probs, targets=transcript, input_lengths=encoded_len, target_lengths=transcript_len - ) - wer_num, wer_denom = self._wer(predictions, transcript, transcript_len) - self.log_dict( - { - "train_loss": loss_value, - "training_batch_wer": wer_num / wer_denom, - 
"learning_rate": self._optimizer.param_groups[0]["lr"], - } - ) - return loss_value - -Neural Types in NeMo ASR ------------------------- - -NeMo Models and Neural Modules come with Neural Type checking. -Neural type checking is extremely useful when combining many different neural -network architectures for a production-grade application. - -.. code-block:: python - - @property - def input_types(self) -> Optional[Dict[str, NeuralType]]: - if hasattr(self.preprocessor, "_sample_rate"): - audio_eltype = AudioSignal(freq=self.preprocessor._sample_rate) - else: - audio_eltype = AudioSignal() - return { - "input_signal": NeuralType(("B", "T"), audio_eltype), - "input_signal_length": NeuralType(tuple("B"), LengthsType()), - } - - - @property - def output_types(self) -> Optional[Dict[str, NeuralType]]: - return { - "outputs": NeuralType(("B", "T", "D"), LogprobsType()), - "encoded_lengths": NeuralType(tuple("B"), LengthsType()), - "greedy_predictions": NeuralType(("B", "T"), LabelsType()), - } - --------- - -Natural Language Processing (NLP) -================================= - -Everything needed to finetune BERT-like language models for NLP tasks is included with NeMo. -`NeMo NLP Models `_ -include `HuggingFace Transformers `_ -and `NVIDIA Megatron-LM `_ BERT and Bio-Megatron models. -NeMo can also be used for pretraining BERT-based language models from HuggingFace. 
- -Any of the HuggingFace encoders or Megatron-LM encoders can easily be used for the NLP tasks -that are included with NeMo: - -- `Glue Benchmark (All tasks) `_ -- `Intent Slot Classification `_ -- `Language Modeling (BERT Pretraining) `_ -- `Question Answering `_ -- `Text Classification `_ (including Sentiment Analysis) -- `Token Classification `_ (including Named Entity Recognition) -- `Punctuation and Capitalization `_ - -Named Entity Recognition (NER) ------------------------------- - -NER (or more generally token classification) is the NLP task of detecting and classifying key information (entities) in text. -This task is very popular in Healthcare and Finance. In finance, for example, it can be important to identify -geographical, geopolitical, organizational, persons, events, and natural phenomenon entities. -See this `NER notebook `_ -for a full tutorial on doing NER with NeMo, PyTorch Lightning, and Hydra. - -Specify NER Model Configurations with YAML File ------------------------------------------------ - -.. note:: NeMo Models and the PyTorch Lightning Trainer can be fully configured from .yaml files using Hydra. - -See this `token classification config `_ -for the entire NER (token classification) .yaml file. - -.. code-block:: yaml - - # configure any argument of the PyTorch Lightning Trainer - trainer: - gpus: 1 # the number of gpus, 0 for CPU - num_nodes: 1 - max_epochs: 5 - ... - # configure any aspect of the token classification model here - model: - dataset: - data_dir: ??? # /path/to/data - class_balancing: null # choose from [null, weighted_loss]. Weighted_loss enables the weighted class balancing of the loss, may be used for handling unbalanced classes - max_seq_length: 128 - ... - tokenizer: - tokenizer_name: ${model.language_model.pretrained_model_name} # or sentencepiece - vocab_file: null # path to vocab file - ... 
- # the language model can be from HuggingFace or Megatron-LM - language_model: - pretrained_model_name: bert-base-uncased - lm_checkpoint: null - ... - # the classifier for the downstream task - head: - num_fc_layers: 2 - fc_dropout: 0.5 - activation: 'relu' - ... - # all other configuration: train/val/test/ data, optimizer, experiment manager, etc - ... - -Developing NER Model From Scratch ---------------------------------- - -`token_classification.py `_ - -.. code-block:: python - - # hydra_runner calls hydra.main and is useful for multi-node experiments - @hydra_runner(config_path="conf", config_name="token_classification_config") - def main(cfg: DictConfig) -> None: - trainer = pl.Trainer(**cfg.trainer) - model = TokenClassificationModel(cfg.model, trainer=trainer) - trainer.fit(model) - -After training, we can do inference with the saved NER model using PyTorch Lightning. - -Inference from file: - -.. code-block:: python - - gpu = 1 if cfg.trainer.gpus != 0 else 0 - trainer = pl.Trainer(accelerator="gpu", devices=gpu) - model.set_trainer(trainer) - model.evaluate_from_file( - text_file=os.path.join(cfg.model.dataset.data_dir, cfg.model.validation_ds.text_file), - labels_file=os.path.join(cfg.model.dataset.data_dir, cfg.model.validation_ds.labels_file), - output_dir=exp_dir, - add_confusion_matrix=True, - normalize_confusion_matrix=True, - ) - -Or we can run inference on a few examples: - -.. code-block:: python - - queries = ["we bought four shirts from the nvidia gear store in santa clara.", "Nvidia is a company in Santa Clara."] - results = model.add_predictions(queries) - - for query, result in zip(queries, results): - logging.info(f"Query : {query}") - logging.info(f"Result: {result.strip()}\n") - -Hydra makes every aspect of the NeMo model, including the PyTorch Lightning Trainer, customizable from the command line. - -.. 
code-block:: bash - - python token_classification.py \ - model.language_model.pretrained_model_name=bert-base-cased \ - model.head.num_fc_layers=2 \ - model.dataset.data_dir=/path/to/my/data \ - trainer.max_epochs=5 \ - trainer.accelerator=gpu \ - trainer.devices=[0,1] - ------------ - -Tokenizers ----------- - -Tokenization is the process of converting natural language text into integer arrays -which can be used for machine learning. -For NLP tasks, tokenization is an essential part of data preprocessing. -NeMo supports all BERT-like model tokenizers from -`HuggingFace's AutoTokenizer `_ -and also supports `Google's SentencePieceTokenizer `_ -which can be trained on custom data. - -To see the list of supported tokenizers: - -.. code-block:: python - - from nemo.collections import nlp as nemo_nlp - - nemo_nlp.modules.get_tokenizer_list() - -See this `tokenizer notebook `_ -for a full tutorial on using tokenizers in NeMo. - -Language Models ---------------- - -Language models are used to extract information from (tokenized) text. -Much of the state-of-the-art in natural language processing is achieved -by fine-tuning pretrained language models on the downstream task. - -With NeMo, you can either `pretrain `_ -a BERT model on your data or use a pretrained language model from `HuggingFace Transformers `_ -or `NVIDIA Megatron-LM `_. - -To see the list of language models available in NeMo: - -.. code-block:: python - - nemo_nlp.modules.get_pretrained_lm_models_list(include_external=True) - -Easily switch between any language model in the above list by using `.get_lm_model`. - -.. code-block:: python - - nemo_nlp.modules.get_lm_model(pretrained_model_name="distilbert-base-uncased") - -See this `language model notebook `_ -for a full tutorial on using pretrained language models in NeMo. - -Using a Pre-trained NER Model ------------------------------ - -NeMo has pre-trained NER models that can be used -to get started with Token Classification right away. 
-Models are automatically downloaded from NGC, -cached locally to disk, -and loaded into GPU memory using the `.from_pretrained` method. - -.. code-block:: python - - # load pre-trained NER model - pretrained_ner_model = TokenClassificationModel.from_pretrained(model_name="NERModel") - - # define the list of queries for inference - queries = [ - "we bought four shirts from the nvidia gear store in santa clara.", - "Nvidia is a company.", - "The Adventures of Tom Sawyer by Mark Twain is an 1876 novel about a young boy growing " - + "up along the Mississippi River.", - ] - results = pretrained_ner_model.add_predictions(queries) - - for query, result in zip(queries, results): - print() - print(f"Query : {query}") - print(f"Result: {result.strip()}\n") - -NeMo NER Model Under the Hood ------------------------------ - -Any aspect of NLP training or model architecture design can easily be customized with PyTorch Lightning -since every NeMo model is a Lightning Module. - -.. code-block:: python - - class TokenClassificationModel(ModelPT): - """ - Token Classification Model with BERT, applicable for tasks such as Named Entity Recognition - """ - - ... - - def forward(self, input_ids, token_type_ids, attention_mask): - hidden_states = self.bert_model( - input_ids=input_ids, token_type_ids=token_type_ids, attention_mask=attention_mask - ) - logits = self.classifier(hidden_states=hidden_states) - return logits - - # PTL-specific methods - def training_step(self, batch, batch_idx): - """ - Lightning calls this inside the training loop with the data from the training dataloader - passed in as `batch`. - """ - input_ids, input_type_ids, input_mask, subtokens_mask, loss_mask, labels = batch - logits = self(input_ids=input_ids, token_type_ids=input_type_ids, attention_mask=input_mask) - - loss = self.loss(logits=logits, labels=labels, loss_mask=loss_mask) - self.log_dict({"train_loss": loss, "lr": self._optimizer.param_groups[0]["lr"]}) - return loss - - ... 
- -Neural Types in NeMo NLP ------------------------- - -NeMo Models and Neural Modules come with Neural Type checking. -Neural type checking is extremely useful when combining many different neural network architectures -for a production-grade application. - -.. code-block:: python - - @property - def input_types(self) -> Optional[Dict[str, NeuralType]]: - return self.bert_model.input_types - - - @property - def output_types(self) -> Optional[Dict[str, NeuralType]]: - return self.classifier.output_types - --------- - -Text-To-Speech (TTS) -==================== - -Everything needed to train TTS models and generate audio is included with NeMo. -`NeMo TTS Models `_ -can be trained from scratch on your own data or pretrained models can be downloaded -automatically. NeMo currently supports a two step inference procedure. -First, a model is used to generate a mel spectrogram from text. -Second, a model is used to generate audio from a mel spectrogram. - -Mel Spectrogram Generators: - -- `Tacotron 2 `_ -- `Glow-TTS `_ - -Audio Generators: - -- Griffin-Lim -- `WaveGlow `_ -- `SqueezeWave `_ - - -Specify TTS Model Configurations with YAML File ------------------------------------------------ - -.. note:: NeMo Models and PyTorch Lightning Trainer can be fully configured from .yaml files using Hydra. - -`tts/conf/glow_tts.yaml `_ - -.. code-block:: yaml - - # configure the PyTorch Lightning Trainer - trainer: - gpus: -1 # number of gpus - max_epochs: 350 - num_nodes: 1 - accelerator: ddp - ... - - # configure the TTS model - model: - ... - encoder: - cls: nemo.collections.tts.modules.glow_tts.TextEncoder - params: - n_vocab: 148 - out_channels: *n_mels - hidden_channels: 192 - filter_channels: 768 - filter_channels_dp: 256 - ... - # all other configuration, data, optimizer, parser, preprocessor, etc - ... - -Developing TTS Model From Scratch ---------------------------------- - -`tts/glow_tts.py `_ - -.. 
code-block:: python - - # hydra_runner calls hydra.main and is useful for multi-node experiments - @hydra_runner(config_path="conf", config_name="glow_tts") - def main(cfg): - trainer = pl.Trainer(**cfg.trainer) - model = GlowTTSModel(cfg=cfg.model, trainer=trainer) - trainer.fit(model) - -Hydra makes every aspect of the NeMo model, including the PyTorch Lightning Trainer, customizable from the command line. - -.. code-block:: bash - - python NeMo/examples/tts/glow_tts.py \ - trainer.accelerator=gpu \ - trainer.devices=4 \ - trainer.max_epochs=400 \ - ... - train_dataset=/path/to/train/data \ - validation_datasets=/path/to/val/data \ - model.train_ds.batch_size = 64 \ - -.. note:: Training NeMo TTS models from scratch can take days or weeks so it is highly recommended to use multiple GPUs and multiple nodes with the PyTorch Lightning Trainer. - -Using State-Of-The-Art Pre-trained TTS Model --------------------------------------------- - -Generate speech using models trained on `LJSpeech `, -around 24 hours of single speaker data. - -See this `TTS notebook `_ -for a full tutorial on generating speech with NeMo, PyTorch Lightning, and Hydra. - -.. 
code-block:: python - - # load pretrained spectrogram model - spec_gen = SpecModel.from_pretrained("GlowTTS-22050Hz").cuda() - - # load pretrained Generators - vocoder = WaveGlowModel.from_pretrained("WaveGlow-22050Hz").cuda() - - - def infer(spec_gen_model, vocder_model, str_input): - with torch.no_grad(): - parsed = spec_gen.parse(text_to_generate) - spectrogram = spec_gen.generate_spectrogram(tokens=parsed) - audio = vocoder.convert_spectrogram_to_audio(spec=spectrogram) - if isinstance(spectrogram, torch.Tensor): - spectrogram = spectrogram.to("cpu").numpy() - if len(spectrogram.shape) == 3: - spectrogram = spectrogram[0] - if isinstance(audio, torch.Tensor): - audio = audio.to("cpu").numpy() - return spectrogram, audio - - - text_to_generate = input("Input what you want the model to say: ") - spec, audio = infer(spec_gen, vocoder, text_to_generate) - -To see the available pretrained checkpoints: - -.. code-block:: python - - # spec generator - GlowTTSModel.list_available_models() - - # vocoder - WaveGlowModel.list_available_models() - -NeMo TTS Model Under the Hood ------------------------------ - -Any aspect of TTS training or model architecture design can easily -be customized with PyTorch Lightning since every NeMo model is a LightningModule. - -`glow_tts.py `_ - -.. code-block:: python - - class GlowTTSModel(SpectrogramGenerator): - """ - GlowTTS model used to generate spectrograms from text - Consists of a text encoder and an invertible spectrogram decoder - """ - - ... 
- # NeMo models come with neural type checking - @typecheck( - input_types={ - "x": NeuralType(("B", "T"), TokenIndex()), - "x_lengths": NeuralType(("B"), LengthsType()), - "y": NeuralType(("B", "D", "T"), MelSpectrogramType(), optional=True), - "y_lengths": NeuralType(("B"), LengthsType(), optional=True), - "gen": NeuralType(optional=True), - "noise_scale": NeuralType(optional=True), - "length_scale": NeuralType(optional=True), - } - ) - def forward(self, *, x, x_lengths, y=None, y_lengths=None, gen=False, noise_scale=0.3, length_scale=1.0): - if gen: - return self.glow_tts.generate_spect( - text=x, text_lengths=x_lengths, noise_scale=noise_scale, length_scale=length_scale - ) - else: - return self.glow_tts(text=x, text_lengths=x_lengths, spect=y, spect_lengths=y_lengths) - - ... - - def step(self, y, y_lengths, x, x_lengths): - z, y_m, y_logs, logdet, logw, logw_, y_lengths, attn = self( - x=x, x_lengths=x_lengths, y=y, y_lengths=y_lengths, gen=False - ) - - l_mle, l_length, logdet = self.loss( - z=z, - y_m=y_m, - y_logs=y_logs, - logdet=logdet, - logw=logw, - logw_=logw_, - x_lengths=x_lengths, - y_lengths=y_lengths, - ) - - loss = sum([l_mle, l_length]) - - return l_mle, l_length, logdet, loss, attn - - # PTL-specific methods - def training_step(self, batch, batch_idx): - y, y_lengths, x, x_lengths = batch - - y, y_lengths = self.preprocessor(input_signal=y, length=y_lengths) - - l_mle, l_length, logdet, loss, _ = self.step(y, y_lengths, x, x_lengths) - - self.log_dict({"l_mle": l_mle, "l_length": l_length, "logdet": logdet}, prog_bar=True) - return loss - - ... - -Neural Types in NeMo TTS ------------------------- - -NeMo Models and Neural Modules come with Neural Type checking. -Neural type checking is extremely useful when combining many different neural network architectures -for a production-grade application. - -.. 
code-block:: python - - @typecheck( - input_types={ - "x": NeuralType(("B", "T"), TokenIndex()), - "x_lengths": NeuralType(("B"), LengthsType()), - "y": NeuralType(("B", "D", "T"), MelSpectrogramType(), optional=True), - "y_lengths": NeuralType(("B"), LengthsType(), optional=True), - "gen": NeuralType(optional=True), - "noise_scale": NeuralType(optional=True), - "length_scale": NeuralType(optional=True), - } - ) - def forward(self, *, x, x_lengths, y=None, y_lengths=None, gen=False, noise_scale=0.3, length_scale=1.0): - ... - --------- - -Learn More -========== - -- Watch the `NVIDIA NeMo Intro Video `_ -- Watch the `PyTorch Lightning and NVIDIA NeMo Discussion Video `_ -- Visit the `NVIDIA NeMo Developer Website `_ -- Read the `NVIDIA NeMo PyTorch Blog `_ -- Download pre-trained `ASR `_, `NLP `_, and `TTS `_ models on `NVIDIA NGC `_ to quickly get started with NeMo. -- Become an expert on Building Conversational AI applications with our `tutorials `_, and `example scripts `_, -- See our `developer guide `_ for more information on core NeMo concepts, ASR/NLP/TTS collections, and the NeMo API. - -.. note:: NeMo tutorial notebooks can be run on `Google Colab `_. - -NVIDIA `NeMo `_ is actively being developed on GitHub. -`Contributions `_ are welcome! diff --git a/docs/_sources/ecosystem/bolts.rst.txt b/docs/_sources/ecosystem/bolts.rst.txt deleted file mode 100644 index 56c7768..0000000 --- a/docs/_sources/ecosystem/bolts.rst.txt +++ /dev/null @@ -1,92 +0,0 @@ -:orphan: - -Lightning Bolts -=============== - -`PyTorch Lightning Bolts `_, is our official collection -of prebuilt models across many research domains. - -.. code-block:: bash - - pip install lightning-bolts - -In bolts we have: - -- A collection of pretrained state-of-the-art models. -- A collection of models designed to bootstrap your research. -- A collection of callbacks, transforms, full datasets. -- All models work on CPUs, TPUs, GPUs and 16-bit precision. 
- ------------------ - -Quality control ---------------- -The Lightning community builds bolts and contributes them to Bolts. -The lightning team guarantees that contributions are: - -- Rigorously Tested (CPUs, GPUs, TPUs). -- Rigorously Documented. -- Standardized via PyTorch Lightning. -- Optimized for speed. -- Checked for correctness. - ---------- - -Example 1: Pretrained, prebuilt models --------------------------------------- - -.. code-block:: python - - from pl_bolts.models import VAE, GPT2, ImageGPT, PixelCNN - from pl_bolts.models.self_supervised import AMDIM, CPCV2, SimCLR, MocoV2 - from pl_bolts.models import LinearRegression, LogisticRegression - from pl_bolts.models.gans import GAN - from pl_bolts.callbacks import PrintTableMetricsCallback - from pl_bolts.datamodules import FashionMNISTDataModule, CIFAR10DataModule, ImagenetDataModule - ------------- - -Example 2: Extend for faster research -------------------------------------- -Bolts are contributed with benchmarks and continuous-integration tests. This means -you can trust the implementations and use them to bootstrap your research much faster. - -.. code-block:: python - - from pl_bolts.models import ImageGPT - from pl_bolts.self_supervised import SimCLR - - - class VideoGPT(ImageGPT): - def training_step(self, batch, batch_idx): - x, y = batch - x = _shape_input(x) - - logits = self.gpt(x) - simclr_features = self.simclr(x) - - # ----------------- - # do something new with GPT logits + simclr_features - # ----------------- - - loss = self.criterion(logits.view(-1, logits.size(-1)), x.view(-1).long()) - - self.log("loss", loss) - return loss - ----------- - -Example 3: Callbacks --------------------- -We also have a collection of callbacks. - -.. 
code-block:: python - - from pl_bolts.callbacks import PrintTableMetricsCallback - import pytorch_lightning as pl - - trainer = pl.Trainer(callbacks=[PrintTableMetricsCallback()]) - - # loss│train_loss│val_loss│epoch - # ────────────────────────────── - # 2.2541470527648926│2.2541470527648926│2.2158432006835938│0 diff --git a/docs/_sources/ecosystem/community_examples.rst.txt b/docs/_sources/ecosystem/community_examples.rst.txt deleted file mode 100644 index f535857..0000000 --- a/docs/_sources/ecosystem/community_examples.rst.txt +++ /dev/null @@ -1,36 +0,0 @@ -:orphan: - -Community Examples -================== - - -- `Lightning Bolts: Deep Learning components for extending PyTorch Lightning `_. -- `Lightning Flash: Your PyTorch AI Factory - Flash enables you to easily configure and run complex AI recipes `_. -- `Contextual Emotion Detection (DoubleDistilBert) `_ -- `Cotatron: Transcription-Guided Speech Encoder `_ -- `FasterRCNN object detection + Hydra `_ -- `Image Inpainting using Partial Convolutions `_ -- `MNIST on TPU `_ -- `NER (transformers, TPU) `_ -- `NeuralTexture (CVPR) `_ -- `Recurrent Attentive Neural Process `_ -- `Siamese Nets for One-shot Image Recognition `_ -- `Speech Transformers `_ -- `Transformers transfer learning (Huggingface) `_ -- `Transformers text classification `_ -- `VAE Library of over 18+ VAE flavors `_ -- `Transformers Question Answering (SQuAD) `_ -- `Atlas: End-to-End 3D Scene Reconstruction from Posed Images `_ -- `Self-Supervised Representation Learning (MoCo and BYOL) `_ -- `PyTorch-Forecasting: Time series forecasting package `_ -- `Transformers masked language modeling `_ -- `PyTorch Geometric examples with PyTorch Lightning and Hydra `_ -- `PyTorch Tabular: Deep learning with tabular data `_ -- `Asteroid: An audio source separation toolkit for researchers `_ - - -PyTorch Ecosystem Examples -========================== - -- `PyTorch Geometric: Deep learning on graphs and other irregular structures `_. 
-- `TorchIO, MONAI and Lightning for 3D medical image segmentation `_. diff --git a/docs/_sources/ecosystem/ecosystem-ci.rst.txt b/docs/_sources/ecosystem/ecosystem-ci.rst.txt deleted file mode 100644 index 04ff342..0000000 --- a/docs/_sources/ecosystem/ecosystem-ci.rst.txt +++ /dev/null @@ -1,30 +0,0 @@ -:orphan: - -Ecosystem CI -============ - -`Ecosystem CI `_ automates issue discovery for your projects against Lightning nightly and releases. -It is a lightweight repository that provides easy configuration of Continuous Integration running on CPUs and GPUs. -Any user who wants to keep their project aligned with current and future Lightning releases can use the Ecosystem CI to configure their integrations. -Read more: `Stay Ahead of Breaking Changes with the New Lightning Ecosystem CI `_ - --------------- - -*********************** -Integrate a New Project -*********************** - -Follow the instructions below to add a new project to the PyTorch Lightning ecosystem. - -1. Fork the ecosystem CI repository to be able to create a `new Pull Request `_ and work within a specific branch. -2. Create a new config file in ``configs/`` folder and call it ``.yaml``. -3. Define runtime for CPU and link the config for GPU: - For CPU integrations, list OS and Python version combination to be running with GitHub actions. - For GPU integrations, you only add the path to the config (OS/Linux and Python version is fixed) to be running with Azure pipelines. -4. Add a Contact to the ``.github/CODEOWNERS`` list for your organization folder or just a single project. -5. Create a Draft PR with all mentioned requirements. -6. Join our `Slack `_ (Optional) channel ``#alerts-ecosystem-ci`` to be notified if your project is breaking. - - -To learn more about Ecosystem CI, please refer to the `Ecosystem CI repo `_. -Also, note that some particular implementation details described above may evolve over time.
diff --git a/docs/_sources/ecosystem/flash.rst.txt b/docs/_sources/ecosystem/flash.rst.txt deleted file mode 100644 index 31c6e9d..0000000 --- a/docs/_sources/ecosystem/flash.rst.txt +++ /dev/null @@ -1,78 +0,0 @@ -:orphan: - -Lightning Flash -=============== - -`Lightning Flash `_ is a high-level deep learning framework for fast prototyping, baselining, fine-tuning, and solving deep learning problems. -Flash makes complex AI recipes for over 15 tasks across 7 data domains accessible to all. -It is built for beginners with a simple API that requires very little deep learning background, and for data scientists, Kagglers, applied ML practitioners, and deep learning researchers that -want a quick way to get a deep learning baseline with advanced features PyTorch Lightning offers. - -.. code-block:: bash - - pip install lightning-flash - ------------------ - -********************************* -Using Lightning Flash in 3 Steps! -********************************* - -1. Load your Data ------------------ - -All data loading in Flash is performed via a ``from_*`` classmethod of a ``DataModule``. -Which ``DataModule`` to use and which ``from_*`` methods are available depends on the task you want to perform. -For example, for image segmentation where your data is stored in folders, you would use the ``SemanticSegmentationData``'s `from_folders `_ method: - -.. code-block:: python - - from flash.image import SemanticSegmentationData - - dm = SemanticSegmentationData.from_folders( - train_folder="data/CameraRGB", - train_target_folder="data/CameraSeg", - val_split=0.1, - image_size=(256, 256), - num_classes=21, - ) - ------------- - -2. Configure your Model ------------------------ - -Our tasks come loaded with pre-trained backbones and (where applicable) heads. -You can view the available backbones to use with your task using `available_backbones `_. -Once you've chosen, create the model: - -.. 
code-block:: python - - from flash.image import SemanticSegmentation - - print(SemanticSegmentation.available_heads()) - # ['deeplabv3', 'deeplabv3plus', 'fpn', ..., 'unetplusplus'] - - print(SemanticSegmentation.available_backbones("fpn")) - # ['densenet121', ..., 'xception'] # + 113 models - - print(SemanticSegmentation.available_pretrained_weights("efficientnet-b0")) - # ['imagenet', 'advprop'] - - model = SemanticSegmentation(head="fpn", backbone="efficientnet-b0", pretrained="advprop", num_classes=dm.num_classes) - ------------- - -3. Finetune! ------------- - -.. code-block:: python - - from flash import Trainer - - trainer = Trainer(max_epochs=3) - trainer.finetune(model, datamodule=datamodule, strategy="freeze") - trainer.save_checkpoint("semantic_segmentation_model.pt") - - -To learn more about Lightning Flash, please refer to the `Lightning Flash documentation `_. diff --git a/docs/_sources/ecosystem/metrics.rst.txt b/docs/_sources/ecosystem/metrics.rst.txt deleted file mode 100644 index 8ec155f..0000000 --- a/docs/_sources/ecosystem/metrics.rst.txt +++ /dev/null @@ -1,93 +0,0 @@ -:orphan: - -TorchMetrics -============ - -`TorchMetrics `_ is a collection of machine learning metrics for distributed, -scalable PyTorch models and an easy-to-use API to create custom metrics. It has a collection of 60+ PyTorch metrics implementations and -is rigorously tested for all edge cases. - -.. code-block:: bash - - pip install torchmetrics - -In TorchMetrics, we offer the following benefits: - -- A standardized interface to increase reproducibility -- Reduced Boilerplate -- Distributed-training compatible -- Rigorously tested -- Automatic accumulation over batches -- Automatic synchronization across multiple devices - ------------------ - -Example 1: Functional Metrics ------------------------------ - -Below is a simple example for calculating the accuracy using the functional interface: - -.. 
code-block:: python - - import torch - import torchmetrics - - # simulate a classification problem - preds = torch.randn(10, 5).softmax(dim=-1) - target = torch.randint(5, (10,)) - - acc = torchmetrics.functional.accuracy(preds, target) - ------------- - -Example 2: Module Metrics -------------------------- - -The example below shows how to use the class-based interface: - -.. code-block:: python - - import torch - import torchmetrics - - # initialize metric - metric = torchmetrics.Accuracy() - - n_batches = 10 - for i in range(n_batches): - # simulate a classification problem - preds = torch.randn(10, 5).softmax(dim=-1) - target = torch.randint(5, (10,)) - # metric on current batch - acc = metric(preds, target) - print(f"Accuracy on batch {i}: {acc}") - - # metric on all batches using custom accumulation - acc = metric.compute() - print(f"Accuracy on all data: {acc}") - - # Reseting internal state such that metric ready for new data - metric.reset() - ------------- - -Example 3: TorchMetrics with Lightning --------------------------------------- - -The example below shows how to use a metric in your :doc:`LightningModule <../common/lightning_module>`: - -.. code-block:: python - - class MyModel(LightningModule): - def __init__(self): - ... - self.accuracy = torchmetrics.Accuracy() - - def training_step(self, batch, batch_idx): - x, y = batch - preds = self(x) - ... - # log step metric - self.accuracy(preds, y) - self.log("train_acc_step", self.accuracy, on_epoch=True) - ... diff --git a/docs/_sources/ecosystem/transformers.rst.txt b/docs/_sources/ecosystem/transformers.rst.txt deleted file mode 100644 index b20402a..0000000 --- a/docs/_sources/ecosystem/transformers.rst.txt +++ /dev/null @@ -1,47 +0,0 @@ -:orphan: - -Lightning Transformers -====================== - -`Lightning Transformers `_ offers a flexible interface for training and fine-tuning SOTA Transformer models -using the :doc:`PyTorch Lightning Trainer <../common/trainer>`. - -.. 
code-block:: bash - - pip install lightning-transformers - -In Lightning Transformers, we offer the following benefits: - -- Powered by `PyTorch Lightning `_ - Accelerators, custom Callbacks, Loggers, and high performance scaling with minimal changes. -- Backed by `HuggingFace Transformers `_ models and datasets, spanning multiple modalities and tasks within NLP/Audio and Vision. -- Task Abstraction for Rapid Research & Experimentation - Build your own custom transformer tasks across all modalities with little friction. -- Powerful config composition backed by `Hydra `_ - simply swap out models, optimizers, schedulers task, and many more configurations without touching the code. -- Seamless Memory and Speed Optimizations - Out-of-the-box training optimizations such as `DeepSpeed ZeRO `_ or `FairScale Sharded Training `_ with no code changes. - ------------------ - -Using Lightning-Transformers ----------------------------- - -Lightning Transformers has a collection of tasks for common NLP problems such as `language_modeling `_, -`translation `_ and more. To use, simply: - -1. Pick a task to train (passed to ``train.py`` as ``task=``) - -2. Pick a dataset (passed to ``train.py`` as ``dataset=``) - -3. Customize the backbone, optimizer, or any component within the config - -4. Add any :doc:`Lightning supported parameters and optimizations <../common/trainer>` - -.. code-block:: bash - - python train.py \ - task= \ - dataset= - backbone.pretrained_model_name_or_path= # Optionally change the HF backbone - optimizer= # Optionally specify optimizer (Default AdamW) - trainer. # Optionally specify Lightning trainer arguments - - -To learn more about Lightning Transformers, please refer to the `Lightning Transformers documentation `_. 
diff --git a/docs/_sources/expertise_levels.rst.txt b/docs/_sources/expertise_levels.rst.txt deleted file mode 100644 index 9b563f7..0000000 --- a/docs/_sources/expertise_levels.rst.txt +++ /dev/null @@ -1,298 +0,0 @@ -:orphan: - -Level up -======== -Learn enough Lightning to match the level of expertise required by your research or job. - -.. join_slack:: - :align: left - :margin: 30 - ----- - -Basic skills ------------- -Learn the basics of model development with Lightning. Researchers and machine learning engineers should start here. - - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Level 1: Train a model - :description: Learn the basics of training a model. - :button_link: model/train_model_basic.html - :col_css: col-md-6 - :height: 150 - :tag: basic - -.. displayitem:: - :header: Level 2: Add a validation and test set - :description: Add validation and test sets to avoid over/underfitting. - :button_link: levels/basic_level_2.html - :col_css: col-md-6 - :height: 150 - :tag: basic - -.. displayitem:: - :header: Level 3: Use pretrained models - :description: Learn how to use pretrained models with Lightning - :button_link: advanced/transfer_learning.html - :col_css: col-md-6 - :height: 150 - :tag: basic - -.. displayitem:: - :header: Level 4: Enable script parameters - :description: Add parameters to your script so you can run from the commandline. - :button_link: common/hyperparameters.html - :col_css: col-md-6 - :height: 150 - :tag: basic - -.. displayitem:: - :header: Level 5: Understand and visualize your model - :description: Remove bottlenecks and visualize your model - :button_link: levels/basic_level_5.html - :col_css: col-md-6 - :height: 150 - :tag: basic - -.. displayitem:: - :description: Use your model for predictions. - :header: Level 6: Predict with your model - :button_link: levels/core_level_6.html - :col_css: col-md-6 - :height: 150 - :tag: basic - -.. raw:: html - -
-
- ----- - -Intermediate skills -------------------- -Learn to scale up your models and enable collaborative model development at academic or industry research labs. - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Level 7: Interactive cloud development - :description: Learn how to access GPUs and TPUs on the cloud. - :button_link: levels/intermediate_level_7.html - :col_css: col-md-6 - :height: 150 - :tag: intermediate - -.. displayitem:: - :header: Level 8: Train in the background on the cloud - :description: Learn how to run models on the cloud in the background. - :button_link: levels/intermediate_level_8.html - :col_css: col-md-6 - :height: 150 - :tag: intermediate - -.. displayitem:: - :header: Level 9: Modularize your projects - :description: Create DataModules to enable dataset reusability. - :col_css: col-md-6 - :button_link: levels/intermediate_level_9.html - :height: 150 - :tag: intermediate - -.. displayitem:: - :header: Level 10: Understand your model - :description: Use advanced visuals to find the best performing model. - :col_css: col-md-6 - :button_link: levels/intermediate_level_10.html - :height: 150 - :tag: intermediate - -.. displayitem:: - :header: Level 11: Explore SOTA scaling techniques - :description: Explore SOTA techniques to help convergence, stability and scalability. - :col_css: col-md-6 - :button_link: levels/intermediate_level_11.html - :height: 150 - :tag: intermediate - -.. displayitem:: - :header: Level 12: Deploy your models - :description: Learn how to deploy your models with optimizations like ONNX and torchscript. - :col_css: col-md-6 - :button_link: levels/intermediate_level_12.html - :height: 150 - :tag: intermediate - -.. displayitem:: - :header: Level 13: Optimize training speed - :description: Use tools ranging from advanced profilers to mixed precision to train bigger models, faster. - :col_css: col-md-6 - :button_link: levels/intermediate_level_13.html - :height: 150 - :tag: intermediate - -.. displayitem:: - :header: Level 14: Run on on-prem clusters - :description: Run on a custom on-prem cluster or SLURM cluster.
- :col_css: col-md-6 - :button_link: levels/intermediate_level_14.html - :height: 150 - :tag: intermediate - -.. raw:: html - -
-
- ----- - -Advanced skills ---------------- -Configure all aspects of Lightning for advanced usecases. - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Level 15: Customize configs to run in production - :description: Enable composable YAMLs - :col_css: col-md-6 - :button_link: levels/advanced_level_15.html - :height: 150 - :tag: advanced - -.. displayitem:: - :header: Level 16: Customize the trainer - :description: Inject custom code into the trainer and modify the progress bar. - :col_css: col-md-6 - :button_link: levels/advanced_level_16.html - :height: 150 - :tag: advanced - -.. displayitem:: - :header: Level 17: Own the training loop - :description: Learn all the ways of owning your raw PyTorch loops with Lightning. - :col_css: col-md-6 - :button_link: levels/advanced_level_17.html - :height: 150 - :tag: advanced - -.. displayitem:: - :header: Level 18: Enable advanced checkpointing - :description: Enable composable or cloud based checkpoints. - :col_css: col-md-6 - :button_link: levels/advanced_level_18.html - :height: 150 - :tag: advanced - -.. displayitem:: - :header: Level 19: Explore IPUs - :description: Explore Intelligence Processing Unit (IPU) for model scaling. - :col_css: col-md-6 - :button_link: levels/advanced_level_19.html - :height: 150 - :tag: advanced - -.. displayitem:: - :header: Level 20: Explore HPUs - :description: Explore Habana Gaudi Processing Unit (HPU) for model scaling. - :col_css: col-md-6 - :button_link: levels/advanced_level_20.html - :height: 150 - :tag: advanced - -.. displayitem:: - :header: Level 21: Master TPUs - :description: Master TPUs and run on cloud TPUs. - :col_css: col-md-6 - :button_link: levels/advanced_level_21.html - :height: 150 - :tag: advanced - -.. displayitem:: - :header: Level 22: Reach 1 trillion parameters on GPUs - :description: Scale to 1 trillion params on GPUs. - :col_css: col-md-6 - :button_link: levels/advanced_level_22.html - :height: 150 - :tag: advanced - -.. raw:: html - -
-
- ----- - -Expert skills -------------- -Customize and extend Lightning for things like custom hardware or distributed strategies. - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Level 23: Extend the Lightning CLI - :description: Extend the functionality of the Lightning CLI. - :col_css: col-md-6 - :button_link: levels/expert_level_23.html - :height: 150 - :tag: expert - -.. displayitem:: - :header: Level 24: Integrate a custom cluster - :description: Integrate a custom cluster into Lightning. - :col_css: col-md-6 - :button_link: levels/expert_level_24.html - :height: 150 - :tag: expert - -.. displayitem:: - :header: Level 25: Explore fault-tolerance in-depth - :description: Understand the details of fault-tolerance. - :col_css: col-md-6 - :button_link: clouds/fault_tolerant_training_faq.html - :height: 150 - :tag: expert - -.. displayitem:: - :header: Level 26: Make your own profiler - :description: Make your own profiler. - :col_css: col-md-6 - :button_link: tuning/profiler_expert.html - :height: 150 - :tag: expert - -.. displayitem:: - :header: Level 27: Add a new accelerator or Strategy - :description: Integrate a new accelerator or distributed strategy. - :col_css: col-md-6 - :button_link: levels/expert_level_27.html - :height: 150 - :tag: expert - -.. raw:: html - -
-
diff --git a/docs/_sources/extensions/accelerator.rst.txt b/docs/_sources/extensions/accelerator.rst.txt deleted file mode 100644 index dd5a067..0000000 --- a/docs/_sources/extensions/accelerator.rst.txt +++ /dev/null @@ -1,130 +0,0 @@ -.. _accelerator: - -########### -Accelerator -########### - -The Accelerator connects a Lightning Trainer to arbitrary hardware (CPUs, GPUs, TPUs, IPUs, ...). -Currently there are accelerators for: - -- CPU -- :doc:`GPU <../accelerators/gpu>` -- :doc:`TPU <../accelerators/tpu>` -- :doc:`IPU <../accelerators/ipu>` -- :doc:`HPU <../accelerators/hpu>` - -The Accelerator is part of the Strategy which manages communication across multiple devices (distributed communication). -Whenever the Trainer, the loops or any other component in Lightning needs to talk to hardware, it calls into the Strategy and the Strategy calls into the Accelerator. - -.. image:: https://pl-public-data.s3.amazonaws.com/docs/static/images/strategies/overview.jpeg - :alt: Illustration of the Strategy as a composition of the Accelerator and several plugins - -We expose Accelerators and Strategies mainly for expert users who want to extend Lightning to work with new -hardware and distributed training or clusters. - - ----------- - -Create a Custom Accelerator ---------------------------- - -Here is how you create a new Accelerator. -Let's pretend we want to integrate the fictional XPU accelerator and we have access to its hardware through a library -``xpulib``. - -.. 
code-block:: python - - import xpulib - - - class XPUAccelerator(Accelerator): - """Experimental support for XPU, optimized for large-scale machine learning.""" - - @staticmethod - def parse_devices(devices: Any) -> Any: - # Put parsing logic here how devices can be passed into the Trainer - # via the `devices` argument - return devices - - @staticmethod - def get_parallel_devices(devices: Any) -> Any: - # Here, convert the device indices to actual device objects - return [torch.device("xpu", idx) for idx in devices] - - @staticmethod - def auto_device_count() -> int: - # Return a value for auto-device selection when `Trainer(devices="auto")` - return xpulib.available_devices() - - @staticmethod - def is_available() -> bool: - return xpulib.is_available() - - def get_device_stats(self, device: Union[str, torch.device]) -> Dict[str, Any]: - # Return optional device statistics for loggers - return {} - - -Finally, add the XPUAccelerator to the Trainer: - -.. code-block:: python - - from pytorch_lightning import Trainer - - accelerator = XPUAccelerator() - trainer = Trainer(accelerator=accelerator, devices=2) - - -:doc:`Learn more about Strategies <../extensions/strategy>` and how they interact with the Accelerator. - - ----------- - -Registering Accelerators ------------------------- - -If you wish to switch to a custom accelerator from the CLI without code changes, you can implement the :meth:`~pytorch_lightning.accelerators.accelerator.Accelerator.register_accelerators` class method to register your new accelerator under a shorthand name like so: - -.. code-block:: python - - class XPUAccelerator(Accelerator): - ... - - @classmethod - def register_accelerators(cls, accelerator_registry): - accelerator_registry.register( - "xpu", - cls, - description=f"XPU Accelerator - optimized for large-scale machine learning.", - ) - -Now, this is possible: - -.. 
code-block:: python - - trainer = Trainer(accelerator="xpu") - -Or if you are using the Lightning CLI, for example: - -.. code-block:: bash - - python train.py fit --trainer.accelerator=xpu --trainer.devices=2 - - ----------- - -Accelerator API ---------------- - -.. currentmodule:: pytorch_lightning.accelerators - -.. autosummary:: - :nosignatures: - :template: classtemplate.rst - - Accelerator - CPUAccelerator - GPUAccelerator - HPUAccelerator - IPUAccelerator - TPUAccelerator diff --git a/docs/_sources/extensions/callbacks.rst.txt b/docs/_sources/extensions/callbacks.rst.txt deleted file mode 100644 index 6def5ee..0000000 --- a/docs/_sources/extensions/callbacks.rst.txt +++ /dev/null @@ -1,408 +0,0 @@ -.. role:: hidden - :class: hidden-section - -.. _callbacks: - -######## -Callback -######## - -.. raw:: html - - - -| - -A callback is a self-contained program that can be reused across projects. - -Lightning has a callback system to execute them when needed. Callbacks should capture NON-ESSENTIAL -logic that is NOT required for your :doc:`lightning module <../common/lightning_module>` to run. - -Here's the flow of how the callback hooks are executed: - -.. raw:: html - - - -An overall Lightning system should have: - -1. Trainer for all engineering -2. LightningModule for all research code. -3. Callbacks for non-essential code. - -| - -Example: - -.. testcode:: - - from pytorch_lightning.callbacks import Callback - - - class MyPrintingCallback(Callback): - def on_train_start(self, trainer, pl_module): - print("Training is starting") - - def on_train_end(self, trainer, pl_module): - print("Training is ending") - - - trainer = Trainer(callbacks=[MyPrintingCallback()]) - -We successfully extended functionality without polluting our super clean -:doc:`lightning module <../common/lightning_module>` research code. - ------------ - -******** -Examples -******** -You can do pretty much anything with callbacks. - -- `Add a MLP to fine-tune self-supervised networks `_. 
-- `Find how to modify an image input to trick the classification result `_. -- `Interpolate the latent space of any variational model `_. -- `Log images to Tensorboard for any model `_. - - --------------- - -****************** -Built-in Callbacks -****************** -Lightning has a few built-in callbacks. - -.. note:: - For a richer collection of callbacks, check out our - `bolts library `_. - -.. currentmodule:: pytorch_lightning.callbacks - -.. autosummary:: - :nosignatures: - :template: classtemplate.rst - - BackboneFinetuning - BaseFinetuning - BasePredictionWriter - Callback - DeviceStatsMonitor - EarlyStopping - GradientAccumulationScheduler - LambdaCallback - LearningRateMonitor - ModelCheckpoint - ModelPruning - ModelSummary - ProgressBarBase - QuantizationAwareTraining - RichModelSummary - RichProgressBar - StochasticWeightAveraging - Timer - TQDMProgressBar - ----------- - -.. include:: callbacks_state.rst - ----------- - -************** -Best Practices -************** -The following are best practices when using/designing callbacks. - -1. Callbacks should be isolated in their functionality. -2. Your callback should not rely on the behavior of other callbacks in order to work properly. -3. Do not manually call methods from the callback. -4. Directly calling methods (eg. `on_validation_end`) is strongly discouraged. -5. Whenever possible, your callbacks should not depend on the order in which they are executed. - ------------ - -.. _callback_hooks: - -************ -Callback API -************ -Here is the full API of methods available in the Callback base class. - -The :class:`~pytorch_lightning.callbacks.Callback` class is the base for all the callbacks in Lightning just like the :class:`~pytorch_lightning.core.lightning.LightningModule` is the base for all models. -It defines a public interface that each callback implementation must follow, the key ones are: - -Properties -========== - -state_key -^^^^^^^^^ - -.. 
autoattribute:: pytorch_lightning.callbacks.Callback.state_key - :noindex: - - -Hooks -===== - -on_configure_sharded_model -^^^^^^^^^^^^^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_configure_sharded_model - :noindex: - -setup -^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.setup - :noindex: - -teardown -^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.teardown - :noindex: - -on_init_start -^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_init_start - :noindex: - -on_init_end -^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_init_end - :noindex: - -on_fit_start -^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_fit_start - :noindex: - -on_fit_end -^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_fit_end - :noindex: - -on_sanity_check_start -^^^^^^^^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_sanity_check_start - :noindex: - -on_sanity_check_end -^^^^^^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_sanity_check_end - :noindex: - -on_train_batch_start -^^^^^^^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_train_batch_start - :noindex: - -on_train_batch_end -^^^^^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_train_batch_end - :noindex: - -on_train_epoch_start -^^^^^^^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_train_epoch_start - :noindex: - -on_train_epoch_end -^^^^^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_train_epoch_end - :noindex: - -on_validation_epoch_start -^^^^^^^^^^^^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_validation_epoch_start - :noindex: - -on_validation_epoch_end -^^^^^^^^^^^^^^^^^^^^^^^ - -.. 
automethod:: pytorch_lightning.callbacks.Callback.on_validation_epoch_end - :noindex: - -on_test_epoch_start -^^^^^^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_test_epoch_start - :noindex: - -on_test_epoch_end -^^^^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_test_epoch_end - :noindex: - -on_predict_epoch_start -^^^^^^^^^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_predict_epoch_start - :noindex: - -on_predict_epoch_end -^^^^^^^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_predict_epoch_end - :noindex: - -.. automethod:: pytorch_lightning.callbacks.Callback.on_epoch_end - :noindex: - -on_validation_batch_start -^^^^^^^^^^^^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_validation_batch_start - :noindex: - -on_validation_batch_end -^^^^^^^^^^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_validation_batch_end - :noindex: - -on_test_batch_start -^^^^^^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_test_batch_start - :noindex: - -on_test_batch_end -^^^^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_test_batch_end - :noindex: - -on_predict_batch_start -^^^^^^^^^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_predict_batch_start - :noindex: - -on_predict_batch_end -^^^^^^^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_predict_batch_end - :noindex: - -on_train_start -^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_train_start - :noindex: - -on_train_end -^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_train_end - :noindex: - -on_validation_start -^^^^^^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_validation_start - :noindex: - -on_validation_end -^^^^^^^^^^^^^^^^^ - -.. 
automethod:: pytorch_lightning.callbacks.Callback.on_validation_end - :noindex: - -on_test_start -^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_test_start - :noindex: - -on_test_end -^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_test_end - :noindex: - -on_predict_start -^^^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_predict_start - :noindex: - -on_predict_end -^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_predict_end - :noindex: - -on_keyboard_interrupt -^^^^^^^^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_keyboard_interrupt - :noindex: - -on_exception -^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_exception - :noindex: - -state_dict -^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.state_dict - :noindex: - -on_save_checkpoint -^^^^^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_save_checkpoint - :noindex: - -load_state_dict -^^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.load_state_dict - :noindex: - -on_load_checkpoint -^^^^^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_load_checkpoint - :noindex: - -on_before_backward -^^^^^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_before_backward - :noindex: - -on_after_backward -^^^^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_after_backward - :noindex: - -on_before_optimizer_step -^^^^^^^^^^^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_before_optimizer_step - :noindex: - -on_before_zero_grad -^^^^^^^^^^^^^^^^^^^ - -.. 
automethod:: pytorch_lightning.callbacks.Callback.on_before_zero_grad - :noindex: diff --git a/docs/_sources/extensions/callbacks_state.rst.txt b/docs/_sources/extensions/callbacks_state.rst.txt deleted file mode 100644 index 0a104ca..0000000 --- a/docs/_sources/extensions/callbacks_state.rst.txt +++ /dev/null @@ -1,62 +0,0 @@ -******************* -Save Callback state -******************* - -Some callbacks require internal state in order to function properly. You can optionally -choose to persist your callback's state as part of model checkpoint files using -:meth:`~pytorch_lightning.callbacks.Callback.state_dict` and :meth:`~pytorch_lightning.callbacks.Callback.load_state_dict`. -Note that the returned state must be able to be pickled. - -When your callback is meant to be used only as a singleton callback then implementing the above two hooks is enough -to persist state effectively. However, if passing multiple instances of the callback to the Trainer is supported, then -the callback must define a :attr:`~pytorch_lightning.callbacks.Callback.state_key` property in order for Lightning -to be able to distinguish the different states when loading the callback state. This concept is best illustrated by -the following example. - -.. 
testcode:: - - class Counter(Callback): - def __init__(self, what="epochs", verbose=True): - self.what = what - self.verbose = verbose - self.state = {"epochs": 0, "batches": 0} - - @property - def state_key(self): - # note: we do not include `verbose` here on purpose - return self._generate_state_key(what=self.what) - - def on_train_epoch_end(self, *args, **kwargs): - if self.what == "epochs": - self.state["epochs"] += 1 - - def on_train_batch_end(self, *args, **kwargs): - if self.what == "batches": - self.state["batches"] += 1 - - def load_state_dict(self, state_dict): - self.state.update(state_dict) - - def state_dict(self): - return self.state.copy() - - - # two callbacks of the same type are being used - trainer = Trainer(callbacks=[Counter(what="epochs"), Counter(what="batches")]) - -A Lightning checkpoint from this Trainer with the two stateful callbacks will include the following information: - -.. code-block:: - - { - "state_dict": ..., - "callbacks": { - "Counter{'what': 'batches'}": {"batches": 32, "epochs": 0}, - "Counter{'what': 'epochs'}": {"batches": 0, "epochs": 2}, - ... - } - } - -The implementation of a :attr:`~pytorch_lightning.callbacks.Callback.state_key` is essential here. If it were missing, -Lightning would not be able to disambiguate the state for these two callbacks, and :attr:`~pytorch_lightning.callbacks.Callback.state_key` -by default only defines the class name as the key, e.g., here ``Counter``. diff --git a/docs/_sources/extensions/datamodules_state.rst.txt b/docs/_sources/extensions/datamodules_state.rst.txt deleted file mode 100644 index 61710d7..0000000 --- a/docs/_sources/extensions/datamodules_state.rst.txt +++ /dev/null @@ -1,15 +0,0 @@ -Save DataModule state -===================== -When a checkpoint is created, it asks every DataModule for their state. If your DataModule defines the *state_dict* and *load_state_dict* methods, the checkpoint will automatically track and restore your DataModules. - -.. 
code:: python - - class LitDataModule(pl.LightningDataModule): - def state_dict(self): - # track whatever you want here - state = {"current_train_batch_index": self.current_train_batch_index} - return state - - def load_state_dict(self, state_dict): - # restore the state based on what you tracked in (def state_dict) - self.current_train_batch_index = state_dict["current_train_batch_index"] diff --git a/docs/_sources/extensions/generated/pytorch_lightning.loggers.CSVLogger.rst.txt b/docs/_sources/extensions/generated/pytorch_lightning.loggers.CSVLogger.rst.txt deleted file mode 100644 index bd8ccbf..0000000 --- a/docs/_sources/extensions/generated/pytorch_lightning.loggers.CSVLogger.rst.txt +++ /dev/null @@ -1,15 +0,0 @@ -.. role:: hidden - :class: hidden-section -.. currentmodule:: pytorch_lightning.loggers - - -CSVLogger -========= - -.. autoclass:: CSVLogger - :members: - - -.. 
- autogenerated from source/_templates/classtemplate.rst - note it does not have :inherited-members: \ No newline at end of file diff --git a/docs/_sources/extensions/generated/pytorch_lightning.loggers.MLFlowLogger.rst.txt b/docs/_sources/extensions/generated/pytorch_lightning.loggers.MLFlowLogger.rst.txt deleted file mode 100644 index 2eaf478..0000000 --- a/docs/_sources/extensions/generated/pytorch_lightning.loggers.MLFlowLogger.rst.txt +++ /dev/null @@ -1,15 +0,0 @@ -.. role:: hidden - :class: hidden-section -.. currentmodule:: pytorch_lightning.loggers - - -MLFlowLogger -============ - -.. autoclass:: MLFlowLogger - :members: - - -.. - autogenerated from source/_templates/classtemplate.rst - note it does not have :inherited-members: \ No newline at end of file diff --git a/docs/_sources/extensions/generated/pytorch_lightning.loggers.NeptuneLogger.rst.txt b/docs/_sources/extensions/generated/pytorch_lightning.loggers.NeptuneLogger.rst.txt deleted file mode 100644 index e9da513..0000000 --- a/docs/_sources/extensions/generated/pytorch_lightning.loggers.NeptuneLogger.rst.txt +++ /dev/null @@ -1,15 +0,0 @@ -.. role:: hidden - :class: hidden-section -.. currentmodule:: pytorch_lightning.loggers - - -NeptuneLogger -============= - -.. autoclass:: NeptuneLogger - :members: - - -.. - autogenerated from source/_templates/classtemplate.rst - note it does not have :inherited-members: \ No newline at end of file diff --git a/docs/_sources/extensions/generated/pytorch_lightning.loggers.TensorBoardLogger.rst.txt b/docs/_sources/extensions/generated/pytorch_lightning.loggers.TensorBoardLogger.rst.txt deleted file mode 100644 index 6bcd4a2..0000000 --- a/docs/_sources/extensions/generated/pytorch_lightning.loggers.TensorBoardLogger.rst.txt +++ /dev/null @@ -1,15 +0,0 @@ -.. role:: hidden - :class: hidden-section -.. currentmodule:: pytorch_lightning.loggers - - -TensorBoardLogger -================= - -.. autoclass:: TensorBoardLogger - :members: - - -.. 
- autogenerated from source/_templates/classtemplate.rst - note it does not have :inherited-members: \ No newline at end of file diff --git a/docs/_sources/extensions/generated/pytorch_lightning.loggers.WandbLogger.rst.txt b/docs/_sources/extensions/generated/pytorch_lightning.loggers.WandbLogger.rst.txt deleted file mode 100644 index 3dcb424..0000000 --- a/docs/_sources/extensions/generated/pytorch_lightning.loggers.WandbLogger.rst.txt +++ /dev/null @@ -1,15 +0,0 @@ -.. role:: hidden - :class: hidden-section -.. currentmodule:: pytorch_lightning.loggers - - -WandbLogger -=========== - -.. autoclass:: WandbLogger - :members: - - -.. - autogenerated from source/_templates/classtemplate.rst - note it does not have :inherited-members: \ No newline at end of file diff --git a/docs/_sources/extensions/logging.rst.txt b/docs/_sources/extensions/logging.rst.txt deleted file mode 100644 index 8bad452..0000000 --- a/docs/_sources/extensions/logging.rst.txt +++ /dev/null @@ -1,410 +0,0 @@ -:orphan: - -.. testsetup:: * - - from pytorch_lightning import loggers as pl_loggers - -.. role:: hidden - :class: hidden-section - -.. _logging: - - -####### -Logging -####### - -***************** -Supported Loggers -***************** - -The following are loggers we support: - -.. currentmodule:: pytorch_lightning.loggers - -.. autosummary:: - :toctree: generated - :nosignatures: - :template: classtemplate.rst - - CometLogger - CSVLogger - MLFlowLogger - NeptuneLogger - TensorBoardLogger - WandbLogger - - -The above loggers will normally plot an additional chart (**global_step VS epoch**). Depending on the loggers you use, there might be some additional charts too. - -By default, Lightning uses ``TensorBoard`` logger under the hood, and stores the logs to a directory (by default in ``lightning_logs/``). - -.. testcode:: - - from pytorch_lightning import Trainer - - # Automatically logs to a directory (by default ``lightning_logs/``) - trainer = Trainer() - -To see your logs: - -.. 
code-block:: bash - - tensorboard --logdir=lightning_logs/ - -To visualize tensorboard in a jupyter notebook environment, run the following command in a jupyter cell: - -.. code-block:: bash - - %reload_ext tensorboard - %tensorboard --logdir=lightning_logs/ - -You can also pass a custom Logger to the :class:`~pytorch_lightning.trainer.trainer.Trainer`. - -.. testcode:: - - from pytorch_lightning import loggers as pl_loggers - - tb_logger = pl_loggers.TensorBoardLogger(save_dir="logs/") - trainer = Trainer(logger=tb_logger) - -Choose from any of the others such as MLflow, Comet, Neptune, WandB, etc. - -.. testcode:: - - comet_logger = pl_loggers.CometLogger(save_dir="logs/") - trainer = Trainer(logger=comet_logger) - -To use multiple loggers, simply pass in a ``list`` or ``tuple`` of loggers. - -.. testcode:: - - tb_logger = pl_loggers.TensorBoardLogger(save_dir="logs/") - comet_logger = pl_loggers.CometLogger(save_dir="logs/") - trainer = Trainer(logger=[tb_logger, comet_logger]) - -.. note:: - - By default, Lightning logs every 50 steps. Use Trainer flags to :ref:`logging_frequency`. - -.. note:: - - By default, all loggers log to ``os.getcwd()``. You can change the logging path using - ``Trainer(default_root_dir="/your/path/to/save/checkpoints")`` without instantiating a logger. - ----------- - -****************************** -Logging from a LightningModule -****************************** - -Lightning offers automatic log functionalities for logging scalars, or manual logging for anything else. - -Automatic Logging -================= - -Use the :meth:`~pytorch_lightning.core.lightning.LightningModule.log` or :meth:`~pytorch_lightning.core.lightning.LightningModule.log_dict` -methods to log from anywhere in a :doc:`LightningModule <../common/lightning_module>` and :doc:`callbacks <../extensions/callbacks>`. - -.. 
code-block:: python - - def training_step(self, batch, batch_idx): - self.log("my_metric", x) - - - # or a dict to get multiple metrics on the same plot if the logger supports it - def training_step(self, batch, batch_idx): - self.log("performance", {"acc": acc, "recall": recall}) - - - # or a dict to log all metrics at once with individual plots - def training_step(self, batch, batch_idx): - self.log_dict({"acc": acc, "recall": recall}) - -.. note:: - Everything explained below applies to both the :meth:`~pytorch_lightning.core.lightning.LightningModule.log` and :meth:`~pytorch_lightning.core.lightning.LightningModule.log_dict` methods. - -Depending on where the :meth:`~pytorch_lightning.core.lightning.LightningModule.log` method is called, Lightning auto-determines -the correct logging mode for you. Of course, you can override the default behavior by manually setting the -:meth:`~pytorch_lightning.core.lightning.LightningModule.log` parameters. - -.. code-block:: python - - def training_step(self, batch, batch_idx): - self.log("my_loss", loss, on_step=True, on_epoch=True, prog_bar=True, logger=True) - -The :meth:`~pytorch_lightning.core.lightning.LightningModule.log` method has a few options: - -* ``on_step``: Logs the metric at the current step. -* ``on_epoch``: Automatically accumulates and logs at the end of the epoch. -* ``prog_bar``: Logs to the progress bar (Default: ``False``). -* ``logger``: Logs to the logger like ``Tensorboard``, or any other custom logger passed to the :class:`~pytorch_lightning.trainer.trainer.Trainer` (Default: ``True``). -* ``reduce_fx``: Reduction function over step values for end of epoch. Uses :meth:`torch.mean` by default. -* ``enable_graph``: If True, will not auto detach the graph. -* ``sync_dist``: If True, reduces the metric across devices. Use with care as this may lead to a significant communication overhead. -* ``sync_dist_group``: The DDP group to sync across. 
-* ``add_dataloader_idx``: If True, appends the index of the current dataloader to the name (when using multiple dataloaders). If False, user needs to give unique names for each dataloader to not mix the values. -* ``batch_size``: Current batch size used for accumulating logs logged with ``on_epoch=True``. This will be directly inferred from the loaded batch, but for some data structures you might need to explicitly provide it. -* ``rank_zero_only``: Whether the value will be logged only on rank 0. This will prevent synchronization which would produce a deadlock as not all processes would perform this log call. - -.. list-table:: Default behavior of logging in Callback or LightningModule - :widths: 50 25 25 - :header-rows: 1 - - * - Hook - - on_step - - on_epoch - * - on_train_start, on_train_epoch_start, on_train_epoch_end, training_epoch_end - - False - - True - * - on_before_backward, on_after_backward, on_before_optimizer_step, on_before_zero_grad - - True - - False - * - on_train_batch_start, on_train_batch_end, training_step, training_step_end - - True - - False - * - on_validation_start, on_validation_epoch_start, on_validation_epoch_end, validation_epoch_end - - False - - True - * - on_validation_batch_start, on_validation_batch_end, validation_step, validation_step_end - - False - - True - - -.. note:: - - While logging tensor metrics with ``on_epoch=True`` inside step-level hooks and using mean-reduction (default) to accumulate the metrics across the current epoch, Lightning tries to extract the - batch size from the current batch. If multiple possible batch sizes are found, a warning is logged and if it fails to extract the batch size from the current batch, which is possible if - the batch is a custom structure/collection, then an error is raised. To avoid this, you can specify the ``batch_size`` inside the ``self.log(... batch_size=batch_size)`` call. - - .. 
code-block:: python - - def training_step(self, batch, batch_idx): - # extracts the batch size from `batch` - self.log("train_loss", loss, on_epoch=True) - - - def validation_step(self, batch, batch_idx): - # uses `batch_size=10` - self.log("val_loss", loss, batch_size=10) - -.. note:: - - - The above config for ``validation`` applies for ``test`` hooks as well. - - - Setting ``on_epoch=True`` will cache all your logged values during the full training epoch and perform a - reduction in ``on_train_epoch_end``. We recommend using `TorchMetrics `_, when working with custom reduction. - - - Setting both ``on_step=True`` and ``on_epoch=True`` will create two keys per metric you log with - suffix ``_step`` and ``_epoch`` respectively. You can refer to these keys e.g. in the `monitor` - argument of :class:`~pytorch_lightning.callbacks.model_checkpoint.ModelCheckpoint` or in the graphs plotted to the logger of your choice. - - -If your work requires to log in an unsupported method, please open an issue with a clear description of why it is blocking you. - - -Manual Logging Non-Scalar Artifacts -=================================== - -If you want to log anything that is not a scalar, like histograms, text, images, etc., you may need to use the logger object directly. - -.. code-block:: python - - def training_step(self): - ... - # the logger you used (in this case tensorboard) - tensorboard = self.logger.experiment - tensorboard.add_image() - tensorboard.add_histogram(...) - tensorboard.add_figure(...) - - ----------- - -******************** -Make a Custom Logger -******************** - -You can implement your own logger by writing a class that inherits from :class:`~pytorch_lightning.loggers.logger.Logger`. -Use the :func:`~pytorch_lightning.loggers.logger.rank_zero_experiment` and :func:`~pytorch_lightning.utilities.rank_zero.rank_zero_only` decorators to make sure that only the first process in DDP training creates the experiment and logs the data respectively. - -.. 
testcode:: - - from pytorch_lightning.loggers.logger import Logger, rank_zero_experiment - from pytorch_lightning.utilities.distributed import rank_zero_only - - - class MyLogger(Logger): - @property - def name(self): - return "MyLogger" - - @property - def version(self): - # Return the experiment version, int or str. - return "0.1" - - @rank_zero_only - def log_hyperparams(self, params): - # params is an argparse.Namespace - # your code to record hyperparameters goes here - pass - - @rank_zero_only - def log_metrics(self, metrics, step): - # metrics is a dictionary of metric names and values - # your code to record metrics goes here - pass - - @rank_zero_only - def save(self): - # Optional. Any code necessary to save logger data goes here - pass - - @rank_zero_only - def finalize(self, status): - # Optional. Any code that needs to be run after training - # finishes goes here - pass - -If you write a logger that may be useful to others, please send -a pull request to add it to Lightning! - ----------- - -.. _logging_frequency: - - -************************* -Control Logging Frequency -************************* - -Logging frequency -================= - -It may slow down training to log on every single batch. By default, Lightning logs every 50 rows, or 50 training steps. -To change this behaviour, set the ``log_every_n_steps`` :class:`~pytorch_lightning.trainer.trainer.Trainer` flag. - -.. testcode:: - - k = 10 - trainer = Trainer(log_every_n_steps=k) - - -Log Writing Frequency -===================== - -Individual logger implementations determine their flushing frequency. For example, on the -:class:`~pytorch_lightning.loggers.csv_logs.CSVLogger` you can set the flag ``flush_logs_every_n_steps``. - ----------- - -************ -Progress Bar -************ - -You can add any metric to the progress bar using :meth:`~pytorch_lightning.core.lightning.LightningModule.log` -method, setting ``prog_bar=True``. - - -.. 
code-block:: python - - def training_step(self, batch, batch_idx): - self.log("my_loss", loss, prog_bar=True) - - -You can learn more about progress bars supported by Lightning :doc:`here <../common/progress_bar>`. - -Modifying the Progress Bar -========================== - -The progress bar by default already includes the training loss and version number of the experiment -if you are using a logger. These defaults can be customized by overriding the -:meth:`~pytorch_lightning.callbacks.progress.base.ProgressBarBase.get_metrics` hook in your progress bar callback. - -.. code-block:: python - - from pytorch_lightning.callbacks.progress import TQDMProgressBar - - - class CustomProgressBar(TQDMProgressBar): - def get_metrics(self, *args, **kwargs): - # don't show the version number - items = super().get_metrics(*args, **kwargs) - items.pop("v_num", None) - return items - - ----------- - - -************************* -Configure Console Logging -************************* - -Lightning logs useful information about the training process and user warnings to the console. -You can retrieve the Lightning console logger and change it to your liking. For example, adjust the logging level -or redirect output for certain modules to log files: - -.. testcode:: - - import logging - - # configure logging at the root level of Lightning - logging.getLogger("pytorch_lightning").setLevel(logging.ERROR) - - # configure logging on module level, redirect to file - logger = logging.getLogger("pytorch_lightning.core") - logger.addHandler(logging.FileHandler("core.log")) - -Read more about custom Python logging `here `_. - - ----------- - -*********************** -Logging Hyperparameters -*********************** - -When training a model, it is useful to know what hyperparams went into that model. -When Lightning creates a checkpoint, it stores a key ``"hyper_parameters"`` with the hyperparams. - -.. 
code-block:: python - - lightning_checkpoint = torch.load(filepath, map_location=lambda storage, loc: storage) - hyperparams = lightning_checkpoint["hyper_parameters"] - -Some loggers also allow logging the hyperparams used in the experiment. For instance, -when using the ``TensorBoardLogger``, all hyperparams will show -in the `hparams tab `_. - -.. note:: - If you want to track a metric in the tensorboard hparams tab, log scalars to the key ``hp_metric``. If tracking multiple metrics, initialize ``TensorBoardLogger`` with ``default_hp_metric=False`` and call ``log_hyperparams`` only once with your metric keys and initial values. Subsequent updates can simply be logged to the metric keys. Refer to the examples below for setting up proper hyperparams metrics tracking within the :doc:`LightningModule <../common/lightning_module>`. - - .. code-block:: python - - # Using default_hp_metric - def validation_step(self, batch, batch_idx): - self.log("hp_metric", some_scalar) - - - # Using custom or multiple metrics (default_hp_metric=False) - def on_train_start(self): - self.logger.log_hyperparams(self.hparams, {"hp/metric_1": 0, "hp/metric_2": 0}) - - - def validation_step(self, batch, batch_idx): - self.log("hp/metric_1", some_scalar_1) - self.log("hp/metric_2", some_scalar_2) - - In the example, using ``"hp/"`` as a prefix allows for the metrics to be grouped under "hp" in the tensorboard scalar tab where you can collapse them. - ------------ - -*************************** -Managing Remote Filesystems -*************************** - -Lightning supports saving logs to a variety of filesystems, including local filesystems and several cloud storage providers. - -Check out the :doc:`Remote Filesystems <../common/remote_fs>` doc for more info. diff --git a/docs/_sources/extensions/loops.rst.txt b/docs/_sources/extensions/loops.rst.txt deleted file mode 100644 index c24d4ce..0000000 --- a/docs/_sources/extensions/loops.rst.txt +++ /dev/null @@ -1,461 +0,0 @@ -.. 
_loop-customization-extensions: - - -Loops -===== - -Loops let advanced users swap out the default gradient descent optimization loop at the core of Lightning with a different optimization paradigm. - -The Lightning Trainer is built on top of the standard gradient descent optimization loop which works for 90%+ of machine learning use cases: - -.. code-block:: python - - for i, batch in enumerate(dataloader): - x, y = batch - y_hat = model(x) - loss = loss_function(y_hat, y) - optimizer.zero_grad() - loss.backward() - optimizer.step() - -However, some new research use cases such as meta-learning, active learning, recommendation systems, etc., require a different loop structure. -For example here is a simple loop that guides the weight updates with a loss from a special validation split: - -.. code-block:: python - - for i, batch in enumerate(train_dataloader): - x, y = batch - y_hat = model(x) - loss = loss_function(y_hat, y) - optimizer.zero_grad() - loss.backward() - - val_loss = 0 - for i, val_batch in enumerate(val_dataloader): - x, y = val_batch - y_hat = model(x) - val_loss += loss_function(y_hat, y) - - scale_gradients(model, 1 / val_loss) - optimizer.step() - - -With Lightning Loops, you can customize to non-standard gradient descent optimizations to get the same loop above: - -.. code-block:: python - - trainer = Trainer() - trainer.fit_loop.epoch_loop = MyGradientDescentLoop() - -Think of this as swapping out the engine in a car! - ----------- - -Understanding the Default Trainer Loop --------------------------------------- - -The Lightning :class:`~pytorch_lightning.trainer.trainer.Trainer` automates the standard optimization loop which every PyTorch user is familiar with: - -.. 
code-block:: python - - for i, batch in enumerate(dataloader): - x, y = batch - y_hat = model(x) - loss = loss_function(y_hat, y) - optimizer.zero_grad() - loss.backward() - optimizer.step() - -The core research logic is simply shifted to the :class:`~pytorch_lightning.core.lightning.LightningModule`: - -.. code-block:: python - - for i, batch in enumerate(dataloader): - # x, y = batch moved to training_step - # y_hat = model(x) moved to training_step - # loss = loss_function(y_hat, y) moved to training_step - loss = lightning_module.training_step(batch, i) - - # Lightning handles automatically: - optimizer.zero_grad() - loss.backward() - optimizer.step() - -Under the hood, the above loop is implemented using the :class:`~pytorch_lightning.loops.base.Loop` API like so: - -.. code-block:: python - - class DefaultLoop(Loop): - def advance(self, batch, i): - loss = lightning_module.training_step(batch, i) - optimizer.zero_grad() - loss.backward() - optimizer.step() - - def run(self, dataloader): - for i, batch in enumerate(dataloader): - self.advance(batch, i) - -Defining a loop within a class interface instead of hard-coding a raw Python for/while loop has several benefits: - -1. You can have full control over the data flow through loops. -2. You can add new loops and nest as many of them as you want. -3. If needed, the state of a loop can be :ref:`saved and resumed <persisting loop state>`. -4. New hooks can be injected at any point. - -.. image:: https://pl-public-data.s3.amazonaws.com/docs/static/images/loops/epoch-loop-steps.gif - :alt: Animation showing how to convert a standard training loop to a Lightning loop - ----------- - -.. _override-default-loops-extensions: - -Overriding the default Loops ----------------------------- - -The fastest way to get started with loops is to override the functionality of an existing loop.
-Lightning has 4 main loops, which rely on: :class:`~pytorch_lightning.loops.fit_loop.FitLoop` for fitting (training and validating), -:class:`~pytorch_lightning.loops.dataloader.evaluation_loop.EvaluationLoop` for validating or testing, and -:class:`~pytorch_lightning.loops.dataloader.prediction_loop.PredictionLoop` for predicting. - -For simple changes that don't require a custom loop, you can modify each of these loops. - -Each loop has a series of methods that can be modified. -For example with the :class:`~pytorch_lightning.loops.fit_loop.FitLoop`: - -.. code-block:: python - - from pytorch_lightning.loops import FitLoop - - - class MyLoop(FitLoop): - def advance(self): - """Advance from one iteration to the next.""" - - def on_advance_end(self): - """Do something at the end of an iteration.""" - - def on_run_end(self): - """Do something when the loop ends.""" - -A full list with all built-in loops and subloops can be found :ref:`here <loop-structure-extensions>`. - -To add your own modifications to a loop, simply subclass an existing loop class and override what you need. -Here is a simple example of how to add a new hook: - -.. code-block:: python - - from pytorch_lightning.loops import FitLoop - - - class CustomFitLoop(FitLoop): - def advance(self): - # ... whatever code before - - # pass anything you want to the hook - self.trainer.call_hook("my_new_hook", *args, **kwargs) - - # ... whatever code after - -Now simply attach the correct loop in the trainer directly: - -.. code-block:: python - - trainer = Trainer(...) - trainer.fit_loop = CustomFitLoop() - - # fit() now uses the new FitLoop! - trainer.fit(...) - - # the equivalent for validate() - val_loop = CustomValLoop() - trainer = Trainer() - trainer.validate_loop = val_loop - trainer.validate(...) - -Now your code is FULLY flexible and you can still leverage ALL the best parts of Lightning! - -..
image:: https://pl-public-data.s3.amazonaws.com/docs/static/images/loops/replace-fit-loop.gif - :alt: Animation showing how to replace a loop on the Trainer - ----------- - -Creating a New Loop From Scratch --------------------------------- - -You can also go wild and implement a full loop from scratch by sub-classing the :class:`~pytorch_lightning.loops.base.Loop` base class. -You will need to override a minimum of two things: - -.. code-block:: python - - from pytorch_lightning.loops import Loop - - - class MyFancyLoop(Loop): - @property - def done(self): - """Provide a condition to stop the loop.""" - - def advance(self): - """ - Access your dataloader/s in whatever way you want. - Do your fancy optimization things. - Call the LightningModule methods at your leisure. - """ - -Finally, attach it to the :class:`~pytorch_lightning.trainer.trainer.Trainer`: - -.. code-block:: python - - trainer = Trainer(...) - trainer.fit_loop = MyFancyLoop() - - # fit() now uses your fancy loop! - trainer.fit(...) - -But beware: Loop customization gives you more power and full control over the Trainer and with great power comes great responsibility. -We recommend that you familiarize yourself with :ref:`overriding the default loops <override-default-loops-extensions>` first before you start building a new loop from the ground up. - ----------- - -Loop API --------- -Here is the full API of methods available in the Loop base class. - -The :class:`~pytorch_lightning.loops.base.Loop` class is the base of all loops in the same way as the :class:`~pytorch_lightning.core.lightning.LightningModule` is the base of all models. -It defines a public interface that each loop implementation must follow; the key members are: - -Properties -^^^^^^^^^^ - -done -~~~~ - -.. autoattribute:: pytorch_lightning.loops.base.Loop.done - :noindex: - -skip (optional) -~~~~~~~~~~~~~~~ - -.. autoattribute:: pytorch_lightning.loops.base.Loop.skip - :noindex: - -Methods -^^^^^^^ - -reset (optional) -~~~~~~~~~~~~~~~~ - -..
automethod:: pytorch_lightning.loops.base.Loop.reset - :noindex: - -advance -~~~~~~~ - -.. automethod:: pytorch_lightning.loops.base.Loop.advance - :noindex: - -run (optional) -~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.loops.base.Loop.run - :noindex: - - ----------- - -Subloops --------- - -When you want to customize nested loops within loops, use the :meth:`~pytorch_lightning.loops.base.Loop.replace` method: - -.. code-block:: python - - # This takes care of properly instantiating the new Loop and setting all references - trainer.fit_loop.replace(epoch_loop=MyEpochLoop) - # Trainer runs the fit loop with your new epoch loop! - trainer.fit(model) - -Alternatively, for more fine-grained control, use the :meth:`~pytorch_lightning.loops.base.Loop.connect` method: - -.. code-block:: python - - # Optional: stitch back the trainer arguments - epoch_loop = MyEpochLoop(trainer.fit_loop.epoch_loop.min_steps, trainer.fit_loop.epoch_loop.max_steps) - # Optional: connect children loops as they might have existing state - epoch_loop.connect(trainer.fit_loop.epoch_loop.batch_loop, trainer.fit_loop.epoch_loop.val_loop) - # Instantiate and connect the loop. - trainer.fit_loop.connect(epoch_loop=epoch_loop) - trainer.fit(model) - -More about the built-in loops and how they are composed is explained in the next section. - -.. image:: https://pl-public-data.s3.amazonaws.com/docs/static/images/loops/connect-epoch-loop.gif - :alt: Animation showing how to connect a custom subloop - ----------- - -Built-in Loops --------------- - -.. _loop-structure-extensions: - -The training loop in Lightning is called *fit loop* and is actually a combination of several loops. -Here is what the structure would look like in plain Python: - -.. 
code-block:: python - - # FitLoop - for epoch in range(max_epochs): - - # TrainingEpochLoop - for batch_idx, batch in enumerate(train_dataloader): - - # TrainingBatchLoop - for split_batch in tbptt_split(batch): - - # OptimizerLoop - for optimizer_idx, opt in enumerate(optimizers): - - loss = lightning_module.training_step(batch, batch_idx, optimizer_idx) - ... - - # ValidationEpochLoop - for batch_idx, batch in enumerate(val_dataloader): - lightning_module.validation_step(batch, batch_idx, optimizer_idx) - ... - - -Each of these :code:`for`-loops represents a class implementing the :class:`~pytorch_lightning.loops.base.Loop` interface. - - -.. list-table:: Trainer entry points and associated loops - :widths: 25 75 - :header-rows: 1 - - * - Built-in loop - - Description - * - :class:`~pytorch_lightning.loops.fit_loop.FitLoop` - - The :class:`~pytorch_lightning.loops.fit_loop.FitLoop` is the top-level loop where training starts. - It simply counts the epochs and iterates from one to the next by calling :code:`TrainingEpochLoop.run()` in its :code:`advance()` method. - * - :class:`~pytorch_lightning.loops.epoch.training_epoch_loop.TrainingEpochLoop` - - The :class:`~pytorch_lightning.loops.epoch.training_epoch_loop.TrainingEpochLoop` is the one that iterates over the dataloader that the user returns in their :meth:`~pytorch_lightning.core.lightning.LightningModule.train_dataloader` method. - Its main responsibilities are calling the :code:`*_epoch_start` and :code:`*_epoch_end` hooks, accumulating outputs if the user request them in one of these hooks, and running validation at the requested interval. - The validation is carried out by yet another loop, :class:`~pytorch_lightning.loops.epoch.validation_epoch_loop.ValidationEpochLoop`. - - In the :code:`run()` method, the training epoch loop could in theory simply call the :code:`LightningModule.training_step` already and perform the optimization. 
- However, Lightning has built-in support for automatic optimization with multiple optimizers and on top of that also supports :ref:`TBPTT `. - For this reason there are actually two more loops nested under :class:`~pytorch_lightning.loops.epoch.training_epoch_loop.TrainingEpochLoop`. - * - :class:`~pytorch_lightning.loops.batch.training_batch_loop.TrainingBatchLoop` - - The responsibility of the :class:`~pytorch_lightning.loops.batch.training_batch_loop.TrainingBatchLoop` is to split a batch given by the :class:`~pytorch_lightning.loops.epoch.training_epoch_loop.TrainingEpochLoop` along the time-dimension and iterate over the list of splits. - It also keeps track of the hidden state *hiddens* returned by the training step. - By default, when truncated back-propagation through time (TBPTT) is turned off, this loop does not do anything except redirect the call to the :class:`~pytorch_lightning.loops.optimization.optimizer_loop.OptimizerLoop`. - Read more about :ref:`TBPTT `. - * - :class:`~pytorch_lightning.loops.optimization.optimizer_loop.OptimizerLoop` - - The :class:`~pytorch_lightning.loops.optimization.optimizer_loop.OptimizerLoop` iterates over one or multiple optimizers and for each one it calls the :meth:`~pytorch_lightning.core.lightning.LightningModule.training_step` method with the batch, the current batch index and the optimizer index if multiple optimizers are requested. - It is the leaf node in the tree of loops and performs the actual optimization (forward, zero grad, backward, optimizer step). - * - :class:`~pytorch_lightning.loops.optimization.manual_loop.ManualOptimization` - - Substitutes the :class:`~pytorch_lightning.loops.optimization.optimizer_loop.OptimizerLoop` in case of :doc:`manual optimization <../model/manual_optimization>` and implements the manual optimization step. 
- * - :class:`~pytorch_lightning.loops.dataloader.evaluation_loop.EvaluationLoop` - - The :class:`~pytorch_lightning.loops.dataloader.evaluation_loop.EvaluationLoop` is the top-level loop where validation/testing starts. - It simply iterates over each evaluation dataloader from one to the next by calling :code:`EvaluationEpochLoop.run()` in its :code:`advance()` method. - * - :class:`~pytorch_lightning.loops.dataloader.prediction_loop.PredictionLoop` - - The :class:`~pytorch_lightning.loops.dataloader.prediction_loop.PredictionLoop` is the top-level loop where prediction starts. - It simply iterates over each prediction dataloader from one to the next by calling :code:`PredictionEpochLoop.run()` in its :code:`advance()` method. - - ----------- - -Available Loops in Lightning Flash ----------------------------------- - -`Active Learning `__ is a machine learning practice in which the user interacts with the learner in order to provide new labels when required. - -You can find a real use case in `Lightning Flash `_. - -Flash implements the :code:`ActiveLearningLoop` that you can use together with the :code:`ActiveLearningDataModule` to label new data on the fly. -To run the following demo, install Flash and `BaaL `__ first: - -.. code-block:: bash - - pip install lightning-flash baal - -.. code-block:: python - - import torch - - import flash - from flash.core.classification import Probabilities - from flash.core.data.utils import download_data - from flash.image import ImageClassificationData, ImageClassifier - from flash.image.classification.integrations.baal import ActiveLearningDataModule, ActiveLearningLoop - - # 1. Create the DataModule - download_data("https://pl-flash-data.s3.amazonaws.com/hymenoptera_data.zip", "./data") - - # Implement the research use-case where we mask labels from labelled dataset. 
- datamodule = ActiveLearningDataModule( - ImageClassificationData.from_folders(train_folder="data/hymenoptera_data/train/", batch_size=2), - initial_num_labels=5, - val_split=0.1, - ) - - # 2. Build the task - head = torch.nn.Sequential( - torch.nn.Dropout(p=0.1), - torch.nn.Linear(512, datamodule.num_classes), - ) - model = ImageClassifier(backbone="resnet18", head=head, num_classes=datamodule.num_classes, output=Probabilities()) - - - # 3.1 Create the trainer - trainer = flash.Trainer(max_epochs=3) - - # 3.2 Create the active learning loop and connect it to the trainer - active_learning_loop = ActiveLearningLoop(label_epoch_frequency=1) - active_learning_loop.connect(trainer.fit_loop) - trainer.fit_loop = active_learning_loop - - # 3.3 Finetune - trainer.finetune(model, datamodule=datamodule, strategy="freeze") - - # 4. Predict what's on a few images! ants or bees? - predictions = model.predict("data/hymenoptera_data/val/bees/65038344_52a45d090d.jpg") - print(predictions) - - # 5. Save the model! - trainer.save_checkpoint("image_classification_model.pt") - -Here is the `Active Learning Loop example `_ and the `code for the active learning loop `_. - - ----------- - -Advanced Examples ------------------ - - -.. list-table:: Ready-to-run loop examples and tutorials - :widths: 25 75 - :header-rows: 1 - - * - Link to Example - - Description - * - `K-fold Cross Validation `_ - - `KFold / Cross Validation `__ is a machine learning practice in which the training dataset is being partitioned into ``num_folds`` complementary subsets. - One cross validation round will perform fitting where one fold is left out for validation and the other folds are used for training. - To reduce variability, once all rounds are performed using the different folds, the trained models are ensembled and their predictions are - averaged when estimating the model's predictive performance on the test dataset. 
- * - `Yielding Training Step `_ - - This loop enables you to write the :meth:`~pytorch_lightning.core.lightning.LightningModule.training_step` hook - as a Python Generator for automatic optimization with multiple optimizers, i.e., you can :code:`yield` loss - values from it instead of returning them. This can enable more elegant and expressive implementations, as - shown with a GAN in this example. - - ----------- - -Advanced Features ------------------ - -Next: :doc:`Advanced loop features <../extensions/loops_advanced>` diff --git a/docs/_sources/extensions/loops_advanced.rst.txt b/docs/_sources/extensions/loops_advanced.rst.txt deleted file mode 100644 index e71c827..0000000 --- a/docs/_sources/extensions/loops_advanced.rst.txt +++ /dev/null @@ -1,41 +0,0 @@ -:orphan: - -Loops (Advanced) -================ - -.. _persisting loop state: - -Persisting the State of Loops ------------------------------ - -.. note:: - - This is an experimental feature and is not activated by default. - Set the environment variable ``PL_FAULT_TOLERANT_TRAINING=1`` to enable saving the progress of loops. - Read more about :doc:`fault-tolerant training <../clouds/fault_tolerant_training>`. - -A powerful property of the class-based loop interface is that it can own an internal state. -Loop instances can save their state to the checkpoint through corresponding hooks and if implemented accordingly, resume the state of execution at the appropriate place. -This design is particularly interesting for fault-tolerant training which is an experimental feature released in Lightning v1.5. - -The two hooks :meth:`~pytorch_lightning.loops.base.Loop.on_save_checkpoint` and :meth:`~pytorch_lightning.loops.base.Loop.on_load_checkpoint` function very similarly to how LightningModules and Callbacks save and load state. - -..
code-block:: python - - def on_save_checkpoint(self): - state_dict["iteration"] = self.iteration - return state_dict - - - def on_load_checkpoint(self, state_dict): - self.iteration = state_dict["iteration"] - -When the Trainer is restarting from a checkpoint (e.g., through :code:`trainer.fit(ckpt_path=...)`), the loop exposes a boolean attribute :attr:`~pytorch_lightning.loops.base.Loop.restarting`. -Based around the value of this variable, the user can write the loop in such a way that it can restart from an arbitrary point given the state loaded from the checkpoint. -For example, the implementation of the :meth:`~pytorch_lightning.loops.base.Loop.reset` method could look like this given our previous example: - -.. code-block:: python - - def reset(self): - if not self.restarting: - self.iteration = 0 diff --git a/docs/_sources/extensions/plugins.rst.txt b/docs/_sources/extensions/plugins.rst.txt deleted file mode 100644 index 392a072..0000000 --- a/docs/_sources/extensions/plugins.rst.txt +++ /dev/null @@ -1,119 +0,0 @@ -.. _plugins: - -####### -Plugins -####### - -.. include:: ../links.rst - -Plugins allow custom integrations to the internals of the Trainer such as custom precision, checkpointing or -cluster environment implementation. - -Under the hood, the Lightning Trainer is using plugins in the training routine, added automatically -depending on the provided Trainer arguments. - -There are three types of Plugins in Lightning with different responsibilities: - -- Precision Plugins -- CheckpointIO Plugins -- Cluster Environments - -You can make the Trainer use one or multiple plugins by adding it to the ``plugins`` argument like so: - -.. code-block:: python - - trainer = Trainer(plugins=[plugin1, plugin2, ...]) - - -By default, the plugins get selected based on the rest of the Trainer settings such as the ``strategy``. - - ------------ - -.. 
_precision-plugins: - -***************** -Precision Plugins -***************** - -We provide precision plugins for you to benefit from numerical representations with lower precision than -32-bit floating-point or higher precision, such as 64-bit floating-point. - -.. code-block:: python - - # Training with 16-bit precision - trainer = Trainer(precision=16) - -The full list of built-in precision plugins is listed below. - -.. currentmodule:: pytorch_lightning.plugins.precision - -.. autosummary:: - :nosignatures: - :template: classtemplate.rst - - ApexMixedPrecisionPlugin - DeepSpeedPrecisionPlugin - DoublePrecisionPlugin - FullyShardedNativeMixedPrecisionPlugin - HPUPrecisionPlugin - IPUPrecisionPlugin - MixedPrecisionPlugin - NativeMixedPrecisionPlugin - PrecisionPlugin - ShardedNativeMixedPrecisionPlugin - TPUBf16PrecisionPlugin - TPUPrecisionPlugin - -More information regarding precision with Lightning can be found :ref:`here ` - ------------ - - -.. _checkpoint_io_plugins: - -******************** -CheckpointIO Plugins -******************** - -As part of our commitment to extensibility, we have abstracted Lightning's checkpointing logic into the :class:`~pytorch_lightning.plugins.io.CheckpointIO` plugin. -With this, you have the ability to customize the checkpointing logic to match the needs of your infrastructure. - -Below is a list of built-in plugins for checkpointing. - -.. currentmodule:: pytorch_lightning.plugins.io - -.. autosummary:: - :nosignatures: - :template: classtemplate.rst - - CheckpointIO - HPUCheckpointIO - TorchCheckpointIO - XLACheckpointIO - -Learn more about custom checkpointing with Lightning :ref:`here `. - ------------ - - -.. _cluster_environment_plugins: - -******************** -Cluster Environments -******************** - -You can define the interface of your own cluster environment based on the requirements of your infrastructure. - -.. currentmodule:: pytorch_lightning.plugins.environments - -.. 
autosummary:: - :nosignatures: - :template: classtemplate.rst - - ClusterEnvironment - KubeflowEnvironment - LightningEnvironment - LSFEnvironment - SLURMEnvironment - TorchElasticEnvironment diff --git a/docs/_sources/extensions/strategy.rst.txt b/docs/_sources/extensions/strategy.rst.txt deleted file mode 100644 index ad9d799..0000000 --- a/docs/_sources/extensions/strategy.rst.txt +++ /dev/null @@ -1,122 +0,0 @@ -:orphan: - -################### -What is a Strategy? -################### - -Strategy controls the model distribution across training, evaluation, and prediction to be used by the :doc:`Trainer <../common/trainer>`. It can be controlled by passing different -strategy with aliases (``"ddp"``, ``"ddp_spawn"``, ``"deepspeed"`` and so on) as well as a custom strategy to the ``strategy`` parameter for Trainer. - -The Strategy in PyTorch Lightning handles the following responsibilities: - -* Launch and teardown of training processes (if applicable). -* Setup communication between processes (NCCL, GLOO, MPI, and so on). -* Provide a unified communication interface for reduction, broadcast, and so on. -* Owns the :class:`~pytorch_lightning.core.lightning.LightningModule` -* Handles/owns optimizers and schedulers. - - -:class:`~pytorch_lightning.strategies.strategy.Strategy` also manages the accelerator, precision, and checkpointing plugins. - -.. image:: https://pl-public-data.s3.amazonaws.com/docs/static/images/strategies/overview.jpeg - :alt: Illustration of the Strategy as a composition of the Accelerator and several plugins - -We expose Strategies mainly for expert users that want to extend Lightning for new hardware support or new distributed backends (e.g. a backend not yet supported by `PyTorch `_ itself). - - ----- - -########################### -Enable Different Strategies -########################### - -.. 
code-block:: python - - # Training with the DistributedDataParallel strategy on 4 GPUs - trainer = Trainer(strategy="ddp", accelerator="gpu", devices=4) - - # Training with the custom DistributedDataParallel strategy on 4 GPUs - trainer = Trainer(strategy=DDPStrategy(...), accelerator="gpu", devices=4) - - # Training with the DDP Spawn strategy using auto accelerator selection - trainer = Trainer(strategy="ddp_spawn", accelerator="auto", devices=4) - - # Training with the DeepSpeed strategy on available GPUs - trainer = Trainer(strategy="deepspeed", accelerator="gpu", devices="auto") - - # Training with the DDP strategy using 3 CPU processes - trainer = Trainer(strategy="ddp", accelerator="cpu", devices=3) - - # Training with the DDP Spawn strategy on 8 TPU cores - trainer = Trainer(strategy="ddp_spawn", accelerator="tpu", devices=8) - - # Training with the default IPU strategy on 8 IPUs - trainer = Trainer(accelerator="ipu", devices=8) - ----- - -######################## -Create a Custom Strategy -######################## - -Expert users may choose to extend an existing strategy by overriding its methods. - -.. code-block:: python - - from pytorch_lightning.strategies import DDPStrategy - - - class CustomDDPStrategy(DDPStrategy): - def configure_ddp(self): - self.model = MyCustomDistributedDataParallel( - self.model, - device_ids=..., - ) - -or by subclassing the base class :class:`~pytorch_lightning.strategies.Strategy` to create new ones. These custom strategies -can then be passed into the ``Trainer`` directly via the ``strategy`` parameter. - -.. code-block:: python - - # custom plugins - trainer = Trainer(strategy=CustomDDPStrategy()) - - # fully custom accelerator and plugins - accelerator = MyAccelerator() - precision_plugin = MyPrecisionPlugin() - training_strategy = CustomDDPStrategy(accelerator=accelerator, precision_plugin=precision_plugin) - trainer = Trainer(strategy=training_strategy) - - -The complete list of built-in strategies is listed below. 
- ----- - -############################# -Available Training Strategies -############################# - -.. currentmodule:: pytorch_lightning.strategies - -.. autosummary:: - :nosignatures: - :template: classtemplate.rst - - BaguaStrategy - DDP2Strategy - DDPFullyShardedStrategy - DDPShardedStrategy - DDPSpawnShardedStrategy - DDPSpawnStrategy - DDPStrategy - DataParallelStrategy - DeepSpeedStrategy - HorovodStrategy - HPUParallelStrategy - IPUStrategy - ParallelStrategy - SingleDeviceStrategy - SingleHPUStrategy - SingleTPUStrategy - Strategy - TPUSpawnStrategy diff --git a/docs/_sources/guides/data.rst.txt b/docs/_sources/guides/data.rst.txt deleted file mode 100644 index 72dba27..0000000 --- a/docs/_sources/guides/data.rst.txt +++ /dev/null @@ -1,423 +0,0 @@ -:orphan: - -.. _data: - -############# -Managing Data -############# - -**************************** -Data Containers in Lightning -**************************** - -There are a few different data containers used in Lightning: - -.. list-table:: Data objects - :widths: 20 80 - :header-rows: 1 - - * - Object - - Definition - * - :class:`~torch.utils.data.Dataset` - - The PyTorch :class:`~torch.utils.data.Dataset` represents a map from keys to data samples. - * - :class:`~torch.utils.data.IterableDataset` - - The PyTorch :class:`~torch.utils.data.IterableDataset` represents a stream of data. - * - :class:`~torch.utils.data.DataLoader` - - The PyTorch :class:`~torch.utils.data.DataLoader` represents a Python iterable over a Dataset. - * - :class:`~pytorch_lightning.core.datamodule.LightningDataModule` - - A :class:`~pytorch_lightning.core.datamodule.LightningDataModule` is simply a collection of: training DataLoader(s), validation DataLoader(s), test DataLoader(s) and predict DataLoader(s), along with the matching transforms and data processing/downloads steps required. - - -Why Use LightningDataModule? 
-============================ - -The :class:`~pytorch_lightning.core.datamodule.LightningDataModule` was designed as a way of decoupling data-related hooks from the :class:`~pytorch_lightning.core.lightning.LightningModule` so you can develop dataset-agnostic models. The :class:`~pytorch_lightning.core.datamodule.LightningDataModule` makes it easy to hot swap different Datasets with your model, so you can test it and benchmark it across domains. It also makes sharing and reusing the exact data splits and transforms across projects possible. - -Read :ref:`this ` for more details on LightningDataModule. - ---------- - -.. _multiple-dataloaders: - -***************** -Multiple Datasets -***************** - -There are a few ways to pass multiple Datasets to Lightning: - -1. Create a DataLoader that iterates over multiple Datasets under the hood. -2. In the training loop, you can pass multiple DataLoaders as a dict or list/tuple, and Lightning will - automatically combine the batches from different DataLoaders. -3. In the validation, test, or prediction loops, you have the option to return multiple DataLoaders as a list/tuple, which Lightning will call sequentially, - or to combine the DataLoaders using :class:`~pytorch_lightning.trainer.supporters.CombinedLoader`, in which case Lightning will - automatically combine the batches from different DataLoaders. - - -Using LightningDataModule -========================= - -You can set more than one :class:`~torch.utils.data.DataLoader` in your :class:`~pytorch_lightning.core.datamodule.LightningDataModule` using its DataLoader hooks -and Lightning will use the correct one. - -.. testcode:: - - class DataModule(LightningDataModule): - - ...
- - def train_dataloader(self): - return DataLoader(self.train_dataset) - - def val_dataloader(self): - return [DataLoader(self.val_dataset_1), DataLoader(self.val_dataset_2)] - - def test_dataloader(self): - return DataLoader(self.test_dataset) - - def predict_dataloader(self): - return DataLoader(self.predict_dataset) - - -Using LightningModule Hooks -=========================== - -Concatenated Dataset --------------------- - -For training with multiple Datasets, you can create a :class:`~torch.utils.data.DataLoader` class -which wraps your multiple Datasets using :class:`~torch.utils.data.ConcatDataset`. This, of course, -also works for testing, validation, and prediction Datasets. - -.. testcode:: - - from torch.utils.data import ConcatDataset - - - class LitModel(LightningModule): - def train_dataloader(self): - concat_dataset = ConcatDataset(datasets.ImageFolder(traindir_A), datasets.ImageFolder(traindir_B)) - - loader = DataLoader( - concat_dataset, batch_size=args.batch_size, shuffle=True, num_workers=args.workers, pin_memory=True - ) - return loader - - def val_dataloader(self): - # SAME - ... - - def test_dataloader(self): - # SAME - ... - - -Return Multiple DataLoaders ---------------------------- - -You can set multiple DataLoaders in your :class:`~pytorch_lightning.core.lightning.LightningModule`, and Lightning will take care of batch combination. - -For more details, refer to :paramref:`~pytorch_lightning.trainer.trainer.Trainer.multiple_trainloader_mode` - -.. testcode:: - - class LitModel(LightningModule): - def train_dataloader(self): - - loader_a = DataLoader(range(6), batch_size=4) - loader_b = DataLoader(range(15), batch_size=5) - - # pass loaders as a dict. This will create batches like this: - # {'a': batch from loader_a, 'b': batch from loader_b} - loaders = {"a": loader_a, "b": loader_b} - - # OR: - # pass loaders as sequence. 
This will create batches like this: - # [batch from loader_a, batch from loader_b] - loaders = [loader_a, loader_b] - - return loaders - -Furthermore, Lightning also supports nested lists and dicts (or a combination). - -.. testcode:: - - class LitModel(LightningModule): - def train_dataloader(self): - - loader_a = DataLoader(range(8), batch_size=4) - loader_b = DataLoader(range(16), batch_size=2) - - return {"a": loader_a, "b": loader_b} - - def training_step(self, batch, batch_idx): - # access a dictionary with a batch from each DataLoader - batch_a = batch["a"] - batch_b = batch["b"] - - -.. testcode:: - - class LitModel(LightningModule): - def train_dataloader(self): - - loader_a = DataLoader(range(8), batch_size=4) - loader_b = DataLoader(range(16), batch_size=4) - loader_c = DataLoader(range(32), batch_size=4) - loader_d = DataLoader(range(64), batch_size=4) - - # pass loaders as a nested dict. This will create batches like this: - loaders = {"loaders_a_b": [loader_a, loader_b], "loaders_c_d": {"c": loader_c, "d": loader_d}} - return loaders - - def training_step(self, batch, batch_idx): - # access the data - batch_a_b = batch["loaders_a_b"] - batch_c_d = batch["loaders_c_d"] - - batch_a = batch_a_b[0] - batch_b = batch_a_b[1] - - batch_c = batch_c_d["c"] - batch_d = batch_c_d["d"] - -Alternatively, you can also pass in a :class:`~pytorch_lightning.trainer.supporters.CombinedLoader` containing multiple DataLoaders. - -..
testcode:: - - from pytorch_lightning.trainer.supporters import CombinedLoader - - - def train_dataloader(self): - loader_a = DataLoader() - loader_b = DataLoader() - loaders = {"a": loader_a, "b": loader_b} - combined_loader = CombinedLoader(loaders, mode="max_size_cycle") - return combined_loader - - - def training_step(self, batch, batch_idx): - batch_a = batch["a"] - batch_b = batch["b"] - - -Multiple Validation/Test/Predict DataLoaders -============================================ - -For validation, test and predict DataLoaders, you can pass a single DataLoader or a list of them. This optional named -parameter can be used in conjunction with any of the above use cases. You can choose to pass -the batches sequentially or simultaneously, as is done for the training step. -The default mode for these DataLoaders is sequential. Note that when using a sequence of DataLoaders you need -to add an additional argument ``dataloader_idx`` in their corresponding step specific hook. The corresponding loop will process -the DataLoaders in sequential order; that is, the first DataLoader will be processed completely, then the second one, and so on. - -Refer to the following for more details for the default sequential option: - -- :meth:`~pytorch_lightning.core.hooks.DataHooks.val_dataloader` -- :meth:`~pytorch_lightning.core.hooks.DataHooks.test_dataloader` -- :meth:`~pytorch_lightning.core.hooks.DataHooks.predict_dataloader` - -.. testcode:: - - def val_dataloader(self): - loader_1 = DataLoader() - loader_2 = DataLoader() - return [loader_1, loader_2] - - - def validation_step(self, batch, batch_idx, dataloader_idx): - ... - - -Evaluation DataLoaders are iterated over sequentially. If you want to iterate over them in parallel, PyTorch Lightning provides a :class:`~pytorch_lightning.trainer.supporters.CombinedLoader` object which supports collections of DataLoaders such as list, tuple, or dictionary. 
The DataLoaders can be accessed in the same way as the provided structure: - -.. testcode:: - - from pytorch_lightning.trainer.supporters import CombinedLoader - - - def val_dataloader(self): - loader_a = DataLoader() - loader_b = DataLoader() - loaders = {"a": loader_a, "b": loader_b} - combined_loaders = CombinedLoader(loaders, mode="max_size_cycle") - return combined_loaders - - - def validation_step(self, batch, batch_idx): - batch_a = batch["a"] - batch_b = batch["b"] - - -Evaluate with Additional DataLoaders -==================================== - -You can evaluate your models using additional DataLoaders even if the DataLoader-specific hooks haven't been defined within your -:class:`~pytorch_lightning.core.lightning.LightningModule`. For example, this would be the case if your test data -set was not available at the time your model was declared. Simply pass the test set to the :meth:`~pytorch_lightning.trainer.trainer.Trainer.test` method: - -.. code-block:: python - - # setup your DataLoader - test = DataLoader(...) - - # test (pass in the loader) - trainer.test(dataloaders=test) - --------------- - -******************************************** -Accessing DataLoaders within LightningModule -******************************************** - -In the case that you require access to the DataLoader or Dataset objects, DataLoaders for each step can be accessed using the ``Trainer`` object: - -.. testcode:: - - from pytorch_lightning import LightningModule - - - class Model(LightningModule): - def test_step(self, batch, batch_idx, dataloader_idx): - test_dl = self.trainer.test_dataloaders[dataloader_idx] - test_dataset = test_dl.dataset - test_sampler = test_dl.sampler - ... - # extract metadata, etc. from the dataset: - ... 
- -If you are using a :class:`~pytorch_lightning.trainer.supporters.CombinedLoader` object, which allows you to fetch batches from a collection of DataLoaders -simultaneously and supports collections of DataLoaders such as a list, tuple, or dictionary, the DataLoaders can be accessed using the same collection structure: - -.. code-block:: python - - from pytorch_lightning.trainer.supporters import CombinedLoader - - test_dl1 = ... - test_dl2 = ... - - # If you provided a list of DataLoaders: - - combined_loader = CombinedLoader([test_dl1, test_dl2]) - list_of_loaders = combined_loader.loaders - test_dl1 = list_of_loaders.loaders[0] - - - # If you provided dictionary of DataLoaders: - - combined_loader = CombinedLoader({"dl1": test_dl1, "dl2": test_dl2}) - dictionary_of_loaders = combined_loader.loaders - test_dl1 = dictionary_of_loaders["dl1"] - --------------- - -.. _sequential-data: - -*************** -Sequential Data -*************** - -Lightning has built-in support for dealing with sequential data. - - -Packed Sequences as Inputs -========================== - -When using :class:`~torch.nn.utils.rnn.PackedSequence`, do two things: - -1. Return either a padded tensor in the dataset or a list of variable-length tensors in the DataLoader's `collate_fn `_ (example shows the list implementation). -2. Pack the sequence in forward or training and validation steps depending on use case. - -| - -.. testcode:: - - # For use in DataLoader - def collate_fn(batch): - x = [item[0] for item in batch] - y = [item[1] for item in batch] - return x, y - - - # In LightningModule - def training_step(self, batch, batch_idx): - x = rnn.pack_sequence(batch[0], enforce_sorted=False) - y = rnn.pack_sequence(batch[1], enforce_sorted=False) - - -Truncated Backpropagation Through Time (TBPTT) -============================================== - -There are times when multiple backwards passes are needed for each batch. 
-For example, it may save memory to use **Truncated Backpropagation Through Time** when training RNNs. - -Lightning can handle TBPTT automatically via this flag. - -.. testcode:: - - from pytorch_lightning import LightningModule - - - class MyModel(LightningModule): - def __init__(self): - super().__init__() - # Important: This property activates truncated backpropagation through time - # Setting this value to 2 splits the batch into sequences of size 2 - self.truncated_bptt_steps = 2 - - # Truncated back-propagation through time - def training_step(self, batch, batch_idx, hiddens): - # the training step must be updated to accept a ``hiddens`` argument - # hiddens are the hiddens from the previous truncated backprop step - out, hiddens = self.lstm(data, hiddens) - return {"loss": ..., "hiddens": hiddens} - -.. note:: If you need to modify how the batch is split, - override :func:`~pytorch_lightning.core.lightning.LightningModule.tbptt_split_batch`. - - -Iterable Datasets -================= -Lightning supports using :class:`~torch.utils.data.IterableDataset` as well as map-style Datasets. IterableDatasets provide a more natural -option when using sequential data. - -.. note:: When using an :class:`~torch.utils.data.IterableDataset` you must set the ``val_check_interval`` to 1.0 (the default) or an int - (specifying the number of training batches to run before each validation loop) when initializing the Trainer. This is - because the IterableDataset does not have a ``__len__`` and Lightning requires this to calculate the validation - interval when ``val_check_interval`` is less than one. Similarly, you can set ``limit_{mode}_batches`` to a float or - an int. If it is set to 0.0 or 0, it will set ``num_{mode}_batches`` to 0, if it is an int, it will set ``num_{mode}_batches`` - to ``limit_{mode}_batches``, if it is set to 1.0 it will run for the whole dataset, otherwise it will throw an exception. - Here ``mode`` can be train/val/test/predict. 
- -When iterable datasets are used, Lightning will pre-fetch 1 batch (in addition to the current batch) so it can detect -when the training will stop and run validation if necessary. - -.. testcode:: - - # IterableDataset - class CustomDataset(IterableDataset): - def __init__(self, data): - self.data_source = data - - def __iter__(self): - return iter(self.data_source) - - - # Setup DataLoader - def train_dataloader(self): - seq_data = ["A", "long", "time", "ago", "in", "a", "galaxy", "far", "far", "away"] - iterable_dataset = CustomDataset(seq_data) - - dataloader = DataLoader(dataset=iterable_dataset, batch_size=5) - return dataloader - - -.. testcode:: - - # Set val_check_interval - trainer = Trainer(val_check_interval=100) - - # Set limit_val_batches to 0.0 or 0 - trainer = Trainer(limit_val_batches=0.0) - - # Set limit_val_batches as an int - trainer = Trainer(limit_val_batches=100) diff --git a/docs/_sources/guides/speed.rst.txt b/docs/_sources/guides/speed.rst.txt deleted file mode 100644 index 1020755..0000000 --- a/docs/_sources/guides/speed.rst.txt +++ /dev/null @@ -1,477 +0,0 @@ -:orphan: - -.. testsetup:: * - - from pytorch_lightning.callbacks.early_stopping import EarlyStopping - -.. _training-speedup: - - -####################### -Speed Up Model Training -####################### - -When you are limited with the resources, it becomes hard to speed up model training and reduce the training time -without affecting the model's performance. There are multiple ways you can speed up your model's time to convergence. - -************************ -Training on Accelerators -************************ - -**Use when:** Whenever possible! - -With Lightning, running on GPUs, TPUs, IPUs on multiple nodes is a simple switch of a flag. - -GPU Training -============ - -Lightning supports a variety of plugins to speed up distributed GPU training. 
Most notably: - -* :class:`~pytorch_lightning.strategies.DDPStrategy` -* :class:`~pytorch_lightning.strategies.DDPShardedStrategy` -* :class:`~pytorch_lightning.strategies.DeepSpeedStrategy` - -.. code-block:: python - - # run on 1 gpu - trainer = Trainer(accelerator="gpu", devices=1) - - # train on 8 GPUs, using the DDP strategy - trainer = Trainer(accelerator="gpu", devices=8, strategy="ddp") - - # train on multiple GPUs across nodes (uses 8 GPUs in total) - trainer = Trainer(accelerator="gpu", devices=2, num_nodes=4) - - -GPU Training Speedup Tips -------------------------- - -When training on single or multiple GPU machines, Lightning offers a host of advanced optimizations to improve throughput, memory efficiency, and model scaling. -Refer to :doc:`Advanced GPU Optimized Training for more details <../advanced/model_parallel>`. - -Prefer DDP Over DP -^^^^^^^^^^^^^^^^^^ -:class:`~pytorch_lightning.strategies.dp.DataParallelStrategy` performs three GPU transfers for EVERY batch: - -1. Copy the model to the device. -2. Copy the data to the device. -3. Copy the outputs of each device back to the main device. - -.. image:: https://pl-public-data.s3.amazonaws.com/docs/static/images/distributed_training/dp.gif - :alt: Animation showing DP execution. - :width: 500 - :align: center - -| - -Whereas :class:`~pytorch_lightning.strategies.ddp.DDPStrategy` only performs two transfer operations, making DDP much faster than DP: - -1. Moving data to the device. -2. Transfer and sync gradients. - -.. image:: https://pl-public-data.s3.amazonaws.com/docs/static/images/distributed_training/ddp.gif - :alt: Animation showing DDP execution. - :width: 500 - :align: center - -| - -For more details on how to tune performance with DDP, please see the :ref:`DDP Optimizations ` section. - -DataLoaders -^^^^^^^^^^^ - -When building your DataLoader set ``num_workers>0`` and ``pin_memory=True`` (only for GPUs). - -.. 
code-block:: python - - Dataloader(dataset, num_workers=8, pin_memory=True) - -num_workers -^^^^^^^^^^^ - -The question of how many workers to specify in ``num_workers`` is tricky. Here's a summary of `some references `_, and our suggestions: - -1. ``num_workers=0`` means ONLY the main process will load batches (that can be a bottleneck). -2. ``num_workers=1`` means ONLY one worker (just not the main process) will load data, but it will still be slow. -3. The performance of high ``num_workers`` depends on the batch size and your machine. -4. A general place to start is to set ``num_workers`` equal to the number of CPU cores on that machine. You can get the number of CPU cores in python using ``os.cpu_count()``, but note that depending on your batch size, you may overflow RAM memory. - -.. warning:: Increasing ``num_workers`` will ALSO increase your CPU memory consumption. - -The best thing to do is to increase the ``num_workers`` slowly and stop once there is no more improvement in your training speed. - -For debugging purposes or for dataloaders that load very small datasets, it is desirable to set ``num_workers=0``. However, this will always log a warning for every dataloader with ``num_workers <= min(2, os.cpu_count())``. In such cases, you can specifically filter this warning by using: - -.. code-block:: python - - import warnings - - warnings.filterwarnings("ignore", ".*Consider increasing the value of the `num_workers` argument*") - - # or to ignore all warnings that could be false positives - from pytorch_lightning.utilities.warnings import PossibleUserWarning - - warnings.filterwarnings("ignore", category=PossibleUserWarning) - -Spawn -^^^^^ - -When using ``strategy="ddp_spawn"`` or training on TPUs, the way multiple GPUs/TPU cores are used is by calling :obj:`torch.multiprocessing` -``.spawn()`` under the hood. The problem is that PyTorch has issues with ``num_workers>0`` when using ``.spawn()``. 
For this reason, we recommend you -use ``strategy="ddp"`` so you can increase the ``num_workers``. However, since DDP doesn't work in an interactive environment like IPython/Jupyter notebooks, -your script has to be callable like so: - -.. code-block:: bash - - python my_program.py - -However, using ``strategy="ddp_spawn"`` enables you to reduce memory usage with in-memory datasets and shared memory tensors. For more info, check out the -:ref:`Sharing Datasets Across Process Boundaries ` section. - -Persistent Workers -^^^^^^^^^^^^^^^^^^ - -When using ``strategy="ddp_spawn"`` and ``num_workers>0``, consider setting ``persistent_workers=True`` inside your DataLoader, since this combination can otherwise result in data-loading bottlenecks and slowdowns. -This is a limitation of Python ``.spawn()`` and PyTorch. - - -TPU Training -============ - -You can set the ``devices`` trainer argument to 1, [7] (a specific core), or 8 (eight cores). - -.. code-block:: python - - # train on 1 TPU core - trainer = Trainer(accelerator="tpu", devices=1) - - # train on 7th TPU core - trainer = Trainer(accelerator="tpu", devices=[7]) - - # train on 8 TPU cores - trainer = Trainer(accelerator="tpu", devices=8) - -To train on more than eight cores (a POD), -submit this script using the xla_dist script. - -Example:: - - python -m torch_xla.distributed.xla_dist - --tpu=$TPU_POD_NAME - --conda-env=torch-xla-nightly - --env=XLA_USE_BF16=1 - -- python your_trainer_file.py - - -Read more in our :ref:`training-speedup` and :ref:`plugins` guides. - - ------------ - -************** -Early Stopping -************** - -Usually, long training epochs can lead to either overfitting or no major improvements in your metrics due to limited or no convergence. -Here, the :class:`~pytorch_lightning.callbacks.early_stopping.EarlyStopping` callback can help you stop the training entirely by monitoring a metric of your choice. - -You can read more about it :ref:`here `. - ----------- - -.. 
_speed-amp: - -********************************* -Mixed Precision (16-bit) Training -********************************* - -Lower precision, such as 16-bit floating-point, enables the training and deployment of large neural networks since it requires less memory, enhances data transfer operations since it requires -less memory bandwidth, and runs math operations much faster on GPUs that support Tensor Cores. - -**Use when:** - -* You want to optimize for memory usage on a GPU. -* You have a GPU that supports 16-bit precision (NVIDIA Pascal architecture or newer). -* Your optimization algorithm (training_step) is numerically stable. -* You want to be the cool person in the lab :p - -.. raw:: html - - - -| - -Mixed precision combines the use of both 32 and 16-bit floating points to reduce memory footprint during model training, resulting in improved performance, achieving up to +3X speedups on modern GPUs. - -Lightning offers mixed precision training for GPUs and CPUs, as well as bfloat16 mixed precision training for TPUs. - - -.. testcode:: - :skipif: torch.cuda.device_count() < 4 - - # 16-bit precision - trainer = Trainer(precision=16, accelerator="gpu", devices=4) - - -Read more about :ref:`mixed-precision training `. - - ----------------- - - -*********************** -Control Training Epochs -*********************** - -**Use when:** You run a hyperparameter search to find good initial parameters and want to save time, cost (money), or power (environment). -It can allow you to be more cost-efficient and also run more experiments at the same time. - -You can use Trainer flags to force training for a minimum number of epochs or limit it to a max number of epochs. Use the ``min_epochs`` and ``max_epochs`` Trainer flags to set the number of epochs to run. -Setting ``min_epochs=N`` makes sure that the training will run for at least ``N`` epochs. Setting ``max_epochs=N`` will ensure that training won't happen after -``N`` epochs. - -.. 
testcode:: - - # DEFAULT - trainer = Trainer(min_epochs=1, max_epochs=1000) - - -If running iteration based training, i.e., infinite / iterable DataLoader, you can also control the number of steps with the ``min_steps`` and ``max_steps`` flags: - -.. testcode:: - - trainer = Trainer(max_steps=1000) - - trainer = Trainer(min_steps=100) - -You can also interrupt training based on training time: - -.. testcode:: - - # Stop after 12 hours of training or when reaching 10 epochs (string) - trainer = Trainer(max_time="00:12:00:00", max_epochs=10) - - # Stop after 1 day and 5 hours (dict) - trainer = Trainer(max_time={"days": 1, "hours": 5}) - -Learn more in our :ref:`trainer_flags` guide. - - ----------------- - -**************************** -Control Validation Frequency -**************************** - -Check Validation Every n Epochs -=============================== - -**Use when:** You have a small dataset and want to run fewer validation checks. - -You can limit validation check to only run every n epochs using the ``check_val_every_n_epoch`` Trainer flag. - -.. testcode:: - - # default - trainer = Trainer(check_val_every_n_epoch=1) - - # runs validation after every 7th Epoch - trainer = Trainer(check_val_every_n_epoch=7) - - -Validation Within Training Epoch -================================ - -**Use when:** You have a large training dataset and want to run mid-epoch validation checks. - -For large datasets, it's often desirable to check validation multiple times within a training epoch. -Pass in a float to check that often within one training epoch. Pass in an int ``K`` to check every ``K`` training batch. -Must use an ``int`` if using an :class:`~torch.utils.data.IterableDataset`. - -.. 
testcode:: - - # default - trainer = Trainer(val_check_interval=1.0) - - # check every 1/4 th of an epoch - trainer = Trainer(val_check_interval=0.25) - - # check every 100 train batches (ie: for IterableDatasets or fixed frequency) - trainer = Trainer(val_check_interval=100) - -Learn more in our :ref:`trainer_flags` guide. - ----------------- - -********************* -Preload Data Into RAM -********************* - -**Use when:** You need access to all samples in a dataset at once. - -When your training or preprocessing requires many operations to be performed on entire dataset(s), it can -sometimes be beneficial to store all data in RAM given there is enough space. -However, loading all data at the beginning of the training script has the disadvantage that it can take a long -time, and hence, it slows down the development process. Another downside is that in multiprocessing (e.g., DDP) -the data would get copied in each process. -One can overcome these problems by copying the data into RAM in advance. -Most UNIX-based operating systems provide direct access to tmpfs through a mount point typically named ``/dev/shm``. - -Increase shared memory if necessary. Refer to the documentation of your OS on how to do this. - -1. Copy training data to shared memory: - - .. code-block:: bash - - cp -r /path/to/data/on/disk /dev/shm/ - -2. Refer to the new data root in your script or command-line arguments: - - .. code-block:: python - - datamodule = MyDataModule(data_root="/dev/shm/my_data") - ---------- - -************** -Model Toggling -************** - -**Use when:** Performing gradient accumulation with multiple optimizers in a -distributed setting. - -Here is an explanation of what it does: - -* Considering the current optimizer as A and all other optimizers as B. -* Toggling, which means all parameters from B exclusive to A will have their ``requires_grad`` attribute set to ``False``. -* Restoring their original state when exiting the context manager. 
- -When performing gradient accumulation, there is no need to perform grad synchronization during the accumulation phase. -Setting ``sync_grad`` to ``False`` will block this synchronization and improve your training speed. - -:class:`~pytorch_lightning.core.optimizer.LightningOptimizer` provides a -:meth:`~pytorch_lightning.core.optimizer.LightningOptimizer.toggle_model` function as a -:func:`contextlib.contextmanager` for advanced users. - -Here is an example of an advanced use case: - -.. testcode:: - - # Scenario for a GAN with gradient accumulation every two batches and optimized for multiple GPUs. - class SimpleGAN(LightningModule): - def __init__(self): - super().__init__() - self.automatic_optimization = False - - def training_step(self, batch, batch_idx): - # Implementation follows the PyTorch tutorial: - # https://pytorch.org/tutorials/beginner/dcgan_faces_tutorial.html - g_opt, d_opt = self.optimizers() - - X, _ = batch - X.requires_grad = True - batch_size = X.shape[0] - - real_label = torch.ones((batch_size, 1), device=self.device) - fake_label = torch.zeros((batch_size, 1), device=self.device) - - # Sync and clear gradients - # at the end of accumulation or - # at the end of an epoch. 
- is_last_batch_to_accumulate = (batch_idx + 1) % 2 == 0 or self.trainer.is_last_batch - - g_X = self.sample_G(batch_size) - - ########################## - # Optimize Discriminator # - ########################## - with d_opt.toggle_model(sync_grad=is_last_batch_to_accumulate): - d_x = self.D(X) - errD_real = self.criterion(d_x, real_label) - - d_z = self.D(g_X.detach()) - errD_fake = self.criterion(d_z, fake_label) - - errD = errD_real + errD_fake - - self.manual_backward(errD) - if is_last_batch_to_accumulate: - d_opt.step() - d_opt.zero_grad() - - ###################### - # Optimize Generator # - ###################### - with g_opt.toggle_model(sync_grad=is_last_batch_to_accumulate): - d_z = self.D(g_X) - errG = self.criterion(d_z, real_label) - - self.manual_backward(errG) - if is_last_batch_to_accumulate: - g_opt.step() - g_opt.zero_grad() - - self.log_dict({"g_loss": errG, "d_loss": errD}, prog_bar=True) - ------ - -***************** -Set Grads to None -***************** - -In order to improve performance, you can override :meth:`~pytorch_lightning.core.lightning.LightningModule.optimizer_zero_grad`. - -For a more detailed explanation of the pros / cons of this technique, -read the documentation for :meth:`~torch.optim.Optimizer.zero_grad` by the PyTorch team. - -.. testcode:: - - class Model(LightningModule): - def optimizer_zero_grad(self, epoch, batch_idx, optimizer, optimizer_idx): - optimizer.zero_grad(set_to_none=True) - - ------ - -*************** -Things to Avoid -*************** - -.item(), .numpy(), .cpu() -========================= - -Don't call ``.item()`` anywhere in your code. Use ``.detach()`` instead to remove the connected graph calls. Lightning -takes a great deal of care to be optimized for this. - -Clear Cache -=========== - -Don't call :func:`torch.cuda.empty_cache` unnecessarily! Every time you call this, ALL your GPUs have to wait to sync. 
- -Transferring Tensors to Device -============================== - -LightningModules know what device they are on! Construct tensors on the device directly to avoid CPU->Device transfer. - -.. code-block:: python - - # bad - t = torch.rand(2, 2).cuda() - - # good (self is LightningModule) - t = torch.rand(2, 2, device=self.device) - - -For tensors that need to be model attributes, it is best practice to register them as buffers in the module's -``__init__`` method: - -.. code-block:: python - - # bad - self.t = torch.rand(2, 2, device=self.device) - - # good - self.register_buffer("t", torch.rand(2, 2)) diff --git a/docs/_sources/index.rst.txt b/docs/_sources/index.rst.txt deleted file mode 100644 index d646beb..0000000 --- a/docs/_sources/index.rst.txt +++ /dev/null @@ -1,275 +0,0 @@ -.. PyTorch-Lightning documentation master file, created by - sphinx-quickstart on Fri Nov 15 07:48:22 2019. - You can adapt this file completely to your liking, but it should at least - contain the root `toctree` directive. - -⚡ PyTorch Lightning에 오신 것을 환영합니다! -============================================== - -.. twocolumns:: - :left: - .. image:: https://pl-bolts-doc-images.s3.us-east-2.amazonaws.com/mov.gif - :alt: Animation showing how to convert a standard training loop to a Lightning loop - :right: - PyTorch Lightning(파이토치 라이트닝))은 대규모에서 성능을 포기하지 않으면서 최대한의 유연성을 필요로 하는 전문적인 AI 연구자들과 머신러닝 엔지니어들을 위한 딥러닝 프레임워크입니다. - Lightning(라이트닝)은 프로젝트가 생각으로부터 문서 / 제품화에 이르는 동안 함께 발전합니다. - -.. raw:: html - -
-
-
-
- -.. join_slack:: - :align: center - :margin: 0 - -.. raw:: html - -
-
- - -.. raw:: html - -
- - -Lightning 설치하기 ----------------------- - - -.. raw:: html - -
-
- -Pip 사용자라면, - -.. code-block:: bash - - pip install pytorch-lightning - -.. raw:: html - -
-
- -Conda 사용자라면, - -.. code-block:: bash - - conda install pytorch-lightning -c conda-forge - -.. raw:: html - -
-
- -또는 `advanced install guide `_ 참조하세요. - -.. raw:: html - -
- -처음이신가요? ------------------ - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. customcalloutitem:: - :header: LIGHTNING 15분 만에 배워보기 - :description: 일반적인 Lightning 워크플로우의 주요한 7단계를 배웁니다. - :button_link: starter/introduction.html - -.. customcalloutitem:: - :header: Benchmarking - :description: Learn how to benchmark PyTorch Lightning. - :button_link: benchmarking/benchmarks.html - -.. raw:: html - -
-
- -.. End of callout item section - -.. raw:: html - -
- -이미 Lightning 사용자라면? ---------------------------- - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. customcalloutitem:: - :description: Learn Lightning in small bites at 4 levels of expertise: Introductory, intermediate, advanced and expert. - :header: Level Up! - :button_link: expertise_levels.html - -.. customcalloutitem:: - :description: Detailed description of API each package. Assumes you already have basic Lightning knowledge. - :header: API Reference - :button_link: api_references.html - -.. customcalloutitem:: - :description: From NLP, Computer vision to RL and meta learning - see how to use Lightning in ALL research areas. - :header: Hands-on Examples - :button_link: tutorials.html - -.. customcalloutitem:: - :description: Learn how to do everything from hyperparameters sweeps to cloud training to Pruning and Quantization with Lightning. - :header: Common Workflows - :button_link: common_usecases.html - -.. customcalloutitem:: - :description: Convert your current code to Lightning - :header: Convert code to PyTorch Lightning - :button_link: starter/converting.html - - -.. raw:: html - -
-
- -.. End of callout item section - -.. raw:: html - -
- -.. toctree:: - :maxdepth: 1 - :name: start - :caption: Get Started - - starter/introduction - Organize existing PyTorch into Lightning - - -.. toctree:: - :maxdepth: 2 - :name: levels - :caption: Level Up - - levels/core_skills - levels/intermediate - levels/advanced - levels/expert - -.. toctree:: - :maxdepth: 2 - :name: pl_docs - :caption: Core API - - common/lightning_module - common/trainer - -.. toctree:: - :maxdepth: 1 - :name: Common Workflows - :caption: Common Workflows - - Avoid overfitting - model/build_model.rst - common/hyperparameters - common/progress_bar - deploy/production - advanced/training_tricks - cli/lightning_cli - tuning/profiler - Finetune a model - Manage experiments - clouds/cluster - advanced/model_parallel - clouds/cloud_training - Save and load model progress - Save memory with half-precision - Train on single or multiple GPUs - Train on single or multiple HPUs - Train on single or multiple IPUs - Train on single or multiple TPUs - model/own_your_loop - -.. toctree:: - :maxdepth: 1 - :name: Glossary - :caption: Glossary - - Accelerators - Callback - Checkpointing - Cluster - Cloud checkpoint - Console Logging - Debugging - Early stopping - Experiment manager (Logger) - Fault tolerant training - Flash - Grid AI - GPU - Half precision - HPU - Inference - IPU - Lightning CLI - Lightning Lite - LightningDataModule - LightningModule - Lightning Transformers - Log - Loops - TPU - Metrics - Model - Model Parallel - Plugins - Progress bar - Production - Predict - Profiler - Pruning and Quantization - Remote filesystem and FSSPEC - Strategy registry - Style guide - Sweep - SWA - SLURM - Transfer learning - Trainer - Torch distributed - -.. toctree:: - :maxdepth: 1 - :name: Hands-on Examples - :caption: Hands-on Examples - :glob: - - PyTorch Lightning 101 class - From PyTorch to PyTorch Lightning [Blog] - From PyTorch to PyTorch Lightning [Video] - - -.. raw:: html - -
- -색인 및 검색 ------------------- - -* :ref:`genindex` -* :ref:`search` diff --git a/docs/_sources/levels/advanced.rst.txt b/docs/_sources/levels/advanced.rst.txt deleted file mode 100644 index 4ffe090..0000000 --- a/docs/_sources/levels/advanced.rst.txt +++ /dev/null @@ -1,87 +0,0 @@ - -############### -Advanced skills -############### - -Configure all aspects of Lightning for advanced usecases. - -.. join_slack:: - :align: left - ----- - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Level 15: Customize configs to run in production - :description: Enable composable YAMLs. - :col_css: col-md-6 - :button_link: advanced_level_15.html - :height: 150 - :tag: advanced - -.. displayitem:: - :header: Level 16: Customize the trainer - :description: Inject custom code into the trainer and modify the progress bar. - :col_css: col-md-6 - :button_link: advanced_level_16.html - :height: 150 - :tag: advanced - -.. displayitem:: - :header: Level 17: Own the training loop - :description: Learn all the ways of owning your raw PyTorch loops with Lightning. - :col_css: col-md-6 - :button_link: advanced_level_17.html - :height: 150 - :tag: advanced - -.. displayitem:: - :header: Level 18: Enable advanced checkpointing - :description: Enable composable or cloud-based checkpoints. - :col_css: col-md-6 - :button_link: advanced_level_18.html - :height: 150 - :tag: advanced - -.. displayitem:: - :header: Level 19: Explore IPUs - :description: Explore Intelligence Processing Unit (IPU) for model scaling. - :col_css: col-md-6 - :button_link: advanced_level_19.html - :height: 150 - :tag: advanced - -.. displayitem:: - :header: Level 20: Explore HPUs - :description: Explore Habana Gaudi Processing Unit (HPU) for model scaling. - :col_css: col-md-6 - :button_link: advanced_level_20.html - :height: 150 - :tag: advanced - -.. displayitem:: - :header: Level 21: Master TPUs - :description: Master TPUs and run on cloud TPUs. - :col_css: col-md-6 - :button_link: advanced_level_21.html - :height: 150 - :tag: advanced - -.. displayitem:: - :header: Level 22: Reach 1 trillion parameters on GPUs - :description: Scale to 1 trillion params on GPUs. - :col_css: col-md-6 - :button_link: advanced_level_22.html - :height: 150 - :tag: advanced - -.. raw:: html - -
-
diff --git a/docs/_sources/levels/advanced_level_15.rst.txt b/docs/_sources/levels/advanced_level_15.rst.txt deleted file mode 100644 index 761dbd3..0000000 --- a/docs/_sources/levels/advanced_level_15.rst.txt +++ /dev/null @@ -1,37 +0,0 @@ -:orphan: - -################################################ -Level 15: Customize configs to run in production -################################################ - -This level goes over advanced YAML use for running models in production. - ----- - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: 1: Control it all via YAML - :description: Enable composable YAMLs. - :col_css: col-md-6 - :button_link: ../cli/lightning_cli_advanced.html - :height: 150 - :tag: advanced - -.. displayitem:: - :header: 2: Use YAML for production - :description: Use the Lightning CLI with YAMLs for production environments. - :col_css: col-md-6 - :button_link: ../cli/lightning_cli_advanced_2.html - :height: 150 - :tag: advanced - -.. raw:: html - -
-
diff --git a/docs/_sources/levels/advanced_level_16.rst.txt b/docs/_sources/levels/advanced_level_16.rst.txt deleted file mode 100644 index fd41df1..0000000 --- a/docs/_sources/levels/advanced_level_16.rst.txt +++ /dev/null @@ -1,37 +0,0 @@ -:orphan: - -############################### -Level 16: Customize the trainer -############################### - -In this level, you'll learn to modify the Trainer behavior. - ----- - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Create and use Callbacks - :description: Modify Trainer behavior with reusable, self-contained code. - :col_css: col-md-6 - :button_link: ../extensions/callbacks.html - :height: 150 - :tag: advanced - -.. displayitem:: - :header: Customize the progress bar - :description: Create beautiful custom progress bars. - :col_css: col-md-6 - :button_link: ../common/progress_bar.html - :height: 150 - :tag: advanced - -.. raw:: html - -
-
diff --git a/docs/_sources/levels/advanced_level_17.rst.txt b/docs/_sources/levels/advanced_level_17.rst.txt deleted file mode 100644 index c05c8c9..0000000 --- a/docs/_sources/levels/advanced_level_17.rst.txt +++ /dev/null @@ -1,45 +0,0 @@ -:orphan: - -############################### -Level 17: Own the training loop -############################### - -Learn all the ways of owning your raw PyTorch loops with Lightning. - ----- - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Enable manual optimization - :description: Gain control of the training loop with manual optimization and LightningModule methods. - :col_css: col-md-4 - :button_link: ../model/build_model_advanced.html - :height: 150 - :tag: advanced - -.. displayitem:: - :header: Use a Raw PyTorch Loop - :description: Migrate complex PyTorch projects to Lightning and push bleeding-edge research with the raw PyTorch loop. - :col_css: col-md-4 - :button_link: ../model/build_model_expert.html - :height: 150 - :tag: advanced - -.. displayitem:: - :header: Make a custom Lightning Loop - :description: Conduct bleeding-edge research like meta-learning and RL with a custom Loop. - :col_css: col-md-4 - :button_link: ../extensions/loops.html - :height: 150 - :tag: expert - -.. raw:: html - -
-
diff --git a/docs/_sources/levels/advanced_level_18.rst.txt b/docs/_sources/levels/advanced_level_18.rst.txt deleted file mode 100644 index a7d7966..0000000 --- a/docs/_sources/levels/advanced_level_18.rst.txt +++ /dev/null @@ -1,37 +0,0 @@ -:orphan: - -####################################### -Level 18: Enable advanced checkpointing -####################################### - -This level shows you how to enable composable and/or cloud based checkpoints. - ----- - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Enable composable and cloud checkpoints - :description: Enable cloud-based checkpointing and composable checkpoints. - :col_css: col-md-6 - :button_link: ../common/checkpointing_advanced.html - :height: 150 - :tag: advanced - -.. displayitem:: - :header: Explore remote filesystems - :description: Explore advanced cloud checkpointing features. - :col_css: col-md-6 - :button_link: ../common/remote_fs.html - :height: 150 - :tag: advanced - -.. raw:: html - -
-
diff --git a/docs/_sources/levels/advanced_level_19.rst.txt b/docs/_sources/levels/advanced_level_19.rst.txt deleted file mode 100644 index c7b6697..0000000 --- a/docs/_sources/levels/advanced_level_19.rst.txt +++ /dev/null @@ -1,45 +0,0 @@ -:orphan: - -###################### -Level 19: Explore IPUs -###################### - -Explore Intelligence Processing Unit (IPU) for model scaling. - ----- - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Prepare your code (Optional) - :description: Prepare your code to run on any hardware. - :col_css: col-md-4 - :button_link: ../accelerators/accelerator_prepare.html - :height: 150 - :tag: basic - -.. displayitem:: - :header: Train models on IPUs - :description: Learn the basics of single and multi-IPU training. - :col_css: col-md-4 - :button_link: ../accelerators/ipu_basic.html - :height: 150 - :tag: basic - -.. displayitem:: - :header: Optimize models training on IPUs - :description: Tune model performance with mix-precision and the performance analyser. - :col_css: col-md-4 - :button_link: ../accelerators/ipu_intermediate.html - :height: 150 - :tag: intermediate - -.. raw:: html - -
-
diff --git a/docs/_sources/levels/advanced_level_20.rst.txt b/docs/_sources/levels/advanced_level_20.rst.txt deleted file mode 100644 index 7e9d562..0000000 --- a/docs/_sources/levels/advanced_level_20.rst.txt +++ /dev/null @@ -1,37 +0,0 @@ -:orphan: - -###################### -Level 20: Explore HPUs -###################### - -Explore Habana Gaudi Processing Unit (HPU) for model scaling. - ----- - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Train models on HPUs - :description: Learn the basics of single and multi-HPU core training. - :col_css: col-md-6 - :button_link: ../accelerators/hpu_basic.html - :height: 150 - :tag: basic - -.. displayitem:: - :header: Optimize models training on HPUs - :description: Enable state-of-the-art scaling with advanced mix-precision settings. - :col_css: col-md-6 - :button_link: ../accelerators/hpu_intermediate.html - :height: 150 - :tag: intermediate - -.. raw:: html - -
-
diff --git a/docs/_sources/levels/advanced_level_21.rst.txt b/docs/_sources/levels/advanced_level_21.rst.txt deleted file mode 100644 index 5252a1c..0000000 --- a/docs/_sources/levels/advanced_level_21.rst.txt +++ /dev/null @@ -1,45 +0,0 @@ -:orphan: - -##################### -Level 21: Master TPUs -##################### - -Master cloud TPU training with profiling and scaling techniques. - ----- - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Run on cloud TPUs - :description: Scale massive models using cloud TPUs. - :col_css: col-md-4 - :button_link: ../accelerators/tpu_intermediate.html - :height: 180 - :tag: intermediate - -.. displayitem:: - :header: Explore advanced TPU scaling techniques - :description: Dive into XLA and advanced techniques to optimize TPU-powered models. - :col_css: col-md-4 - :button_link: ../accelerators/tpu_advanced.html - :height: 180 - :tag: advanced - -.. displayitem:: - :header: Profile TPU code - :description: Learn to profile TPU code. - :col_css: col-md-4 - :button_link: ../tuning/profiler_advanced.html - :height: 180 - :tag: advanced - -.. raw:: html - -
-
diff --git a/docs/_sources/levels/advanced_level_22.rst.txt b/docs/_sources/levels/advanced_level_22.rst.txt deleted file mode 100644 index a90a482..0000000 --- a/docs/_sources/levels/advanced_level_22.rst.txt +++ /dev/null @@ -1,37 +0,0 @@ -:orphan: - -############################################# -Level 22: Reach 1 trillion parameters on GPUs -############################################# - -Scale to 1 trillion+ parameters with multiple distributed strategies. - ----- - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Scale with distributed strategies - :description: Learn about different distributed strategies to reach bigger model parameter sizes. - :col_css: col-md-6 - :button_link: ../accelerators/gpu_intermediate.html - :height: 150 - :tag: intermediate - -.. displayitem:: - :header: Reach 1 trillion parameters on GPUs - :description: Scale to 1 trillion params on GPUs with FSDP and Deepspeed. - :col_css: col-md-6 - :button_link: ../advanced/model_parallel.html - :height: 150 - :tag: advanced - -.. raw:: html - -
-
diff --git a/docs/_sources/levels/basic_level_2.rst.txt b/docs/_sources/levels/basic_level_2.rst.txt deleted file mode 100644 index 348a389..0000000 --- a/docs/_sources/levels/basic_level_2.rst.txt +++ /dev/null @@ -1,41 +0,0 @@ -:orphan: - -###################################### -Level 2: Add a validation and test set -###################################### - -.. raw:: html - -
-
- -.. displayitem:: - :header: Validate and test a model - :description: Add a validation and test data split to avoid overfitting. - :col_css: col-md-4 - :button_link: ../common/evaluation_basic.html - :height: 150 - :tag: basic - -.. displayitem:: - :header: Save your model progress - :description: Learn to save the state of a model as it trains. - :col_css: col-md-4 - :button_link: ../common/checkpointing_basic.html#save-a-checkpoint - :height: 150 - :tag: basic - -.. displayitem:: - :header: Enable early stopping - :description: Use early stopping to decide when to stop training your model. - :col_css: col-md-4 - :button_link: ../common/early_stopping.html - :height: 150 - :tag: basic - - - -.. raw:: html - -
-
diff --git a/docs/_sources/levels/basic_level_5.rst.txt b/docs/_sources/levels/basic_level_5.rst.txt deleted file mode 100644 index 98de180..0000000 --- a/docs/_sources/levels/basic_level_5.rst.txt +++ /dev/null @@ -1,39 +0,0 @@ -:orphan: - -########################################################## -Level 5: Debug, visualize and find performance bottlenecks -########################################################## - -.. raw:: html - -
-
- -.. displayitem:: - :header: Debug your model - :description: Learn the basics of model debugging - :col_css: col-md-4 - :button_link: ../debug/debugging_basic.html - :height: 150 - :tag: basic - -.. displayitem:: - :header: Find bottlenecks in training - :description: Learn to find bottlenecks in the training loop. - :col_css: col-md-4 - :button_link: ../tuning/profiler_basic.html - :height: 150 - :tag: basic - -.. displayitem:: - :header: Visualize metrics, images, and text. - :description: Learn how to track and visualize metrics, images and text. - :col_css: col-md-4 - :button_link: ../visualize/logging_basic.html - :height: 150 - :tag: basic - -.. raw:: html - -
-
diff --git a/docs/_sources/levels/core_level_3.rst.txt b/docs/_sources/levels/core_level_3.rst.txt deleted file mode 100644 index ea34853..0000000 --- a/docs/_sources/levels/core_level_3.rst.txt +++ /dev/null @@ -1,31 +0,0 @@ -:orphan: - -#################################### -Level 3: Visualize training progress -#################################### - -.. raw:: html - -
-
- -.. displayitem:: - :header: Visualize metrics, images, and text. - :description: Learn how to track and visualize metrics, images and text. - :col_css: col-md-6 - :button_link: ../visualize/logging_basic.html - :height: 150 - :tag: basic - -.. displayitem:: - :header: Use third-party experiment managers - :description: Enable third-party experiment managers with advanced visualizations. - :col_css: col-md-6 - :button_link: ../visualize/logging_intermediate.html - :height: 150 - :tag: intermediate - -.. raw:: html - -
-
diff --git a/docs/_sources/levels/core_level_6.rst.txt b/docs/_sources/levels/core_level_6.rst.txt deleted file mode 100644 index 99686bc..0000000 --- a/docs/_sources/levels/core_level_6.rst.txt +++ /dev/null @@ -1,39 +0,0 @@ -:orphan: - -################################# - Level 6: Predict with your model -################################# - -.. raw:: html - -
-
- -.. displayitem:: - :header: Load model weights - :description: Learn to load the weights (checkpoint) of a model. - :col_css: col-md-4 - :button_link: ../common/checkpointing_basic.html#lightningmodule-from-checkpoint - :height: 150 - :tag: basic - -.. displayitem:: - :header: Predict with LightningModule - :description: Learn the basics of predicting with Lightning. - :col_css: col-md-4 - :button_link: ../deploy/production_basic.html - :height: 150 - :tag: basic - -.. displayitem:: - :header: Predict with pure PyTorch - :description: Learn to use pure PyTorch without the Lightning dependencies for prediction. - :col_css: col-md-4 - :button_link: ../deploy/production_intermediate.html - :height: 150 - :tag: intermediate - -.. raw:: html - -
-
diff --git a/docs/_sources/levels/core_skills.rst.txt b/docs/_sources/levels/core_skills.rst.txt deleted file mode 100644 index 19cab69..0000000 --- a/docs/_sources/levels/core_skills.rst.txt +++ /dev/null @@ -1,70 +0,0 @@ - -############ -Basic skills -############ -Learn the basics of model development with Lightning. Researchers and machine learning engineers should start here. - -.. join_slack:: - :align: left - ----- - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Level 1: Train a model - :description: Learn the basics of training a model. - :button_link: ../model/train_model_basic.html - :col_css: col-md-6 - :height: 150 - :tag: basic - -.. displayitem:: - :header: Level 2: Add a validation and test set - :description: Add validation and test sets to avoid over/underfitting. - :button_link: /levels/basic_level_2.html - :col_css: col-md-6 - :height: 150 - :tag: basic - -.. displayitem:: - :header: Level 3: Use pretrained models - :description: Learn how to use pretrained models with Lightning - :button_link: ../advanced/transfer_learning.html - :col_css: col-md-6 - :height: 150 - :tag: basic - -.. displayitem:: - :header: Level 4: Enable script parameters - :description: Add parameters to your script so you can run from the commandline. - :button_link: ../common/hyperparameters.html - :col_css: col-md-6 - :height: 150 - :tag: basic - -.. displayitem:: - :header: Level 5: Understand and visualize your model - :description: Remove bottlenecks and visualize your model - :button_link: ../levels/basic_level_5.html - :col_css: col-md-6 - :height: 150 - :tag: basic - -.. displayitem:: - :description: Use your model for predictions. - :header: Level 6: Predict with your model - :button_link: core_level_6.html - :col_css: col-md-6 - :height: 150 - :tag: basic - -.. raw:: html - -
-
diff --git a/docs/_sources/levels/expert.rst.txt b/docs/_sources/levels/expert.rst.txt deleted file mode 100644 index d41680b..0000000 --- a/docs/_sources/levels/expert.rst.txt +++ /dev/null @@ -1,63 +0,0 @@ - -############# -Expert skills -############# - -Customize and extend Lightning for things like custom hardware or distributed strategies. - -.. join_slack:: - :align: left - ----- - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Level 23: Extend the Lightning CLI - :description: Extend the functionality of the Lightning CLI. - :col_css: col-md-6 - :button_link: expert_level_23.html - :height: 150 - :tag: expert - -.. displayitem:: - :header: Level 24: Integrate a custom cluster - :description: Integrate a custom cluster into Lightning. - :col_css: col-md-6 - :button_link: expert_level_24.html - :height: 150 - :tag: expert - -.. displayitem:: - :header: Level 25: Explore fault-tolerance in-depth - :description: Understand the details of fault-tolerance. - :col_css: col-md-6 - :button_link: ../clouds/fault_tolerant_training_faq.html - :height: 150 - :tag: expert - -.. displayitem:: - :header: Level 26: Make your own profiler - :description: Make your own profiler. - :col_css: col-md-6 - :button_link: ../tuning/profiler_expert.html - :height: 150 - :tag: expert - -.. displayitem:: - :header: Level 27: Add a new accelerator or Strategy - :description: Integrate a new accelerator or distributed strategy. - :col_css: col-md-6 - :button_link: expert_level_27.html - :height: 150 - :tag: expert - -.. raw:: html - -
-
diff --git a/docs/_sources/levels/expert_level_23.rst.txt b/docs/_sources/levels/expert_level_23.rst.txt deleted file mode 100644 index 9b143a0..0000000 --- a/docs/_sources/levels/expert_level_23.rst.txt +++ /dev/null @@ -1,37 +0,0 @@ -:orphan: - -################################## -Level 23: Extend the Lightning CLI -################################## - -Extend the functionality of the Lightning CLI. - ----- - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Customize configs for complex projects - :description: Learn how to connect complex projects with each Registry. - :col_css: col-md-6 - :button_link: ../cli/lightning_cli_advanced_3.html - :height: 150 - :tag: expert - -.. displayitem:: - :header: Extend the Lightning CLI - :description: Customize the Lightning CLI - :col_css: col-md-6 - :button_link: ../cli/lightning_cli_expert.html - :height: 150 - :tag: expert - -.. raw:: html - -
-
diff --git a/docs/_sources/levels/expert_level_24.rst.txt b/docs/_sources/levels/expert_level_24.rst.txt deleted file mode 100644 index b32a8ac..0000000 --- a/docs/_sources/levels/expert_level_24.rst.txt +++ /dev/null @@ -1,37 +0,0 @@ -:orphan: - -#################################### -Level 24: Integrate a custom cluster -#################################### - -Integrate a custom cluster into Lightning. - ----- - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Integrate your own cluster - :description: Learn how to integrate your own cluster - :col_css: col-md-6 - :button_link: ../clouds/cluster_expert.html - :height: 150 - :tag: expert - -.. displayitem:: - :header: Run on your own cloud - :description: Learn how to run on your Company or University private clouds. - :col_css: col-md-6 - :button_link: ../clouds/run_expert.html - :height: 150 - :tag: expert - -.. raw:: html - -
-
diff --git a/docs/_sources/levels/expert_level_27.rst.txt b/docs/_sources/levels/expert_level_27.rst.txt deleted file mode 100644 index c2d682b..0000000 --- a/docs/_sources/levels/expert_level_27.rst.txt +++ /dev/null @@ -1,53 +0,0 @@ -:orphan: - -########################################### -Level 27: Add a new accelerator or Strategy -########################################### - -Integrate a new accelerator or distributed strategy. - ----- - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: 1: Develop a new strategy - :description: Develop new strategies for training and deploying larger and larger models. - :col_css: col-md-6 - :button_link: ../accelerators/gpu_expert.html - :height: 150 - :tag: expert - -.. displayitem:: - :header: 2: Customize checkpointing with new strategies. - :description: Customize checkpointing for custom distributed strategies and accelerators. - :col_css: col-md-6 - :button_link: ../common/checkpointing_expert.html - :height: 150 - :tag: expert - -.. displayitem:: - :header: 3: Register a new strategy - :description: Enable a new strategy to be used in Lightning. - :col_css: col-md-6 - :button_link: ../advanced/strategy_registry.html - :height: 150 - :tag: expert - -.. displayitem:: - :header: 4: Create a new precision technique - :description: Create new precision techniques and enable them through Lightning. - :col_css: col-md-6 - :button_link: ../common/precision_expert.html - :height: 150 - :tag: expert - -.. raw:: html - -
-
diff --git a/docs/_sources/levels/intermediate.rst.txt b/docs/_sources/levels/intermediate.rst.txt deleted file mode 100644 index 331e477..0000000 --- a/docs/_sources/levels/intermediate.rst.txt +++ /dev/null @@ -1,89 +0,0 @@ - -################### -Intermediate skills -################### - -Learn to scale up your models and enable collaborative model development at academic or industry research labs. - -.. join_slack:: - :align: left - ----- - -.. include:: ../links.rst - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Level 7: Interactive cloud development - :description: Learn how to access GPUs and TPUs on the cloud. - :button_link: intermediate_level_7.html - :col_css: col-md-6 - :height: 150 - :tag: intermediate - -.. displayitem:: - :header: Level 8: Train in the background on the cloud - :description: Learn how to run models on the cloud in the background. - :button_link: intermediate_level_8.html - :col_css: col-md-6 - :height: 150 - :tag: intermediate - -.. displayitem:: - :header: Level 9: Modularize your projects - :description: Create DataModules to enable dataset reusability. - :col_css: col-md-6 - :button_link: intermediate_level_9.html - :height: 150 - :tag: intermediate - -.. displayitem:: - :header: Level 10: Understand your model - :description: Use advanced visuals to find the best performing model. - :col_css: col-md-6 - :button_link: intermediate_level_10.html - :height: 150 - :tag: intermediate - -.. displayitem:: - :header: Level 11: Explore SOTA scaling techniques - :description: Explore SOTA techniques to help convergence, stability and scalability. - :col_css: col-md-6 - :button_link: intermediate_level_11.html - :height: 150 - :tag: intermediate - -.. displayitem:: - :header: Level 12: Deploy your models - :description: Learn how to deploy your models with optimizations like ONNX and torchscript. - :col_css: col-md-6 - :button_link: intermediate_level_12.html - :height: 150 - :tag: intermediate - -.. displayitem:: - :header: Level 13: Optimize training speed - :description: Use advanced profilers to mixed precision to train bigger models, faster. - :col_css: col-md-6 - :button_link: intermediate_level_13.html - :height: 150 - :tag: intermediate - -.. displayitem:: - :header: Level 14: Run on on-prem clusters - :description: Run on a custom on-prem cluster or SLURM cluster. - :col_css: col-md-6 - :button_link: intermediate_level_14.html - :height: 150 - :tag: intermediate - -.. 
raw:: html - -
-
diff --git a/docs/_sources/levels/intermediate_level_10.rst.txt b/docs/_sources/levels/intermediate_level_10.rst.txt deleted file mode 100644 index d7f5dc5..0000000 --- a/docs/_sources/levels/intermediate_level_10.rst.txt +++ /dev/null @@ -1,45 +0,0 @@ -:orphan: - -############################### -Level 10: Understand your model -############################### - -Find the best model using advanced visualizations for deeper insights. - ----- - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: 1: Alter checkpoint behavior - :description: Learn to monitor metrics and enable checkpointing by condition. - :col_css: col-md-4 - :button_link: ../common/checkpointing_intermediate.html - :height: 150 - :tag: intermediate - -.. displayitem:: - :header: 2: Visualize more than metrics - :description: Use advanced visualization techniques provided by experiment managers. - :col_css: col-md-4 - :button_link: ../visualize/logging_intermediate.html - :height: 150 - :tag: intermediate - -.. displayitem:: - :header: 3: Granular control of logging - :description: Gain granular control over logging to optimize for speed. - :col_css: col-md-4 - :button_link: ../visualize/logging_advanced.html - :height: 150 - :tag: advanced - -.. raw:: html - -
-
diff --git a/docs/_sources/levels/intermediate_level_11.rst.txt b/docs/_sources/levels/intermediate_level_11.rst.txt deleted file mode 100644 index 4c7ed06..0000000 --- a/docs/_sources/levels/intermediate_level_11.rst.txt +++ /dev/null @@ -1,37 +0,0 @@ -:orphan: - -######################################### -Level 11: Explore SOTA scaling techniques -######################################### - -In this level you'll explore SOTA techniques to help convergence, stability and scalability. - ----- - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: 1: Half precision training - :description: Enable your models to train faster and save memory with different floating-point precision settings. - :col_css: col-md-6 - :button_link: ../common/precision_basic.html - :height: 150 - :tag: basic - -.. displayitem:: - :header: 2: SOTA scaling techniques - :description: Enable techniques to help scaling and convergence. - :col_css: col-md-6 - :button_link: ../advanced/training_tricks.html - :height: 150 - :tag: basic - -.. raw:: html - -
-
diff --git a/docs/_sources/levels/intermediate_level_12.rst.txt b/docs/_sources/levels/intermediate_level_12.rst.txt deleted file mode 100644 index fe1c076..0000000 --- a/docs/_sources/levels/intermediate_level_12.rst.txt +++ /dev/null @@ -1,46 +0,0 @@ -:orphan: - -############################ -Level 12: Deploy your models -############################ - -In this level you'll learn a few options for deploying models into production. - ----- - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Deploy with ONNX - :description: Optimize models for enterprise-scale production environments with ONNX. - :col_css: col-md-4 - :button_link: ../deploy/production_advanced.html - :height: 180 - :tag: advanced - -.. displayitem:: - :header: Deploy with torchscript - :description: Optimize models for enterprise-scale production environments with torchscript. - :col_css: col-md-4 - :button_link: ../deploy/production_advanced_2.html - :height: 180 - :tag: advanced - -.. displayitem:: - :header: Compress models for fast inference - :description: Compress model size for deployment with Quantization and Pruning. - :col_css: col-md-4 - :button_link: ../advanced/pruning_quantization.html - :height: 180 - :tag: advanced - - -.. raw:: html - -
-
diff --git a/docs/_sources/levels/intermediate_level_13.rst.txt b/docs/_sources/levels/intermediate_level_13.rst.txt deleted file mode 100644 index 38ac7aa..0000000 --- a/docs/_sources/levels/intermediate_level_13.rst.txt +++ /dev/null @@ -1,45 +0,0 @@ -:orphan: - -################################# -Level 13: Optimize training speed -################################# - -In this level you'll use advanced profilers and mixed precision techniques to train bigger models faster. - ----- - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Explore advanced mixed precision settings - :description: Enable state-of-the-art scaling with advanced mix-precision settings. - :col_css: col-md-4 - :button_link: ../common/precision_intermediate.html - :height: 150 - :tag: intermediate - -.. displayitem:: - :header: Enable advanced profilers - :description: Tune model performance with profilers. - :col_css: col-md-4 - :button_link: ../tuning/profiler_basic.html - :height: 150 - :tag: intermediate - -.. displayitem:: - :header: Profile PyTorch operations - :description: Learn to find bottlenecks in PyTorch operations. - :col_css: col-md-4 - :button_link: ../tuning/profiler_intermediate.html - :height: 150 - :tag: intermediate - -.. raw:: html - -
-
diff --git a/docs/_sources/levels/intermediate_level_14.rst.txt b/docs/_sources/levels/intermediate_level_14.rst.txt deleted file mode 100644 index a779ede..0000000 --- a/docs/_sources/levels/intermediate_level_14.rst.txt +++ /dev/null @@ -1,45 +0,0 @@ -:orphan: - -################################# -Level 14: Run on on-prem clusters -################################# - -In this level you'll learn to run on onprem clusters. - ----- - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Run on an on-prem cluster - :description: Learn to train models on a general compute cluster. - :col_css: col-md-4 - :button_link: ../clouds/cluster_intermediate_1.html - :height: 150 - :tag: intermediate - -.. displayitem:: - :header: Run on a SLURM cluster - :description: Run models on a SLURM-managed cluster - :col_css: col-md-4 - :button_link: ../clouds/cluster_advanced.html - :height: 150 - :tag: intermediate - -.. displayitem:: - :header: Run with Torch Distributed - :description: Run models on a cluster with torch distributed. - :col_css: col-md-4 - :button_link: ../clouds/cluster_intermediate_2.html - :height: 150 - :tag: intermediate - -.. raw:: html - -
-
diff --git a/docs/_sources/levels/intermediate_level_7.rst.txt b/docs/_sources/levels/intermediate_level_7.rst.txt deleted file mode 100644 index cc55fd7..0000000 --- a/docs/_sources/levels/intermediate_level_7.rst.txt +++ /dev/null @@ -1,51 +0,0 @@ -:orphan: - -###################################### -Level 7: Interactive cloud development -###################################### - -Learn to develop models on cloud GPUs and TPUs. - ----- - -.. raw:: html - -
-
- -.. displayitem:: - :header: Prepare your code (Optional) - :description: Prepare your code to run on any hardware. - :col_css: col-md-3 - :button_link: ../accelerators/accelerator_prepare.html - :height: 180 - :tag: basic - -.. displayitem:: - :header: Access a cloud machine with GPUs - :description: Learn how to get a cloud machine with single or multiple GPUs. - :col_css: col-md-3 - :button_link: ../clouds/session_basic.html - :height: 180 - :tag: basic - -.. displayitem:: - :header: GPU Training - :description: Learn the basics on single and multi-GPU training. - :col_css: col-md-3 - :button_link: ../accelerators/gpu_basic.html - :height: 180 - :tag: basic - -.. displayitem:: - :header: TPU Training - :description: Learn the basics on single and multi-TPU core training. - :col_css: col-md-3 - :button_link: ../accelerators/tpu_basic.html - :height: 180 - :tag: basic - -.. raw:: html - -
-
diff --git a/docs/_sources/levels/intermediate_level_8.rst.txt b/docs/_sources/levels/intermediate_level_8.rst.txt deleted file mode 100644 index 190364a..0000000 --- a/docs/_sources/levels/intermediate_level_8.rst.txt +++ /dev/null @@ -1,53 +0,0 @@ -:orphan: - -################################ -Level 8: Run models on the cloud -################################ - -Learn to run models on the cloud in the background asynchronously. - ----- - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: 1: Run a model in the background on the cloud - :description: Learn to run a model in the background on a cloud machine. - :col_css: col-md-6 - :button_link: ../clouds/run_basic.html - :height: 150 - :tag: intermediate - -.. displayitem:: - :header: 2: Save up to 80% on cloud costs with fault-tolerant training - :description: Run on the cloud for 1/10th the price with fault-tolerant training. - :col_css: col-md-6 - :button_link: ../clouds/fault_tolerant_training_basic.html - :height: 150 - :tag: intermediate - -.. displayitem:: - :header: 3: Run many models at once - :description: Run many models at once (sweep) to find the best performing model. - :col_css: col-md-6 - :button_link: ../clouds/run_intermediate.html - :height: 150 - :tag: intermediate - -.. displayitem:: - :header: 4: Run on your own cloud - :description: Learn how to run on your Company or University private clouds. - :col_css: col-md-6 - :button_link: ../clouds/run_expert.html - :height: 150 - :tag: expert - -.. raw:: html - -
-
diff --git a/docs/_sources/levels/intermediate_level_9.rst.txt b/docs/_sources/levels/intermediate_level_9.rst.txt deleted file mode 100644 index 8c537d7..0000000 --- a/docs/_sources/levels/intermediate_level_9.rst.txt +++ /dev/null @@ -1,45 +0,0 @@ -:orphan: - -################################# -Level 9: Modularize your projects -################################# - -This module teaches you how to setup complex projects that can be controlled via the CLI. - ----- - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: 1: Modularize your datasets - :description: Reuse datasets across models by using DataModules - :col_css: col-md-4 - :button_link: ../data/datamodule.html - :height: 150 - :tag: intermediate - -.. displayitem:: - :header: 2: Control it all from the CLI - :description: Learn to control a LightningModule and LightningDataModule from the CLI - :col_css: col-md-4 - :button_link: ../cli/lightning_cli_intermediate.html - :height: 150 - :tag: intermediate - -.. displayitem:: - :header: 3: Mix models and datasets - :description: Register models, datasets, optimizers and learning rate schedulers - :col_css: col-md-4 - :button_link: ../cli/lightning_cli_intermediate_2.html - :height: 150 - :tag: intermediate - -.. raw:: html - -
-
diff --git a/docs/_sources/links.rst.txt b/docs/_sources/links.rst.txt deleted file mode 100644 index 64ec918..0000000 --- a/docs/_sources/links.rst.txt +++ /dev/null @@ -1,2 +0,0 @@ -.. _PyTorchJob: https://www.kubeflow.org/docs/components/training/pytorch/ -.. _Kubeflow: https://www.kubeflow.org diff --git a/docs/_sources/model/build_model.rst.txt b/docs/_sources/model/build_model.rst.txt deleted file mode 100644 index 8d12110..0000000 --- a/docs/_sources/model/build_model.rst.txt +++ /dev/null @@ -1,55 +0,0 @@ -:orphan: - -############# -Build a Model -############# - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: 1: Train a model - :description: Build a model to learn the basic ideas of Lightning - :col_css: col-md-4 - :button_link: train_model_basic.html - :height: 150 - :tag: basic - -.. displayitem:: - :header: 2: Validate and test a model - :description: Add a validation and test data split to avoid overfitting. - :col_css: col-md-4 - :button_link: validate_model_basic.html - :height: 150 - :tag: basic - -.. displayitem:: - :header: 3: Supercharge training - :description: Enable state-of-the-art training techniques with the Trainer features. - :col_css: col-md-4 - :button_link: build_model_intermediate.html - :height: 150 - :tag: intermediate - -.. displayitem:: - :header: LightningModule API - :description: Dig into LightningModule API in depth - :col_css: col-md-4 - :button_link: ../common/lightning_module.html#lightningmodule-api - :height: 150 - -.. displayitem:: - :header: Trainer API - :description: Dig into Trainer API in depth - :col_css: col-md-4 - :button_link: ../common/trainer.html#trainer-class-api - :height: 150 - -.. raw:: html - -
-
diff --git a/docs/_sources/model/build_model_advanced.rst.txt b/docs/_sources/model/build_model_advanced.rst.txt deleted file mode 100644 index 33be842..0000000 --- a/docs/_sources/model/build_model_advanced.rst.txt +++ /dev/null @@ -1,25 +0,0 @@ -:orphan: - -######################## -Own your loop (advanced) -######################## - -*********************** -Customize training loop -*********************** - -.. image:: https://pl-bolts-doc-images.s3.us-east-2.amazonaws.com/custom_loop.png - :width: 600 - :alt: Injecting custom code in a training loop - -Inject custom code anywhere in the Training loop using any of the 20+ methods (:ref:`lightning_hooks`) available in the LightningModule. - -.. testcode:: - - class LitModel(pl.LightningModule): - def backward(self, loss, optimizer, optimizer_idx): - loss.backward() - ----- - -.. include:: manual_optimization.rst diff --git a/docs/_sources/model/build_model_expert.rst.txt b/docs/_sources/model/build_model_expert.rst.txt deleted file mode 100644 index f321e90..0000000 --- a/docs/_sources/model/build_model_expert.rst.txt +++ /dev/null @@ -1,7 +0,0 @@ -:orphan: - -######################### -Raw PyTorch loop (expert) -######################### - -.. include:: ../starter/lightning_lite.rst diff --git a/docs/_sources/model/build_model_intermediate.rst.txt b/docs/_sources/model/build_model_intermediate.rst.txt deleted file mode 100644 index 55f1247..0000000 --- a/docs/_sources/model/build_model_intermediate.rst.txt +++ /dev/null @@ -1,47 +0,0 @@ -:orphan: - -################################### -Supercharge training (intermediate) -################################### - -************************ -Enable training features -************************ -Enable advanced training features using Trainer arguments. These are SOTA techniques that are automatically integrated into your training loop without changes to your code. - -.. 
code:: - - # train 1TB+ parameter models with Deepspeed/fsdp - trainer = Trainer( - devices=4, - accelerator="gpu", - strategy="deepspeed_stage_2", - precision=16 - ) - - # 20+ helpful arguments for rapid idea iteration - trainer = Trainer( - max_epochs=10, - min_epochs=5, - overfit_batches=1 - ) - - # access the latest state of the art techniques - trainer = Trainer(callbacks=[StochasticWeightAveraging(...)]) - ----- - -****************** -Extend the Trainer -****************** - -.. raw:: html - - - -If you have multiple lines of code with similar functionalities, you can use *callbacks* to easily group them together and toggle all of those lines on or off at the same time. - -.. code:: - - trainer = Trainer(callbacks=[AWSCheckpoints()]) diff --git a/docs/_sources/model/manual_optimization.rst.txt b/docs/_sources/model/manual_optimization.rst.txt deleted file mode 100644 index e4a31dd..0000000 --- a/docs/_sources/model/manual_optimization.rst.txt +++ /dev/null @@ -1,290 +0,0 @@ -******************* -Manual Optimization -******************* - -For advanced research topics like reinforcement learning, sparse coding, or GAN research, it may be desirable to -manually manage the optimization process. - -This is only recommended for experts who need ultimate flexibility. -Lightning will handle only accelerator, precision and strategy logic. -The users are left with ``optimizer.zero_grad()``, gradient accumulation, model toggling, etc.. - -To manually optimize, do the following: - -* Set ``self.automatic_optimization=False`` in your ``LightningModule``'s ``__init__``. -* Use the following functions and call them manually: - - * ``self.optimizers()`` to access your optimizers (one or multiple) - * ``optimizer.zero_grad()`` to clear the gradients from the previous training step - * ``self.manual_backward(loss)`` instead of ``loss.backward()`` - * ``optimizer.step()`` to update your model parameters - -Here is a minimal example of manual optimization. - -.. 
testcode:: python - - from pytorch_lightning import LightningModule - - - class MyModel(LightningModule): - def __init__(self): - super().__init__() - # Important: This property activates manual optimization. - self.automatic_optimization = False - - def training_step(self, batch, batch_idx): - opt = self.optimizers() - opt.zero_grad() - loss = self.compute_loss(batch) - self.manual_backward(loss) - opt.step() - -.. warning:: - Before 1.2, ``optimizer.step()`` was calling ``optimizer.zero_grad()`` internally. - From 1.2, it is left to the user's expertise. - -.. tip:: - Be careful where you call ``optimizer.zero_grad()``, or your model won't converge. - It is good practice to call ``optimizer.zero_grad()`` before ``self.manual_backward(loss)``. - - -Access your Own Optimizer -========================= - -The provided ``optimizer`` is a :class:`~pytorch_lightning.core.optimizer.LightningOptimizer` object wrapping your own optimizer -configured in your :meth:`~pytorch_lightning.core.lightning.LightningModule.configure_optimizers`. You can access your own optimizer -with ``optimizer.optimizer``. However, if you use your own optimizer to perform a step, Lightning won't be able to -support accelerators, precision and profiling for you. - -.. testcode:: python - - class Model(LightningModule): - def __init__(self): - super().__init__() - self.automatic_optimization = False - ... - - def training_step(self, batch, batch_idx): - optimizer = self.optimizers() - - # `optimizer` is a `LightningOptimizer` wrapping the optimizer. - # To access it, do the following. - # However, it won't work on TPU, AMP, etc... - optimizer = optimizer.optimizer - ... - -Gradient Accumulation -===================== - -You can accumulate gradients over batches similarly to ``accumulate_grad_batches`` argument in -:ref:`Trainer ` for automatic optimization. To perform gradient accumulation with one optimizer -after every ``N`` steps, you can do as such. - -.. 
testcode:: python - - def __init__(self): - super().__init__() - self.automatic_optimization = False - - - def training_step(self, batch, batch_idx): - opt = self.optimizers() - - loss = self.compute_loss(batch) - self.manual_backward(loss) - - # accumulate gradients of N batches - if (batch_idx + 1) % N == 0: - opt.step() - opt.zero_grad() - - -Use Multiple Optimizers (like GANs) -=================================== - -Here is an example training a simple GAN with multiple optimizers using manual optimization. - -.. testcode:: python - - import torch - from torch import Tensor - from pytorch_lightning import LightningModule - - - class SimpleGAN(LightningModule): - def __init__(self): - super().__init__() - self.G = Generator() - self.D = Discriminator() - - # Important: This property activates manual optimization. - self.automatic_optimization = False - - def sample_z(self, n) -> Tensor: - sample = self._Z.sample((n,)) - return sample - - def sample_G(self, n) -> Tensor: - z = self.sample_z(n) - return self.G(z) - - def training_step(self, batch, batch_idx): - # Implementation follows the PyTorch tutorial: - # https://pytorch.org/tutorials/beginner/dcgan_faces_tutorial.html - g_opt, d_opt = self.optimizers() - - X, _ = batch - batch_size = X.shape[0] - - real_label = torch.ones((batch_size, 1), device=self.device) - fake_label = torch.zeros((batch_size, 1), device=self.device) - - g_X = self.sample_G(batch_size) - - ########################## - # Optimize Discriminator # - ########################## - d_x = self.D(X) - errD_real = self.criterion(d_x, real_label) - - d_z = self.D(g_X.detach()) - errD_fake = self.criterion(d_z, fake_label) - - errD = errD_real + errD_fake - - d_opt.zero_grad() - self.manual_backward(errD) - d_opt.step() - - ###################### - # Optimize Generator # - ###################### - d_z = self.D(g_X) - errG = self.criterion(d_z, real_label) - - g_opt.zero_grad() - self.manual_backward(errG) - g_opt.step() - - self.log_dict({"g_loss": 
errG, "d_loss": errD}, prog_bar=True) - - def configure_optimizers(self): - g_opt = torch.optim.Adam(self.G.parameters(), lr=1e-5) - d_opt = torch.optim.Adam(self.D.parameters(), lr=1e-5) - return g_opt, d_opt - - -Learning Rate Scheduling -======================== - -Every optimizer you use can be paired with any -`Learning Rate Scheduler `_. Please see the -documentation of :meth:`~pytorch_lightning.core.lightning.LightningModule.configure_optimizers` for all the available options - -You can call ``lr_scheduler.step()`` at arbitrary intervals. -Use ``self.lr_schedulers()`` in your :class:`~pytorch_lightning.core.lightning.LightningModule` to access any learning rate schedulers -defined in your :meth:`~pytorch_lightning.core.lightning.LightningModule.configure_optimizers`. - -.. warning:: - * Before v1.3, Lightning automatically called ``lr_scheduler.step()`` in both automatic and manual optimization. From - 1.3, ``lr_scheduler.step()`` is now for the user to call at arbitrary intervals. - * Note that the ``lr_scheduler_config`` keys, such as ``"frequency"`` and ``"interval"``, will be ignored even if they are provided in - your :meth:`~pytorch_lightning.core.lightning.LightningModule.configure_optimizers` during manual optimization. - -Here is an example calling ``lr_scheduler.step()`` every step. - -.. testcode:: python - - # step every batch - def __init__(self): - super().__init__() - self.automatic_optimization = False - - - def training_step(self, batch, batch_idx): - # do forward, backward, and optimization - ... - - # single scheduler - sch = self.lr_schedulers() - sch.step() - - # multiple schedulers - sch1, sch2 = self.lr_schedulers() - sch1.step() - sch2.step() - -If you want to call ``lr_scheduler.step()`` every ``N`` steps/epochs, do the following. - -.. testcode:: python - - def __init__(self): - super().__init__() - self.automatic_optimization = False - - - def training_step(self, batch, batch_idx): - # do forward, backward, and optimization - ... 
- - sch = self.lr_schedulers() - - # step every N batches - if (batch_idx + 1) % N == 0: - sch.step() - - # step every N epochs - if self.trainer.is_last_batch and (self.trainer.current_epoch + 1) % N == 0: - sch.step() - -If you want to call schedulers that require a metric value after each epoch, consider doing the following: - -.. testcode:: - - def __init__(self): - super().__init__() - self.automatic_optimization = False - - - def training_epoch_end(self, outputs): - sch = self.lr_schedulers() - - # If the selected scheduler is a ReduceLROnPlateau scheduler. - if isinstance(sch, torch.optim.lr_scheduler.ReduceLROnPlateau): - sch.step(self.trainer.callback_metrics["loss"]) - -Use Closure for LBFGS-like Optimizers -===================================== - -It is a good practice to provide the optimizer with a closure function that performs a ``forward``, ``zero_grad`` and -``backward`` of your model. It is optional for most optimizers, but makes your code compatible if you switch to an -optimizer which requires a closure, such as :class:`~torch.optim.LBFGS`. - -See `the PyTorch docs `_ for more about the closure. - -Here is an example using a closure function. - -.. testcode:: python - - def __init__(self): - super().__init__() - self.automatic_optimization = False - - - def configure_optimizers(self): - return torch.optim.LBFGS(...) - - - def training_step(self, batch, batch_idx): - opt = self.optimizers() - - def closure(): - loss = self.compute_loss(batch) - opt.zero_grad() - self.manual_backward(loss) - return loss - - opt.step(closure=closure) - -.. warning:: - The :class:`~torch.optim.LBFGS` optimizer is not supported for apex AMP, native AMP, IPUs, or DeepSpeed. 
diff --git a/docs/_sources/model/own_your_loop.rst.txt b/docs/_sources/model/own_your_loop.rst.txt deleted file mode 100644 index 5982b0a..0000000 --- a/docs/_sources/model/own_your_loop.rst.txt +++ /dev/null @@ -1,41 +0,0 @@ -:orphan: - -################################ -Use a pure PyTorch training loop -################################ - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Enable manual optimization - :description: Gain control of the training loop with manual optimization and LightningModule methods. - :col_css: col-md-4 - :button_link: build_model_advanced.html - :height: 150 - :tag: advanced - -.. displayitem:: - :header: Use a Raw PyTorch Loop - :description: Migrate complex PyTorch projects to Lightning and push bleeding-edge research with the raw PyTorch loop. - :col_css: col-md-4 - :button_link: build_model_expert.html - :height: 150 - :tag: advanced - -.. displayitem:: - :header: Make a custom Lightning Loop - :description: Conduct bleeding-edge research like meta-learning and RL with a custom Loop. - :col_css: col-md-4 - :button_link: loops.html - :height: 150 - :tag: expert - -.. raw:: html - -
-
diff --git a/docs/_sources/model/train_model_basic.rst.txt b/docs/_sources/model/train_model_basic.rst.txt deleted file mode 100644 index 24bdab8..0000000 --- a/docs/_sources/model/train_model_basic.rst.txt +++ /dev/null @@ -1,129 +0,0 @@ -:orphan: - -##################### -Train a model (basic) -##################### -**Audience**: Users who need to train a model without coding their own training loops. - ----- - -*********** -Add imports -*********** -Add the relevant imports at the top of the file - -.. code:: python - - import os - import torch - from torch import nn - import torch.nn.functional as F - from torchvision import transforms - from torchvision.datasets import MNIST - from torch.utils.data import DataLoader, random_split - import pytorch_lightning as pl - ----- - -***************************** -Define the PyTorch nn.Modules -***************************** - -.. code:: python - - class Encoder(nn.Module): - def __init__(self): - self.l1 = nn.Sequential(nn.Linear(28 * 28, 64), nn.ReLU(), nn.Linear(64, 3)) - - def forward(self, x): - return self.l1(x) - - - class Decoder(nn.Module): - def __init__(self): - self.l1 = nn.Sequential(nn.Linear(3, 64), nn.ReLU(), nn.Linear(64, 28 * 28)) - - def forward(self, x): - return self.l1(x) - ----- - -************************ -Define a LightningModule -************************ -The LightningModule is the full **recipe** that defines how your nn.Modules interact. - -- The **training_step** defines how the *nn.Modules* interact together. -- In the **configure_optimizers** define the optimizer(s) for your models. - -.. code:: python - - class LitAutoEncoder(pl.LightningModule): - def __init__(self, encoder, decoder): - super().__init__() - self.encoder = encoder - self.decoder = decoder - - def training_step(self, batch, batch_idx): - # training_step defines the train loop. 
- x, y = batch - x = x.view(x.size(0), -1) - z = self.encoder(x) - x_hat = self.decoder(z) - loss = F.mse_loss(x_hat, x) - return loss - - def configure_optimizers(self): - optimizer = torch.optim.Adam(self.parameters(), lr=1e-3) - return optimizer - ----- - -*************************** -Define the training dataset -*************************** -Define a PyTorch :class:`~torch.utils.data.DataLoader` which contains your training dataset. - -.. code-block:: python - - dataset = MNIST(os.getcwd(), download=True, transform=transforms.ToTensor()) - train_loader = DataLoader(dataset) - ----- - -*************** -Train the model -*************** -To train the model use the Lightning :doc:`Trainer <../common/trainer>` which handles all the engineering and abstracts away all the complexity needed for scale. - -.. code-block:: python - - # model - autoencoder = LitAutoEncoder(Encoder(), Decoder()) - - # train model - trainer = pl.Trainer() - trainer.fit(model=autoencoder, train_dataloaders=train_loader) - ----- - -*************************** -Eliminate the training loop -*************************** -Under the hood, the Lightning Trainer runs the following training loop on your behalf - -.. code:: python - - autoencoder = LitAutoEncoder(encoder, decoder) - optimizer = autoencoder.configure_optimizers() - - for batch, batch_idx in enumerate(train_loader): - loss = autoencoder(batch, batch_idx) - - loss.backward() - optimizer.step() - optimizer.zero_grad() - -The power of Lightning comes when the training loop gets complicated as you add validation/test splits, schedulers, distributed training and all the latest SOTA techniques. - -With Lightning, you can mix all these techniques together without needing to rewrite a new loop every time. diff --git a/docs/_sources/starter/converting.rst.txt b/docs/_sources/starter/converting.rst.txt deleted file mode 100644 index 952a93a..0000000 --- a/docs/_sources/starter/converting.rst.txt +++ /dev/null @@ -1,197 +0,0 @@ -.. 
_converting: - -###################################### -How to Organize PyTorch Into Lightning -###################################### - -To enable your code to work with Lightning, perform the following to organize PyTorch into Lightning. - --------- - -******************************* -1. Keep your Computational Code -******************************* - -Keep your regular nn.Module architecture - -.. testcode:: - - import pytorch_lightning as pl - import torch - import torch.nn as nn - import torch.nn.functional as F - - - class LitModel(nn.Module): - def __init__(self): - super().__init__() - self.layer_1 = nn.Linear(28 * 28, 128) - self.layer_2 = nn.Linear(128, 10) - - def forward(self, x): - x = x.view(x.size(0), -1) - x = self.layer_1(x) - x = F.relu(x) - x = self.layer_2(x) - return x - --------- - -*************************** -2. Configure Training Logic -*************************** -In the training_step of the LightningModule configure how your training routine behaves with a batch of training data: - -.. testcode:: - - class LitModel(pl.LightningModule): - def __init__(self, encoder): - super().__init__() - self.encoder = encoder - - def training_step(self, batch, batch_idx): - x, y = batch - y_hat = self.encoder(x) - loss = F.cross_entropy(y_hat, y) - return loss - -.. note:: If you need to fully own the training loop for complicated legacy projects, check out :doc:`Own your loop <../model/own_your_loop>`. - ----- - -**************************************** -3. Move Optimizer(s) and LR Scheduler(s) -**************************************** -Move your optimizers to the :meth:`~pytorch_lightning.core.lightning.LightningModule.configure_optimizers` hook. - -.. 
testcode:: - - class LitModel(pl.LightningModule): - def configure_optimizers(self): - optimizer = torch.optim.Adam(self.encoder.parameters(), lr=1e-3) - lr_scheduler = torch.optim.lr_scheduler.StepLR(optimizer, step_size=1) - return [optimizer], [lr_scheduler] - --------- - -*************************************** -4. Organize Validation Logic (optional) -*************************************** -If you need a validation loop, configure how your validation routine behaves with a batch of validation data: - -.. testcode:: - - class LitModel(pl.LightningModule): - def validation_step(self, batch, batch_idx): - x, y = batch - y_hat = self.encoder(x) - val_loss = F.cross_entropy(y_hat, y) - self.log("val_loss", val_loss) - -.. tip:: ``trainer.validate()`` loads the best checkpoint automatically by default if checkpointing was enabled during fitting. - --------- - -************************************ -5. Organize Testing Logic (optional) -************************************ -If you need a test loop, configure how your testing routine behaves with a batch of test data: - -.. testcode:: - - class LitModel(pl.LightningModule): - def test_step(self, batch, batch_idx): - x, y = batch - y_hat = self.encoder(x) - test_loss = F.cross_entropy(y_hat, y) - self.log("test_loss", test_loss) - --------- - -**************************************** -6. Configure Prediction Logic (optional) -**************************************** -If you need a prediction loop, configure how your prediction routine behaves with a batch of test data: - -.. testcode:: - - class LitModel(LightningModule): - def predict_step(self, batch, batch_idx): - x, y = batch - pred = self.encoder(x) - return pred - --------- - -****************************************** -7. Remove any .cuda() or .to(device) Calls -****************************************** - -Your :doc:`LightningModule <../common/lightning_module>` can automatically run on any hardware! 
- -If you have any explicit calls to ``.cuda()`` or ``.to(device)``, you can remove them since Lightning makes sure that the data coming from :class:`~torch.utils.data.DataLoader` -and all the :class:`~torch.nn.Module` instances initialized inside ``LightningModule.__init__`` are moved to the respective devices automatically. -If you still need to access the current device, you can use ``self.device`` anywhere in your ``LightningModule`` except in the ``__init__`` and ``setup`` methods. - -.. testcode:: - - class LitModel(LightningModule): - def training_step(self, batch, batch_idx): - z = torch.randn(4, 5, device=self.device) - ... - -Hint: If you are initializing a :class:`~torch.Tensor` within the ``LightningModule.__init__`` method and want it to be moved to the device automatically you should call -:meth:`~torch.nn.Module.register_buffer` to register it as a buffer. - -.. testcode:: - - class LitModel(LightningModule): - def __init__(self): - super().__init__() - self.register_buffer("running_mean", torch.zeros(num_features)) - --------- - -******************** -8. Use your own data -******************** -Regular PyTorch DataLoaders work with Lightning. For more modular and scalable datasets, check out :doc:`LightningDataModule <../data/datamodule>`. - ----- - -************ -Good to know -************ - -Additionally, you can run only the validation loop using :meth:`~pytorch_lightning.trainer.trainer.Trainer.validate` method. - -.. code-block:: python - - model = LitModel() - trainer.validate(model) - -.. note:: ``model.eval()`` and ``torch.no_grad()`` are called automatically for validation. - - -The test loop isn't used within :meth:`~pytorch_lightning.trainer.trainer.Trainer.fit`, therefore, you would need to explicitly call :meth:`~pytorch_lightning.trainer.trainer.Trainer.test`. - -.. code-block:: python - - model = LitModel() - trainer.test(model) - -.. note:: ``model.eval()`` and ``torch.no_grad()`` are called automatically for testing. - -.. 
tip:: ``trainer.test()`` loads the best checkpoint automatically by default if checkpointing is enabled. - - -The predict loop will not be used until you call :meth:`~pytorch_lightning.trainer.trainer.Trainer.predict`. - -.. code-block:: python - - model = LitModel() - trainer.predict(model) - -.. note:: ``model.eval()`` and ``torch.no_grad()`` are called automatically for prediction. - -.. tip:: ``trainer.predict()`` loads the best checkpoint automatically by default if checkpointing is enabled. diff --git a/docs/_sources/starter/installation.rst.txt b/docs/_sources/starter/installation.rst.txt deleted file mode 100644 index 6b72585..0000000 --- a/docs/_sources/starter/installation.rst.txt +++ /dev/null @@ -1,72 +0,0 @@ -:orphan: - -.. _installation: - -############ -Installation -############ - --------------- - -********************* -Installation with pip -********************* - -Install any supported version of PyTorch if you want from `PyTorch Installation Page `_. -Now you can install using `pip `_ using the following command: - -.. code-block:: bash - - pip install pytorch-lightning - --------------- - -*********************** -Installation with Conda -*********************** - -If you don't have conda installed, follow the `Conda Installation Guide `_. -Lightning can be installed with `conda `_ using the following command: - -.. code-block:: bash - - conda install pytorch-lightning -c conda-forge - -You can also use `Conda Environments `_: - -.. code-block:: bash - - conda activate my_env - conda install pytorch-lightning -c conda-forge - --------------- - -************************ -Installation from Source -************************ - -Install nightly from the source. Note that it contains all the bug fixes and newly released features that -are not published yet. This is the bleeding edge, so use it at your own discretion. - -.. 
code-block:: bash - - pip install https://github.com/PyTorchLightning/pytorch-lightning/archive/master.zip - -Install future patch releases from the source. Note that the patch release contains only the bug fixes for the recent major release. - -.. code-block:: bash - - pip install https://github.com/PyTorchLightning/pytorch-lightning/archive/refs/heads/release/1.5.x.zip - --------------- - -****************** -Lightning Coverage -****************** - -PyTorch Lightning is maintained and tested on different Python and PyTorch versions. - -Check out the `CI Coverage `_ for more info. - -It is rigorously tested across multiple GPUs, TPUs, CPUs and IPUs. GPU tests run on two NVIDIA P100. TPU tests run on Google GKE TPUv2/3. -TPU py3.7 means we support Colab and Kaggle env. IPU tests run on MK1 IPU boxes. diff --git a/docs/_sources/starter/introduction.rst.txt b/docs/_sources/starter/introduction.rst.txt deleted file mode 100644 index a5e92d2..0000000 --- a/docs/_sources/starter/introduction.rst.txt +++ /dev/null @@ -1,406 +0,0 @@ -:orphan: - -############################### -Lightning 15분 만에 배워보기 -############################### - -**필요한 배경지식:** 없음 - -**목표:** 이 문서에서는 일반적인 Lightning 워크플로우의 주요한 7단계를 안내합니다. - -PyTorch Lightning(파이토치 라이트닝)은 대규모로 엄청 빠른 성능을 요구하면서 최대한의 유연성을 필요로 하는 -전문적인 AI 연구자들과 머신러닝 엔지니어들을 위한 "배터리가 포함된(batteries included)" 딥러닝 프레임워크입니다. - -.. join_slack:: - :align: left - :margin: 20 - -Lightning(라이트닝)은 반복적으로 사용하는 코드(boilerplate)를 제거하고 확장성(scalability)을 확보하도록 PyTorch 코드를 재구성합니다. - -.. raw:: html - - - -| - -PyTorch 코드를 재구성함으로써, Lightning에서는 이런 것들이 가능해집니다: - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: 완전한 유연성 - :description: 반복되는 코드 없이 PyTorch를 그대로 사용하여 아이디어를 구현합니다. - :col_css: col-md-3 - :image_center: https://pl-bolts-doc-images.s3.us-east-2.amazonaws.com/card_full_control.png - :height: 290 - -.. displayitem:: - :header: 재현성 + 가독성 - :description: 연구용 코드와 엔지니어링 코드를 분리하여 재현성을 갖추고 더 나은 가독성을 제공합니다. - :col_css: col-md-3 - :image_center: https://pl-bolts-doc-images.s3.us-east-2.amazonaws.com/card_no_boilerplate.png - :height: 290 - -.. displayitem:: - :header: 간단한 다중 GPU 학습 - :description: 코드 변경 없이 여러개의 GPU/TPU/HPU 등을 사용합니다. - :col_css: col-md-3 - :image_center: https://pl-bolts-doc-images.s3.us-east-2.amazonaws.com/card_hardware.png - :height: 290 - -.. displayitem:: - :header: 테스트 완료 - :description: 이미 모든 테스트를 완료하여 직접 테스트 할 필요없습니다. - :col_css: col-md-3 - :image_center: https://pl-bolts-doc-images.s3.us-east-2.amazonaws.com/card_testing.png - :height: 290 - -.. raw:: html - -
-
- -.. End of callout item section - ----- - -****************************** -1: PyTorch Lightning 설치하기 -****************************** -.. raw:: html - -
-
- -`pip `_ 사용자라면, - -.. code-block:: bash - - pip install pytorch-lightning - -.. raw:: html - -
-
- -`conda `_ 사용자라면, - -.. code-block:: bash - - conda install pytorch-lightning -c conda-forge - -.. raw:: html - -
-
- -또는 `advanced install guide `_ 를 참조하세요. - ----- - -.. _new_project: - -***************************** -2: LightningModule 정의하기 -***************************** - -LightningModule을 사용하여 PyTorch nn.Module이 training_step (뿐만 아니라 validation_step이나 test_step) 내에서 복잡한 방식으로 함께 동작할 수 있도록 합니다. - -.. testcode:: - - import os - from torch import optim, nn, utils, Tensor - from tests.helpers.datasets import MNIST - import pytorch_lightning as pl - - # 원하는만큼의 nn.Module (또는 기존 모델)을 정의합니다. - encoder = nn.Sequential(nn.Linear(28 * 28, 64), nn.ReLU(), nn.Linear(64, 3)) - decoder = nn.Sequential(nn.Linear(3, 64), nn.ReLU(), nn.Linear(64, 28 * 28)) - - # LightningModule을 정의합니다. - class LitAutoEncoder(pl.LightningModule): - def __init__(self, encoder, decoder): - super().__init__() - self.encoder = encoder - self.decoder = decoder - - def training_step(self, batch, batch_idx): - # training_step defines the train loop. - # it is independent of forward - x, y = batch - x = x.view(x.size(0), -1) - z = self.encoder(x) - x_hat = self.decoder(z) - loss = nn.functional.mse_loss(x_hat, x) - # Logging to TensorBoard by default - self.log("train_loss", loss) - return loss - - def configure_optimizers(self): - optimizer = optim.Adam(self.parameters(), lr=1e-3) - return optimizer - - - # 오토인코더(autoencoder)를 초기화합니다. - autoencoder = LitAutoEncoder(encoder, decoder) - ----- - -********************** -3: 데이터셋 정의하기 -********************** - -Lightning은 *어떠한* 순회 가능한 객체(iterable; :class:`~torch.utils.data.DataLoader`, numpy 등...)도 학습/검증/테스트/예측용으로 나누어 사용할 수 있습니다. - -.. code-block:: python - - # 데이터를 설정합니다. - dataset = MNIST(os.getcwd(), download=True) - train_loader = utils.data.DataLoader(dataset) - ----- - -****************** -4: 모델 학습하기 -****************** - -Lightning :doc:`Trainer <../common/trainer>` 는 모든 :doc:`LightningModule <../common/lightning_module>` 과 데이터셋을 "함께(mix)" 학습할 수 있으며, -확장에 필요한 모든 엔지니어링적 복잡성들을 추상화(abstract)합니다. - -.. 
code-block:: python - - # 모델을 학습합니다 (힌트: 빠른 아이디어 반복에 도움이 되는 Trainer의 인자들을 참고하세요) - trainer = pl.Trainer(limit_train_batches=100, max_epochs=1) - trainer.fit(model=autoencoder, train_dataloaders=train_loader) - -Lightning :doc:`Trainer <../common/trainer>` 는 아래 예시들을 포함하여 `40종류 이상의 기법들 <../common/trainer.html#trainer-flags>`_ 을 자동화합니다: - -* 에폭(epoch) 및 배치(batch) 반복 -* ``optimizer.step()``, ``loss.backward()``, ``optimizer.zero_grad()`` 호출 -* 평가(evaluation) 도중 경사도(grads) 활성화/비활성화를 위한 ``model.eval()`` 호출 -* :doc:`체크포인트(checkpoint) 저장하기 및 불러오기 <../common/checkpointing>` -* 텐서보드(tensorboard) (:doc:`loggers <../visualize/loggers>` 옵션 참조) -* :doc:`Multi-GPU <../accelerators/gpu>` 지원 -* :doc:`TPU <../accelerators/tpu>` -* :ref:`16비트 정밀도(precision) AMP ` 지원 - ----- - - -****************** -5: 모델 사용하기 -****************** - -모델을 학습한 뒤에는 ONNX, TorchScript로 내보내기(export)하여 상용 환경에 포함하거나 단순히 가중치를 불러오고 예측을 실행할 수 있습니다. - -.. code:: python - - # 체크포인트(checkpoint)를 불러옵니다. - checkpoint = "./lightning_logs/version_0/checkpoints/epoch=0-step=100.ckpt" - autoencoder = LitAutoEncoder.load_from_checkpoint(checkpoint, encoder=encoder, decoder=decoder) - - # 학습한 nn.Module을 선택합니다. - encoder = autoencoder.encoder - encoder.eval() - - # 4개의 가짜 이미지로 예측(embed)합니다! - fake_image_batch = Tensor(4, 28 * 28) - embeddings = encoder(fake_image_batch) - print("⚡" * 20, "\nPredictions (4 image embeddings):\n", embeddings, "\n", "⚡" * 20) - ----- - -********************* -6: 학습 시각화하기 -********************* - -Lightning에는 *많은* 배터리가 포함되어 있습니다. 실험을 시각화하는데 사용하는 텐서보드(Tensorboard)도 유용한 도구 중 하나입니다. - -명령줄(commandline)에서 아래를 실행하고 브라우저에서 **http://localhost:6006/** 을 열어보세요. - -.. code:: bash - - tensorboard --logdir . - ----- - -************************* -7: 엄청 빠르게 학습하기 -************************* - -Trainer에 인자(argument)를 사용하여 고급 학습 기능을 사용할 수 있습니다. 이는 다른 코드를 변경하지 않으면서 학습 단계(train loop)에 자동으로 통합할 수 있도록 하는 최신(state-of-the-art)의 기술입니다. - -.. 
code:: - - # 4개의 GPU에서 학습 - trainer = Trainer( - devices=4, - accelerator="gpu", - ) - - # Deepspeed/FSDP를 사용하여 1TB 이상의 매개변수를 갖는 모델 학습 - trainer = Trainer( - devices=4, - accelerator="gpu", - strategy="deepspeed_stage_2", - precision=16 - ) - - # 빠른 아이디어 반복을 위한 20개 이상의 유용한 플래그(flag) - trainer = Trainer( - max_epochs=10, - min_epochs=5, - overfit_batches=1 - ) - - # 최신 기술을 사용 - trainer = Trainer(callbacks=[StochasticWeightAveraging(...)]) - ----- - -******************** -유연성 극대화하기 -******************** - -Lightning의 핵심 원칙은 **PyTorch의 어떠한 부분도 숨기지 않으면서** 언제나 최대한의 유연성을 제공하는 것입니다. - -Lightning은 프로젝트의 복잡도에 따라 *추가적인* 5단계의 유연성을 제공합니다. - ----- - -학습 단계(loop) 사용자 정의하기 -================================== - -.. image:: https://pl-bolts-doc-images.s3.us-east-2.amazonaws.com/custom_loop.png - :width: 600 - :alt: Injecting custom code in a training loop - -LightningModule에서 사용할 수 있는 20개 이상의 메소드 (:ref:`lightning_hooks`) 중 일부를 사용하여 훈련 단계 어디에든 사용자 정의 코드를 삽입할 수 있습니다. - -.. testcode:: - - class LitAutoEncoder(pl.LightningModule): - def backward(self, loss, optimizer, optimizer_idx): - loss.backward() - ----- - -Trainer 확장하기 -================== - -.. raw:: html - - - -유사한 기능을 하는 여러줄의 코드가 있는 경우, 콜백(callback)을 사용하여 손쉽게 그룹으로 묶어서 해당하는 코드들을 동시에 켜거나 끌 수 있습니다. - -.. code:: - - trainer = Trainer(callbacks=[AWSCheckpoints()]) - ----- - -PyTorch 자체의 반복(loop) 사용하기 -=================================== - -최첨단 연구 시 특정 유형의 작업들을 위해, Lightning은 전문가들이 다양한 방식으로 학습 단계를 완전히 제어할 수 있는 기능을 제공합니다. - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: 직접 최적화(manual optimization) - :description: 자동화된 학습 단계에서 최적화 단계는 사용자가 직접 관여합니다. - :col_css: col-md-4 - :image_center: https://pl-bolts-doc-images.s3.us-east-2.amazonaws.com/manual_opt.png - :button_link: ../model/build_model_advanced.html#manual-optimization - :image_height: 220px - :height: 320 - -.. displayitem:: - :header: Lightning Lite(라이트닝 라이트) - :description: 복잡한 PyTorch 프로젝트를 이관하기 위한 반복 단계를 완벽히 제어합니다. - :col_css: col-md-4 - :image_center: https://pl-bolts-doc-images.s3.us-east-2.amazonaws.com/lite.png - :button_link: ../model/build_model_expert.html - :image_height: 220px - :height: 320 - -.. displayitem:: - :header: 반복(Loop) - :description: 메타학습(meta-learning), 강화학습(reinforcement learning), GAN을 완벽히 제어합니다. - :col_css: col-md-4 - :image_center: https://pl-bolts-doc-images.s3.us-east-2.amazonaws.com/loops.png - :button_link: ../extensions/loops.html - :image_height: 220px - :height: 320 - -.. raw:: html - -
-
- -.. End of callout item section - ----- - -********** -다음 단계 -********** - -사용 사례에 따라, 아래 내용들 중 하나를 다음 단계로 살펴보세요. - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Level 2: Add a validation and test set - :description: Add validation and test sets to avoid over/underfitting. - :button_link: ../levels/basic_level_2.html - :col_css: col-md-3 - :height: 180 - :tag: basic - -.. displayitem:: - :header: See more examples - :description: See examples across computer vision, NLP, RL, etc... - :col_css: col-md-3 - :button_link: ../tutorials.html - :height: 180 - :tag: basic - -.. displayitem:: - :header: I need my raw PyTorch Loop - :description: Expert-level control for researchers working on the bleeding-edge - :col_css: col-md-3 - :button_link: ../model/build_model_expert.html - :height: 180 - :tag: expert - -.. displayitem:: - :header: Deploy your model - :description: Learn how to predict or put your model into production - :col_css: col-md-3 - :button_link: ../deploy/production.html - :height: 180 - :tag: basic - -.. raw:: html - -
-
diff --git a/docs/_sources/starter/lightning_lite.rst.txt b/docs/_sources/starter/lightning_lite.rst.txt deleted file mode 100644 index 61b69cd..0000000 --- a/docs/_sources/starter/lightning_lite.rst.txt +++ /dev/null @@ -1,727 +0,0 @@ -########################################### -LightningLite (Stepping Stone to Lightning) -########################################### - - -:class:`~pytorch_lightning.lite.LightningLite` enables pure PyTorch users to scale their existing code -on any kind of device while retaining full control over their own loops and optimization logic. - -.. image:: https://pl-public-data.s3.amazonaws.com/docs/static/images/lite/lightning_lite.gif - :alt: Animation showing how to convert your PyTorch code to LightningLite. - :width: 500 - :align: center - -| - -:class:`~pytorch_lightning.lite.LightningLite` is the right tool for you if you match one of the two following descriptions: - -- I want to quickly scale my existing code to multiple devices with minimal code changes. -- I would like to convert my existing code to the Lightning API, but a full path to Lightning transition might be too complex. I am looking for a stepping stone to ensure reproducibility during the transition. - - -.. warning:: :class:`~pytorch_lightning.lite.LightningLite` is currently a beta feature. Its API is subject to change based on your feedback. - - ----------- - -**************** -Learn by example -**************** - - -My Existing PyTorch Code -======================== - -The ``run`` function contains custom training loop used to train ``MyModel`` on ``MyDataset`` for ``num_epochs`` epochs. - -.. code-block:: python - - import torch - from torch import nn - from torch.utils.data import DataLoader, Dataset - - - class MyModel(nn.Module): - ... - - - class MyDataset(Dataset): - ... - - - def run(args): - device = "cuda" if torch.cuda.is_available() else "cpu" - - model = MyModel(...).to(device) - optimizer = torch.optim.SGD(model.parameters(), ...) 
- - dataloader = DataLoader(MyDataset(...), ...) - - model.train() - for epoch in range(args.num_epochs): - for batch in dataloader: - batch = batch.to(device) - optimizer.zero_grad() - loss = model(batch) - loss.backward() - optimizer.step() - - - run(args) - ----------- - - -Convert to LightningLite -======================== - -Here are five required steps to convert to :class:`~pytorch_lightning.lite.LightningLite`. - -1. Subclass :class:`~pytorch_lightning.lite.LightningLite` and override its :meth:`~pytorch_lightning.lite.LightningLite.run` method. -2. Move the body of your existing ``run`` function into :class:`~pytorch_lightning.lite.LightningLite` ``run`` method. -3. Remove all ``.to(...)``, ``.cuda()`` etc calls since :class:`~pytorch_lightning.lite.LightningLite` will take care of it. -4. Apply :meth:`~pytorch_lightning.lite.LightningLite.setup` over each model and optimizers pair and :meth:`~pytorch_lightning.lite.LightningLite.setup_dataloaders` on all your dataloaders and replace ``loss.backward()`` by ``self.backward(loss)``. -5. Instantiate your :class:`~pytorch_lightning.lite.LightningLite` subclass and call its :meth:`~pytorch_lightning.lite.LightningLite.run` method. - -| - -.. code-block:: python - - import torch - from torch import nn - from torch.utils.data import DataLoader, Dataset - from pytorch_lightning.lite import LightningLite - - - class MyModel(nn.Module): - ... - - - class MyDataset(Dataset): - ... - - - class Lite(LightningLite): - def run(self, args): - - model = MyModel(...) - optimizer = torch.optim.SGD(model.parameters(), ...) - model, optimizer = self.setup(model, optimizer) # Scale your model / optimizers - - dataloader = DataLoader(MyDataset(...), ...) 
- dataloader = self.setup_dataloaders(dataloader) # Scale your dataloaders - - model.train() - for epoch in range(args.num_epochs): - for batch in dataloader: - optimizer.zero_grad() - loss = model(batch) - self.backward(loss) # instead of loss.backward() - optimizer.step() - - - Lite(...).run(args) - - -That's all. You can now train on any kind of device and scale your training. Check out `this `_ full MNIST training example with LightningLite. - -:class:`~pytorch_lightning.lite.LightningLite` takes care of device management, so you don't have to. -You should remove any device-specific logic within your code. - -Here is how to train on eight GPUs with `torch.bfloat16 `_ precision: - -.. code-block:: python - - Lite(strategy="ddp", devices=8, accelerator="gpu", precision="bf16").run(10) - -Here is how to use `DeepSpeed Zero3 `_ with eight GPUs and precision 16: - -.. code-block:: python - - Lite(strategy="deepspeed", devices=8, accelerator="gpu", precision=16).run(10) - -:class:`~pytorch_lightning.lite.LightningLite` can also figure it out automatically for you! - -.. code-block:: python - - Lite(devices="auto", accelerator="auto", precision=16).run(10) - -You can also easily use distributed collectives if required. -Here is an example while running on 256 GPUs (eight GPUs times 32 nodes). - -.. code-block:: python - - class Lite(LightningLite): - def run(self): - - # Transfer and concatenate tensors across processes - self.all_gather(...) - - # Transfer an object from one process to all the others - self.broadcast(..., src=...) - - # The total number of processes running across all devices and nodes. - self.world_size - - # The global index of the current process across all devices and nodes. - self.global_rank - - # The index of the current process among the processes running on the local node. - self.local_rank - - # The index of the current node. - self.node_rank - - # Whether this global rank is rank zero. 
- if self.is_global_zero: - # do something on rank 0 - ... - - # Wait for all processes to enter this call. - self.barrier() - - - Lite(strategy="ddp", devices=8, num_nodes=32, accelerator="gpu").run() - - -If you require custom data or model device placement, you can deactivate -:class:`~pytorch_lightning.lite.LightningLite` automatic placement by doing -``self.setup_dataloaders(..., move_to_device=False)`` for the data and -``self.setup(..., move_to_device=False)`` for the model. -Furthermore, you can access the current device from ``self.device`` or -rely on :meth:`~pytorch_lightning.lite.LightningLite.to_device` -utility to move an object to the current device. - - -.. note:: We recommend instantiating the models within the :meth:`~pytorch_lightning.lite.LightningLite.run` method as large models would cause an out-of-memory error otherwise. - -.. tip:: - - If you have hundreds or thousands of lines within your :meth:`~pytorch_lightning.lite.LightningLite.run` function - and you are feeling unsure about them, then that is the correct feeling. - In 2019, our :class:`~pytorch_lightning.core.lightning.LightningModule` was getting larger - and we got the same feeling, so we started to organize our code for simplicity, interoperability and standardization. - This is definitely a good sign that you should consider refactoring your code and / or switching to - :class:`~pytorch_lightning.core.lightning.LightningModule` ultimately. - - ----------- - - -Distributed Training Pitfalls -============================= - -The :class:`~pytorch_lightning.lite.LightningLite` provides you with the tools to scale your training, -but there are several major challenges ahead of you now: - - -.. list-table:: - :widths: 50 50 - :header-rows: 0 - - * - Processes divergence - - This happens when processes execute a different section of the code due to different if/else conditions, race conditions on existing files and so on, resulting in hanging. 
- * - Cross processes reduction - - Miscalculated metrics or gradients due to errors in their reduction. - * - Large sharded models - - Instantiation, materialization and state management of large models. - * - Rank 0 only actions - - Logging, profiling, and so on. - * - Checkpointing / Early stopping / Callbacks / Logging - - Ability to customize your training behavior easily and make it stateful. - * - Fault-tolerant training - - Ability to resume from a failure as if it never happened. - - -If you are facing one of those challenges, then you are already meeting the limit of :class:`~pytorch_lightning.lite.LightningLite`. -We recommend you to convert to :doc:`Lightning <../starter/introduction>`, so you never have to worry about those. - ----------- - -Convert to Lightning -==================== - -:class:`~pytorch_lightning.lite.LightningLite` is a stepping stone to transition fully to the Lightning API and benefit -from its hundreds of features. - -You can see our :class:`~pytorch_lightning.lite.LightningLite` class as a -future :class:`~pytorch_lightning.core.lightning.LightningModule`, and slowly refactor your code into its API. -Below, the :meth:`~pytorch_lightning.core.lightning.LightningModule.training_step`, :meth:`~pytorch_lightning.core.lightning.LightningModule.forward`, -:meth:`~pytorch_lightning.core.lightning.LightningModule.configure_optimizers`, :meth:`~pytorch_lightning.core.lightning.LightningModule.train_dataloader` methods -are implemented. - - -.. code-block:: python - - class Lite(LightningLite): - - # 1. This would become the LightningModule `__init__` function. - def run(self, args): - self.args = args - - self.model = MyModel(...) - - self.fit() # This would be automated by the Lightning Trainer. - - # 2. This can be fully removed as Lightning creates its own fitting loop, - # and sets up the model, optimizer, dataloader, etc for you. 
- def fit(self): - # setup everything - optimizer = self.configure_optimizers() - self.model, optimizer = self.setup(self.model, optimizer) - dataloader = self.setup_dataloaders(self.train_dataloader()) - - # start fitting - self.model.train() - for epoch in range(self.args.num_epochs): - for batch_idx, batch in enumerate(dataloader): - optimizer.zero_grad() - loss = self.training_step(batch, batch_idx) - self.backward(loss) - optimizer.step() - - # 3. This stays here as it belongs to the LightningModule. - def forward(self, x): - return self.model(x) - - def training_step(self, batch, batch_idx): - return self.forward(batch) - - def configure_optimizers(self): - return torch.optim.SGD(self.model.parameters(), ...) - - # 4. [Optionally] This can stay here or be extracted to the LightningDataModule to enable higher composability. - def train_dataloader(self): - return DataLoader(MyDataset(...), ...) - - - Lite(...).run(args) - - -Finally, change the :meth:`~pytorch_lightning.lite.LightningLite.run` into a -:meth:`~pytorch_lightning.core.lightning.LightningModule.__init__` and drop the ``fit`` call from inside. - -.. code-block:: python - - from pytorch_lightning import LightningDataModule, LightningModule, Trainer - - - class LightningModel(LightningModule): - def __init__(self, args): - super().__init__() - self.model = MyModel(...) - - def forward(self, x): - return self.model(x) - - def training_step(self, batch, batch_idx): - loss = self(batch) - self.log("train_loss", loss) - return loss - - def configure_optimizers(self): - return torch.optim.SGD(self.model.parameters(), lr=0.001) - - - class BoringDataModule(LightningDataModule): - def train_dataloader(self): - return DataLoader(MyDataset(...), ...) - - - trainer = Trainer(max_epochs=10) - trainer.fit(LightningModel(args), datamodule=BoringDataModule()) - - -You have successfully converted to PyTorch Lightning, and can now benefit from its hundreds of features! 
- ----------- - -******************** -Lightning Lite Flags -******************** - -Lite is specialized in accelerated distributed training and inference. It offers you convenient ways to configure -your device and communication strategy and to switch seamlessly from one to the other. The terminology and usage are -identical to Lightning, which means minimum effort for you to convert when you decide to do so. - - -accelerator -=========== - -Choose one of ``"cpu"``, ``"gpu"``, ``"tpu"``, ``"auto"`` (IPU support is coming soon). - -.. code-block:: python - - # CPU accelerator - lite = Lite(accelerator="cpu") - - # Running with GPU Accelerator using 2 GPUs - lite = Lite(devices=2, accelerator="gpu") - - # Running with TPU Accelerator using 8 tpu cores - lite = Lite(devices=8, accelerator="tpu") - - # Running with GPU Accelerator using the DistributedDataParallel strategy - lite = Lite(devices=4, accelerator="gpu", strategy="ddp") - -The ``"auto"`` option recognizes the machine you are on and selects the available accelerator. - -.. code-block:: python - - # If your machine has GPUs, it will use the GPU Accelerator - lite = Lite(devices=2, accelerator="auto") - - -strategy -======== - -Choose a training strategy: ``"dp"``, ``"ddp"``, ``"ddp_spawn"``, ``"tpu_spawn"``, ``"deepspeed"``, ``"ddp_sharded"``, or ``"ddp_sharded_spawn"``. - -.. code-block:: python - - # Running with the DistributedDataParallel strategy on 4 GPUs - lite = Lite(strategy="ddp", accelerator="gpu", devices=4) - - # Running with the DDP Spawn strategy using 4 cpu processes - lite = Lite(strategy="ddp_spawn", accelerator="cpu", devices=4) - - -Additionally, you can pass in your custom strategy by configuring additional parameters. - -.. code-block:: python - - from pytorch_lightning.strategies import DeepSpeedStrategy - - lite = Lite(strategy=DeepSpeedStrategy(stage=2), accelerator="gpu", devices=2) - - -Support for Horovod and Fully Sharded training strategies are coming soon. 
- - -devices -======= - -Configure the devices to run on. Can be of type: - -- int: the number of devices (e.g., GPUs) to train on -- list of int: which device index (e.g., GPU ID) to train on (0-indexed) -- str: a string representation of one of the above - -.. code-block:: python - - # default used by Lite, i.e., use the CPU - lite = Lite(devices=None) - - # equivalent - lite = Lite(devices=0) - - # int: run on two GPUs - lite = Lite(devices=2, accelerator="gpu") - - # list: run on GPUs 1, 4 (by bus ordering) - lite = Lite(devices=[1, 4], accelerator="gpu") - lite = Lite(devices="1, 4", accelerator="gpu") # equivalent - - # -1: run on all GPUs - lite = Lite(devices=-1, accelerator="gpu") - lite = Lite(devices="-1", accelerator="gpu") # equivalent - - - -gpus -==== - -.. warning:: ``gpus=x`` has been deprecated in v1.7 and will be removed in v2.0. - Please use ``accelerator='gpu'`` and ``devices=x`` instead. - -Shorthand for setting ``devices=X`` and ``accelerator="gpu"``. - -.. code-block:: python - - # Run on two GPUs - lite = Lite(accelerator="gpu", devices=2) - - # Equivalent - lite = Lite(devices=2, accelerator="gpu") - - -tpu_cores -========= - -.. warning:: ``tpu_cores=x`` has been deprecated in v1.7 and will be removed in v2.0. - Please use ``accelerator='tpu'`` and ``devices=x`` instead. - -Shorthand for ``devices=X`` and ``accelerator="tpu"``. - -.. code-block:: python - - # Run on eight TPUs - lite = Lite(accelerator="tpu", devices=8) - - # Equivalent - lite = Lite(devices=8, accelerator="tpu") - - -num_nodes -========= - - -Number of cluster nodes for distributed operation. - -.. code-block:: python - - # Default used by Lite - lite = Lite(num_nodes=1) - - # Run on 8 nodes - lite = Lite(num_nodes=8) - - -Learn more about distributed multi-node training on clusters :doc:`here <../clouds/cluster>`. - - -precision -========= - -Lightning Lite supports double precision (64), full precision (32), or half precision (16) operation (including `bfloat16 `_). 
-Half precision, or mixed precision, is the combined use of 32 and 16-bit floating points to reduce the memory footprint during model training. -This can result in improved performance, achieving significant speedups on modern GPUs. - -.. code-block:: python - - # Default used by the Lite - lite = Lite(precision=32, devices=1) - - # 16-bit (mixed) precision - lite = Lite(precision=16, devices=1) - - # 16-bit bfloat precision - lite = Lite(precision="bf16", devices=1) - - # 64-bit (double) precision - lite = Lite(precision=64, devices=1) - - -plugins -======= - -:ref:`Plugins` allow you to connect arbitrary backends, precision libraries, clusters etc. For example: -To define your own behavior, subclass the relevant class and pass it in. Here's an example linking up your own -:class:`~pytorch_lightning.plugins.environments.ClusterEnvironment`. - -.. code-block:: python - - from pytorch_lightning.plugins.environments import ClusterEnvironment - - - class MyCluster(ClusterEnvironment): - @property - def main_address(self): - return your_main_address - - @property - def main_port(self): - return your_main_port - - def world_size(self): - return the_world_size - - - lite = Lite(plugins=[MyCluster()], ...) - - ----------- - - -********************** -Lightning Lite Methods -********************** - - -run -=== - -The run method serves two purposes: - -1. Override this method from the :class:`~pytorch_lightning.lite.lite.LightningLite` class and put your - training (or inference) code inside. -2. Launch the training procedure by calling the run method. Lite will take care of setting up the distributed backend. - -You can optionally pass arguments to the run method. For example, the hyperparameters or a backbone for the model. - -.. 
code-block:: python - - from pytorch_lightning.lite import LightningLite - - - class Lite(LightningLite): - - # Input arguments are optional; put whatever you need - def run(self, learning_rate, num_layers): - """Here goes your training loop""" - - - lite = Lite(accelerator="gpu", devices=2) - lite.run(learning_rate=0.01, num_layers=12) - - -setup -===== - -Set up a model and corresponding optimizer(s). If you need to set up multiple models, call ``setup()`` on each of them. -Moves the model and optimizer to the correct device automatically. - -.. code-block:: python - - model = nn.Linear(32, 64) - optimizer = torch.optim.SGD(model.parameters(), lr=0.001) - - # Set up model and optimizer for accelerated training - model, optimizer = self.setup(model, optimizer) - - # If you don't want Lite to set the device - model, optimizer = self.setup(model, optimizer, move_to_device=False) - - -The setup method also prepares the model for the selected precision choice so that operations during ``forward()`` get -cast automatically. - -setup_dataloaders -================= - -Set up one or multiple dataloaders for accelerated operation. If you are running a distributed strategy (e.g., DDP), Lite -replaces the sampler automatically for you. In addition, the dataloader will be configured to move the returned -data tensors to the correct device automatically. - -.. code-block:: python - - train_data = torch.utils.data.DataLoader(train_dataset, ...) - test_data = torch.utils.data.DataLoader(test_dataset, ...) 
- - train_data, test_data = self.setup_dataloaders(train_data, test_data) - - # If you don't want Lite to move the data to the device - train_data, test_data = self.setup_dataloaders(train_data, test_data, move_to_device=False) - - # If you don't want Lite to replace the sampler in the context of distributed training - train_data, test_data = self.setup_dataloaders(train_data, test_data, replace_sampler=False) - - -backward -======== - -This replaces any occurrences of ``loss.backward()`` and makes your code accelerator and precision agnostic. - -.. code-block:: python - - output = model(input) - loss = loss_fn(output, target) - - # loss.backward() - self.backward(loss) - - -to_device -========= - -Use :meth:`~pytorch_lightning.lite.lite.LightningLite.to_device` to move models, tensors or collections of tensors to -the current device. By default :meth:`~pytorch_lightning.lite.lite.LightningLite.setup` and -:meth:`~pytorch_lightning.lite.lite.LightningLite.setup_dataloaders` already move the model and data to the correct -device, so calling this method is only necessary for manual operation when needed. - -.. code-block:: python - - data = torch.load("dataset.pt") - data = self.to_device(data) - - -seed_everything -=============== - -Make your code reproducible by calling this method at the beginning of your run. - -.. code-block:: python - - # Instead of `torch.manual_seed(...)`, call: - self.seed_everything(1234) - - -This covers PyTorch, NumPy and Python random number generators. In addition, Lite takes care of properly initializing -the seed of dataloader worker processes (can be turned off by passing ``workers=False``). - - -autocast -======== - -Let the precision backend autocast the block of code under this context manager. This is optional and already done by -Lite for the model's forward method (once the model was :meth:`~pytorch_lightning.lite.lite.LightningLite.setup`). 
-You need this only if you wish to autocast more operations outside the ones in model forward: - -.. code-block:: python - - model, optimizer = self.setup(model, optimizer) - - # Lite handles precision automatically for the model - output = model(inputs) - - with self.autocast(): # optional - loss = loss_function(output, target) - - self.backward(loss) - ... - - -print -===== - -Print to the console via the built-in print function, but only on the main process. -This avoids excessive printing and logs when running on multiple devices/nodes. - - -.. code-block:: python - - # Print only on the main process - self.print(f"{epoch}/{num_epochs}| Train Epoch Loss: {loss}") - - -save -==== - -Save contents to a checkpoint. Replaces all occurrences of ``torch.save(...)`` in your code. Lite will take care of -handling the saving part correctly, no matter if you are running a single device, multi-devices or multi-nodes. - -.. code-block:: python - - # Instead of `torch.save(...)`, call: - self.save(model.state_dict(), "path/to/checkpoint.ckpt") - - -load -==== - -Load checkpoint contents from a file. Replaces all occurrences of ``torch.load(...)`` in your code. Lite will take care of -handling the loading part correctly, no matter if you are running a single device, multi-device, or multi-node. - -.. code-block:: python - - # Instead of `torch.load(...)`, call: - self.load("path/to/checkpoint.ckpt") - - -barrier -======= - -Call this if you want all processes to wait and synchronize. Once all processes have entered this call, -execution continues. Useful for example when you want to download data on one process and make all others wait until -the data is written to disk. - -.. 
code-block:: python - - # Download data only on one process - if self.global_rank == 0: - download_data("http://...") - - # Wait until all processes meet up here - self.barrier() - - # All processes are allowed to read the data now diff --git a/docs/_sources/starter/style_guide.rst.txt b/docs/_sources/starter/style_guide.rst.txt deleted file mode 100644 index ecdbae6..0000000 --- a/docs/_sources/starter/style_guide.rst.txt +++ /dev/null @@ -1,231 +0,0 @@ -################ -스타일 가이드 -################ - -파이토치 라이트닝(PyTorch Lightning)의 주요한 목표는 가독성과 재현성을 개선하는 것입니다. GitHub 저장소나 연구 프로젝트에서 -:class:`~pytorch_lightning.core.lightning.LightningModule` 을 발견하고, 관심있는 부분을 찾기 위해 정확히 어디를 봐야할지 정확히 알고 있다고 상상해보세요. - -이 스타일 가이드의 목표는 Lightning의 코드가 유사하게 구성되도록 권장하는데 있습니다. - --------------- - -*************** -LightningModule -*************** - -These are best practices for structuring your :class:`~pytorch_lightning.core.lightning.LightningModule` class: - -Systems vs Models -================= - -.. figure:: https://pl-bolts-doc-images.s3.us-east-2.amazonaws.com/pl_docs/model_system.png - :width: 400 - -The main principle behind a LightningModule is that a full system should be self-contained. -In Lightning, we differentiate between a system and a model. - -A model is something like a resnet18, RNN, and so on. - -A system defines how a collection of models interact with each other with user-defined training/evaluation logic. Examples of this are: - -* GANs -* Seq2Seq -* BERT -* etc. - -A LightningModule can define both a system and a model: - -Here's a LightningModule that defines a system. This structure is what we recommend as a best practice. Keeping the model separate from the system improves -modularity, which eventually helps in better testing, reduces dependencies on the system and makes it easier to refactor. - -.. testcode:: - - class Encoder(nn.Module): - ... - - - class Decoder(nn.Module): - ... 
- - - class AutoEncoder(nn.Module): - def __init__(self): - super().__init__() - self.encoder = Encoder() - self.decoder = Decoder() - - def forward(self, x): - return self.encoder(x) - - - class AutoEncoderSystem(LightningModule): - def __init__(self): - super().__init__() - self.auto_encoder = AutoEncoder() - - -For fast prototyping, it's often useful to define all the computations in a LightningModule. For reusability -and scalability, it might be better to pass in the relevant backbones. - -Here's a LightningModule that defines a model. Although, we do not recommend to define a model like in the example. - -.. testcode:: - - class LitModel(LightningModule): - def __init__(self): - super().__init__() - self.layer_1 = nn.Linear() - self.layer_2 = nn.Linear() - self.layer_3 = nn.Linear() - - -Self-contained -============== - -A Lightning module should be self-contained. To see how self-contained your model is, a good test is to ask -yourself this question: - -"Can someone drop this file into a Trainer without knowing anything about the internals?" - -For example, we couple the optimizer with a model because the majority of models require a specific optimizer with -a specific learning rate scheduler to work well. - -Init -==== -The first place where LightningModules tend to stop being self-contained is in the init. Try to define all the relevant -sensible defaults in the init so that the user doesn't have to guess. - -Here's an example where a user will have to go hunt through files to figure out how to init this LightningModule. - -.. testcode:: - - class LitModel(LightningModule): - def __init__(self, params): - self.lr = params.lr - self.coef_x = params.coef_x - -Models defined as such leave you with many questions, such as what is ``coef_x``? Is it a string? A float? What is the range? -Instead, be explicit in your init - -.. testcode:: - - class LitModel(LightningModule): - def __init__(self, encoder: nn.Module, coef_x: float = 0.2, lr: float = 1e-3): - ... 
- -Now the user doesn't have to guess. Instead, they know the value type, and the model has a sensible default where the -user can see the value immediately. - - -Method Order -============ -The only required methods in the LightningModule are: - -* init -* training_step -* configure_optimizers - -However, if you decide to implement the rest of the optional methods, the recommended order is: - -* model/system definition (init) -* if doing inference, define forward -* training hooks -* validation hooks -* test hooks -* predict hooks -* configure_optimizers -* any other hooks - -In practice, the code looks like this: - -.. code-block:: - - class LitModel(pl.LightningModule): - - def __init__(...): - - def forward(...): - - def training_step(...): - - def training_step_end(...): - - def training_epoch_end(...): - - def validation_step(...): - - def validation_step_end(...): - - def validation_epoch_end(...): - - def test_step(...): - - def test_step_end(...): - - def test_epoch_end(...): - - def configure_optimizers(...): - - def any_extra_hook(...): - - -Forward vs training_step -======================== - -We recommend using :meth:`~pytorch_lightning.core.lightning.LightningModule.forward` for inference/predictions and keeping -:meth:`~pytorch_lightning.core.lightning.LightningModule.training_step` independent. - -.. code-block:: python - - def forward(self, x): - embeddings = self.encoder(x) - return embeddings - - - def training_step(self, batch, batch_idx): - x, _ = batch - z = self.encoder(x) - pred = self.decoder(z) - ... - - --------------- - -**** -Data -**** - -These are best practices for handling data. - -DataLoaders -=========== - -Lightning uses :class:`~torch.utils.data.DataLoader` to handle all the data flow through the system. Whenever you structure dataloaders, -make sure to tune the number of workers for maximum efficiency. - -.. 
warning:: Make sure not to use ``Trainer(strategy="ddp_spawn")`` with ``num_workers>0`` in the DataLoader or you will bottleneck your code. - -DataModules -=========== - -The :class:`~pytorch_lightning.core.datamodule.LightningDataModule` is designed as a way of decoupling data-related -hooks from the :class:`~pytorch_lightning.core.lightning.LightningModule` so you can develop dataset agnostic models. It makes it easy to hot swap different -datasets with your model, so you can test it and benchmark it across domains. It also makes sharing and reusing the exact data splits and transforms across projects possible. - -Check out :ref:`data` document to understand data management within Lightning and its best practices. - -* What dataset splits were used? -* How many samples does this dataset have overall and within each split? -* Which transforms were used? - -It's for this reason that we recommend you use datamodules. This is especially important when collaborating because -it will save your team a lot of time as well. - -All they need to do is drop a datamodule into the Trainer and not worry about what was done to the data. - -This is true for both academic and corporate settings where data cleaning and ad-hoc instructions slow down the progress -of iterating through ideas. - -- Check out the live examples to get your hands dirty: -- `Introduction to PyTorch Lightning `_ -- `Introduction to DataModules `_ diff --git a/docs/_sources/tuning/profiler.rst.txt b/docs/_sources/tuning/profiler.rst.txt deleted file mode 100644 index 1ff7c24..0000000 --- a/docs/_sources/tuning/profiler.rst.txt +++ /dev/null @@ -1,49 +0,0 @@ -.. _profiler: - -############################# -Find bottlenecks in your code -############################# - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Basic - :description: Learn to find bottlenecks in the training loop. - :col_css: col-md-3 - :button_link: profiler_basic.html - :height: 150 - :tag: basic - -.. displayitem:: - :header: Intermediate - :description: Learn to find bottlenecks in PyTorch operations. - :col_css: col-md-3 - :button_link: profiler_intermediate.html - :height: 150 - :tag: intermediate - -.. displayitem:: - :header: Advanced - :description: Learn to profile TPU code. - :col_css: col-md-3 - :button_link: profiler_advanced.html - :height: 150 - :tag: advanced - -.. displayitem:: - :header: Expert - :description: Learn to build your own profiler or profile custom pieces of code - :col_css: col-md-3 - :button_link: profiler_expert.html - :height: 150 - :tag: expert - -.. raw:: html - -
-
diff --git a/docs/_sources/tuning/profiler_advanced.rst.txt b/docs/_sources/tuning/profiler_advanced.rst.txt deleted file mode 100644 index ad2ab9e..0000000 --- a/docs/_sources/tuning/profiler_advanced.rst.txt +++ /dev/null @@ -1,74 +0,0 @@ -:orphan: - -.. _profiler_advanced: - -######################################## -Find bottlenecks in your code (advanced) -######################################## -**Audience**: Users who want to profile their TPU models to find bottlenecks and improve performance. - ----- - -************************ -Profile cloud TPU models -************************ -To profile TPU models use the :class:`~pytorch_lightning.profiler.xla.XLAProfiler` - -.. code-block:: python - - from pytorch_lightning.profiler import XLAProfiler - - profiler = XLAProfiler(port=9001) - trainer = Trainer(profiler=profiler) - ----- - -************************************* -Capture profiling logs in Tensorboard -************************************* -To capture profile logs in Tensorboard, follow these instructions: - ----- - -0: Setup the required installs -============================== -Use this `guide `_ to help you with the Cloud TPU required installations. - ----- - -1: Start Tensorboard -==================== -Start the `TensorBoard `_ server: - -.. code-block:: bash - - tensorboard --logdir ./tensorboard --port 9001 - -Now open the following url on your browser - -.. code-block:: bash - - http://localhost:9001/#profile - ----- - -2: Capture the profile -====================== -Once the code you want to profile is running: - -1. click on the ``CAPTURE PROFILE`` button. -2. Enter ``localhost:9001`` (default port for XLA Profiler) as the Profile Service URL. -3. Enter the number of milliseconds for the profiling duration -4. Click ``CAPTURE`` - ----- - -3: Don't stop your code -======================= -Make sure the code is running while you are trying to capture the traces. 
It will lead to better performance insights if the profiling duration is longer than the step time. - ----- - -4: View the profiling logs -========================== -Once the capture is finished, the page will refresh and you can browse through the insights using the **Tools** dropdown at the top left diff --git a/docs/_sources/tuning/profiler_basic.rst.txt b/docs/_sources/tuning/profiler_basic.rst.txt deleted file mode 100644 index 899e657..0000000 --- a/docs/_sources/tuning/profiler_basic.rst.txt +++ /dev/null @@ -1,121 +0,0 @@ -:orphan: - -.. _profiler_basic: - -##################################### -Find bottlenecks in your code (basic) -##################################### -**Audience**: Users who want to learn the basics of removing bottlenecks from their code - ----- - -************************ -Why do I need profiling? -************************ -Profiling helps you find bottlenecks in your code by capturing analytics such as how long a function takes or how much memory is used. - ------------- - -****************************** -Find training loop bottlenecks -****************************** -The most basic profile measures all the key methods across **Callbacks**, **DataModules** and the **LightningModule** in the training loop. - -.. code-block:: python - - trainer = Trainer(profiler="simple") - -Once the **.fit()** function has completed, you'll see an output like this: - -.. 
code-block:: - - FIT Profiler Report - - ----------------------------------------------------------------------------------------------- - | Action | Mean duration (s) | Total time (s) | - ----------------------------------------------------------------------------------------------- - | [LightningModule]BoringModel.prepare_data | 10.0001 | 20.00 | - | run_training_epoch | 6.1558 | 6.1558 | - | run_training_batch | 0.0022506 | 0.015754 | - | [LightningModule]BoringModel.optimizer_step | 0.0017477 | 0.012234 | - | [LightningModule]BoringModel.val_dataloader | 0.00024388 | 0.00024388 | - | on_train_batch_start | 0.00014637 | 0.0010246 | - | [LightningModule]BoringModel.teardown | 2.15e-06 | 2.15e-06 | - | [LightningModule]BoringModel.on_train_start | 1.644e-06 | 1.644e-06 | - | [LightningModule]BoringModel.on_train_end | 1.516e-06 | 1.516e-06 | - | [LightningModule]BoringModel.on_fit_end | 1.426e-06 | 1.426e-06 | - | [LightningModule]BoringModel.setup | 1.403e-06 | 1.403e-06 | - | [LightningModule]BoringModel.on_fit_start | 1.226e-06 | 1.226e-06 | - ----------------------------------------------------------------------------------------------- - -In this report we can see that the slowest function is **prepare_data**. Now you can figure out why data preparation is slowing down your training. - -The simple profiler measures all the standard methods used in the training loop automatically, including: - -- on_train_epoch_start -- on_train_epoch_end -- on_train_batch_start -- model_backward -- on_after_backward -- optimizer_step -- on_train_batch_end -- training_step_end -- on_training_end -- etc... - ----- - -************************************** -Profile the time within every function -************************************** -To profile the time within every function, use the :class:`~pytorch_lightning.profiler.advanced.AdvancedProfiler` built on top of Python's `cProfiler `_. - - -.. 
code-block:: python - - trainer = Trainer(profiler="advanced") - -Once the **.fit()** function has completed, you'll see an output like this: - -.. code-block:: - - Profiler Report - - Profile stats for: get_train_batch - 4869394 function calls (4863767 primitive calls) in 18.893 seconds - Ordered by: cumulative time - List reduced from 76 to 10 due to restriction <10> - ncalls tottime percall cumtime percall filename:lineno(function) - 3752/1876 0.011 0.000 18.887 0.010 {built-in method builtins.next} - 1876 0.008 0.000 18.877 0.010 dataloader.py:344(__next__) - 1876 0.074 0.000 18.869 0.010 dataloader.py:383(_next_data) - 1875 0.012 0.000 18.721 0.010 fetch.py:42(fetch) - 1875 0.084 0.000 18.290 0.010 fetch.py:44() - 60000 1.759 0.000 18.206 0.000 mnist.py:80(__getitem__) - 60000 0.267 0.000 13.022 0.000 transforms.py:68(__call__) - 60000 0.182 0.000 7.020 0.000 transforms.py:93(__call__) - 60000 1.651 0.000 6.839 0.000 functional.py:42(to_tensor) - 60000 0.260 0.000 5.734 0.000 transforms.py:167(__call__) - -If the profiler report becomes too long, you can stream the report to a file: - -.. code-block:: python - - from pytorch_lightning.profiler import AdvancedProfiler - - profiler = AdvancedProfiler(dirpath=".", filename="perf_logs") - trainer = Trainer(profiler=profiler) - ----- - -************************* -Measure accelerator usage -************************* -Another helpful technique to detect bottlenecks is to ensure that you're using the full capacity of your accelerator (GPU/TPU/IPU/HPU). -This can be measured with the :class:`~pytorch_lightning.callbacks.device_stats_monitor.DeviceStatsMonitor`: - -.. 
testcode:: - - from pytorch_lightning.callbacks import DeviceStatsMonitor - - trainer = Trainer(callbacks=[DeviceStatsMonitor()]) diff --git a/docs/_sources/tuning/profiler_expert.rst.txt b/docs/_sources/tuning/profiler_expert.rst.txt deleted file mode 100644 index 64ff784..0000000 --- a/docs/_sources/tuning/profiler_expert.rst.txt +++ /dev/null @@ -1,108 +0,0 @@ -:orphan: - -.. _profiler_expert: - -###################################### -Find bottlenecks in your code (expert) -###################################### -**Audience**: Users who want to build their own profilers. - ----- - -*********************** -Build your own profiler -*********************** -To build your own profiler, subclass :class:`~pytorch_lightning.profiler.base.Profiler` -and override some of its methods. Here is a simple example that profiles the first occurrence and total calls of each action: - -.. code-block:: python - - from pytorch_lightning.profiler import Profiler - from collections import defaultdict - import time - - - class ActionCountProfiler(Profiler): - def __init__(self, dirpath=None, filename=None): - super().__init__(dirpath=dirpath, filename=filename) - self._action_count = defaultdict(int) - self._action_first_occurrence = {} - - def start(self, action_name): - if action_name not in self._action_first_occurrence: - self._action_first_occurrence[action_name] = time.strftime("%m/%d/%Y, %H:%M:%S") - - def stop(self, action_name): - self._action_count[action_name] += 1 - - def summary(self): - res = f"\nProfile Summary: \n" - max_len = max(len(x) for x in self._action_count) - - for action_name in self._action_count: - # generate summary for actions called more than once - if self._action_count[action_name] > 1: - res += ( - f"{action_name:<{max_len}s} \t " - + "self._action_first_occurrence[action_name]} \t " - + "{self._action_count[action_name]} \n" - ) - - return res - - def teardown(self, stage): - self._action_count = {} - self._action_first_occurrence = {} - 
super().teardown(stage=stage) - -.. code-block:: python - - trainer = Trainer(profiler=ActionCountProfiler()) - trainer.fit(...) - ----- - -********************************** -Profile custom actions of interest -********************************** -To profile a specific action of interest, reference a profiler in the LightningModule. - -.. code-block:: python - - from pytorch_lightning.profiler import SimpleProfiler, PassThroughProfiler - - - class MyModel(LightningModule): - def __init__(self, profiler=None): - self.profiler = profiler or PassThroughProfiler() - -To profile in any part of your code, use the **self.profiler.profile()** function - -.. code-block:: python - - class MyModel(LightningModule): - def custom_processing_step(self, data): - with self.profiler.profile("my_custom_action"): - ... - return data - -Here's the full code: - -.. code-block:: python - - from pytorch_lightning.profiler import SimpleProfiler, PassThroughProfiler - - - class MyModel(LightningModule): - def __init__(self, profiler=None): - self.profiler = profiler or PassThroughProfiler() - - def custom_processing_step(self, data): - with self.profiler.profile("my_custom_action"): - ... - return data - - - profiler = SimpleProfiler() - model = MyModel(profiler) - trainer = Trainer(profiler=profiler, max_epochs=1) diff --git a/docs/_sources/tuning/profiler_intermediate.rst.txt b/docs/_sources/tuning/profiler_intermediate.rst.txt deleted file mode 100644 index d2b64b5..0000000 --- a/docs/_sources/tuning/profiler_intermediate.rst.txt +++ /dev/null @@ -1,181 +0,0 @@ -:orphan: - -.. 
_profiler_intermediate: - -############################################ -Find bottlenecks in your code (intermediate) -############################################ -**Audience**: Users who want to see more granular profiling information - ----- - -************************** -Profile pytorch operations -************************** -To understand the cost of each PyTorch operation, use the :class:`~pytorch_lightning.profiler.pytorch.PyTorchProfiler` built on top of the `PyTorch profiler `__. - -.. code-block:: python - - from pytorch_lightning.profiler import PyTorchProfiler - - profiler = PyTorchProfiler() - trainer = Trainer(profiler=profiler) - -The profiler will generate an output like this: - -.. code-block:: - - Profiler Report - - Profile stats for: training_step - --------------------- --------------- --------------- --------------- --------------- --------------- - Name Self CPU total % Self CPU total CPU total % CPU total CPU time avg - --------------------- --------------- --------------- --------------- --------------- --------------- - t 62.10% 1.044ms 62.77% 1.055ms 1.055ms - addmm 32.32% 543.135us 32.69% 549.362us 549.362us - mse_loss 1.35% 22.657us 3.58% 60.105us 60.105us - mean 0.22% 3.694us 2.05% 34.523us 34.523us - div_ 0.64% 10.756us 1.90% 32.001us 16.000us - ones_like 0.21% 3.461us 0.81% 13.669us 13.669us - sum_out 0.45% 7.638us 0.74% 12.432us 12.432us - transpose 0.23% 3.786us 0.68% 11.393us 11.393us - as_strided 0.60% 10.060us 0.60% 10.060us 3.353us - to 0.18% 3.059us 0.44% 7.464us 7.464us - empty_like 0.14% 2.387us 0.41% 6.859us 6.859us - empty_strided 0.38% 6.351us 0.38% 6.351us 3.175us - fill_ 0.28% 4.782us 0.33% 5.566us 2.783us - expand 0.20% 3.336us 0.28% 4.743us 4.743us - empty 0.27% 4.456us 0.27% 4.456us 2.228us - copy_ 0.15% 2.526us 0.15% 2.526us 2.526us - broadcast_tensors 0.15% 2.492us 0.15% 2.492us 2.492us - size 0.06% 0.967us 0.06% 0.967us 0.484us - is_complex 0.06% 0.961us 0.06% 0.961us 0.481us - stride 0.03% 0.517us 0.03% 0.517us 
0.517us - --------------------- --------------- --------------- --------------- --------------- --------------- - Self CPU time total: 1.681ms - -.. note:: - When using the PyTorch Profiler, wall clock time will not not be representative of the true wall clock time. - This is due to forcing profiled operations to be measured synchronously, when many CUDA ops happen asynchronously. - It is recommended to use this Profiler to find bottlenecks/breakdowns, however for end to end wall clock time use - the ``SimpleProfiler``. - ----- - -*************************** -Profile a distributed model -*************************** -To profile a distributed model, use the :class:`~pytorch_lightning.profiler.pytorch.PyTorchProfiler` with the *filename* argument which will save a report per rank. - -.. code-block:: python - - from pytorch_lightning.profiler import PyTorchProfiler - - profiler = PyTorchProfiler(filename="perf-logs") - trainer = Trainer(profiler=profiler) - -With two ranks, it will generate a report like so: - -.. 
code-block:: - - Profiler Report: rank 0 - - Profile stats for: training_step - --------------------- --------------- --------------- --------------- --------------- --------------- - Name Self CPU total % Self CPU total CPU total % CPU total CPU time avg - --------------------- --------------- --------------- --------------- --------------- --------------- - t 62.10% 1.044ms 62.77% 1.055ms 1.055ms - addmm 32.32% 543.135us 32.69% 549.362us 549.362us - mse_loss 1.35% 22.657us 3.58% 60.105us 60.105us - mean 0.22% 3.694us 2.05% 34.523us 34.523us - div_ 0.64% 10.756us 1.90% 32.001us 16.000us - ones_like 0.21% 3.461us 0.81% 13.669us 13.669us - sum_out 0.45% 7.638us 0.74% 12.432us 12.432us - transpose 0.23% 3.786us 0.68% 11.393us 11.393us - as_strided 0.60% 10.060us 0.60% 10.060us 3.353us - to 0.18% 3.059us 0.44% 7.464us 7.464us - empty_like 0.14% 2.387us 0.41% 6.859us 6.859us - empty_strided 0.38% 6.351us 0.38% 6.351us 3.175us - fill_ 0.28% 4.782us 0.33% 5.566us 2.783us - expand 0.20% 3.336us 0.28% 4.743us 4.743us - empty 0.27% 4.456us 0.27% 4.456us 2.228us - copy_ 0.15% 2.526us 0.15% 2.526us 2.526us - broadcast_tensors 0.15% 2.492us 0.15% 2.492us 2.492us - size 0.06% 0.967us 0.06% 0.967us 0.484us - is_complex 0.06% 0.961us 0.06% 0.961us 0.481us - stride 0.03% 0.517us 0.03% 0.517us 0.517us - --------------------- --------------- --------------- --------------- --------------- --------------- - Self CPU time total: 1.681ms - -.. 
code-block:: - - Profiler Report: rank 1 - - Profile stats for: training_step - --------------------- --------------- --------------- --------------- --------------- --------------- - Name Self CPU total % Self CPU total CPU total % CPU total CPU time avg - --------------------- --------------- --------------- --------------- --------------- --------------- - t 42.10% 1.044ms 62.77% 1.055ms 1.055ms - addmm 32.32% 543.135us 32.69% 549.362us 549.362us - mse_loss 1.35% 22.657us 3.58% 60.105us 60.105us - mean 0.22% 3.694us 2.05% 34.523us 34.523us - div_ 0.64% 10.756us 1.90% 32.001us 16.000us - ones_like 0.21% 3.461us 0.81% 13.669us 13.669us - sum_out 0.45% 7.638us 0.74% 12.432us 12.432us - transpose 0.23% 3.786us 0.68% 11.393us 11.393us - as_strided 0.60% 10.060us 0.60% 10.060us 3.353us - to 0.18% 3.059us 0.44% 7.464us 7.464us - empty_like 0.14% 2.387us 0.41% 6.859us 6.859us - empty_strided 0.38% 6.351us 0.38% 6.351us 3.175us - fill_ 0.28% 4.782us 0.33% 5.566us 2.783us - expand 0.20% 3.336us 0.28% 4.743us 4.743us - empty 0.27% 4.456us 0.27% 4.456us 2.228us - copy_ 0.15% 2.526us 0.15% 2.526us 2.526us - broadcast_tensors 0.15% 2.492us 0.15% 2.492us 2.492us - size 0.06% 0.967us 0.06% 0.967us 0.484us - is_complex 0.06% 0.961us 0.06% 0.961us 0.481us - stride 0.03% 0.517us 0.03% 0.517us 0.517us - --------------------- --------------- --------------- --------------- --------------- --------------- - Self CPU time total: 1.681ms - -This profiler will record ``training_step``, ``backward``, ``validation_step``, ``test_step``, and ``predict_step`` by default. -The output below shows the profiling for the action ``training_step``. The user can provide ``PyTorchProfiler(record_functions={...})`` -to extend the scope of profiled functions. - -.. note:: - When using the PyTorch Profiler, wall clock time will not not be representative of the true wall clock time. - This is due to forcing profiled operations to be measured synchronously, when many CUDA ops happen asynchronously. 
- It is recommended to use this Profiler to find bottlenecks/breakdowns, however for end to end wall clock time use - the ``SimpleProfiler``. - ----- - -***************************** -Visualize profiled operations -***************************** -To visualize the profiled operations, enable **emit_nvtx** in the :class:`~pytorch_lightning.profiler.pytorch.PyTorchProfiler`. - -.. code-block:: python - - from pytorch_lightning.profiler import PyTorchProfiler - - profiler = PyTorchProfiler(emit_nvtx=True) - trainer = Trainer(profiler=profiler) - -Then run as following: - -.. code-block:: - - nvprof --profile-from-start off -o trace_name.prof -- - -To visualize the profiled operation, you can either use **nvvp**: - -.. code-block:: - - nvvp trace_name.prof - -or python: - -.. code-block:: - - python -c 'import torch; print(torch.autograd.profiler.load_nvprof("trace_name.prof"))' diff --git a/docs/_sources/visualize/experiment_managers.rst.txt b/docs/_sources/visualize/experiment_managers.rst.txt deleted file mode 100644 index 30fada9..0000000 --- a/docs/_sources/visualize/experiment_managers.rst.txt +++ /dev/null @@ -1,25 +0,0 @@ -****************** -Manage Experiments -****************** -To track other artifacts, such as histograms or model topology graphs first select one of the many experiment managers (*loggers*) supported by Lightning - -.. code-block:: python - - from pytorch_lightning import loggers as pl_loggers - - tensorboard = pl_loggers.TensorBoardLogger() - trainer = Trainer(logger=tensorboard) - -then access the logger's API directly - -.. code-block:: python - - def training_step(self): - tensorboard = self.logger.experiment - tensorboard.add_image() - tensorboard.add_histogram(...) - tensorboard.add_figure(...) - ----- - -.. 
include:: supported_exp_managers.rst diff --git a/docs/_sources/visualize/loggers.rst.txt b/docs/_sources/visualize/loggers.rst.txt deleted file mode 100644 index bdf95ec..0000000 --- a/docs/_sources/visualize/loggers.rst.txt +++ /dev/null @@ -1,56 +0,0 @@ -.. _loggers: - -############################### -Track and Visualize Experiments -############################### - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Basic - :description: Learn how to track and visualize metrics, images and text. - :col_css: col-md-4 - :button_link: logging_basic.html - :height: 150 - :tag: basic - -.. displayitem:: - :header: Intermediate - :description: Enable third-party experiment managers with advanced visualizations. - :col_css: col-md-4 - :button_link: logging_intermediate.html - :height: 150 - :tag: intermediate - -.. displayitem:: - :header: Advanced - :description: Optimize model speed with advanced self.log arguments and cloud logging. - :col_css: col-md-4 - :button_link: logging_advanced.html - :height: 150 - :tag: advanced - -.. displayitem:: - :header: Expert - :description: Make your own progress-bar or integrate a new experiment manager. - :col_css: col-md-4 - :button_link: logging_expert.html - :height: 150 - :tag: expert - -.. displayitem:: - :header: LightningModule.log API - :description: Dig into the LightningModule.log API in depth - :col_css: col-md-4 - :button_link: ../common/lightning_module.html#log - :height: 150 - -.. raw:: html - -
-
diff --git a/docs/_sources/visualize/logging_advanced.rst.txt b/docs/_sources/visualize/logging_advanced.rst.txt deleted file mode 100644 index ca11e39..0000000 --- a/docs/_sources/visualize/logging_advanced.rst.txt +++ /dev/null @@ -1,385 +0,0 @@ -:orphan: - -.. _logging_advanced: - -########################################## -Track and Visualize Experiments (advanced) -########################################## -**Audience:** Users who want to do advanced speed optimizations by customizing the logging behavior. - ----- - -**************************** -Change progress bar defaults -**************************** -To change the default values (ie: version number) shown in the progress bar, override the :meth:`~pytorch_lightning.callbacks.progress.base.ProgressBarBase.get_metrics` method in your logger. - -.. code-block:: python - - from pytorch_lightning.callbacks.progress import Tqdm - - - class CustomProgressBar(Tqdm): - def get_metrics(self, *args, **kwargs): - # don't show the version number - items = super().get_metrics() - items.pop("v_num", None) - return items - ----- - -************************************ -Customize tracking to speed up model -************************************ - - -Modify logging frequency -======================== - -Logging a metric on every single batch can slow down training. By default, Lightning logs every 50 rows, or 50 training steps. -To change this behaviour, set the *log_every_n_steps* :class:`~pytorch_lightning.trainer.trainer.Trainer` flag. - -.. testcode:: - - k = 10 - trainer = Trainer(log_every_n_steps=k) - ----- - -Modify flushing frequency -========================= - -Metrics are kept in memory for N steps to improve training efficiency. Every N steps, metrics flush to disk. To change the frequency of this flushing, use the *flush_logs_every_n_steps* Trainer argument. - -.. 
code-block:: python - - # faster training, high memory - Trainer(flush_logs_every_n_steps=500) - - # slower training, low memory - Trainer(flush_logs_every_n_steps=500) - -The higher *flush_logs_every_n_steps* is, the faster the model will train but the memory will build up until the next flush. -The smaller *flush_logs_every_n_steps* is, the slower the model will train but memory will be kept to a minimum. - -TODO: chart - ----- - -****************** -Customize self.log -****************** - -The LightningModule *self.log* method offers many configurations to customize its behavior. - ----- - -add_dataloader_idx -================== -**Default:** True - -If True, appends the index of the current dataloader to the name (when using multiple dataloaders). If False, user needs to give unique names for each dataloader to not mix the values. - -.. code-block:: python - - self.log(add_dataloader_idx=True) - ----- - -batch_size -========== -**Default:** None - -Current batch size used for accumulating logs logged with ``on_epoch=True``. This will be directly inferred from the loaded batch, but for some data structures you might need to explicitly provide it. - -.. code-block:: python - - self.log(batch_size=32) - ----- - -enable_graph -============ -**Default:** True - -If True, will not auto detach the graph. - -.. code-block:: python - - self.log(enable_graph=True) - ----- - -logger -====== -**Default:** True - -Send logs to the logger like ``Tensorboard``, or any other custom logger passed to the :class:`~pytorch_lightning.trainer.trainer.Trainer` (Default: ``True``). - -.. code-block:: python - - self.log(logger=True) - ----- - -on_epoch -======== -**Default:** It varies - -If this is True, that specific *self.log* call accumulates and reduces all metrics to the end of the epoch. - -.. code-block:: python - - self.log(on_epoch=True) - -The default value depends in which function this is called - -.. 
code-block:: python - - def training_step(self, batch, batch_idx): - # Default: False - self.log(on_epoch=False) - - - def validation_step(self, batch, batch_idx): - # Default: True - self.log(on_epoch=True) - - - def test_step(self, batch, batch_idx): - # Default: True - self.log(on_epoch=True) - ----- - -on_step -======= -**Default:** It varies - -If this is True, that specific *self.log* call will NOT accumulate metrics. Instead it will generate a timeseries across steps. - -.. code-block:: python - - self.log(on_step=True) - -The default value depends in which function this is called - -.. code-block:: python - - def training_step(self, batch, batch_idx): - # Default: True - self.log(on_step=True) - - - def validation_step(self, batch, batch_idx): - # Default: False - self.log(on_step=False) - - - def test_step(self, batch, batch_idx): - # Default: False - self.log(on_step=False) - - ----- - -prog_bar -======== -**Default:** False - -If set to True, logs will be sent to the progress bar. - -.. code-block:: python - - self.log(prog_bar=True) - ----- - -rank_zero_only -============== -**Default:** True - -Whether the value will be logged only on rank 0. This will prevent synchronization which would produce a deadlock as not all processes would perform this log call. - -.. code-block:: python - - self.log(rank_zero_only=True) - ----- - -reduce_fx -========= -**Default:** :meth:`torch.mean` - -Reduction function over step values for end of epoch. Uses :meth:`torch.mean` by default. - -.. code-block:: python - - self.log(reduce_fx=torch.mean) - ----- - -sync_dist -========= -**Default:** False - -If True, reduces the metric across devices. Use with care as this may lead to a significant communication overhead. - -.. code-block:: python - - self.log(sync_dist=False) - ----- - -sync_dist_group -=============== -**Default:** None - -The DDP group to sync across. - -.. 
code-block:: python - - import torch.distributed as dist - - group = dist.init_process_group("nccl", rank=self.global_rank, world_size=self.world_size) - self.log(sync_dist_group=group) - ----- - -*************************************** -Enable metrics for distributed training -*************************************** -For certain types of metrics that need complex aggregation, we recommended to build your metric using torchmetric which ensures all the complexities of metric aggregation in distributed environments is handled. - -First, implement your metric: - -.. code-block:: python - - import torch - import torchmetrics - - - class MyAccuracy(Metric): - def __init__(self, dist_sync_on_step=False): - # call `self.add_state`for every internal state that is needed for the metrics computations - # dist_reduce_fx indicates the function that should be used to reduce - # state from multiple processes - super().__init__(dist_sync_on_step=dist_sync_on_step) - - self.add_state("correct", default=torch.tensor(0), dist_reduce_fx="sum") - self.add_state("total", default=torch.tensor(0), dist_reduce_fx="sum") - - def update(self, preds: torch.Tensor, target: torch.Tensor): - # update metric states - preds, target = self._input_format(preds, target) - assert preds.shape == target.shape - - self.correct += torch.sum(preds == target) - self.total += target.numel() - - def compute(self): - # compute final result - return self.correct.float() / self.total - -To use the metric inside Lightning, 1) initialize it in the init, 2) compute the metric, 3) pass it into *self.log* - -.. code-block:: python - - class LitModel(LightningModule): - def __init__(self): - # 1. initialize the metric - self.accuracy = MyAccuracy() - - def training_step(self, batch, batch_idx): - x, y = batch - preds = self(x) - - # 2. compute the metric - self.accuracy(preds, y) - - # 3. 
log it - self.log("train_acc_step", self.accuracy) - ----- - -******************************** -Log to a custom cloud filesystem -******************************** -Lightning is integrated with the major remote file systems including local filesystems and several cloud storage providers such as -`S3 `_ on `AWS `_, `GCS `_ on `Google Cloud `_, -or `ADL `_ on `Azure `_. - -PyTorch Lightning uses `fsspec `_ internally to handle all filesystem operations. - -To save logs to a remote filesystem, prepend a protocol like "s3:/" to the root_dir used for writing and reading model data. - -.. code-block:: python - - from pytorch_lightning.loggers import TensorBoardLogger - - logger = TensorBoardLogger(save_dir="s3://my_bucket/logs/") - - trainer = Trainer(logger=logger) - trainer.fit(model) - ----- - -********************************* -Track both step and epoch metrics -********************************* -To track the timeseries over steps (*on_step*) as well as the accumulated epoch metric (*on_epoch*), set both to True - -.. code-block:: python - - self.log(on_step=True, on_epoch=True) - -Setting both to True will generate two graphs with *_step* for the timeseries over steps and *_epoch* for the epoch metric. - -# TODO: show images of both - ----- - -************************************** -Understand self.log automatic behavior -************************************** -This table shows the default values of *on_step* and *on_epoch* depending on the *LightningModule* or *Callback* method. - ----- - -In LightningModule -================== - -.. 
list-table:: Default behavior of logging in LightningModule
- -With Lightning, you can visualize virtually anything you can think of: numbers, text, images, audio. Your creativity and imagination are the only limiting factor. - ----- - -************* -Track metrics -************* -Metric visualization is the most basic but powerful way of understanding how your model is doing throughout the model development process. - -To track a metric, simply use the *self.log* method available inside the *LightningModule* - -.. code-block:: python - - class LitModel(pl.LightningModule): - def training_step(self, batch, batch_idx): - value = self.global_step - self.log("some_value", self.global_step) - -To log multiple metrics at once, use *self.log_dict* - -.. code-block:: python - - values = {"loss": loss, "acc": acc, "metric_n": metric_n} # add more items if needed - self.log_dict(values) - -TODO: show plot of metric changing over time - ----- - -View in the commandline -======================= - -To view metrics in the commandline progress bar, set the *prog_bar* argument to True. - -.. code-block:: python - - self.log(prog_bar=True) - -TODO: need progress bar here - ----- - -View in the browser -=================== -To view metrics in the browser you need to use an *experiment manager* with these capabilities. By Default, Lightning uses Tensorboard which is free and opensource. - -Tensorboard is already enabled by default - -.. code-block:: python - - # every trainer already has tensorboard enabled by default - trainer = Trainer() - -To launch the tensorboard dashboard run the following command on the commandline. - -.. code-block:: bash - - tensorboard --logdir=lightning_logs/ - -If you're using a notebook environment such as *colab* or *kaggle* or *jupyter*, launch Tensorboard with this command - -.. 
code-block:: bash - - %reload_ext tensorboard - %tensorboard --logdir=lightning_logs/ - ----- - -Accumulate a metric -=================== -When *self.log* is called inside the *training_step*, it generates a timeseries showing how the metric behaves over time. - -TODO: show chart - -However, for the validation and test sets we are not generally interested in plotting the metric values per batch of data. Instead, we want to compute a summary statistic (such as average, min or max) across the full split of data. - -When you call self.log inside the *validation_step* and *test_step*, Lightning automatically accumulates the metric and averages it once it's gone through the whole split (*epoch*). - -.. code-block:: python - - def validation_step(self, batch, batch_idx): - value = batch_idx + 1 - self.log("average_value", value) - -TODO: show single point plotted - -If you don't want to average, add your own function in the *reduce_fx* argument. - -.. code-block:: python - - # default function - self.log(reduce_fx=torch.mean) - ----- - -************ -Track images -************ -If your *experiment manager* supports image visualization, simply *log* the image with *self.log* - -.. code-block:: python - - # (32 batch samples, 3 channels, 28 width, 28 height) - image = torch.Tensor(32, 3, 28, 28) - self.log("an_image", image) - ----- - -********** -Track text -********** -If your *experiment manager* supports text visualization, simply *log* the text with *self.log* - -.. code-block:: python - - text = "hello world" - self.log("some_text", text) - -# TODO: show screenshot - ----- - -****************************** -Configure the saving directory -****************************** -By default, anything that is logged is saved to the current working directory. To use a different directory, set the *default_root_dir* argument in the Trainer. - -.. 
code-block:: python - - Trainer(default_root_dir="/your/custom/path") diff --git a/docs/_sources/visualize/logging_expert.rst.txt b/docs/_sources/visualize/logging_expert.rst.txt deleted file mode 100644 index 3b44ee9..0000000 --- a/docs/_sources/visualize/logging_expert.rst.txt +++ /dev/null @@ -1,135 +0,0 @@ -:orphan: - -.. _logging_expert: - -######################################## -Track and Visualize Experiments (expert) -######################################## -**Audience:** Users who want to make their own progress bars or integrate new experiment managers. - ----- - -*********************** -Change the progress bar -*********************** - -If you'd like to change the way the progress bar displays information, you can use some of our built-in progress bars or build your own. - ----- - -Use the TQDMProgressBar -======================= -To use the TQDMProgressBar pass it into the *callbacks* :class:`~pytorch_lightning.trainer.trainer.Trainer` argument. - -.. code-block:: python - - from pytorch_lightning.callbacks import TQDMProgressBar - - trainer = Trainer(callbacks=[TQDMProgressBar()]) - ----- - -Use the RichProgressBar -======================= -The RichProgressBar can add custom colors and beautiful formatting for your progress bars. First, install the *`rich `_* library - -.. code-block:: bash - - pip install rich - -Then pass the callback into the callbacks :class:`~pytorch_lightning.trainer.trainer.Trainer` argument: - -.. code-block:: python - - from pytorch_lightning.callbacks import RichProgressBar - - trainer = Trainer(callbacks=[RichProgressBar()]) - -The rich progress bar can also have custom themes - -.. code-block:: python - - from pytorch_lightning.callbacks import RichProgressBar - from pytorch_lightning.callbacks.progress.rich_progress import RichProgressBarTheme - - # create your own theme! 
- theme = RichProgressBarTheme(description="green_yellow", progress_bar="green1") - - # init as normal - progress_bar = RichProgressBar(theme=theme) - trainer = Trainer(callbacks=progress_bar) - ----- - -************************ -Customize a progress bar -************************ -To customize either the :class:`~pytorch_lightning.callbacks.TQDMProgressBar` or the :class:`~pytorch_lightning.callbacks.RichProgressBar`, subclass it and override any of its methods. - -.. code-block:: python - - from pytorch_lightning.callbacks import TQDMProgressBar - - - class LitProgressBar(TQDMProgressBar): - def init_validation_tqdm(self): - bar = super().init_validation_tqdm() - bar.set_description("running validation...") - return bar - ----- - -*************************** -Build your own progress bar -*************************** -To build your own progress bar, subclass :class:`~pytorch_lightning.callbacks.ProgressBarBase` - -.. code-block:: python - - from pytorch_lightning.callbacks import ProgressBarBase - - - class LitProgressBar(ProgressBarBase): - def __init__(self): - super().__init__() # don't forget this :) - self.enable = True - - def disable(self): - self.enable = False - - def on_train_batch_end(self, trainer, pl_module, outputs, batch_idx): - super().on_train_batch_end(trainer, pl_module, outputs, batch_idx) # don't forget this :) - percent = (self.train_batch_idx / self.total_train_batches) * 100 - sys.stdout.flush() - sys.stdout.write(f"{percent:.01f} percent complete \r") - - - bar = LitProgressBar() - trainer = Trainer(callbacks=[bar]) - ----- - -******************************* -Integrate an experiment manager -******************************* -To create an integration between a custom logger and Lightning, subclass :class:`~pytorch_lightning.loggers.base.LightningLoggerBase` - -.. 
code-block:: python - - from pytorch_lightning.loggers import Logger - - - class LitLogger(Logger): - @property - def name(self) -> str: - return "my-experiment" - - @property - def version(self): - return "version_0" - - def log_metrics(self, metrics, step=None): - print("my logged metrics", metrics) - - def log_hyperparams(self, params, *args, **kwargs): - print("my logged hyperparameters", params) diff --git a/docs/_sources/visualize/logging_intermediate.rst.txt b/docs/_sources/visualize/logging_intermediate.rst.txt deleted file mode 100644 index 1b0dd6b..0000000 --- a/docs/_sources/visualize/logging_intermediate.rst.txt +++ /dev/null @@ -1,80 +0,0 @@ -.. _logging_intermediate: - -############################################## -Track and Visualize Experiments (intermediate) -############################################## -**Audience:** Users who want to track more complex outputs and use third-party experiment managers. - ----- - -******************************* -Track audio and other artifacts -******************************* -To track other artifacts, such as histograms or model topology graphs first select one of the many loggers supported by Lightning - -.. code-block:: python - - from pytorch_lightning import loggers as pl_loggers - - tensorboard = pl_loggers.TensorBoardLogger() - trainer = Trainer(logger=tensorboard) - -then access the logger's API directly - -.. code-block:: python - - def training_step(self): - tensorboard = self.logger.experiment - tensorboard.add_image() - tensorboard.add_histogram(...) - tensorboard.add_figure(...) - ----- - -.. include:: supported_exp_managers.rst - ----- - -**************************************** -Track multiple metrics in the same chart -**************************************** -If your logger supports plotting multiple metrics on the same chart, pass in a dictionary to *self.log*. - -.. 
code-block:: python - - self.log("performance", {"acc": acc, "recall": recall}) - ----- - -********************* -Track hyperparameters -********************* -To track hyperparameters, first call *save_hyperparameters* from the LightningModule init: - -.. code-block:: python - - class MyLightningModule(LightningModule): - def __init__(self, learning_rate, another_parameter, *args, **kwargs): - super().__init__() - self.save_hyperparameters() - -If your logger supports tracked hyperparameters, the hyperparameters will automatically show up on the logger dashboard. - -TODO: show tracked hyperparameters. - ----- - -******************** -Track model topology -******************** -Multiple loggers support visualizing the model topology. Here's an example that tracks the model topology using Tensorboard. - -.. code-block:: python - - def any_lightning_module_function_or_hook(self): - tensorboard_logger = self.logger.experiment - - prototype_array = torch.Tensor(32, 1, 28, 27) - tensorboard_logger.log_graph(model=self, input_array=prototype_array) - -TODO: show tensorboard topology. diff --git a/docs/_sources/visualize/supported_exp_managers.rst.txt b/docs/_sources/visualize/supported_exp_managers.rst.txt deleted file mode 100644 index 1a15ee2..0000000 --- a/docs/_sources/visualize/supported_exp_managers.rst.txt +++ /dev/null @@ -1,198 +0,0 @@ -Comet.ml -======== -To use `Comet.ml `_ first install the comet package: - -.. code-block:: bash - - pip install comet-ml - -Configure the logger and pass it to the :class:`~pytorch_lightning.trainer.trainer.Trainer`: - -.. code-block:: python - - from pytorch_lightning.loggers import CometLogger - - comet_logger = CometLogger(api_key="YOUR_COMET_API_KEY") - trainer = Trainer(logger=comet_logger) - -Access the comet logger from any function (except the LightningModule *init*) to use its API for tracking advanced artifacts - -.. 
code-block:: python - - class LitModel(LightningModule): - def any_lightning_module_function_or_hook(self): - comet = self.logger.experiment - fake_images = torch.Tensor(32, 3, 28, 28) - comet.add_image("generated_images", fake_images, 0) - -Here's the full documentation for the :class:`~pytorch_lightning.loggers.CometLogger`. - ----- - -MLflow -====== -To use `MLflow `_ first install the MLflow package: - -.. code-block:: bash - - pip install mlflow - -Configure the logger and pass it to the :class:`~pytorch_lightning.trainer.trainer.Trainer`: - -.. code-block:: python - - from pytorch_lightning.loggers import MLFlowLogger - - mlf_logger = MLFlowLogger(experiment_name="lightning_logs", tracking_uri="file:./ml-runs") - trainer = Trainer(logger=mlf_logger) - -Access the mlflow logger from any function (except the LightningModule *init*) to use its API for tracking advanced artifacts - -.. code-block:: python - - class LitModel(LightningModule): - def any_lightning_module_function_or_hook(self): - mlf_logger = self.logger.experiment - fake_images = torch.Tensor(32, 3, 28, 28) - mlf_logger.add_image("generated_images", fake_images, 0) - -Here's the full documentation for the :class:`~pytorch_lightning.loggers.MLFlowLogger`. - ----- - -Neptune.ai -========== -To use `Neptune.ai `_ first install the neptune package: - -.. code-block:: bash - - pip install neptune-client - -or with conda: - -.. code-block:: bash - - conda install -c conda-forge neptune-client - -Configure the logger and pass it to the :class:`~pytorch_lightning.trainer.trainer.Trainer`: - -.. code-block:: python - - from pytorch_lightning.loggers import NeptuneLogger - - neptune_logger = NeptuneLogger( - api_key="ANONYMOUS", # replace with your own - project="common/pytorch-lightning-integration", # format "" - ) - trainer = Trainer(logger=neptune_logger) - -Access the neptune logger from any function (except the LightningModule *init*) to use its API for tracking advanced artifacts - -.. 
code-block:: python - - class LitModel(LightningModule): - def any_lightning_module_function_or_hook(self): - neptune_logger = self.logger.experiment["your/metadata/structure"] - neptune_logger.log(metadata) - -Here's the full documentation for the :class:`~pytorch_lightning.loggers.NeptuneLogger`. - ----- - -Tensorboard -=========== -`TensorBoard `_ already comes installed with Lightning. If you removed it, install the following package: - -.. code-block:: bash - - pip install tensorboard - -Configure the logger and pass it to the :class:`~pytorch_lightning.trainer.trainer.Trainer`: - -.. code-block:: python - - from pytorch_lightning.loggers import TensorBoardLogger - - logger = TensorBoardLogger() - trainer = Trainer(logger=logger) - -Access the tensorboard logger from any function (except the LightningModule *init*) to use its API for tracking advanced artifacts - -.. code-block:: python - - class LitModel(LightningModule): - def any_lightning_module_function_or_hook(self): - tensorboard_logger = self.logger.experiment - fake_images = torch.Tensor(32, 3, 28, 28) - tensorboard_logger.add_image("generated_images", fake_images, 0) - -Here's the full documentation for the :class:`~pytorch_lightning.loggers.TensorBoardLogger`. - ----- - -Weights and Biases -================== -To use `Weights and Biases `_ (wandb) first install the wandb package: - -.. code-block:: bash - - pip install wandb - -Configure the logger and pass it to the :class:`~pytorch_lightning.trainer.trainer.Trainer`: - -.. code-block:: python - - from pytorch_lightning.loggers import WandbLogger - - wandb_logger = WandbLogger(project="MNIST", log_model="all") - trainer = Trainer(logger=wandb_logger) - - # log gradients and model topology - wandb_logger.watch(model) - -Access the wandb logger from any function (except the LightningModule *init*) to use its API for tracking advanced artifacts - -.. 
code-block:: python - - class MyModule(LightningModule): - def any_lightning_module_function_or_hook(self): - wandb_logger = self.logger.experiment - fake_images = torch.Tensor(32, 3, 28, 28) - - # Option 1 - wandb_logger.log({"generated_images": [wandb.Image(fake_images, caption="...")]}) - - # Option 2 for specifically logging images - wandb_logger.log_image(key="generated_images", images=[fake_images]) - -Here's the full documentation for the :class:`~pytorch_lightning.loggers.WandbLogger`. -`Demo in Google Colab `__ with hyperparameter search and model logging. - ----- - -Use multiple exp managers -========================= -To use multiple experiment managers at the same time, pass a list to the *logger* :class:`~pytorch_lightning.trainer.trainer.Trainer` argument. - -.. code-block:: python - - from pytorch_lightning.loggers import TensorBoardLogger, WandbLogger - - logger1 = TensorBoardLogger() - logger2 = WandbLogger() - trainer = Trainer(logger=[logger1, logger2]) - - -Access all loggers from any function (except the LightningModule *init*) to use their APIs for tracking advanced artifacts - -.. code-block:: python - - class MyModule(LightningModule): - def any_lightning_module_function_or_hook(self): - tensorboard_logger = self.logger.experiment[0] - wandb_logger = self.logger.experiment[1] - - fake_images = torch.Tensor(32, 3, 28, 28) - - tensorboard_logger.add_image("generated_images", fake_images, 0) - wandb_logger.add_image("generated_images", fake_images, 0) diff --git a/docs/_static/basic.css b/docs/_static/basic.css deleted file mode 100644 index bf18350..0000000 --- a/docs/_static/basic.css +++ /dev/null @@ -1,906 +0,0 @@ -/* - * basic.css - * ~~~~~~~~~ - * - * Sphinx stylesheet -- basic theme. - * - * :copyright: Copyright 2007-2022 by the Sphinx team, see AUTHORS. - * :license: BSD, see LICENSE for details. 
- * - */ - -/* -- main layout ----------------------------------------------------------- */ - -div.clearer { - clear: both; -} - -div.section::after { - display: block; - content: ''; - clear: left; -} - -/* -- relbar ---------------------------------------------------------------- */ - -div.related { - width: 100%; - font-size: 90%; -} - -div.related h3 { - display: none; -} - -div.related ul { - margin: 0; - padding: 0 0 0 10px; - list-style: none; -} - -div.related li { - display: inline; -} - -div.related li.right { - float: right; - margin-right: 5px; -} - -/* -- sidebar --------------------------------------------------------------- */ - -div.sphinxsidebarwrapper { - padding: 10px 5px 0 10px; -} - -div.sphinxsidebar { - float: left; - width: 230px; - margin-left: -100%; - font-size: 90%; - word-wrap: break-word; - overflow-wrap : break-word; -} - -div.sphinxsidebar ul { - list-style: none; -} - -div.sphinxsidebar ul ul, -div.sphinxsidebar ul.want-points { - margin-left: 20px; - list-style: square; -} - -div.sphinxsidebar ul ul { - margin-top: 0; - margin-bottom: 0; -} - -div.sphinxsidebar form { - margin-top: 10px; -} - -div.sphinxsidebar input { - border: 1px solid #98dbcc; - font-family: sans-serif; - font-size: 1em; -} - -div.sphinxsidebar #searchbox form.search { - overflow: hidden; -} - -div.sphinxsidebar #searchbox input[type="text"] { - float: left; - width: 80%; - padding: 0.25em; - box-sizing: border-box; -} - -div.sphinxsidebar #searchbox input[type="submit"] { - float: left; - width: 20%; - border-left: none; - padding: 0.25em; - box-sizing: border-box; -} - - -img { - border: 0; - max-width: 100%; -} - -/* -- search page ----------------------------------------------------------- */ - -ul.search { - margin: 10px 0 0 20px; - padding: 0; -} - -ul.search li { - padding: 5px 0 5px 20px; - background-image: url(file.png); - background-repeat: no-repeat; - background-position: 0 7px; -} - -ul.search li a { - font-weight: bold; -} - -ul.search li 
p.context { - color: #888; - margin: 2px 0 0 30px; - text-align: left; -} - -ul.keywordmatches li.goodmatch a { - font-weight: bold; -} - -/* -- index page ------------------------------------------------------------ */ - -table.contentstable { - width: 90%; - margin-left: auto; - margin-right: auto; -} - -table.contentstable p.biglink { - line-height: 150%; -} - -a.biglink { - font-size: 1.3em; -} - -span.linkdescr { - font-style: italic; - padding-top: 5px; - font-size: 90%; -} - -/* -- general index --------------------------------------------------------- */ - -table.indextable { - width: 100%; -} - -table.indextable td { - text-align: left; - vertical-align: top; -} - -table.indextable ul { - margin-top: 0; - margin-bottom: 0; - list-style-type: none; -} - -table.indextable > tbody > tr > td > ul { - padding-left: 0em; -} - -table.indextable tr.pcap { - height: 10px; -} - -table.indextable tr.cap { - margin-top: 10px; - background-color: #f2f2f2; -} - -img.toggler { - margin-right: 3px; - margin-top: 3px; - cursor: pointer; -} - -div.modindex-jumpbox { - border-top: 1px solid #ddd; - border-bottom: 1px solid #ddd; - margin: 1em 0 1em 0; - padding: 0.4em; -} - -div.genindex-jumpbox { - border-top: 1px solid #ddd; - border-bottom: 1px solid #ddd; - margin: 1em 0 1em 0; - padding: 0.4em; -} - -/* -- domain module index --------------------------------------------------- */ - -table.modindextable td { - padding: 2px; - border-collapse: collapse; -} - -/* -- general body styles --------------------------------------------------- */ - -div.body { - min-width: 450px; - max-width: 800px; -} - -div.body p, div.body dd, div.body li, div.body blockquote { - -moz-hyphens: auto; - -ms-hyphens: auto; - -webkit-hyphens: auto; - hyphens: auto; -} - -a.headerlink { - visibility: hidden; -} - -a.brackets:before, -span.brackets > a:before{ - content: "["; -} - -a.brackets:after, -span.brackets > a:after { - content: "]"; -} - -h1:hover > a.headerlink, -h2:hover > a.headerlink, 
-h3:hover > a.headerlink, -h4:hover > a.headerlink, -h5:hover > a.headerlink, -h6:hover > a.headerlink, -dt:hover > a.headerlink, -caption:hover > a.headerlink, -p.caption:hover > a.headerlink, -div.code-block-caption:hover > a.headerlink { - visibility: visible; -} - -div.body p.caption { - text-align: inherit; -} - -div.body td { - text-align: left; -} - -.first { - margin-top: 0 !important; -} - -p.rubric { - margin-top: 30px; - font-weight: bold; -} - -img.align-left, figure.align-left, .figure.align-left, object.align-left { - clear: left; - float: left; - margin-right: 1em; -} - -img.align-right, figure.align-right, .figure.align-right, object.align-right { - clear: right; - float: right; - margin-left: 1em; -} - -img.align-center, figure.align-center, .figure.align-center, object.align-center { - display: block; - margin-left: auto; - margin-right: auto; -} - -img.align-default, figure.align-default, .figure.align-default { - display: block; - margin-left: auto; - margin-right: auto; -} - -.align-left { - text-align: left; -} - -.align-center { - text-align: center; -} - -.align-default { - text-align: center; -} - -.align-right { - text-align: right; -} - -/* -- sidebars -------------------------------------------------------------- */ - -div.sidebar, -aside.sidebar { - margin: 0 0 0.5em 1em; - border: 1px solid #ddb; - padding: 7px; - background-color: #ffe; - width: 40%; - float: right; - clear: right; - overflow-x: auto; -} - -p.sidebar-title { - font-weight: bold; -} - -div.admonition, div.topic, blockquote { - clear: left; -} - -/* -- topics ---------------------------------------------------------------- */ - -div.topic { - border: 1px solid #ccc; - padding: 7px; - margin: 10px 0 10px 0; -} - -p.topic-title { - font-size: 1.1em; - font-weight: bold; - margin-top: 10px; -} - -/* -- admonitions ----------------------------------------------------------- */ - -div.admonition { - margin-top: 10px; - margin-bottom: 10px; - padding: 7px; -} - 
-div.admonition dt { - font-weight: bold; -} - -p.admonition-title { - margin: 0px 10px 5px 0px; - font-weight: bold; -} - -div.body p.centered { - text-align: center; - margin-top: 25px; -} - -/* -- content of sidebars/topics/admonitions -------------------------------- */ - -div.sidebar > :last-child, -aside.sidebar > :last-child, -div.topic > :last-child, -div.admonition > :last-child { - margin-bottom: 0; -} - -div.sidebar::after, -aside.sidebar::after, -div.topic::after, -div.admonition::after, -blockquote::after { - display: block; - content: ''; - clear: both; -} - -/* -- tables ---------------------------------------------------------------- */ - -table.docutils { - margin-top: 10px; - margin-bottom: 10px; - border: 0; - border-collapse: collapse; -} - -table.align-center { - margin-left: auto; - margin-right: auto; -} - -table.align-default { - margin-left: auto; - margin-right: auto; -} - -table caption span.caption-number { - font-style: italic; -} - -table caption span.caption-text { -} - -table.docutils td, table.docutils th { - padding: 1px 8px 1px 5px; - border-top: 0; - border-left: 0; - border-right: 0; - border-bottom: 1px solid #aaa; -} - -table.footnote td, table.footnote th { - border: 0 !important; -} - -th { - text-align: left; - padding-right: 5px; -} - -table.citation { - border-left: solid 1px gray; - margin-left: 1px; -} - -table.citation td { - border-bottom: none; -} - -th > :first-child, -td > :first-child { - margin-top: 0px; -} - -th > :last-child, -td > :last-child { - margin-bottom: 0px; -} - -/* -- figures --------------------------------------------------------------- */ - -div.figure, figure { - margin: 0.5em; - padding: 0.5em; -} - -div.figure p.caption, figcaption { - padding: 0.3em; -} - -div.figure p.caption span.caption-number, -figcaption span.caption-number { - font-style: italic; -} - -div.figure p.caption span.caption-text, -figcaption span.caption-text { -} - -/* -- field list styles 
----------------------------------------------------- */ - -table.field-list td, table.field-list th { - border: 0 !important; -} - -.field-list ul { - margin: 0; - padding-left: 1em; -} - -.field-list p { - margin: 0; -} - -.field-name { - -moz-hyphens: manual; - -ms-hyphens: manual; - -webkit-hyphens: manual; - hyphens: manual; -} - -/* -- hlist styles ---------------------------------------------------------- */ - -table.hlist { - margin: 1em 0; -} - -table.hlist td { - vertical-align: top; -} - -/* -- object description styles --------------------------------------------- */ - -.sig { - font-family: 'Consolas', 'Menlo', 'DejaVu Sans Mono', 'Bitstream Vera Sans Mono', monospace; -} - -.sig-name, code.descname { - background-color: transparent; - font-weight: bold; -} - -.sig-name { - font-size: 1.1em; -} - -code.descname { - font-size: 1.2em; -} - -.sig-prename, code.descclassname { - background-color: transparent; -} - -.optional { - font-size: 1.3em; -} - -.sig-paren { - font-size: larger; -} - -.sig-param.n { - font-style: italic; -} - -/* C++ specific styling */ - -.sig-inline.c-texpr, -.sig-inline.cpp-texpr { - font-family: unset; -} - -.sig.c .k, .sig.c .kt, -.sig.cpp .k, .sig.cpp .kt { - color: #0033B3; -} - -.sig.c .m, -.sig.cpp .m { - color: #1750EB; -} - -.sig.c .s, .sig.c .sc, -.sig.cpp .s, .sig.cpp .sc { - color: #067D17; -} - - -/* -- other body styles ----------------------------------------------------- */ - -ol.arabic { - list-style: decimal; -} - -ol.loweralpha { - list-style: lower-alpha; -} - -ol.upperalpha { - list-style: upper-alpha; -} - -ol.lowerroman { - list-style: lower-roman; -} - -ol.upperroman { - list-style: upper-roman; -} - -:not(li) > ol > li:first-child > :first-child, -:not(li) > ul > li:first-child > :first-child { - margin-top: 0px; -} - -:not(li) > ol > li:last-child > :last-child, -:not(li) > ul > li:last-child > :last-child { - margin-bottom: 0px; -} - -ol.simple ol p, -ol.simple ul p, -ul.simple ol p, -ul.simple ul p { - 
margin-top: 0; -} - -ol.simple > li:not(:first-child) > p, -ul.simple > li:not(:first-child) > p { - margin-top: 0; -} - -ol.simple p, -ul.simple p { - margin-bottom: 0; -} - -dl.footnote > dt, -dl.citation > dt { - float: left; - margin-right: 0.5em; -} - -dl.footnote > dd, -dl.citation > dd { - margin-bottom: 0em; -} - -dl.footnote > dd:after, -dl.citation > dd:after { - content: ""; - clear: both; -} - -dl.field-list { - display: grid; - grid-template-columns: fit-content(30%) auto; -} - -dl.field-list > dt { - font-weight: bold; - word-break: break-word; - padding-left: 0.5em; - padding-right: 5px; -} - -dl.field-list > dt:after { - content: ":"; -} - -dl.field-list > dd { - padding-left: 0.5em; - margin-top: 0em; - margin-left: 0em; - margin-bottom: 0em; -} - -dl { - margin-bottom: 15px; -} - -dd > :first-child { - margin-top: 0px; -} - -dd ul, dd table { - margin-bottom: 10px; -} - -dd { - margin-top: 3px; - margin-bottom: 10px; - margin-left: 30px; -} - -dl > dd:last-child, -dl > dd:last-child > :last-child { - margin-bottom: 0; -} - -dt:target, span.highlighted { - background-color: #fbe54e; -} - -rect.highlighted { - fill: #fbe54e; -} - -dl.glossary dt { - font-weight: bold; - font-size: 1.1em; -} - -.versionmodified { - font-style: italic; -} - -.system-message { - background-color: #fda; - padding: 5px; - border: 3px solid red; -} - -.footnote:target { - background-color: #ffa; -} - -.line-block { - display: block; - margin-top: 1em; - margin-bottom: 1em; -} - -.line-block .line-block { - margin-top: 0; - margin-bottom: 0; - margin-left: 1.5em; -} - -.guilabel, .menuselection { - font-family: sans-serif; -} - -.accelerator { - text-decoration: underline; -} - -.classifier { - font-style: oblique; -} - -.classifier:before { - font-style: normal; - margin: 0 0.5em; - content: ":"; - display: inline-block; -} - -abbr, acronym { - border-bottom: dotted 1px; - cursor: help; -} - -/* -- code displays --------------------------------------------------------- */ 
- -pre { - overflow: auto; - overflow-y: hidden; /* fixes display issues on Chrome browsers */ -} - -pre, div[class*="highlight-"] { - clear: both; -} - -span.pre { - -moz-hyphens: none; - -ms-hyphens: none; - -webkit-hyphens: none; - hyphens: none; - white-space: nowrap; -} - -div[class*="highlight-"] { - margin: 1em 0; -} - -td.linenos pre { - border: 0; - background-color: transparent; - color: #aaa; -} - -table.highlighttable { - display: block; -} - -table.highlighttable tbody { - display: block; -} - -table.highlighttable tr { - display: flex; -} - -table.highlighttable td { - margin: 0; - padding: 0; -} - -table.highlighttable td.linenos { - padding-right: 0.5em; -} - -table.highlighttable td.code { - flex: 1; - overflow: hidden; -} - -.highlight .hll { - display: block; -} - -div.highlight pre, -table.highlighttable pre { - margin: 0; -} - -div.code-block-caption + div { - margin-top: 0; -} - -div.code-block-caption { - margin-top: 1em; - padding: 2px 5px; - font-size: small; -} - -div.code-block-caption code { - background-color: transparent; -} - -table.highlighttable td.linenos, -span.linenos, -div.highlight span.gp { /* gp: Generic.Prompt */ - user-select: none; - -webkit-user-select: text; /* Safari fallback only */ - -webkit-user-select: none; /* Chrome/Safari */ - -moz-user-select: none; /* Firefox */ - -ms-user-select: none; /* IE10+ */ -} - -div.code-block-caption span.caption-number { - padding: 0.1em 0.3em; - font-style: italic; -} - -div.code-block-caption span.caption-text { -} - -div.literal-block-wrapper { - margin: 1em 0; -} - -code.xref, a code { - background-color: transparent; - font-weight: bold; -} - -h1 code, h2 code, h3 code, h4 code, h5 code, h6 code { - background-color: transparent; -} - -.viewcode-link { - float: right; -} - -.viewcode-back { - float: right; - font-family: sans-serif; -} - -div.viewcode-block:target { - margin: -1px -10px; - padding: 0 10px; -} - -/* -- math display 
---------------------------------------------------------- */ - -img.math { - vertical-align: middle; -} - -div.body div.math p { - text-align: center; -} - -span.eqno { - float: right; -} - -span.eqno a.headerlink { - position: absolute; - z-index: 1; -} - -div.math:hover a.headerlink { - visibility: visible; -} - -/* -- printout stylesheet --------------------------------------------------- */ - -@media print { - div.document, - div.documentwrapper, - div.bodywrapper { - margin: 0 !important; - width: 100%; - } - - div.sphinxsidebar, - div.related, - div.footer, - #top-link { - display: none; - } -} \ No newline at end of file diff --git a/docs/_static/check-solid.svg b/docs/_static/check-solid.svg deleted file mode 100644 index 92fad4b..0000000 --- a/docs/_static/check-solid.svg +++ /dev/null @@ -1,4 +0,0 @@ - - - - diff --git a/docs/_static/classtemplate.rst b/docs/_static/classtemplate.rst deleted file mode 100644 index 398a0ec..0000000 --- a/docs/_static/classtemplate.rst +++ /dev/null @@ -1,14 +0,0 @@ -.. role:: hidden - :class: hidden-section -.. currentmodule:: {{ module }} - - -{{ name | underline }} - -.. autoclass:: {{ name }} - :members: - - -.. - autogenerated from source/_templates/classtemplate.rst - note it does not have :inherited-members: diff --git a/docs/_static/clipboard.min.js b/docs/_static/clipboard.min.js deleted file mode 100644 index 54b3c46..0000000 --- a/docs/_static/clipboard.min.js +++ /dev/null @@ -1,7 +0,0 @@ -/*! 
- * clipboard.js v2.0.8 - * https://clipboardjs.com/ - * - * Licensed MIT © Zeno Rocha - */ -!function(t,e){"object"==typeof exports&&"object"==typeof module?module.exports=e():"function"==typeof define&&define.amd?define([],e):"object"==typeof exports?exports.ClipboardJS=e():t.ClipboardJS=e()}(this,function(){return n={686:function(t,e,n){"use strict";n.d(e,{default:function(){return o}});var e=n(279),i=n.n(e),e=n(370),u=n.n(e),e=n(817),c=n.n(e);function a(t){try{return document.execCommand(t)}catch(t){return}}var f=function(t){t=c()(t);return a("cut"),t};var l=function(t){var e,n,o,r=1 - - - - diff --git a/docs/_static/copybutton.css b/docs/_static/copybutton.css deleted file mode 100644 index 40eafe5..0000000 --- a/docs/_static/copybutton.css +++ /dev/null @@ -1,93 +0,0 @@ -/* Copy buttons */ -button.copybtn { - position: absolute; - display: flex; - top: .3em; - right: .3em; - width: 1.7em; - height: 1.7em; - opacity: 0; - transition: opacity 0.3s, border .3s, background-color .3s; - user-select: none; - padding: 0; - border: none; - outline: none; - border-radius: 0.4em; - /* The colors that GitHub uses */ - border: #1b1f2426 1px solid; - background-color: #f6f8fa; - color: #57606a; -} - -button.copybtn.success { - border-color: #22863a; - color: #22863a; -} - -button.copybtn svg { - stroke: currentColor; - width: 1.5em; - height: 1.5em; - padding: 0.1em; -} - -div.highlight { - position: relative; -} - -.highlight:hover button.copybtn { - opacity: 1; -} - -.highlight button.copybtn:hover { - background-color: rgb(235, 235, 235); -} - -.highlight button.copybtn:active { - background-color: rgb(187, 187, 187); -} - -/** - * A minimal CSS-only tooltip copied from: - * https://codepen.io/mildrenben/pen/rVBrpK - * - * To use, write HTML like the following: - * - *

Short

- */ - .o-tooltip--left { - position: relative; - } - - .o-tooltip--left:after { - opacity: 0; - visibility: hidden; - position: absolute; - content: attr(data-tooltip); - padding: .2em; - font-size: .8em; - left: -.2em; - background: grey; - color: white; - white-space: nowrap; - z-index: 2; - border-radius: 2px; - transform: translateX(-102%) translateY(0); - transition: opacity 0.2s cubic-bezier(0.64, 0.09, 0.08, 1), transform 0.2s cubic-bezier(0.64, 0.09, 0.08, 1); -} - -.o-tooltip--left:hover:after { - display: block; - opacity: 1; - visibility: visible; - transform: translateX(-100%) translateY(0); - transition: opacity 0.2s cubic-bezier(0.64, 0.09, 0.08, 1), transform 0.2s cubic-bezier(0.64, 0.09, 0.08, 1); - transition-delay: .5s; -} - -/* By default the copy button shouldn't show up when printing a page */ -@media print { - button.copybtn { - display: none; - } -} diff --git a/docs/_static/copybutton.js b/docs/_static/copybutton.js deleted file mode 100644 index 40ac331..0000000 --- a/docs/_static/copybutton.js +++ /dev/null @@ -1,220 +0,0 @@ -// Localization support -const messages = { - 'en': { - 'copy': 'Copy', - 'copy_to_clipboard': 'Copy to clipboard', - 'copy_success': 'Copied!', - 'copy_failure': 'Failed to copy', - }, - 'es' : { - 'copy': 'Copiar', - 'copy_to_clipboard': 'Copiar al portapapeles', - 'copy_success': '¡Copiado!', - 'copy_failure': 'Error al copiar', - }, - 'de' : { - 'copy': 'Kopieren', - 'copy_to_clipboard': 'In die Zwischenablage kopieren', - 'copy_success': 'Kopiert!', - 'copy_failure': 'Fehler beim Kopieren', - }, - 'fr' : { - 'copy': 'Copier', - 'copy_to_clipboard': 'Copié dans le presse-papier', - 'copy_success': 'Copié !', - 'copy_failure': 'Échec de la copie', - }, - 'ru': { - 'copy': 'Скопировать', - 'copy_to_clipboard': 'Скопировать в буфер', - 'copy_success': 'Скопировано!', - 'copy_failure': 'Не удалось скопировать', - }, - 'zh-CN': { - 'copy': '复制', - 'copy_to_clipboard': '复制到剪贴板', - 'copy_success': '复制成功!', - 
'copy_failure': '复制失败', - }, - 'it' : { - 'copy': 'Copiare', - 'copy_to_clipboard': 'Copiato negli appunti', - 'copy_success': 'Copiato!', - 'copy_failure': 'Errore durante la copia', - } -} - -let locale = 'en' -if( document.documentElement.lang !== undefined - && messages[document.documentElement.lang] !== undefined ) { - locale = document.documentElement.lang -} - -let doc_url_root = DOCUMENTATION_OPTIONS.URL_ROOT; -if (doc_url_root == '#') { - doc_url_root = ''; -} - -/** - * SVG files for our copy buttons - */ -let iconCheck = ` - ${messages[locale]['copy_success']} - - -` - -// If the user specified their own SVG use that, otherwise use the default -let iconCopy = ``; -if (!iconCopy) { - iconCopy = ` - ${messages[locale]['copy_to_clipboard']} - - - -` -} - -/** - * Set up copy/paste for code blocks - */ - -const runWhenDOMLoaded = cb => { - if (document.readyState != 'loading') { - cb() - } else if (document.addEventListener) { - document.addEventListener('DOMContentLoaded', cb) - } else { - document.attachEvent('onreadystatechange', function() { - if (document.readyState == 'complete') cb() - }) - } -} - -const codeCellId = index => `codecell${index}` - -// Clears selected text since ClipboardJS will select the text when copying -const clearSelection = () => { - if (window.getSelection) { - window.getSelection().removeAllRanges() - } else if (document.selection) { - document.selection.empty() - } -} - -// Changes tooltip text for two seconds, then changes it back -const temporarilyChangeTooltip = (el, oldText, newText) => { - el.setAttribute('data-tooltip', newText) - el.classList.add('success') - setTimeout(() => el.setAttribute('data-tooltip', oldText), 2000) - setTimeout(() => el.classList.remove('success'), 2000) -} - -// Changes the copy button icon for two seconds, then changes it back -const temporarilyChangeIcon = (el) => { - el.innerHTML = iconCheck; - setTimeout(() => {el.innerHTML = iconCopy}, 2000) -} - -const addCopyButtonToCodeCells = () => { - 
// If ClipboardJS hasn't loaded, wait a bit and try again. This - // happens because we load ClipboardJS asynchronously. - if (window.ClipboardJS === undefined) { - setTimeout(addCopyButtonToCodeCells, 250) - return - } - - // Add copybuttons to all of our code cells - const codeCells = document.querySelectorAll('div.highlight pre') - codeCells.forEach((codeCell, index) => { - const id = codeCellId(index) - codeCell.setAttribute('id', id) - - const clipboardButton = id => - `` - codeCell.insertAdjacentHTML('afterend', clipboardButton(id)) - }) - -function escapeRegExp(string) { - return string.replace(/[.*+?^${}()|[\]\\]/g, '\\$&'); // $& means the whole matched string -} - -// Callback when a copy button is clicked. Will be passed the node that was clicked -// should then grab the text and replace pieces of text that shouldn't be used in output -function formatCopyText(textContent, copybuttonPromptText, isRegexp = false, onlyCopyPromptLines = true, removePrompts = true, copyEmptyLines = true, lineContinuationChar = "", hereDocDelim = "") { - - var regexp; - var match; - - // Do we check for line continuation characters and "HERE-documents"? 
- var useLineCont = !!lineContinuationChar - var useHereDoc = !!hereDocDelim - - // create regexp to capture prompt and remaining line - if (isRegexp) { - regexp = new RegExp('^(' + copybuttonPromptText + ')(.*)') - } else { - regexp = new RegExp('^(' + escapeRegExp(copybuttonPromptText) + ')(.*)') - } - - const outputLines = []; - var promptFound = false; - var gotLineCont = false; - var gotHereDoc = false; - const lineGotPrompt = []; - for (const line of textContent.split('\n')) { - match = line.match(regexp) - if (match || gotLineCont || gotHereDoc) { - promptFound = regexp.test(line) - lineGotPrompt.push(promptFound) - if (removePrompts && promptFound) { - outputLines.push(match[2]) - } else { - outputLines.push(line) - } - gotLineCont = line.endsWith(lineContinuationChar) & useLineCont - if (line.includes(hereDocDelim) & useHereDoc) - gotHereDoc = !gotHereDoc - } else if (!onlyCopyPromptLines) { - outputLines.push(line) - } else if (copyEmptyLines && line.trim() === '') { - outputLines.push(line) - } - } - - // If no lines with the prompt were found then just use original lines - if (lineGotPrompt.some(v => v === true)) { - textContent = outputLines.join('\n'); - } - - // Remove a trailing newline to avoid auto-running when pasting - if (textContent.endsWith("\n")) { - textContent = textContent.slice(0, -1) - } - return textContent -} - - -var copyTargetText = (trigger) => { - var target = document.querySelector(trigger.attributes['data-clipboard-target'].value); - return formatCopyText(target.innerText, '', false, true, true, true, '', '') -} - - // Initialize with a callback so we can modify the text before copy - const clipboard = new ClipboardJS('.copybtn', {text: copyTargetText}) - - // Update UI with error/success messages - clipboard.on('success', event => { - clearSelection() - temporarilyChangeTooltip(event.trigger, messages[locale]['copy'], messages[locale]['copy_success']) - temporarilyChangeIcon(event.trigger) - }) - - clipboard.on('error', event 
=> { - temporarilyChangeTooltip(event.trigger, messages[locale]['copy'], messages[locale]['copy_failure']) - }) -} - -runWhenDOMLoaded(addCopyButtonToCodeCells) \ No newline at end of file diff --git a/docs/_static/copybutton_funcs.js b/docs/_static/copybutton_funcs.js deleted file mode 100644 index b9168c5..0000000 --- a/docs/_static/copybutton_funcs.js +++ /dev/null @@ -1,58 +0,0 @@ -function escapeRegExp(string) { - return string.replace(/[.*+?^${}()|[\]\\]/g, '\\$&'); // $& means the whole matched string -} - -// Callback when a copy button is clicked. Will be passed the node that was clicked -// should then grab the text and replace pieces of text that shouldn't be used in output -export function formatCopyText(textContent, copybuttonPromptText, isRegexp = false, onlyCopyPromptLines = true, removePrompts = true, copyEmptyLines = true, lineContinuationChar = "", hereDocDelim = "") { - - var regexp; - var match; - - // Do we check for line continuation characters and "HERE-documents"? 
- var useLineCont = !!lineContinuationChar - var useHereDoc = !!hereDocDelim - - // create regexp to capture prompt and remaining line - if (isRegexp) { - regexp = new RegExp('^(' + copybuttonPromptText + ')(.*)') - } else { - regexp = new RegExp('^(' + escapeRegExp(copybuttonPromptText) + ')(.*)') - } - - const outputLines = []; - var promptFound = false; - var gotLineCont = false; - var gotHereDoc = false; - const lineGotPrompt = []; - for (const line of textContent.split('\n')) { - match = line.match(regexp) - if (match || gotLineCont || gotHereDoc) { - promptFound = regexp.test(line) - lineGotPrompt.push(promptFound) - if (removePrompts && promptFound) { - outputLines.push(match[2]) - } else { - outputLines.push(line) - } - gotLineCont = line.endsWith(lineContinuationChar) & useLineCont - if (line.includes(hereDocDelim) & useHereDoc) - gotHereDoc = !gotHereDoc - } else if (!onlyCopyPromptLines) { - outputLines.push(line) - } else if (copyEmptyLines && line.trim() === '') { - outputLines.push(line) - } - } - - // If no lines with the prompt were found then just use original lines - if (lineGotPrompt.some(v => v === true)) { - textContent = outputLines.join('\n'); - } - - // Remove a trailing newline to avoid auto-running when pasting - if (textContent.endsWith("\n")) { - textContent = textContent.slice(0, -1) - } - return textContent -} diff --git a/docs/_static/css/theme.css b/docs/_static/css/theme.css deleted file mode 100644 index 9597990..0000000 --- a/docs/_static/css/theme.css +++ /dev/null @@ -1,14638 +0,0 @@ -@charset "UTF-8"; -/*! - * Bootstrap v4.6.1 (https://getbootstrap.com/) - * Copyright 2011-2021 The Bootstrap Authors - * Copyright 2011-2021 Twitter, Inc. 
- * Licensed under MIT (https://github.com/twbs/bootstrap/blob/main/LICENSE) - */ -:root { - --blue: #007bff; - --indigo: #6610f2; - --purple: #6f42c1; - --pink: #e83e8c; - --red: #dc3545; - --orange: #fd7e14; - --yellow: #ffc107; - --green: #28a745; - --teal: #20c997; - --cyan: #17a2b8; - --white: #fff; - --gray: #6c757d; - --gray-dark: #343a40; - --primary: #007bff; - --secondary: #6c757d; - --success: #28a745; - --info: #17a2b8; - --warning: #ffc107; - --danger: #dc3545; - --light: #f8f9fa; - --dark: #343a40; - --breakpoint-xs: 0; - --breakpoint-sm: 576px; - --breakpoint-md: 768px; - --breakpoint-lg: 992px; - --breakpoint-xl: 1200px; - --font-family-sans-serif: -apple-system, BlinkMacSystemFont, "Segoe UI", Roboto, "Helvetica Neue", Arial, "Noto Sans", "Liberation Sans", sans-serif, "Apple Color Emoji", "Segoe UI Emoji", "Segoe UI Symbol", "Noto Color Emoji"; - --font-family-monospace: SFMono-Regular, Menlo, Monaco, Consolas, "Liberation Mono", "Courier New", monospace; -} - -*, -*::before, -*::after { - -webkit-box-sizing: border-box; - box-sizing: border-box; -} - -html { - font-family: sans-serif; - line-height: 1.15; - -webkit-text-size-adjust: 100%; - -webkit-tap-highlight-color: rgba(0, 0, 0, 0); -} - -article, aside, figcaption, figure, footer, header, hgroup, main, nav, section { - display: block; -} - -body { - margin: 0; - font-family: -apple-system, BlinkMacSystemFont, "Segoe UI", Roboto, "Helvetica Neue", Arial, "Noto Sans", "Liberation Sans", sans-serif, "Apple Color Emoji", "Segoe UI Emoji", "Segoe UI Symbol", "Noto Color Emoji"; - font-size: 1rem; - font-weight: 400; - line-height: 1.5; - color: #212529; - text-align: left; - background-color: #fff; -} - -[tabindex="-1"]:focus:not(:focus-visible) { - outline: 0 !important; -} - -hr { - -webkit-box-sizing: content-box; - box-sizing: content-box; - height: 0; - overflow: visible; -} - -h1, h2, h3, h4, h5, h6 { - margin-top: 0; - margin-bottom: 0.5rem; -} - -p { - margin-top: 0; - margin-bottom: 
1rem; -} - -abbr[title], -abbr[data-original-title] { - text-decoration: underline; - -webkit-text-decoration: underline dotted; - text-decoration: underline dotted; - cursor: help; - border-bottom: 0; - -webkit-text-decoration-skip-ink: none; - text-decoration-skip-ink: none; -} - -address { - margin-bottom: 1rem; - font-style: normal; - line-height: inherit; -} - -ol, -ul, -dl { - margin-top: 0; - margin-bottom: 1rem; -} - -ol ol, -ul ul, -ol ul, -ul ol { - margin-bottom: 0; -} - -dt { - font-weight: 700; -} - -dd { - margin-bottom: .5rem; - margin-left: 0; -} - -blockquote { - margin: 0 0 1rem; -} - -b, -strong { - font-weight: bolder; -} - -small { - font-size: 80%; -} - -sub, -sup { - position: relative; - font-size: 75%; - line-height: 0; - vertical-align: baseline; -} - -sub { - bottom: -.25em; -} - -sup { - top: -.5em; -} - -a { - color: #007bff; - text-decoration: none; - background-color: transparent; -} -a:hover { - color: #0056b3; - text-decoration: underline; -} - -a:not([href]):not([class]) { - color: inherit; - text-decoration: none; -} -a:not([href]):not([class]):hover { - color: inherit; - text-decoration: none; -} - -pre, -code, -kbd, -samp { - font-family: SFMono-Regular, Menlo, Monaco, Consolas, "Liberation Mono", "Courier New", monospace; - font-size: 1em; -} - -pre { - margin-top: 0; - margin-bottom: 1rem; - overflow: auto; - -ms-overflow-style: scrollbar; -} - -figure { - margin: 0 0 1rem; -} - -img { - vertical-align: middle; - border-style: none; -} - -svg { - overflow: hidden; - vertical-align: middle; -} - -table { - border-collapse: collapse; -} - -caption { - padding-top: 0.75rem; - padding-bottom: 0.75rem; - color: #6c757d; - text-align: left; - caption-side: bottom; -} - -th { - text-align: inherit; - text-align: -webkit-match-parent; -} - -label { - display: inline-block; - margin-bottom: 0.5rem; -} - -button { - border-radius: 0; -} - -button:focus:not(:focus-visible) { - outline: 0; -} - -input, -button, -select, -optgroup, 
-textarea { - margin: 0; - font-family: inherit; - font-size: inherit; - line-height: inherit; -} - -button, -input { - overflow: visible; -} - -button, -select { - text-transform: none; -} - -[role="button"] { - cursor: pointer; -} - -select { - word-wrap: normal; -} - -button, -[type="button"], -[type="reset"], -[type="submit"] { - -webkit-appearance: button; -} - -button:not(:disabled), -[type="button"]:not(:disabled), -[type="reset"]:not(:disabled), -[type="submit"]:not(:disabled) { - cursor: pointer; -} - -button::-moz-focus-inner, -[type="button"]::-moz-focus-inner, -[type="reset"]::-moz-focus-inner, -[type="submit"]::-moz-focus-inner { - padding: 0; - border-style: none; -} - -input[type="radio"], -input[type="checkbox"] { - -webkit-box-sizing: border-box; - box-sizing: border-box; - padding: 0; -} - -textarea { - overflow: auto; - resize: vertical; -} - -fieldset { - min-width: 0; - padding: 0; - margin: 0; - border: 0; -} - -legend { - display: block; - width: 100%; - max-width: 100%; - padding: 0; - margin-bottom: .5rem; - font-size: 1.5rem; - line-height: inherit; - color: inherit; - white-space: normal; -} - -progress { - vertical-align: baseline; -} - -[type="number"]::-webkit-inner-spin-button, -[type="number"]::-webkit-outer-spin-button { - height: auto; -} - -[type="search"] { - outline-offset: -2px; - -webkit-appearance: none; -} - -[type="search"]::-webkit-search-decoration { - -webkit-appearance: none; -} - -::-webkit-file-upload-button { - font: inherit; - -webkit-appearance: button; -} - -output { - display: inline-block; -} - -summary { - display: list-item; - cursor: pointer; -} - -template { - display: none; -} - -[hidden] { - display: none !important; -} - -h1, h2, h3, h4, h5, h6, -.h1, .h2, .h3, .h4, .h5, .h6 { - margin-bottom: 0.5rem; - font-weight: 500; - line-height: 1.2; -} - -h1, .h1 { - font-size: 2.5rem; -} - -h2, .h2 { - font-size: 2rem; -} - -h3, .h3 { - font-size: 1.75rem; -} - -h4, .h4 { - font-size: 1.5rem; -} - -h5, .h5 { - 
font-size: 1.25rem; -} - -h6, .h6 { - font-size: 1rem; -} - -.lead { - font-size: 1.25rem; - font-weight: 300; -} - -.display-1 { - font-size: 6rem; - font-weight: 300; - line-height: 1.2; -} - -.display-2 { - font-size: 5.5rem; - font-weight: 300; - line-height: 1.2; -} - -.display-3 { - font-size: 4.5rem; - font-weight: 300; - line-height: 1.2; -} - -.display-4 { - font-size: 3.5rem; - font-weight: 300; - line-height: 1.2; -} - -hr { - margin-top: 1rem; - margin-bottom: 1rem; - border: 0; - border-top: 1px solid rgba(0, 0, 0, 0.1); -} - -small, -.small { - font-size: 80%; - font-weight: 400; -} - -mark, -.mark { - padding: 0.2em; - background-color: #fcf8e3; -} - -.list-unstyled { - padding-left: 0; - list-style: none; -} - -.list-inline { - padding-left: 0; - list-style: none; -} - -.list-inline-item { - display: inline-block; -} -.list-inline-item:not(:last-child) { - margin-right: 0.5rem; -} - -.initialism { - font-size: 90%; - text-transform: uppercase; -} - -.blockquote { - margin-bottom: 1rem; - font-size: 1.25rem; -} - -.blockquote-footer { - display: block; - font-size: 80%; - color: #6c757d; -} -.blockquote-footer::before { - content: "\2014\00A0"; -} - -.img-fluid { - max-width: 100%; - height: auto; -} - -.img-thumbnail { - padding: 0.25rem; - background-color: #fff; - border: 1px solid #dee2e6; - border-radius: 0.25rem; - max-width: 100%; - height: auto; -} - -.figure { - display: inline-block; -} - -.figure-img { - margin-bottom: 0.5rem; - line-height: 1; -} - -.figure-caption { - font-size: 90%; - color: #6c757d; -} - -code { - font-size: 87.5%; - color: #e83e8c; - word-wrap: break-word; -} -a > code { - color: inherit; -} - -kbd { - padding: 0.2rem 0.4rem; - font-size: 87.5%; - color: #fff; - background-color: #212529; - border-radius: 0.2rem; -} -kbd kbd { - padding: 0; - font-size: 100%; - font-weight: 700; -} - -pre { - display: block; - font-size: 87.5%; - color: #212529; -} -pre code { - font-size: inherit; - color: inherit; - word-break: 
normal; -} - -.pre-scrollable { - max-height: 340px; - overflow-y: scroll; -} - -.container, -.container-fluid, -.container-sm, -.container-md, -.container-lg, -.container-xl { - width: 100%; - padding-right: 15px; - padding-left: 15px; - margin-right: auto; - margin-left: auto; -} - -@media (min-width: 576px) { - .container, .container-sm { - max-width: 540px; - } -} -@media (min-width: 768px) { - .container, .container-sm, .container-md { - max-width: 720px; - } -} -@media (min-width: 992px) { - .container, .container-sm, .container-md, .container-lg { - max-width: 960px; - } -} -@media (min-width: 1200px) { - .container, .container-sm, .container-md, .container-lg, .container-xl { - max-width: 1140px; - } -} -.row { - display: -webkit-box; - display: -ms-flexbox; - display: flex; - -ms-flex-wrap: wrap; - flex-wrap: wrap; - margin-right: -15px; - margin-left: -15px; -} - -.no-gutters { - margin-right: 0; - margin-left: 0; -} -.no-gutters > .col, -.no-gutters > [class*="col-"] { - padding-right: 0; - padding-left: 0; -} - -.col-1, .col-2, .col-3, .col-4, .col-5, .col-6, .col-7, .col-8, .col-9, .col-10, .col-11, .col-12, .col, -.col-auto, .col-sm-1, .col-sm-2, .col-sm-3, .col-sm-4, .col-sm-5, .col-sm-6, .col-sm-7, .col-sm-8, .col-sm-9, .col-sm-10, .col-sm-11, .col-sm-12, .col-sm, -.col-sm-auto, .col-md-1, .col-md-2, .col-md-3, .col-md-4, .col-md-5, .col-md-6, .col-md-7, .col-md-8, .col-md-9, .col-md-10, .col-md-11, .col-md-12, .col-md, -.col-md-auto, .col-lg-1, .col-lg-2, .col-lg-3, .col-lg-4, .col-lg-5, .col-lg-6, .col-lg-7, .col-lg-8, .col-lg-9, .col-lg-10, .col-lg-11, .col-lg-12, .col-lg, -.col-lg-auto, .col-xl-1, .col-xl-2, .col-xl-3, .col-xl-4, .col-xl-5, .col-xl-6, .col-xl-7, .col-xl-8, .col-xl-9, .col-xl-10, .col-xl-11, .col-xl-12, .col-xl, -.col-xl-auto { - position: relative; - width: 100%; - padding-right: 15px; - padding-left: 15px; -} - -.col { - -ms-flex-preferred-size: 0; - flex-basis: 0; - -webkit-box-flex: 1; - -ms-flex-positive: 1; - flex-grow: 1; 
- max-width: 100%; -} - -.row-cols-1 > * { - -webkit-box-flex: 0; - -ms-flex: 0 0 100%; - flex: 0 0 100%; - max-width: 100%; -} - -.row-cols-2 > * { - -webkit-box-flex: 0; - -ms-flex: 0 0 50%; - flex: 0 0 50%; - max-width: 50%; -} - -.row-cols-3 > * { - -webkit-box-flex: 0; - -ms-flex: 0 0 33.3333333333%; - flex: 0 0 33.3333333333%; - max-width: 33.3333333333%; -} - -.row-cols-4 > * { - -webkit-box-flex: 0; - -ms-flex: 0 0 25%; - flex: 0 0 25%; - max-width: 25%; -} - -.row-cols-5 > * { - -webkit-box-flex: 0; - -ms-flex: 0 0 20%; - flex: 0 0 20%; - max-width: 20%; -} - -.row-cols-6 > * { - -webkit-box-flex: 0; - -ms-flex: 0 0 16.6666666667%; - flex: 0 0 16.6666666667%; - max-width: 16.6666666667%; -} - -.col-auto { - -webkit-box-flex: 0; - -ms-flex: 0 0 auto; - flex: 0 0 auto; - width: auto; - max-width: 100%; -} - -.col-1 { - -webkit-box-flex: 0; - -ms-flex: 0 0 8.33333333%; - flex: 0 0 8.33333333%; - max-width: 8.33333333%; -} - -.col-2 { - -webkit-box-flex: 0; - -ms-flex: 0 0 16.66666667%; - flex: 0 0 16.66666667%; - max-width: 16.66666667%; -} - -.col-3 { - -webkit-box-flex: 0; - -ms-flex: 0 0 25%; - flex: 0 0 25%; - max-width: 25%; -} - -.col-4 { - -webkit-box-flex: 0; - -ms-flex: 0 0 33.33333333%; - flex: 0 0 33.33333333%; - max-width: 33.33333333%; -} - -.col-5 { - -webkit-box-flex: 0; - -ms-flex: 0 0 41.66666667%; - flex: 0 0 41.66666667%; - max-width: 41.66666667%; -} - -.col-6 { - -webkit-box-flex: 0; - -ms-flex: 0 0 50%; - flex: 0 0 50%; - max-width: 50%; -} - -.col-7 { - -webkit-box-flex: 0; - -ms-flex: 0 0 58.33333333%; - flex: 0 0 58.33333333%; - max-width: 58.33333333%; -} - -.col-8 { - -webkit-box-flex: 0; - -ms-flex: 0 0 66.66666667%; - flex: 0 0 66.66666667%; - max-width: 66.66666667%; -} - -.col-9 { - -webkit-box-flex: 0; - -ms-flex: 0 0 75%; - flex: 0 0 75%; - max-width: 75%; -} - -.col-10 { - -webkit-box-flex: 0; - -ms-flex: 0 0 83.33333333%; - flex: 0 0 83.33333333%; - max-width: 83.33333333%; -} - -.col-11 { - -webkit-box-flex: 0; - -ms-flex: 
0 0 91.66666667%; - flex: 0 0 91.66666667%; - max-width: 91.66666667%; -} - -.col-12 { - -webkit-box-flex: 0; - -ms-flex: 0 0 100%; - flex: 0 0 100%; - max-width: 100%; -} - -.order-first { - -webkit-box-ordinal-group: 0; - -ms-flex-order: -1; - order: -1; -} - -.order-last { - -webkit-box-ordinal-group: 14; - -ms-flex-order: 13; - order: 13; -} - -.order-0 { - -webkit-box-ordinal-group: 1; - -ms-flex-order: 0; - order: 0; -} - -.order-1 { - -webkit-box-ordinal-group: 2; - -ms-flex-order: 1; - order: 1; -} - -.order-2 { - -webkit-box-ordinal-group: 3; - -ms-flex-order: 2; - order: 2; -} - -.order-3 { - -webkit-box-ordinal-group: 4; - -ms-flex-order: 3; - order: 3; -} - -.order-4 { - -webkit-box-ordinal-group: 5; - -ms-flex-order: 4; - order: 4; -} - -.order-5 { - -webkit-box-ordinal-group: 6; - -ms-flex-order: 5; - order: 5; -} - -.order-6 { - -webkit-box-ordinal-group: 7; - -ms-flex-order: 6; - order: 6; -} - -.order-7 { - -webkit-box-ordinal-group: 8; - -ms-flex-order: 7; - order: 7; -} - -.order-8 { - -webkit-box-ordinal-group: 9; - -ms-flex-order: 8; - order: 8; -} - -.order-9 { - -webkit-box-ordinal-group: 10; - -ms-flex-order: 9; - order: 9; -} - -.order-10 { - -webkit-box-ordinal-group: 11; - -ms-flex-order: 10; - order: 10; -} - -.order-11 { - -webkit-box-ordinal-group: 12; - -ms-flex-order: 11; - order: 11; -} - -.order-12 { - -webkit-box-ordinal-group: 13; - -ms-flex-order: 12; - order: 12; -} - -.offset-1 { - margin-left: 8.33333333%; -} - -.offset-2 { - margin-left: 16.66666667%; -} - -.offset-3 { - margin-left: 25%; -} - -.offset-4 { - margin-left: 33.33333333%; -} - -.offset-5 { - margin-left: 41.66666667%; -} - -.offset-6 { - margin-left: 50%; -} - -.offset-7 { - margin-left: 58.33333333%; -} - -.offset-8 { - margin-left: 66.66666667%; -} - -.offset-9 { - margin-left: 75%; -} - -.offset-10 { - margin-left: 83.33333333%; -} - -.offset-11 { - margin-left: 91.66666667%; -} - -@media (min-width: 576px) { - .col-sm { - -ms-flex-preferred-size: 0; - 
flex-basis: 0; - -webkit-box-flex: 1; - -ms-flex-positive: 1; - flex-grow: 1; - max-width: 100%; - } - - .row-cols-sm-1 > * { - -webkit-box-flex: 0; - -ms-flex: 0 0 100%; - flex: 0 0 100%; - max-width: 100%; - } - - .row-cols-sm-2 > * { - -webkit-box-flex: 0; - -ms-flex: 0 0 50%; - flex: 0 0 50%; - max-width: 50%; - } - - .row-cols-sm-3 > * { - -webkit-box-flex: 0; - -ms-flex: 0 0 33.3333333333%; - flex: 0 0 33.3333333333%; - max-width: 33.3333333333%; - } - - .row-cols-sm-4 > * { - -webkit-box-flex: 0; - -ms-flex: 0 0 25%; - flex: 0 0 25%; - max-width: 25%; - } - - .row-cols-sm-5 > * { - -webkit-box-flex: 0; - -ms-flex: 0 0 20%; - flex: 0 0 20%; - max-width: 20%; - } - - .row-cols-sm-6 > * { - -webkit-box-flex: 0; - -ms-flex: 0 0 16.6666666667%; - flex: 0 0 16.6666666667%; - max-width: 16.6666666667%; - } - - .col-sm-auto { - -webkit-box-flex: 0; - -ms-flex: 0 0 auto; - flex: 0 0 auto; - width: auto; - max-width: 100%; - } - - .col-sm-1 { - -webkit-box-flex: 0; - -ms-flex: 0 0 8.33333333%; - flex: 0 0 8.33333333%; - max-width: 8.33333333%; - } - - .col-sm-2 { - -webkit-box-flex: 0; - -ms-flex: 0 0 16.66666667%; - flex: 0 0 16.66666667%; - max-width: 16.66666667%; - } - - .col-sm-3 { - -webkit-box-flex: 0; - -ms-flex: 0 0 25%; - flex: 0 0 25%; - max-width: 25%; - } - - .col-sm-4 { - -webkit-box-flex: 0; - -ms-flex: 0 0 33.33333333%; - flex: 0 0 33.33333333%; - max-width: 33.33333333%; - } - - .col-sm-5 { - -webkit-box-flex: 0; - -ms-flex: 0 0 41.66666667%; - flex: 0 0 41.66666667%; - max-width: 41.66666667%; - } - - .col-sm-6 { - -webkit-box-flex: 0; - -ms-flex: 0 0 50%; - flex: 0 0 50%; - max-width: 50%; - } - - .col-sm-7 { - -webkit-box-flex: 0; - -ms-flex: 0 0 58.33333333%; - flex: 0 0 58.33333333%; - max-width: 58.33333333%; - } - - .col-sm-8 { - -webkit-box-flex: 0; - -ms-flex: 0 0 66.66666667%; - flex: 0 0 66.66666667%; - max-width: 66.66666667%; - } - - .col-sm-9 { - -webkit-box-flex: 0; - -ms-flex: 0 0 75%; - flex: 0 0 75%; - max-width: 75%; - } - - 
.col-sm-10 { - -webkit-box-flex: 0; - -ms-flex: 0 0 83.33333333%; - flex: 0 0 83.33333333%; - max-width: 83.33333333%; - } - - .col-sm-11 { - -webkit-box-flex: 0; - -ms-flex: 0 0 91.66666667%; - flex: 0 0 91.66666667%; - max-width: 91.66666667%; - } - - .col-sm-12 { - -webkit-box-flex: 0; - -ms-flex: 0 0 100%; - flex: 0 0 100%; - max-width: 100%; - } - - .order-sm-first { - -webkit-box-ordinal-group: 0; - -ms-flex-order: -1; - order: -1; - } - - .order-sm-last { - -webkit-box-ordinal-group: 14; - -ms-flex-order: 13; - order: 13; - } - - .order-sm-0 { - -webkit-box-ordinal-group: 1; - -ms-flex-order: 0; - order: 0; - } - - .order-sm-1 { - -webkit-box-ordinal-group: 2; - -ms-flex-order: 1; - order: 1; - } - - .order-sm-2 { - -webkit-box-ordinal-group: 3; - -ms-flex-order: 2; - order: 2; - } - - .order-sm-3 { - -webkit-box-ordinal-group: 4; - -ms-flex-order: 3; - order: 3; - } - - .order-sm-4 { - -webkit-box-ordinal-group: 5; - -ms-flex-order: 4; - order: 4; - } - - .order-sm-5 { - -webkit-box-ordinal-group: 6; - -ms-flex-order: 5; - order: 5; - } - - .order-sm-6 { - -webkit-box-ordinal-group: 7; - -ms-flex-order: 6; - order: 6; - } - - .order-sm-7 { - -webkit-box-ordinal-group: 8; - -ms-flex-order: 7; - order: 7; - } - - .order-sm-8 { - -webkit-box-ordinal-group: 9; - -ms-flex-order: 8; - order: 8; - } - - .order-sm-9 { - -webkit-box-ordinal-group: 10; - -ms-flex-order: 9; - order: 9; - } - - .order-sm-10 { - -webkit-box-ordinal-group: 11; - -ms-flex-order: 10; - order: 10; - } - - .order-sm-11 { - -webkit-box-ordinal-group: 12; - -ms-flex-order: 11; - order: 11; - } - - .order-sm-12 { - -webkit-box-ordinal-group: 13; - -ms-flex-order: 12; - order: 12; - } - - .offset-sm-0 { - margin-left: 0; - } - - .offset-sm-1 { - margin-left: 8.33333333%; - } - - .offset-sm-2 { - margin-left: 16.66666667%; - } - - .offset-sm-3 { - margin-left: 25%; - } - - .offset-sm-4 { - margin-left: 33.33333333%; - } - - .offset-sm-5 { - margin-left: 41.66666667%; - } - - .offset-sm-6 { - 
margin-left: 50%; - } - - .offset-sm-7 { - margin-left: 58.33333333%; - } - - .offset-sm-8 { - margin-left: 66.66666667%; - } - - .offset-sm-9 { - margin-left: 75%; - } - - .offset-sm-10 { - margin-left: 83.33333333%; - } - - .offset-sm-11 { - margin-left: 91.66666667%; - } -} -@media (min-width: 768px) { - .col-md { - -ms-flex-preferred-size: 0; - flex-basis: 0; - -webkit-box-flex: 1; - -ms-flex-positive: 1; - flex-grow: 1; - max-width: 100%; - } - - .row-cols-md-1 > * { - -webkit-box-flex: 0; - -ms-flex: 0 0 100%; - flex: 0 0 100%; - max-width: 100%; - } - - .row-cols-md-2 > * { - -webkit-box-flex: 0; - -ms-flex: 0 0 50%; - flex: 0 0 50%; - max-width: 50%; - } - - .row-cols-md-3 > * { - -webkit-box-flex: 0; - -ms-flex: 0 0 33.3333333333%; - flex: 0 0 33.3333333333%; - max-width: 33.3333333333%; - } - - .row-cols-md-4 > * { - -webkit-box-flex: 0; - -ms-flex: 0 0 25%; - flex: 0 0 25%; - max-width: 25%; - } - - .row-cols-md-5 > * { - -webkit-box-flex: 0; - -ms-flex: 0 0 20%; - flex: 0 0 20%; - max-width: 20%; - } - - .row-cols-md-6 > * { - -webkit-box-flex: 0; - -ms-flex: 0 0 16.6666666667%; - flex: 0 0 16.6666666667%; - max-width: 16.6666666667%; - } - - .col-md-auto { - -webkit-box-flex: 0; - -ms-flex: 0 0 auto; - flex: 0 0 auto; - width: auto; - max-width: 100%; - } - - .col-md-1 { - -webkit-box-flex: 0; - -ms-flex: 0 0 8.33333333%; - flex: 0 0 8.33333333%; - max-width: 8.33333333%; - } - - .col-md-2 { - -webkit-box-flex: 0; - -ms-flex: 0 0 16.66666667%; - flex: 0 0 16.66666667%; - max-width: 16.66666667%; - } - - .col-md-3 { - -webkit-box-flex: 0; - -ms-flex: 0 0 25%; - flex: 0 0 25%; - max-width: 25%; - } - - .col-md-4 { - -webkit-box-flex: 0; - -ms-flex: 0 0 33.33333333%; - flex: 0 0 33.33333333%; - max-width: 33.33333333%; - } - - .col-md-5 { - -webkit-box-flex: 0; - -ms-flex: 0 0 41.66666667%; - flex: 0 0 41.66666667%; - max-width: 41.66666667%; - } - - .col-md-6 { - -webkit-box-flex: 0; - -ms-flex: 0 0 50%; - flex: 0 0 50%; - max-width: 50%; - } - - 
.col-md-7 { - -webkit-box-flex: 0; - -ms-flex: 0 0 58.33333333%; - flex: 0 0 58.33333333%; - max-width: 58.33333333%; - } - - .col-md-8 { - -webkit-box-flex: 0; - -ms-flex: 0 0 66.66666667%; - flex: 0 0 66.66666667%; - max-width: 66.66666667%; - } - - .col-md-9 { - -webkit-box-flex: 0; - -ms-flex: 0 0 75%; - flex: 0 0 75%; - max-width: 75%; - } - - .col-md-10 { - -webkit-box-flex: 0; - -ms-flex: 0 0 83.33333333%; - flex: 0 0 83.33333333%; - max-width: 83.33333333%; - } - - .col-md-11 { - -webkit-box-flex: 0; - -ms-flex: 0 0 91.66666667%; - flex: 0 0 91.66666667%; - max-width: 91.66666667%; - } - - .col-md-12 { - -webkit-box-flex: 0; - -ms-flex: 0 0 100%; - flex: 0 0 100%; - max-width: 100%; - } - - .order-md-first { - -webkit-box-ordinal-group: 0; - -ms-flex-order: -1; - order: -1; - } - - .order-md-last { - -webkit-box-ordinal-group: 14; - -ms-flex-order: 13; - order: 13; - } - - .order-md-0 { - -webkit-box-ordinal-group: 1; - -ms-flex-order: 0; - order: 0; - } - - .order-md-1 { - -webkit-box-ordinal-group: 2; - -ms-flex-order: 1; - order: 1; - } - - .order-md-2 { - -webkit-box-ordinal-group: 3; - -ms-flex-order: 2; - order: 2; - } - - .order-md-3 { - -webkit-box-ordinal-group: 4; - -ms-flex-order: 3; - order: 3; - } - - .order-md-4 { - -webkit-box-ordinal-group: 5; - -ms-flex-order: 4; - order: 4; - } - - .order-md-5 { - -webkit-box-ordinal-group: 6; - -ms-flex-order: 5; - order: 5; - } - - .order-md-6 { - -webkit-box-ordinal-group: 7; - -ms-flex-order: 6; - order: 6; - } - - .order-md-7 { - -webkit-box-ordinal-group: 8; - -ms-flex-order: 7; - order: 7; - } - - .order-md-8 { - -webkit-box-ordinal-group: 9; - -ms-flex-order: 8; - order: 8; - } - - .order-md-9 { - -webkit-box-ordinal-group: 10; - -ms-flex-order: 9; - order: 9; - } - - .order-md-10 { - -webkit-box-ordinal-group: 11; - -ms-flex-order: 10; - order: 10; - } - - .order-md-11 { - -webkit-box-ordinal-group: 12; - -ms-flex-order: 11; - order: 11; - } - - .order-md-12 { - -webkit-box-ordinal-group: 13; - 
-ms-flex-order: 12; - order: 12; - } - - .offset-md-0 { - margin-left: 0; - } - - .offset-md-1 { - margin-left: 8.33333333%; - } - - .offset-md-2 { - margin-left: 16.66666667%; - } - - .offset-md-3 { - margin-left: 25%; - } - - .offset-md-4 { - margin-left: 33.33333333%; - } - - .offset-md-5 { - margin-left: 41.66666667%; - } - - .offset-md-6 { - margin-left: 50%; - } - - .offset-md-7 { - margin-left: 58.33333333%; - } - - .offset-md-8 { - margin-left: 66.66666667%; - } - - .offset-md-9 { - margin-left: 75%; - } - - .offset-md-10 { - margin-left: 83.33333333%; - } - - .offset-md-11 { - margin-left: 91.66666667%; - } -} -@media (min-width: 992px) { - .col-lg { - -ms-flex-preferred-size: 0; - flex-basis: 0; - -webkit-box-flex: 1; - -ms-flex-positive: 1; - flex-grow: 1; - max-width: 100%; - } - - .row-cols-lg-1 > * { - -webkit-box-flex: 0; - -ms-flex: 0 0 100%; - flex: 0 0 100%; - max-width: 100%; - } - - .row-cols-lg-2 > * { - -webkit-box-flex: 0; - -ms-flex: 0 0 50%; - flex: 0 0 50%; - max-width: 50%; - } - - .row-cols-lg-3 > * { - -webkit-box-flex: 0; - -ms-flex: 0 0 33.3333333333%; - flex: 0 0 33.3333333333%; - max-width: 33.3333333333%; - } - - .row-cols-lg-4 > * { - -webkit-box-flex: 0; - -ms-flex: 0 0 25%; - flex: 0 0 25%; - max-width: 25%; - } - - .row-cols-lg-5 > * { - -webkit-box-flex: 0; - -ms-flex: 0 0 20%; - flex: 0 0 20%; - max-width: 20%; - } - - .row-cols-lg-6 > * { - -webkit-box-flex: 0; - -ms-flex: 0 0 16.6666666667%; - flex: 0 0 16.6666666667%; - max-width: 16.6666666667%; - } - - .col-lg-auto { - -webkit-box-flex: 0; - -ms-flex: 0 0 auto; - flex: 0 0 auto; - width: auto; - max-width: 100%; - } - - .col-lg-1 { - -webkit-box-flex: 0; - -ms-flex: 0 0 8.33333333%; - flex: 0 0 8.33333333%; - max-width: 8.33333333%; - } - - .col-lg-2 { - -webkit-box-flex: 0; - -ms-flex: 0 0 16.66666667%; - flex: 0 0 16.66666667%; - max-width: 16.66666667%; - } - - .col-lg-3 { - -webkit-box-flex: 0; - -ms-flex: 0 0 25%; - flex: 0 0 25%; - max-width: 25%; - } - - .col-lg-4 
{ - -webkit-box-flex: 0; - -ms-flex: 0 0 33.33333333%; - flex: 0 0 33.33333333%; - max-width: 33.33333333%; - } - - .col-lg-5 { - -webkit-box-flex: 0; - -ms-flex: 0 0 41.66666667%; - flex: 0 0 41.66666667%; - max-width: 41.66666667%; - } - - .col-lg-6 { - -webkit-box-flex: 0; - -ms-flex: 0 0 50%; - flex: 0 0 50%; - max-width: 50%; - } - - .col-lg-7 { - -webkit-box-flex: 0; - -ms-flex: 0 0 58.33333333%; - flex: 0 0 58.33333333%; - max-width: 58.33333333%; - } - - .col-lg-8 { - -webkit-box-flex: 0; - -ms-flex: 0 0 66.66666667%; - flex: 0 0 66.66666667%; - max-width: 66.66666667%; - } - - .col-lg-9 { - -webkit-box-flex: 0; - -ms-flex: 0 0 75%; - flex: 0 0 75%; - max-width: 75%; - } - - .col-lg-10 { - -webkit-box-flex: 0; - -ms-flex: 0 0 83.33333333%; - flex: 0 0 83.33333333%; - max-width: 83.33333333%; - } - - .col-lg-11 { - -webkit-box-flex: 0; - -ms-flex: 0 0 91.66666667%; - flex: 0 0 91.66666667%; - max-width: 91.66666667%; - } - - .col-lg-12 { - -webkit-box-flex: 0; - -ms-flex: 0 0 100%; - flex: 0 0 100%; - max-width: 100%; - } - - .order-lg-first { - -webkit-box-ordinal-group: 0; - -ms-flex-order: -1; - order: -1; - } - - .order-lg-last { - -webkit-box-ordinal-group: 14; - -ms-flex-order: 13; - order: 13; - } - - .order-lg-0 { - -webkit-box-ordinal-group: 1; - -ms-flex-order: 0; - order: 0; - } - - .order-lg-1 { - -webkit-box-ordinal-group: 2; - -ms-flex-order: 1; - order: 1; - } - - .order-lg-2 { - -webkit-box-ordinal-group: 3; - -ms-flex-order: 2; - order: 2; - } - - .order-lg-3 { - -webkit-box-ordinal-group: 4; - -ms-flex-order: 3; - order: 3; - } - - .order-lg-4 { - -webkit-box-ordinal-group: 5; - -ms-flex-order: 4; - order: 4; - } - - .order-lg-5 { - -webkit-box-ordinal-group: 6; - -ms-flex-order: 5; - order: 5; - } - - .order-lg-6 { - -webkit-box-ordinal-group: 7; - -ms-flex-order: 6; - order: 6; - } - - .order-lg-7 { - -webkit-box-ordinal-group: 8; - -ms-flex-order: 7; - order: 7; - } - - .order-lg-8 { - -webkit-box-ordinal-group: 9; - -ms-flex-order: 8; - 
order: 8; - } - - .order-lg-9 { - -webkit-box-ordinal-group: 10; - -ms-flex-order: 9; - order: 9; - } - - .order-lg-10 { - -webkit-box-ordinal-group: 11; - -ms-flex-order: 10; - order: 10; - } - - .order-lg-11 { - -webkit-box-ordinal-group: 12; - -ms-flex-order: 11; - order: 11; - } - - .order-lg-12 { - -webkit-box-ordinal-group: 13; - -ms-flex-order: 12; - order: 12; - } - - .offset-lg-0 { - margin-left: 0; - } - - .offset-lg-1 { - margin-left: 8.33333333%; - } - - .offset-lg-2 { - margin-left: 16.66666667%; - } - - .offset-lg-3 { - margin-left: 25%; - } - - .offset-lg-4 { - margin-left: 33.33333333%; - } - - .offset-lg-5 { - margin-left: 41.66666667%; - } - - .offset-lg-6 { - margin-left: 50%; - } - - .offset-lg-7 { - margin-left: 58.33333333%; - } - - .offset-lg-8 { - margin-left: 66.66666667%; - } - - .offset-lg-9 { - margin-left: 75%; - } - - .offset-lg-10 { - margin-left: 83.33333333%; - } - - .offset-lg-11 { - margin-left: 91.66666667%; - } -} -@media (min-width: 1200px) { - .col-xl { - -ms-flex-preferred-size: 0; - flex-basis: 0; - -webkit-box-flex: 1; - -ms-flex-positive: 1; - flex-grow: 1; - max-width: 100%; - } - - .row-cols-xl-1 > * { - -webkit-box-flex: 0; - -ms-flex: 0 0 100%; - flex: 0 0 100%; - max-width: 100%; - } - - .row-cols-xl-2 > * { - -webkit-box-flex: 0; - -ms-flex: 0 0 50%; - flex: 0 0 50%; - max-width: 50%; - } - - .row-cols-xl-3 > * { - -webkit-box-flex: 0; - -ms-flex: 0 0 33.3333333333%; - flex: 0 0 33.3333333333%; - max-width: 33.3333333333%; - } - - .row-cols-xl-4 > * { - -webkit-box-flex: 0; - -ms-flex: 0 0 25%; - flex: 0 0 25%; - max-width: 25%; - } - - .row-cols-xl-5 > * { - -webkit-box-flex: 0; - -ms-flex: 0 0 20%; - flex: 0 0 20%; - max-width: 20%; - } - - .row-cols-xl-6 > * { - -webkit-box-flex: 0; - -ms-flex: 0 0 16.6666666667%; - flex: 0 0 16.6666666667%; - max-width: 16.6666666667%; - } - - .col-xl-auto { - -webkit-box-flex: 0; - -ms-flex: 0 0 auto; - flex: 0 0 auto; - width: auto; - max-width: 100%; - } - - .col-xl-1 { - 
-webkit-box-flex: 0; - -ms-flex: 0 0 8.33333333%; - flex: 0 0 8.33333333%; - max-width: 8.33333333%; - } - - .col-xl-2 { - -webkit-box-flex: 0; - -ms-flex: 0 0 16.66666667%; - flex: 0 0 16.66666667%; - max-width: 16.66666667%; - } - - .col-xl-3 { - -webkit-box-flex: 0; - -ms-flex: 0 0 25%; - flex: 0 0 25%; - max-width: 25%; - } - - .col-xl-4 { - -webkit-box-flex: 0; - -ms-flex: 0 0 33.33333333%; - flex: 0 0 33.33333333%; - max-width: 33.33333333%; - } - - .col-xl-5 { - -webkit-box-flex: 0; - -ms-flex: 0 0 41.66666667%; - flex: 0 0 41.66666667%; - max-width: 41.66666667%; - } - - .col-xl-6 { - -webkit-box-flex: 0; - -ms-flex: 0 0 50%; - flex: 0 0 50%; - max-width: 50%; - } - - .col-xl-7 { - -webkit-box-flex: 0; - -ms-flex: 0 0 58.33333333%; - flex: 0 0 58.33333333%; - max-width: 58.33333333%; - } - - .col-xl-8 { - -webkit-box-flex: 0; - -ms-flex: 0 0 66.66666667%; - flex: 0 0 66.66666667%; - max-width: 66.66666667%; - } - - .col-xl-9 { - -webkit-box-flex: 0; - -ms-flex: 0 0 75%; - flex: 0 0 75%; - max-width: 75%; - } - - .col-xl-10 { - -webkit-box-flex: 0; - -ms-flex: 0 0 83.33333333%; - flex: 0 0 83.33333333%; - max-width: 83.33333333%; - } - - .col-xl-11 { - -webkit-box-flex: 0; - -ms-flex: 0 0 91.66666667%; - flex: 0 0 91.66666667%; - max-width: 91.66666667%; - } - - .col-xl-12 { - -webkit-box-flex: 0; - -ms-flex: 0 0 100%; - flex: 0 0 100%; - max-width: 100%; - } - - .order-xl-first { - -webkit-box-ordinal-group: 0; - -ms-flex-order: -1; - order: -1; - } - - .order-xl-last { - -webkit-box-ordinal-group: 14; - -ms-flex-order: 13; - order: 13; - } - - .order-xl-0 { - -webkit-box-ordinal-group: 1; - -ms-flex-order: 0; - order: 0; - } - - .order-xl-1 { - -webkit-box-ordinal-group: 2; - -ms-flex-order: 1; - order: 1; - } - - .order-xl-2 { - -webkit-box-ordinal-group: 3; - -ms-flex-order: 2; - order: 2; - } - - .order-xl-3 { - -webkit-box-ordinal-group: 4; - -ms-flex-order: 3; - order: 3; - } - - .order-xl-4 { - -webkit-box-ordinal-group: 5; - -ms-flex-order: 4; - 
order: 4; - } - - .order-xl-5 { - -webkit-box-ordinal-group: 6; - -ms-flex-order: 5; - order: 5; - } - - .order-xl-6 { - -webkit-box-ordinal-group: 7; - -ms-flex-order: 6; - order: 6; - } - - .order-xl-7 { - -webkit-box-ordinal-group: 8; - -ms-flex-order: 7; - order: 7; - } - - .order-xl-8 { - -webkit-box-ordinal-group: 9; - -ms-flex-order: 8; - order: 8; - } - - .order-xl-9 { - -webkit-box-ordinal-group: 10; - -ms-flex-order: 9; - order: 9; - } - - .order-xl-10 { - -webkit-box-ordinal-group: 11; - -ms-flex-order: 10; - order: 10; - } - - .order-xl-11 { - -webkit-box-ordinal-group: 12; - -ms-flex-order: 11; - order: 11; - } - - .order-xl-12 { - -webkit-box-ordinal-group: 13; - -ms-flex-order: 12; - order: 12; - } - - .offset-xl-0 { - margin-left: 0; - } - - .offset-xl-1 { - margin-left: 8.33333333%; - } - - .offset-xl-2 { - margin-left: 16.66666667%; - } - - .offset-xl-3 { - margin-left: 25%; - } - - .offset-xl-4 { - margin-left: 33.33333333%; - } - - .offset-xl-5 { - margin-left: 41.66666667%; - } - - .offset-xl-6 { - margin-left: 50%; - } - - .offset-xl-7 { - margin-left: 58.33333333%; - } - - .offset-xl-8 { - margin-left: 66.66666667%; - } - - .offset-xl-9 { - margin-left: 75%; - } - - .offset-xl-10 { - margin-left: 83.33333333%; - } - - .offset-xl-11 { - margin-left: 91.66666667%; - } -} -.table { - width: 100%; - margin-bottom: 1rem; - color: #212529; -} -.table th, -.table td { - padding: 0.75rem; - vertical-align: top; - border-top: 1px solid #dee2e6; -} -.table thead th { - vertical-align: bottom; - border-bottom: 2px solid #dee2e6; -} -.table tbody + tbody { - border-top: 2px solid #dee2e6; -} - -.table-sm th, -.table-sm td { - padding: 0.3rem; -} - -.table-bordered { - border: 1px solid #dee2e6; -} -.table-bordered th, -.table-bordered td { - border: 1px solid #dee2e6; -} -.table-bordered thead th, -.table-bordered thead td { - border-bottom-width: 2px; -} - -.table-borderless th, -.table-borderless td, -.table-borderless thead th, -.table-borderless 
tbody + tbody { - border: 0; -} - -.table-striped tbody tr:nth-of-type(odd) { - background-color: rgba(0, 0, 0, 0.05); -} - -.table-hover tbody tr:hover { - color: #212529; - background-color: rgba(0, 0, 0, 0.075); -} - -.table-primary, -.table-primary > th, -.table-primary > td { - background-color: #b8daff; -} -.table-primary th, -.table-primary td, -.table-primary thead th, -.table-primary tbody + tbody { - border-color: #7abaff; -} - -.table-hover .table-primary:hover { - background-color: #9fcdff; -} -.table-hover .table-primary:hover > td, -.table-hover .table-primary:hover > th { - background-color: #9fcdff; -} - -.table-secondary, -.table-secondary > th, -.table-secondary > td { - background-color: #d6d8db; -} -.table-secondary th, -.table-secondary td, -.table-secondary thead th, -.table-secondary tbody + tbody { - border-color: #b3b7bb; -} - -.table-hover .table-secondary:hover { - background-color: #c8cbcf; -} -.table-hover .table-secondary:hover > td, -.table-hover .table-secondary:hover > th { - background-color: #c8cbcf; -} - -.table-success, -.table-success > th, -.table-success > td { - background-color: #c3e6cb; -} -.table-success th, -.table-success td, -.table-success thead th, -.table-success tbody + tbody { - border-color: #8fd19e; -} - -.table-hover .table-success:hover { - background-color: #b1dfbb; -} -.table-hover .table-success:hover > td, -.table-hover .table-success:hover > th { - background-color: #b1dfbb; -} - -.table-info, -.table-info > th, -.table-info > td { - background-color: #bee5eb; -} -.table-info th, -.table-info td, -.table-info thead th, -.table-info tbody + tbody { - border-color: #86cfda; -} - -.table-hover .table-info:hover { - background-color: #abdde5; -} -.table-hover .table-info:hover > td, -.table-hover .table-info:hover > th { - background-color: #abdde5; -} - -.table-warning, -.table-warning > th, -.table-warning > td { - background-color: #ffeeba; -} -.table-warning th, -.table-warning td, -.table-warning thead 
th, -.table-warning tbody + tbody { - border-color: #ffdf7e; -} - -.table-hover .table-warning:hover { - background-color: #ffe8a1; -} -.table-hover .table-warning:hover > td, -.table-hover .table-warning:hover > th { - background-color: #ffe8a1; -} - -.table-danger, -.table-danger > th, -.table-danger > td { - background-color: #f5c6cb; -} -.table-danger th, -.table-danger td, -.table-danger thead th, -.table-danger tbody + tbody { - border-color: #ed969e; -} - -.table-hover .table-danger:hover { - background-color: #f1b0b7; -} -.table-hover .table-danger:hover > td, -.table-hover .table-danger:hover > th { - background-color: #f1b0b7; -} - -.table-light, -.table-light > th, -.table-light > td { - background-color: #fdfdfe; -} -.table-light th, -.table-light td, -.table-light thead th, -.table-light tbody + tbody { - border-color: #fbfcfc; -} - -.table-hover .table-light:hover { - background-color: #ececf6; -} -.table-hover .table-light:hover > td, -.table-hover .table-light:hover > th { - background-color: #ececf6; -} - -.table-dark, -.table-dark > th, -.table-dark > td { - background-color: #c6c8ca; -} -.table-dark th, -.table-dark td, -.table-dark thead th, -.table-dark tbody + tbody { - border-color: #95999c; -} - -.table-hover .table-dark:hover { - background-color: #b9bbbe; -} -.table-hover .table-dark:hover > td, -.table-hover .table-dark:hover > th { - background-color: #b9bbbe; -} - -.table-active, -.table-active > th, -.table-active > td { - background-color: rgba(0, 0, 0, 0.075); -} - -.table-hover .table-active:hover { - background-color: rgba(0, 0, 0, 0.075); -} -.table-hover .table-active:hover > td, -.table-hover .table-active:hover > th { - background-color: rgba(0, 0, 0, 0.075); -} - -.table .thead-dark th { - color: #fff; - background-color: #343a40; - border-color: #454d55; -} -.table .thead-light th { - color: #495057; - background-color: #e9ecef; - border-color: #dee2e6; -} - -.table-dark { - color: #fff; - background-color: #343a40; -} 
-.table-dark th, -.table-dark td, -.table-dark thead th { - border-color: #454d55; -} -.table-dark.table-bordered { - border: 0; -} -.table-dark.table-striped tbody tr:nth-of-type(odd) { - background-color: rgba(255, 255, 255, 0.05); -} -.table-dark.table-hover tbody tr:hover { - color: #fff; - background-color: rgba(255, 255, 255, 0.075); -} - -@media (max-width: 575.98px) { - .table-responsive-sm { - display: block; - width: 100%; - overflow-x: auto; - -webkit-overflow-scrolling: touch; - } - .table-responsive-sm > .table-bordered { - border: 0; - } -} -@media (max-width: 767.98px) { - .table-responsive-md { - display: block; - width: 100%; - overflow-x: auto; - -webkit-overflow-scrolling: touch; - } - .table-responsive-md > .table-bordered { - border: 0; - } -} -@media (max-width: 991.98px) { - .table-responsive-lg { - display: block; - width: 100%; - overflow-x: auto; - -webkit-overflow-scrolling: touch; - } - .table-responsive-lg > .table-bordered { - border: 0; - } -} -@media (max-width: 1199.98px) { - .table-responsive-xl { - display: block; - width: 100%; - overflow-x: auto; - -webkit-overflow-scrolling: touch; - } - .table-responsive-xl > .table-bordered { - border: 0; - } -} -.table-responsive { - display: block; - width: 100%; - overflow-x: auto; - -webkit-overflow-scrolling: touch; -} -.table-responsive > .table-bordered { - border: 0; -} - -.form-control { - display: block; - width: 100%; - height: calc(1.5em + 0.75rem + 2px); - padding: 0.375rem 0.75rem; - font-size: 1rem; - font-weight: 400; - line-height: 1.5; - color: #495057; - background-color: #fff; - background-clip: padding-box; - border: 1px solid #ced4da; - border-radius: 0.25rem; - -webkit-transition: border-color 0.15s ease-in-out, -webkit-box-shadow 0.15s ease-in-out; - transition: border-color 0.15s ease-in-out, -webkit-box-shadow 0.15s ease-in-out; - transition: border-color 0.15s ease-in-out, box-shadow 0.15s ease-in-out; - transition: border-color 0.15s ease-in-out, box-shadow 0.15s 
ease-in-out, -webkit-box-shadow 0.15s ease-in-out; -} -@media (prefers-reduced-motion: reduce) { - .form-control { - -webkit-transition: none; - transition: none; - } -} -.form-control::-ms-expand { - background-color: transparent; - border: 0; -} -.form-control:focus { - color: #495057; - background-color: #fff; - border-color: #80bdff; - outline: 0; - -webkit-box-shadow: 0 0 0 0.2rem rgba(0, 123, 255, 0.25); - box-shadow: 0 0 0 0.2rem rgba(0, 123, 255, 0.25); -} -.form-control::-webkit-input-placeholder { - color: #6c757d; - opacity: 1; -} -.form-control::-moz-placeholder { - color: #6c757d; - opacity: 1; -} -.form-control:-ms-input-placeholder { - color: #6c757d; - opacity: 1; -} -.form-control::-ms-input-placeholder { - color: #6c757d; - opacity: 1; -} -.form-control::placeholder { - color: #6c757d; - opacity: 1; -} -.form-control:disabled, .form-control[readonly] { - background-color: #e9ecef; - opacity: 1; -} - -input[type="date"].form-control, -input[type="time"].form-control, -input[type="datetime-local"].form-control, -input[type="month"].form-control { - -webkit-appearance: none; - -moz-appearance: none; - appearance: none; -} - -select.form-control:-moz-focusring { - color: transparent; - text-shadow: 0 0 0 #495057; -} -select.form-control:focus::-ms-value { - color: #495057; - background-color: #fff; -} - -.form-control-file, -.form-control-range { - display: block; - width: 100%; -} - -.col-form-label { - padding-top: calc(0.375rem + 1px); - padding-bottom: calc(0.375rem + 1px); - margin-bottom: 0; - font-size: inherit; - line-height: 1.5; -} - -.col-form-label-lg { - padding-top: calc(0.5rem + 1px); - padding-bottom: calc(0.5rem + 1px); - font-size: 1.25rem; - line-height: 1.5; -} - -.col-form-label-sm { - padding-top: calc(0.25rem + 1px); - padding-bottom: calc(0.25rem + 1px); - font-size: 0.875rem; - line-height: 1.5; -} - -.form-control-plaintext { - display: block; - width: 100%; - padding: 0.375rem 0; - margin-bottom: 0; - font-size: 1rem; - 
line-height: 1.5; - color: #212529; - background-color: transparent; - border: solid transparent; - border-width: 1px 0; -} -.form-control-plaintext.form-control-sm, .form-control-plaintext.form-control-lg { - padding-right: 0; - padding-left: 0; -} - -.form-control-sm { - height: calc(1.5em + 0.5rem + 2px); - padding: 0.25rem 0.5rem; - font-size: 0.875rem; - line-height: 1.5; - border-radius: 0.2rem; -} - -.form-control-lg { - height: calc(1.5em + 1rem + 2px); - padding: 0.5rem 1rem; - font-size: 1.25rem; - line-height: 1.5; - border-radius: 0.3rem; -} - -select.form-control[size], select.form-control[multiple] { - height: auto; -} - -textarea.form-control { - height: auto; -} - -.form-group { - margin-bottom: 1rem; -} - -.form-text { - display: block; - margin-top: 0.25rem; -} - -.form-row { - display: -webkit-box; - display: -ms-flexbox; - display: flex; - -ms-flex-wrap: wrap; - flex-wrap: wrap; - margin-right: -5px; - margin-left: -5px; -} -.form-row > .col, -.form-row > [class*="col-"] { - padding-right: 5px; - padding-left: 5px; -} - -.form-check { - position: relative; - display: block; - padding-left: 1.25rem; -} - -.form-check-input { - position: absolute; - margin-top: 0.3rem; - margin-left: -1.25rem; -} -.form-check-input[disabled] ~ .form-check-label, .form-check-input:disabled ~ .form-check-label { - color: #6c757d; -} - -.form-check-label { - margin-bottom: 0; -} - -.form-check-inline { - display: -webkit-inline-box; - display: -ms-inline-flexbox; - display: inline-flex; - -webkit-box-align: center; - -ms-flex-align: center; - align-items: center; - padding-left: 0; - margin-right: 0.75rem; -} -.form-check-inline .form-check-input { - position: static; - margin-top: 0; - margin-right: 0.3125rem; - margin-left: 0; -} - -.valid-feedback { - display: none; - width: 100%; - margin-top: 0.25rem; - font-size: 80%; - color: #28a745; -} - -.valid-tooltip { - position: absolute; - top: 100%; - left: 0; - z-index: 5; - display: none; - max-width: 100%; - 
padding: 0.25rem 0.5rem; - margin-top: .1rem; - font-size: 0.875rem; - line-height: 1.5; - color: #fff; - background-color: rgba(40, 167, 69, 0.9); - border-radius: 0.25rem; -} -.form-row > .col > .valid-tooltip, .form-row > [class*="col-"] > .valid-tooltip { - left: 5px; -} - -.was-validated :valid ~ .valid-feedback, -.was-validated :valid ~ .valid-tooltip, -.is-valid ~ .valid-feedback, -.is-valid ~ .valid-tooltip { - display: block; -} - -.was-validated .form-control:valid, .form-control.is-valid { - border-color: #28a745; - padding-right: calc(1.5em + 0.75rem) !important; - background-image: url("data:image/svg+xml,%3csvg xmlns='http://www.w3.org/2000/svg' width='8' height='8' viewBox='0 0 8 8'%3e%3cpath fill='%2328a745' d='M2.3 6.73L.6 4.53c-.4-1.04.46-1.4 1.1-.8l1.1 1.4 3.4-3.8c.6-.63 1.6-.27 1.2.7l-4 4.6c-.43.5-.8.4-1.1.1z'/%3e%3c/svg%3e"); - background-repeat: no-repeat; - background-position: right calc(0.375em + 0.1875rem) center; - background-size: calc(0.75em + 0.375rem) calc(0.75em + 0.375rem); -} -.was-validated .form-control:valid:focus, .form-control.is-valid:focus { - border-color: #28a745; - -webkit-box-shadow: 0 0 0 0.2rem rgba(40, 167, 69, 0.25); - box-shadow: 0 0 0 0.2rem rgba(40, 167, 69, 0.25); -} - -.was-validated select.form-control:valid, select.form-control.is-valid { - padding-right: 3rem !important; - background-position: right 1.5rem center; -} - -.was-validated textarea.form-control:valid, textarea.form-control.is-valid { - padding-right: calc(1.5em + 0.75rem); - background-position: top calc(0.375em + 0.1875rem) right calc(0.375em + 0.1875rem); -} - -.was-validated .custom-select:valid, .custom-select.is-valid { - border-color: #28a745; - padding-right: calc(0.75em + 2.3125rem) !important; - background: url("data:image/svg+xml,%3csvg xmlns='http://www.w3.org/2000/svg' width='4' height='5' viewBox='0 0 4 5'%3e%3cpath fill='%23343a40' d='M2 0L0 2h4zm0 5L0 3h4z'/%3e%3c/svg%3e") right 0.75rem center/8px 10px no-repeat, #fff 
url("data:image/svg+xml,%3csvg xmlns='http://www.w3.org/2000/svg' width='8' height='8' viewBox='0 0 8 8'%3e%3cpath fill='%2328a745' d='M2.3 6.73L.6 4.53c-.4-1.04.46-1.4 1.1-.8l1.1 1.4 3.4-3.8c.6-.63 1.6-.27 1.2.7l-4 4.6c-.43.5-.8.4-1.1.1z'/%3e%3c/svg%3e") center right 1.75rem/calc(0.75em + 0.375rem) calc(0.75em + 0.375rem) no-repeat; -} -.was-validated .custom-select:valid:focus, .custom-select.is-valid:focus { - border-color: #28a745; - -webkit-box-shadow: 0 0 0 0.2rem rgba(40, 167, 69, 0.25); - box-shadow: 0 0 0 0.2rem rgba(40, 167, 69, 0.25); -} - -.was-validated .form-check-input:valid ~ .form-check-label, .form-check-input.is-valid ~ .form-check-label { - color: #28a745; -} -.was-validated .form-check-input:valid ~ .valid-feedback, -.was-validated .form-check-input:valid ~ .valid-tooltip, .form-check-input.is-valid ~ .valid-feedback, -.form-check-input.is-valid ~ .valid-tooltip { - display: block; -} - -.was-validated .custom-control-input:valid ~ .custom-control-label, .custom-control-input.is-valid ~ .custom-control-label { - color: #28a745; -} -.was-validated .custom-control-input:valid ~ .custom-control-label::before, .custom-control-input.is-valid ~ .custom-control-label::before { - border-color: #28a745; -} -.was-validated .custom-control-input:valid:checked ~ .custom-control-label::before, .custom-control-input.is-valid:checked ~ .custom-control-label::before { - border-color: #34ce57; - background-color: #34ce57; -} -.was-validated .custom-control-input:valid:focus ~ .custom-control-label::before, .custom-control-input.is-valid:focus ~ .custom-control-label::before { - -webkit-box-shadow: 0 0 0 0.2rem rgba(40, 167, 69, 0.25); - box-shadow: 0 0 0 0.2rem rgba(40, 167, 69, 0.25); -} -.was-validated .custom-control-input:valid:focus:not(:checked) ~ .custom-control-label::before, .custom-control-input.is-valid:focus:not(:checked) ~ .custom-control-label::before { - border-color: #28a745; -} - -.was-validated .custom-file-input:valid ~ .custom-file-label, 
.custom-file-input.is-valid ~ .custom-file-label { - border-color: #28a745; -} -.was-validated .custom-file-input:valid:focus ~ .custom-file-label, .custom-file-input.is-valid:focus ~ .custom-file-label { - border-color: #28a745; - -webkit-box-shadow: 0 0 0 0.2rem rgba(40, 167, 69, 0.25); - box-shadow: 0 0 0 0.2rem rgba(40, 167, 69, 0.25); -} - -.invalid-feedback { - display: none; - width: 100%; - margin-top: 0.25rem; - font-size: 80%; - color: #dc3545; -} - -.invalid-tooltip { - position: absolute; - top: 100%; - left: 0; - z-index: 5; - display: none; - max-width: 100%; - padding: 0.25rem 0.5rem; - margin-top: .1rem; - font-size: 0.875rem; - line-height: 1.5; - color: #fff; - background-color: rgba(220, 53, 69, 0.9); - border-radius: 0.25rem; -} -.form-row > .col > .invalid-tooltip, .form-row > [class*="col-"] > .invalid-tooltip { - left: 5px; -} - -.was-validated :invalid ~ .invalid-feedback, -.was-validated :invalid ~ .invalid-tooltip, -.is-invalid ~ .invalid-feedback, -.is-invalid ~ .invalid-tooltip { - display: block; -} - -.was-validated .form-control:invalid, .form-control.is-invalid { - border-color: #dc3545; - padding-right: calc(1.5em + 0.75rem) !important; - background-image: url("data:image/svg+xml,%3csvg xmlns='http://www.w3.org/2000/svg' width='12' height='12' fill='none' stroke='%23dc3545' viewBox='0 0 12 12'%3e%3ccircle cx='6' cy='6' r='4.5'/%3e%3cpath stroke-linejoin='round' d='M5.8 3.6h.4L6 6.5z'/%3e%3ccircle cx='6' cy='8.2' r='.6' fill='%23dc3545' stroke='none'/%3e%3c/svg%3e"); - background-repeat: no-repeat; - background-position: right calc(0.375em + 0.1875rem) center; - background-size: calc(0.75em + 0.375rem) calc(0.75em + 0.375rem); -} -.was-validated .form-control:invalid:focus, .form-control.is-invalid:focus { - border-color: #dc3545; - -webkit-box-shadow: 0 0 0 0.2rem rgba(220, 53, 69, 0.25); - box-shadow: 0 0 0 0.2rem rgba(220, 53, 69, 0.25); -} - -.was-validated select.form-control:invalid, select.form-control.is-invalid { - 
padding-right: 3rem !important; - background-position: right 1.5rem center; -} - -.was-validated textarea.form-control:invalid, textarea.form-control.is-invalid { - padding-right: calc(1.5em + 0.75rem); - background-position: top calc(0.375em + 0.1875rem) right calc(0.375em + 0.1875rem); -} - -.was-validated .custom-select:invalid, .custom-select.is-invalid { - border-color: #dc3545; - padding-right: calc(0.75em + 2.3125rem) !important; - background: url("data:image/svg+xml,%3csvg xmlns='http://www.w3.org/2000/svg' width='4' height='5' viewBox='0 0 4 5'%3e%3cpath fill='%23343a40' d='M2 0L0 2h4zm0 5L0 3h4z'/%3e%3c/svg%3e") right 0.75rem center/8px 10px no-repeat, #fff url("data:image/svg+xml,%3csvg xmlns='http://www.w3.org/2000/svg' width='12' height='12' fill='none' stroke='%23dc3545' viewBox='0 0 12 12'%3e%3ccircle cx='6' cy='6' r='4.5'/%3e%3cpath stroke-linejoin='round' d='M5.8 3.6h.4L6 6.5z'/%3e%3ccircle cx='6' cy='8.2' r='.6' fill='%23dc3545' stroke='none'/%3e%3c/svg%3e") center right 1.75rem/calc(0.75em + 0.375rem) calc(0.75em + 0.375rem) no-repeat; -} -.was-validated .custom-select:invalid:focus, .custom-select.is-invalid:focus { - border-color: #dc3545; - -webkit-box-shadow: 0 0 0 0.2rem rgba(220, 53, 69, 0.25); - box-shadow: 0 0 0 0.2rem rgba(220, 53, 69, 0.25); -} - -.was-validated .form-check-input:invalid ~ .form-check-label, .form-check-input.is-invalid ~ .form-check-label { - color: #dc3545; -} -.was-validated .form-check-input:invalid ~ .invalid-feedback, -.was-validated .form-check-input:invalid ~ .invalid-tooltip, .form-check-input.is-invalid ~ .invalid-feedback, -.form-check-input.is-invalid ~ .invalid-tooltip { - display: block; -} - -.was-validated .custom-control-input:invalid ~ .custom-control-label, .custom-control-input.is-invalid ~ .custom-control-label { - color: #dc3545; -} -.was-validated .custom-control-input:invalid ~ .custom-control-label::before, .custom-control-input.is-invalid ~ .custom-control-label::before { - border-color: 
#dc3545; -} -.was-validated .custom-control-input:invalid:checked ~ .custom-control-label::before, .custom-control-input.is-invalid:checked ~ .custom-control-label::before { - border-color: #e4606d; - background-color: #e4606d; -} -.was-validated .custom-control-input:invalid:focus ~ .custom-control-label::before, .custom-control-input.is-invalid:focus ~ .custom-control-label::before { - -webkit-box-shadow: 0 0 0 0.2rem rgba(220, 53, 69, 0.25); - box-shadow: 0 0 0 0.2rem rgba(220, 53, 69, 0.25); -} -.was-validated .custom-control-input:invalid:focus:not(:checked) ~ .custom-control-label::before, .custom-control-input.is-invalid:focus:not(:checked) ~ .custom-control-label::before { - border-color: #dc3545; -} - -.was-validated .custom-file-input:invalid ~ .custom-file-label, .custom-file-input.is-invalid ~ .custom-file-label { - border-color: #dc3545; -} -.was-validated .custom-file-input:invalid:focus ~ .custom-file-label, .custom-file-input.is-invalid:focus ~ .custom-file-label { - border-color: #dc3545; - -webkit-box-shadow: 0 0 0 0.2rem rgba(220, 53, 69, 0.25); - box-shadow: 0 0 0 0.2rem rgba(220, 53, 69, 0.25); -} - -.form-inline { - display: -webkit-box; - display: -ms-flexbox; - display: flex; - -webkit-box-orient: horizontal; - -webkit-box-direction: normal; - -ms-flex-flow: row wrap; - flex-flow: row wrap; - -webkit-box-align: center; - -ms-flex-align: center; - align-items: center; -} -.form-inline .form-check { - width: 100%; -} -@media (min-width: 576px) { - .form-inline label { - display: -webkit-box; - display: -ms-flexbox; - display: flex; - -webkit-box-align: center; - -ms-flex-align: center; - align-items: center; - -webkit-box-pack: center; - -ms-flex-pack: center; - justify-content: center; - margin-bottom: 0; - } - .form-inline .form-group { - display: -webkit-box; - display: -ms-flexbox; - display: flex; - -webkit-box-flex: 0; - -ms-flex: 0 0 auto; - flex: 0 0 auto; - -webkit-box-orient: horizontal; - -webkit-box-direction: normal; - 
-ms-flex-flow: row wrap; - flex-flow: row wrap; - -webkit-box-align: center; - -ms-flex-align: center; - align-items: center; - margin-bottom: 0; - } - .form-inline .form-control { - display: inline-block; - width: auto; - vertical-align: middle; - } - .form-inline .form-control-plaintext { - display: inline-block; - } - .form-inline .input-group, - .form-inline .custom-select { - width: auto; - } - .form-inline .form-check { - display: -webkit-box; - display: -ms-flexbox; - display: flex; - -webkit-box-align: center; - -ms-flex-align: center; - align-items: center; - -webkit-box-pack: center; - -ms-flex-pack: center; - justify-content: center; - width: auto; - padding-left: 0; - } - .form-inline .form-check-input { - position: relative; - -ms-flex-negative: 0; - flex-shrink: 0; - margin-top: 0; - margin-right: 0.25rem; - margin-left: 0; - } - .form-inline .custom-control { - -webkit-box-align: center; - -ms-flex-align: center; - align-items: center; - -webkit-box-pack: center; - -ms-flex-pack: center; - justify-content: center; - } - .form-inline .custom-control-label { - margin-bottom: 0; - } -} - -.btn { - display: inline-block; - font-weight: 400; - color: #212529; - text-align: center; - vertical-align: middle; - -webkit-user-select: none; - -moz-user-select: none; - -ms-user-select: none; - user-select: none; - background-color: transparent; - border: 1px solid transparent; - padding: 0.375rem 0.75rem; - font-size: 1rem; - line-height: 1.5; - border-radius: 0.25rem; - -webkit-transition: color 0.15s ease-in-out, background-color 0.15s ease-in-out, border-color 0.15s ease-in-out, -webkit-box-shadow 0.15s ease-in-out; - transition: color 0.15s ease-in-out, background-color 0.15s ease-in-out, border-color 0.15s ease-in-out, -webkit-box-shadow 0.15s ease-in-out; - transition: color 0.15s ease-in-out, background-color 0.15s ease-in-out, border-color 0.15s ease-in-out, box-shadow 0.15s ease-in-out; - transition: color 0.15s ease-in-out, background-color 0.15s 
ease-in-out, border-color 0.15s ease-in-out, box-shadow 0.15s ease-in-out, -webkit-box-shadow 0.15s ease-in-out; -} -@media (prefers-reduced-motion: reduce) { - .btn { - -webkit-transition: none; - transition: none; - } -} -.btn:hover { - color: #212529; - text-decoration: none; -} -.btn:focus, .btn.focus { - outline: 0; - -webkit-box-shadow: 0 0 0 0.2rem rgba(0, 123, 255, 0.25); - box-shadow: 0 0 0 0.2rem rgba(0, 123, 255, 0.25); -} -.btn.disabled, .btn:disabled { - opacity: 0.65; -} -.btn:not(:disabled):not(.disabled) { - cursor: pointer; -} - -a.btn.disabled, -fieldset:disabled a.btn { - pointer-events: none; -} - -.btn-primary { - color: #fff; - background-color: #007bff; - border-color: #007bff; -} -.btn-primary:hover { - color: #fff; - background-color: #0069d9; - border-color: #0062cc; -} -.btn-primary:focus, .btn-primary.focus { - color: #fff; - background-color: #0069d9; - border-color: #0062cc; - -webkit-box-shadow: 0 0 0 0.2rem rgba(38, 143, 255, 0.5); - box-shadow: 0 0 0 0.2rem rgba(38, 143, 255, 0.5); -} -.btn-primary.disabled, .btn-primary:disabled { - color: #fff; - background-color: #007bff; - border-color: #007bff; -} -.btn-primary:not(:disabled):not(.disabled):active, .btn-primary:not(:disabled):not(.disabled).active, .show > .btn-primary.dropdown-toggle { - color: #fff; - background-color: #0062cc; - border-color: #005cbf; -} -.btn-primary:not(:disabled):not(.disabled):active:focus, .btn-primary:not(:disabled):not(.disabled).active:focus, .show > .btn-primary.dropdown-toggle:focus { - -webkit-box-shadow: 0 0 0 0.2rem rgba(38, 143, 255, 0.5); - box-shadow: 0 0 0 0.2rem rgba(38, 143, 255, 0.5); -} - -.btn-secondary { - color: #fff; - background-color: #6c757d; - border-color: #6c757d; -} -.btn-secondary:hover { - color: #fff; - background-color: #5a6268; - border-color: #545b62; -} -.btn-secondary:focus, .btn-secondary.focus { - color: #fff; - background-color: #5a6268; - border-color: #545b62; - -webkit-box-shadow: 0 0 0 0.2rem rgba(130, 138, 145, 
0.5); - box-shadow: 0 0 0 0.2rem rgba(130, 138, 145, 0.5); -} -.btn-secondary.disabled, .btn-secondary:disabled { - color: #fff; - background-color: #6c757d; - border-color: #6c757d; -} -.btn-secondary:not(:disabled):not(.disabled):active, .btn-secondary:not(:disabled):not(.disabled).active, .show > .btn-secondary.dropdown-toggle { - color: #fff; - background-color: #545b62; - border-color: #4e555b; -} -.btn-secondary:not(:disabled):not(.disabled):active:focus, .btn-secondary:not(:disabled):not(.disabled).active:focus, .show > .btn-secondary.dropdown-toggle:focus { - -webkit-box-shadow: 0 0 0 0.2rem rgba(130, 138, 145, 0.5); - box-shadow: 0 0 0 0.2rem rgba(130, 138, 145, 0.5); -} - -.btn-success { - color: #fff; - background-color: #28a745; - border-color: #28a745; -} -.btn-success:hover { - color: #fff; - background-color: #218838; - border-color: #1e7e34; -} -.btn-success:focus, .btn-success.focus { - color: #fff; - background-color: #218838; - border-color: #1e7e34; - -webkit-box-shadow: 0 0 0 0.2rem rgba(72, 180, 97, 0.5); - box-shadow: 0 0 0 0.2rem rgba(72, 180, 97, 0.5); -} -.btn-success.disabled, .btn-success:disabled { - color: #fff; - background-color: #28a745; - border-color: #28a745; -} -.btn-success:not(:disabled):not(.disabled):active, .btn-success:not(:disabled):not(.disabled).active, .show > .btn-success.dropdown-toggle { - color: #fff; - background-color: #1e7e34; - border-color: #1c7430; -} -.btn-success:not(:disabled):not(.disabled):active:focus, .btn-success:not(:disabled):not(.disabled).active:focus, .show > .btn-success.dropdown-toggle:focus { - -webkit-box-shadow: 0 0 0 0.2rem rgba(72, 180, 97, 0.5); - box-shadow: 0 0 0 0.2rem rgba(72, 180, 97, 0.5); -} - -.btn-info { - color: #fff; - background-color: #17a2b8; - border-color: #17a2b8; -} -.btn-info:hover { - color: #fff; - background-color: #138496; - border-color: #117a8b; -} -.btn-info:focus, .btn-info.focus { - color: #fff; - background-color: #138496; - border-color: #117a8b; - 
-webkit-box-shadow: 0 0 0 0.2rem rgba(58, 176, 195, 0.5); - box-shadow: 0 0 0 0.2rem rgba(58, 176, 195, 0.5); -} -.btn-info.disabled, .btn-info:disabled { - color: #fff; - background-color: #17a2b8; - border-color: #17a2b8; -} -.btn-info:not(:disabled):not(.disabled):active, .btn-info:not(:disabled):not(.disabled).active, .show > .btn-info.dropdown-toggle { - color: #fff; - background-color: #117a8b; - border-color: #10707f; -} -.btn-info:not(:disabled):not(.disabled):active:focus, .btn-info:not(:disabled):not(.disabled).active:focus, .show > .btn-info.dropdown-toggle:focus { - -webkit-box-shadow: 0 0 0 0.2rem rgba(58, 176, 195, 0.5); - box-shadow: 0 0 0 0.2rem rgba(58, 176, 195, 0.5); -} - -.btn-warning { - color: #212529; - background-color: #ffc107; - border-color: #ffc107; -} -.btn-warning:hover { - color: #212529; - background-color: #e0a800; - border-color: #d39e00; -} -.btn-warning:focus, .btn-warning.focus { - color: #212529; - background-color: #e0a800; - border-color: #d39e00; - -webkit-box-shadow: 0 0 0 0.2rem rgba(222, 170, 12, 0.5); - box-shadow: 0 0 0 0.2rem rgba(222, 170, 12, 0.5); -} -.btn-warning.disabled, .btn-warning:disabled { - color: #212529; - background-color: #ffc107; - border-color: #ffc107; -} -.btn-warning:not(:disabled):not(.disabled):active, .btn-warning:not(:disabled):not(.disabled).active, .show > .btn-warning.dropdown-toggle { - color: #212529; - background-color: #d39e00; - border-color: #c69500; -} -.btn-warning:not(:disabled):not(.disabled):active:focus, .btn-warning:not(:disabled):not(.disabled).active:focus, .show > .btn-warning.dropdown-toggle:focus { - -webkit-box-shadow: 0 0 0 0.2rem rgba(222, 170, 12, 0.5); - box-shadow: 0 0 0 0.2rem rgba(222, 170, 12, 0.5); -} - -.btn-danger { - color: #fff; - background-color: #dc3545; - border-color: #dc3545; -} -.btn-danger:hover { - color: #fff; - background-color: #c82333; - border-color: #bd2130; -} -.btn-danger:focus, .btn-danger.focus { - color: #fff; - background-color: #c82333; - 
border-color: #bd2130; - -webkit-box-shadow: 0 0 0 0.2rem rgba(225, 83, 97, 0.5); - box-shadow: 0 0 0 0.2rem rgba(225, 83, 97, 0.5); -} -.btn-danger.disabled, .btn-danger:disabled { - color: #fff; - background-color: #dc3545; - border-color: #dc3545; -} -.btn-danger:not(:disabled):not(.disabled):active, .btn-danger:not(:disabled):not(.disabled).active, .show > .btn-danger.dropdown-toggle { - color: #fff; - background-color: #bd2130; - border-color: #b21f2d; -} -.btn-danger:not(:disabled):not(.disabled):active:focus, .btn-danger:not(:disabled):not(.disabled).active:focus, .show > .btn-danger.dropdown-toggle:focus { - -webkit-box-shadow: 0 0 0 0.2rem rgba(225, 83, 97, 0.5); - box-shadow: 0 0 0 0.2rem rgba(225, 83, 97, 0.5); -} - -.btn-light { - color: #212529; - background-color: #f8f9fa; - border-color: #f8f9fa; -} -.btn-light:hover { - color: #212529; - background-color: #e2e6ea; - border-color: #dae0e5; -} -.btn-light:focus, .btn-light.focus { - color: #212529; - background-color: #e2e6ea; - border-color: #dae0e5; - -webkit-box-shadow: 0 0 0 0.2rem rgba(216, 217, 219, 0.5); - box-shadow: 0 0 0 0.2rem rgba(216, 217, 219, 0.5); -} -.btn-light.disabled, .btn-light:disabled { - color: #212529; - background-color: #f8f9fa; - border-color: #f8f9fa; -} -.btn-light:not(:disabled):not(.disabled):active, .btn-light:not(:disabled):not(.disabled).active, .show > .btn-light.dropdown-toggle { - color: #212529; - background-color: #dae0e5; - border-color: #d3d9df; -} -.btn-light:not(:disabled):not(.disabled):active:focus, .btn-light:not(:disabled):not(.disabled).active:focus, .show > .btn-light.dropdown-toggle:focus { - -webkit-box-shadow: 0 0 0 0.2rem rgba(216, 217, 219, 0.5); - box-shadow: 0 0 0 0.2rem rgba(216, 217, 219, 0.5); -} - -.btn-dark { - color: #fff; - background-color: #343a40; - border-color: #343a40; -} -.btn-dark:hover { - color: #fff; - background-color: #23272b; - border-color: #1d2124; -} -.btn-dark:focus, .btn-dark.focus { - color: #fff; - background-color: 
#23272b; - border-color: #1d2124; - -webkit-box-shadow: 0 0 0 0.2rem rgba(82, 88, 93, 0.5); - box-shadow: 0 0 0 0.2rem rgba(82, 88, 93, 0.5); -} -.btn-dark.disabled, .btn-dark:disabled { - color: #fff; - background-color: #343a40; - border-color: #343a40; -} -.btn-dark:not(:disabled):not(.disabled):active, .btn-dark:not(:disabled):not(.disabled).active, .show > .btn-dark.dropdown-toggle { - color: #fff; - background-color: #1d2124; - border-color: #171a1d; -} -.btn-dark:not(:disabled):not(.disabled):active:focus, .btn-dark:not(:disabled):not(.disabled).active:focus, .show > .btn-dark.dropdown-toggle:focus { - -webkit-box-shadow: 0 0 0 0.2rem rgba(82, 88, 93, 0.5); - box-shadow: 0 0 0 0.2rem rgba(82, 88, 93, 0.5); -} - -.btn-outline-primary { - color: #007bff; - border-color: #007bff; -} -.btn-outline-primary:hover { - color: #fff; - background-color: #007bff; - border-color: #007bff; -} -.btn-outline-primary:focus, .btn-outline-primary.focus { - -webkit-box-shadow: 0 0 0 0.2rem rgba(0, 123, 255, 0.5); - box-shadow: 0 0 0 0.2rem rgba(0, 123, 255, 0.5); -} -.btn-outline-primary.disabled, .btn-outline-primary:disabled { - color: #007bff; - background-color: transparent; -} -.btn-outline-primary:not(:disabled):not(.disabled):active, .btn-outline-primary:not(:disabled):not(.disabled).active, .show > .btn-outline-primary.dropdown-toggle { - color: #fff; - background-color: #007bff; - border-color: #007bff; -} -.btn-outline-primary:not(:disabled):not(.disabled):active:focus, .btn-outline-primary:not(:disabled):not(.disabled).active:focus, .show > .btn-outline-primary.dropdown-toggle:focus { - -webkit-box-shadow: 0 0 0 0.2rem rgba(0, 123, 255, 0.5); - box-shadow: 0 0 0 0.2rem rgba(0, 123, 255, 0.5); -} - -.btn-outline-secondary { - color: #6c757d; - border-color: #6c757d; -} -.btn-outline-secondary:hover { - color: #fff; - background-color: #6c757d; - border-color: #6c757d; -} -.btn-outline-secondary:focus, .btn-outline-secondary.focus { - -webkit-box-shadow: 0 0 0 0.2rem 
rgba(108, 117, 125, 0.5); - box-shadow: 0 0 0 0.2rem rgba(108, 117, 125, 0.5); -} -.btn-outline-secondary.disabled, .btn-outline-secondary:disabled { - color: #6c757d; - background-color: transparent; -} -.btn-outline-secondary:not(:disabled):not(.disabled):active, .btn-outline-secondary:not(:disabled):not(.disabled).active, .show > .btn-outline-secondary.dropdown-toggle { - color: #fff; - background-color: #6c757d; - border-color: #6c757d; -} -.btn-outline-secondary:not(:disabled):not(.disabled):active:focus, .btn-outline-secondary:not(:disabled):not(.disabled).active:focus, .show > .btn-outline-secondary.dropdown-toggle:focus { - -webkit-box-shadow: 0 0 0 0.2rem rgba(108, 117, 125, 0.5); - box-shadow: 0 0 0 0.2rem rgba(108, 117, 125, 0.5); -} - -.btn-outline-success { - color: #28a745; - border-color: #28a745; -} -.btn-outline-success:hover { - color: #fff; - background-color: #28a745; - border-color: #28a745; -} -.btn-outline-success:focus, .btn-outline-success.focus { - -webkit-box-shadow: 0 0 0 0.2rem rgba(40, 167, 69, 0.5); - box-shadow: 0 0 0 0.2rem rgba(40, 167, 69, 0.5); -} -.btn-outline-success.disabled, .btn-outline-success:disabled { - color: #28a745; - background-color: transparent; -} -.btn-outline-success:not(:disabled):not(.disabled):active, .btn-outline-success:not(:disabled):not(.disabled).active, .show > .btn-outline-success.dropdown-toggle { - color: #fff; - background-color: #28a745; - border-color: #28a745; -} -.btn-outline-success:not(:disabled):not(.disabled):active:focus, .btn-outline-success:not(:disabled):not(.disabled).active:focus, .show > .btn-outline-success.dropdown-toggle:focus { - -webkit-box-shadow: 0 0 0 0.2rem rgba(40, 167, 69, 0.5); - box-shadow: 0 0 0 0.2rem rgba(40, 167, 69, 0.5); -} - -.btn-outline-info { - color: #17a2b8; - border-color: #17a2b8; -} -.btn-outline-info:hover { - color: #fff; - background-color: #17a2b8; - border-color: #17a2b8; -} -.btn-outline-info:focus, .btn-outline-info.focus { - -webkit-box-shadow: 0 0 
0 0.2rem rgba(23, 162, 184, 0.5); - box-shadow: 0 0 0 0.2rem rgba(23, 162, 184, 0.5); -} -.btn-outline-info.disabled, .btn-outline-info:disabled { - color: #17a2b8; - background-color: transparent; -} -.btn-outline-info:not(:disabled):not(.disabled):active, .btn-outline-info:not(:disabled):not(.disabled).active, .show > .btn-outline-info.dropdown-toggle { - color: #fff; - background-color: #17a2b8; - border-color: #17a2b8; -} -.btn-outline-info:not(:disabled):not(.disabled):active:focus, .btn-outline-info:not(:disabled):not(.disabled).active:focus, .show > .btn-outline-info.dropdown-toggle:focus { - -webkit-box-shadow: 0 0 0 0.2rem rgba(23, 162, 184, 0.5); - box-shadow: 0 0 0 0.2rem rgba(23, 162, 184, 0.5); -} - -.btn-outline-warning { - color: #ffc107; - border-color: #ffc107; -} -.btn-outline-warning:hover { - color: #212529; - background-color: #ffc107; - border-color: #ffc107; -} -.btn-outline-warning:focus, .btn-outline-warning.focus { - -webkit-box-shadow: 0 0 0 0.2rem rgba(255, 193, 7, 0.5); - box-shadow: 0 0 0 0.2rem rgba(255, 193, 7, 0.5); -} -.btn-outline-warning.disabled, .btn-outline-warning:disabled { - color: #ffc107; - background-color: transparent; -} -.btn-outline-warning:not(:disabled):not(.disabled):active, .btn-outline-warning:not(:disabled):not(.disabled).active, .show > .btn-outline-warning.dropdown-toggle { - color: #212529; - background-color: #ffc107; - border-color: #ffc107; -} -.btn-outline-warning:not(:disabled):not(.disabled):active:focus, .btn-outline-warning:not(:disabled):not(.disabled).active:focus, .show > .btn-outline-warning.dropdown-toggle:focus { - -webkit-box-shadow: 0 0 0 0.2rem rgba(255, 193, 7, 0.5); - box-shadow: 0 0 0 0.2rem rgba(255, 193, 7, 0.5); -} - -.btn-outline-danger { - color: #dc3545; - border-color: #dc3545; -} -.btn-outline-danger:hover { - color: #fff; - background-color: #dc3545; - border-color: #dc3545; -} -.btn-outline-danger:focus, .btn-outline-danger.focus { - -webkit-box-shadow: 0 0 0 0.2rem rgba(220, 
53, 69, 0.5); - box-shadow: 0 0 0 0.2rem rgba(220, 53, 69, 0.5); -} -.btn-outline-danger.disabled, .btn-outline-danger:disabled { - color: #dc3545; - background-color: transparent; -} -.btn-outline-danger:not(:disabled):not(.disabled):active, .btn-outline-danger:not(:disabled):not(.disabled).active, .show > .btn-outline-danger.dropdown-toggle { - color: #fff; - background-color: #dc3545; - border-color: #dc3545; -} -.btn-outline-danger:not(:disabled):not(.disabled):active:focus, .btn-outline-danger:not(:disabled):not(.disabled).active:focus, .show > .btn-outline-danger.dropdown-toggle:focus { - -webkit-box-shadow: 0 0 0 0.2rem rgba(220, 53, 69, 0.5); - box-shadow: 0 0 0 0.2rem rgba(220, 53, 69, 0.5); -} - -.btn-outline-light { - color: #f8f9fa; - border-color: #f8f9fa; -} -.btn-outline-light:hover { - color: #212529; - background-color: #f8f9fa; - border-color: #f8f9fa; -} -.btn-outline-light:focus, .btn-outline-light.focus { - -webkit-box-shadow: 0 0 0 0.2rem rgba(248, 249, 250, 0.5); - box-shadow: 0 0 0 0.2rem rgba(248, 249, 250, 0.5); -} -.btn-outline-light.disabled, .btn-outline-light:disabled { - color: #f8f9fa; - background-color: transparent; -} -.btn-outline-light:not(:disabled):not(.disabled):active, .btn-outline-light:not(:disabled):not(.disabled).active, .show > .btn-outline-light.dropdown-toggle { - color: #212529; - background-color: #f8f9fa; - border-color: #f8f9fa; -} -.btn-outline-light:not(:disabled):not(.disabled):active:focus, .btn-outline-light:not(:disabled):not(.disabled).active:focus, .show > .btn-outline-light.dropdown-toggle:focus { - -webkit-box-shadow: 0 0 0 0.2rem rgba(248, 249, 250, 0.5); - box-shadow: 0 0 0 0.2rem rgba(248, 249, 250, 0.5); -} - -.btn-outline-dark { - color: #343a40; - border-color: #343a40; -} -.btn-outline-dark:hover { - color: #fff; - background-color: #343a40; - border-color: #343a40; -} -.btn-outline-dark:focus, .btn-outline-dark.focus { - -webkit-box-shadow: 0 0 0 0.2rem rgba(52, 58, 64, 0.5); - box-shadow: 0 0 0 
0.2rem rgba(52, 58, 64, 0.5); -} -.btn-outline-dark.disabled, .btn-outline-dark:disabled { - color: #343a40; - background-color: transparent; -} -.btn-outline-dark:not(:disabled):not(.disabled):active, .btn-outline-dark:not(:disabled):not(.disabled).active, .show > .btn-outline-dark.dropdown-toggle { - color: #fff; - background-color: #343a40; - border-color: #343a40; -} -.btn-outline-dark:not(:disabled):not(.disabled):active:focus, .btn-outline-dark:not(:disabled):not(.disabled).active:focus, .show > .btn-outline-dark.dropdown-toggle:focus { - -webkit-box-shadow: 0 0 0 0.2rem rgba(52, 58, 64, 0.5); - box-shadow: 0 0 0 0.2rem rgba(52, 58, 64, 0.5); -} - -.btn-link { - font-weight: 400; - color: #007bff; - text-decoration: none; -} -.btn-link:hover { - color: #0056b3; - text-decoration: underline; -} -.btn-link:focus, .btn-link.focus { - text-decoration: underline; -} -.btn-link:disabled, .btn-link.disabled { - color: #6c757d; - pointer-events: none; -} - -.btn-lg, .btn-group-lg > .btn { - padding: 0.5rem 1rem; - font-size: 1.25rem; - line-height: 1.5; - border-radius: 0.3rem; -} - -.btn-sm, .btn-group-sm > .btn { - padding: 0.25rem 0.5rem; - font-size: 0.875rem; - line-height: 1.5; - border-radius: 0.2rem; -} - -.btn-block { - display: block; - width: 100%; -} -.btn-block + .btn-block { - margin-top: 0.5rem; -} - -input[type="submit"].btn-block, -input[type="reset"].btn-block, -input[type="button"].btn-block { - width: 100%; -} - -.fade { - -webkit-transition: opacity 0.15s linear; - transition: opacity 0.15s linear; -} -@media (prefers-reduced-motion: reduce) { - .fade { - -webkit-transition: none; - transition: none; - } -} -.fade:not(.show) { - opacity: 0; -} - -.collapse:not(.show) { - display: none; -} - -.collapsing { - position: relative; - height: 0; - overflow: hidden; - -webkit-transition: height 0.35s ease; - transition: height 0.35s ease; -} -@media (prefers-reduced-motion: reduce) { - .collapsing { - -webkit-transition: none; - transition: none; - } -} 
- -.dropup, -.dropright, -.dropdown, -.dropleft { - position: relative; -} - -.dropdown-toggle { - white-space: nowrap; -} -.dropdown-toggle::after { - display: inline-block; - margin-left: 0.255em; - vertical-align: 0.255em; - content: ""; - border-top: 0.3em solid; - border-right: 0.3em solid transparent; - border-bottom: 0; - border-left: 0.3em solid transparent; -} -.dropdown-toggle:empty::after { - margin-left: 0; -} - -.dropdown-menu { - position: absolute; - top: 100%; - left: 0; - z-index: 1000; - display: none; - float: left; - min-width: 10rem; - padding: 0.5rem 0; - margin: 0.125rem 0 0; - font-size: 1rem; - color: #212529; - text-align: left; - list-style: none; - background-color: #fff; - background-clip: padding-box; - border: 1px solid rgba(0, 0, 0, 0.15); - border-radius: 0.25rem; -} - -.dropdown-menu-left { - right: auto; - left: 0; -} - -.dropdown-menu-right { - right: 0; - left: auto; -} - -@media (min-width: 576px) { - .dropdown-menu-sm-left { - right: auto; - left: 0; - } - - .dropdown-menu-sm-right { - right: 0; - left: auto; - } -} -@media (min-width: 768px) { - .dropdown-menu-md-left { - right: auto; - left: 0; - } - - .dropdown-menu-md-right { - right: 0; - left: auto; - } -} -@media (min-width: 992px) { - .dropdown-menu-lg-left { - right: auto; - left: 0; - } - - .dropdown-menu-lg-right { - right: 0; - left: auto; - } -} -@media (min-width: 1200px) { - .dropdown-menu-xl-left { - right: auto; - left: 0; - } - - .dropdown-menu-xl-right { - right: 0; - left: auto; - } -} -.dropup .dropdown-menu { - top: auto; - bottom: 100%; - margin-top: 0; - margin-bottom: 0.125rem; -} -.dropup .dropdown-toggle::after { - display: inline-block; - margin-left: 0.255em; - vertical-align: 0.255em; - content: ""; - border-top: 0; - border-right: 0.3em solid transparent; - border-bottom: 0.3em solid; - border-left: 0.3em solid transparent; -} -.dropup .dropdown-toggle:empty::after { - margin-left: 0; -} - -.dropright .dropdown-menu { - top: 0; - right: auto; - 
left: 100%; - margin-top: 0; - margin-left: 0.125rem; -} -.dropright .dropdown-toggle::after { - display: inline-block; - margin-left: 0.255em; - vertical-align: 0.255em; - content: ""; - border-top: 0.3em solid transparent; - border-right: 0; - border-bottom: 0.3em solid transparent; - border-left: 0.3em solid; -} -.dropright .dropdown-toggle:empty::after { - margin-left: 0; -} -.dropright .dropdown-toggle::after { - vertical-align: 0; -} - -.dropleft .dropdown-menu { - top: 0; - right: 100%; - left: auto; - margin-top: 0; - margin-right: 0.125rem; -} -.dropleft .dropdown-toggle::after { - display: inline-block; - margin-left: 0.255em; - vertical-align: 0.255em; - content: ""; -} -.dropleft .dropdown-toggle::after { - display: none; -} -.dropleft .dropdown-toggle::before { - display: inline-block; - margin-right: 0.255em; - vertical-align: 0.255em; - content: ""; - border-top: 0.3em solid transparent; - border-right: 0.3em solid; - border-bottom: 0.3em solid transparent; -} -.dropleft .dropdown-toggle:empty::after { - margin-left: 0; -} -.dropleft .dropdown-toggle::before { - vertical-align: 0; -} - -.dropdown-menu[x-placement^="top"], .dropdown-menu[x-placement^="right"], .dropdown-menu[x-placement^="bottom"], .dropdown-menu[x-placement^="left"] { - right: auto; - bottom: auto; -} - -.dropdown-divider { - height: 0; - margin: 0.5rem 0; - overflow: hidden; - border-top: 1px solid #e9ecef; -} - -.dropdown-item { - display: block; - width: 100%; - padding: 0.25rem 1.5rem; - clear: both; - font-weight: 400; - color: #212529; - text-align: inherit; - white-space: nowrap; - background-color: transparent; - border: 0; -} -.dropdown-item:hover, .dropdown-item:focus { - color: #16181b; - text-decoration: none; - background-color: #e9ecef; -} -.dropdown-item.active, .dropdown-item:active { - color: #fff; - text-decoration: none; - background-color: #007bff; -} -.dropdown-item.disabled, .dropdown-item:disabled { - color: #adb5bd; - pointer-events: none; - background-color: 
transparent; -} - -.dropdown-menu.show { - display: block; -} - -.dropdown-header { - display: block; - padding: 0.5rem 1.5rem; - margin-bottom: 0; - font-size: 0.875rem; - color: #6c757d; - white-space: nowrap; -} - -.dropdown-item-text { - display: block; - padding: 0.25rem 1.5rem; - color: #212529; -} - -.btn-group, -.btn-group-vertical { - position: relative; - display: -webkit-inline-box; - display: -ms-inline-flexbox; - display: inline-flex; - vertical-align: middle; -} -.btn-group > .btn, -.btn-group-vertical > .btn { - position: relative; - -webkit-box-flex: 1; - -ms-flex: 1 1 auto; - flex: 1 1 auto; -} -.btn-group > .btn:hover, -.btn-group-vertical > .btn:hover { - z-index: 1; -} -.btn-group > .btn:focus, .btn-group > .btn:active, .btn-group > .btn.active, -.btn-group-vertical > .btn:focus, -.btn-group-vertical > .btn:active, -.btn-group-vertical > .btn.active { - z-index: 1; -} - -.btn-toolbar { - display: -webkit-box; - display: -ms-flexbox; - display: flex; - -ms-flex-wrap: wrap; - flex-wrap: wrap; - -webkit-box-pack: start; - -ms-flex-pack: start; - justify-content: flex-start; -} -.btn-toolbar .input-group { - width: auto; -} - -.btn-group > .btn:not(:first-child), -.btn-group > .btn-group:not(:first-child) { - margin-left: -1px; -} -.btn-group > .btn:not(:last-child):not(.dropdown-toggle), -.btn-group > .btn-group:not(:last-child) > .btn { - border-top-right-radius: 0; - border-bottom-right-radius: 0; -} -.btn-group > .btn:not(:first-child), -.btn-group > .btn-group:not(:first-child) > .btn { - border-top-left-radius: 0; - border-bottom-left-radius: 0; -} - -.dropdown-toggle-split { - padding-right: 0.5625rem; - padding-left: 0.5625rem; -} -.dropdown-toggle-split::after, .dropup .dropdown-toggle-split::after, .dropright .dropdown-toggle-split::after { - margin-left: 0; -} -.dropleft .dropdown-toggle-split::before { - margin-right: 0; -} - -.btn-sm + .dropdown-toggle-split, .btn-group-sm > .btn + .dropdown-toggle-split { - padding-right: 0.375rem; - 
padding-left: 0.375rem; -} - -.btn-lg + .dropdown-toggle-split, .btn-group-lg > .btn + .dropdown-toggle-split { - padding-right: 0.75rem; - padding-left: 0.75rem; -} - -.btn-group-vertical { - -webkit-box-orient: vertical; - -webkit-box-direction: normal; - -ms-flex-direction: column; - flex-direction: column; - -webkit-box-align: start; - -ms-flex-align: start; - align-items: flex-start; - -webkit-box-pack: center; - -ms-flex-pack: center; - justify-content: center; -} -.btn-group-vertical > .btn, -.btn-group-vertical > .btn-group { - width: 100%; -} -.btn-group-vertical > .btn:not(:first-child), -.btn-group-vertical > .btn-group:not(:first-child) { - margin-top: -1px; -} -.btn-group-vertical > .btn:not(:last-child):not(.dropdown-toggle), -.btn-group-vertical > .btn-group:not(:last-child) > .btn { - border-bottom-right-radius: 0; - border-bottom-left-radius: 0; -} -.btn-group-vertical > .btn:not(:first-child), -.btn-group-vertical > .btn-group:not(:first-child) > .btn { - border-top-left-radius: 0; - border-top-right-radius: 0; -} - -.btn-group-toggle > .btn, -.btn-group-toggle > .btn-group > .btn { - margin-bottom: 0; -} -.btn-group-toggle > .btn input[type="radio"], -.btn-group-toggle > .btn input[type="checkbox"], -.btn-group-toggle > .btn-group > .btn input[type="radio"], -.btn-group-toggle > .btn-group > .btn input[type="checkbox"] { - position: absolute; - clip: rect(0, 0, 0, 0); - pointer-events: none; -} - -.input-group { - position: relative; - display: -webkit-box; - display: -ms-flexbox; - display: flex; - -ms-flex-wrap: wrap; - flex-wrap: wrap; - -webkit-box-align: stretch; - -ms-flex-align: stretch; - align-items: stretch; - width: 100%; -} -.input-group > .form-control, -.input-group > .form-control-plaintext, -.input-group > .custom-select, -.input-group > .custom-file { - position: relative; - -webkit-box-flex: 1; - -ms-flex: 1 1 auto; - flex: 1 1 auto; - width: 1%; - min-width: 0; - margin-bottom: 0; -} -.input-group > .form-control + 
.form-control, -.input-group > .form-control + .custom-select, -.input-group > .form-control + .custom-file, -.input-group > .form-control-plaintext + .form-control, -.input-group > .form-control-plaintext + .custom-select, -.input-group > .form-control-plaintext + .custom-file, -.input-group > .custom-select + .form-control, -.input-group > .custom-select + .custom-select, -.input-group > .custom-select + .custom-file, -.input-group > .custom-file + .form-control, -.input-group > .custom-file + .custom-select, -.input-group > .custom-file + .custom-file { - margin-left: -1px; -} -.input-group > .form-control:focus, -.input-group > .custom-select:focus, -.input-group > .custom-file .custom-file-input:focus ~ .custom-file-label { - z-index: 3; -} -.input-group > .custom-file .custom-file-input:focus { - z-index: 4; -} -.input-group > .form-control:not(:first-child), -.input-group > .custom-select:not(:first-child) { - border-top-left-radius: 0; - border-bottom-left-radius: 0; -} -.input-group > .custom-file { - display: -webkit-box; - display: -ms-flexbox; - display: flex; - -webkit-box-align: center; - -ms-flex-align: center; - align-items: center; -} -.input-group > .custom-file:not(:last-child) .custom-file-label, .input-group > .custom-file:not(:last-child) .custom-file-label::after { - border-top-right-radius: 0; - border-bottom-right-radius: 0; -} -.input-group > .custom-file:not(:first-child) .custom-file-label { - border-top-left-radius: 0; - border-bottom-left-radius: 0; -} -.input-group:not(.has-validation) > .form-control:not(:last-child), -.input-group:not(.has-validation) > .custom-select:not(:last-child), -.input-group:not(.has-validation) > .custom-file:not(:last-child) .custom-file-label, -.input-group:not(.has-validation) > .custom-file:not(:last-child) .custom-file-label::after { - border-top-right-radius: 0; - border-bottom-right-radius: 0; -} -.input-group.has-validation > .form-control:nth-last-child(n + 3), -.input-group.has-validation > 
.custom-select:nth-last-child(n + 3), -.input-group.has-validation > .custom-file:nth-last-child(n + 3) .custom-file-label, -.input-group.has-validation > .custom-file:nth-last-child(n + 3) .custom-file-label::after { - border-top-right-radius: 0; - border-bottom-right-radius: 0; -} - -.input-group-prepend, -.input-group-append { - display: -webkit-box; - display: -ms-flexbox; - display: flex; -} -.input-group-prepend .btn, -.input-group-append .btn { - position: relative; - z-index: 2; -} -.input-group-prepend .btn:focus, -.input-group-append .btn:focus { - z-index: 3; -} -.input-group-prepend .btn + .btn, -.input-group-prepend .btn + .input-group-text, -.input-group-prepend .input-group-text + .input-group-text, -.input-group-prepend .input-group-text + .btn, -.input-group-append .btn + .btn, -.input-group-append .btn + .input-group-text, -.input-group-append .input-group-text + .input-group-text, -.input-group-append .input-group-text + .btn { - margin-left: -1px; -} - -.input-group-prepend { - margin-right: -1px; -} - -.input-group-append { - margin-left: -1px; -} - -.input-group-text { - display: -webkit-box; - display: -ms-flexbox; - display: flex; - -webkit-box-align: center; - -ms-flex-align: center; - align-items: center; - padding: 0.375rem 0.75rem; - margin-bottom: 0; - font-size: 1rem; - font-weight: 400; - line-height: 1.5; - color: #495057; - text-align: center; - white-space: nowrap; - background-color: #e9ecef; - border: 1px solid #ced4da; - border-radius: 0.25rem; -} -.input-group-text input[type="radio"], -.input-group-text input[type="checkbox"] { - margin-top: 0; -} - -.input-group-lg > .form-control:not(textarea), -.input-group-lg > .custom-select { - height: calc(1.5em + 1rem + 2px); -} - -.input-group-lg > .form-control, -.input-group-lg > .custom-select, -.input-group-lg > .input-group-prepend > .input-group-text, -.input-group-lg > .input-group-append > .input-group-text, -.input-group-lg > .input-group-prepend > .btn, -.input-group-lg > 
.input-group-append > .btn { - padding: 0.5rem 1rem; - font-size: 1.25rem; - line-height: 1.5; - border-radius: 0.3rem; -} - -.input-group-sm > .form-control:not(textarea), -.input-group-sm > .custom-select { - height: calc(1.5em + 0.5rem + 2px); -} - -.input-group-sm > .form-control, -.input-group-sm > .custom-select, -.input-group-sm > .input-group-prepend > .input-group-text, -.input-group-sm > .input-group-append > .input-group-text, -.input-group-sm > .input-group-prepend > .btn, -.input-group-sm > .input-group-append > .btn { - padding: 0.25rem 0.5rem; - font-size: 0.875rem; - line-height: 1.5; - border-radius: 0.2rem; -} - -.input-group-lg > .custom-select, -.input-group-sm > .custom-select { - padding-right: 1.75rem; -} - -.input-group > .input-group-prepend > .btn, -.input-group > .input-group-prepend > .input-group-text, -.input-group:not(.has-validation) > .input-group-append:not(:last-child) > .btn, -.input-group:not(.has-validation) > .input-group-append:not(:last-child) > .input-group-text, -.input-group.has-validation > .input-group-append:nth-last-child(n + 3) > .btn, -.input-group.has-validation > .input-group-append:nth-last-child(n + 3) > .input-group-text, -.input-group > .input-group-append:last-child > .btn:not(:last-child):not(.dropdown-toggle), -.input-group > .input-group-append:last-child > .input-group-text:not(:last-child) { - border-top-right-radius: 0; - border-bottom-right-radius: 0; -} - -.input-group > .input-group-append > .btn, -.input-group > .input-group-append > .input-group-text, -.input-group > .input-group-prepend:not(:first-child) > .btn, -.input-group > .input-group-prepend:not(:first-child) > .input-group-text, -.input-group > .input-group-prepend:first-child > .btn:not(:first-child), -.input-group > .input-group-prepend:first-child > .input-group-text:not(:first-child) { - border-top-left-radius: 0; - border-bottom-left-radius: 0; -} - -.custom-control { - position: relative; - z-index: 1; - display: block; - min-height: 
1.5rem; - padding-left: 1.5rem; - -webkit-print-color-adjust: exact; - color-adjust: exact; -} - -.custom-control-inline { - display: -webkit-inline-box; - display: -ms-inline-flexbox; - display: inline-flex; - margin-right: 1rem; -} - -.custom-control-input { - position: absolute; - left: 0; - z-index: -1; - width: 1rem; - height: 1.25rem; - opacity: 0; -} -.custom-control-input:checked ~ .custom-control-label::before { - color: #fff; - border-color: #007bff; - background-color: #007bff; -} -.custom-control-input:focus ~ .custom-control-label::before { - -webkit-box-shadow: 0 0 0 0.2rem rgba(0, 123, 255, 0.25); - box-shadow: 0 0 0 0.2rem rgba(0, 123, 255, 0.25); -} -.custom-control-input:focus:not(:checked) ~ .custom-control-label::before { - border-color: #80bdff; -} -.custom-control-input:not(:disabled):active ~ .custom-control-label::before { - color: #fff; - background-color: #b3d7ff; - border-color: #b3d7ff; -} -.custom-control-input[disabled] ~ .custom-control-label, .custom-control-input:disabled ~ .custom-control-label { - color: #6c757d; -} -.custom-control-input[disabled] ~ .custom-control-label::before, .custom-control-input:disabled ~ .custom-control-label::before { - background-color: #e9ecef; -} - -.custom-control-label { - position: relative; - margin-bottom: 0; - vertical-align: top; -} -.custom-control-label::before { - position: absolute; - top: 0.25rem; - left: -1.5rem; - display: block; - width: 1rem; - height: 1rem; - pointer-events: none; - content: ""; - background-color: #fff; - border: #adb5bd solid 1px; -} -.custom-control-label::after { - position: absolute; - top: 0.25rem; - left: -1.5rem; - display: block; - width: 1rem; - height: 1rem; - content: ""; - background: 50% / 50% 50% no-repeat; -} - -.custom-checkbox .custom-control-label::before { - border-radius: 0.25rem; -} -.custom-checkbox .custom-control-input:checked ~ .custom-control-label::after { - background-image: url("data:image/svg+xml,%3csvg xmlns='http://www.w3.org/2000/svg' 
width='8' height='8' viewBox='0 0 8 8'%3e%3cpath fill='%23fff' d='M6.564.75l-3.59 3.612-1.538-1.55L0 4.26l2.974 2.99L8 2.193z'/%3e%3c/svg%3e"); -} -.custom-checkbox .custom-control-input:indeterminate ~ .custom-control-label::before { - border-color: #007bff; - background-color: #007bff; -} -.custom-checkbox .custom-control-input:indeterminate ~ .custom-control-label::after { - background-image: url("data:image/svg+xml,%3csvg xmlns='http://www.w3.org/2000/svg' width='4' height='4' viewBox='0 0 4 4'%3e%3cpath stroke='%23fff' d='M0 2h4'/%3e%3c/svg%3e"); -} -.custom-checkbox .custom-control-input:disabled:checked ~ .custom-control-label::before { - background-color: rgba(0, 123, 255, 0.5); -} -.custom-checkbox .custom-control-input:disabled:indeterminate ~ .custom-control-label::before { - background-color: rgba(0, 123, 255, 0.5); -} - -.custom-radio .custom-control-label::before { - border-radius: 50%; -} -.custom-radio .custom-control-input:checked ~ .custom-control-label::after { - background-image: url("data:image/svg+xml,%3csvg xmlns='http://www.w3.org/2000/svg' width='12' height='12' viewBox='-4 -4 8 8'%3e%3ccircle r='3' fill='%23fff'/%3e%3c/svg%3e"); -} -.custom-radio .custom-control-input:disabled:checked ~ .custom-control-label::before { - background-color: rgba(0, 123, 255, 0.5); -} - -.custom-switch { - padding-left: 2.25rem; -} -.custom-switch .custom-control-label::before { - left: -2.25rem; - width: 1.75rem; - pointer-events: all; - border-radius: 0.5rem; -} -.custom-switch .custom-control-label::after { - top: calc(0.25rem + 2px); - left: calc(-2.25rem + 2px); - width: calc(1rem - 4px); - height: calc(1rem - 4px); - background-color: #adb5bd; - border-radius: 0.5rem; - -webkit-transition: background-color 0.15s ease-in-out, border-color 0.15s ease-in-out, -webkit-transform 0.15s ease-in-out, -webkit-box-shadow 0.15s ease-in-out; - transition: background-color 0.15s ease-in-out, border-color 0.15s ease-in-out, -webkit-transform 0.15s ease-in-out, 
-webkit-box-shadow 0.15s ease-in-out; - transition: transform 0.15s ease-in-out, background-color 0.15s ease-in-out, border-color 0.15s ease-in-out, box-shadow 0.15s ease-in-out; - transition: transform 0.15s ease-in-out, background-color 0.15s ease-in-out, border-color 0.15s ease-in-out, box-shadow 0.15s ease-in-out, -webkit-transform 0.15s ease-in-out, -webkit-box-shadow 0.15s ease-in-out; -} -@media (prefers-reduced-motion: reduce) { - .custom-switch .custom-control-label::after { - -webkit-transition: none; - transition: none; - } -} -.custom-switch .custom-control-input:checked ~ .custom-control-label::after { - background-color: #fff; - -webkit-transform: translateX(0.75rem); - transform: translateX(0.75rem); -} -.custom-switch .custom-control-input:disabled:checked ~ .custom-control-label::before { - background-color: rgba(0, 123, 255, 0.5); -} - -.custom-select { - display: inline-block; - width: 100%; - height: calc(1.5em + 0.75rem + 2px); - padding: 0.375rem 1.75rem 0.375rem 0.75rem; - font-size: 1rem; - font-weight: 400; - line-height: 1.5; - color: #495057; - vertical-align: middle; - background: #fff url("data:image/svg+xml,%3csvg xmlns='http://www.w3.org/2000/svg' width='4' height='5' viewBox='0 0 4 5'%3e%3cpath fill='%23343a40' d='M2 0L0 2h4zm0 5L0 3h4z'/%3e%3c/svg%3e") right 0.75rem center/8px 10px no-repeat; - border: 1px solid #ced4da; - border-radius: 0.25rem; - -webkit-appearance: none; - -moz-appearance: none; - appearance: none; -} -.custom-select:focus { - border-color: #80bdff; - outline: 0; - -webkit-box-shadow: 0 0 0 0.2rem rgba(0, 123, 255, 0.25); - box-shadow: 0 0 0 0.2rem rgba(0, 123, 255, 0.25); -} -.custom-select:focus::-ms-value { - color: #495057; - background-color: #fff; -} -.custom-select[multiple], .custom-select[size]:not([size="1"]) { - height: auto; - padding-right: 0.75rem; - background-image: none; -} -.custom-select:disabled { - color: #6c757d; - background-color: #e9ecef; -} -.custom-select::-ms-expand { - display: none; 
-} -.custom-select:-moz-focusring { - color: transparent; - text-shadow: 0 0 0 #495057; -} - -.custom-select-sm { - height: calc(1.5em + 0.5rem + 2px); - padding-top: 0.25rem; - padding-bottom: 0.25rem; - padding-left: 0.5rem; - font-size: 0.875rem; -} - -.custom-select-lg { - height: calc(1.5em + 1rem + 2px); - padding-top: 0.5rem; - padding-bottom: 0.5rem; - padding-left: 1rem; - font-size: 1.25rem; -} - -.custom-file { - position: relative; - display: inline-block; - width: 100%; - height: calc(1.5em + 0.75rem + 2px); - margin-bottom: 0; -} - -.custom-file-input { - position: relative; - z-index: 2; - width: 100%; - height: calc(1.5em + 0.75rem + 2px); - margin: 0; - overflow: hidden; - opacity: 0; -} -.custom-file-input:focus ~ .custom-file-label { - border-color: #80bdff; - -webkit-box-shadow: 0 0 0 0.2rem rgba(0, 123, 255, 0.25); - box-shadow: 0 0 0 0.2rem rgba(0, 123, 255, 0.25); -} -.custom-file-input[disabled] ~ .custom-file-label, .custom-file-input:disabled ~ .custom-file-label { - background-color: #e9ecef; -} -.custom-file-input:lang(en) ~ .custom-file-label::after { - content: "Browse"; -} -.custom-file-input ~ .custom-file-label[data-browse]::after { - content: attr(data-browse); -} - -.custom-file-label { - position: absolute; - top: 0; - right: 0; - left: 0; - z-index: 1; - height: calc(1.5em + 0.75rem + 2px); - padding: 0.375rem 0.75rem; - overflow: hidden; - font-weight: 400; - line-height: 1.5; - color: #495057; - background-color: #fff; - border: 1px solid #ced4da; - border-radius: 0.25rem; -} -.custom-file-label::after { - position: absolute; - top: 0; - right: 0; - bottom: 0; - z-index: 3; - display: block; - height: calc(1.5em + 0.75rem); - padding: 0.375rem 0.75rem; - line-height: 1.5; - color: #495057; - content: "Browse"; - background-color: #e9ecef; - border-left: inherit; - border-radius: 0 0.25rem 0.25rem 0; -} - -.custom-range { - width: 100%; - height: 1.4rem; - padding: 0; - background-color: transparent; - -webkit-appearance: none; 
- -moz-appearance: none; - appearance: none; -} -.custom-range:focus { - outline: 0; -} -.custom-range:focus::-webkit-slider-thumb { - -webkit-box-shadow: 0 0 0 1px #fff, 0 0 0 0.2rem rgba(0, 123, 255, 0.25); - box-shadow: 0 0 0 1px #fff, 0 0 0 0.2rem rgba(0, 123, 255, 0.25); -} -.custom-range:focus::-moz-range-thumb { - box-shadow: 0 0 0 1px #fff, 0 0 0 0.2rem rgba(0, 123, 255, 0.25); -} -.custom-range:focus::-ms-thumb { - box-shadow: 0 0 0 1px #fff, 0 0 0 0.2rem rgba(0, 123, 255, 0.25); -} -.custom-range::-moz-focus-outer { - border: 0; -} -.custom-range::-webkit-slider-thumb { - width: 1rem; - height: 1rem; - margin-top: -0.25rem; - background-color: #007bff; - border: 0; - border-radius: 1rem; - -webkit-transition: background-color 0.15s ease-in-out, border-color 0.15s ease-in-out, -webkit-box-shadow 0.15s ease-in-out; - transition: background-color 0.15s ease-in-out, border-color 0.15s ease-in-out, -webkit-box-shadow 0.15s ease-in-out; - transition: background-color 0.15s ease-in-out, border-color 0.15s ease-in-out, box-shadow 0.15s ease-in-out; - transition: background-color 0.15s ease-in-out, border-color 0.15s ease-in-out, box-shadow 0.15s ease-in-out, -webkit-box-shadow 0.15s ease-in-out; - -webkit-appearance: none; - appearance: none; -} -@media (prefers-reduced-motion: reduce) { - .custom-range::-webkit-slider-thumb { - -webkit-transition: none; - transition: none; - } -} -.custom-range::-webkit-slider-thumb:active { - background-color: #b3d7ff; -} -.custom-range::-webkit-slider-runnable-track { - width: 100%; - height: 0.5rem; - color: transparent; - cursor: pointer; - background-color: #dee2e6; - border-color: transparent; - border-radius: 1rem; -} -.custom-range::-moz-range-thumb { - width: 1rem; - height: 1rem; - background-color: #007bff; - border: 0; - border-radius: 1rem; - -moz-transition: background-color 0.15s ease-in-out, border-color 0.15s ease-in-out, box-shadow 0.15s ease-in-out; - transition: background-color 0.15s ease-in-out, 
border-color 0.15s ease-in-out, box-shadow 0.15s ease-in-out; - -moz-appearance: none; - appearance: none; -} -@media (prefers-reduced-motion: reduce) { - .custom-range::-moz-range-thumb { - -moz-transition: none; - transition: none; - } -} -.custom-range::-moz-range-thumb:active { - background-color: #b3d7ff; -} -.custom-range::-moz-range-track { - width: 100%; - height: 0.5rem; - color: transparent; - cursor: pointer; - background-color: #dee2e6; - border-color: transparent; - border-radius: 1rem; -} -.custom-range::-ms-thumb { - width: 1rem; - height: 1rem; - margin-top: 0; - margin-right: 0.2rem; - margin-left: 0.2rem; - background-color: #007bff; - border: 0; - border-radius: 1rem; - -ms-transition: background-color 0.15s ease-in-out, border-color 0.15s ease-in-out, box-shadow 0.15s ease-in-out; - transition: background-color 0.15s ease-in-out, border-color 0.15s ease-in-out, box-shadow 0.15s ease-in-out; - appearance: none; -} -@media (prefers-reduced-motion: reduce) { - .custom-range::-ms-thumb { - -ms-transition: none; - transition: none; - } -} -.custom-range::-ms-thumb:active { - background-color: #b3d7ff; -} -.custom-range::-ms-track { - width: 100%; - height: 0.5rem; - color: transparent; - cursor: pointer; - background-color: transparent; - border-color: transparent; - border-width: 0.5rem; -} -.custom-range::-ms-fill-lower { - background-color: #dee2e6; - border-radius: 1rem; -} -.custom-range::-ms-fill-upper { - margin-right: 15px; - background-color: #dee2e6; - border-radius: 1rem; -} -.custom-range:disabled::-webkit-slider-thumb { - background-color: #adb5bd; -} -.custom-range:disabled::-webkit-slider-runnable-track { - cursor: default; -} -.custom-range:disabled::-moz-range-thumb { - background-color: #adb5bd; -} -.custom-range:disabled::-moz-range-track { - cursor: default; -} -.custom-range:disabled::-ms-thumb { - background-color: #adb5bd; -} - -.custom-control-label::before, -.custom-file-label, -.custom-select { - -webkit-transition: 
background-color 0.15s ease-in-out, border-color 0.15s ease-in-out, -webkit-box-shadow 0.15s ease-in-out; - transition: background-color 0.15s ease-in-out, border-color 0.15s ease-in-out, -webkit-box-shadow 0.15s ease-in-out; - transition: background-color 0.15s ease-in-out, border-color 0.15s ease-in-out, box-shadow 0.15s ease-in-out; - transition: background-color 0.15s ease-in-out, border-color 0.15s ease-in-out, box-shadow 0.15s ease-in-out, -webkit-box-shadow 0.15s ease-in-out; -} -@media (prefers-reduced-motion: reduce) { - .custom-control-label::before, - .custom-file-label, - .custom-select { - -webkit-transition: none; - transition: none; - } -} - -.nav { - display: -webkit-box; - display: -ms-flexbox; - display: flex; - -ms-flex-wrap: wrap; - flex-wrap: wrap; - padding-left: 0; - margin-bottom: 0; - list-style: none; -} - -.nav-link { - display: block; - padding: 0.5rem 1rem; -} -.nav-link:hover, .nav-link:focus { - text-decoration: none; -} -.nav-link.disabled { - color: #6c757d; - pointer-events: none; - cursor: default; -} - -.nav-tabs { - border-bottom: 1px solid #dee2e6; -} -.nav-tabs .nav-link { - margin-bottom: -1px; - border: 1px solid transparent; - border-top-left-radius: 0.25rem; - border-top-right-radius: 0.25rem; -} -.nav-tabs .nav-link:hover, .nav-tabs .nav-link:focus { - border-color: #e9ecef #e9ecef #dee2e6; -} -.nav-tabs .nav-link.disabled { - color: #6c757d; - background-color: transparent; - border-color: transparent; -} -.nav-tabs .nav-link.active, -.nav-tabs .nav-item.show .nav-link { - color: #495057; - background-color: #fff; - border-color: #dee2e6 #dee2e6 #fff; -} -.nav-tabs .dropdown-menu { - margin-top: -1px; - border-top-left-radius: 0; - border-top-right-radius: 0; -} - -.nav-pills .nav-link { - border-radius: 0.25rem; -} -.nav-pills .nav-link.active, -.nav-pills .show > .nav-link { - color: #fff; - background-color: #007bff; -} - -.nav-fill > .nav-link, -.nav-fill .nav-item { - -webkit-box-flex: 1; - -ms-flex: 1 1 auto; - 
flex: 1 1 auto; - text-align: center; -} - -.nav-justified > .nav-link, -.nav-justified .nav-item { - -ms-flex-preferred-size: 0; - flex-basis: 0; - -webkit-box-flex: 1; - -ms-flex-positive: 1; - flex-grow: 1; - text-align: center; -} - -.tab-content > .tab-pane { - display: none; -} -.tab-content > .active { - display: block; -} - -.navbar { - position: relative; - display: -webkit-box; - display: -ms-flexbox; - display: flex; - -ms-flex-wrap: wrap; - flex-wrap: wrap; - -webkit-box-align: center; - -ms-flex-align: center; - align-items: center; - -webkit-box-pack: justify; - -ms-flex-pack: justify; - justify-content: space-between; - padding: 0.5rem 1rem; -} -.navbar .container, -.navbar .container-fluid, -.navbar .container-sm, -.navbar .container-md, -.navbar .container-lg, -.navbar .container-xl { - display: -webkit-box; - display: -ms-flexbox; - display: flex; - -ms-flex-wrap: wrap; - flex-wrap: wrap; - -webkit-box-align: center; - -ms-flex-align: center; - align-items: center; - -webkit-box-pack: justify; - -ms-flex-pack: justify; - justify-content: space-between; -} - -.navbar-brand { - display: inline-block; - padding-top: 0.3125rem; - padding-bottom: 0.3125rem; - margin-right: 1rem; - font-size: 1.25rem; - line-height: inherit; - white-space: nowrap; -} -.navbar-brand:hover, .navbar-brand:focus { - text-decoration: none; -} - -.navbar-nav { - display: -webkit-box; - display: -ms-flexbox; - display: flex; - -webkit-box-orient: vertical; - -webkit-box-direction: normal; - -ms-flex-direction: column; - flex-direction: column; - padding-left: 0; - margin-bottom: 0; - list-style: none; -} -.navbar-nav .nav-link { - padding-right: 0; - padding-left: 0; -} -.navbar-nav .dropdown-menu { - position: static; - float: none; -} - -.navbar-text { - display: inline-block; - padding-top: 0.5rem; - padding-bottom: 0.5rem; -} - -.navbar-collapse { - -ms-flex-preferred-size: 100%; - flex-basis: 100%; - -webkit-box-flex: 1; - -ms-flex-positive: 1; - flex-grow: 1; - 
-webkit-box-align: center; - -ms-flex-align: center; - align-items: center; -} - -.navbar-toggler { - padding: 0.25rem 0.75rem; - font-size: 1.25rem; - line-height: 1; - background-color: transparent; - border: 1px solid transparent; - border-radius: 0.25rem; -} -.navbar-toggler:hover, .navbar-toggler:focus { - text-decoration: none; -} - -.navbar-toggler-icon { - display: inline-block; - width: 1.5em; - height: 1.5em; - vertical-align: middle; - content: ""; - background: 50% / 100% 100% no-repeat; -} - -.navbar-nav-scroll { - max-height: 75vh; - overflow-y: auto; -} - -@media (max-width: 575.98px) { - .navbar-expand-sm > .container, - .navbar-expand-sm > .container-fluid, - .navbar-expand-sm > .container-sm, - .navbar-expand-sm > .container-md, - .navbar-expand-sm > .container-lg, - .navbar-expand-sm > .container-xl { - padding-right: 0; - padding-left: 0; - } -} -@media (min-width: 576px) { - .navbar-expand-sm { - -webkit-box-orient: horizontal; - -webkit-box-direction: normal; - -ms-flex-flow: row nowrap; - flex-flow: row nowrap; - -webkit-box-pack: start; - -ms-flex-pack: start; - justify-content: flex-start; - } - .navbar-expand-sm .navbar-nav { - -webkit-box-orient: horizontal; - -webkit-box-direction: normal; - -ms-flex-direction: row; - flex-direction: row; - } - .navbar-expand-sm .navbar-nav .dropdown-menu { - position: absolute; - } - .navbar-expand-sm .navbar-nav .nav-link { - padding-right: 0.5rem; - padding-left: 0.5rem; - } - .navbar-expand-sm > .container, - .navbar-expand-sm > .container-fluid, - .navbar-expand-sm > .container-sm, - .navbar-expand-sm > .container-md, - .navbar-expand-sm > .container-lg, - .navbar-expand-sm > .container-xl { - -ms-flex-wrap: nowrap; - flex-wrap: nowrap; - } - .navbar-expand-sm .navbar-nav-scroll { - overflow: visible; - } - .navbar-expand-sm .navbar-collapse { - display: -webkit-box !important; - display: -ms-flexbox !important; - display: flex !important; - -ms-flex-preferred-size: auto; - flex-basis: auto; - } - 
.navbar-expand-sm .navbar-toggler { - display: none; - } -} -@media (max-width: 767.98px) { - .navbar-expand-md > .container, - .navbar-expand-md > .container-fluid, - .navbar-expand-md > .container-sm, - .navbar-expand-md > .container-md, - .navbar-expand-md > .container-lg, - .navbar-expand-md > .container-xl { - padding-right: 0; - padding-left: 0; - } -} -@media (min-width: 768px) { - .navbar-expand-md { - -webkit-box-orient: horizontal; - -webkit-box-direction: normal; - -ms-flex-flow: row nowrap; - flex-flow: row nowrap; - -webkit-box-pack: start; - -ms-flex-pack: start; - justify-content: flex-start; - } - .navbar-expand-md .navbar-nav { - -webkit-box-orient: horizontal; - -webkit-box-direction: normal; - -ms-flex-direction: row; - flex-direction: row; - } - .navbar-expand-md .navbar-nav .dropdown-menu { - position: absolute; - } - .navbar-expand-md .navbar-nav .nav-link { - padding-right: 0.5rem; - padding-left: 0.5rem; - } - .navbar-expand-md > .container, - .navbar-expand-md > .container-fluid, - .navbar-expand-md > .container-sm, - .navbar-expand-md > .container-md, - .navbar-expand-md > .container-lg, - .navbar-expand-md > .container-xl { - -ms-flex-wrap: nowrap; - flex-wrap: nowrap; - } - .navbar-expand-md .navbar-nav-scroll { - overflow: visible; - } - .navbar-expand-md .navbar-collapse { - display: -webkit-box !important; - display: -ms-flexbox !important; - display: flex !important; - -ms-flex-preferred-size: auto; - flex-basis: auto; - } - .navbar-expand-md .navbar-toggler { - display: none; - } -} -@media (max-width: 991.98px) { - .navbar-expand-lg > .container, - .navbar-expand-lg > .container-fluid, - .navbar-expand-lg > .container-sm, - .navbar-expand-lg > .container-md, - .navbar-expand-lg > .container-lg, - .navbar-expand-lg > .container-xl { - padding-right: 0; - padding-left: 0; - } -} -@media (min-width: 992px) { - .navbar-expand-lg { - -webkit-box-orient: horizontal; - -webkit-box-direction: normal; - -ms-flex-flow: row nowrap; - 
flex-flow: row nowrap; - -webkit-box-pack: start; - -ms-flex-pack: start; - justify-content: flex-start; - } - .navbar-expand-lg .navbar-nav { - -webkit-box-orient: horizontal; - -webkit-box-direction: normal; - -ms-flex-direction: row; - flex-direction: row; - } - .navbar-expand-lg .navbar-nav .dropdown-menu { - position: absolute; - } - .navbar-expand-lg .navbar-nav .nav-link { - padding-right: 0.5rem; - padding-left: 0.5rem; - } - .navbar-expand-lg > .container, - .navbar-expand-lg > .container-fluid, - .navbar-expand-lg > .container-sm, - .navbar-expand-lg > .container-md, - .navbar-expand-lg > .container-lg, - .navbar-expand-lg > .container-xl { - -ms-flex-wrap: nowrap; - flex-wrap: nowrap; - } - .navbar-expand-lg .navbar-nav-scroll { - overflow: visible; - } - .navbar-expand-lg .navbar-collapse { - display: -webkit-box !important; - display: -ms-flexbox !important; - display: flex !important; - -ms-flex-preferred-size: auto; - flex-basis: auto; - } - .navbar-expand-lg .navbar-toggler { - display: none; - } -} -@media (max-width: 1199.98px) { - .navbar-expand-xl > .container, - .navbar-expand-xl > .container-fluid, - .navbar-expand-xl > .container-sm, - .navbar-expand-xl > .container-md, - .navbar-expand-xl > .container-lg, - .navbar-expand-xl > .container-xl { - padding-right: 0; - padding-left: 0; - } -} -@media (min-width: 1200px) { - .navbar-expand-xl { - -webkit-box-orient: horizontal; - -webkit-box-direction: normal; - -ms-flex-flow: row nowrap; - flex-flow: row nowrap; - -webkit-box-pack: start; - -ms-flex-pack: start; - justify-content: flex-start; - } - .navbar-expand-xl .navbar-nav { - -webkit-box-orient: horizontal; - -webkit-box-direction: normal; - -ms-flex-direction: row; - flex-direction: row; - } - .navbar-expand-xl .navbar-nav .dropdown-menu { - position: absolute; - } - .navbar-expand-xl .navbar-nav .nav-link { - padding-right: 0.5rem; - padding-left: 0.5rem; - } - .navbar-expand-xl > .container, - .navbar-expand-xl > .container-fluid, - 
.navbar-expand-xl > .container-sm, - .navbar-expand-xl > .container-md, - .navbar-expand-xl > .container-lg, - .navbar-expand-xl > .container-xl { - -ms-flex-wrap: nowrap; - flex-wrap: nowrap; - } - .navbar-expand-xl .navbar-nav-scroll { - overflow: visible; - } - .navbar-expand-xl .navbar-collapse { - display: -webkit-box !important; - display: -ms-flexbox !important; - display: flex !important; - -ms-flex-preferred-size: auto; - flex-basis: auto; - } - .navbar-expand-xl .navbar-toggler { - display: none; - } -} -.navbar-expand { - -webkit-box-orient: horizontal; - -webkit-box-direction: normal; - -ms-flex-flow: row nowrap; - flex-flow: row nowrap; - -webkit-box-pack: start; - -ms-flex-pack: start; - justify-content: flex-start; -} -.navbar-expand > .container, -.navbar-expand > .container-fluid, -.navbar-expand > .container-sm, -.navbar-expand > .container-md, -.navbar-expand > .container-lg, -.navbar-expand > .container-xl { - padding-right: 0; - padding-left: 0; -} -.navbar-expand .navbar-nav { - -webkit-box-orient: horizontal; - -webkit-box-direction: normal; - -ms-flex-direction: row; - flex-direction: row; -} -.navbar-expand .navbar-nav .dropdown-menu { - position: absolute; -} -.navbar-expand .navbar-nav .nav-link { - padding-right: 0.5rem; - padding-left: 0.5rem; -} -.navbar-expand > .container, -.navbar-expand > .container-fluid, -.navbar-expand > .container-sm, -.navbar-expand > .container-md, -.navbar-expand > .container-lg, -.navbar-expand > .container-xl { - -ms-flex-wrap: nowrap; - flex-wrap: nowrap; -} -.navbar-expand .navbar-nav-scroll { - overflow: visible; -} -.navbar-expand .navbar-collapse { - display: -webkit-box !important; - display: -ms-flexbox !important; - display: flex !important; - -ms-flex-preferred-size: auto; - flex-basis: auto; -} -.navbar-expand .navbar-toggler { - display: none; -} - -.navbar-light .navbar-brand { - color: rgba(0, 0, 0, 0.9); -} -.navbar-light .navbar-brand:hover, .navbar-light .navbar-brand:focus { - color: 
rgba(0, 0, 0, 0.9); -} -.navbar-light .navbar-nav .nav-link { - color: rgba(0, 0, 0, 0.5); -} -.navbar-light .navbar-nav .nav-link:hover, .navbar-light .navbar-nav .nav-link:focus { - color: rgba(0, 0, 0, 0.7); -} -.navbar-light .navbar-nav .nav-link.disabled { - color: rgba(0, 0, 0, 0.3); -} -.navbar-light .navbar-nav .show > .nav-link, -.navbar-light .navbar-nav .active > .nav-link, -.navbar-light .navbar-nav .nav-link.show, -.navbar-light .navbar-nav .nav-link.active { - color: rgba(0, 0, 0, 0.9); -} -.navbar-light .navbar-toggler { - color: rgba(0, 0, 0, 0.5); - border-color: rgba(0, 0, 0, 0.1); -} -.navbar-light .navbar-toggler-icon { - background-image: url("data:image/svg+xml,%3csvg xmlns='http://www.w3.org/2000/svg' width='30' height='30' viewBox='0 0 30 30'%3e%3cpath stroke='rgba%280, 0, 0, 0.5%29' stroke-linecap='round' stroke-miterlimit='10' stroke-width='2' d='M4 7h22M4 15h22M4 23h22'/%3e%3c/svg%3e"); -} -.navbar-light .navbar-text { - color: rgba(0, 0, 0, 0.5); -} -.navbar-light .navbar-text a { - color: rgba(0, 0, 0, 0.9); -} -.navbar-light .navbar-text a:hover, .navbar-light .navbar-text a:focus { - color: rgba(0, 0, 0, 0.9); -} - -.navbar-dark .navbar-brand { - color: #fff; -} -.navbar-dark .navbar-brand:hover, .navbar-dark .navbar-brand:focus { - color: #fff; -} -.navbar-dark .navbar-nav .nav-link { - color: rgba(255, 255, 255, 0.5); -} -.navbar-dark .navbar-nav .nav-link:hover, .navbar-dark .navbar-nav .nav-link:focus { - color: rgba(255, 255, 255, 0.75); -} -.navbar-dark .navbar-nav .nav-link.disabled { - color: rgba(255, 255, 255, 0.25); -} -.navbar-dark .navbar-nav .show > .nav-link, -.navbar-dark .navbar-nav .active > .nav-link, -.navbar-dark .navbar-nav .nav-link.show, -.navbar-dark .navbar-nav .nav-link.active { - color: #fff; -} -.navbar-dark .navbar-toggler { - color: rgba(255, 255, 255, 0.5); - border-color: rgba(255, 255, 255, 0.1); -} -.navbar-dark .navbar-toggler-icon { - background-image: url("data:image/svg+xml,%3csvg 
xmlns='http://www.w3.org/2000/svg' width='30' height='30' viewBox='0 0 30 30'%3e%3cpath stroke='rgba%28255, 255, 255, 0.5%29' stroke-linecap='round' stroke-miterlimit='10' stroke-width='2' d='M4 7h22M4 15h22M4 23h22'/%3e%3c/svg%3e"); -} -.navbar-dark .navbar-text { - color: rgba(255, 255, 255, 0.5); -} -.navbar-dark .navbar-text a { - color: #fff; -} -.navbar-dark .navbar-text a:hover, .navbar-dark .navbar-text a:focus { - color: #fff; -} - -.card { - position: relative; - display: -webkit-box; - display: -ms-flexbox; - display: flex; - -webkit-box-orient: vertical; - -webkit-box-direction: normal; - -ms-flex-direction: column; - flex-direction: column; - min-width: 0; - word-wrap: break-word; - background-color: #fff; - background-clip: border-box; - border: 1px solid rgba(0, 0, 0, 0.125); - border-radius: 0.25rem; -} -.card > hr { - margin-right: 0; - margin-left: 0; -} -.card > .list-group { - border-top: inherit; - border-bottom: inherit; -} -.card > .list-group:first-child { - border-top-width: 0; - border-top-left-radius: calc(0.25rem - 1px); - border-top-right-radius: calc(0.25rem - 1px); -} -.card > .list-group:last-child { - border-bottom-width: 0; - border-bottom-right-radius: calc(0.25rem - 1px); - border-bottom-left-radius: calc(0.25rem - 1px); -} -.card > .card-header + .list-group, -.card > .list-group + .card-footer { - border-top: 0; -} - -.card-body { - -webkit-box-flex: 1; - -ms-flex: 1 1 auto; - flex: 1 1 auto; - min-height: 1px; - padding: 1.25rem; -} - -.card-title { - margin-bottom: 0.75rem; -} - -.card-subtitle { - margin-top: -0.375rem; - margin-bottom: 0; -} - -.card-text:last-child { - margin-bottom: 0; -} - -.card-link:hover { - text-decoration: none; -} -.card-link + .card-link { - margin-left: 1.25rem; -} - -.card-header { - padding: 0.75rem 1.25rem; - margin-bottom: 0; - background-color: rgba(0, 0, 0, 0.03); - border-bottom: 1px solid rgba(0, 0, 0, 0.125); -} -.card-header:first-child { - border-radius: calc(0.25rem - 1px) 
calc(0.25rem - 1px) 0 0; -} - -.card-footer { - padding: 0.75rem 1.25rem; - background-color: rgba(0, 0, 0, 0.03); - border-top: 1px solid rgba(0, 0, 0, 0.125); -} -.card-footer:last-child { - border-radius: 0 0 calc(0.25rem - 1px) calc(0.25rem - 1px); -} - -.card-header-tabs { - margin-right: -0.625rem; - margin-bottom: -0.75rem; - margin-left: -0.625rem; - border-bottom: 0; -} - -.card-header-pills { - margin-right: -0.625rem; - margin-left: -0.625rem; -} - -.card-img-overlay { - position: absolute; - top: 0; - right: 0; - bottom: 0; - left: 0; - padding: 1.25rem; - border-radius: calc(0.25rem - 1px); -} - -.card-img, -.card-img-top, -.card-img-bottom { - -ms-flex-negative: 0; - flex-shrink: 0; - width: 100%; -} - -.card-img, -.card-img-top { - border-top-left-radius: calc(0.25rem - 1px); - border-top-right-radius: calc(0.25rem - 1px); -} - -.card-img, -.card-img-bottom { - border-bottom-right-radius: calc(0.25rem - 1px); - border-bottom-left-radius: calc(0.25rem - 1px); -} - -.card-deck .card { - margin-bottom: 15px; -} -@media (min-width: 576px) { - .card-deck { - display: -webkit-box; - display: -ms-flexbox; - display: flex; - -webkit-box-orient: horizontal; - -webkit-box-direction: normal; - -ms-flex-flow: row wrap; - flex-flow: row wrap; - margin-right: -15px; - margin-left: -15px; - } - .card-deck .card { - -webkit-box-flex: 1; - -ms-flex: 1 0 0%; - flex: 1 0 0%; - margin-right: 15px; - margin-bottom: 0; - margin-left: 15px; - } -} - -.card-group > .card { - margin-bottom: 15px; -} -@media (min-width: 576px) { - .card-group { - display: -webkit-box; - display: -ms-flexbox; - display: flex; - -webkit-box-orient: horizontal; - -webkit-box-direction: normal; - -ms-flex-flow: row wrap; - flex-flow: row wrap; - } - .card-group > .card { - -webkit-box-flex: 1; - -ms-flex: 1 0 0%; - flex: 1 0 0%; - margin-bottom: 0; - } - .card-group > .card + .card { - margin-left: 0; - border-left: 0; - } - .card-group > .card:not(:last-child) { - border-top-right-radius: 0; - 
border-bottom-right-radius: 0; - } - .card-group > .card:not(:last-child) .card-img-top, - .card-group > .card:not(:last-child) .card-header { - border-top-right-radius: 0; - } - .card-group > .card:not(:last-child) .card-img-bottom, - .card-group > .card:not(:last-child) .card-footer { - border-bottom-right-radius: 0; - } - .card-group > .card:not(:first-child) { - border-top-left-radius: 0; - border-bottom-left-radius: 0; - } - .card-group > .card:not(:first-child) .card-img-top, - .card-group > .card:not(:first-child) .card-header { - border-top-left-radius: 0; - } - .card-group > .card:not(:first-child) .card-img-bottom, - .card-group > .card:not(:first-child) .card-footer { - border-bottom-left-radius: 0; - } -} - -.card-columns .card { - margin-bottom: 0.75rem; -} -@media (min-width: 576px) { - .card-columns { - -webkit-column-count: 3; - -moz-column-count: 3; - column-count: 3; - -webkit-column-gap: 1.25rem; - -moz-column-gap: 1.25rem; - column-gap: 1.25rem; - orphans: 1; - widows: 1; - } - .card-columns .card { - display: inline-block; - width: 100%; - } -} - -.accordion { - overflow-anchor: none; -} -.accordion > .card { - overflow: hidden; -} -.accordion > .card:not(:last-of-type) { - border-bottom: 0; - border-bottom-right-radius: 0; - border-bottom-left-radius: 0; -} -.accordion > .card:not(:first-of-type) { - border-top-left-radius: 0; - border-top-right-radius: 0; -} -.accordion > .card > .card-header { - border-radius: 0; - margin-bottom: -1px; -} - -.breadcrumb { - display: -webkit-box; - display: -ms-flexbox; - display: flex; - -ms-flex-wrap: wrap; - flex-wrap: wrap; - padding: 0.75rem 1rem; - margin-bottom: 1rem; - list-style: none; - background-color: #e9ecef; - border-radius: 0.25rem; -} - -.breadcrumb-item + .breadcrumb-item { - padding-left: 0.5rem; -} -.breadcrumb-item + .breadcrumb-item::before { - float: left; - padding-right: 0.5rem; - color: #6c757d; - content: "/"; -} -.breadcrumb-item + .breadcrumb-item:hover::before { - 
text-decoration: underline; -} -.breadcrumb-item + .breadcrumb-item:hover::before { - text-decoration: none; -} -.breadcrumb-item.active { - color: #6c757d; -} - -.pagination { - display: -webkit-box; - display: -ms-flexbox; - display: flex; - padding-left: 0; - list-style: none; - border-radius: 0.25rem; -} - -.page-link { - position: relative; - display: block; - padding: 0.5rem 0.75rem; - margin-left: -1px; - line-height: 1.25; - color: #007bff; - background-color: #fff; - border: 1px solid #dee2e6; -} -.page-link:hover { - z-index: 2; - color: #0056b3; - text-decoration: none; - background-color: #e9ecef; - border-color: #dee2e6; -} -.page-link:focus { - z-index: 3; - outline: 0; - -webkit-box-shadow: 0 0 0 0.2rem rgba(0, 123, 255, 0.25); - box-shadow: 0 0 0 0.2rem rgba(0, 123, 255, 0.25); -} - -.page-item:first-child .page-link { - margin-left: 0; - border-top-left-radius: 0.25rem; - border-bottom-left-radius: 0.25rem; -} -.page-item:last-child .page-link { - border-top-right-radius: 0.25rem; - border-bottom-right-radius: 0.25rem; -} -.page-item.active .page-link { - z-index: 3; - color: #fff; - background-color: #007bff; - border-color: #007bff; -} -.page-item.disabled .page-link { - color: #6c757d; - pointer-events: none; - cursor: auto; - background-color: #fff; - border-color: #dee2e6; -} - -.pagination-lg .page-link { - padding: 0.75rem 1.5rem; - font-size: 1.25rem; - line-height: 1.5; -} -.pagination-lg .page-item:first-child .page-link { - border-top-left-radius: 0.3rem; - border-bottom-left-radius: 0.3rem; -} -.pagination-lg .page-item:last-child .page-link { - border-top-right-radius: 0.3rem; - border-bottom-right-radius: 0.3rem; -} - -.pagination-sm .page-link { - padding: 0.25rem 0.5rem; - font-size: 0.875rem; - line-height: 1.5; -} -.pagination-sm .page-item:first-child .page-link { - border-top-left-radius: 0.2rem; - border-bottom-left-radius: 0.2rem; -} -.pagination-sm .page-item:last-child .page-link { - border-top-right-radius: 0.2rem; - 
border-bottom-right-radius: 0.2rem; -} - -.badge { - display: inline-block; - padding: 0.25em 0.4em; - font-size: 75%; - font-weight: 700; - line-height: 1; - text-align: center; - white-space: nowrap; - vertical-align: baseline; - border-radius: 0.25rem; - -webkit-transition: color 0.15s ease-in-out, background-color 0.15s ease-in-out, border-color 0.15s ease-in-out, -webkit-box-shadow 0.15s ease-in-out; - transition: color 0.15s ease-in-out, background-color 0.15s ease-in-out, border-color 0.15s ease-in-out, -webkit-box-shadow 0.15s ease-in-out; - transition: color 0.15s ease-in-out, background-color 0.15s ease-in-out, border-color 0.15s ease-in-out, box-shadow 0.15s ease-in-out; - transition: color 0.15s ease-in-out, background-color 0.15s ease-in-out, border-color 0.15s ease-in-out, box-shadow 0.15s ease-in-out, -webkit-box-shadow 0.15s ease-in-out; -} -@media (prefers-reduced-motion: reduce) { - .badge { - -webkit-transition: none; - transition: none; - } -} -a.badge:hover, a.badge:focus { - text-decoration: none; -} -.badge:empty { - display: none; -} - -.btn .badge { - position: relative; - top: -1px; -} - -.badge-pill { - padding-right: 0.6em; - padding-left: 0.6em; - border-radius: 10rem; -} - -.badge-primary { - color: #fff; - background-color: #007bff; -} -a.badge-primary:hover, a.badge-primary:focus { - color: #fff; - background-color: #0062cc; -} -a.badge-primary:focus, a.badge-primary.focus { - outline: 0; - -webkit-box-shadow: 0 0 0 0.2rem rgba(0, 123, 255, 0.5); - box-shadow: 0 0 0 0.2rem rgba(0, 123, 255, 0.5); -} - -.badge-secondary { - color: #fff; - background-color: #6c757d; -} -a.badge-secondary:hover, a.badge-secondary:focus { - color: #fff; - background-color: #545b62; -} -a.badge-secondary:focus, a.badge-secondary.focus { - outline: 0; - -webkit-box-shadow: 0 0 0 0.2rem rgba(108, 117, 125, 0.5); - box-shadow: 0 0 0 0.2rem rgba(108, 117, 125, 0.5); -} - -.badge-success { - color: #fff; - background-color: #28a745; -} -a.badge-success:hover, 
a.badge-success:focus { - color: #fff; - background-color: #1e7e34; -} -a.badge-success:focus, a.badge-success.focus { - outline: 0; - -webkit-box-shadow: 0 0 0 0.2rem rgba(40, 167, 69, 0.5); - box-shadow: 0 0 0 0.2rem rgba(40, 167, 69, 0.5); -} - -.badge-info { - color: #fff; - background-color: #17a2b8; -} -a.badge-info:hover, a.badge-info:focus { - color: #fff; - background-color: #117a8b; -} -a.badge-info:focus, a.badge-info.focus { - outline: 0; - -webkit-box-shadow: 0 0 0 0.2rem rgba(23, 162, 184, 0.5); - box-shadow: 0 0 0 0.2rem rgba(23, 162, 184, 0.5); -} - -.badge-warning { - color: #212529; - background-color: #ffc107; -} -a.badge-warning:hover, a.badge-warning:focus { - color: #212529; - background-color: #d39e00; -} -a.badge-warning:focus, a.badge-warning.focus { - outline: 0; - -webkit-box-shadow: 0 0 0 0.2rem rgba(255, 193, 7, 0.5); - box-shadow: 0 0 0 0.2rem rgba(255, 193, 7, 0.5); -} - -.badge-danger { - color: #fff; - background-color: #dc3545; -} -a.badge-danger:hover, a.badge-danger:focus { - color: #fff; - background-color: #bd2130; -} -a.badge-danger:focus, a.badge-danger.focus { - outline: 0; - -webkit-box-shadow: 0 0 0 0.2rem rgba(220, 53, 69, 0.5); - box-shadow: 0 0 0 0.2rem rgba(220, 53, 69, 0.5); -} - -.badge-light { - color: #212529; - background-color: #f8f9fa; -} -a.badge-light:hover, a.badge-light:focus { - color: #212529; - background-color: #dae0e5; -} -a.badge-light:focus, a.badge-light.focus { - outline: 0; - -webkit-box-shadow: 0 0 0 0.2rem rgba(248, 249, 250, 0.5); - box-shadow: 0 0 0 0.2rem rgba(248, 249, 250, 0.5); -} - -.badge-dark { - color: #fff; - background-color: #343a40; -} -a.badge-dark:hover, a.badge-dark:focus { - color: #fff; - background-color: #1d2124; -} -a.badge-dark:focus, a.badge-dark.focus { - outline: 0; - -webkit-box-shadow: 0 0 0 0.2rem rgba(52, 58, 64, 0.5); - box-shadow: 0 0 0 0.2rem rgba(52, 58, 64, 0.5); -} - -.jumbotron { - padding: 2rem 1rem; - margin-bottom: 2rem; - background-color: #e9ecef; - 
border-radius: 0.3rem; -} -@media (min-width: 576px) { - .jumbotron { - padding: 4rem 2rem; - } -} - -.jumbotron-fluid { - padding-right: 0; - padding-left: 0; - border-radius: 0; -} - -.alert { - position: relative; - padding: 0.75rem 1.25rem; - margin-bottom: 1rem; - border: 1px solid transparent; - border-radius: 0.25rem; -} - -.alert-heading { - color: inherit; -} - -.alert-link { - font-weight: 700; -} - -.alert-dismissible { - padding-right: 4rem; -} -.alert-dismissible .close { - position: absolute; - top: 0; - right: 0; - z-index: 2; - padding: 0.75rem 1.25rem; - color: inherit; -} - -.alert-primary { - color: #004085; - background-color: #cce5ff; - border-color: #b8daff; -} -.alert-primary hr { - border-top-color: #9fcdff; -} -.alert-primary .alert-link { - color: #002752; -} - -.alert-secondary { - color: #383d41; - background-color: #e2e3e5; - border-color: #d6d8db; -} -.alert-secondary hr { - border-top-color: #c8cbcf; -} -.alert-secondary .alert-link { - color: #202326; -} - -.alert-success { - color: #155724; - background-color: #d4edda; - border-color: #c3e6cb; -} -.alert-success hr { - border-top-color: #b1dfbb; -} -.alert-success .alert-link { - color: #0b2e13; -} - -.alert-info { - color: #0c5460; - background-color: #d1ecf1; - border-color: #bee5eb; -} -.alert-info hr { - border-top-color: #abdde5; -} -.alert-info .alert-link { - color: #062c33; -} - -.alert-warning { - color: #856404; - background-color: #fff3cd; - border-color: #ffeeba; -} -.alert-warning hr { - border-top-color: #ffe8a1; -} -.alert-warning .alert-link { - color: #533f03; -} - -.alert-danger { - color: #721c24; - background-color: #f8d7da; - border-color: #f5c6cb; -} -.alert-danger hr { - border-top-color: #f1b0b7; -} -.alert-danger .alert-link { - color: #491217; -} - -.alert-light { - color: #818182; - background-color: #fefefe; - border-color: #fdfdfe; -} -.alert-light hr { - border-top-color: #ececf6; -} -.alert-light .alert-link { - color: #686868; -} - -.alert-dark { - 
color: #1b1e21; - background-color: #d6d8d9; - border-color: #c6c8ca; -} -.alert-dark hr { - border-top-color: #b9bbbe; -} -.alert-dark .alert-link { - color: #040505; -} - -@-webkit-keyframes progress-bar-stripes { - from { - background-position: 1rem 0; - } - to { - background-position: 0 0; - } -} - -@keyframes progress-bar-stripes { - from { - background-position: 1rem 0; - } - to { - background-position: 0 0; - } -} -.progress { - display: -webkit-box; - display: -ms-flexbox; - display: flex; - height: 1rem; - overflow: hidden; - line-height: 0; - font-size: 0.75rem; - background-color: #e9ecef; - border-radius: 0.25rem; -} - -.progress-bar { - display: -webkit-box; - display: -ms-flexbox; - display: flex; - -webkit-box-orient: vertical; - -webkit-box-direction: normal; - -ms-flex-direction: column; - flex-direction: column; - -webkit-box-pack: center; - -ms-flex-pack: center; - justify-content: center; - overflow: hidden; - color: #fff; - text-align: center; - white-space: nowrap; - background-color: #007bff; - -webkit-transition: width 0.6s ease; - transition: width 0.6s ease; -} -@media (prefers-reduced-motion: reduce) { - .progress-bar { - -webkit-transition: none; - transition: none; - } -} - -.progress-bar-striped { - background-image: linear-gradient(45deg, rgba(255, 255, 255, 0.15) 25%, transparent 25%, transparent 50%, rgba(255, 255, 255, 0.15) 50%, rgba(255, 255, 255, 0.15) 75%, transparent 75%, transparent); - background-size: 1rem 1rem; -} - -.progress-bar-animated { - -webkit-animation: 1s linear infinite progress-bar-stripes; - animation: 1s linear infinite progress-bar-stripes; -} -@media (prefers-reduced-motion: reduce) { - .progress-bar-animated { - -webkit-animation: none; - animation: none; - } -} - -.media { - display: -webkit-box; - display: -ms-flexbox; - display: flex; - -webkit-box-align: start; - -ms-flex-align: start; - align-items: flex-start; -} - -.media-body { - -webkit-box-flex: 1; - -ms-flex: 1; - flex: 1; -} - -.list-group { - 
display: -webkit-box; - display: -ms-flexbox; - display: flex; - -webkit-box-orient: vertical; - -webkit-box-direction: normal; - -ms-flex-direction: column; - flex-direction: column; - padding-left: 0; - margin-bottom: 0; - border-radius: 0.25rem; -} - -.list-group-item-action { - width: 100%; - color: #495057; - text-align: inherit; -} -.list-group-item-action:hover, .list-group-item-action:focus { - z-index: 1; - color: #495057; - text-decoration: none; - background-color: #f8f9fa; -} -.list-group-item-action:active { - color: #212529; - background-color: #e9ecef; -} - -.list-group-item { - position: relative; - display: block; - padding: 0.75rem 1.25rem; - background-color: #fff; - border: 1px solid rgba(0, 0, 0, 0.125); -} -.list-group-item:first-child { - border-top-left-radius: inherit; - border-top-right-radius: inherit; -} -.list-group-item:last-child { - border-bottom-right-radius: inherit; - border-bottom-left-radius: inherit; -} -.list-group-item.disabled, .list-group-item:disabled { - color: #6c757d; - pointer-events: none; - background-color: #fff; -} -.list-group-item.active { - z-index: 2; - color: #fff; - background-color: #007bff; - border-color: #007bff; -} -.list-group-item + .list-group-item { - border-top-width: 0; -} -.list-group-item + .list-group-item.active { - margin-top: -1px; - border-top-width: 1px; -} - -.list-group-horizontal { - -webkit-box-orient: horizontal; - -webkit-box-direction: normal; - -ms-flex-direction: row; - flex-direction: row; -} -.list-group-horizontal > .list-group-item:first-child { - border-bottom-left-radius: 0.25rem; - border-top-right-radius: 0; -} -.list-group-horizontal > .list-group-item:last-child { - border-top-right-radius: 0.25rem; - border-bottom-left-radius: 0; -} -.list-group-horizontal > .list-group-item.active { - margin-top: 0; -} -.list-group-horizontal > .list-group-item + .list-group-item { - border-top-width: 1px; - border-left-width: 0; -} -.list-group-horizontal > .list-group-item + 
.list-group-item.active { - margin-left: -1px; - border-left-width: 1px; -} - -@media (min-width: 576px) { - .list-group-horizontal-sm { - -webkit-box-orient: horizontal; - -webkit-box-direction: normal; - -ms-flex-direction: row; - flex-direction: row; - } - .list-group-horizontal-sm > .list-group-item:first-child { - border-bottom-left-radius: 0.25rem; - border-top-right-radius: 0; - } - .list-group-horizontal-sm > .list-group-item:last-child { - border-top-right-radius: 0.25rem; - border-bottom-left-radius: 0; - } - .list-group-horizontal-sm > .list-group-item.active { - margin-top: 0; - } - .list-group-horizontal-sm > .list-group-item + .list-group-item { - border-top-width: 1px; - border-left-width: 0; - } - .list-group-horizontal-sm > .list-group-item + .list-group-item.active { - margin-left: -1px; - border-left-width: 1px; - } -} -@media (min-width: 768px) { - .list-group-horizontal-md { - -webkit-box-orient: horizontal; - -webkit-box-direction: normal; - -ms-flex-direction: row; - flex-direction: row; - } - .list-group-horizontal-md > .list-group-item:first-child { - border-bottom-left-radius: 0.25rem; - border-top-right-radius: 0; - } - .list-group-horizontal-md > .list-group-item:last-child { - border-top-right-radius: 0.25rem; - border-bottom-left-radius: 0; - } - .list-group-horizontal-md > .list-group-item.active { - margin-top: 0; - } - .list-group-horizontal-md > .list-group-item + .list-group-item { - border-top-width: 1px; - border-left-width: 0; - } - .list-group-horizontal-md > .list-group-item + .list-group-item.active { - margin-left: -1px; - border-left-width: 1px; - } -} -@media (min-width: 992px) { - .list-group-horizontal-lg { - -webkit-box-orient: horizontal; - -webkit-box-direction: normal; - -ms-flex-direction: row; - flex-direction: row; - } - .list-group-horizontal-lg > .list-group-item:first-child { - border-bottom-left-radius: 0.25rem; - border-top-right-radius: 0; - } - .list-group-horizontal-lg > .list-group-item:last-child { - 
border-top-right-radius: 0.25rem; - border-bottom-left-radius: 0; - } - .list-group-horizontal-lg > .list-group-item.active { - margin-top: 0; - } - .list-group-horizontal-lg > .list-group-item + .list-group-item { - border-top-width: 1px; - border-left-width: 0; - } - .list-group-horizontal-lg > .list-group-item + .list-group-item.active { - margin-left: -1px; - border-left-width: 1px; - } -} -@media (min-width: 1200px) { - .list-group-horizontal-xl { - -webkit-box-orient: horizontal; - -webkit-box-direction: normal; - -ms-flex-direction: row; - flex-direction: row; - } - .list-group-horizontal-xl > .list-group-item:first-child { - border-bottom-left-radius: 0.25rem; - border-top-right-radius: 0; - } - .list-group-horizontal-xl > .list-group-item:last-child { - border-top-right-radius: 0.25rem; - border-bottom-left-radius: 0; - } - .list-group-horizontal-xl > .list-group-item.active { - margin-top: 0; - } - .list-group-horizontal-xl > .list-group-item + .list-group-item { - border-top-width: 1px; - border-left-width: 0; - } - .list-group-horizontal-xl > .list-group-item + .list-group-item.active { - margin-left: -1px; - border-left-width: 1px; - } -} -.list-group-flush { - border-radius: 0; -} -.list-group-flush > .list-group-item { - border-width: 0 0 1px; -} -.list-group-flush > .list-group-item:last-child { - border-bottom-width: 0; -} - -.list-group-item-primary { - color: #004085; - background-color: #b8daff; -} -.list-group-item-primary.list-group-item-action:hover, .list-group-item-primary.list-group-item-action:focus { - color: #004085; - background-color: #9fcdff; -} -.list-group-item-primary.list-group-item-action.active { - color: #fff; - background-color: #004085; - border-color: #004085; -} - -.list-group-item-secondary { - color: #383d41; - background-color: #d6d8db; -} -.list-group-item-secondary.list-group-item-action:hover, .list-group-item-secondary.list-group-item-action:focus { - color: #383d41; - background-color: #c8cbcf; -} 
-.list-group-item-secondary.list-group-item-action.active { - color: #fff; - background-color: #383d41; - border-color: #383d41; -} - -.list-group-item-success { - color: #155724; - background-color: #c3e6cb; -} -.list-group-item-success.list-group-item-action:hover, .list-group-item-success.list-group-item-action:focus { - color: #155724; - background-color: #b1dfbb; -} -.list-group-item-success.list-group-item-action.active { - color: #fff; - background-color: #155724; - border-color: #155724; -} - -.list-group-item-info { - color: #0c5460; - background-color: #bee5eb; -} -.list-group-item-info.list-group-item-action:hover, .list-group-item-info.list-group-item-action:focus { - color: #0c5460; - background-color: #abdde5; -} -.list-group-item-info.list-group-item-action.active { - color: #fff; - background-color: #0c5460; - border-color: #0c5460; -} - -.list-group-item-warning { - color: #856404; - background-color: #ffeeba; -} -.list-group-item-warning.list-group-item-action:hover, .list-group-item-warning.list-group-item-action:focus { - color: #856404; - background-color: #ffe8a1; -} -.list-group-item-warning.list-group-item-action.active { - color: #fff; - background-color: #856404; - border-color: #856404; -} - -.list-group-item-danger { - color: #721c24; - background-color: #f5c6cb; -} -.list-group-item-danger.list-group-item-action:hover, .list-group-item-danger.list-group-item-action:focus { - color: #721c24; - background-color: #f1b0b7; -} -.list-group-item-danger.list-group-item-action.active { - color: #fff; - background-color: #721c24; - border-color: #721c24; -} - -.list-group-item-light { - color: #818182; - background-color: #fdfdfe; -} -.list-group-item-light.list-group-item-action:hover, .list-group-item-light.list-group-item-action:focus { - color: #818182; - background-color: #ececf6; -} -.list-group-item-light.list-group-item-action.active { - color: #fff; - background-color: #818182; - border-color: #818182; -} - -.list-group-item-dark { - 
color: #1b1e21; - background-color: #c6c8ca; -} -.list-group-item-dark.list-group-item-action:hover, .list-group-item-dark.list-group-item-action:focus { - color: #1b1e21; - background-color: #b9bbbe; -} -.list-group-item-dark.list-group-item-action.active { - color: #fff; - background-color: #1b1e21; - border-color: #1b1e21; -} - -.close { - float: right; - font-size: 1.5rem; - font-weight: 700; - line-height: 1; - color: #000; - text-shadow: 0 1px 0 #fff; - opacity: .5; -} -.close:hover { - color: #000; - text-decoration: none; -} -.close:not(:disabled):not(.disabled):hover, .close:not(:disabled):not(.disabled):focus { - opacity: .75; -} - -button.close { - padding: 0; - background-color: transparent; - border: 0; -} - -a.close.disabled { - pointer-events: none; -} - -.toast { - -ms-flex-preferred-size: 350px; - flex-basis: 350px; - max-width: 350px; - font-size: 0.875rem; - background-color: rgba(255, 255, 255, 0.85); - background-clip: padding-box; - border: 1px solid rgba(0, 0, 0, 0.1); - -webkit-box-shadow: 0 0.25rem 0.75rem rgba(0, 0, 0, 0.1); - box-shadow: 0 0.25rem 0.75rem rgba(0, 0, 0, 0.1); - opacity: 0; - border-radius: 0.25rem; -} -.toast:not(:last-child) { - margin-bottom: 0.75rem; -} -.toast.showing { - opacity: 1; -} -.toast.show { - display: block; - opacity: 1; -} -.toast.hide { - display: none; -} - -.toast-header { - display: -webkit-box; - display: -ms-flexbox; - display: flex; - -webkit-box-align: center; - -ms-flex-align: center; - align-items: center; - padding: 0.25rem 0.75rem; - color: #6c757d; - background-color: rgba(255, 255, 255, 0.85); - background-clip: padding-box; - border-bottom: 1px solid rgba(0, 0, 0, 0.05); - border-top-left-radius: calc(0.25rem - 1px); - border-top-right-radius: calc(0.25rem - 1px); -} - -.toast-body { - padding: 0.75rem; -} - -.modal-open { - overflow: hidden; -} -.modal-open .modal { - overflow-x: hidden; - overflow-y: auto; -} - -.modal { - position: fixed; - top: 0; - left: 0; - z-index: 1050; - display: 
none; - width: 100%; - height: 100%; - overflow: hidden; - outline: 0; -} - -.modal-dialog { - position: relative; - width: auto; - margin: 0.5rem; - pointer-events: none; -} -.modal.fade .modal-dialog { - -webkit-transition: -webkit-transform 0.3s ease-out; - transition: -webkit-transform 0.3s ease-out; - transition: transform 0.3s ease-out; - transition: transform 0.3s ease-out, -webkit-transform 0.3s ease-out; - -webkit-transform: translate(0, -50px); - transform: translate(0, -50px); -} -@media (prefers-reduced-motion: reduce) { - .modal.fade .modal-dialog { - -webkit-transition: none; - transition: none; - } -} -.modal.show .modal-dialog { - -webkit-transform: none; - transform: none; -} -.modal.modal-static .modal-dialog { - -webkit-transform: scale(1.02); - transform: scale(1.02); -} - -.modal-dialog-scrollable { - display: -webkit-box; - display: -ms-flexbox; - display: flex; - max-height: calc(100% - 1rem); -} -.modal-dialog-scrollable .modal-content { - max-height: calc(100vh - 1rem); - overflow: hidden; -} -.modal-dialog-scrollable .modal-header, -.modal-dialog-scrollable .modal-footer { - -ms-flex-negative: 0; - flex-shrink: 0; -} -.modal-dialog-scrollable .modal-body { - overflow-y: auto; -} - -.modal-dialog-centered { - display: -webkit-box; - display: -ms-flexbox; - display: flex; - -webkit-box-align: center; - -ms-flex-align: center; - align-items: center; - min-height: calc(100% - 1rem); -} -.modal-dialog-centered::before { - display: block; - height: calc(100vh - 1rem); - height: -webkit-min-content; - height: -moz-min-content; - height: min-content; - content: ""; -} -.modal-dialog-centered.modal-dialog-scrollable { - -webkit-box-orient: vertical; - -webkit-box-direction: normal; - -ms-flex-direction: column; - flex-direction: column; - -webkit-box-pack: center; - -ms-flex-pack: center; - justify-content: center; - height: 100%; -} -.modal-dialog-centered.modal-dialog-scrollable .modal-content { - max-height: none; -} 
-.modal-dialog-centered.modal-dialog-scrollable::before { - content: none; -} - -.modal-content { - position: relative; - display: -webkit-box; - display: -ms-flexbox; - display: flex; - -webkit-box-orient: vertical; - -webkit-box-direction: normal; - -ms-flex-direction: column; - flex-direction: column; - width: 100%; - pointer-events: auto; - background-color: #fff; - background-clip: padding-box; - border: 1px solid rgba(0, 0, 0, 0.2); - border-radius: 0.3rem; - outline: 0; -} - -.modal-backdrop { - position: fixed; - top: 0; - left: 0; - z-index: 1040; - width: 100vw; - height: 100vh; - background-color: #000; -} -.modal-backdrop.fade { - opacity: 0; -} -.modal-backdrop.show { - opacity: 0.5; -} - -.modal-header { - display: -webkit-box; - display: -ms-flexbox; - display: flex; - -webkit-box-align: start; - -ms-flex-align: start; - align-items: flex-start; - -webkit-box-pack: justify; - -ms-flex-pack: justify; - justify-content: space-between; - padding: 1rem 1rem; - border-bottom: 1px solid #dee2e6; - border-top-left-radius: calc(0.3rem - 1px); - border-top-right-radius: calc(0.3rem - 1px); -} -.modal-header .close { - padding: 1rem 1rem; - margin: -1rem -1rem -1rem auto; -} - -.modal-title { - margin-bottom: 0; - line-height: 1.5; -} - -.modal-body { - position: relative; - -webkit-box-flex: 1; - -ms-flex: 1 1 auto; - flex: 1 1 auto; - padding: 1rem; -} - -.modal-footer { - display: -webkit-box; - display: -ms-flexbox; - display: flex; - -ms-flex-wrap: wrap; - flex-wrap: wrap; - -webkit-box-align: center; - -ms-flex-align: center; - align-items: center; - -webkit-box-pack: end; - -ms-flex-pack: end; - justify-content: flex-end; - padding: 0.75rem; - border-top: 1px solid #dee2e6; - border-bottom-right-radius: calc(0.3rem - 1px); - border-bottom-left-radius: calc(0.3rem - 1px); -} -.modal-footer > * { - margin: 0.25rem; -} - -.modal-scrollbar-measure { - position: absolute; - top: -9999px; - width: 50px; - height: 50px; - overflow: scroll; -} - -@media 
(min-width: 576px) { - .modal-dialog { - max-width: 500px; - margin: 1.75rem auto; - } - - .modal-dialog-scrollable { - max-height: calc(100% - 3.5rem); - } - .modal-dialog-scrollable .modal-content { - max-height: calc(100vh - 3.5rem); - } - - .modal-dialog-centered { - min-height: calc(100% - 3.5rem); - } - .modal-dialog-centered::before { - height: calc(100vh - 3.5rem); - height: -webkit-min-content; - height: -moz-min-content; - height: min-content; - } - - .modal-sm { - max-width: 300px; - } -} -@media (min-width: 992px) { - .modal-lg, - .modal-xl { - max-width: 800px; - } -} -@media (min-width: 1200px) { - .modal-xl { - max-width: 1140px; - } -} -.tooltip { - position: absolute; - z-index: 1070; - display: block; - margin: 0; - font-family: -apple-system, BlinkMacSystemFont, "Segoe UI", Roboto, "Helvetica Neue", Arial, "Noto Sans", "Liberation Sans", sans-serif, "Apple Color Emoji", "Segoe UI Emoji", "Segoe UI Symbol", "Noto Color Emoji"; - font-style: normal; - font-weight: 400; - line-height: 1.5; - text-align: left; - text-align: start; - text-decoration: none; - text-shadow: none; - text-transform: none; - letter-spacing: normal; - word-break: normal; - word-spacing: normal; - white-space: normal; - line-break: auto; - font-size: 0.875rem; - word-wrap: break-word; - opacity: 0; -} -.tooltip.show { - opacity: 0.9; -} -.tooltip .arrow { - position: absolute; - display: block; - width: 0.8rem; - height: 0.4rem; -} -.tooltip .arrow::before { - position: absolute; - content: ""; - border-color: transparent; - border-style: solid; -} - -.bs-tooltip-top, .bs-tooltip-auto[x-placement^="top"] { - padding: 0.4rem 0; -} -.bs-tooltip-top .arrow, .bs-tooltip-auto[x-placement^="top"] .arrow { - bottom: 0; -} -.bs-tooltip-top .arrow::before, .bs-tooltip-auto[x-placement^="top"] .arrow::before { - top: 0; - border-width: 0.4rem 0.4rem 0; - border-top-color: #000; -} - -.bs-tooltip-right, .bs-tooltip-auto[x-placement^="right"] { - padding: 0 0.4rem; -} -.bs-tooltip-right 
.arrow, .bs-tooltip-auto[x-placement^="right"] .arrow { - left: 0; - width: 0.4rem; - height: 0.8rem; -} -.bs-tooltip-right .arrow::before, .bs-tooltip-auto[x-placement^="right"] .arrow::before { - right: 0; - border-width: 0.4rem 0.4rem 0.4rem 0; - border-right-color: #000; -} - -.bs-tooltip-bottom, .bs-tooltip-auto[x-placement^="bottom"] { - padding: 0.4rem 0; -} -.bs-tooltip-bottom .arrow, .bs-tooltip-auto[x-placement^="bottom"] .arrow { - top: 0; -} -.bs-tooltip-bottom .arrow::before, .bs-tooltip-auto[x-placement^="bottom"] .arrow::before { - bottom: 0; - border-width: 0 0.4rem 0.4rem; - border-bottom-color: #000; -} - -.bs-tooltip-left, .bs-tooltip-auto[x-placement^="left"] { - padding: 0 0.4rem; -} -.bs-tooltip-left .arrow, .bs-tooltip-auto[x-placement^="left"] .arrow { - right: 0; - width: 0.4rem; - height: 0.8rem; -} -.bs-tooltip-left .arrow::before, .bs-tooltip-auto[x-placement^="left"] .arrow::before { - left: 0; - border-width: 0.4rem 0 0.4rem 0.4rem; - border-left-color: #000; -} - -.tooltip-inner { - max-width: 200px; - padding: 0.25rem 0.5rem; - color: #fff; - text-align: center; - background-color: #000; - border-radius: 0.25rem; -} - -.popover { - position: absolute; - top: 0; - left: 0; - z-index: 1060; - display: block; - max-width: 276px; - font-family: -apple-system, BlinkMacSystemFont, "Segoe UI", Roboto, "Helvetica Neue", Arial, "Noto Sans", "Liberation Sans", sans-serif, "Apple Color Emoji", "Segoe UI Emoji", "Segoe UI Symbol", "Noto Color Emoji"; - font-style: normal; - font-weight: 400; - line-height: 1.5; - text-align: left; - text-align: start; - text-decoration: none; - text-shadow: none; - text-transform: none; - letter-spacing: normal; - word-break: normal; - word-spacing: normal; - white-space: normal; - line-break: auto; - font-size: 0.875rem; - word-wrap: break-word; - background-color: #fff; - background-clip: padding-box; - border: 1px solid rgba(0, 0, 0, 0.2); - border-radius: 0.3rem; -} -.popover .arrow { - position: absolute; - 
display: block; - width: 1rem; - height: 0.5rem; - margin: 0 0.3rem; -} -.popover .arrow::before, .popover .arrow::after { - position: absolute; - display: block; - content: ""; - border-color: transparent; - border-style: solid; -} - -.bs-popover-top, .bs-popover-auto[x-placement^="top"] { - margin-bottom: 0.5rem; -} -.bs-popover-top > .arrow, .bs-popover-auto[x-placement^="top"] > .arrow { - bottom: calc(-0.5rem - 1px); -} -.bs-popover-top > .arrow::before, .bs-popover-auto[x-placement^="top"] > .arrow::before { - bottom: 0; - border-width: 0.5rem 0.5rem 0; - border-top-color: rgba(0, 0, 0, 0.25); -} -.bs-popover-top > .arrow::after, .bs-popover-auto[x-placement^="top"] > .arrow::after { - bottom: 1px; - border-width: 0.5rem 0.5rem 0; - border-top-color: #fff; -} - -.bs-popover-right, .bs-popover-auto[x-placement^="right"] { - margin-left: 0.5rem; -} -.bs-popover-right > .arrow, .bs-popover-auto[x-placement^="right"] > .arrow { - left: calc(-0.5rem - 1px); - width: 0.5rem; - height: 1rem; - margin: 0.3rem 0; -} -.bs-popover-right > .arrow::before, .bs-popover-auto[x-placement^="right"] > .arrow::before { - left: 0; - border-width: 0.5rem 0.5rem 0.5rem 0; - border-right-color: rgba(0, 0, 0, 0.25); -} -.bs-popover-right > .arrow::after, .bs-popover-auto[x-placement^="right"] > .arrow::after { - left: 1px; - border-width: 0.5rem 0.5rem 0.5rem 0; - border-right-color: #fff; -} - -.bs-popover-bottom, .bs-popover-auto[x-placement^="bottom"] { - margin-top: 0.5rem; -} -.bs-popover-bottom > .arrow, .bs-popover-auto[x-placement^="bottom"] > .arrow { - top: calc(-0.5rem - 1px); -} -.bs-popover-bottom > .arrow::before, .bs-popover-auto[x-placement^="bottom"] > .arrow::before { - top: 0; - border-width: 0 0.5rem 0.5rem 0.5rem; - border-bottom-color: rgba(0, 0, 0, 0.25); -} -.bs-popover-bottom > .arrow::after, .bs-popover-auto[x-placement^="bottom"] > .arrow::after { - top: 1px; - border-width: 0 0.5rem 0.5rem 0.5rem; - border-bottom-color: #fff; -} -.bs-popover-bottom 
.popover-header::before, .bs-popover-auto[x-placement^="bottom"] .popover-header::before { - position: absolute; - top: 0; - left: 50%; - display: block; - width: 1rem; - margin-left: -0.5rem; - content: ""; - border-bottom: 1px solid #f7f7f7; -} - -.bs-popover-left, .bs-popover-auto[x-placement^="left"] { - margin-right: 0.5rem; -} -.bs-popover-left > .arrow, .bs-popover-auto[x-placement^="left"] > .arrow { - right: calc(-0.5rem - 1px); - width: 0.5rem; - height: 1rem; - margin: 0.3rem 0; -} -.bs-popover-left > .arrow::before, .bs-popover-auto[x-placement^="left"] > .arrow::before { - right: 0; - border-width: 0.5rem 0 0.5rem 0.5rem; - border-left-color: rgba(0, 0, 0, 0.25); -} -.bs-popover-left > .arrow::after, .bs-popover-auto[x-placement^="left"] > .arrow::after { - right: 1px; - border-width: 0.5rem 0 0.5rem 0.5rem; - border-left-color: #fff; -} - -.popover-header { - padding: 0.5rem 0.75rem; - margin-bottom: 0; - font-size: 1rem; - background-color: #f7f7f7; - border-bottom: 1px solid #ebebeb; - border-top-left-radius: calc(0.3rem - 1px); - border-top-right-radius: calc(0.3rem - 1px); -} -.popover-header:empty { - display: none; -} - -.popover-body { - padding: 0.5rem 0.75rem; - color: #212529; -} - -.carousel { - position: relative; -} - -.carousel.pointer-event { - -ms-touch-action: pan-y; - touch-action: pan-y; -} - -.carousel-inner { - position: relative; - width: 100%; - overflow: hidden; -} -.carousel-inner::after { - display: block; - clear: both; - content: ""; -} - -.carousel-item { - position: relative; - display: none; - float: left; - width: 100%; - margin-right: -100%; - -webkit-backface-visibility: hidden; - backface-visibility: hidden; - -webkit-transition: -webkit-transform 0.6s ease-in-out; - transition: -webkit-transform 0.6s ease-in-out; - transition: transform 0.6s ease-in-out; - transition: transform 0.6s ease-in-out, -webkit-transform 0.6s ease-in-out; -} -@media (prefers-reduced-motion: reduce) { - .carousel-item { - -webkit-transition: 
none; - transition: none; - } -} - -.carousel-item.active, -.carousel-item-next, -.carousel-item-prev { - display: block; -} - -.carousel-item-next:not(.carousel-item-left), -.active.carousel-item-right { - -webkit-transform: translateX(100%); - transform: translateX(100%); -} - -.carousel-item-prev:not(.carousel-item-right), -.active.carousel-item-left { - -webkit-transform: translateX(-100%); - transform: translateX(-100%); -} - -.carousel-fade .carousel-item { - opacity: 0; - -webkit-transition-property: opacity; - transition-property: opacity; - -webkit-transform: none; - transform: none; -} -.carousel-fade .carousel-item.active, -.carousel-fade .carousel-item-next.carousel-item-left, -.carousel-fade .carousel-item-prev.carousel-item-right { - z-index: 1; - opacity: 1; -} -.carousel-fade .active.carousel-item-left, -.carousel-fade .active.carousel-item-right { - z-index: 0; - opacity: 0; - -webkit-transition: opacity 0s 0.6s; - transition: opacity 0s 0.6s; -} -@media (prefers-reduced-motion: reduce) { - .carousel-fade .active.carousel-item-left, - .carousel-fade .active.carousel-item-right { - -webkit-transition: none; - transition: none; - } -} - -.carousel-control-prev, -.carousel-control-next { - position: absolute; - top: 0; - bottom: 0; - z-index: 1; - display: -webkit-box; - display: -ms-flexbox; - display: flex; - -webkit-box-align: center; - -ms-flex-align: center; - align-items: center; - -webkit-box-pack: center; - -ms-flex-pack: center; - justify-content: center; - width: 15%; - padding: 0; - color: #fff; - text-align: center; - background: none; - border: 0; - opacity: 0.5; - -webkit-transition: opacity 0.15s ease; - transition: opacity 0.15s ease; -} -@media (prefers-reduced-motion: reduce) { - .carousel-control-prev, - .carousel-control-next { - -webkit-transition: none; - transition: none; - } -} -.carousel-control-prev:hover, .carousel-control-prev:focus, -.carousel-control-next:hover, -.carousel-control-next:focus { - color: #fff; - 
text-decoration: none; - outline: 0; - opacity: 0.9; -} - -.carousel-control-prev { - left: 0; -} - -.carousel-control-next { - right: 0; -} - -.carousel-control-prev-icon, -.carousel-control-next-icon { - display: inline-block; - width: 20px; - height: 20px; - background: 50% / 100% 100% no-repeat; -} - -.carousel-control-prev-icon { - background-image: url("data:image/svg+xml,%3csvg xmlns='http://www.w3.org/2000/svg' fill='%23fff' width='8' height='8' viewBox='0 0 8 8'%3e%3cpath d='M5.25 0l-4 4 4 4 1.5-1.5L4.25 4l2.5-2.5L5.25 0z'/%3e%3c/svg%3e"); -} - -.carousel-control-next-icon { - background-image: url("data:image/svg+xml,%3csvg xmlns='http://www.w3.org/2000/svg' fill='%23fff' width='8' height='8' viewBox='0 0 8 8'%3e%3cpath d='M2.75 0l-1.5 1.5L3.75 4l-2.5 2.5L2.75 8l4-4-4-4z'/%3e%3c/svg%3e"); -} - -.carousel-indicators { - position: absolute; - right: 0; - bottom: 0; - left: 0; - z-index: 15; - display: -webkit-box; - display: -ms-flexbox; - display: flex; - -webkit-box-pack: center; - -ms-flex-pack: center; - justify-content: center; - padding-left: 0; - margin-right: 15%; - margin-left: 15%; - list-style: none; -} -.carousel-indicators li { - -webkit-box-sizing: content-box; - box-sizing: content-box; - -webkit-box-flex: 0; - -ms-flex: 0 1 auto; - flex: 0 1 auto; - width: 30px; - height: 3px; - margin-right: 3px; - margin-left: 3px; - text-indent: -999px; - cursor: pointer; - background-color: #fff; - background-clip: padding-box; - border-top: 10px solid transparent; - border-bottom: 10px solid transparent; - opacity: .5; - -webkit-transition: opacity 0.6s ease; - transition: opacity 0.6s ease; -} -@media (prefers-reduced-motion: reduce) { - .carousel-indicators li { - -webkit-transition: none; - transition: none; - } -} -.carousel-indicators .active { - opacity: 1; -} - -.carousel-caption { - position: absolute; - right: 15%; - bottom: 20px; - left: 15%; - z-index: 10; - padding-top: 20px; - padding-bottom: 20px; - color: #fff; - text-align: center; -} - 
-@-webkit-keyframes spinner-border { - to { - -webkit-transform: rotate(360deg); - transform: rotate(360deg); - } -} - -@keyframes spinner-border { - to { - -webkit-transform: rotate(360deg); - transform: rotate(360deg); - } -} -.spinner-border { - display: inline-block; - width: 2rem; - height: 2rem; - vertical-align: -0.125em; - border: 0.25em solid currentColor; - border-right-color: transparent; - border-radius: 50%; - -webkit-animation: .75s linear infinite spinner-border; - animation: .75s linear infinite spinner-border; -} - -.spinner-border-sm { - width: 1rem; - height: 1rem; - border-width: 0.2em; -} - -@-webkit-keyframes spinner-grow { - 0% { - -webkit-transform: scale(0); - transform: scale(0); - } - 50% { - opacity: 1; - -webkit-transform: none; - transform: none; - } -} - -@keyframes spinner-grow { - 0% { - -webkit-transform: scale(0); - transform: scale(0); - } - 50% { - opacity: 1; - -webkit-transform: none; - transform: none; - } -} -.spinner-grow { - display: inline-block; - width: 2rem; - height: 2rem; - vertical-align: -0.125em; - background-color: currentColor; - border-radius: 50%; - opacity: 0; - -webkit-animation: .75s linear infinite spinner-grow; - animation: .75s linear infinite spinner-grow; -} - -.spinner-grow-sm { - width: 1rem; - height: 1rem; -} - -@media (prefers-reduced-motion: reduce) { - .spinner-border, - .spinner-grow { - -webkit-animation-duration: 1.5s; - animation-duration: 1.5s; - } -} -.align-baseline { - vertical-align: baseline !important; -} - -.align-top { - vertical-align: top !important; -} - -.align-middle { - vertical-align: middle !important; -} - -.align-bottom { - vertical-align: bottom !important; -} - -.align-text-bottom { - vertical-align: text-bottom !important; -} - -.align-text-top { - vertical-align: text-top !important; -} - -.bg-primary { - background-color: #007bff !important; -} - -a.bg-primary:hover, a.bg-primary:focus, -button.bg-primary:hover, -button.bg-primary:focus { - background-color: #0062cc 
!important; -} - -.bg-secondary { - background-color: #6c757d !important; -} - -a.bg-secondary:hover, a.bg-secondary:focus, -button.bg-secondary:hover, -button.bg-secondary:focus { - background-color: #545b62 !important; -} - -.bg-success { - background-color: #28a745 !important; -} - -a.bg-success:hover, a.bg-success:focus, -button.bg-success:hover, -button.bg-success:focus { - background-color: #1e7e34 !important; -} - -.bg-info { - background-color: #17a2b8 !important; -} - -a.bg-info:hover, a.bg-info:focus, -button.bg-info:hover, -button.bg-info:focus { - background-color: #117a8b !important; -} - -.bg-warning { - background-color: #ffc107 !important; -} - -a.bg-warning:hover, a.bg-warning:focus, -button.bg-warning:hover, -button.bg-warning:focus { - background-color: #d39e00 !important; -} - -.bg-danger { - background-color: #dc3545 !important; -} - -a.bg-danger:hover, a.bg-danger:focus, -button.bg-danger:hover, -button.bg-danger:focus { - background-color: #bd2130 !important; -} - -.bg-light { - background-color: #f8f9fa !important; -} - -a.bg-light:hover, a.bg-light:focus, -button.bg-light:hover, -button.bg-light:focus { - background-color: #dae0e5 !important; -} - -.bg-dark { - background-color: #343a40 !important; -} - -a.bg-dark:hover, a.bg-dark:focus, -button.bg-dark:hover, -button.bg-dark:focus { - background-color: #1d2124 !important; -} - -.bg-white { - background-color: #fff !important; -} - -.bg-transparent { - background-color: transparent !important; -} - -.border { - border: 1px solid #dee2e6 !important; -} - -.border-top { - border-top: 1px solid #dee2e6 !important; -} - -.border-right { - border-right: 1px solid #dee2e6 !important; -} - -.border-bottom { - border-bottom: 1px solid #dee2e6 !important; -} - -.border-left { - border-left: 1px solid #dee2e6 !important; -} - -.border-0 { - border: 0 !important; -} - -.border-top-0 { - border-top: 0 !important; -} - -.border-right-0 { - border-right: 0 !important; -} - -.border-bottom-0 { - 
border-bottom: 0 !important; -} - -.border-left-0 { - border-left: 0 !important; -} - -.border-primary { - border-color: #007bff !important; -} - -.border-secondary { - border-color: #6c757d !important; -} - -.border-success { - border-color: #28a745 !important; -} - -.border-info { - border-color: #17a2b8 !important; -} - -.border-warning { - border-color: #ffc107 !important; -} - -.border-danger { - border-color: #dc3545 !important; -} - -.border-light { - border-color: #f8f9fa !important; -} - -.border-dark { - border-color: #343a40 !important; -} - -.border-white { - border-color: #fff !important; -} - -.rounded-sm { - border-radius: 0.2rem !important; -} - -.rounded { - border-radius: 0.25rem !important; -} - -.rounded-top { - border-top-left-radius: 0.25rem !important; - border-top-right-radius: 0.25rem !important; -} - -.rounded-right { - border-top-right-radius: 0.25rem !important; - border-bottom-right-radius: 0.25rem !important; -} - -.rounded-bottom { - border-bottom-right-radius: 0.25rem !important; - border-bottom-left-radius: 0.25rem !important; -} - -.rounded-left { - border-top-left-radius: 0.25rem !important; - border-bottom-left-radius: 0.25rem !important; -} - -.rounded-lg { - border-radius: 0.3rem !important; -} - -.rounded-circle { - border-radius: 50% !important; -} - -.rounded-pill { - border-radius: 50rem !important; -} - -.rounded-0 { - border-radius: 0 !important; -} - -.clearfix::after { - display: block; - clear: both; - content: ""; -} - -.d-none { - display: none !important; -} - -.d-inline { - display: inline !important; -} - -.d-inline-block { - display: inline-block !important; -} - -.d-block { - display: block !important; -} - -.d-table { - display: table !important; -} - -.d-table-row { - display: table-row !important; -} - -.d-table-cell { - display: table-cell !important; -} - -.d-flex { - display: -webkit-box !important; - display: -ms-flexbox !important; - display: flex !important; -} - -.d-inline-flex { - display: 
-webkit-inline-box !important; - display: -ms-inline-flexbox !important; - display: inline-flex !important; -} - -@media (min-width: 576px) { - .d-sm-none { - display: none !important; - } - - .d-sm-inline { - display: inline !important; - } - - .d-sm-inline-block { - display: inline-block !important; - } - - .d-sm-block { - display: block !important; - } - - .d-sm-table { - display: table !important; - } - - .d-sm-table-row { - display: table-row !important; - } - - .d-sm-table-cell { - display: table-cell !important; - } - - .d-sm-flex { - display: -webkit-box !important; - display: -ms-flexbox !important; - display: flex !important; - } - - .d-sm-inline-flex { - display: -webkit-inline-box !important; - display: -ms-inline-flexbox !important; - display: inline-flex !important; - } -} -@media (min-width: 768px) { - .d-md-none { - display: none !important; - } - - .d-md-inline { - display: inline !important; - } - - .d-md-inline-block { - display: inline-block !important; - } - - .d-md-block { - display: block !important; - } - - .d-md-table { - display: table !important; - } - - .d-md-table-row { - display: table-row !important; - } - - .d-md-table-cell { - display: table-cell !important; - } - - .d-md-flex { - display: -webkit-box !important; - display: -ms-flexbox !important; - display: flex !important; - } - - .d-md-inline-flex { - display: -webkit-inline-box !important; - display: -ms-inline-flexbox !important; - display: inline-flex !important; - } -} -@media (min-width: 992px) { - .d-lg-none { - display: none !important; - } - - .d-lg-inline { - display: inline !important; - } - - .d-lg-inline-block { - display: inline-block !important; - } - - .d-lg-block { - display: block !important; - } - - .d-lg-table { - display: table !important; - } - - .d-lg-table-row { - display: table-row !important; - } - - .d-lg-table-cell { - display: table-cell !important; - } - - .d-lg-flex { - display: -webkit-box !important; - display: -ms-flexbox !important; - display: 
flex !important; - } - - .d-lg-inline-flex { - display: -webkit-inline-box !important; - display: -ms-inline-flexbox !important; - display: inline-flex !important; - } -} -@media (min-width: 1200px) { - .d-xl-none { - display: none !important; - } - - .d-xl-inline { - display: inline !important; - } - - .d-xl-inline-block { - display: inline-block !important; - } - - .d-xl-block { - display: block !important; - } - - .d-xl-table { - display: table !important; - } - - .d-xl-table-row { - display: table-row !important; - } - - .d-xl-table-cell { - display: table-cell !important; - } - - .d-xl-flex { - display: -webkit-box !important; - display: -ms-flexbox !important; - display: flex !important; - } - - .d-xl-inline-flex { - display: -webkit-inline-box !important; - display: -ms-inline-flexbox !important; - display: inline-flex !important; - } -} -@media print { - .d-print-none { - display: none !important; - } - - .d-print-inline { - display: inline !important; - } - - .d-print-inline-block { - display: inline-block !important; - } - - .d-print-block { - display: block !important; - } - - .d-print-table { - display: table !important; - } - - .d-print-table-row { - display: table-row !important; - } - - .d-print-table-cell { - display: table-cell !important; - } - - .d-print-flex { - display: -webkit-box !important; - display: -ms-flexbox !important; - display: flex !important; - } - - .d-print-inline-flex { - display: -webkit-inline-box !important; - display: -ms-inline-flexbox !important; - display: inline-flex !important; - } -} -.embed-responsive { - position: relative; - display: block; - width: 100%; - padding: 0; - overflow: hidden; -} -.embed-responsive::before { - display: block; - content: ""; -} -.embed-responsive .embed-responsive-item, -.embed-responsive iframe, -.embed-responsive embed, -.embed-responsive object, -.embed-responsive video { - position: absolute; - top: 0; - bottom: 0; - left: 0; - width: 100%; - height: 100%; - border: 0; -} - 
-.embed-responsive-21by9::before { - padding-top: 42.85714286%; -} - -.embed-responsive-16by9::before { - padding-top: 56.25%; -} - -.embed-responsive-4by3::before { - padding-top: 75%; -} - -.embed-responsive-1by1::before { - padding-top: 100%; -} - -.flex-row { - -webkit-box-orient: horizontal !important; - -webkit-box-direction: normal !important; - -ms-flex-direction: row !important; - flex-direction: row !important; -} - -.flex-column { - -webkit-box-orient: vertical !important; - -webkit-box-direction: normal !important; - -ms-flex-direction: column !important; - flex-direction: column !important; -} - -.flex-row-reverse { - -webkit-box-orient: horizontal !important; - -webkit-box-direction: reverse !important; - -ms-flex-direction: row-reverse !important; - flex-direction: row-reverse !important; -} - -.flex-column-reverse { - -webkit-box-orient: vertical !important; - -webkit-box-direction: reverse !important; - -ms-flex-direction: column-reverse !important; - flex-direction: column-reverse !important; -} - -.flex-wrap { - -ms-flex-wrap: wrap !important; - flex-wrap: wrap !important; -} - -.flex-nowrap { - -ms-flex-wrap: nowrap !important; - flex-wrap: nowrap !important; -} - -.flex-wrap-reverse { - -ms-flex-wrap: wrap-reverse !important; - flex-wrap: wrap-reverse !important; -} - -.flex-fill { - -webkit-box-flex: 1 !important; - -ms-flex: 1 1 auto !important; - flex: 1 1 auto !important; -} - -.flex-grow-0 { - -webkit-box-flex: 0 !important; - -ms-flex-positive: 0 !important; - flex-grow: 0 !important; -} - -.flex-grow-1 { - -webkit-box-flex: 1 !important; - -ms-flex-positive: 1 !important; - flex-grow: 1 !important; -} - -.flex-shrink-0 { - -ms-flex-negative: 0 !important; - flex-shrink: 0 !important; -} - -.flex-shrink-1 { - -ms-flex-negative: 1 !important; - flex-shrink: 1 !important; -} - -.justify-content-start { - -webkit-box-pack: start !important; - -ms-flex-pack: start !important; - justify-content: flex-start !important; -} - 
-.justify-content-end { - -webkit-box-pack: end !important; - -ms-flex-pack: end !important; - justify-content: flex-end !important; -} - -.justify-content-center { - -webkit-box-pack: center !important; - -ms-flex-pack: center !important; - justify-content: center !important; -} - -.justify-content-between { - -webkit-box-pack: justify !important; - -ms-flex-pack: justify !important; - justify-content: space-between !important; -} - -.justify-content-around { - -ms-flex-pack: distribute !important; - justify-content: space-around !important; -} - -.align-items-start { - -webkit-box-align: start !important; - -ms-flex-align: start !important; - align-items: flex-start !important; -} - -.align-items-end { - -webkit-box-align: end !important; - -ms-flex-align: end !important; - align-items: flex-end !important; -} - -.align-items-center { - -webkit-box-align: center !important; - -ms-flex-align: center !important; - align-items: center !important; -} - -.align-items-baseline { - -webkit-box-align: baseline !important; - -ms-flex-align: baseline !important; - align-items: baseline !important; -} - -.align-items-stretch { - -webkit-box-align: stretch !important; - -ms-flex-align: stretch !important; - align-items: stretch !important; -} - -.align-content-start { - -ms-flex-line-pack: start !important; - align-content: flex-start !important; -} - -.align-content-end { - -ms-flex-line-pack: end !important; - align-content: flex-end !important; -} - -.align-content-center { - -ms-flex-line-pack: center !important; - align-content: center !important; -} - -.align-content-between { - -ms-flex-line-pack: justify !important; - align-content: space-between !important; -} - -.align-content-around { - -ms-flex-line-pack: distribute !important; - align-content: space-around !important; -} - -.align-content-stretch { - -ms-flex-line-pack: stretch !important; - align-content: stretch !important; -} - -.align-self-auto { - -ms-flex-item-align: auto !important; - align-self: auto 
!important; -} - -.align-self-start { - -ms-flex-item-align: start !important; - align-self: flex-start !important; -} - -.align-self-end { - -ms-flex-item-align: end !important; - align-self: flex-end !important; -} - -.align-self-center { - -ms-flex-item-align: center !important; - align-self: center !important; -} - -.align-self-baseline { - -ms-flex-item-align: baseline !important; - align-self: baseline !important; -} - -.align-self-stretch { - -ms-flex-item-align: stretch !important; - align-self: stretch !important; -} - -@media (min-width: 576px) { - .flex-sm-row { - -webkit-box-orient: horizontal !important; - -webkit-box-direction: normal !important; - -ms-flex-direction: row !important; - flex-direction: row !important; - } - - .flex-sm-column { - -webkit-box-orient: vertical !important; - -webkit-box-direction: normal !important; - -ms-flex-direction: column !important; - flex-direction: column !important; - } - - .flex-sm-row-reverse { - -webkit-box-orient: horizontal !important; - -webkit-box-direction: reverse !important; - -ms-flex-direction: row-reverse !important; - flex-direction: row-reverse !important; - } - - .flex-sm-column-reverse { - -webkit-box-orient: vertical !important; - -webkit-box-direction: reverse !important; - -ms-flex-direction: column-reverse !important; - flex-direction: column-reverse !important; - } - - .flex-sm-wrap { - -ms-flex-wrap: wrap !important; - flex-wrap: wrap !important; - } - - .flex-sm-nowrap { - -ms-flex-wrap: nowrap !important; - flex-wrap: nowrap !important; - } - - .flex-sm-wrap-reverse { - -ms-flex-wrap: wrap-reverse !important; - flex-wrap: wrap-reverse !important; - } - - .flex-sm-fill { - -webkit-box-flex: 1 !important; - -ms-flex: 1 1 auto !important; - flex: 1 1 auto !important; - } - - .flex-sm-grow-0 { - -webkit-box-flex: 0 !important; - -ms-flex-positive: 0 !important; - flex-grow: 0 !important; - } - - .flex-sm-grow-1 { - -webkit-box-flex: 1 !important; - -ms-flex-positive: 1 !important; - 
flex-grow: 1 !important; - } - - .flex-sm-shrink-0 { - -ms-flex-negative: 0 !important; - flex-shrink: 0 !important; - } - - .flex-sm-shrink-1 { - -ms-flex-negative: 1 !important; - flex-shrink: 1 !important; - } - - .justify-content-sm-start { - -webkit-box-pack: start !important; - -ms-flex-pack: start !important; - justify-content: flex-start !important; - } - - .justify-content-sm-end { - -webkit-box-pack: end !important; - -ms-flex-pack: end !important; - justify-content: flex-end !important; - } - - .justify-content-sm-center { - -webkit-box-pack: center !important; - -ms-flex-pack: center !important; - justify-content: center !important; - } - - .justify-content-sm-between { - -webkit-box-pack: justify !important; - -ms-flex-pack: justify !important; - justify-content: space-between !important; - } - - .justify-content-sm-around { - -ms-flex-pack: distribute !important; - justify-content: space-around !important; - } - - .align-items-sm-start { - -webkit-box-align: start !important; - -ms-flex-align: start !important; - align-items: flex-start !important; - } - - .align-items-sm-end { - -webkit-box-align: end !important; - -ms-flex-align: end !important; - align-items: flex-end !important; - } - - .align-items-sm-center { - -webkit-box-align: center !important; - -ms-flex-align: center !important; - align-items: center !important; - } - - .align-items-sm-baseline { - -webkit-box-align: baseline !important; - -ms-flex-align: baseline !important; - align-items: baseline !important; - } - - .align-items-sm-stretch { - -webkit-box-align: stretch !important; - -ms-flex-align: stretch !important; - align-items: stretch !important; - } - - .align-content-sm-start { - -ms-flex-line-pack: start !important; - align-content: flex-start !important; - } - - .align-content-sm-end { - -ms-flex-line-pack: end !important; - align-content: flex-end !important; - } - - .align-content-sm-center { - -ms-flex-line-pack: center !important; - align-content: center !important; - } - 
- .align-content-sm-between { - -ms-flex-line-pack: justify !important; - align-content: space-between !important; - } - - .align-content-sm-around { - -ms-flex-line-pack: distribute !important; - align-content: space-around !important; - } - - .align-content-sm-stretch { - -ms-flex-line-pack: stretch !important; - align-content: stretch !important; - } - - .align-self-sm-auto { - -ms-flex-item-align: auto !important; - align-self: auto !important; - } - - .align-self-sm-start { - -ms-flex-item-align: start !important; - align-self: flex-start !important; - } - - .align-self-sm-end { - -ms-flex-item-align: end !important; - align-self: flex-end !important; - } - - .align-self-sm-center { - -ms-flex-item-align: center !important; - align-self: center !important; - } - - .align-self-sm-baseline { - -ms-flex-item-align: baseline !important; - align-self: baseline !important; - } - - .align-self-sm-stretch { - -ms-flex-item-align: stretch !important; - align-self: stretch !important; - } -} -@media (min-width: 768px) { - .flex-md-row { - -webkit-box-orient: horizontal !important; - -webkit-box-direction: normal !important; - -ms-flex-direction: row !important; - flex-direction: row !important; - } - - .flex-md-column { - -webkit-box-orient: vertical !important; - -webkit-box-direction: normal !important; - -ms-flex-direction: column !important; - flex-direction: column !important; - } - - .flex-md-row-reverse { - -webkit-box-orient: horizontal !important; - -webkit-box-direction: reverse !important; - -ms-flex-direction: row-reverse !important; - flex-direction: row-reverse !important; - } - - .flex-md-column-reverse { - -webkit-box-orient: vertical !important; - -webkit-box-direction: reverse !important; - -ms-flex-direction: column-reverse !important; - flex-direction: column-reverse !important; - } - - .flex-md-wrap { - -ms-flex-wrap: wrap !important; - flex-wrap: wrap !important; - } - - .flex-md-nowrap { - -ms-flex-wrap: nowrap !important; - flex-wrap: nowrap 
!important; - } - - .flex-md-wrap-reverse { - -ms-flex-wrap: wrap-reverse !important; - flex-wrap: wrap-reverse !important; - } - - .flex-md-fill { - -webkit-box-flex: 1 !important; - -ms-flex: 1 1 auto !important; - flex: 1 1 auto !important; - } - - .flex-md-grow-0 { - -webkit-box-flex: 0 !important; - -ms-flex-positive: 0 !important; - flex-grow: 0 !important; - } - - .flex-md-grow-1 { - -webkit-box-flex: 1 !important; - -ms-flex-positive: 1 !important; - flex-grow: 1 !important; - } - - .flex-md-shrink-0 { - -ms-flex-negative: 0 !important; - flex-shrink: 0 !important; - } - - .flex-md-shrink-1 { - -ms-flex-negative: 1 !important; - flex-shrink: 1 !important; - } - - .justify-content-md-start { - -webkit-box-pack: start !important; - -ms-flex-pack: start !important; - justify-content: flex-start !important; - } - - .justify-content-md-end { - -webkit-box-pack: end !important; - -ms-flex-pack: end !important; - justify-content: flex-end !important; - } - - .justify-content-md-center { - -webkit-box-pack: center !important; - -ms-flex-pack: center !important; - justify-content: center !important; - } - - .justify-content-md-between { - -webkit-box-pack: justify !important; - -ms-flex-pack: justify !important; - justify-content: space-between !important; - } - - .justify-content-md-around { - -ms-flex-pack: distribute !important; - justify-content: space-around !important; - } - - .align-items-md-start { - -webkit-box-align: start !important; - -ms-flex-align: start !important; - align-items: flex-start !important; - } - - .align-items-md-end { - -webkit-box-align: end !important; - -ms-flex-align: end !important; - align-items: flex-end !important; - } - - .align-items-md-center { - -webkit-box-align: center !important; - -ms-flex-align: center !important; - align-items: center !important; - } - - .align-items-md-baseline { - -webkit-box-align: baseline !important; - -ms-flex-align: baseline !important; - align-items: baseline !important; - } - - 
.align-items-md-stretch { - -webkit-box-align: stretch !important; - -ms-flex-align: stretch !important; - align-items: stretch !important; - } - - .align-content-md-start { - -ms-flex-line-pack: start !important; - align-content: flex-start !important; - } - - .align-content-md-end { - -ms-flex-line-pack: end !important; - align-content: flex-end !important; - } - - .align-content-md-center { - -ms-flex-line-pack: center !important; - align-content: center !important; - } - - .align-content-md-between { - -ms-flex-line-pack: justify !important; - align-content: space-between !important; - } - - .align-content-md-around { - -ms-flex-line-pack: distribute !important; - align-content: space-around !important; - } - - .align-content-md-stretch { - -ms-flex-line-pack: stretch !important; - align-content: stretch !important; - } - - .align-self-md-auto { - -ms-flex-item-align: auto !important; - align-self: auto !important; - } - - .align-self-md-start { - -ms-flex-item-align: start !important; - align-self: flex-start !important; - } - - .align-self-md-end { - -ms-flex-item-align: end !important; - align-self: flex-end !important; - } - - .align-self-md-center { - -ms-flex-item-align: center !important; - align-self: center !important; - } - - .align-self-md-baseline { - -ms-flex-item-align: baseline !important; - align-self: baseline !important; - } - - .align-self-md-stretch { - -ms-flex-item-align: stretch !important; - align-self: stretch !important; - } -} -@media (min-width: 992px) { - .flex-lg-row { - -webkit-box-orient: horizontal !important; - -webkit-box-direction: normal !important; - -ms-flex-direction: row !important; - flex-direction: row !important; - } - - .flex-lg-column { - -webkit-box-orient: vertical !important; - -webkit-box-direction: normal !important; - -ms-flex-direction: column !important; - flex-direction: column !important; - } - - .flex-lg-row-reverse { - -webkit-box-orient: horizontal !important; - -webkit-box-direction: reverse 
!important; - -ms-flex-direction: row-reverse !important; - flex-direction: row-reverse !important; - } - - .flex-lg-column-reverse { - -webkit-box-orient: vertical !important; - -webkit-box-direction: reverse !important; - -ms-flex-direction: column-reverse !important; - flex-direction: column-reverse !important; - } - - .flex-lg-wrap { - -ms-flex-wrap: wrap !important; - flex-wrap: wrap !important; - } - - .flex-lg-nowrap { - -ms-flex-wrap: nowrap !important; - flex-wrap: nowrap !important; - } - - .flex-lg-wrap-reverse { - -ms-flex-wrap: wrap-reverse !important; - flex-wrap: wrap-reverse !important; - } - - .flex-lg-fill { - -webkit-box-flex: 1 !important; - -ms-flex: 1 1 auto !important; - flex: 1 1 auto !important; - } - - .flex-lg-grow-0 { - -webkit-box-flex: 0 !important; - -ms-flex-positive: 0 !important; - flex-grow: 0 !important; - } - - .flex-lg-grow-1 { - -webkit-box-flex: 1 !important; - -ms-flex-positive: 1 !important; - flex-grow: 1 !important; - } - - .flex-lg-shrink-0 { - -ms-flex-negative: 0 !important; - flex-shrink: 0 !important; - } - - .flex-lg-shrink-1 { - -ms-flex-negative: 1 !important; - flex-shrink: 1 !important; - } - - .justify-content-lg-start { - -webkit-box-pack: start !important; - -ms-flex-pack: start !important; - justify-content: flex-start !important; - } - - .justify-content-lg-end { - -webkit-box-pack: end !important; - -ms-flex-pack: end !important; - justify-content: flex-end !important; - } - - .justify-content-lg-center { - -webkit-box-pack: center !important; - -ms-flex-pack: center !important; - justify-content: center !important; - } - - .justify-content-lg-between { - -webkit-box-pack: justify !important; - -ms-flex-pack: justify !important; - justify-content: space-between !important; - } - - .justify-content-lg-around { - -ms-flex-pack: distribute !important; - justify-content: space-around !important; - } - - .align-items-lg-start { - -webkit-box-align: start !important; - -ms-flex-align: start !important; - 
align-items: flex-start !important; - } - - .align-items-lg-end { - -webkit-box-align: end !important; - -ms-flex-align: end !important; - align-items: flex-end !important; - } - - .align-items-lg-center { - -webkit-box-align: center !important; - -ms-flex-align: center !important; - align-items: center !important; - } - - .align-items-lg-baseline { - -webkit-box-align: baseline !important; - -ms-flex-align: baseline !important; - align-items: baseline !important; - } - - .align-items-lg-stretch { - -webkit-box-align: stretch !important; - -ms-flex-align: stretch !important; - align-items: stretch !important; - } - - .align-content-lg-start { - -ms-flex-line-pack: start !important; - align-content: flex-start !important; - } - - .align-content-lg-end { - -ms-flex-line-pack: end !important; - align-content: flex-end !important; - } - - .align-content-lg-center { - -ms-flex-line-pack: center !important; - align-content: center !important; - } - - .align-content-lg-between { - -ms-flex-line-pack: justify !important; - align-content: space-between !important; - } - - .align-content-lg-around { - -ms-flex-line-pack: distribute !important; - align-content: space-around !important; - } - - .align-content-lg-stretch { - -ms-flex-line-pack: stretch !important; - align-content: stretch !important; - } - - .align-self-lg-auto { - -ms-flex-item-align: auto !important; - align-self: auto !important; - } - - .align-self-lg-start { - -ms-flex-item-align: start !important; - align-self: flex-start !important; - } - - .align-self-lg-end { - -ms-flex-item-align: end !important; - align-self: flex-end !important; - } - - .align-self-lg-center { - -ms-flex-item-align: center !important; - align-self: center !important; - } - - .align-self-lg-baseline { - -ms-flex-item-align: baseline !important; - align-self: baseline !important; - } - - .align-self-lg-stretch { - -ms-flex-item-align: stretch !important; - align-self: stretch !important; - } -} -@media (min-width: 1200px) { - 
.flex-xl-row { - -webkit-box-orient: horizontal !important; - -webkit-box-direction: normal !important; - -ms-flex-direction: row !important; - flex-direction: row !important; - } - - .flex-xl-column { - -webkit-box-orient: vertical !important; - -webkit-box-direction: normal !important; - -ms-flex-direction: column !important; - flex-direction: column !important; - } - - .flex-xl-row-reverse { - -webkit-box-orient: horizontal !important; - -webkit-box-direction: reverse !important; - -ms-flex-direction: row-reverse !important; - flex-direction: row-reverse !important; - } - - .flex-xl-column-reverse { - -webkit-box-orient: vertical !important; - -webkit-box-direction: reverse !important; - -ms-flex-direction: column-reverse !important; - flex-direction: column-reverse !important; - } - - .flex-xl-wrap { - -ms-flex-wrap: wrap !important; - flex-wrap: wrap !important; - } - - .flex-xl-nowrap { - -ms-flex-wrap: nowrap !important; - flex-wrap: nowrap !important; - } - - .flex-xl-wrap-reverse { - -ms-flex-wrap: wrap-reverse !important; - flex-wrap: wrap-reverse !important; - } - - .flex-xl-fill { - -webkit-box-flex: 1 !important; - -ms-flex: 1 1 auto !important; - flex: 1 1 auto !important; - } - - .flex-xl-grow-0 { - -webkit-box-flex: 0 !important; - -ms-flex-positive: 0 !important; - flex-grow: 0 !important; - } - - .flex-xl-grow-1 { - -webkit-box-flex: 1 !important; - -ms-flex-positive: 1 !important; - flex-grow: 1 !important; - } - - .flex-xl-shrink-0 { - -ms-flex-negative: 0 !important; - flex-shrink: 0 !important; - } - - .flex-xl-shrink-1 { - -ms-flex-negative: 1 !important; - flex-shrink: 1 !important; - } - - .justify-content-xl-start { - -webkit-box-pack: start !important; - -ms-flex-pack: start !important; - justify-content: flex-start !important; - } - - .justify-content-xl-end { - -webkit-box-pack: end !important; - -ms-flex-pack: end !important; - justify-content: flex-end !important; - } - - .justify-content-xl-center { - -webkit-box-pack: center 
!important; - -ms-flex-pack: center !important; - justify-content: center !important; - } - - .justify-content-xl-between { - -webkit-box-pack: justify !important; - -ms-flex-pack: justify !important; - justify-content: space-between !important; - } - - .justify-content-xl-around { - -ms-flex-pack: distribute !important; - justify-content: space-around !important; - } - - .align-items-xl-start { - -webkit-box-align: start !important; - -ms-flex-align: start !important; - align-items: flex-start !important; - } - - .align-items-xl-end { - -webkit-box-align: end !important; - -ms-flex-align: end !important; - align-items: flex-end !important; - } - - .align-items-xl-center { - -webkit-box-align: center !important; - -ms-flex-align: center !important; - align-items: center !important; - } - - .align-items-xl-baseline { - -webkit-box-align: baseline !important; - -ms-flex-align: baseline !important; - align-items: baseline !important; - } - - .align-items-xl-stretch { - -webkit-box-align: stretch !important; - -ms-flex-align: stretch !important; - align-items: stretch !important; - } - - .align-content-xl-start { - -ms-flex-line-pack: start !important; - align-content: flex-start !important; - } - - .align-content-xl-end { - -ms-flex-line-pack: end !important; - align-content: flex-end !important; - } - - .align-content-xl-center { - -ms-flex-line-pack: center !important; - align-content: center !important; - } - - .align-content-xl-between { - -ms-flex-line-pack: justify !important; - align-content: space-between !important; - } - - .align-content-xl-around { - -ms-flex-line-pack: distribute !important; - align-content: space-around !important; - } - - .align-content-xl-stretch { - -ms-flex-line-pack: stretch !important; - align-content: stretch !important; - } - - .align-self-xl-auto { - -ms-flex-item-align: auto !important; - align-self: auto !important; - } - - .align-self-xl-start { - -ms-flex-item-align: start !important; - align-self: flex-start !important; - } 
- - .align-self-xl-end { - -ms-flex-item-align: end !important; - align-self: flex-end !important; - } - - .align-self-xl-center { - -ms-flex-item-align: center !important; - align-self: center !important; - } - - .align-self-xl-baseline { - -ms-flex-item-align: baseline !important; - align-self: baseline !important; - } - - .align-self-xl-stretch { - -ms-flex-item-align: stretch !important; - align-self: stretch !important; - } -} -.float-left { - float: left !important; -} - -.float-right { - float: right !important; -} - -.float-none { - float: none !important; -} - -@media (min-width: 576px) { - .float-sm-left { - float: left !important; - } - - .float-sm-right { - float: right !important; - } - - .float-sm-none { - float: none !important; - } -} -@media (min-width: 768px) { - .float-md-left { - float: left !important; - } - - .float-md-right { - float: right !important; - } - - .float-md-none { - float: none !important; - } -} -@media (min-width: 992px) { - .float-lg-left { - float: left !important; - } - - .float-lg-right { - float: right !important; - } - - .float-lg-none { - float: none !important; - } -} -@media (min-width: 1200px) { - .float-xl-left { - float: left !important; - } - - .float-xl-right { - float: right !important; - } - - .float-xl-none { - float: none !important; - } -} -.user-select-all { - -webkit-user-select: all !important; - -moz-user-select: all !important; - -ms-user-select: all !important; - user-select: all !important; -} - -.user-select-auto { - -webkit-user-select: auto !important; - -moz-user-select: auto !important; - -ms-user-select: auto !important; - user-select: auto !important; -} - -.user-select-none { - -webkit-user-select: none !important; - -moz-user-select: none !important; - -ms-user-select: none !important; - user-select: none !important; -} - -.overflow-auto { - overflow: auto !important; -} - -.overflow-hidden { - overflow: hidden !important; -} - -.position-static { - position: static !important; -} - 
-.position-relative { - position: relative !important; -} - -.position-absolute { - position: absolute !important; -} - -.position-fixed { - position: fixed !important; -} - -.position-sticky { - position: sticky !important; -} - -.fixed-top { - position: fixed; - top: 0; - right: 0; - left: 0; - z-index: 1030; -} - -.fixed-bottom { - position: fixed; - right: 0; - bottom: 0; - left: 0; - z-index: 1030; -} - -@supports (position: sticky) { - .sticky-top { - position: sticky; - top: 0; - z-index: 1020; - } -} - -.sr-only { - position: absolute; - width: 1px; - height: 1px; - padding: 0; - margin: -1px; - overflow: hidden; - clip: rect(0, 0, 0, 0); - white-space: nowrap; - border: 0; -} - -.sr-only-focusable:active, .sr-only-focusable:focus { - position: static; - width: auto; - height: auto; - overflow: visible; - clip: auto; - white-space: normal; -} - -.shadow-sm { - -webkit-box-shadow: 0 0.125rem 0.25rem rgba(0, 0, 0, 0.075) !important; - box-shadow: 0 0.125rem 0.25rem rgba(0, 0, 0, 0.075) !important; -} - -.shadow { - -webkit-box-shadow: 0 0.5rem 1rem rgba(0, 0, 0, 0.15) !important; - box-shadow: 0 0.5rem 1rem rgba(0, 0, 0, 0.15) !important; -} - -.shadow-lg { - -webkit-box-shadow: 0 1rem 3rem rgba(0, 0, 0, 0.175) !important; - box-shadow: 0 1rem 3rem rgba(0, 0, 0, 0.175) !important; -} - -.shadow-none { - -webkit-box-shadow: none !important; - box-shadow: none !important; -} - -.w-25 { - width: 25% !important; -} - -.w-50 { - width: 50% !important; -} - -.w-75 { - width: 75% !important; -} - -.w-100 { - width: 100% !important; -} - -.w-auto { - width: auto !important; -} - -.h-25 { - height: 25% !important; -} - -.h-50 { - height: 50% !important; -} - -.h-75 { - height: 75% !important; -} - -.h-100 { - height: 100% !important; -} - -.h-auto { - height: auto !important; -} - -.mw-100 { - max-width: 100% !important; -} - -.mh-100 { - max-height: 100% !important; -} - -.min-vw-100 { - min-width: 100vw !important; -} - -.min-vh-100 { - min-height: 100vh !important; 
-} - -.vw-100 { - width: 100vw !important; -} - -.vh-100 { - height: 100vh !important; -} - -.m-0 { - margin: 0 !important; -} - -.mt-0, -.my-0 { - margin-top: 0 !important; -} - -.mr-0, -.mx-0 { - margin-right: 0 !important; -} - -.mb-0, -.my-0 { - margin-bottom: 0 !important; -} - -.ml-0, -.mx-0 { - margin-left: 0 !important; -} - -.m-1 { - margin: 0.25rem !important; -} - -.mt-1, -.my-1 { - margin-top: 0.25rem !important; -} - -.mr-1, -.mx-1 { - margin-right: 0.25rem !important; -} - -.mb-1, -.my-1 { - margin-bottom: 0.25rem !important; -} - -.ml-1, -.mx-1 { - margin-left: 0.25rem !important; -} - -.m-2 { - margin: 0.5rem !important; -} - -.mt-2, -.my-2 { - margin-top: 0.5rem !important; -} - -.mr-2, -.mx-2 { - margin-right: 0.5rem !important; -} - -.mb-2, -.my-2 { - margin-bottom: 0.5rem !important; -} - -.ml-2, -.mx-2 { - margin-left: 0.5rem !important; -} - -.m-3 { - margin: 1rem !important; -} - -.mt-3, -.my-3 { - margin-top: 1rem !important; -} - -.mr-3, -.mx-3 { - margin-right: 1rem !important; -} - -.mb-3, -.my-3 { - margin-bottom: 1rem !important; -} - -.ml-3, -.mx-3 { - margin-left: 1rem !important; -} - -.m-4 { - margin: 1.5rem !important; -} - -.mt-4, -.my-4 { - margin-top: 1.5rem !important; -} - -.mr-4, -.mx-4 { - margin-right: 1.5rem !important; -} - -.mb-4, -.my-4 { - margin-bottom: 1.5rem !important; -} - -.ml-4, -.mx-4 { - margin-left: 1.5rem !important; -} - -.m-5 { - margin: 3rem !important; -} - -.mt-5, -.my-5 { - margin-top: 3rem !important; -} - -.mr-5, -.mx-5 { - margin-right: 3rem !important; -} - -.mb-5, -.my-5 { - margin-bottom: 3rem !important; -} - -.ml-5, -.mx-5 { - margin-left: 3rem !important; -} - -.p-0 { - padding: 0 !important; -} - -.pt-0, -.py-0 { - padding-top: 0 !important; -} - -.pr-0, -.px-0 { - padding-right: 0 !important; -} - -.pb-0, -.py-0 { - padding-bottom: 0 !important; -} - -.pl-0, -.px-0 { - padding-left: 0 !important; -} - -.p-1 { - padding: 0.25rem !important; -} - -.pt-1, -.py-1 { - padding-top: 0.25rem 
!important; -} - -.pr-1, -.px-1 { - padding-right: 0.25rem !important; -} - -.pb-1, -.py-1 { - padding-bottom: 0.25rem !important; -} - -.pl-1, -.px-1 { - padding-left: 0.25rem !important; -} - -.p-2 { - padding: 0.5rem !important; -} - -.pt-2, -.py-2 { - padding-top: 0.5rem !important; -} - -.pr-2, -.px-2 { - padding-right: 0.5rem !important; -} - -.pb-2, -.py-2 { - padding-bottom: 0.5rem !important; -} - -.pl-2, -.px-2 { - padding-left: 0.5rem !important; -} - -.p-3 { - padding: 1rem !important; -} - -.pt-3, -.py-3 { - padding-top: 1rem !important; -} - -.pr-3, -.px-3 { - padding-right: 1rem !important; -} - -.pb-3, -.py-3 { - padding-bottom: 1rem !important; -} - -.pl-3, -.px-3 { - padding-left: 1rem !important; -} - -.p-4 { - padding: 1.5rem !important; -} - -.pt-4, -.py-4 { - padding-top: 1.5rem !important; -} - -.pr-4, -.px-4 { - padding-right: 1.5rem !important; -} - -.pb-4, -.py-4 { - padding-bottom: 1.5rem !important; -} - -.pl-4, -.px-4 { - padding-left: 1.5rem !important; -} - -.p-5 { - padding: 3rem !important; -} - -.pt-5, -.py-5 { - padding-top: 3rem !important; -} - -.pr-5, -.px-5 { - padding-right: 3rem !important; -} - -.pb-5, -.py-5 { - padding-bottom: 3rem !important; -} - -.pl-5, -.px-5 { - padding-left: 3rem !important; -} - -.m-n1 { - margin: -0.25rem !important; -} - -.mt-n1, -.my-n1 { - margin-top: -0.25rem !important; -} - -.mr-n1, -.mx-n1 { - margin-right: -0.25rem !important; -} - -.mb-n1, -.my-n1 { - margin-bottom: -0.25rem !important; -} - -.ml-n1, -.mx-n1 { - margin-left: -0.25rem !important; -} - -.m-n2 { - margin: -0.5rem !important; -} - -.mt-n2, -.my-n2 { - margin-top: -0.5rem !important; -} - -.mr-n2, -.mx-n2 { - margin-right: -0.5rem !important; -} - -.mb-n2, -.my-n2 { - margin-bottom: -0.5rem !important; -} - -.ml-n2, -.mx-n2 { - margin-left: -0.5rem !important; -} - -.m-n3 { - margin: -1rem !important; -} - -.mt-n3, -.my-n3 { - margin-top: -1rem !important; -} - -.mr-n3, -.mx-n3 { - margin-right: -1rem !important; -} - -.mb-n3, 
-.my-n3 { - margin-bottom: -1rem !important; -} - -.ml-n3, -.mx-n3 { - margin-left: -1rem !important; -} - -.m-n4 { - margin: -1.5rem !important; -} - -.mt-n4, -.my-n4 { - margin-top: -1.5rem !important; -} - -.mr-n4, -.mx-n4 { - margin-right: -1.5rem !important; -} - -.mb-n4, -.my-n4 { - margin-bottom: -1.5rem !important; -} - -.ml-n4, -.mx-n4 { - margin-left: -1.5rem !important; -} - -.m-n5 { - margin: -3rem !important; -} - -.mt-n5, -.my-n5 { - margin-top: -3rem !important; -} - -.mr-n5, -.mx-n5 { - margin-right: -3rem !important; -} - -.mb-n5, -.my-n5 { - margin-bottom: -3rem !important; -} - -.ml-n5, -.mx-n5 { - margin-left: -3rem !important; -} - -.m-auto { - margin: auto !important; -} - -.mt-auto, -.my-auto { - margin-top: auto !important; -} - -.mr-auto, -.mx-auto { - margin-right: auto !important; -} - -.mb-auto, -.my-auto { - margin-bottom: auto !important; -} - -.ml-auto, -.mx-auto { - margin-left: auto !important; -} - -@media (min-width: 576px) { - .m-sm-0 { - margin: 0 !important; - } - - .mt-sm-0, - .my-sm-0 { - margin-top: 0 !important; - } - - .mr-sm-0, - .mx-sm-0 { - margin-right: 0 !important; - } - - .mb-sm-0, - .my-sm-0 { - margin-bottom: 0 !important; - } - - .ml-sm-0, - .mx-sm-0 { - margin-left: 0 !important; - } - - .m-sm-1 { - margin: 0.25rem !important; - } - - .mt-sm-1, - .my-sm-1 { - margin-top: 0.25rem !important; - } - - .mr-sm-1, - .mx-sm-1 { - margin-right: 0.25rem !important; - } - - .mb-sm-1, - .my-sm-1 { - margin-bottom: 0.25rem !important; - } - - .ml-sm-1, - .mx-sm-1 { - margin-left: 0.25rem !important; - } - - .m-sm-2 { - margin: 0.5rem !important; - } - - .mt-sm-2, - .my-sm-2 { - margin-top: 0.5rem !important; - } - - .mr-sm-2, - .mx-sm-2 { - margin-right: 0.5rem !important; - } - - .mb-sm-2, - .my-sm-2 { - margin-bottom: 0.5rem !important; - } - - .ml-sm-2, - .mx-sm-2 { - margin-left: 0.5rem !important; - } - - .m-sm-3 { - margin: 1rem !important; - } - - .mt-sm-3, - .my-sm-3 { - margin-top: 1rem !important; - } - - 
.mr-sm-3, - .mx-sm-3 { - margin-right: 1rem !important; - } - - .mb-sm-3, - .my-sm-3 { - margin-bottom: 1rem !important; - } - - .ml-sm-3, - .mx-sm-3 { - margin-left: 1rem !important; - } - - .m-sm-4 { - margin: 1.5rem !important; - } - - .mt-sm-4, - .my-sm-4 { - margin-top: 1.5rem !important; - } - - .mr-sm-4, - .mx-sm-4 { - margin-right: 1.5rem !important; - } - - .mb-sm-4, - .my-sm-4 { - margin-bottom: 1.5rem !important; - } - - .ml-sm-4, - .mx-sm-4 { - margin-left: 1.5rem !important; - } - - .m-sm-5 { - margin: 3rem !important; - } - - .mt-sm-5, - .my-sm-5 { - margin-top: 3rem !important; - } - - .mr-sm-5, - .mx-sm-5 { - margin-right: 3rem !important; - } - - .mb-sm-5, - .my-sm-5 { - margin-bottom: 3rem !important; - } - - .ml-sm-5, - .mx-sm-5 { - margin-left: 3rem !important; - } - - .p-sm-0 { - padding: 0 !important; - } - - .pt-sm-0, - .py-sm-0 { - padding-top: 0 !important; - } - - .pr-sm-0, - .px-sm-0 { - padding-right: 0 !important; - } - - .pb-sm-0, - .py-sm-0 { - padding-bottom: 0 !important; - } - - .pl-sm-0, - .px-sm-0 { - padding-left: 0 !important; - } - - .p-sm-1 { - padding: 0.25rem !important; - } - - .pt-sm-1, - .py-sm-1 { - padding-top: 0.25rem !important; - } - - .pr-sm-1, - .px-sm-1 { - padding-right: 0.25rem !important; - } - - .pb-sm-1, - .py-sm-1 { - padding-bottom: 0.25rem !important; - } - - .pl-sm-1, - .px-sm-1 { - padding-left: 0.25rem !important; - } - - .p-sm-2 { - padding: 0.5rem !important; - } - - .pt-sm-2, - .py-sm-2 { - padding-top: 0.5rem !important; - } - - .pr-sm-2, - .px-sm-2 { - padding-right: 0.5rem !important; - } - - .pb-sm-2, - .py-sm-2 { - padding-bottom: 0.5rem !important; - } - - .pl-sm-2, - .px-sm-2 { - padding-left: 0.5rem !important; - } - - .p-sm-3 { - padding: 1rem !important; - } - - .pt-sm-3, - .py-sm-3 { - padding-top: 1rem !important; - } - - .pr-sm-3, - .px-sm-3 { - padding-right: 1rem !important; - } - - .pb-sm-3, - .py-sm-3 { - padding-bottom: 1rem !important; - } - - .pl-sm-3, - .px-sm-3 { - 
padding-left: 1rem !important; - } - - .p-sm-4 { - padding: 1.5rem !important; - } - - .pt-sm-4, - .py-sm-4 { - padding-top: 1.5rem !important; - } - - .pr-sm-4, - .px-sm-4 { - padding-right: 1.5rem !important; - } - - .pb-sm-4, - .py-sm-4 { - padding-bottom: 1.5rem !important; - } - - .pl-sm-4, - .px-sm-4 { - padding-left: 1.5rem !important; - } - - .p-sm-5 { - padding: 3rem !important; - } - - .pt-sm-5, - .py-sm-5 { - padding-top: 3rem !important; - } - - .pr-sm-5, - .px-sm-5 { - padding-right: 3rem !important; - } - - .pb-sm-5, - .py-sm-5 { - padding-bottom: 3rem !important; - } - - .pl-sm-5, - .px-sm-5 { - padding-left: 3rem !important; - } - - .m-sm-n1 { - margin: -0.25rem !important; - } - - .mt-sm-n1, - .my-sm-n1 { - margin-top: -0.25rem !important; - } - - .mr-sm-n1, - .mx-sm-n1 { - margin-right: -0.25rem !important; - } - - .mb-sm-n1, - .my-sm-n1 { - margin-bottom: -0.25rem !important; - } - - .ml-sm-n1, - .mx-sm-n1 { - margin-left: -0.25rem !important; - } - - .m-sm-n2 { - margin: -0.5rem !important; - } - - .mt-sm-n2, - .my-sm-n2 { - margin-top: -0.5rem !important; - } - - .mr-sm-n2, - .mx-sm-n2 { - margin-right: -0.5rem !important; - } - - .mb-sm-n2, - .my-sm-n2 { - margin-bottom: -0.5rem !important; - } - - .ml-sm-n2, - .mx-sm-n2 { - margin-left: -0.5rem !important; - } - - .m-sm-n3 { - margin: -1rem !important; - } - - .mt-sm-n3, - .my-sm-n3 { - margin-top: -1rem !important; - } - - .mr-sm-n3, - .mx-sm-n3 { - margin-right: -1rem !important; - } - - .mb-sm-n3, - .my-sm-n3 { - margin-bottom: -1rem !important; - } - - .ml-sm-n3, - .mx-sm-n3 { - margin-left: -1rem !important; - } - - .m-sm-n4 { - margin: -1.5rem !important; - } - - .mt-sm-n4, - .my-sm-n4 { - margin-top: -1.5rem !important; - } - - .mr-sm-n4, - .mx-sm-n4 { - margin-right: -1.5rem !important; - } - - .mb-sm-n4, - .my-sm-n4 { - margin-bottom: -1.5rem !important; - } - - .ml-sm-n4, - .mx-sm-n4 { - margin-left: -1.5rem !important; - } - - .m-sm-n5 { - margin: -3rem !important; - } - - 
.mt-sm-n5, - .my-sm-n5 { - margin-top: -3rem !important; - } - - .mr-sm-n5, - .mx-sm-n5 { - margin-right: -3rem !important; - } - - .mb-sm-n5, - .my-sm-n5 { - margin-bottom: -3rem !important; - } - - .ml-sm-n5, - .mx-sm-n5 { - margin-left: -3rem !important; - } - - .m-sm-auto { - margin: auto !important; - } - - .mt-sm-auto, - .my-sm-auto { - margin-top: auto !important; - } - - .mr-sm-auto, - .mx-sm-auto { - margin-right: auto !important; - } - - .mb-sm-auto, - .my-sm-auto { - margin-bottom: auto !important; - } - - .ml-sm-auto, - .mx-sm-auto { - margin-left: auto !important; - } -} -@media (min-width: 768px) { - .m-md-0 { - margin: 0 !important; - } - - .mt-md-0, - .my-md-0 { - margin-top: 0 !important; - } - - .mr-md-0, - .mx-md-0 { - margin-right: 0 !important; - } - - .mb-md-0, - .my-md-0 { - margin-bottom: 0 !important; - } - - .ml-md-0, - .mx-md-0 { - margin-left: 0 !important; - } - - .m-md-1 { - margin: 0.25rem !important; - } - - .mt-md-1, - .my-md-1 { - margin-top: 0.25rem !important; - } - - .mr-md-1, - .mx-md-1 { - margin-right: 0.25rem !important; - } - - .mb-md-1, - .my-md-1 { - margin-bottom: 0.25rem !important; - } - - .ml-md-1, - .mx-md-1 { - margin-left: 0.25rem !important; - } - - .m-md-2 { - margin: 0.5rem !important; - } - - .mt-md-2, - .my-md-2 { - margin-top: 0.5rem !important; - } - - .mr-md-2, - .mx-md-2 { - margin-right: 0.5rem !important; - } - - .mb-md-2, - .my-md-2 { - margin-bottom: 0.5rem !important; - } - - .ml-md-2, - .mx-md-2 { - margin-left: 0.5rem !important; - } - - .m-md-3 { - margin: 1rem !important; - } - - .mt-md-3, - .my-md-3 { - margin-top: 1rem !important; - } - - .mr-md-3, - .mx-md-3 { - margin-right: 1rem !important; - } - - .mb-md-3, - .my-md-3 { - margin-bottom: 1rem !important; - } - - .ml-md-3, - .mx-md-3 { - margin-left: 1rem !important; - } - - .m-md-4 { - margin: 1.5rem !important; - } - - .mt-md-4, - .my-md-4 { - margin-top: 1.5rem !important; - } - - .mr-md-4, - .mx-md-4 { - margin-right: 1.5rem !important; - 
} - - .mb-md-4, - .my-md-4 { - margin-bottom: 1.5rem !important; - } - - .ml-md-4, - .mx-md-4 { - margin-left: 1.5rem !important; - } - - .m-md-5 { - margin: 3rem !important; - } - - .mt-md-5, - .my-md-5 { - margin-top: 3rem !important; - } - - .mr-md-5, - .mx-md-5 { - margin-right: 3rem !important; - } - - .mb-md-5, - .my-md-5 { - margin-bottom: 3rem !important; - } - - .ml-md-5, - .mx-md-5 { - margin-left: 3rem !important; - } - - .p-md-0 { - padding: 0 !important; - } - - .pt-md-0, - .py-md-0 { - padding-top: 0 !important; - } - - .pr-md-0, - .px-md-0 { - padding-right: 0 !important; - } - - .pb-md-0, - .py-md-0 { - padding-bottom: 0 !important; - } - - .pl-md-0, - .px-md-0 { - padding-left: 0 !important; - } - - .p-md-1 { - padding: 0.25rem !important; - } - - .pt-md-1, - .py-md-1 { - padding-top: 0.25rem !important; - } - - .pr-md-1, - .px-md-1 { - padding-right: 0.25rem !important; - } - - .pb-md-1, - .py-md-1 { - padding-bottom: 0.25rem !important; - } - - .pl-md-1, - .px-md-1 { - padding-left: 0.25rem !important; - } - - .p-md-2 { - padding: 0.5rem !important; - } - - .pt-md-2, - .py-md-2 { - padding-top: 0.5rem !important; - } - - .pr-md-2, - .px-md-2 { - padding-right: 0.5rem !important; - } - - .pb-md-2, - .py-md-2 { - padding-bottom: 0.5rem !important; - } - - .pl-md-2, - .px-md-2 { - padding-left: 0.5rem !important; - } - - .p-md-3 { - padding: 1rem !important; - } - - .pt-md-3, - .py-md-3 { - padding-top: 1rem !important; - } - - .pr-md-3, - .px-md-3 { - padding-right: 1rem !important; - } - - .pb-md-3, - .py-md-3 { - padding-bottom: 1rem !important; - } - - .pl-md-3, - .px-md-3 { - padding-left: 1rem !important; - } - - .p-md-4 { - padding: 1.5rem !important; - } - - .pt-md-4, - .py-md-4 { - padding-top: 1.5rem !important; - } - - .pr-md-4, - .px-md-4 { - padding-right: 1.5rem !important; - } - - .pb-md-4, - .py-md-4 { - padding-bottom: 1.5rem !important; - } - - .pl-md-4, - .px-md-4 { - padding-left: 1.5rem !important; - } - - .p-md-5 { - padding: 
3rem !important; - } - - .pt-md-5, - .py-md-5 { - padding-top: 3rem !important; - } - - .pr-md-5, - .px-md-5 { - padding-right: 3rem !important; - } - - .pb-md-5, - .py-md-5 { - padding-bottom: 3rem !important; - } - - .pl-md-5, - .px-md-5 { - padding-left: 3rem !important; - } - - .m-md-n1 { - margin: -0.25rem !important; - } - - .mt-md-n1, - .my-md-n1 { - margin-top: -0.25rem !important; - } - - .mr-md-n1, - .mx-md-n1 { - margin-right: -0.25rem !important; - } - - .mb-md-n1, - .my-md-n1 { - margin-bottom: -0.25rem !important; - } - - .ml-md-n1, - .mx-md-n1 { - margin-left: -0.25rem !important; - } - - .m-md-n2 { - margin: -0.5rem !important; - } - - .mt-md-n2, - .my-md-n2 { - margin-top: -0.5rem !important; - } - - .mr-md-n2, - .mx-md-n2 { - margin-right: -0.5rem !important; - } - - .mb-md-n2, - .my-md-n2 { - margin-bottom: -0.5rem !important; - } - - .ml-md-n2, - .mx-md-n2 { - margin-left: -0.5rem !important; - } - - .m-md-n3 { - margin: -1rem !important; - } - - .mt-md-n3, - .my-md-n3 { - margin-top: -1rem !important; - } - - .mr-md-n3, - .mx-md-n3 { - margin-right: -1rem !important; - } - - .mb-md-n3, - .my-md-n3 { - margin-bottom: -1rem !important; - } - - .ml-md-n3, - .mx-md-n3 { - margin-left: -1rem !important; - } - - .m-md-n4 { - margin: -1.5rem !important; - } - - .mt-md-n4, - .my-md-n4 { - margin-top: -1.5rem !important; - } - - .mr-md-n4, - .mx-md-n4 { - margin-right: -1.5rem !important; - } - - .mb-md-n4, - .my-md-n4 { - margin-bottom: -1.5rem !important; - } - - .ml-md-n4, - .mx-md-n4 { - margin-left: -1.5rem !important; - } - - .m-md-n5 { - margin: -3rem !important; - } - - .mt-md-n5, - .my-md-n5 { - margin-top: -3rem !important; - } - - .mr-md-n5, - .mx-md-n5 { - margin-right: -3rem !important; - } - - .mb-md-n5, - .my-md-n5 { - margin-bottom: -3rem !important; - } - - .ml-md-n5, - .mx-md-n5 { - margin-left: -3rem !important; - } - - .m-md-auto { - margin: auto !important; - } - - .mt-md-auto, - .my-md-auto { - margin-top: auto !important; - } - - 
.mr-md-auto, - .mx-md-auto { - margin-right: auto !important; - } - - .mb-md-auto, - .my-md-auto { - margin-bottom: auto !important; - } - - .ml-md-auto, - .mx-md-auto { - margin-left: auto !important; - } -} -@media (min-width: 992px) { - .m-lg-0 { - margin: 0 !important; - } - - .mt-lg-0, - .my-lg-0 { - margin-top: 0 !important; - } - - .mr-lg-0, - .mx-lg-0 { - margin-right: 0 !important; - } - - .mb-lg-0, - .my-lg-0 { - margin-bottom: 0 !important; - } - - .ml-lg-0, - .mx-lg-0 { - margin-left: 0 !important; - } - - .m-lg-1 { - margin: 0.25rem !important; - } - - .mt-lg-1, - .my-lg-1 { - margin-top: 0.25rem !important; - } - - .mr-lg-1, - .mx-lg-1 { - margin-right: 0.25rem !important; - } - - .mb-lg-1, - .my-lg-1 { - margin-bottom: 0.25rem !important; - } - - .ml-lg-1, - .mx-lg-1 { - margin-left: 0.25rem !important; - } - - .m-lg-2 { - margin: 0.5rem !important; - } - - .mt-lg-2, - .my-lg-2 { - margin-top: 0.5rem !important; - } - - .mr-lg-2, - .mx-lg-2 { - margin-right: 0.5rem !important; - } - - .mb-lg-2, - .my-lg-2 { - margin-bottom: 0.5rem !important; - } - - .ml-lg-2, - .mx-lg-2 { - margin-left: 0.5rem !important; - } - - .m-lg-3 { - margin: 1rem !important; - } - - .mt-lg-3, - .my-lg-3 { - margin-top: 1rem !important; - } - - .mr-lg-3, - .mx-lg-3 { - margin-right: 1rem !important; - } - - .mb-lg-3, - .my-lg-3 { - margin-bottom: 1rem !important; - } - - .ml-lg-3, - .mx-lg-3 { - margin-left: 1rem !important; - } - - .m-lg-4 { - margin: 1.5rem !important; - } - - .mt-lg-4, - .my-lg-4 { - margin-top: 1.5rem !important; - } - - .mr-lg-4, - .mx-lg-4 { - margin-right: 1.5rem !important; - } - - .mb-lg-4, - .my-lg-4 { - margin-bottom: 1.5rem !important; - } - - .ml-lg-4, - .mx-lg-4 { - margin-left: 1.5rem !important; - } - - .m-lg-5 { - margin: 3rem !important; - } - - .mt-lg-5, - .my-lg-5 { - margin-top: 3rem !important; - } - - .mr-lg-5, - .mx-lg-5 { - margin-right: 3rem !important; - } - - .mb-lg-5, - .my-lg-5 { - margin-bottom: 3rem !important; - } - - 
.ml-lg-5, - .mx-lg-5 { - margin-left: 3rem !important; - } - - .p-lg-0 { - padding: 0 !important; - } - - .pt-lg-0, - .py-lg-0 { - padding-top: 0 !important; - } - - .pr-lg-0, - .px-lg-0 { - padding-right: 0 !important; - } - - .pb-lg-0, - .py-lg-0 { - padding-bottom: 0 !important; - } - - .pl-lg-0, - .px-lg-0 { - padding-left: 0 !important; - } - - .p-lg-1 { - padding: 0.25rem !important; - } - - .pt-lg-1, - .py-lg-1 { - padding-top: 0.25rem !important; - } - - .pr-lg-1, - .px-lg-1 { - padding-right: 0.25rem !important; - } - - .pb-lg-1, - .py-lg-1 { - padding-bottom: 0.25rem !important; - } - - .pl-lg-1, - .px-lg-1 { - padding-left: 0.25rem !important; - } - - .p-lg-2 { - padding: 0.5rem !important; - } - - .pt-lg-2, - .py-lg-2 { - padding-top: 0.5rem !important; - } - - .pr-lg-2, - .px-lg-2 { - padding-right: 0.5rem !important; - } - - .pb-lg-2, - .py-lg-2 { - padding-bottom: 0.5rem !important; - } - - .pl-lg-2, - .px-lg-2 { - padding-left: 0.5rem !important; - } - - .p-lg-3 { - padding: 1rem !important; - } - - .pt-lg-3, - .py-lg-3 { - padding-top: 1rem !important; - } - - .pr-lg-3, - .px-lg-3 { - padding-right: 1rem !important; - } - - .pb-lg-3, - .py-lg-3 { - padding-bottom: 1rem !important; - } - - .pl-lg-3, - .px-lg-3 { - padding-left: 1rem !important; - } - - .p-lg-4 { - padding: 1.5rem !important; - } - - .pt-lg-4, - .py-lg-4 { - padding-top: 1.5rem !important; - } - - .pr-lg-4, - .px-lg-4 { - padding-right: 1.5rem !important; - } - - .pb-lg-4, - .py-lg-4 { - padding-bottom: 1.5rem !important; - } - - .pl-lg-4, - .px-lg-4 { - padding-left: 1.5rem !important; - } - - .p-lg-5 { - padding: 3rem !important; - } - - .pt-lg-5, - .py-lg-5 { - padding-top: 3rem !important; - } - - .pr-lg-5, - .px-lg-5 { - padding-right: 3rem !important; - } - - .pb-lg-5, - .py-lg-5 { - padding-bottom: 3rem !important; - } - - .pl-lg-5, - .px-lg-5 { - padding-left: 3rem !important; - } - - .m-lg-n1 { - margin: -0.25rem !important; - } - - .mt-lg-n1, - .my-lg-n1 { - margin-top: 
-0.25rem !important; - } - - .mr-lg-n1, - .mx-lg-n1 { - margin-right: -0.25rem !important; - } - - .mb-lg-n1, - .my-lg-n1 { - margin-bottom: -0.25rem !important; - } - - .ml-lg-n1, - .mx-lg-n1 { - margin-left: -0.25rem !important; - } - - .m-lg-n2 { - margin: -0.5rem !important; - } - - .mt-lg-n2, - .my-lg-n2 { - margin-top: -0.5rem !important; - } - - .mr-lg-n2, - .mx-lg-n2 { - margin-right: -0.5rem !important; - } - - .mb-lg-n2, - .my-lg-n2 { - margin-bottom: -0.5rem !important; - } - - .ml-lg-n2, - .mx-lg-n2 { - margin-left: -0.5rem !important; - } - - .m-lg-n3 { - margin: -1rem !important; - } - - .mt-lg-n3, - .my-lg-n3 { - margin-top: -1rem !important; - } - - .mr-lg-n3, - .mx-lg-n3 { - margin-right: -1rem !important; - } - - .mb-lg-n3, - .my-lg-n3 { - margin-bottom: -1rem !important; - } - - .ml-lg-n3, - .mx-lg-n3 { - margin-left: -1rem !important; - } - - .m-lg-n4 { - margin: -1.5rem !important; - } - - .mt-lg-n4, - .my-lg-n4 { - margin-top: -1.5rem !important; - } - - .mr-lg-n4, - .mx-lg-n4 { - margin-right: -1.5rem !important; - } - - .mb-lg-n4, - .my-lg-n4 { - margin-bottom: -1.5rem !important; - } - - .ml-lg-n4, - .mx-lg-n4 { - margin-left: -1.5rem !important; - } - - .m-lg-n5 { - margin: -3rem !important; - } - - .mt-lg-n5, - .my-lg-n5 { - margin-top: -3rem !important; - } - - .mr-lg-n5, - .mx-lg-n5 { - margin-right: -3rem !important; - } - - .mb-lg-n5, - .my-lg-n5 { - margin-bottom: -3rem !important; - } - - .ml-lg-n5, - .mx-lg-n5 { - margin-left: -3rem !important; - } - - .m-lg-auto { - margin: auto !important; - } - - .mt-lg-auto, - .my-lg-auto { - margin-top: auto !important; - } - - .mr-lg-auto, - .mx-lg-auto { - margin-right: auto !important; - } - - .mb-lg-auto, - .my-lg-auto { - margin-bottom: auto !important; - } - - .ml-lg-auto, - .mx-lg-auto { - margin-left: auto !important; - } -} -@media (min-width: 1200px) { - .m-xl-0 { - margin: 0 !important; - } - - .mt-xl-0, - .my-xl-0 { - margin-top: 0 !important; - } - - .mr-xl-0, - .mx-xl-0 { - 
margin-right: 0 !important; - } - - .mb-xl-0, - .my-xl-0 { - margin-bottom: 0 !important; - } - - .ml-xl-0, - .mx-xl-0 { - margin-left: 0 !important; - } - - .m-xl-1 { - margin: 0.25rem !important; - } - - .mt-xl-1, - .my-xl-1 { - margin-top: 0.25rem !important; - } - - .mr-xl-1, - .mx-xl-1 { - margin-right: 0.25rem !important; - } - - .mb-xl-1, - .my-xl-1 { - margin-bottom: 0.25rem !important; - } - - .ml-xl-1, - .mx-xl-1 { - margin-left: 0.25rem !important; - } - - .m-xl-2 { - margin: 0.5rem !important; - } - - .mt-xl-2, - .my-xl-2 { - margin-top: 0.5rem !important; - } - - .mr-xl-2, - .mx-xl-2 { - margin-right: 0.5rem !important; - } - - .mb-xl-2, - .my-xl-2 { - margin-bottom: 0.5rem !important; - } - - .ml-xl-2, - .mx-xl-2 { - margin-left: 0.5rem !important; - } - - .m-xl-3 { - margin: 1rem !important; - } - - .mt-xl-3, - .my-xl-3 { - margin-top: 1rem !important; - } - - .mr-xl-3, - .mx-xl-3 { - margin-right: 1rem !important; - } - - .mb-xl-3, - .my-xl-3 { - margin-bottom: 1rem !important; - } - - .ml-xl-3, - .mx-xl-3 { - margin-left: 1rem !important; - } - - .m-xl-4 { - margin: 1.5rem !important; - } - - .mt-xl-4, - .my-xl-4 { - margin-top: 1.5rem !important; - } - - .mr-xl-4, - .mx-xl-4 { - margin-right: 1.5rem !important; - } - - .mb-xl-4, - .my-xl-4 { - margin-bottom: 1.5rem !important; - } - - .ml-xl-4, - .mx-xl-4 { - margin-left: 1.5rem !important; - } - - .m-xl-5 { - margin: 3rem !important; - } - - .mt-xl-5, - .my-xl-5 { - margin-top: 3rem !important; - } - - .mr-xl-5, - .mx-xl-5 { - margin-right: 3rem !important; - } - - .mb-xl-5, - .my-xl-5 { - margin-bottom: 3rem !important; - } - - .ml-xl-5, - .mx-xl-5 { - margin-left: 3rem !important; - } - - .p-xl-0 { - padding: 0 !important; - } - - .pt-xl-0, - .py-xl-0 { - padding-top: 0 !important; - } - - .pr-xl-0, - .px-xl-0 { - padding-right: 0 !important; - } - - .pb-xl-0, - .py-xl-0 { - padding-bottom: 0 !important; - } - - .pl-xl-0, - .px-xl-0 { - padding-left: 0 !important; - } - - .p-xl-1 { - padding: 
0.25rem !important; - } - - .pt-xl-1, - .py-xl-1 { - padding-top: 0.25rem !important; - } - - .pr-xl-1, - .px-xl-1 { - padding-right: 0.25rem !important; - } - - .pb-xl-1, - .py-xl-1 { - padding-bottom: 0.25rem !important; - } - - .pl-xl-1, - .px-xl-1 { - padding-left: 0.25rem !important; - } - - .p-xl-2 { - padding: 0.5rem !important; - } - - .pt-xl-2, - .py-xl-2 { - padding-top: 0.5rem !important; - } - - .pr-xl-2, - .px-xl-2 { - padding-right: 0.5rem !important; - } - - .pb-xl-2, - .py-xl-2 { - padding-bottom: 0.5rem !important; - } - - .pl-xl-2, - .px-xl-2 { - padding-left: 0.5rem !important; - } - - .p-xl-3 { - padding: 1rem !important; - } - - .pt-xl-3, - .py-xl-3 { - padding-top: 1rem !important; - } - - .pr-xl-3, - .px-xl-3 { - padding-right: 1rem !important; - } - - .pb-xl-3, - .py-xl-3 { - padding-bottom: 1rem !important; - } - - .pl-xl-3, - .px-xl-3 { - padding-left: 1rem !important; - } - - .p-xl-4 { - padding: 1.5rem !important; - } - - .pt-xl-4, - .py-xl-4 { - padding-top: 1.5rem !important; - } - - .pr-xl-4, - .px-xl-4 { - padding-right: 1.5rem !important; - } - - .pb-xl-4, - .py-xl-4 { - padding-bottom: 1.5rem !important; - } - - .pl-xl-4, - .px-xl-4 { - padding-left: 1.5rem !important; - } - - .p-xl-5 { - padding: 3rem !important; - } - - .pt-xl-5, - .py-xl-5 { - padding-top: 3rem !important; - } - - .pr-xl-5, - .px-xl-5 { - padding-right: 3rem !important; - } - - .pb-xl-5, - .py-xl-5 { - padding-bottom: 3rem !important; - } - - .pl-xl-5, - .px-xl-5 { - padding-left: 3rem !important; - } - - .m-xl-n1 { - margin: -0.25rem !important; - } - - .mt-xl-n1, - .my-xl-n1 { - margin-top: -0.25rem !important; - } - - .mr-xl-n1, - .mx-xl-n1 { - margin-right: -0.25rem !important; - } - - .mb-xl-n1, - .my-xl-n1 { - margin-bottom: -0.25rem !important; - } - - .ml-xl-n1, - .mx-xl-n1 { - margin-left: -0.25rem !important; - } - - .m-xl-n2 { - margin: -0.5rem !important; - } - - .mt-xl-n2, - .my-xl-n2 { - margin-top: -0.5rem !important; - } - - .mr-xl-n2, - 
.mx-xl-n2 { - margin-right: -0.5rem !important; - } - - .mb-xl-n2, - .my-xl-n2 { - margin-bottom: -0.5rem !important; - } - - .ml-xl-n2, - .mx-xl-n2 { - margin-left: -0.5rem !important; - } - - .m-xl-n3 { - margin: -1rem !important; - } - - .mt-xl-n3, - .my-xl-n3 { - margin-top: -1rem !important; - } - - .mr-xl-n3, - .mx-xl-n3 { - margin-right: -1rem !important; - } - - .mb-xl-n3, - .my-xl-n3 { - margin-bottom: -1rem !important; - } - - .ml-xl-n3, - .mx-xl-n3 { - margin-left: -1rem !important; - } - - .m-xl-n4 { - margin: -1.5rem !important; - } - - .mt-xl-n4, - .my-xl-n4 { - margin-top: -1.5rem !important; - } - - .mr-xl-n4, - .mx-xl-n4 { - margin-right: -1.5rem !important; - } - - .mb-xl-n4, - .my-xl-n4 { - margin-bottom: -1.5rem !important; - } - - .ml-xl-n4, - .mx-xl-n4 { - margin-left: -1.5rem !important; - } - - .m-xl-n5 { - margin: -3rem !important; - } - - .mt-xl-n5, - .my-xl-n5 { - margin-top: -3rem !important; - } - - .mr-xl-n5, - .mx-xl-n5 { - margin-right: -3rem !important; - } - - .mb-xl-n5, - .my-xl-n5 { - margin-bottom: -3rem !important; - } - - .ml-xl-n5, - .mx-xl-n5 { - margin-left: -3rem !important; - } - - .m-xl-auto { - margin: auto !important; - } - - .mt-xl-auto, - .my-xl-auto { - margin-top: auto !important; - } - - .mr-xl-auto, - .mx-xl-auto { - margin-right: auto !important; - } - - .mb-xl-auto, - .my-xl-auto { - margin-bottom: auto !important; - } - - .ml-xl-auto, - .mx-xl-auto { - margin-left: auto !important; - } -} -.stretched-link::after { - position: absolute; - top: 0; - right: 0; - bottom: 0; - left: 0; - z-index: 1; - pointer-events: auto; - content: ""; - background-color: rgba(0, 0, 0, 0); -} - -.text-monospace { - font-family: SFMono-Regular, Menlo, Monaco, Consolas, "Liberation Mono", "Courier New", monospace !important; -} - -.text-justify { - text-align: justify !important; -} - -.text-wrap { - white-space: normal !important; -} - -.text-nowrap { - white-space: nowrap !important; -} - -.text-truncate { - overflow: hidden; - 
text-overflow: ellipsis; - white-space: nowrap; -} - -.text-left { - text-align: left !important; -} - -.text-right { - text-align: right !important; -} - -.text-center { - text-align: center !important; -} - -@media (min-width: 576px) { - .text-sm-left { - text-align: left !important; - } - - .text-sm-right { - text-align: right !important; - } - - .text-sm-center { - text-align: center !important; - } -} -@media (min-width: 768px) { - .text-md-left { - text-align: left !important; - } - - .text-md-right { - text-align: right !important; - } - - .text-md-center { - text-align: center !important; - } -} -@media (min-width: 992px) { - .text-lg-left { - text-align: left !important; - } - - .text-lg-right { - text-align: right !important; - } - - .text-lg-center { - text-align: center !important; - } -} -@media (min-width: 1200px) { - .text-xl-left { - text-align: left !important; - } - - .text-xl-right { - text-align: right !important; - } - - .text-xl-center { - text-align: center !important; - } -} -.text-lowercase { - text-transform: lowercase !important; -} - -.text-uppercase { - text-transform: uppercase !important; -} - -.text-capitalize { - text-transform: capitalize !important; -} - -.font-weight-light { - font-weight: 300 !important; -} - -.font-weight-lighter { - font-weight: lighter !important; -} - -.font-weight-normal { - font-weight: 400 !important; -} - -.font-weight-bold { - font-weight: 700 !important; -} - -.font-weight-bolder { - font-weight: bolder !important; -} - -.font-italic { - font-style: italic !important; -} - -.text-white { - color: #fff !important; -} - -.text-primary { - color: #007bff !important; -} - -a.text-primary:hover, a.text-primary:focus { - color: #0056b3 !important; -} - -.text-secondary { - color: #6c757d !important; -} - -a.text-secondary:hover, a.text-secondary:focus { - color: #494f54 !important; -} - -.text-success { - color: #28a745 !important; -} - -a.text-success:hover, a.text-success:focus { - color: #19692c 
!important; -} - -.text-info { - color: #17a2b8 !important; -} - -a.text-info:hover, a.text-info:focus { - color: #0f6674 !important; -} - -.text-warning { - color: #ffc107 !important; -} - -a.text-warning:hover, a.text-warning:focus { - color: #ba8b00 !important; -} - -.text-danger { - color: #dc3545 !important; -} - -a.text-danger:hover, a.text-danger:focus { - color: #a71d2a !important; -} - -.text-light { - color: #f8f9fa !important; -} - -a.text-light:hover, a.text-light:focus { - color: #cbd3da !important; -} - -.text-dark { - color: #343a40 !important; -} - -a.text-dark:hover, a.text-dark:focus { - color: #121416 !important; -} - -.text-body { - color: #212529 !important; -} - -.text-muted { - color: #6c757d !important; -} - -.text-black-50 { - color: rgba(0, 0, 0, 0.5) !important; -} - -.text-white-50 { - color: rgba(255, 255, 255, 0.5) !important; -} - -.text-hide { - font: 0/0 a; - color: transparent; - text-shadow: none; - background-color: transparent; - border: 0; -} - -.text-decoration-none { - text-decoration: none !important; -} - -.text-break { - word-break: break-word !important; - word-wrap: break-word !important; -} - -.text-reset { - color: inherit !important; -} - -.visible { - visibility: visible !important; -} - -.invisible { - visibility: hidden !important; -} - -@media print { - *, - *::before, - *::after { - text-shadow: none !important; - -webkit-box-shadow: none !important; - box-shadow: none !important; - } - - a:not(.btn) { - text-decoration: underline; - } - - abbr[title]::after { - content: " (" attr(title) ")"; - } - - pre { - white-space: pre-wrap !important; - } - - pre, - blockquote { - border: 1px solid #adb5bd; - page-break-inside: avoid; - } - - tr, - img { - page-break-inside: avoid; - } - - p, - h2, - h3 { - orphans: 3; - widows: 3; - } - - h2, - h3 { - page-break-after: avoid; - } - - @page { - size: a3; - } - body { - min-width: 992px !important; - } - - .container { - min-width: 992px !important; - } - - .navbar { - 
display: none; - } - - .badge { - border: 1px solid #000; - } - - .table { - border-collapse: collapse !important; - } - .table td, - .table th { - background-color: #fff !important; - } - - .table-bordered th, - .table-bordered td { - border: 1px solid #dee2e6 !important; - } - - .table-dark { - color: inherit; - } - .table-dark th, - .table-dark td, - .table-dark thead th, - .table-dark tbody + tbody { - border-color: #dee2e6; - } - - .table .thead-dark th { - color: inherit; - border-color: #dee2e6; - } -} -/*Github syntax highlighting theme via Rouge*/ -.highlight table td { - padding: 5px; -} - -.highlight table pre { - margin: 0; -} - -.highlight .cm { - color: #999988; - font-style: italic; -} - -.highlight .cp { - color: #999999; - font-weight: bold; -} - -.highlight .c1 { - color: #999988; - font-style: italic; -} - -.highlight .cs { - color: #999999; - font-weight: bold; - font-style: italic; -} - -.highlight .c, .highlight .cd { - color: #999988; - font-style: italic; -} - -.highlight .err { - color: #a61717; - background-color: #e3d2d2; -} - -.highlight .gd { - color: #000000; - background-color: #ffdddd; -} - -.highlight .ge { - color: #000000; - font-style: italic; -} - -.highlight .gr { - color: #aa0000; -} - -.highlight .gh { - color: #999999; -} - -.highlight .gi { - color: #000000; - background-color: #ddffdd; -} - -.highlight .go { - color: #888888; -} - -.highlight .gp { - color: #555555; -} - -.highlight .gs { - font-weight: bold; -} - -.highlight .gu { - color: #aaaaaa; -} - -.highlight .gt { - color: #aa0000; -} - -.highlight .kc { - color: #000000; - font-weight: bold; -} - -.highlight .kd { - color: #000000; - font-weight: bold; -} - -.highlight .kn { - color: #000000; - font-weight: bold; -} - -.highlight .kp { - color: #000000; - font-weight: bold; -} - -.highlight .kr { - color: #000000; - font-weight: bold; -} - -.highlight .kt { - color: #445588; - font-weight: bold; -} - -.highlight .k, .highlight .kv { - color: #000000; - 
font-weight: bold; -} - -.highlight .mf { - color: #009999; -} - -.highlight .mh { - color: #009999; -} - -.highlight .il { - color: #009999; -} - -.highlight .mi { - color: #009999; -} - -.highlight .mo { - color: #009999; -} - -.highlight .m, .highlight .mb, .highlight .mx { - color: #009999; -} - -.highlight .sb { - color: #d14; -} - -.highlight .sc { - color: #d14; -} - -.highlight .sd { - color: #d14; -} - -.highlight .s2 { - color: #d14; -} - -.highlight .se { - color: #d14; -} - -.highlight .sh { - color: #d14; -} - -.highlight .si { - color: #d14; -} - -.highlight .sx { - color: #d14; -} - -.highlight .sr { - color: #009926; -} - -.highlight .s1 { - color: #d14; -} - -.highlight .ss { - color: #990073; -} - -.highlight .s { - color: #d14; -} - -.highlight .na { - color: #008080; -} - -.highlight .bp { - color: #525252; -} - -.highlight .nb { - color: #0086B3; -} - -.highlight .nc { - color: #445588; - font-weight: bold; -} - -.highlight .no { - color: #008080; -} - -.highlight .nd { - color: #3c5d5d; - font-weight: bold; -} - -.highlight .ni { - color: #800080; -} - -.highlight .ne { - color: #990000; - font-weight: bold; -} - -.highlight .nf { - color: #990000; - font-weight: bold; -} - -.highlight .nl { - color: #990000; - font-weight: bold; -} - -.highlight .nn { - color: #555555; -} - -.highlight .nt { - color: #000080; -} - -.highlight .vc { - color: #008080; -} - -.highlight .vg { - color: #008080; -} - -.highlight .vi { - color: #008080; -} - -.highlight .nv { - color: #008080; -} - -.highlight .ow { - color: #000000; - font-weight: bold; -} - -.highlight .o { - color: #000000; - font-weight: bold; -} - -.highlight .n { - color: #000000; - font-weight: bold; -} - -.highlight .p { - color: #000000; - font-weight: bold; -} - -.highlight .w { - color: #bbbbbb; -} - -.highlight { - background-color: #f8f8f8; -} - -@font-face { - font-family: FreightSans; - font-weight: 700; - font-style: normal; - src: url("../fonts/FreightSans/freight-sans-bold.woff2") 
format("woff2"), url("../fonts/FreightSans/freight-sans-bold.woff") format("woff"); -} -@font-face { - font-family: FreightSans; - font-weight: 700; - font-style: italic; - src: url("../fonts/FreightSans/freight-sans-bold-italic.woff2") format("woff2"), url("../fonts/FreightSans/freight-sans-bold-italic.woff") format("woff"); -} -@font-face { - font-family: FreightSans; - font-weight: 500; - font-style: normal; - src: url("../fonts/FreightSans/freight-sans-medium.woff2") format("woff2"), url("../fonts/FreightSans/freight-sans-medium.woff") format("woff"); -} -@font-face { - font-family: FreightSans; - font-weight: 500; - font-style: italic; - src: url("../fonts/FreightSans/freight-sans-medium-italic.woff2") format("woff2"), url("../fonts/FreightSans/freight-sans-medium-italic.woff") format("woff"); -} -@font-face { - font-family: FreightSans; - font-weight: 100; - font-style: normal; - src: url("../fonts/FreightSans/freight-sans-light.woff2") format("woff2"), url("../fonts/FreightSans/freight-sans-light.woff") format("woff"); -} -@font-face { - font-family: FreightSans; - font-weight: 100; - font-style: italic; - src: url("../fonts/FreightSans/freight-sans-light-italic.woff2") format("woff2"), url("../fonts/FreightSans/freight-sans-light-italic.woff") format("woff"); -} -@font-face { - font-family: FreightSans; - font-weight: 400; - font-style: italic; - src: url("../fonts/FreightSans/freight-sans-book-italic.woff2") format("woff2"), url("../fonts/FreightSans/freight-sans-book-italic.woff") format("woff"); -} -@font-face { - font-family: FreightSans; - font-weight: 400; - font-style: normal; - src: url("../fonts/FreightSans/freight-sans-book.woff2") format("woff2"), url("../fonts/FreightSans/freight-sans-book.woff") format("woff"); -} -@font-face { - font-family: IBMPlexMono; - font-weight: 600; - font-style: normal; - unicode-range: u+0020-007f; - src: local("IBMPlexMono-SemiBold"), url("../fonts/IBMPlexMono/IBMPlexMono-SemiBold.woff2") format("woff2"), 
url("../fonts/IBMPlexMono/IBMPlexMono-SemiBold.woff") format("woff"); -} -@font-face { - font-family: IBMPlexMono; - font-weight: 500; - font-style: normal; - unicode-range: u+0020-007f; - src: local("IBMPlexMono-Medium"), url("../fonts/IBMPlexMono/IBMPlexMono-Medium.woff2") format("woff2"), url("../fonts/IBMPlexMono/IBMPlexMono-Medium.woff") format("woff"); -} -@font-face { - font-family: IBMPlexMono; - font-weight: 400; - font-style: normal; - unicode-range: u+0020-007f; - src: local("IBMPlexMono-Regular"), url("../fonts/IBMPlexMono/IBMPlexMono-Regular.woff2") format("woff2"), url("../fonts/IBMPlexMono/IBMPlexMono-Regular.woff") format("woff"); -} -@font-face { - font-family: IBMPlexMono; - font-weight: 300; - font-style: normal; - unicode-range: u+0020-007f; - src: local("IBMPlexMono-Light"), url("../fonts/IBMPlexMono/IBMPlexMono-Light.woff2") format("woff2"), url("../fonts/IBMPlexMono/IBMPlexMono-Light.woff") format("woff"); -} -@font-face { - font-family: UCity; - font-weight: 600; - font-style: normal; - src: local("UCity-Semibold"), url("../fonts/UCity/UCity-Semibold.woff2") format("woff2"); -} -@font-face { - font-family: UCity; - font-weight: 400; - font-style: normal; - src: local("UCity-Regular"), url("../fonts/UCity/UCity-Regular.woff2") format("woff2"); -} -@font-face { - font-family: UCity; - font-weight: 300; - font-style: normal; - src: local("UCity-Light"), url("../fonts/UCity/UCity-Light.woff2") format("woff2"); -} -html { - position: relative; - min-height: 100%; - font-size: 12px; -} -@media screen and (min-width: 768px) { - html { - font-size: 16px; - } -} - -* { - -webkit-box-sizing: border-box; - box-sizing: border-box; -} - -body { - font-family: FreightSans, Helvetica Neue, Helvetica, Arial, sans-serif; -} - -a:link, -a:visited, -a:hover { - text-decoration: none; - color: #792ee5; -} - -a.with-right-arrow, .btn.with-right-arrow { - padding-right: 1.375rem; - position: relative; - background-image: url("../images/chevron-right-orange.svg"); 
- background-size: 6px 13px; - background-position: center right 5px; - background-repeat: no-repeat; -} -@media screen and (min-width: 768px) { - a.with-right-arrow, .btn.with-right-arrow { - background-size: 8px 14px; - background-position: center right 12px; - padding-right: 2rem; - } -} - -::-webkit-input-placeholder { - color: #792ee5; -} - -::-moz-placeholder { - color: #792ee5; -} - -:-ms-input-placeholder { - color: #792ee5; -} - -:-moz-placeholder { - color: #792ee5; -} - -.email-subscribe-form input.email { - color: #792ee5; - border: none; - border-bottom: 1px solid #939393; - width: 100%; - background-color: transparent; - outline: none; - font-size: 1.125rem; - letter-spacing: 0.25px; - line-height: 2.25rem; -} -.email-subscribe-form input[type="submit"] { - position: absolute; - right: 0; - top: 10px; - height: 15px; - width: 15px; - background-image: url("../images/arrow-right-with-tail.svg"); - background-color: transparent; - background-repeat: no-repeat; - background-size: 15px 15px; - background-position: center center; - -webkit-appearance: none; - -moz-appearance: none; - appearance: none; - border: 0; -} - -.email-subscribe-form-fields-wrapper { - position: relative; -} - -.anchorjs-link { - color: #6c6c6d !important; -} -@media screen and (min-width: 768px) { - .anchorjs-link:hover { - color: inherit; - text-decoration: none !important; - } -} - -.pytorch-article #table-of-contents { - display: none; -} - -.badge { - font-weight: inherit; - border-radius: 3px; -} - -.badge-primary { - background-color: #792ee5; -} - -.badge-secondary { - background-color: #979797; -} - -code, kbd, pre, samp { - font-family: "Inconsolata", "IBMPlexMono", "SFMono-Regular", "Menlo", "Monaco", "Consolas", "Liberation Mono", "Courier New", "monospace"; -} - -code span, kbd span, pre span, samp span { - font-family: "Inconsolata", "IBMPlexMono", "SFMono-Regular", "Menlo", "Monaco", "Consolas", "Liberation Mono", "Courier New", "monospace"; -} - -pre { - padding: 
1.125rem; - background-color: #f3f4f7; -} -pre code { - font-size: 0.875rem; -} -pre.highlight { - background-color: #f3f4f7; - line-height: 1.3125rem; -} - -code.highlighter-rouge { - color: #6c6c6d; - background-color: #f3f4f7; - padding: 2px 6px; -} - -a:link code.highlighter-rouge, -a:visited code.highlighter-rouge, -a:hover code.highlighter-rouge { - color: #fe6162; -} -a:link.has-code, -a:visited.has-code, -a:hover.has-code { - color: #fe6162; -} - -p code, -h1 code, -h2 code, -h3 code, -h4 code, -h5 code, -h6 code { - font-size: 78.5%; -} - -pre { - white-space: pre-wrap; - white-space: -moz-pre-wrap; - white-space: -pre-wrap; - white-space: -o-pre-wrap; - word-wrap: break-word; -} - -.header-holder { - height: 68px; - -webkit-box-align: center; - -ms-flex-align: center; - align-items: center; - display: -webkit-box; - display: -ms-flexbox; - display: flex; - left: 0; - margin-left: auto; - margin-right: auto; - position: fixed; - right: 0; - top: 0; - width: 100%; - z-index: 9999; - background-color: #ffffff; - border-bottom: 1px solid #e2e2e2; -} -@media screen and (min-width: 1100px) { - .header-holder { - height: 90px; - } -} - -.header-container { - position: relative; - display: -webkit-box; - display: -ms-flexbox; - display: flex; - -webkit-box-align: center; - -ms-flex-align: center; - align-items: center; -} -.header-container:before, .header-container:after { - content: ""; - display: table; -} -.header-container:after { - clear: both; -} -.header-container { - *zoom: 1; -} -@media screen and (min-width: 1100px) { - .header-container { - display: block; - } -} - -.header-logo { - height: 32px; - width: calc(100% - 25px); - background-image: url("../images/logo_light.svg"), url("../images/logo.svg"); - background-repeat: no-repeat; - background-size: contain; - display: block; - float: left; - z-index: 10; -} -@media screen and (min-width: 1100px) { - .header-logo { - background-size: contain; - position: absolute; - height: 43px; - width: 25%; - 
top: 4px; - float: none; - } -} -@media screen and (min-width: 1600px) { - .header-logo { - width: 350px; - } -} - -.main-menu-open-button { - background-image: url("../images/icon-menu-dots.svg"); - background-position: center center; - background-size: 25px 7px; - background-repeat: no-repeat; - width: 25px; - height: 17px; - position: absolute; - right: 0; - top: 8px; -} -@media screen and (min-width: 1100px) { - .main-menu-open-button { - display: none; - } -} - -.header-holder .main-menu { - display: none; -} -@media screen and (min-width: 1100px) { - .header-holder .main-menu { - display: -webkit-box; - display: -ms-flexbox; - display: flex; - -webkit-box-align: center; - -ms-flex-align: center; - align-items: center; - -webkit-box-pack: end; - -ms-flex-pack: end; - justify-content: flex-end; - } -} -.header-holder .main-menu ul { - display: -webkit-box; - display: -ms-flexbox; - display: flex; - -webkit-box-align: center; - -ms-flex-align: center; - align-items: center; - margin: 0; -} -.header-holder .main-menu ul li { - display: inline-block; - margin-right: 40px; - position: relative; -} -.header-holder .main-menu ul li.active:after { - content: "•"; - bottom: -24px; - color: #792ee5; - font-size: 1.375rem; - left: 0; - position: absolute; - right: 0; - text-align: center; -} -.header-holder .main-menu ul li.active a { - color: #792ee5; -} -.header-holder .main-menu ul li.docs-active:after { - content: "•"; - bottom: -24px; - color: #792ee5; - font-size: 1.375rem; - left: -24px; - position: absolute; - right: 0; - text-align: center; -} -.header-holder .main-menu ul li:last-of-type { - margin-right: 0; -} -.header-holder .main-menu ul li a { - color: #1C1C1C; - font-family: UCity; - font-size: 14px; - font-weight: 600; - line-height: 1.25rem; - letter-spacing: 0px; - text-align: left; - text-decoration: none; -} -@media screen and (min-width: 1100px) { - .header-holder .main-menu ul li a:hover { - color: #792ee5; - } -} - -.mobile-main-menu { - display: 
none; -} -.mobile-main-menu.open { - background-color: #262626; - display: block; - height: 100%; - left: 0; - margin-left: auto; - margin-right: auto; - min-height: 100%; - position: fixed; - right: 0; - top: 0; - width: 100%; - z-index: 99999; -} - -.mobile-main-menu .container-fluid, .mobile-main-menu .container-sm, .mobile-main-menu .container-md, .mobile-main-menu .container-lg, .mobile-main-menu .container-xl { - -webkit-box-align: center; - -ms-flex-align: center; - align-items: center; - display: -webkit-box; - display: -ms-flexbox; - display: flex; - height: 68px; - position: relative; -} -.mobile-main-menu .container-fluid:before, .mobile-main-menu .container-sm:before, .mobile-main-menu .container-md:before, .mobile-main-menu .container-lg:before, .mobile-main-menu .container-xl:before, .mobile-main-menu .container-fluid:after, .mobile-main-menu .container-sm:after, .mobile-main-menu .container-md:after, .mobile-main-menu .container-lg:after, .mobile-main-menu .container-xl:after { - content: ""; - display: table; -} -.mobile-main-menu .container-fluid:after, .mobile-main-menu .container-sm:after, .mobile-main-menu .container-md:after, .mobile-main-menu .container-lg:after, .mobile-main-menu .container-xl:after { - clear: both; -} -.mobile-main-menu .container-fluid, .mobile-main-menu .container-sm, .mobile-main-menu .container-md, .mobile-main-menu .container-lg, .mobile-main-menu .container-xl { - *zoom: 1; -} - -.mobile-main-menu.open ul { - list-style-type: none; - padding: 0; -} -.mobile-main-menu.open ul li a, .mobile-main-menu.open .resources-mobile-menu-title { - font-size: 2rem; - color: #ffffff; - letter-spacing: 0; - line-height: 4rem; - text-decoration: none; -} -.mobile-main-menu.open ul li.active a { - color: #792ee5; -} - -.main-menu-close-button { - background-image: url("../images/icon-close.svg"); - background-position: center center; - background-repeat: no-repeat; - background-size: 24px 24px; - height: 24px; - position: absolute; - 
right: 0; - width: 24px; - top: 1px; -} - -.mobile-main-menu-header-container { - position: relative; -} - -.mobile-main-menu-links-container { - display: -webkit-box; - display: -ms-flexbox; - display: flex; - -webkit-box-align: center; - -ms-flex-align: center; - align-items: center; - padding-left: 2.8125rem; - height: calc(100% - 68px); - overflow-y: scroll; -} -.mobile-main-menu-links-container .main-menu { - height: 100%; -} - -.mobile-main-menu-links-container ul.resources-mobile-menu-items li { - padding-left: 15px; -} - -.site-footer { - padding: 2.5rem 0; - width: 100%; - background: #000000; - background-size: 100%; - margin-left: 0; - margin-right: 0; - position: relative; - z-index: 201; -} -@media screen and (min-width: 768px) { - .site-footer { - padding: 5rem 0; - } -} -.site-footer p { - color: #ffffff; -} -.site-footer ul { - list-style-type: none; - padding-left: 0; - margin-bottom: 0; -} -.site-footer ul li { - font-size: 1.125rem; - line-height: 2rem; - color: #A0A0A1; - padding-bottom: 0.375rem; -} -.site-footer ul li.list-title { - padding-bottom: 0.75rem; - color: #ffffff; -} -.site-footer a:link, -.site-footer a:visited { - color: inherit; -} -@media screen and (min-width: 768px) { - .site-footer a:hover { - color: #792ee5; - } -} - -.docs-tutorials-resources { - background-color: #262626; - color: #ffffff; - padding-top: 2.5rem; - padding-bottom: 2.5rem; - position: relative; - z-index: 201; -} -@media screen and (min-width: 768px) { - .docs-tutorials-resources { - padding-top: 5rem; - padding-bottom: 5rem; - } -} -.docs-tutorials-resources p { - color: #929292; - font-size: 1.125rem; -} -.docs-tutorials-resources h2 { - font-size: 1.5rem; - letter-spacing: -0.25px; - text-transform: none; - margin-bottom: 0.25rem; -} -@media screen and (min-width: 768px) { - .docs-tutorials-resources h2 { - margin-bottom: 1.25rem; - } -} -.docs-tutorials-resources .col-md-4 { - margin-bottom: 2rem; - text-align: center; -} -@media screen and (min-width: 
768px) { - .docs-tutorials-resources .col-md-4 { - margin-bottom: 0; - } -} -.docs-tutorials-resources .with-right-arrow { - margin-left: 12px; -} -.docs-tutorials-resources .with-right-arrow:hover { - background-image: url("../images/chevron-right-white.svg"); -} -.docs-tutorials-resources p { - font-size: 1rem; - line-height: 1.5rem; - letter-spacing: 0.22px; - color: #939393; - margin-bottom: 0; -} -@media screen and (min-width: 768px) { - .docs-tutorials-resources p { - margin-bottom: 1.25rem; - } -} -.docs-tutorials-resources a { - font-size: 1.125rem; - color: #792ee5; -} -.docs-tutorials-resources a:hover { - color: #ffffff; -} - -.footer-container { - position: relative; -} - -@media screen and (min-width: 768px) { - .footer-logo-wrapper { - position: absolute; - top: 0; - left: 30px; - } -} - -.footer-logo { - background-image: url("../images/logo-icon.svg"); - background-position: center; - background-repeat: no-repeat; - background-size: 20px 24px; - display: block; - height: 24px; - margin-bottom: 2.8125rem; - width: 20px; -} -@media screen and (min-width: 768px) { - .footer-logo { - background-size: 29px 36px; - height: 36px; - margin-bottom: 0; - margin-bottom: 0; - width: 29px; - } -} - -.footer-links-wrapper { - display: -webkit-box; - display: -ms-flexbox; - display: flex; - -ms-flex-wrap: wrap; - flex-wrap: wrap; -} -@media screen and (min-width: 768px) { - .footer-links-wrapper { - -ms-flex-wrap: initial; - flex-wrap: initial; - -webkit-box-pack: end; - -ms-flex-pack: end; - justify-content: flex-end; - } -} - -.footer-links-col { - margin-bottom: 3.75rem; - width: 50%; -} -@media screen and (min-width: 768px) { - .footer-links-col { - margin-bottom: 0; - width: 14%; - margin-right: 23px; - } - .footer-links-col.follow-us-col { - width: 18%; - margin-right: 0; - } -} -@media (min-width: 768px) and (max-width: 1239px) { - .footer-links-col { - width: 18%; - margin-right: 30px; - } -} - -.footer-social-icons { - margin: 8.5625rem 0 2.5rem 0; -} 
-.footer-social-icons a { - height: 32px; - width: 32px; - display: inline-block; - background-color: #CCCDD1; - border-radius: 50%; - margin-right: 5px; -} -.footer-social-icons a.facebook { - background-image: url("../images/logo-facebook-dark.svg"); - background-position: center center; - background-size: 9px 18px; - background-repeat: no-repeat; -} -.footer-social-icons a.twitter { - background-image: url("../images/logo-twitter-dark.svg"); - background-position: center center; - background-size: 17px 17px; - background-repeat: no-repeat; -} -.footer-social-icons a.youtube { - background-image: url("../images/logo-youtube-dark.svg"); - background-position: center center; - background-repeat: no-repeat; -} - -.site-footer .mc-field-group { - margin-top: -2px; -} - -article.pytorch-article { - max-width: 920px; - margin: 0 auto; -} -article.pytorch-article h2, -article.pytorch-article h3, -article.pytorch-article h4, -article.pytorch-article h5, -article.pytorch-article h6 { - margin: 1.375rem 0; - color: #262626; -} -article.pytorch-article h2 { - font-size: 1.625rem; - letter-spacing: 1.33px; - line-height: 2rem; - text-transform: none; -} -article.pytorch-article h3 { - font-weight: 600; - font-size: 1.25rem; - line-height: 1.5rem; - text-transform: none; -} -article.pytorch-article h4, -article.pytorch-article h5, -article.pytorch-article h6 { - font-size: 1.125rem; - letter-spacing: -0.19px; - line-height: 1.875rem; -} -article.pytorch-article p { - margin-bottom: 1.125rem; -} -article.pytorch-article p, -article.pytorch-article ul li, -article.pytorch-article ol li, -article.pytorch-article dl dt, -article.pytorch-article dl dd, -article.pytorch-article blockquote { - font-size: 1rem; - line-height: 1.375rem; - color: #262626; - letter-spacing: 0.01px; - font-weight: 500; -} -article.pytorch-article table { - margin-bottom: 2.5rem; - width: 100%; -} -article.pytorch-article table thead { - border-bottom: 1px solid #cacaca; -} -article.pytorch-article table 
th { - padding: 0.625rem; - color: #262626; -} -article.pytorch-article table td { - padding: 0.3125rem; -} -article.pytorch-article table tr th:first-of-type, -article.pytorch-article table tr td:first-of-type { - padding-left: 0; -} -article.pytorch-article table.docutils.field-list th.field-name { - padding: 0.3125rem; - padding-left: 0; -} -article.pytorch-article table.docutils.field-list td.field-body { - padding: 0.3125rem; -} -article.pytorch-article table.docutils.field-list td.field-body p:last-of-type { - margin-bottom: 0; -} -article.pytorch-article ul, -article.pytorch-article ol { - margin: 1.5rem 0 3.125rem 0; -} -@media screen and (min-width: 768px) { - article.pytorch-article ul, - article.pytorch-article ol { - padding-left: 6.25rem; - } -} -article.pytorch-article ul li, -article.pytorch-article ol li { - margin-bottom: 0.625rem; -} -article.pytorch-article dl { - margin-bottom: 1.5rem; -} -article.pytorch-article dl dt { - margin-bottom: 0.75rem; -} -article.pytorch-article pre { - margin-bottom: 2.5rem; -} -article.pytorch-article hr { - margin-top: 4.6875rem; - margin-bottom: 4.6875rem; -} -article.pytorch-article blockquote { - margin: 0 auto; - margin-bottom: 2.5rem; - width: 65%; -} -article.pytorch-article .hidden { - display: none; -} -article.pytorch-article img { - width: 100%; -} - -html { - height: 100%; -} -@media screen and (min-width: 768px) { - html { - font-size: 16px; - } -} - -body { - background: #ffffff; - height: 100%; - margin: 0; -} -body.no-scroll { - height: 100%; - overflow: hidden; -} - -p { - margin-top: 0; - margin-bottom: 1.125rem; -} -p a:link, -p a:visited, -p a:hover { - color: #792ee5; - text-decoration: none; -} -@media screen and (min-width: 768px) { - p a:hover { - text-decoration: underline; - } -} -p a:link, -p a:visited, -p a:hover { - color: #792ee5; -} - -.wy-breadcrumbs li a { - color: #792ee5; -} - -ul.pytorch-breadcrumbs { - padding-left: 0; - list-style-type: none; -} -ul.pytorch-breadcrumbs li { - 
display: inline-block; - font-size: 0.875rem; -} -ul.pytorch-breadcrumbs a { - color: #792ee5; - text-decoration: none; -} - -.table-of-contents-link-wrapper { - display: block; - margin-top: 0; - padding: 1.25rem 1.875rem; - background-color: #f3f4f7; - position: relative; - color: #262626; - font-size: 1.25rem; -} -.table-of-contents-link-wrapper.is-open .toggle-table-of-contents { - -webkit-transform: rotate(180deg); - transform: rotate(180deg); -} -@media screen and (min-width: 1100px) { - .table-of-contents-link-wrapper { - display: none; - } -} - -.toggle-table-of-contents { - background-image: url("../images/chevron-down-grey.svg"); - background-position: center center; - background-repeat: no-repeat; - background-size: 18px 18px; - height: 100%; - position: absolute; - right: 21px; - width: 30px; - top: 0; -} - -.tutorials-header .header-logo { - background-image: url("../images/logo.svg"); - height: 38px; - top: -10px; -} -.tutorials-header .main-menu ul li a { - color: #262626; -} -.tutorials-header .main-menu-open-button { - background-image: url("../images/icon-menu-dots-dark.svg"); -} - -.rst-content footer .rating-hr.hr-top { - margin-bottom: -0.0625rem; -} -.rst-content footer .rating-hr.hr-bottom { - margin-top: -0.0625rem; -} -.rst-content footer .rating-container { - display: -webkit-inline-box; - display: -ms-inline-flexbox; - display: inline-flex; - font-size: 1.125rem; -} -.rst-content footer .rating-container .rating-prompt, .rst-content footer .rating-container .was-helpful-thank-you { - padding: 0.625rem 1.25rem 0.625rem 1.25rem; -} -.rst-content footer .rating-container .was-helpful-thank-you { - display: none; -} -.rst-content footer .rating-container .rating-prompt.yes-link, .rst-content footer .rating-container .rating-prompt.no-link { - color: #792ee5; - cursor: pointer; -} -.rst-content footer .rating-container .rating-prompt.yes-link:hover, .rst-content footer .rating-container .rating-prompt.no-link:hover { - background-color: 
#792ee5; - color: #ffffff; -} -.rst-content footer .rating-container .stars-outer { - display: inline-block; - position: relative; - font-family: FontAwesome; - padding: 0.625rem 1.25rem 0.625rem 1.25rem; -} -.rst-content footer .rating-container .stars-outer i { - cursor: pointer; -} -.rst-content footer .rating-container .stars-outer .star-fill { - color: #792ee5; -} -.rst-content footer div[role="contentinfo"] { - padding-top: 2.5rem; -} -.rst-content footer div[role="contentinfo"] p { - margin-bottom: 0; -} - -h1 { - font-size: 2rem; - letter-spacing: 1.78px; - line-height: 2.5rem; - text-transform: uppercase; - margin: 1.375rem 0; -} - -span.pre { - color: #6c6c6d; - background-color: #f3f4f7; - padding: 2px 6px; -} - -pre { - background-color: #f3f4f7; - padding: 1.375rem; -} - -.highlight .c1 { - color: #6c6c6d; -} - -.headerlink { - display: none !important; -} - -a:link.has-code, -a:hover.has-code, -a:visited.has-code { - color: #fe6162; -} -a:link.has-code span, -a:hover.has-code span, -a:visited.has-code span { - color: #fe6162; -} - -article.pytorch-article ul, -article.pytorch-article ol { - padding-left: 1.875rem; - margin: 0; -} -article.pytorch-article ul li, -article.pytorch-article ol li { - margin: 0; - line-height: 1.75rem; -} -article.pytorch-article ul p, -article.pytorch-article ol p { - line-height: 1.75rem; - margin-bottom: 0; -} -article.pytorch-article ul ul, -article.pytorch-article ul ol, -article.pytorch-article ol ul, -article.pytorch-article ol ol { - margin: 0; -} -article.pytorch-article h1, -article.pytorch-article h2, -article.pytorch-article h3, -article.pytorch-article h4, -article.pytorch-article h5, -article.pytorch-article h6 { - font-weight: normal; -} -article.pytorch-article h1 a, -article.pytorch-article h2 a, -article.pytorch-article h3 a, -article.pytorch-article h4 a, -article.pytorch-article h5 a, -article.pytorch-article h6 a { - color: #262626; -} -article.pytorch-article p.caption { - margin-top: 1.25rem; -} - 
-article.pytorch-article .section:first-of-type h1:first-of-type { - margin-top: 0; -} - -.left-menu-link { - background-color: green; -} -.left-menu-link:hover { - background-color: #792ee5; -} - -article.pytorch-article .sphx-glr-thumbcontainer { - margin: 0; - border: 1px solid #d6d7d8; - border-radius: 0; - width: 45%; - text-align: center; - margin-bottom: 5%; -} -@media screen and (max-width: 1100px) { - article.pytorch-article .sphx-glr-thumbcontainer:nth-child(odd) { - margin-left: 0; - margin-right: 2.5%; - } - article.pytorch-article .sphx-glr-thumbcontainer:nth-child(even) { - margin-right: 0; - margin-left: 2.5%; - } - article.pytorch-article .sphx-glr-thumbcontainer .figure { - width: 40%; - } -} -@media screen and (min-width: 1101px) { - article.pytorch-article .sphx-glr-thumbcontainer { - margin-right: 3%; - margin-bottom: 3%; - width: 30%; - } -} -article.pytorch-article .sphx-glr-thumbcontainer .caption-text a { - color: #1C1C1C; - text-decoration: none; - font-family: UCity; - font-size: 0.875rem; - font-style: normal; - font-weight: 600; - line-height: 1.25rem; - letter-spacing: 0px; - text-align: left; -} -article.pytorch-article .sphx-glr-thumbcontainer:hover { - -webkit-box-shadow: none; - box-shadow: none; - border-bottom-color: #ffffff; -} -article.pytorch-article .sphx-glr-thumbcontainer:hover .figure:before { - bottom: 100%; -} -article.pytorch-article .sphx-glr-thumbcontainer .figure { - width: 80%; -} -article.pytorch-article .sphx-glr-thumbcontainer .figure:before { - content: ""; - display: block; - position: absolute; - top: 0; - bottom: 35%; - left: 0; - right: 0; - background: #8A94B3; - opacity: 0.10; -} -article.pytorch-article .sphx-glr-thumbcontainer .figure a.reference.internal { - text-align: left; -} -@media screen and (min-width: 768px) { - article.pytorch-article .sphx-glr-thumbcontainer:after { - content: ""; - display: block; - width: 0; - height: 1px; - position: absolute; - bottom: -1px; - left: 5px; - background-color: 
#792ee5; - -webkit-transition: width .250s ease-in-out; - transition: width .250s ease-in-out; - } - article.pytorch-article .sphx-glr-thumbcontainer:hover:after { - width: calc(100% - 5px); - } -} -@media screen and (min-width: 768px) { - article.pytorch-article .sphx-glr-thumbcontainer:after { - background-color: #792ee5; - } -} - -article.pytorch-article .section :not(dt) > code { - color: #262626; - border-top: solid 2px #ffffff; - background-color: #ffffff; - border-bottom: solid 2px #ffffff; - padding: 0px 3px; - -webkit-box-decoration-break: clone; - box-decoration-break: clone; -} -article.pytorch-article .section :not(dt) > code .pre { - outline: 0px; - padding: 0px; -} -article.pytorch-article .function dt, article.pytorch-article .method dt, article.pytorch-article .attribute dt, article.pytorch-article .class .attribute dt, article.pytorch-article .class dt { - position: relative; - background: #f3f4f7; - padding: 0.5rem; - border-left: 3px solid #792ee5; - word-wrap: break-word; - padding-right: 100px; -} -article.pytorch-article .function dt em.property, article.pytorch-article .method dt em.property, article.pytorch-article .attribute dt em.property, article.pytorch-article .class dt em.property { - font-family: inherit; -} -article.pytorch-article .function dt em, article.pytorch-article .class dt em, article.pytorch-article .attribute dt em, article.pytorch-article .class .attribute dt em, article.pytorch-article .method dt em, article.pytorch-article .function dt .sig-paren, article.pytorch-article .class dt .sig-paren, article.pytorch-article .attribute dt .sig-paren, article.pytorch-article .method dt .sig-paren { - font-family: "Inconsolata", "IBMPlexMono", "SFMono-Regular", "Menlo", "Monaco", "Consolas", "Liberation Mono", "Courier New", "monospace"; - font-size: 87.5%; -} -article.pytorch-article .function dt a, article.pytorch-article .method dt a, article.pytorch-article .attribute dt a, article.pytorch-article .class .attribute dt a, 
article.pytorch-article .class dt a { - position: absolute; - right: 30px; - padding-right: 0; - top: 50%; - -webkit-transform: perspective(1px) translateY(-50%); - transform: perspective(1px) translateY(-50%); -} -article.pytorch-article .function dt:hover .viewcode-link, article.pytorch-article .method dt:hover .viewcode-link, article.pytorch-article .attribute dt:hover .viewcode-link, article.pytorch-article .class dt:hover .viewcode-link { - color: #792ee5; -} -article.pytorch-article .function .anchorjs-link, article.pytorch-article .method .anchorjs-link, article.pytorch-article .attribute .anchorjs-link, article.pytorch-article .class .anchorjs-link { - display: inline; - position: absolute; - right: 8px; - font-size: 1.5625rem !important; - padding-left: 0; -} -article.pytorch-article .function dt > code, article.pytorch-article .method dt > code, article.pytorch-article .attribute dt > code, article.pytorch-article .class .attribute dt > code, article.pytorch-article .class dt > code { - color: #262626; - border-top: solid 2px #f3f4f7; - background-color: #f3f4f7; - border-bottom: solid 2px #f3f4f7; - -webkit-box-decoration-break: clone; - box-decoration-break: clone; -} -article.pytorch-article .function .viewcode-link, article.pytorch-article .method .viewcode-link, article.pytorch-article .attribute .viewcode-link, article.pytorch-article .class .viewcode-link { - font-size: 0.875rem; - color: #979797; - letter-spacing: 0; - line-height: 1.5rem; - text-transform: uppercase; -} -article.pytorch-article .function dd, article.pytorch-article .method dd, article.pytorch-article .attribute dd, article.pytorch-article .class .attribute dd, article.pytorch-article .class dd { - padding-left: 3.75rem; -} -article.pytorch-article .function dd p, article.pytorch-article .method dd p, article.pytorch-article .attribute dd p, article.pytorch-article .class .attribute dd p, article.pytorch-article .class dd p { - color: #262626; -} -article.pytorch-article .function 
table tbody tr th.field-name, article.pytorch-article .method table tbody tr th.field-name, article.pytorch-article .attribute table tbody tr th.field-name, article.pytorch-article .class table tbody tr th.field-name { - white-space: nowrap; - color: #262626; - width: 20%; -} -@media screen and (min-width: 768px) { - article.pytorch-article .function table tbody tr th.field-name, article.pytorch-article .method table tbody tr th.field-name, article.pytorch-article .attribute table tbody tr th.field-name, article.pytorch-article .class table tbody tr th.field-name { - width: 15%; - } -} -article.pytorch-article .function table tbody tr td.field-body, article.pytorch-article .method table tbody tr td.field-body, article.pytorch-article .attribute table tbody tr td.field-body, article.pytorch-article .class table tbody tr td.field-body { - padding: 0.625rem; - width: 80%; - color: #262626; -} -@media screen and (min-width: 768px) { - article.pytorch-article .function table tbody tr td.field-body, article.pytorch-article .method table tbody tr td.field-body, article.pytorch-article .attribute table tbody tr td.field-body, article.pytorch-article .class table tbody tr td.field-body { - width: 85%; - } -} -@media screen and (min-width: 1600px) { - article.pytorch-article .function table tbody tr td.field-body, article.pytorch-article .method table tbody tr td.field-body, article.pytorch-article .attribute table tbody tr td.field-body, article.pytorch-article .class table tbody tr td.field-body { - padding-left: 1.25rem; - } -} -article.pytorch-article .function table tbody tr td.field-body p, article.pytorch-article .method table tbody tr td.field-body p, article.pytorch-article .attribute table tbody tr td.field-body p, article.pytorch-article .class table tbody tr td.field-body p { - padding-left: 0px; -} -article.pytorch-article .function table tbody tr td.field-body p:last-of-type, article.pytorch-article .method table tbody tr td.field-body p:last-of-type, 
article.pytorch-article .attribute table tbody tr td.field-body p:last-of-type, article.pytorch-article .class table tbody tr td.field-body p:last-of-type { - margin-bottom: 0; -} -article.pytorch-article .function table tbody tr td.field-body ol, article.pytorch-article .method table tbody tr td.field-body ol, article.pytorch-article .attribute table tbody tr td.field-body ol, article.pytorch-article .class table tbody tr td.field-body ol, article.pytorch-article .function table tbody tr td.field-body ul, article.pytorch-article .method table tbody tr td.field-body ul, article.pytorch-article .attribute table tbody tr td.field-body ul, article.pytorch-article .class table tbody tr td.field-body ul { - padding-left: 1rem; - padding-bottom: 0; -} -article.pytorch-article .function table.docutils.field-list, article.pytorch-article .method table.docutils.field-list, article.pytorch-article .attribute table.docutils.field-list, article.pytorch-article .class table.docutils.field-list { - margin-bottom: 0.75rem; -} -article.pytorch-article .attribute .has-code { - float: none; -} -article.pytorch-article .class dt { - border-left: none; - border-top: 3px solid #792ee5; - padding-left: 4em; -} -article.pytorch-article .class dt em.property { - position: absolute; - left: 0.5rem; -} -article.pytorch-article .class dd .docutils dt { - padding-left: 0.5rem; -} -article.pytorch-article .class em.property { - text-transform: uppercase; - font-style: normal; - color: #792ee5; - font-size: 1rem; - letter-spacing: 0; - padding-right: 0.75rem; -} -article.pytorch-article .class dl dt em.property { - position: static; - left: 0; - padding-right: 0; -} -article.pytorch-article .class .method dt, -article.pytorch-article .class .staticmethod dt { - border-left: 3px solid #792ee5; - border-top: none; -} -article.pytorch-article .class .method dt, -article.pytorch-article .class .staticmethod dt { - padding-left: 0.5rem; -} -article.pytorch-article .class .attribute dt { - 
border-top: none; -} -article.pytorch-article .class .attribute dt em.property { - position: relative; - left: 0; -} -article.pytorch-article table { - table-layout: fixed; -} - -article.pytorch-article .note, -article.pytorch-article .warning, -article.pytorch-article .tip, -article.pytorch-article .seealso, -article.pytorch-article .hint, -article.pytorch-article .important, -article.pytorch-article .caution, -article.pytorch-article .danger, -article.pytorch-article .attention, -article.pytorch-article .error { - background: #f3f4f7; - margin-top: 1.875rem; - margin-bottom: 1.125rem; -} -article.pytorch-article .note .admonition-title, -article.pytorch-article .warning .admonition-title, -article.pytorch-article .tip .admonition-title, -article.pytorch-article .seealso .admonition-title, -article.pytorch-article .hint .admonition-title, -article.pytorch-article .important .admonition-title, -article.pytorch-article .caution .admonition-title, -article.pytorch-article .danger .admonition-title, -article.pytorch-article .attention .admonition-title, -article.pytorch-article .error .admonition-title { - color: #ffffff; - letter-spacing: 1px; - text-transform: uppercase; - margin-bottom: 1.125rem; - padding: 3px 0 3px 1.375rem; - position: relative; - font-size: 0.875rem; -} -article.pytorch-article .note .admonition-title:before, -article.pytorch-article .warning .admonition-title:before, -article.pytorch-article .tip .admonition-title:before, -article.pytorch-article .seealso .admonition-title:before, -article.pytorch-article .hint .admonition-title:before, -article.pytorch-article .important .admonition-title:before, -article.pytorch-article .caution .admonition-title:before, -article.pytorch-article .danger .admonition-title:before, -article.pytorch-article .attention .admonition-title:before, -article.pytorch-article .error .admonition-title:before { - content: "\2022"; - position: absolute; - left: 9px; - color: #ffffff; - top: 2px; -} -article.pytorch-article 
.note p:nth-child(n + 2), -article.pytorch-article .warning p:nth-child(n + 2), -article.pytorch-article .tip p:nth-child(n + 2), -article.pytorch-article .seealso p:nth-child(n + 2), -article.pytorch-article .hint p:nth-child(n + 2), -article.pytorch-article .important p:nth-child(n + 2), -article.pytorch-article .caution p:nth-child(n + 2), -article.pytorch-article .danger p:nth-child(n + 2), -article.pytorch-article .attention p:nth-child(n + 2), -article.pytorch-article .error p:nth-child(n + 2) { - padding: 0 1.375rem; -} -article.pytorch-article .note table, -article.pytorch-article .warning table, -article.pytorch-article .tip table, -article.pytorch-article .seealso table, -article.pytorch-article .hint table, -article.pytorch-article .important table, -article.pytorch-article .caution table, -article.pytorch-article .danger table, -article.pytorch-article .attention table, -article.pytorch-article .error table { - margin: 0 2rem; - width: auto; -} -article.pytorch-article .note .pre, -article.pytorch-article .note pre, -article.pytorch-article .warning .pre, -article.pytorch-article .warning pre, -article.pytorch-article .tip .pre, -article.pytorch-article .tip pre, -article.pytorch-article .seealso .pre, -article.pytorch-article .seealso pre, -article.pytorch-article .hint .pre, -article.pytorch-article .hint pre, -article.pytorch-article .important .pre, -article.pytorch-article .important pre, -article.pytorch-article .caution .pre, -article.pytorch-article .caution pre, -article.pytorch-article .danger .pre, -article.pytorch-article .danger pre, -article.pytorch-article .attention .pre, -article.pytorch-article .attention pre, -article.pytorch-article .error .pre, -article.pytorch-article .error pre { - background: #ffffff; - outline: 1px solid #e9e9e9; -} -article.pytorch-article .note :not(dt) > code, -article.pytorch-article .warning :not(dt) > code, -article.pytorch-article .tip :not(dt) > code, -article.pytorch-article .seealso :not(dt) > code, 
-article.pytorch-article .hint :not(dt) > code, -article.pytorch-article .important :not(dt) > code, -article.pytorch-article .caution :not(dt) > code, -article.pytorch-article .danger :not(dt) > code, -article.pytorch-article .attention :not(dt) > code, -article.pytorch-article .error :not(dt) > code { - border-top: solid 2px #ffffff; - background-color: #ffffff; - border-bottom: solid 2px #ffffff; - padding: 0px 3px; - -webkit-box-decoration-break: clone; - box-decoration-break: clone; - outline: 1px solid #e9e9e9; -} -article.pytorch-article .note :not(dt) > code .pre, -article.pytorch-article .warning :not(dt) > code .pre, -article.pytorch-article .tip :not(dt) > code .pre, -article.pytorch-article .seealso :not(dt) > code .pre, -article.pytorch-article .hint :not(dt) > code .pre, -article.pytorch-article .important :not(dt) > code .pre, -article.pytorch-article .caution :not(dt) > code .pre, -article.pytorch-article .danger :not(dt) > code .pre, -article.pytorch-article .attention :not(dt) > code .pre, -article.pytorch-article .error :not(dt) > code .pre { - outline: 0px; - padding: 0px; -} -article.pytorch-article .note pre, -article.pytorch-article .warning pre, -article.pytorch-article .tip pre, -article.pytorch-article .seealso pre, -article.pytorch-article .hint pre, -article.pytorch-article .important pre, -article.pytorch-article .caution pre, -article.pytorch-article .danger pre, -article.pytorch-article .attention pre, -article.pytorch-article .error pre { - margin-bottom: 0; -} -article.pytorch-article .note .highlight, -article.pytorch-article .warning .highlight, -article.pytorch-article .tip .highlight, -article.pytorch-article .seealso .highlight, -article.pytorch-article .hint .highlight, -article.pytorch-article .important .highlight, -article.pytorch-article .caution .highlight, -article.pytorch-article .danger .highlight, -article.pytorch-article .attention .highlight, -article.pytorch-article .error .highlight { - margin: 0 2rem 1.125rem 
2rem; -} -article.pytorch-article .note ul, -article.pytorch-article .note ol, -article.pytorch-article .warning ul, -article.pytorch-article .warning ol, -article.pytorch-article .tip ul, -article.pytorch-article .tip ol, -article.pytorch-article .seealso ul, -article.pytorch-article .seealso ol, -article.pytorch-article .hint ul, -article.pytorch-article .hint ol, -article.pytorch-article .important ul, -article.pytorch-article .important ol, -article.pytorch-article .caution ul, -article.pytorch-article .caution ol, -article.pytorch-article .danger ul, -article.pytorch-article .danger ol, -article.pytorch-article .attention ul, -article.pytorch-article .attention ol, -article.pytorch-article .error ul, -article.pytorch-article .error ol { - padding-left: 3.25rem; -} -article.pytorch-article .note ul li, -article.pytorch-article .note ol li, -article.pytorch-article .warning ul li, -article.pytorch-article .warning ol li, -article.pytorch-article .tip ul li, -article.pytorch-article .tip ol li, -article.pytorch-article .seealso ul li, -article.pytorch-article .seealso ol li, -article.pytorch-article .hint ul li, -article.pytorch-article .hint ol li, -article.pytorch-article .important ul li, -article.pytorch-article .important ol li, -article.pytorch-article .caution ul li, -article.pytorch-article .caution ol li, -article.pytorch-article .danger ul li, -article.pytorch-article .danger ol li, -article.pytorch-article .attention ul li, -article.pytorch-article .attention ol li, -article.pytorch-article .error ul li, -article.pytorch-article .error ol li { - color: #262626; -} -article.pytorch-article .note p, -article.pytorch-article .warning p, -article.pytorch-article .tip p, -article.pytorch-article .seealso p, -article.pytorch-article .hint p, -article.pytorch-article .important p, -article.pytorch-article .caution p, -article.pytorch-article .danger p, -article.pytorch-article .attention p, -article.pytorch-article .error p { - margin-top: 1.125rem; -} 
-article.pytorch-article .note .admonition-title { - background: #54c7ec; -} -article.pytorch-article .warning .admonition-title { - background: #e94f3b; -} -article.pytorch-article .tip .admonition-title { - background: #6bcebb; -} -article.pytorch-article .seealso .admonition-title { - background: #6bcebb; -} -article.pytorch-article .hint .admonition-title { - background: #a2cdde; -} -article.pytorch-article .important .admonition-title { - background: #5890ff; -} -article.pytorch-article .caution .admonition-title { - background: #f7923a; -} -article.pytorch-article .danger .admonition-title { - background: #db2c49; -} -article.pytorch-article .attention .admonition-title { - background: #f5a623; -} -article.pytorch-article .error .admonition-title { - background: #cc2f90; -} -article.pytorch-article .sphx-glr-download-link-note.admonition.note, -article.pytorch-article .reference.download.internal, article.pytorch-article .sphx-glr-signature { - display: none; -} -article.pytorch-article .admonition > p:last-of-type { - margin-bottom: 0; - padding-bottom: 1.125rem !important; -} - -.pytorch-article div.sphx-glr-download a { - background-color: #f3f4f7; - background-image: url("../images/arrow-down-orange.svg"); - background-repeat: no-repeat; - background-position: left 10px center; - background-size: 15px 15px; - border-radius: 0; - border: none; - display: block; - text-align: left; - padding: 0.9375rem 3.125rem; - position: relative; - margin: 1.25rem auto; -} -@media screen and (min-width: 768px) { - .pytorch-article div.sphx-glr-download a:after { - content: ""; - display: block; - width: 0; - height: 1px; - position: absolute; - bottom: -1px; - left: 5px; - background-color: #792ee5; - -webkit-transition: width .250s ease-in-out; - transition: width .250s ease-in-out; - } - .pytorch-article div.sphx-glr-download a:hover:after { - width: calc(100% - 5px); - } -} -@media screen and (min-width: 768px) { - .pytorch-article div.sphx-glr-download a:after { - 
background-color: #792ee5; - } -} -@media screen and (min-width: 768px) { - .pytorch-article div.sphx-glr-download a { - background-position: left 20px center; - } -} -.pytorch-article div.sphx-glr-download a:hover { - -webkit-box-shadow: none; - box-shadow: none; - text-decoration: none; - background-image: url("../images/arrow-down-orange.svg"); - background-color: #f3f4f7; -} -.pytorch-article div.sphx-glr-download a span.pre { - background-color: transparent; - font-size: 1.125rem; - padding: 0; - color: #262626; -} -.pytorch-article div.sphx-glr-download a code, .pytorch-article div.sphx-glr-download a kbd, .pytorch-article div.sphx-glr-download a pre, .pytorch-article div.sphx-glr-download a samp, .pytorch-article div.sphx-glr-download a span.pre { - font-family: FreightSans, Helvetica Neue, Helvetica, Arial, sans-serif; -} - -.pytorch-article p.sphx-glr-script-out { - margin-bottom: 1.125rem; -} - -.pytorch-article div.sphx-glr-script-out { - margin-bottom: 2.5rem; -} -.pytorch-article div.sphx-glr-script-out .highlight { - margin-left: 0; - margin-top: 0; -} -.pytorch-article div.sphx-glr-script-out .highlight pre { - background-color: #fdede9; - padding: 1.5625rem; - color: #837b79; -} -.pytorch-article div.sphx-glr-script-out + p { - margin-top: unset; -} - -article.pytorch-article .wy-table-responsive table { - border: none; - border-color: #ffffff !important; - table-layout: fixed; -} -article.pytorch-article .wy-table-responsive table thead tr { - border-bottom: 2px solid #6c6c6d; -} -article.pytorch-article .wy-table-responsive table thead th { - line-height: 1.75rem; - padding-left: 0.9375rem; - padding-right: 0.9375rem; -} -article.pytorch-article .wy-table-responsive table tbody .row-odd { - background-color: #f3f4f7; -} -article.pytorch-article .wy-table-responsive table tbody td { - color: #6c6c6d; - white-space: normal; - padding: 0.9375rem; - font-size: 1rem; - line-height: 1.375rem; -} -article.pytorch-article .wy-table-responsive table tbody 
td .pre { - background: #ffffff; - color: #792ee5; - font-size: 87.5%; -} -article.pytorch-article .wy-table-responsive table tbody td code { - font-size: 87.5%; -} - -a[rel~="prev"], a[rel~="next"] { - padding: 0.375rem 0 0 0; -} - -img.next-page, -img.previous-page { - width: 8px; - height: 10px; - position: relative; - top: -1px; -} - -img.previous-page { - -webkit-transform: scaleX(-1); - transform: scaleX(-1); -} - -.rst-footer-buttons { - margin-top: 1.875rem; - margin-bottom: 1.875rem; -} -.rst-footer-buttons .btn:focus, -.rst-footer-buttons .btn.focus { - -webkit-box-shadow: none; - box-shadow: none; -} - -article.pytorch-article blockquote { - margin-left: 3.75rem; - color: #6c6c6d; -} - -article.pytorch-article .caption { - color: #6c6c6d; - letter-spacing: 0.25px; - line-height: 2.125rem; -} - -article.pytorch-article .math { - color: #262626; - width: auto; - text-align: center; -} -article.pytorch-article .math img { - width: auto; -} - -.pytorch-breadcrumbs-wrapper { - width: 100%; -} -@media screen and (min-width: 1101px) { - .pytorch-breadcrumbs-wrapper { - float: left; - margin-left: 3%; - width: 73%; - } -} -@media screen and (min-width: 1600px) { - .pytorch-breadcrumbs-wrapper { - width: 850px; - margin-left: 1.875rem; - } -} -.pytorch-breadcrumbs-wrapper .pytorch-breadcrumbs-aside { - float: right; -} -.pytorch-breadcrumbs-wrapper .pytorch-breadcrumbs-aside .fa.fa-github { - margin-top: 5px; - display: block; -} - -.pytorch-article .container { - padding-left: 0; - padding-right: 0; - max-width: none; -} - -a:link, -a:visited, -a:hover { - color: #792ee5; -} - -::-webkit-input-placeholder { - color: #792ee5; -} - -::-moz-placeholder { - color: #792ee5; -} - -:-ms-input-placeholder { - color: #792ee5; -} - -:-moz-placeholder { - color: #792ee5; -} - -@media screen and (min-width: 768px) { - .site-footer a:hover { - color: #792ee5; - } -} - -.docs-tutorials-resources a { - color: #792ee5; -} - -.header-holder { - position: relative; - z-index: 
201; -} - -.header-holder .main-menu ul li.active:after { - color: #792ee5; -} -.header-holder .main-menu ul li.active a { - color: #792ee5; -} -@media screen and (min-width: 1100px) { - .header-holder .main-menu ul li a:hover { - color: #792ee5; - } -} - -.mobile-main-menu.open ul li.active a { - color: #792ee5; -} - -.version { - padding-bottom: 1rem; -} - -.pytorch-call-to-action-links { - padding-top: 0; - display: -webkit-box; - display: -ms-flexbox; - display: flex; -} -@media screen and (min-width: 768px) { - .pytorch-call-to-action-links { - padding-top: 2.5rem; - } -} -@media (min-width: 768px) and (max-width: 1239px) { - .pytorch-call-to-action-links { - padding-top: 0; - } -} -@media (min-width: 1100px) and (max-width: 1239px) { - .pytorch-call-to-action-links { - padding-top: 2.5rem; - } -} -.pytorch-call-to-action-links #tutorial-type { - display: none; -} -.pytorch-call-to-action-links .call-to-action-img, .pytorch-call-to-action-links .call-to-action-notebook-img { - height: 1.375rem; - width: 1.375rem; - margin-right: 10px; -} -.pytorch-call-to-action-links .call-to-action-notebook-img { - height: 1rem; -} -.pytorch-call-to-action-links a { - padding-right: 1.25rem; - color: #000000; - cursor: pointer; -} -.pytorch-call-to-action-links a:hover { - color: #792ee5; -} -.pytorch-call-to-action-links a .call-to-action-desktop-view { - display: none; -} -@media screen and (min-width: 768px) { - .pytorch-call-to-action-links a .call-to-action-desktop-view { - display: block; - } -} -.pytorch-call-to-action-links a .call-to-action-mobile-view { - display: block; -} -@media screen and (min-width: 768px) { - .pytorch-call-to-action-links a .call-to-action-mobile-view { - display: none; - } -} -.pytorch-call-to-action-links a #google-colab-link, .pytorch-call-to-action-links a #download-notebook-link, -.pytorch-call-to-action-links a #github-view-link { - padding-bottom: 0.625rem; - border-bottom: 1px solid #f3f4f7; - padding-right: 2.5rem; - display: 
-webkit-box; - display: -ms-flexbox; - display: flex; - -webkit-box-align: center; - -ms-flex-align: center; - align-items: center; -} -.pytorch-call-to-action-links a #google-colab-link:hover, .pytorch-call-to-action-links a #download-notebook-link:hover, -.pytorch-call-to-action-links a #github-view-link:hover { - border-bottom-color: #792ee5; - color: #792ee5; -} - -.slack-container { - display: -webkit-box; - display: -ms-flexbox; - display: flex; -} -.slack-container .slack-button { - border: 1px solid transparent; - background: linear-gradient(206.91deg, #792EE5 16.83%, #3EABB3 144.59%); - border-radius: 6px; - height: 30px; - width: 210px; - -webkit-box-pack: center; - -ms-flex-pack: center; - justify-content: center; - font-size: 14px; -} -.slack-container a { - display: -webkit-box; - display: -ms-flexbox; - display: flex; - height: 100%; - text-decoration: none; -} -.slack-container .icon { - height: 100%; - color: white; - margin-left: 10px; - padding-top: 2px; -} -.slack-container .button-title { - margin: auto; - margin-left: 5px; - margin-right: 5px; - color: white; -} - -.slack-align-left { - -webkit-box-pack: start; - -ms-flex-pack: start; - justify-content: flex-start; -} - -.slack-align-center { - -webkit-box-pack: center; - -ms-flex-pack: center; - justify-content: center; -} - -.slack-align-right { - -webkit-box-pack: end; - -ms-flex-pack: end; - justify-content: flex-end; -} - -#tutorial-cards-container #tutorial-cards { - width: 100%; -} -#tutorial-cards-container .tutorials-nav { - padding-left: 0; - padding-right: 0; - padding-bottom: 0; -} -#tutorial-cards-container .tutorials-hr { - margin-top: 1rem; - margin-bottom: 1rem; -} -#tutorial-cards-container .card.tutorials-card { - border: 1px solid #cfcfcf; - border-radius: 5px; - height: 98px; - margin-bottom: 1.25rem; - margin-bottom: 1.875rem; - cursor: pointer; -} -@media screen and (min-width: 1240px) { - #tutorial-cards-container .card.tutorials-card { - height: 200px; - } -} -@media 
(min-width: 768px) and (max-width: 1239px) { - #tutorial-cards-container .card.tutorials-card { - height: 200px; - } -} -#tutorial-cards-container .card.tutorials-card .tutorials-image { - position: absolute; - top: 0px; - right: 0px; - height: 96px; - width: 96px; - opacity: 0.7; -} -#tutorial-cards-container .card.tutorials-card .tutorials-image img { - height: 100%; - width: 100%; -} -@media screen and (min-width: 768px) { - #tutorial-cards-container .card.tutorials-card .tutorials-image { - height: 198px; - width: 198px; - } -} -@media (min-width: 768px) and (max-width: 1239px) { - #tutorial-cards-container .card.tutorials-card .tutorials-image { - height: 198px; - width: 198px; - } -} -#tutorial-cards-container .card.tutorials-card .tutorials-image:before { - content: ''; - position: absolute; - top: 0; - left: 0; - bottom: 0; - right: 0; - z-index: 1; - opacity: .075; -} -#tutorial-cards-container .card.tutorials-card .card-title-container { - display: -webkit-inline-box; - display: -ms-inline-flexbox; - display: inline-flex; -} -#tutorial-cards-container .card.tutorials-card .card-title-container h4 { - margin-bottom: 1.125rem; - margin-top: 0; - font-size: 1.5rem; -} -#tutorial-cards-container .card.tutorials-card p.card-summary, #tutorial-cards-container .card.tutorials-card .card-title-container, #tutorial-cards-container .card.tutorials-card p.tags { - white-space: nowrap; - overflow-y: hidden; - overflow-x: scroll; -} -@media screen and (min-width: 768px) { - #tutorial-cards-container .card.tutorials-card p.card-summary, #tutorial-cards-container .card.tutorials-card .card-title-container, #tutorial-cards-container .card.tutorials-card p.tags { - overflow: hidden; - } -} -@media (min-width: 768px) and (max-width: 1239px) { - #tutorial-cards-container .card.tutorials-card p.card-summary, #tutorial-cards-container .card.tutorials-card .card-title-container, #tutorial-cards-container .card.tutorials-card p.tags { - overflow: hidden; - } -} 
-#tutorial-cards-container .card.tutorials-card p.card-summary, #tutorial-cards-container .card.tutorials-card p.tags { - color: #6c6c6d; - font-weight: 400; - margin-bottom: 0; - line-height: 1.5rem; - font-size: 0.9375rem; -} -#tutorial-cards-container .card.tutorials-card p.card-summary { - height: 1.5rem; -} -@media screen and (min-width: 768px) { - #tutorial-cards-container .card.tutorials-card p.card-summary { - white-space: normal; - height: 4.5rem; - } -} -@media (min-width: 768px) and (max-width: 1239px) { - #tutorial-cards-container .card.tutorials-card p.card-summary { - white-space: normal; - height: 4.5rem; - } -} -#tutorial-cards-container .card.tutorials-card p.card-summary, #tutorial-cards-container .card.tutorials-card .card-title-container { - width: calc(100% - 96px); -} -@media screen and (min-width: 768px) { - #tutorial-cards-container .card.tutorials-card p.card-summary, #tutorial-cards-container .card.tutorials-card .card-title-container { - width: calc(100% - 200px); - } -} -@media (min-width: 768px) and (max-width: 1239px) { - #tutorial-cards-container .card.tutorials-card p.card-summary, #tutorial-cards-container .card.tutorials-card .card-title-container { - width: calc(100% - 200px); - } -} -#tutorial-cards-container .card.tutorials-card p.tags { - position: absolute; - bottom: 0.75rem; - width: calc(100% - 96px - 1.25rem - 1.25rem); -} -@media screen and (min-width: 768px) { - #tutorial-cards-container .card.tutorials-card p.tags { - width: calc(100% - 200px - 1.25rem - 1.25rem); - } -} -@media (min-width: 768px) and (max-width: 1239px) { - #tutorial-cards-container .card.tutorials-card p.tags { - width: calc(100% - 200px - 1.25rem - 1.25rem); - } -} -#tutorial-cards-container .card.tutorials-card h4 { - color: #262626; - margin-bottom: 1.125rem; -} -#tutorial-cards-container .card.tutorials-card a { - height: 100%; -} -@media screen and (min-width: 768px) { - #tutorial-cards-container .card.tutorials-card a { - min-height: 190px; - } 
-} -@media (min-width: 768px) and (max-width: 1239px) { - #tutorial-cards-container .card.tutorials-card a { - min-height: 234px; - } -} -@media screen and (min-width: 768px) { - #tutorial-cards-container .card.tutorials-card:after { - content: ""; - display: block; - width: 0; - height: 1px; - position: absolute; - bottom: -1px; - left: 5px; - background-color: #792ee5; - -webkit-transition: width .250s ease-in-out; - transition: width .250s ease-in-out; - } - #tutorial-cards-container .card.tutorials-card:hover:after { - width: calc(100% - 5px); - } -} -#tutorial-cards-container .card.tutorials-card:hover { - background-color: #ffffff; - border: 1px solid #e2e2e2; -} -#tutorial-cards-container .card.tutorials-card:hover p.card-summary { - color: #262626; -} -#tutorial-cards-container .card.tutorials-card:hover .tutorials-image { - opacity: unset; -} -#tutorial-cards-container .tutorial-tags-container { - width: 100%; -} -#tutorial-cards-container .tutorial-tags-container.active { - width: 0; -} -#tutorial-cards-container .tutorial-filter-menu ul { - list-style-type: none; - padding-left: 1.25rem; -} -#tutorial-cards-container .tutorial-filter-menu ul li { - padding-right: 1.25rem; - word-break: break-all; -} -#tutorial-cards-container .tutorial-filter-menu ul li a { - color: #979797; -} -#tutorial-cards-container .tutorial-filter-menu ul li a:hover { - color: #792ee5; -} -#tutorial-cards-container .tutorial-filter { - cursor: pointer; -} -#tutorial-cards-container .filter-btn { - color: #979797; - border: 1px solid #979797; - border-radius: 3px; - display: inline-block; - text-align: center; - white-space: nowrap; - vertical-align: middle; - padding: 0.375rem 0.75rem; - font-size: 1rem; - line-height: 1.5; - margin-bottom: 5px; -} -#tutorial-cards-container .filter-btn:hover { - border: 1px solid #792ee5; - color: #792ee5; -} -#tutorial-cards-container .filter-btn.selected { - background-color: #792ee5; - border: 1px solid #792ee5; - color: #ffffff; -} 
-#tutorial-cards-container .all-tag-selected { - background-color: #979797; - color: #ffffff; -} -#tutorial-cards-container .all-tag-selected:hover { - border-color: #979797; - color: #ffffff; -} -#tutorial-cards-container .pagination .page { - border: 1px solid #dee2e6; - padding: 0.5rem 0.75rem; -} -#tutorial-cards-container .pagination .active .page { - background-color: #dee2e6; -} - -article.pytorch-article .display-card-container .col-md-2 { - padding: 5px; -} -article.pytorch-article .display-card-container .col-md-3 { - padding: 5px; -} -article.pytorch-article .display-card-container .col-md-4 { - padding: 5px; -} -article.pytorch-article .display-card-container .col-md-6 { - padding: 5px; -} -article.pytorch-article .display-card-container .col-md-12 { - padding: 5px; -} -article.pytorch-article .display-card-container h3 { - margin: 5px 0 10px 0; -} -@media screen and (min-width: 768px) { - article.pytorch-article .display-card-container .display-card-hover:after { - content: ""; - display: block; - width: 0; - height: 2px; - position: absolute; - top: calc(100% - 12px); - left: 15px; - background-color: #792ee5; - -webkit-transition: width 0.25s ease-in-out; - transition: width 0.25s ease-in-out; - } - article.pytorch-article .display-card-container .display-card-hover:hover:after { - width: calc(100% - 30px); - } -} -article.pytorch-article .display-card-container .card-tag { - position: absolute; - bottom: 17px; - left: 15px; - padding: 2px 3px 2px 3px; - border: 1px solid #792ee5; - color: #792ee5; - border-radius: 4px; - font-size: 10px; - font-weight: 500; - text-transform: uppercase; -} -article.pytorch-article .display-card-container .display-card { - padding-bottom: 10px; - border: 1px solid #cfcfcf; - border-radius: 5px; - padding: 10px; -} -article.pytorch-article .display-card-container .display-card .body-paragraph { - color: #666666; - font-weight: 400; - font-size: 0.875rem; - line-height: 1.25rem; -} -article.pytorch-article 
.display-card-container .display-card .image-center { - display: -webkit-box; - display: -ms-flexbox; - display: flex; - margin: auto; -} -article.pytorch-article .display-card-container .display-card .image-center img { - height: 125px; - margin: auto; - width: 100%; - -o-object-fit: contain; - object-fit: contain; -} -article.pytorch-article .display-card-container .display-card .image-right { - float: right; - height: 100%; -} -article.pytorch-article .display-card-container .display-card .image-right img { - height: 100%; - width: auto; - -o-object-fit: contain; - object-fit: contain; -} -article.pytorch-article .tutorials-callout-container { - padding-bottom: 50px; -} -article.pytorch-article .tutorials-callout-container .col-md-6 { - padding: 5px; -} -article.pytorch-article .tutorials-callout-container .text-container { - padding-bottom: 10px; - border: 1px solid #cfcfcf; - border-radius: 5px; - padding: 10px; -} -@media screen and (min-width: 768px) { - article.pytorch-article .tutorials-callout-container .text-container:after { - content: ""; - display: block; - width: 0; - height: 2px; - position: absolute; - top: calc(100% - 12px); - left: 15px; - background-color: #792ee5; - -webkit-transition: width .25s ease-in-out; - transition: width .25s ease-in-out; - } - article.pytorch-article .tutorials-callout-container .text-container:hover:after { - width: calc(100% - 30px); - } -} -@media screen and (min-width: 768px) { - article.pytorch-article .tutorials-callout-container .text-container { - height: 160px; - } -} -article.pytorch-article .tutorials-callout-container .text-container .body-paragraph { - color: #666666; - font-weight: 400; - font-size: 0.875rem; - line-height: 1.25rem; -} -article.pytorch-article .tutorials-callout-container .text-container-small { - padding-bottom: 10px; - border: 1px solid #cfcfcf; - border-radius: 5px; - padding: 10px; - margin-bottom: 10px; -} -@media screen and (min-width: 768px) { - article.pytorch-article 
.tutorials-callout-container .text-container-small:after { - content: ""; - display: block; - width: 0; - height: 2px; - position: absolute; - top: calc(100% - 22px); - left: 15px; - background-color: #792ee5; - -webkit-transition: width .25s ease-in-out; - transition: width .25s ease-in-out; - } - article.pytorch-article .tutorials-callout-container .text-container-small:hover:after { - width: calc(100% - 30px); - } -} -@media screen and (min-width: 768px) { - article.pytorch-article .tutorials-callout-container .text-container-small { - height: 130px; - } -} -article.pytorch-article .tutorials-callout-container .text-container-small .body-paragraph { - color: #666666; - font-weight: 400; - font-size: 0.875rem; - line-height: 1.25rem; -} -article.pytorch-article .tutorials-callout-container .btn.callout-button { - font-size: 1.125rem; - border-radius: 0; - border: none; - background-color: #f3f4f7; - color: #6c6c6d; - font-weight: 400; - position: relative; - letter-spacing: 0.25px; -} -@media screen and (min-width: 768px) { - article.pytorch-article .tutorials-callout-container .btn.callout-button:after { - content: ""; - display: block; - width: 0; - height: 1px; - position: absolute; - bottom: -1px; - left: 5px; - background-color: #792ee5; - -webkit-transition: width .250s ease-in-out; - transition: width .250s ease-in-out; - } - article.pytorch-article .tutorials-callout-container .btn.callout-button:hover:after { - width: calc(100% - 5px); - } -} -article.pytorch-article .tutorials-callout-container .btn.callout-button a { - color: inherit; -} - -.center-wrapper { - max-width: 560px; - height: auto; - margin: 1.5rem auto; -} - -.video-wrapper { - position: relative; - padding-bottom: 56.25%; - /* 16:9 */ -} - -.video-wrapper iframe { - position: absolute; - top: 0; - left: 0; - width: 100%; - height: 100%; -} - -.pytorch-container { - margin: 0 auto; - padding: 0 1.875rem; - width: auto; - position: relative; -} -@media screen and (min-width: 1100px) { - 
.pytorch-container { - padding: 0; - } -} -@media screen and (min-width: 1101px) { - .pytorch-container { - margin-left: 25%; - } -} -@media screen and (min-width: 1600px) { - .pytorch-container { - margin-left: 350px; - } -} -.pytorch-container:before, .pytorch-container:after { - content: ""; - display: table; -} -.pytorch-container:after { - clear: both; -} -.pytorch-container { - *zoom: 1; -} - -.pytorch-content-wrap { - background-color: #ffffff; - display: -webkit-box; - display: -ms-flexbox; - display: flex; - position: relative; - padding-top: 0; -} -.pytorch-content-wrap:before, .pytorch-content-wrap:after { - content: ""; - display: table; -} -.pytorch-content-wrap:after { - clear: both; -} -.pytorch-content-wrap { - *zoom: 1; -} -@media screen and (min-width: 1101px) { - .pytorch-content-wrap { - padding-top: 45px; - float: left; - width: 100%; - display: block; - } -} -@media screen and (min-width: 1600px) { - .pytorch-content-wrap { - width: 100%; - } -} - -.pytorch-content { - background: #ffffff; - width: 100%; - max-width: 700px; - position: relative; -} - -.pytorch-content-left { - min-height: 100vh; - margin-top: 2.5rem; - width: 100%; -} -@media screen and (min-width: 1101px) { - .pytorch-content-left { - margin-top: 0; - margin-left: 20px; - width: 73%; - float: left; - } -} -@media screen and (min-width: 1600px) { - .pytorch-content-left { - width: 73%; - margin-left: 30px; - } -} -.pytorch-content-left .main-content { - padding-top: 0.9375rem; -} -.pytorch-content-left .main-content ul.simple { - padding-bottom: 1.25rem; -} -.pytorch-content-left .main-content .note:nth-child(1), .pytorch-content-left .main-content .warning:nth-child(1) { - margin-top: 0; -} - -.pytorch-content-right { - display: none; - position: relative; - overflow-x: hidden; - overflow-y: hidden; -} -@media screen and (min-width: 1101px) { - .pytorch-content-right { - display: block; - margin-left: 0; - width: 25%; - float: left; - height: 100%; - padding-right: 5px; - } 
-} -@media screen and (min-width: 1600px) { - .pytorch-content-right { - width: 24%; - padding-right: 5px; - } -} - -@media screen and (min-width: 1101px) { - .pytorch-side-scroll { - position: relative; - overflow-x: hidden; - overflow-y: scroll; - height: 100%; - } -} - -.pytorch-menu-vertical { - padding: 1.25rem 1.875rem 2.5rem 1.875rem; -} -@media screen and (min-width: 1101px) { - .pytorch-menu-vertical { - display: block; - padding-top: 0; - padding-right: 13.5%; - padding-bottom: 5.625rem; - } -} -@media screen and (min-width: 1600px) { - .pytorch-menu-vertical { - padding-left: 0; - padding-right: 1.5625rem; - } -} - -.pytorch-left-menu { - display: none; - background-color: white; - color: #262626; - overflow: scroll; - border-right: 1px solid #e2e2e2; -} -@media screen and (min-width: 1101px) { - .pytorch-left-menu { - display: block; - overflow-x: hidden; - overflow-y: hidden; - padding-bottom: 110px; - padding: 0 1.875rem 0 0; - width: 22%; - z-index: 200; - float: left; - } - .pytorch-left-menu.make-fixed { - position: fixed; - top: 0; - bottom: 0; - left: 0; - float: none; - } -} -@media screen and (min-width: 1600px) { - .pytorch-left-menu { - padding: 0 0 0 1.875rem; - width: 350px; - } -} - -.expand-menu, .hide-menu { - color: #6c6c6d; - padding-left: 10px; - cursor: none; - float: right; - pointer-events: none; -} - -.menu-item-decorator { - color: #848484; -} - -.collapse { - display: none; -} - -.left-nav-top-caption { - padding-top: 1rem; -} - -.pytorch-left-menu p.caption { - display: block; - margin-bottom: 0px; - text-transform: none; - white-space: normal; - border-radius: 6px; - padding: 0.5rem; - color: #1C1C1C; - font-family: UCity; - font-size: 0.875rem; - font-style: normal; - font-weight: 600; - line-height: 1.25rem; - letter-spacing: 0px; - text-align: left; -} -.pytorch-left-menu p.caption:hover { - background-color: #EFEEFF; - color: #4F00BA; -} - -.pytorch-left-menu-search { - margin-bottom: 2.5rem; -} -@media screen and 
(min-width: 1101px) { - .pytorch-left-menu-search { - margin: 1.25rem 0.625rem 1.875rem 0; - } -} - -.pytorch-left-menu-search ::-webkit-input-placeholder { - color: #262626; -} -.pytorch-left-menu-search ::-moz-placeholder { - color: #262626; -} -.pytorch-left-menu-search :-ms-input-placeholder { - color: #262626; -} -.pytorch-left-menu-search ::-ms-input-placeholder { - color: #262626; -} -.pytorch-left-menu-search ::placeholder { - color: #262626; -} - -.pytorch-left-menu-search input[type=text] { - border-radius: 0; - padding: 0.5rem 0.75rem; - border-color: #ffffff; - color: #262626; - border-style: solid; - font-size: 1rem; - width: 100%; - background-color: #f3f4f7; - background-image: url("../images/search-icon.svg"); - background-repeat: no-repeat; - background-size: 18px 18px; - background-position: 12px 10px; - padding-left: 40px; - background-color: #F6F8FB; -} -.pytorch-left-menu-search input[type=text]:focus { - outline: 0; -} - -@media screen and (min-width: 1101px) { - .pytorch-left-menu .pytorch-side-scroll { - width: 120%; - } -} -@media screen and (min-width: 1600px) { - .pytorch-left-menu .pytorch-side-scroll { - width: 340px; - } -} - -.pytorch-right-menu { - min-height: 100px; - overflow-x: hidden; - overflow-y: hidden; - left: 0; - z-index: 200; - padding-top: 0; - position: relative; -} -@media screen and (min-width: 1101px) { - .pytorch-right-menu { - width: 100%; - } - .pytorch-right-menu.scrolling-fixed { - position: fixed; - top: 45px; - left: 81.1%; - width: 19%; - padding-right: 10px; - } - .pytorch-right-menu.scrolling-absolute { - position: absolute; - left: 0; - } -} -@media screen and (min-width: 1600px) { - .pytorch-right-menu { - left: 0; - width: 100%; - } - .pytorch-right-menu.scrolling-fixed { - position: fixed; - top: 45px; - left: 80%; - } - .pytorch-right-menu.scrolling-absolute { - position: absolute; - left: 0; - } -} - -.pytorch-left-menu ul, -.pytorch-right-menu ul { - list-style-type: none; - padding-left: 0; - 
margin-bottom: 2.5rem; -} -.pytorch-left-menu > ul, -.pytorch-right-menu > ul { - margin-bottom: 2.5rem; -} -.pytorch-left-menu a:link, -.pytorch-left-menu a:visited, -.pytorch-left-menu a:hover, -.pytorch-right-menu a:link, -.pytorch-right-menu a:visited, -.pytorch-right-menu a:hover { - color: #6c6c6d; - font-size: 0.875rem; - line-height: 1rem; - padding: 0; - text-decoration: none; -} -.pytorch-left-menu a:link.reference.internal, -.pytorch-left-menu a:visited.reference.internal, -.pytorch-left-menu a:hover.reference.internal, -.pytorch-right-menu a:link.reference.internal, -.pytorch-right-menu a:visited.reference.internal, -.pytorch-right-menu a:hover.reference.internal { - min-height: 25px; - height: auto; - padding: 5px; - border-radius: 6px; - position: relative; - width: 100%; -} -.pytorch-left-menu a:link.reference.internal:hover, -.pytorch-left-menu a:visited.reference.internal:hover, -.pytorch-left-menu a:hover.reference.internal:hover, -.pytorch-right-menu a:link.reference.internal:hover, -.pytorch-right-menu a:visited.reference.internal:hover, -.pytorch-right-menu a:hover.reference.internal:hover { - background-color: #EFEEFF; - color: #4F00BA; -} -.pytorch-left-menu a:link.reference.external, -.pytorch-left-menu a:visited.reference.external, -.pytorch-left-menu a:hover.reference.external, -.pytorch-right-menu a:link.reference.external, -.pytorch-right-menu a:visited.reference.external, -.pytorch-right-menu a:hover.reference.external { - min-height: 25px; - height: auto; - padding: 5px; - border-radius: 6px; - position: relative; - width: 100%; -} -.pytorch-left-menu a:link.reference.external:hover, -.pytorch-left-menu a:visited.reference.external:hover, -.pytorch-left-menu a:hover.reference.external:hover, -.pytorch-right-menu a:link.reference.external:hover, -.pytorch-right-menu a:visited.reference.external:hover, -.pytorch-right-menu a:hover.reference.external:hover { - background-color: #EFEEFF; - color: #4F00BA; -} -.pytorch-left-menu li code, 
-.pytorch-right-menu li code { - border: none; - background: inherit; - color: inherit; - padding-left: 0; - padding-right: 0; -} -.pytorch-left-menu li span.toctree-expand, -.pytorch-right-menu li span.toctree-expand { - display: block; - float: left; - margin-left: -1.2em; - font-size: 0.8em; - line-height: 1.6em; -} -.pytorch-left-menu li.on a, .pytorch-left-menu li.current > a, -.pytorch-right-menu li.on a, -.pytorch-right-menu li.current > a { - position: relative; - border: none; -} -.pytorch-left-menu li.on a span.toctree-expand, .pytorch-left-menu li.current > a span.toctree-expand, -.pytorch-right-menu li.on a span.toctree-expand, -.pytorch-right-menu li.current > a span.toctree-expand { - display: block; - font-size: 0.8em; - line-height: 1.6em; -} -.pytorch-left-menu li.toctree-l1.current > a, -.pytorch-right-menu li.toctree-l1.current > a { - color: #792ee5; -} -.pytorch-left-menu li.toctree-l1.current > a:before, -.pytorch-right-menu li.toctree-l1.current > a:before { - content: ""; - display: block; - width: 2px; - height: 100%; - background: #792ee5; - left: -5px; - top: 0; - position: absolute; -} -.pytorch-left-menu li.toctree-l1.current li.toctree-l2 > ul, .pytorch-left-menu li.toctree-l2.current li.toctree-l3 > ul, -.pytorch-right-menu li.toctree-l1.current li.toctree-l2 > ul, -.pytorch-right-menu li.toctree-l2.current li.toctree-l3 > ul { - display: none; -} -.pytorch-left-menu li.toctree-l1.current li.toctree-l2.current > ul, .pytorch-left-menu li.toctree-l2.current li.toctree-l3.current > ul, -.pytorch-right-menu li.toctree-l1.current li.toctree-l2.current > ul, -.pytorch-right-menu li.toctree-l2.current li.toctree-l3.current > ul { - display: block; -} -.pytorch-left-menu li.toctree-l2.current li.toctree-l3 > a, -.pytorch-right-menu li.toctree-l2.current li.toctree-l3 > a { - display: block; -} -.pytorch-left-menu li.toctree-l3, -.pytorch-right-menu li.toctree-l3 { - font-size: 0.9em; -} -.pytorch-left-menu li.toctree-l3.current li.toctree-l4 
> a, -.pytorch-right-menu li.toctree-l3.current li.toctree-l4 > a { - display: block; -} -.pytorch-left-menu li.toctree-l4, -.pytorch-right-menu li.toctree-l4 { - font-size: 0.9em; -} -.pytorch-left-menu li.current ul, -.pytorch-right-menu li.current ul { - display: block; -} -.pytorch-left-menu li ul, -.pytorch-right-menu li ul { - margin-bottom: 0; - display: none; -} -.pytorch-left-menu li ul li a, -.pytorch-right-menu li ul li a { - margin-bottom: 0; -} -.pytorch-left-menu a, -.pytorch-right-menu a { - display: inline-block; - position: relative; -} -.pytorch-left-menu a:hover, -.pytorch-right-menu a:hover { - cursor: pointer; -} -.pytorch-left-menu a:active, -.pytorch-right-menu a:active { - cursor: pointer; -} - -.pytorch-left-menu ul { - padding-left: 0; - margin-left: 5px; -} -.pytorch-right-menu a:link, -.pytorch-right-menu a:visited, -.pytorch-right-menu a:hover { - color: #6c6c6d; -} -.pytorch-right-menu a:link span.pre, -.pytorch-right-menu a:visited span.pre, -.pytorch-right-menu a:hover span.pre { - color: #6c6c6d; -} -.pytorch-right-menu a.reference.internal.expanded:before { - content: "-"; - font-family: monospace; - position: absolute; - left: -12px; -} -.pytorch-right-menu a.reference.internal.not-expanded:before { - content: "+"; - font-family: monospace; - position: absolute; - left: -12px; -} -.pytorch-right-menu li.active > a { - color: #792ee5; -} -.pytorch-right-menu li.active > a span.pre, .pytorch-right-menu li.active > a:before { - color: #792ee5; -} -.pytorch-right-menu li.active > a:after { - content: "\2022"; - color: #792ee5; - display: inline-block; - font-size: 1.375rem; - left: -17px; - position: absolute; - top: 1px; -} -.pytorch-right-menu .pytorch-side-scroll > ul > li > ul > li { - margin-bottom: 0; -} -.pytorch-right-menu ul ul { - padding-left: 0; -} -.pytorch-right-menu ul ul li { - padding-left: 0px; -} -.pytorch-right-menu ul ul li a.reference.internal { - padding-left: 0; -} -.pytorch-right-menu ul ul li ul { - display: 
none; - padding-left: 10px; -} -.pytorch-right-menu ul ul li li a.reference.internal { - padding-left: 0; -} -.pytorch-right-menu li ul { - display: block; -} - -.pytorch-right-menu .pytorch-side-scroll { - padding-top: 20px; -} -@media screen and (min-width: 1101px) { - .pytorch-right-menu .pytorch-side-scroll { - width: 100%; - } -} -@media screen and (min-width: 1600px) { - .pytorch-right-menu .pytorch-side-scroll { - width: 100%; - } -} -.pytorch-right-menu .pytorch-side-scroll > ul { - padding-left: 20px; - padding-right: 0; - margin-bottom: 0; -} -@media screen and (min-width: 1600px) { - .pytorch-right-menu .pytorch-side-scroll > ul { - padding-left: 25px; - } -} -.pytorch-right-menu .pytorch-side-scroll > ul > li > a.reference.internal { - color: #262626; - font-weight: 500; -} -.pytorch-right-menu .pytorch-side-scroll ul li { - position: relative; -} - -#pytorch-right-menu .side-scroll-highlight { - color: #792ee5; -} - -.header-container { - max-width: none; - margin-top: 4px; -} -@media screen and (min-width: 1101px) { - .header-container { - margin-top: 0; - } -} -@media screen and (min-width: 1600px) { - .header-container { - margin-top: 0; - } -} - -.container-fluid.header-holder, .header-holder.container-sm, .header-holder.container-md, .header-holder.container-lg, .header-holder.container-xl { - padding-right: 0; - padding-left: 0; -} - -.header-holder .container { - max-width: none; - padding-right: 1.875rem; - padding-left: 1.875rem; -} -@media screen and (min-width: 1101px) { - .header-holder .container { - padding-right: 1.875rem; - padding-left: 1.875rem; - } -} - -.header-holder .main-menu { - -webkit-box-pack: unset; - -ms-flex-pack: unset; - justify-content: unset; - position: relative; -} -@media screen and (min-width: 1101px) { - .header-holder .main-menu ul { - padding-left: 0; - margin-left: 26%; - } -} -@media screen and (min-width: 1600px) { - .header-holder .main-menu ul { - padding-left: 38px; - margin-left: 310px; - } -} - 
-.pytorch-page-level-bar { - display: none; - -webkit-box-align: center; - -ms-flex-align: center; - align-items: center; - background-color: #ffffff; - border-bottom: 1px solid #e2e2e2; - width: 100%; - z-index: 201; -} -@media screen and (min-width: 1101px) { - .pytorch-page-level-bar { - left: 0; - display: -webkit-box; - display: -ms-flexbox; - display: flex; - height: 45px; - padding-left: 0; - width: 100%; - position: absolute; - z-index: 1; - } - .pytorch-page-level-bar.left-menu-is-fixed { - position: fixed; - top: 0; - left: 25%; - padding-left: 0; - right: 0; - width: 75%; - } -} -@media screen and (min-width: 1600px) { - .pytorch-page-level-bar { - left: 0; - right: 0; - width: auto; - z-index: 1; - } - .pytorch-page-level-bar.left-menu-is-fixed { - left: 350px; - right: 0; - width: auto; - } -} -.pytorch-page-level-bar ul, .pytorch-page-level-bar li { - margin: 0; -} - -.pytorch-shortcuts-wrapper { - display: none; -} -@media screen and (min-width: 1101px) { - .pytorch-shortcuts-wrapper { - font-size: 0.875rem; - float: left; - margin-left: 2%; - } -} -@media screen and (min-width: 1600px) { - .pytorch-shortcuts-wrapper { - margin-left: 1.875rem; - } -} - -.cookie-banner-wrapper { - display: none; -} -.cookie-banner-wrapper .container { - padding-left: 1.875rem; - padding-right: 1.875rem; - max-width: 1240px; -} -.cookie-banner-wrapper.is-visible { - display: block; - position: fixed; - bottom: 0; - background-color: #f3f4f7; - min-height: 100px; - width: 100%; - z-index: 401; - border-top: 3px solid #ededee; -} -.cookie-banner-wrapper .gdpr-notice { - color: #6c6c6d; - margin-top: 1.5625rem; - text-align: left; - max-width: 1440px; -} -@media screen and (min-width: 768px) { - .cookie-banner-wrapper .gdpr-notice { - width: 77%; - } -} -@media (min-width: 768px) and (max-width: 1239px) { - .cookie-banner-wrapper .gdpr-notice { - width: inherit; - } -} -.cookie-banner-wrapper .gdpr-notice .cookie-policy-link { - color: #343434; -} -.cookie-banner-wrapper 
.close-button { - -webkit-appearance: none; - -moz-appearance: none; - appearance: none; - background: transparent; - border: 1px solid #f3f4f7; - height: 1.3125rem; - position: absolute; - bottom: 42px; - right: 0; - top: 0; - cursor: pointer; - outline: none; -} -@media screen and (min-width: 768px) { - .cookie-banner-wrapper .close-button { - right: 20%; - top: inherit; - } -} -@media (min-width: 768px) and (max-width: 1239px) { - .cookie-banner-wrapper .close-button { - right: 0; - top: 0; - } -} - -.main-menu ul li .resources-dropdown a { - cursor: pointer; -} -.main-menu ul li .dropdown-menu { - border-radius: 0; - padding: 0; -} -.main-menu ul li .dropdown-menu .dropdown-item { - color: #6c6c6d; - border-bottom: 1px solid #e2e2e2; -} -.main-menu ul li .dropdown-menu .dropdown-item:last-of-type { - border-bottom-color: transparent; -} -.main-menu ul li .dropdown-menu .dropdown-item:hover { - background-color: #792ee5; -} -.main-menu ul li .dropdown-menu .dropdown-item p { - font-size: 1rem; - color: #979797; -} -.main-menu ul li .dropdown-menu a.dropdown-item:hover { - color: #ffffff; -} -.main-menu ul li .dropdown-menu a.dropdown-item:hover p { - color: #ffffff; -} - -.resources-dropdown-menu { - display: none; - position: absolute; - z-index: 1000; - display: none; - float: left; - min-width: 10rem; - padding: 0.5rem 0; - font-size: 1rem; - color: #212529; - text-align: left; - list-style: none; - background-color: #ffffff; - background-clip: padding-box; - border: 1px solid rgba(0, 0, 0, 0.15); - border-radius: 0.25rem; -} - -.resources-dropdown:hover .resources-dropdown-menu { - display: block; -} - -.main-menu ul li .resources-dropdown-menu { - border-radius: 0; - padding: 0; -} -.main-menu ul li.active:hover .resources-dropdown-menu { - display: block; -} - -.main-menu ul li .resources-dropdown-menu .dropdown-item { - color: #6c6c6d; - border-bottom: 1px solid #e2e2e2; -} - -.resources-dropdown .with-down-orange-arrow { - padding-right: 2rem; - 
position: relative; - background: url("../images/chevron-down-orange.svg"); - background-size: 10px 15px; - background-position: top 0px right 12px; - background-repeat: no-repeat; -} - -.with-down-arrow { - padding-right: 2rem; - position: relative; - background-image: url("../images/chevron-down-black.svg"); - background-size: 14px 18px; - background-position: top 7px right 10px; - background-repeat: no-repeat; -} -.with-down-arrow:hover { - background-image: url("../images/chevron-down-orange.svg"); - background-repeat: no-repeat; -} - -.header-holder .main-menu ul li a.nav-dropdown-item { - display: block; - width: 100%; - clear: both; - font-weight: 400; - color: #979797; - text-align: left; - padding: 5px; - background-color: transparent; - border-bottom: 1px solid #e2e2e2; -} -.header-holder .main-menu ul li a.nav-dropdown-item:last-of-type { - border-bottom-color: transparent; -} -.header-holder .main-menu ul li a.nav-dropdown-item:hover { - background-color: #EFEEFF; - color: #792ee5; -} -.header-holder .main-menu ul li a.nav-dropdown-item .dropdown-title { - font-family: UCity; - font-size: 0.75rem; - font-weight: 400; - line-height: 1.375rem; - color: #6c6c6d; -} - -.header-holder .main-menu ul li a.nav-dropdown-item:hover .dropdown-title { - background-color: hover_background; - color: #792ee5; -} - -/*# sourceMappingURL=theme.css.map */ \ No newline at end of file diff --git a/docs/_static/doctools.js b/docs/_static/doctools.js deleted file mode 100644 index e1bfd70..0000000 --- a/docs/_static/doctools.js +++ /dev/null @@ -1,358 +0,0 @@ -/* - * doctools.js - * ~~~~~~~~~~~ - * - * Sphinx JavaScript utilities for all documentation. - * - * :copyright: Copyright 2007-2022 by the Sphinx team, see AUTHORS. - * :license: BSD, see LICENSE for details. 
- * - */ - -/** - * select a different prefix for underscore - */ -$u = _.noConflict(); - -/** - * make the code below compatible with browsers without - * an installed firebug like debugger -if (!window.console || !console.firebug) { - var names = ["log", "debug", "info", "warn", "error", "assert", "dir", - "dirxml", "group", "groupEnd", "time", "timeEnd", "count", "trace", - "profile", "profileEnd"]; - window.console = {}; - for (var i = 0; i < names.length; ++i) - window.console[names[i]] = function() {}; -} - */ - -/** - * small helper function to urldecode strings - * - * See https://developer.mozilla.org/en-US/docs/Web/JavaScript/Reference/Global_Objects/decodeURIComponent#Decoding_query_parameters_from_a_URL - */ -jQuery.urldecode = function(x) { - if (!x) { - return x - } - return decodeURIComponent(x.replace(/\+/g, ' ')); -}; - -/** - * small helper function to urlencode strings - */ -jQuery.urlencode = encodeURIComponent; - -/** - * This function returns the parsed url parameters of the - * current request. Multiple values per key are supported, - * it will always return arrays of strings for the value parts. - */ -jQuery.getQueryParameters = function(s) { - if (typeof s === 'undefined') - s = document.location.search; - var parts = s.substr(s.indexOf('?') + 1).split('&'); - var result = {}; - for (var i = 0; i < parts.length; i++) { - var tmp = parts[i].split('=', 2); - var key = jQuery.urldecode(tmp[0]); - var value = jQuery.urldecode(tmp[1]); - if (key in result) - result[key].push(value); - else - result[key] = [value]; - } - return result; -}; - -/** - * highlight a given string on a jquery object by wrapping it in - * span elements with the given class name. 
- */ -jQuery.fn.highlightText = function(text, className) { - function highlight(node, addItems) { - if (node.nodeType === 3) { - var val = node.nodeValue; - var pos = val.toLowerCase().indexOf(text); - if (pos >= 0 && - !jQuery(node.parentNode).hasClass(className) && - !jQuery(node.parentNode).hasClass("nohighlight")) { - var span; - var isInSVG = jQuery(node).closest("body, svg, foreignObject").is("svg"); - if (isInSVG) { - span = document.createElementNS("http://www.w3.org/2000/svg", "tspan"); - } else { - span = document.createElement("span"); - span.className = className; - } - span.appendChild(document.createTextNode(val.substr(pos, text.length))); - node.parentNode.insertBefore(span, node.parentNode.insertBefore( - document.createTextNode(val.substr(pos + text.length)), - node.nextSibling)); - node.nodeValue = val.substr(0, pos); - if (isInSVG) { - var rect = document.createElementNS("http://www.w3.org/2000/svg", "rect"); - var bbox = node.parentElement.getBBox(); - rect.x.baseVal.value = bbox.x; - rect.y.baseVal.value = bbox.y; - rect.width.baseVal.value = bbox.width; - rect.height.baseVal.value = bbox.height; - rect.setAttribute('class', className); - addItems.push({ - "parent": node.parentNode, - "target": rect}); - } - } - } - else if (!jQuery(node).is("button, select, textarea")) { - jQuery.each(node.childNodes, function() { - highlight(this, addItems); - }); - } - } - var addItems = []; - var result = this.each(function() { - highlight(this, addItems); - }); - for (var i = 0; i < addItems.length; ++i) { - jQuery(addItems[i].parent).before(addItems[i].target); - } - return result; -}; - -/* - * backward compatibility for jQuery.browser - * This will be supported until firefox bug is fixed. 
- */ -if (!jQuery.browser) { - jQuery.uaMatch = function(ua) { - ua = ua.toLowerCase(); - - var match = /(chrome)[ \/]([\w.]+)/.exec(ua) || - /(webkit)[ \/]([\w.]+)/.exec(ua) || - /(opera)(?:.*version|)[ \/]([\w.]+)/.exec(ua) || - /(msie) ([\w.]+)/.exec(ua) || - ua.indexOf("compatible") < 0 && /(mozilla)(?:.*? rv:([\w.]+)|)/.exec(ua) || - []; - - return { - browser: match[ 1 ] || "", - version: match[ 2 ] || "0" - }; - }; - jQuery.browser = {}; - jQuery.browser[jQuery.uaMatch(navigator.userAgent).browser] = true; -} - -/** - * Small JavaScript module for the documentation. - */ -var Documentation = { - - init : function() { - this.fixFirefoxAnchorBug(); - this.highlightSearchWords(); - this.initIndexTable(); - this.initOnKeyListeners(); - }, - - /** - * i18n support - */ - TRANSLATIONS : {}, - PLURAL_EXPR : function(n) { return n === 1 ? 0 : 1; }, - LOCALE : 'unknown', - - // gettext and ngettext don't access this so that the functions - // can safely bound to a different name (_ = Documentation.gettext) - gettext : function(string) { - var translated = Documentation.TRANSLATIONS[string]; - if (typeof translated === 'undefined') - return string; - return (typeof translated === 'string') ? translated : translated[0]; - }, - - ngettext : function(singular, plural, n) { - var translated = Documentation.TRANSLATIONS[singular]; - if (typeof translated === 'undefined') - return (n == 1) ? singular : plural; - return translated[Documentation.PLURALEXPR(n)]; - }, - - addTranslations : function(catalog) { - for (var key in catalog.messages) - this.TRANSLATIONS[key] = catalog.messages[key]; - this.PLURAL_EXPR = new Function('n', 'return +(' + catalog.plural_expr + ')'); - this.LOCALE = catalog.locale; - }, - - /** - * add context elements like header anchor links - */ - addContextElements : function() { - $('div[id] > :header:first').each(function() { - $('\u00B6'). - attr('href', '#' + this.id). - attr('title', _('Permalink to this headline')). 
- appendTo(this); - }); - $('dt[id]').each(function() { - $('\u00B6'). - attr('href', '#' + this.id). - attr('title', _('Permalink to this definition')). - appendTo(this); - }); - }, - - /** - * workaround a firefox stupidity - * see: https://bugzilla.mozilla.org/show_bug.cgi?id=645075 - */ - fixFirefoxAnchorBug : function() { - if (document.location.hash && $.browser.mozilla) - window.setTimeout(function() { - document.location.href += ''; - }, 10); - }, - - /** - * highlight the search words provided in the url in the text - */ - highlightSearchWords : function() { - var params = $.getQueryParameters(); - var terms = (params.highlight) ? params.highlight[0].split(/\s+/) : []; - if (terms.length) { - var body = $('div.body'); - if (!body.length) { - body = $('body'); - } - window.setTimeout(function() { - $.each(terms, function() { - body.highlightText(this.toLowerCase(), 'highlighted'); - }); - }, 10); - $('') - .appendTo($('#searchbox')); - } - }, - - /** - * init the domain index toggle buttons - */ - initIndexTable : function() { - var togglers = $('img.toggler').click(function() { - var src = $(this).attr('src'); - var idnum = $(this).attr('id').substr(7); - $('tr.cg-' + idnum).toggle(); - if (src.substr(-9) === 'minus.png') - $(this).attr('src', src.substr(0, src.length-9) + 'plus.png'); - else - $(this).attr('src', src.substr(0, src.length-8) + 'minus.png'); - }).css('display', ''); - if (DOCUMENTATION_OPTIONS.COLLAPSE_INDEX) { - togglers.click(); - } - }, - - /** - * helper function to hide the search marks again - */ - hideSearchWords : function() { - $('#searchbox .highlight-link').fadeOut(300); - $('span.highlighted').removeClass('highlighted'); - var url = new URL(window.location); - url.searchParams.delete('highlight'); - window.history.replaceState({}, '', url); - }, - - /** - * helper function to focus on search bar - */ - focusSearchBar : function() { - $('input[name=q]').first().focus(); - }, - - /** - * make the url absolute - */ - makeURL : 
function(relativeURL) { - return DOCUMENTATION_OPTIONS.URL_ROOT + '/' + relativeURL; - }, - - /** - * get the current relative url - */ - getCurrentURL : function() { - var path = document.location.pathname; - var parts = path.split(/\//); - $.each(DOCUMENTATION_OPTIONS.URL_ROOT.split(/\//), function() { - if (this === '..') - parts.pop(); - }); - var url = parts.join('/'); - return path.substring(url.lastIndexOf('/') + 1, path.length - 1); - }, - - initOnKeyListeners: function() { - // only install a listener if it is really needed - if (!DOCUMENTATION_OPTIONS.NAVIGATION_WITH_KEYS && - !DOCUMENTATION_OPTIONS.ENABLE_SEARCH_SHORTCUTS) - return; - - $(document).keydown(function(event) { - var activeElementType = document.activeElement.tagName; - // don't navigate when in search box, textarea, dropdown or button - if (activeElementType !== 'TEXTAREA' && activeElementType !== 'INPUT' && activeElementType !== 'SELECT' - && activeElementType !== 'BUTTON') { - if (event.altKey || event.ctrlKey || event.metaKey) - return; - - if (!event.shiftKey) { - switch (event.key) { - case 'ArrowLeft': - if (!DOCUMENTATION_OPTIONS.NAVIGATION_WITH_KEYS) - break; - var prevHref = $('link[rel="prev"]').prop('href'); - if (prevHref) { - window.location.href = prevHref; - return false; - } - break; - case 'ArrowRight': - if (!DOCUMENTATION_OPTIONS.NAVIGATION_WITH_KEYS) - break; - var nextHref = $('link[rel="next"]').prop('href'); - if (nextHref) { - window.location.href = nextHref; - return false; - } - break; - case 'Escape': - if (!DOCUMENTATION_OPTIONS.ENABLE_SEARCH_SHORTCUTS) - break; - Documentation.hideSearchWords(); - return false; - } - } - - // some keyboard layouts may need Shift to get / - switch (event.key) { - case '/': - if (!DOCUMENTATION_OPTIONS.ENABLE_SEARCH_SHORTCUTS) - break; - Documentation.focusSearchBar(); - return false; - } - } - }); - } -}; - -// quick alias for translations -_ = Documentation.gettext; - -$(document).ready(function() { - Documentation.init(); -}); 
diff --git a/docs/_static/documentation_options.js b/docs/_static/documentation_options.js deleted file mode 100644 index 6f4c5ec..0000000 --- a/docs/_static/documentation_options.js +++ /dev/null @@ -1,14 +0,0 @@ -var DOCUMENTATION_OPTIONS = { - URL_ROOT: document.getElementById("documentation_options").getAttribute('data-url_root'), - VERSION: '1.7.0dev', - LANGUAGE: 'None', - COLLAPSE_INDEX: false, - BUILDER: 'html', - FILE_SUFFIX: '.html', - LINK_SUFFIX: '.html', - HAS_SOURCE: true, - SOURCELINK_SUFFIX: '.txt', - NAVIGATION_WITH_KEYS: false, - SHOW_SEARCH_SUMMARY: true, - ENABLE_SEARCH_SHORTCUTS: true, -}; \ No newline at end of file diff --git a/docs/_static/file.png b/docs/_static/file.png deleted file mode 100644 index a858a41..0000000 Binary files a/docs/_static/file.png and /dev/null differ diff --git a/docs/_static/fonts/FreightSans/freight-sans-bold-italic.woff b/docs/_static/fonts/FreightSans/freight-sans-bold-italic.woff deleted file mode 100644 index e317248..0000000 Binary files a/docs/_static/fonts/FreightSans/freight-sans-bold-italic.woff and /dev/null differ diff --git a/docs/_static/fonts/FreightSans/freight-sans-bold-italic.woff2 b/docs/_static/fonts/FreightSans/freight-sans-bold-italic.woff2 deleted file mode 100644 index cec2dc9..0000000 Binary files a/docs/_static/fonts/FreightSans/freight-sans-bold-italic.woff2 and /dev/null differ diff --git a/docs/_static/fonts/FreightSans/freight-sans-bold.woff b/docs/_static/fonts/FreightSans/freight-sans-bold.woff deleted file mode 100644 index de46625..0000000 Binary files a/docs/_static/fonts/FreightSans/freight-sans-bold.woff and /dev/null differ diff --git a/docs/_static/fonts/FreightSans/freight-sans-bold.woff2 b/docs/_static/fonts/FreightSans/freight-sans-bold.woff2 deleted file mode 100644 index dc05cd8..0000000 Binary files a/docs/_static/fonts/FreightSans/freight-sans-bold.woff2 and /dev/null differ diff --git a/docs/_static/fonts/FreightSans/freight-sans-book-italic.woff 
b/docs/_static/fonts/FreightSans/freight-sans-book-italic.woff deleted file mode 100644 index a50e503..0000000 Binary files a/docs/_static/fonts/FreightSans/freight-sans-book-italic.woff and /dev/null differ diff --git a/docs/_static/fonts/FreightSans/freight-sans-book-italic.woff2 b/docs/_static/fonts/FreightSans/freight-sans-book-italic.woff2 deleted file mode 100644 index fe284db..0000000 Binary files a/docs/_static/fonts/FreightSans/freight-sans-book-italic.woff2 and /dev/null differ diff --git a/docs/_static/fonts/FreightSans/freight-sans-book.woff b/docs/_static/fonts/FreightSans/freight-sans-book.woff deleted file mode 100644 index 6ab8775..0000000 Binary files a/docs/_static/fonts/FreightSans/freight-sans-book.woff and /dev/null differ diff --git a/docs/_static/fonts/FreightSans/freight-sans-book.woff2 b/docs/_static/fonts/FreightSans/freight-sans-book.woff2 deleted file mode 100644 index 2688739..0000000 Binary files a/docs/_static/fonts/FreightSans/freight-sans-book.woff2 and /dev/null differ diff --git a/docs/_static/fonts/FreightSans/freight-sans-light-italic.woff b/docs/_static/fonts/FreightSans/freight-sans-light-italic.woff deleted file mode 100644 index beda58d..0000000 Binary files a/docs/_static/fonts/FreightSans/freight-sans-light-italic.woff and /dev/null differ diff --git a/docs/_static/fonts/FreightSans/freight-sans-light-italic.woff2 b/docs/_static/fonts/FreightSans/freight-sans-light-italic.woff2 deleted file mode 100644 index e2fa013..0000000 Binary files a/docs/_static/fonts/FreightSans/freight-sans-light-italic.woff2 and /dev/null differ diff --git a/docs/_static/fonts/FreightSans/freight-sans-light.woff b/docs/_static/fonts/FreightSans/freight-sans-light.woff deleted file mode 100644 index 226a0bf..0000000 Binary files a/docs/_static/fonts/FreightSans/freight-sans-light.woff and /dev/null differ diff --git a/docs/_static/fonts/FreightSans/freight-sans-light.woff2 b/docs/_static/fonts/FreightSans/freight-sans-light.woff2 deleted file mode 
100644 index 6d8ff2c..0000000 Binary files a/docs/_static/fonts/FreightSans/freight-sans-light.woff2 and /dev/null differ diff --git a/docs/_static/fonts/FreightSans/freight-sans-medium-italic.woff b/docs/_static/fonts/FreightSans/freight-sans-medium-italic.woff deleted file mode 100644 index a42115d..0000000 Binary files a/docs/_static/fonts/FreightSans/freight-sans-medium-italic.woff and /dev/null differ diff --git a/docs/_static/fonts/FreightSans/freight-sans-medium-italic.woff2 b/docs/_static/fonts/FreightSans/freight-sans-medium-italic.woff2 deleted file mode 100644 index 16a7713..0000000 Binary files a/docs/_static/fonts/FreightSans/freight-sans-medium-italic.woff2 and /dev/null differ diff --git a/docs/_static/fonts/FreightSans/freight-sans-medium.woff b/docs/_static/fonts/FreightSans/freight-sans-medium.woff deleted file mode 100644 index 5ea3453..0000000 Binary files a/docs/_static/fonts/FreightSans/freight-sans-medium.woff and /dev/null differ diff --git a/docs/_static/fonts/FreightSans/freight-sans-medium.woff2 b/docs/_static/fonts/FreightSans/freight-sans-medium.woff2 deleted file mode 100644 index c58b6a5..0000000 Binary files a/docs/_static/fonts/FreightSans/freight-sans-medium.woff2 and /dev/null differ diff --git a/docs/_static/fonts/IBMPlexMono/IBMPlexMono-Light.woff b/docs/_static/fonts/IBMPlexMono/IBMPlexMono-Light.woff deleted file mode 100644 index cf37a5c..0000000 Binary files a/docs/_static/fonts/IBMPlexMono/IBMPlexMono-Light.woff and /dev/null differ diff --git a/docs/_static/fonts/IBMPlexMono/IBMPlexMono-Light.woff2 b/docs/_static/fonts/IBMPlexMono/IBMPlexMono-Light.woff2 deleted file mode 100644 index 955a6ea..0000000 Binary files a/docs/_static/fonts/IBMPlexMono/IBMPlexMono-Light.woff2 and /dev/null differ diff --git a/docs/_static/fonts/IBMPlexMono/IBMPlexMono-Medium.woff b/docs/_static/fonts/IBMPlexMono/IBMPlexMono-Medium.woff deleted file mode 100644 index fc65a67..0000000 Binary files 
a/docs/_static/fonts/IBMPlexMono/IBMPlexMono-Medium.woff and /dev/null differ diff --git a/docs/_static/fonts/IBMPlexMono/IBMPlexMono-Medium.woff2 b/docs/_static/fonts/IBMPlexMono/IBMPlexMono-Medium.woff2 deleted file mode 100644 index c352e40..0000000 Binary files a/docs/_static/fonts/IBMPlexMono/IBMPlexMono-Medium.woff2 and /dev/null differ diff --git a/docs/_static/fonts/IBMPlexMono/IBMPlexMono-Regular.woff b/docs/_static/fonts/IBMPlexMono/IBMPlexMono-Regular.woff deleted file mode 100644 index 7d63d89..0000000 Binary files a/docs/_static/fonts/IBMPlexMono/IBMPlexMono-Regular.woff and /dev/null differ diff --git a/docs/_static/fonts/IBMPlexMono/IBMPlexMono-Regular.woff2 b/docs/_static/fonts/IBMPlexMono/IBMPlexMono-Regular.woff2 deleted file mode 100644 index d0d7ded..0000000 Binary files a/docs/_static/fonts/IBMPlexMono/IBMPlexMono-Regular.woff2 and /dev/null differ diff --git a/docs/_static/fonts/IBMPlexMono/IBMPlexMono-SemiBold.woff b/docs/_static/fonts/IBMPlexMono/IBMPlexMono-SemiBold.woff deleted file mode 100644 index 1da7753..0000000 Binary files a/docs/_static/fonts/IBMPlexMono/IBMPlexMono-SemiBold.woff and /dev/null differ diff --git a/docs/_static/fonts/IBMPlexMono/IBMPlexMono-SemiBold.woff2 b/docs/_static/fonts/IBMPlexMono/IBMPlexMono-SemiBold.woff2 deleted file mode 100644 index 79dffdb..0000000 Binary files a/docs/_static/fonts/IBMPlexMono/IBMPlexMono-SemiBold.woff2 and /dev/null differ diff --git a/docs/_static/fonts/Inconsolata/Inconsolata.woff2 b/docs/_static/fonts/Inconsolata/Inconsolata.woff2 deleted file mode 100644 index 5d7a78e..0000000 Binary files a/docs/_static/fonts/Inconsolata/Inconsolata.woff2 and /dev/null differ diff --git a/docs/_static/fonts/UCity/UCity-Light.woff2 b/docs/_static/fonts/UCity/UCity-Light.woff2 deleted file mode 100644 index 27ba105..0000000 Binary files a/docs/_static/fonts/UCity/UCity-Light.woff2 and /dev/null differ diff --git a/docs/_static/fonts/UCity/UCity-Regular.woff2 
b/docs/_static/fonts/UCity/UCity-Regular.woff2 deleted file mode 100644 index 86aafa8..0000000 Binary files a/docs/_static/fonts/UCity/UCity-Regular.woff2 and /dev/null differ diff --git a/docs/_static/fonts/UCity/UCity-Semibold.woff2 b/docs/_static/fonts/UCity/UCity-Semibold.woff2 deleted file mode 100644 index 50be9a4..0000000 Binary files a/docs/_static/fonts/UCity/UCity-Semibold.woff2 and /dev/null differ diff --git a/docs/_static/images/accelerator/ipus/profiler.png b/docs/_static/images/accelerator/ipus/profiler.png deleted file mode 100644 index cbed276..0000000 Binary files a/docs/_static/images/accelerator/ipus/profiler.png and /dev/null differ diff --git a/docs/_static/images/arrow-down-orange.svg b/docs/_static/images/arrow-down-orange.svg deleted file mode 100644 index 99b0e57..0000000 --- a/docs/_static/images/arrow-down-orange.svg +++ /dev/null @@ -1,19 +0,0 @@ - - - - Group 5 - Created with Sketch. - - - - - - - - - - - - - - \ No newline at end of file diff --git a/docs/_static/images/arrow-right-with-tail.svg b/docs/_static/images/arrow-right-with-tail.svg deleted file mode 100644 index f6e85bb..0000000 --- a/docs/_static/images/arrow-right-with-tail.svg +++ /dev/null @@ -1,19 +0,0 @@ - - - - Page 1 - Created with Sketch. - - - - - - - - - - - - - - \ No newline at end of file diff --git a/docs/_static/images/benchmarks/figure-parity-times.png b/docs/_static/images/benchmarks/figure-parity-times.png deleted file mode 100644 index 2e8c589..0000000 Binary files a/docs/_static/images/benchmarks/figure-parity-times.png and /dev/null differ diff --git a/docs/_static/images/chevron-down-black.svg b/docs/_static/images/chevron-down-black.svg deleted file mode 100644 index 097bc07..0000000 --- a/docs/_static/images/chevron-down-black.svg +++ /dev/null @@ -1,16 +0,0 @@ - - - Created with Sketch. 
- - - - - - - - - - - - - diff --git a/docs/_static/images/chevron-down-grey.svg b/docs/_static/images/chevron-down-grey.svg deleted file mode 100644 index 82d6514..0000000 --- a/docs/_static/images/chevron-down-grey.svg +++ /dev/null @@ -1,18 +0,0 @@ - - - - -Created with Sketch. - - - - - - - - - - - - diff --git a/docs/_static/images/chevron-down-orange.svg b/docs/_static/images/chevron-down-orange.svg deleted file mode 100644 index d993c72..0000000 --- a/docs/_static/images/chevron-down-orange.svg +++ /dev/null @@ -1,16 +0,0 @@ - - - Created with Sketch. - - - - - - - - - - - - - diff --git a/docs/_static/images/chevron-down-white.svg b/docs/_static/images/chevron-down-white.svg deleted file mode 100644 index e6c94e2..0000000 --- a/docs/_static/images/chevron-down-white.svg +++ /dev/null @@ -1,16 +0,0 @@ - - - Created with Sketch. - - - - - - - - - - - - - diff --git a/docs/_static/images/chevron-right-orange.svg b/docs/_static/images/chevron-right-orange.svg deleted file mode 100644 index b43c4f7..0000000 --- a/docs/_static/images/chevron-right-orange.svg +++ /dev/null @@ -1,17 +0,0 @@ - - - - -Page 1 -Created with Sketch. - - - - - - - - - - diff --git a/docs/_static/images/chevron-right-white.svg b/docs/_static/images/chevron-right-white.svg deleted file mode 100644 index dd9e77f..0000000 --- a/docs/_static/images/chevron-right-white.svg +++ /dev/null @@ -1,17 +0,0 @@ - - - - -Page 1 -Created with Sketch. - - - - - - - - - - \ No newline at end of file diff --git a/docs/_static/images/home-footer-background.jpg b/docs/_static/images/home-footer-background.jpg deleted file mode 100644 index b307bb5..0000000 Binary files a/docs/_static/images/home-footer-background.jpg and /dev/null differ diff --git a/docs/_static/images/icon-close.svg b/docs/_static/images/icon-close.svg deleted file mode 100644 index 348964e..0000000 --- a/docs/_static/images/icon-close.svg +++ /dev/null @@ -1,21 +0,0 @@ - - - - Page 1 - Created with Sketch. 
- - - - - - - - - - - - - - - - \ No newline at end of file diff --git a/docs/_static/images/icon-menu-dots-dark.svg b/docs/_static/images/icon-menu-dots-dark.svg deleted file mode 100644 index fa2ad04..0000000 --- a/docs/_static/images/icon-menu-dots-dark.svg +++ /dev/null @@ -1,42 +0,0 @@ - - - - Page 1 - Created with Sketch. - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - \ No newline at end of file diff --git a/docs/_static/images/lightning_examples/augmentation_kornia.svg b/docs/_static/images/lightning_examples/augmentation_kornia.svg deleted file mode 100644 index 481762a..0000000 --- a/docs/_static/images/lightning_examples/augmentation_kornia.svg +++ /dev/null @@ -1,3 +0,0 @@ - - - diff --git a/docs/_static/images/logo-facebook-dark.svg b/docs/_static/images/logo-facebook-dark.svg deleted file mode 100644 index cff1791..0000000 --- a/docs/_static/images/logo-facebook-dark.svg +++ /dev/null @@ -1,8 +0,0 @@ - - - - - - diff --git a/docs/_static/images/logo-icon.svg b/docs/_static/images/logo-icon.svg deleted file mode 100644 index a3ff2ee..0000000 --- a/docs/_static/images/logo-icon.svg +++ /dev/null @@ -1,62 +0,0 @@ - - - - - - image/svg+xml - - - - - - - - - - diff --git a/docs/_static/images/logo-large.svg b/docs/_static/images/logo-large.svg deleted file mode 100644 index 4a6cd73..0000000 --- a/docs/_static/images/logo-large.svg +++ /dev/null @@ -1,61 +0,0 @@ - - - - - - image/svg+xml - - - - - - - - - diff --git a/docs/_static/images/logo-lightning-large.svg b/docs/_static/images/logo-lightning-large.svg deleted file mode 100644 index 4a6cd73..0000000 --- a/docs/_static/images/logo-lightning-large.svg +++ /dev/null @@ -1,61 +0,0 @@ - - - - - - image/svg+xml - - - - - - - - - diff --git a/docs/_static/images/logo-pytorch-dark.svg b/docs/_static/images/logo-pytorch-dark.svg deleted file mode 100644 index 9b4c1a5..0000000 --- a/docs/_static/images/logo-pytorch-dark.svg +++ /dev/null @@ -1,30 +0,0 @@ - - - - - - - - - - - - - - - - 
- - - - diff --git a/docs/_static/images/logo-pytorch-icon.svg b/docs/_static/images/logo-pytorch-icon.svg deleted file mode 100644 index 575f682..0000000 --- a/docs/_static/images/logo-pytorch-icon.svg +++ /dev/null @@ -1,12 +0,0 @@ - - - - - - - - - diff --git a/docs/_static/images/logo-pytorch.svg b/docs/_static/images/logo-pytorch.svg deleted file mode 100644 index f8d44b9..0000000 --- a/docs/_static/images/logo-pytorch.svg +++ /dev/null @@ -1,31 +0,0 @@ - - - - - - - - - - - - - - - - - - - - diff --git a/docs/_static/images/logo-twitter-dark.svg b/docs/_static/images/logo-twitter-dark.svg deleted file mode 100644 index 1572570..0000000 --- a/docs/_static/images/logo-twitter-dark.svg +++ /dev/null @@ -1,16 +0,0 @@ - - - - - - - - diff --git a/docs/_static/images/logo-youtube-dark.svg b/docs/_static/images/logo-youtube-dark.svg deleted file mode 100644 index e3cfedd..0000000 --- a/docs/_static/images/logo-youtube-dark.svg +++ /dev/null @@ -1,21 +0,0 @@ - - - - - - - - - - - - - - - - - - - - - diff --git a/docs/_static/images/pytorch-colab.svg b/docs/_static/images/pytorch-colab.svg deleted file mode 100644 index 2ab15e2..0000000 --- a/docs/_static/images/pytorch-colab.svg +++ /dev/null @@ -1,24 +0,0 @@ - - - - - - - - - - - - diff --git a/docs/_static/images/pytorch-download.svg b/docs/_static/images/pytorch-download.svg deleted file mode 100644 index cc37d63..0000000 --- a/docs/_static/images/pytorch-download.svg +++ /dev/null @@ -1,10 +0,0 @@ - - - - - - diff --git a/docs/_static/images/pytorch-github.svg b/docs/_static/images/pytorch-github.svg deleted file mode 100644 index 2c2570d..0000000 --- a/docs/_static/images/pytorch-github.svg +++ /dev/null @@ -1,15 +0,0 @@ - - - - - - diff --git a/docs/_static/images/pytorch-x.svg b/docs/_static/images/pytorch-x.svg deleted file mode 100644 index 8207af4..0000000 --- a/docs/_static/images/pytorch-x.svg +++ /dev/null @@ -1,10 +0,0 @@ - - - - - - - diff --git a/docs/_static/images/search-icon.svg 
b/docs/_static/images/search-icon.svg deleted file mode 100644 index 32b597e..0000000 --- a/docs/_static/images/search-icon.svg +++ /dev/null @@ -1,19 +0,0 @@ - - - - Created with Sketch. - - - - - - - - - - - - - - - diff --git a/docs/_static/images/trainer/lr_finder.png b/docs/_static/images/trainer/lr_finder.png deleted file mode 100644 index bd1667b..0000000 Binary files a/docs/_static/images/trainer/lr_finder.png and /dev/null differ diff --git a/docs/_static/images/view-page-source-icon.svg b/docs/_static/images/view-page-source-icon.svg deleted file mode 100644 index 8477adf..0000000 --- a/docs/_static/images/view-page-source-icon.svg +++ /dev/null @@ -1,13 +0,0 @@ - - - - - - - - - - diff --git a/docs/_static/jquery-3.5.1.js b/docs/_static/jquery-3.5.1.js deleted file mode 100644 index 5093733..0000000 --- a/docs/_static/jquery-3.5.1.js +++ /dev/null @@ -1,10872 +0,0 @@ -/*! - * jQuery JavaScript Library v3.5.1 - * https://jquery.com/ - * - * Includes Sizzle.js - * https://sizzlejs.com/ - * - * Copyright JS Foundation and other contributors - * Released under the MIT license - * https://jquery.org/license - * - * Date: 2020-05-04T22:49Z - */ -( function( global, factory ) { - - "use strict"; - - if ( typeof module === "object" && typeof module.exports === "object" ) { - - // For CommonJS and CommonJS-like environments where a proper `window` - // is present, execute the factory and get jQuery. - // For environments that do not have a `window` with a `document` - // (such as Node.js), expose a factory as module.exports. - // This accentuates the need for the creation of a real `window`. - // e.g. var jQuery = require("jquery")(window); - // See ticket #14549 for more info. - module.exports = global.document ? 
- factory( global, true ) : - function( w ) { - if ( !w.document ) { - throw new Error( "jQuery requires a window with a document" ); - } - return factory( w ); - }; - } else { - factory( global ); - } - -// Pass this if window is not defined yet -} )( typeof window !== "undefined" ? window : this, function( window, noGlobal ) { - -// Edge <= 12 - 13+, Firefox <=18 - 45+, IE 10 - 11, Safari 5.1 - 9+, iOS 6 - 9.1 -// throw exceptions when non-strict code (e.g., ASP.NET 4.5) accesses strict mode -// arguments.callee.caller (trac-13335). But as of jQuery 3.0 (2016), strict mode should be common -// enough that all such attempts are guarded in a try block. -"use strict"; - -var arr = []; - -var getProto = Object.getPrototypeOf; - -var slice = arr.slice; - -var flat = arr.flat ? function( array ) { - return arr.flat.call( array ); -} : function( array ) { - return arr.concat.apply( [], array ); -}; - - -var push = arr.push; - -var indexOf = arr.indexOf; - -var class2type = {}; - -var toString = class2type.toString; - -var hasOwn = class2type.hasOwnProperty; - -var fnToString = hasOwn.toString; - -var ObjectFunctionString = fnToString.call( Object ); - -var support = {}; - -var isFunction = function isFunction( obj ) { - - // Support: Chrome <=57, Firefox <=52 - // In some browsers, typeof returns "function" for HTML elements - // (i.e., `typeof document.createElement( "object" ) === "function"`). - // We don't want to classify *any* DOM node as a function. 
- return typeof obj === "function" && typeof obj.nodeType !== "number"; - }; - - -var isWindow = function isWindow( obj ) { - return obj != null && obj === obj.window; - }; - - -var document = window.document; - - - - var preservedScriptAttributes = { - type: true, - src: true, - nonce: true, - noModule: true - }; - - function DOMEval( code, node, doc ) { - doc = doc || document; - - var i, val, - script = doc.createElement( "script" ); - - script.text = code; - if ( node ) { - for ( i in preservedScriptAttributes ) { - - // Support: Firefox 64+, Edge 18+ - // Some browsers don't support the "nonce" property on scripts. - // On the other hand, just using `getAttribute` is not enough as - // the `nonce` attribute is reset to an empty string whenever it - // becomes browsing-context connected. - // See https://github.com/whatwg/html/issues/2369 - // See https://html.spec.whatwg.org/#nonce-attributes - // The `node.getAttribute` check was added for the sake of - // `jQuery.globalEval` so that it can fake a nonce-containing node - // via an object. - val = node[ i ] || node.getAttribute && node.getAttribute( i ); - if ( val ) { - script.setAttribute( i, val ); - } - } - } - doc.head.appendChild( script ).parentNode.removeChild( script ); - } - - -function toType( obj ) { - if ( obj == null ) { - return obj + ""; - } - - // Support: Android <=2.3 only (functionish RegExp) - return typeof obj === "object" || typeof obj === "function" ? 
- class2type[ toString.call( obj ) ] || "object" : - typeof obj; -} -/* global Symbol */ -// Defining this global in .eslintrc.json would create a danger of using the global -// unguarded in another place, it seems safer to define global only for this module - - - -var - version = "3.5.1", - - // Define a local copy of jQuery - jQuery = function( selector, context ) { - - // The jQuery object is actually just the init constructor 'enhanced' - // Need init if jQuery is called (just allow error to be thrown if not included) - return new jQuery.fn.init( selector, context ); - }; - -jQuery.fn = jQuery.prototype = { - - // The current version of jQuery being used - jquery: version, - - constructor: jQuery, - - // The default length of a jQuery object is 0 - length: 0, - - toArray: function() { - return slice.call( this ); - }, - - // Get the Nth element in the matched element set OR - // Get the whole matched element set as a clean array - get: function( num ) { - - // Return all the elements in a clean array - if ( num == null ) { - return slice.call( this ); - } - - // Return just the one element from the set - return num < 0 ? this[ num + this.length ] : this[ num ]; - }, - - // Take an array of elements and push it onto the stack - // (returning the new matched element set) - pushStack: function( elems ) { - - // Build a new jQuery matched element set - var ret = jQuery.merge( this.constructor(), elems ); - - // Add the old object onto the stack (as a reference) - ret.prevObject = this; - - // Return the newly-formed element set - return ret; - }, - - // Execute a callback for every element in the matched set. 
- each: function( callback ) { - return jQuery.each( this, callback ); - }, - - map: function( callback ) { - return this.pushStack( jQuery.map( this, function( elem, i ) { - return callback.call( elem, i, elem ); - } ) ); - }, - - slice: function() { - return this.pushStack( slice.apply( this, arguments ) ); - }, - - first: function() { - return this.eq( 0 ); - }, - - last: function() { - return this.eq( -1 ); - }, - - even: function() { - return this.pushStack( jQuery.grep( this, function( _elem, i ) { - return ( i + 1 ) % 2; - } ) ); - }, - - odd: function() { - return this.pushStack( jQuery.grep( this, function( _elem, i ) { - return i % 2; - } ) ); - }, - - eq: function( i ) { - var len = this.length, - j = +i + ( i < 0 ? len : 0 ); - return this.pushStack( j >= 0 && j < len ? [ this[ j ] ] : [] ); - }, - - end: function() { - return this.prevObject || this.constructor(); - }, - - // For internal use only. - // Behaves like an Array's method, not like a jQuery method. - push: push, - sort: arr.sort, - splice: arr.splice -}; - -jQuery.extend = jQuery.fn.extend = function() { - var options, name, src, copy, copyIsArray, clone, - target = arguments[ 0 ] || {}, - i = 1, - length = arguments.length, - deep = false; - - // Handle a deep copy situation - if ( typeof target === "boolean" ) { - deep = target; - - // Skip the boolean and the target - target = arguments[ i ] || {}; - i++; - } - - // Handle case when target is a string or something (possible in deep copy) - if ( typeof target !== "object" && !isFunction( target ) ) { - target = {}; - } - - // Extend jQuery itself if only one argument is passed - if ( i === length ) { - target = this; - i--; - } - - for ( ; i < length; i++ ) { - - // Only deal with non-null/undefined values - if ( ( options = arguments[ i ] ) != null ) { - - // Extend the base object - for ( name in options ) { - copy = options[ name ]; - - // Prevent Object.prototype pollution - // Prevent never-ending loop - if ( name === "__proto__" || 
target === copy ) { - continue; - } - - // Recurse if we're merging plain objects or arrays - if ( deep && copy && ( jQuery.isPlainObject( copy ) || - ( copyIsArray = Array.isArray( copy ) ) ) ) { - src = target[ name ]; - - // Ensure proper type for the source value - if ( copyIsArray && !Array.isArray( src ) ) { - clone = []; - } else if ( !copyIsArray && !jQuery.isPlainObject( src ) ) { - clone = {}; - } else { - clone = src; - } - copyIsArray = false; - - // Never move original objects, clone them - target[ name ] = jQuery.extend( deep, clone, copy ); - - // Don't bring in undefined values - } else if ( copy !== undefined ) { - target[ name ] = copy; - } - } - } - } - - // Return the modified object - return target; -}; - -jQuery.extend( { - - // Unique for each copy of jQuery on the page - expando: "jQuery" + ( version + Math.random() ).replace( /\D/g, "" ), - - // Assume jQuery is ready without the ready module - isReady: true, - - error: function( msg ) { - throw new Error( msg ); - }, - - noop: function() {}, - - isPlainObject: function( obj ) { - var proto, Ctor; - - // Detect obvious negatives - // Use toString instead of jQuery.type to catch host objects - if ( !obj || toString.call( obj ) !== "[object Object]" ) { - return false; - } - - proto = getProto( obj ); - - // Objects with no prototype (e.g., `Object.create( null )`) are plain - if ( !proto ) { - return true; - } - - // Objects with prototype are plain iff they were constructed by a global Object function - Ctor = hasOwn.call( proto, "constructor" ) && proto.constructor; - return typeof Ctor === "function" && fnToString.call( Ctor ) === ObjectFunctionString; - }, - - isEmptyObject: function( obj ) { - var name; - - for ( name in obj ) { - return false; - } - return true; - }, - - // Evaluates a script in a provided context; falls back to the global one - // if not specified. 
- globalEval: function( code, options, doc ) { - DOMEval( code, { nonce: options && options.nonce }, doc ); - }, - - each: function( obj, callback ) { - var length, i = 0; - - if ( isArrayLike( obj ) ) { - length = obj.length; - for ( ; i < length; i++ ) { - if ( callback.call( obj[ i ], i, obj[ i ] ) === false ) { - break; - } - } - } else { - for ( i in obj ) { - if ( callback.call( obj[ i ], i, obj[ i ] ) === false ) { - break; - } - } - } - - return obj; - }, - - // results is for internal usage only - makeArray: function( arr, results ) { - var ret = results || []; - - if ( arr != null ) { - if ( isArrayLike( Object( arr ) ) ) { - jQuery.merge( ret, - typeof arr === "string" ? - [ arr ] : arr - ); - } else { - push.call( ret, arr ); - } - } - - return ret; - }, - - inArray: function( elem, arr, i ) { - return arr == null ? -1 : indexOf.call( arr, elem, i ); - }, - - // Support: Android <=4.0 only, PhantomJS 1 only - // push.apply(_, arraylike) throws on ancient WebKit - merge: function( first, second ) { - var len = +second.length, - j = 0, - i = first.length; - - for ( ; j < len; j++ ) { - first[ i++ ] = second[ j ]; - } - - first.length = i; - - return first; - }, - - grep: function( elems, callback, invert ) { - var callbackInverse, - matches = [], - i = 0, - length = elems.length, - callbackExpect = !invert; - - // Go through the array, only saving the items - // that pass the validator function - for ( ; i < length; i++ ) { - callbackInverse = !callback( elems[ i ], i ); - if ( callbackInverse !== callbackExpect ) { - matches.push( elems[ i ] ); - } - } - - return matches; - }, - - // arg is for internal usage only - map: function( elems, callback, arg ) { - var length, value, - i = 0, - ret = []; - - // Go through the array, translating each of the items to their new values - if ( isArrayLike( elems ) ) { - length = elems.length; - for ( ; i < length; i++ ) { - value = callback( elems[ i ], i, arg ); - - if ( value != null ) { - ret.push( value ); - } - 
} - - // Go through every key on the object, - } else { - for ( i in elems ) { - value = callback( elems[ i ], i, arg ); - - if ( value != null ) { - ret.push( value ); - } - } - } - - // Flatten any nested arrays - return flat( ret ); - }, - - // A global GUID counter for objects - guid: 1, - - // jQuery.support is not used in Core but other projects attach their - // properties to it so it needs to exist. - support: support -} ); - -if ( typeof Symbol === "function" ) { - jQuery.fn[ Symbol.iterator ] = arr[ Symbol.iterator ]; -} - -// Populate the class2type map -jQuery.each( "Boolean Number String Function Array Date RegExp Object Error Symbol".split( " " ), -function( _i, name ) { - class2type[ "[object " + name + "]" ] = name.toLowerCase(); -} ); - -function isArrayLike( obj ) { - - // Support: real iOS 8.2 only (not reproducible in simulator) - // `in` check used to prevent JIT error (gh-2145) - // hasOwn isn't used here due to false negatives - // regarding Nodelist length in IE - var length = !!obj && "length" in obj && obj.length, - type = toType( obj ); - - if ( isFunction( obj ) || isWindow( obj ) ) { - return false; - } - - return type === "array" || length === 0 || - typeof length === "number" && length > 0 && ( length - 1 ) in obj; -} -var Sizzle = -/*! 
- * Sizzle CSS Selector Engine v2.3.5 - * https://sizzlejs.com/ - * - * Copyright JS Foundation and other contributors - * Released under the MIT license - * https://js.foundation/ - * - * Date: 2020-03-14 - */ -( function( window ) { -var i, - support, - Expr, - getText, - isXML, - tokenize, - compile, - select, - outermostContext, - sortInput, - hasDuplicate, - - // Local document vars - setDocument, - document, - docElem, - documentIsHTML, - rbuggyQSA, - rbuggyMatches, - matches, - contains, - - // Instance-specific data - expando = "sizzle" + 1 * new Date(), - preferredDoc = window.document, - dirruns = 0, - done = 0, - classCache = createCache(), - tokenCache = createCache(), - compilerCache = createCache(), - nonnativeSelectorCache = createCache(), - sortOrder = function( a, b ) { - if ( a === b ) { - hasDuplicate = true; - } - return 0; - }, - - // Instance methods - hasOwn = ( {} ).hasOwnProperty, - arr = [], - pop = arr.pop, - pushNative = arr.push, - push = arr.push, - slice = arr.slice, - - // Use a stripped-down indexOf as it's faster than native - // https://jsperf.com/thor-indexof-vs-for/5 - indexOf = function( list, elem ) { - var i = 0, - len = list.length; - for ( ; i < len; i++ ) { - if ( list[ i ] === elem ) { - return i; - } - } - return -1; - }, - - booleans = "checked|selected|async|autofocus|autoplay|controls|defer|disabled|hidden|" + - "ismap|loop|multiple|open|readonly|required|scoped", - - // Regular expressions - - // http://www.w3.org/TR/css3-selectors/#whitespace - whitespace = "[\\x20\\t\\r\\n\\f]", - - // https://www.w3.org/TR/css-syntax-3/#ident-token-diagram - identifier = "(?:\\\\[\\da-fA-F]{1,6}" + whitespace + - "?|\\\\[^\\r\\n\\f]|[\\w-]|[^\0-\\x7f])+", - - // Attribute selectors: http://www.w3.org/TR/selectors/#attribute-selectors - attributes = "\\[" + whitespace + "*(" + identifier + ")(?:" + whitespace + - - // Operator (capture 2) - "*([*^$|!~]?=)" + whitespace + - - // "Attribute values must be CSS identifiers [capture 5] 
- // or strings [capture 3 or capture 4]" - "*(?:'((?:\\\\.|[^\\\\'])*)'|\"((?:\\\\.|[^\\\\\"])*)\"|(" + identifier + "))|)" + - whitespace + "*\\]", - - pseudos = ":(" + identifier + ")(?:\\((" + - - // To reduce the number of selectors needing tokenize in the preFilter, prefer arguments: - // 1. quoted (capture 3; capture 4 or capture 5) - "('((?:\\\\.|[^\\\\'])*)'|\"((?:\\\\.|[^\\\\\"])*)\")|" + - - // 2. simple (capture 6) - "((?:\\\\.|[^\\\\()[\\]]|" + attributes + ")*)|" + - - // 3. anything else (capture 2) - ".*" + - ")\\)|)", - - // Leading and non-escaped trailing whitespace, capturing some non-whitespace characters preceding the latter - rwhitespace = new RegExp( whitespace + "+", "g" ), - rtrim = new RegExp( "^" + whitespace + "+|((?:^|[^\\\\])(?:\\\\.)*)" + - whitespace + "+$", "g" ), - - rcomma = new RegExp( "^" + whitespace + "*," + whitespace + "*" ), - rcombinators = new RegExp( "^" + whitespace + "*([>+~]|" + whitespace + ")" + whitespace + - "*" ), - rdescend = new RegExp( whitespace + "|>" ), - - rpseudo = new RegExp( pseudos ), - ridentifier = new RegExp( "^" + identifier + "$" ), - - matchExpr = { - "ID": new RegExp( "^#(" + identifier + ")" ), - "CLASS": new RegExp( "^\\.(" + identifier + ")" ), - "TAG": new RegExp( "^(" + identifier + "|[*])" ), - "ATTR": new RegExp( "^" + attributes ), - "PSEUDO": new RegExp( "^" + pseudos ), - "CHILD": new RegExp( "^:(only|first|last|nth|nth-last)-(child|of-type)(?:\\(" + - whitespace + "*(even|odd|(([+-]|)(\\d*)n|)" + whitespace + "*(?:([+-]|)" + - whitespace + "*(\\d+)|))" + whitespace + "*\\)|)", "i" ), - "bool": new RegExp( "^(?:" + booleans + ")$", "i" ), - - // For use in libraries implementing .is() - // We use this for POS matching in `select` - "needsContext": new RegExp( "^" + whitespace + - "*[>+~]|:(even|odd|eq|gt|lt|nth|first|last)(?:\\(" + whitespace + - "*((?:-\\d)?\\d*)" + whitespace + "*\\)|)(?=[^-]|$)", "i" ) - }, - - rhtml = /HTML$/i, - rinputs = /^(?:input|select|textarea|button)$/i, - 
rheader = /^h\d$/i, - - rnative = /^[^{]+\{\s*\[native \w/, - - // Easily-parseable/retrievable ID or TAG or CLASS selectors - rquickExpr = /^(?:#([\w-]+)|(\w+)|\.([\w-]+))$/, - - rsibling = /[+~]/, - - // CSS escapes - // http://www.w3.org/TR/CSS21/syndata.html#escaped-characters - runescape = new RegExp( "\\\\[\\da-fA-F]{1,6}" + whitespace + "?|\\\\([^\\r\\n\\f])", "g" ), - funescape = function( escape, nonHex ) { - var high = "0x" + escape.slice( 1 ) - 0x10000; - - return nonHex ? - - // Strip the backslash prefix from a non-hex escape sequence - nonHex : - - // Replace a hexadecimal escape sequence with the encoded Unicode code point - // Support: IE <=11+ - // For values outside the Basic Multilingual Plane (BMP), manually construct a - // surrogate pair - high < 0 ? - String.fromCharCode( high + 0x10000 ) : - String.fromCharCode( high >> 10 | 0xD800, high & 0x3FF | 0xDC00 ); - }, - - // CSS string/identifier serialization - // https://drafts.csswg.org/cssom/#common-serializing-idioms - rcssescape = /([\0-\x1f\x7f]|^-?\d)|^-$|[^\0-\x1f\x7f-\uFFFF\w-]/g, - fcssescape = function( ch, asCodePoint ) { - if ( asCodePoint ) { - - // U+0000 NULL becomes U+FFFD REPLACEMENT CHARACTER - if ( ch === "\0" ) { - return "\uFFFD"; - } - - // Control characters and (dependent upon position) numbers get escaped as code points - return ch.slice( 0, -1 ) + "\\" + - ch.charCodeAt( ch.length - 1 ).toString( 16 ) + " "; - } - - // Other potentially-special ASCII characters get backslash-escaped - return "\\" + ch; - }, - - // Used for iframes - // See setDocument() - // Removing the function wrapper causes a "Permission Denied" - // error in IE - unloadHandler = function() { - setDocument(); - }, - - inDisabledFieldset = addCombinator( - function( elem ) { - return elem.disabled === true && elem.nodeName.toLowerCase() === "fieldset"; - }, - { dir: "parentNode", next: "legend" } - ); - -// Optimize for push.apply( _, NodeList ) -try { - push.apply( - ( arr = slice.call( 
preferredDoc.childNodes ) ), - preferredDoc.childNodes - ); - - // Support: Android<4.0 - // Detect silently failing push.apply - // eslint-disable-next-line no-unused-expressions - arr[ preferredDoc.childNodes.length ].nodeType; -} catch ( e ) { - push = { apply: arr.length ? - - // Leverage slice if possible - function( target, els ) { - pushNative.apply( target, slice.call( els ) ); - } : - - // Support: IE<9 - // Otherwise append directly - function( target, els ) { - var j = target.length, - i = 0; - - // Can't trust NodeList.length - while ( ( target[ j++ ] = els[ i++ ] ) ) {} - target.length = j - 1; - } - }; -} - -function Sizzle( selector, context, results, seed ) { - var m, i, elem, nid, match, groups, newSelector, - newContext = context && context.ownerDocument, - - // nodeType defaults to 9, since context defaults to document - nodeType = context ? context.nodeType : 9; - - results = results || []; - - // Return early from calls with invalid selector or context - if ( typeof selector !== "string" || !selector || - nodeType !== 1 && nodeType !== 9 && nodeType !== 11 ) { - - return results; - } - - // Try to shortcut find operations (as opposed to filters) in HTML documents - if ( !seed ) { - setDocument( context ); - context = context || document; - - if ( documentIsHTML ) { - - // If the selector is sufficiently simple, try using a "get*By*" DOM method - // (excepting DocumentFragment context, where the methods don't exist) - if ( nodeType !== 11 && ( match = rquickExpr.exec( selector ) ) ) { - - // ID selector - if ( ( m = match[ 1 ] ) ) { - - // Document context - if ( nodeType === 9 ) { - if ( ( elem = context.getElementById( m ) ) ) { - - // Support: IE, Opera, Webkit - // TODO: identify versions - // getElementById can match elements by name instead of ID - if ( elem.id === m ) { - results.push( elem ); - return results; - } - } else { - return results; - } - - // Element context - } else { - - // Support: IE, Opera, Webkit - // TODO: identify 
versions - // getElementById can match elements by name instead of ID - if ( newContext && ( elem = newContext.getElementById( m ) ) && - contains( context, elem ) && - elem.id === m ) { - - results.push( elem ); - return results; - } - } - - // Type selector - } else if ( match[ 2 ] ) { - push.apply( results, context.getElementsByTagName( selector ) ); - return results; - - // Class selector - } else if ( ( m = match[ 3 ] ) && support.getElementsByClassName && - context.getElementsByClassName ) { - - push.apply( results, context.getElementsByClassName( m ) ); - return results; - } - } - - // Take advantage of querySelectorAll - if ( support.qsa && - !nonnativeSelectorCache[ selector + " " ] && - ( !rbuggyQSA || !rbuggyQSA.test( selector ) ) && - - // Support: IE 8 only - // Exclude object elements - ( nodeType !== 1 || context.nodeName.toLowerCase() !== "object" ) ) { - - newSelector = selector; - newContext = context; - - // qSA considers elements outside a scoping root when evaluating child or - // descendant combinators, which is not what we want. - // In such cases, we work around the behavior by prefixing every selector in the - // list with an ID selector referencing the scope context. - // The technique has to be used as well when a leading combinator is used - // as such selectors are not recognized by querySelectorAll. - // Thanks to Andrew Dupont for this technique. - if ( nodeType === 1 && - ( rdescend.test( selector ) || rcombinators.test( selector ) ) ) { - - // Expand context for sibling selectors - newContext = rsibling.test( selector ) && testContext( context.parentNode ) || - context; - - // We can use :scope instead of the ID hack if the browser - // supports it & if we're not changing the context. 
- if ( newContext !== context || !support.scope ) { - - // Capture the context ID, setting it first if necessary - if ( ( nid = context.getAttribute( "id" ) ) ) { - nid = nid.replace( rcssescape, fcssescape ); - } else { - context.setAttribute( "id", ( nid = expando ) ); - } - } - - // Prefix every selector in the list - groups = tokenize( selector ); - i = groups.length; - while ( i-- ) { - groups[ i ] = ( nid ? "#" + nid : ":scope" ) + " " + - toSelector( groups[ i ] ); - } - newSelector = groups.join( "," ); - } - - try { - push.apply( results, - newContext.querySelectorAll( newSelector ) - ); - return results; - } catch ( qsaError ) { - nonnativeSelectorCache( selector, true ); - } finally { - if ( nid === expando ) { - context.removeAttribute( "id" ); - } - } - } - } - } - - // All others - return select( selector.replace( rtrim, "$1" ), context, results, seed ); -} - -/** - * Create key-value caches of limited size - * @returns {function(string, object)} Returns the Object data after storing it on itself with - * property name the (space-suffixed) string and (if the cache is larger than Expr.cacheLength) - * deleting the oldest entry - */ -function createCache() { - var keys = []; - - function cache( key, value ) { - - // Use (key + " ") to avoid collision with native prototype properties (see Issue #157) - if ( keys.push( key + " " ) > Expr.cacheLength ) { - - // Only keep the most recent entries - delete cache[ keys.shift() ]; - } - return ( cache[ key + " " ] = value ); - } - return cache; -} - -/** - * Mark a function for special use by Sizzle - * @param {Function} fn The function to mark - */ -function markFunction( fn ) { - fn[ expando ] = true; - return fn; -} - -/** - * Support testing using an element - * @param {Function} fn Passed the created element and returns a boolean result - */ -function assert( fn ) { - var el = document.createElement( "fieldset" ); - - try { - return !!fn( el ); - } catch ( e ) { - return false; - } finally { - - // Remove 
from its parent by default - if ( el.parentNode ) { - el.parentNode.removeChild( el ); - } - - // release memory in IE - el = null; - } -} - -/** - * Adds the same handler for all of the specified attrs - * @param {String} attrs Pipe-separated list of attributes - * @param {Function} handler The method that will be applied - */ -function addHandle( attrs, handler ) { - var arr = attrs.split( "|" ), - i = arr.length; - - while ( i-- ) { - Expr.attrHandle[ arr[ i ] ] = handler; - } -} - -/** - * Checks document order of two siblings - * @param {Element} a - * @param {Element} b - * @returns {Number} Returns less than 0 if a precedes b, greater than 0 if a follows b - */ -function siblingCheck( a, b ) { - var cur = b && a, - diff = cur && a.nodeType === 1 && b.nodeType === 1 && - a.sourceIndex - b.sourceIndex; - - // Use IE sourceIndex if available on both nodes - if ( diff ) { - return diff; - } - - // Check if b follows a - if ( cur ) { - while ( ( cur = cur.nextSibling ) ) { - if ( cur === b ) { - return -1; - } - } - } - - return a ? 
1 : -1; -} - -/** - * Returns a function to use in pseudos for input types - * @param {String} type - */ -function createInputPseudo( type ) { - return function( elem ) { - var name = elem.nodeName.toLowerCase(); - return name === "input" && elem.type === type; - }; -} - -/** - * Returns a function to use in pseudos for buttons - * @param {String} type - */ -function createButtonPseudo( type ) { - return function( elem ) { - var name = elem.nodeName.toLowerCase(); - return ( name === "input" || name === "button" ) && elem.type === type; - }; -} - -/** - * Returns a function to use in pseudos for :enabled/:disabled - * @param {Boolean} disabled true for :disabled; false for :enabled - */ -function createDisabledPseudo( disabled ) { - - // Known :disabled false positives: fieldset[disabled] > legend:nth-of-type(n+2) :can-disable - return function( elem ) { - - // Only certain elements can match :enabled or :disabled - // https://html.spec.whatwg.org/multipage/scripting.html#selector-enabled - // https://html.spec.whatwg.org/multipage/scripting.html#selector-disabled - if ( "form" in elem ) { - - // Check for inherited disabledness on relevant non-disabled elements: - // * listed form-associated elements in a disabled fieldset - // https://html.spec.whatwg.org/multipage/forms.html#category-listed - // https://html.spec.whatwg.org/multipage/forms.html#concept-fe-disabled - // * option elements in a disabled optgroup - // https://html.spec.whatwg.org/multipage/forms.html#concept-option-disabled - // All such elements have a "form" property. 
- if ( elem.parentNode && elem.disabled === false ) { - - // Option elements defer to a parent optgroup if present - if ( "label" in elem ) { - if ( "label" in elem.parentNode ) { - return elem.parentNode.disabled === disabled; - } else { - return elem.disabled === disabled; - } - } - - // Support: IE 6 - 11 - // Use the isDisabled shortcut property to check for disabled fieldset ancestors - return elem.isDisabled === disabled || - - // Where there is no isDisabled, check manually - /* jshint -W018 */ - elem.isDisabled !== !disabled && - inDisabledFieldset( elem ) === disabled; - } - - return elem.disabled === disabled; - - // Try to winnow out elements that can't be disabled before trusting the disabled property. - // Some victims get caught in our net (label, legend, menu, track), but it shouldn't - // even exist on them, let alone have a boolean value. - } else if ( "label" in elem ) { - return elem.disabled === disabled; - } - - // Remaining elements are neither :enabled nor :disabled - return false; - }; -} - -/** - * Returns a function to use in pseudos for positionals - * @param {Function} fn - */ -function createPositionalPseudo( fn ) { - return markFunction( function( argument ) { - argument = +argument; - return markFunction( function( seed, matches ) { - var j, - matchIndexes = fn( [], seed.length, argument ), - i = matchIndexes.length; - - // Match elements found at the specified indexes - while ( i-- ) { - if ( seed[ ( j = matchIndexes[ i ] ) ] ) { - seed[ j ] = !( matches[ j ] = seed[ j ] ); - } - } - } ); - } ); -} - -/** - * Checks a node for validity as a Sizzle context - * @param {Element|Object=} context - * @returns {Element|Object|Boolean} The input node if acceptable, otherwise a falsy value - */ -function testContext( context ) { - return context && typeof context.getElementsByTagName !== "undefined" && context; -} - -// Expose support vars for convenience -support = Sizzle.support = {}; - -/** - * Detects XML nodes - * @param 
{Element|Object} elem An element or a document - * @returns {Boolean} True iff elem is a non-HTML XML node - */ -isXML = Sizzle.isXML = function( elem ) { - var namespace = elem.namespaceURI, - docElem = ( elem.ownerDocument || elem ).documentElement; - - // Support: IE <=8 - // Assume HTML when documentElement doesn't yet exist, such as inside loading iframes - // https://bugs.jquery.com/ticket/4833 - return !rhtml.test( namespace || docElem && docElem.nodeName || "HTML" ); -}; - -/** - * Sets document-related variables once based on the current document - * @param {Element|Object} [doc] An element or document object to use to set the document - * @returns {Object} Returns the current document - */ -setDocument = Sizzle.setDocument = function( node ) { - var hasCompare, subWindow, - doc = node ? node.ownerDocument || node : preferredDoc; - - // Return early if doc is invalid or already selected - // Support: IE 11+, Edge 17 - 18+ - // IE/Edge sometimes throw a "Permission denied" error when strict-comparing - // two documents; shallow comparisons work. - // eslint-disable-next-line eqeqeq - if ( doc == document || doc.nodeType !== 9 || !doc.documentElement ) { - return document; - } - - // Update global variables - document = doc; - docElem = document.documentElement; - documentIsHTML = !isXML( document ); - - // Support: IE 9 - 11+, Edge 12 - 18+ - // Accessing iframe documents after unload throws "permission denied" errors (jQuery #13936) - // Support: IE 11+, Edge 17 - 18+ - // IE/Edge sometimes throw a "Permission denied" error when strict-comparing - // two documents; shallow comparisons work. 
- // eslint-disable-next-line eqeqeq - if ( preferredDoc != document && - ( subWindow = document.defaultView ) && subWindow.top !== subWindow ) { - - // Support: IE 11, Edge - if ( subWindow.addEventListener ) { - subWindow.addEventListener( "unload", unloadHandler, false ); - - // Support: IE 9 - 10 only - } else if ( subWindow.attachEvent ) { - subWindow.attachEvent( "onunload", unloadHandler ); - } - } - - // Support: IE 8 - 11+, Edge 12 - 18+, Chrome <=16 - 25 only, Firefox <=3.6 - 31 only, - // Safari 4 - 5 only, Opera <=11.6 - 12.x only - // IE/Edge & older browsers don't support the :scope pseudo-class. - // Support: Safari 6.0 only - // Safari 6.0 supports :scope but it's an alias of :root there. - support.scope = assert( function( el ) { - docElem.appendChild( el ).appendChild( document.createElement( "div" ) ); - return typeof el.querySelectorAll !== "undefined" && - !el.querySelectorAll( ":scope fieldset div" ).length; - } ); - - /* Attributes - ---------------------------------------------------------------------- */ - - // Support: IE<8 - // Verify that getAttribute really returns attributes and not properties - // (excepting IE8 booleans) - support.attributes = assert( function( el ) { - el.className = "i"; - return !el.getAttribute( "className" ); - } ); - - /* getElement(s)By* - ---------------------------------------------------------------------- */ - - // Check if getElementsByTagName("*") returns only elements - support.getElementsByTagName = assert( function( el ) { - el.appendChild( document.createComment( "" ) ); - return !el.getElementsByTagName( "*" ).length; - } ); - - // Support: IE<9 - support.getElementsByClassName = rnative.test( document.getElementsByClassName ); - - // Support: IE<10 - // Check if getElementById returns elements by name - // The broken getElementById methods don't pick up programmatically-set names, - // so use a roundabout getElementsByName test - support.getById = assert( function( el ) { - docElem.appendChild( el 
).id = expando; - return !document.getElementsByName || !document.getElementsByName( expando ).length; - } ); - - // ID filter and find - if ( support.getById ) { - Expr.filter[ "ID" ] = function( id ) { - var attrId = id.replace( runescape, funescape ); - return function( elem ) { - return elem.getAttribute( "id" ) === attrId; - }; - }; - Expr.find[ "ID" ] = function( id, context ) { - if ( typeof context.getElementById !== "undefined" && documentIsHTML ) { - var elem = context.getElementById( id ); - return elem ? [ elem ] : []; - } - }; - } else { - Expr.filter[ "ID" ] = function( id ) { - var attrId = id.replace( runescape, funescape ); - return function( elem ) { - var node = typeof elem.getAttributeNode !== "undefined" && - elem.getAttributeNode( "id" ); - return node && node.value === attrId; - }; - }; - - // Support: IE 6 - 7 only - // getElementById is not reliable as a find shortcut - Expr.find[ "ID" ] = function( id, context ) { - if ( typeof context.getElementById !== "undefined" && documentIsHTML ) { - var node, i, elems, - elem = context.getElementById( id ); - - if ( elem ) { - - // Verify the id attribute - node = elem.getAttributeNode( "id" ); - if ( node && node.value === id ) { - return [ elem ]; - } - - // Fall back on getElementsByName - elems = context.getElementsByName( id ); - i = 0; - while ( ( elem = elems[ i++ ] ) ) { - node = elem.getAttributeNode( "id" ); - if ( node && node.value === id ) { - return [ elem ]; - } - } - } - - return []; - } - }; - } - - // Tag - Expr.find[ "TAG" ] = support.getElementsByTagName ? 
- function( tag, context ) { - if ( typeof context.getElementsByTagName !== "undefined" ) { - return context.getElementsByTagName( tag ); - - // DocumentFragment nodes don't have gEBTN - } else if ( support.qsa ) { - return context.querySelectorAll( tag ); - } - } : - - function( tag, context ) { - var elem, - tmp = [], - i = 0, - - // By happy coincidence, a (broken) gEBTN appears on DocumentFragment nodes too - results = context.getElementsByTagName( tag ); - - // Filter out possible comments - if ( tag === "*" ) { - while ( ( elem = results[ i++ ] ) ) { - if ( elem.nodeType === 1 ) { - tmp.push( elem ); - } - } - - return tmp; - } - return results; - }; - - // Class - Expr.find[ "CLASS" ] = support.getElementsByClassName && function( className, context ) { - if ( typeof context.getElementsByClassName !== "undefined" && documentIsHTML ) { - return context.getElementsByClassName( className ); - } - }; - - /* QSA/matchesSelector - ---------------------------------------------------------------------- */ - - // QSA and matchesSelector support - - // matchesSelector(:active) reports false when true (IE9/Opera 11.5) - rbuggyMatches = []; - - // qSa(:focus) reports false when true (Chrome 21) - // We allow this because of a bug in IE8/9 that throws an error - // whenever `document.activeElement` is accessed on an iframe - // So, we allow :focus to pass through QSA all the time to avoid the IE error - // See https://bugs.jquery.com/ticket/13378 - rbuggyQSA = []; - - if ( ( support.qsa = rnative.test( document.querySelectorAll ) ) ) { - - // Build QSA regex - // Regex strategy adopted from Diego Perini - assert( function( el ) { - - var input; - - // Select is set to empty string on purpose - // This is to test IE's treatment of not explicitly - // setting a boolean content attribute, - // since its presence should be enough - // https://bugs.jquery.com/ticket/12359 - docElem.appendChild( el ).innerHTML = "" + - ""; - - // Support: IE8, Opera 11-12.16 - // Nothing should 
be selected when empty strings follow ^= or $= or *= - // The test attribute must be unknown in Opera but "safe" for WinRT - // https://msdn.microsoft.com/en-us/library/ie/hh465388.aspx#attribute_section - if ( el.querySelectorAll( "[msallowcapture^='']" ).length ) { - rbuggyQSA.push( "[*^$]=" + whitespace + "*(?:''|\"\")" ); - } - - // Support: IE8 - // Boolean attributes and "value" are not treated correctly - if ( !el.querySelectorAll( "[selected]" ).length ) { - rbuggyQSA.push( "\\[" + whitespace + "*(?:value|" + booleans + ")" ); - } - - // Support: Chrome<29, Android<4.4, Safari<7.0+, iOS<7.0+, PhantomJS<1.9.8+ - if ( !el.querySelectorAll( "[id~=" + expando + "-]" ).length ) { - rbuggyQSA.push( "~=" ); - } - - // Support: IE 11+, Edge 15 - 18+ - // IE 11/Edge don't find elements on a `[name='']` query in some cases. - // Adding a temporary attribute to the document before the selection works - // around the issue. - // Interestingly, IE 10 & older don't seem to have the issue. - input = document.createElement( "input" ); - input.setAttribute( "name", "" ); - el.appendChild( input ); - if ( !el.querySelectorAll( "[name='']" ).length ) { - rbuggyQSA.push( "\\[" + whitespace + "*name" + whitespace + "*=" + - whitespace + "*(?:''|\"\")" ); - } - - // Webkit/Opera - :checked should return selected option elements - // http://www.w3.org/TR/2011/REC-css3-selectors-20110929/#checked - // IE8 throws error here and will not see later tests - if ( !el.querySelectorAll( ":checked" ).length ) { - rbuggyQSA.push( ":checked" ); - } - - // Support: Safari 8+, iOS 8+ - // https://bugs.webkit.org/show_bug.cgi?id=136851 - // In-page `selector#id sibling-combinator selector` fails - if ( !el.querySelectorAll( "a#" + expando + "+*" ).length ) { - rbuggyQSA.push( ".#.+[+~]" ); - } - - // Support: Firefox <=3.6 - 5 only - // Old Firefox doesn't throw on a badly-escaped identifier. 
- el.querySelectorAll( "\\\f" ); - rbuggyQSA.push( "[\\r\\n\\f]" ); - } ); - - assert( function( el ) { - el.innerHTML = "" + - ""; - - // Support: Windows 8 Native Apps - // The type and name attributes are restricted during .innerHTML assignment - var input = document.createElement( "input" ); - input.setAttribute( "type", "hidden" ); - el.appendChild( input ).setAttribute( "name", "D" ); - - // Support: IE8 - // Enforce case-sensitivity of name attribute - if ( el.querySelectorAll( "[name=d]" ).length ) { - rbuggyQSA.push( "name" + whitespace + "*[*^$|!~]?=" ); - } - - // FF 3.5 - :enabled/:disabled and hidden elements (hidden elements are still enabled) - // IE8 throws error here and will not see later tests - if ( el.querySelectorAll( ":enabled" ).length !== 2 ) { - rbuggyQSA.push( ":enabled", ":disabled" ); - } - - // Support: IE9-11+ - // IE's :disabled selector does not pick up the children of disabled fieldsets - docElem.appendChild( el ).disabled = true; - if ( el.querySelectorAll( ":disabled" ).length !== 2 ) { - rbuggyQSA.push( ":enabled", ":disabled" ); - } - - // Support: Opera 10 - 11 only - // Opera 10-11 does not throw on post-comma invalid pseudos - el.querySelectorAll( "*,:x" ); - rbuggyQSA.push( ",.*:" ); - } ); - } - - if ( ( support.matchesSelector = rnative.test( ( matches = docElem.matches || - docElem.webkitMatchesSelector || - docElem.mozMatchesSelector || - docElem.oMatchesSelector || - docElem.msMatchesSelector ) ) ) ) { - - assert( function( el ) { - - // Check to see if it's possible to do matchesSelector - // on a disconnected node (IE 9) - support.disconnectedMatch = matches.call( el, "*" ); - - // This should fail with an exception - // Gecko does not error, returns false instead - matches.call( el, "[s!='']:x" ); - rbuggyMatches.push( "!=", pseudos ); - } ); - } - - rbuggyQSA = rbuggyQSA.length && new RegExp( rbuggyQSA.join( "|" ) ); - rbuggyMatches = rbuggyMatches.length && new RegExp( rbuggyMatches.join( "|" ) ); - - /* Contains 
- ---------------------------------------------------------------------- */ - hasCompare = rnative.test( docElem.compareDocumentPosition ); - - // Element contains another - // Purposefully self-exclusive - // As in, an element does not contain itself - contains = hasCompare || rnative.test( docElem.contains ) ? - function( a, b ) { - var adown = a.nodeType === 9 ? a.documentElement : a, - bup = b && b.parentNode; - return a === bup || !!( bup && bup.nodeType === 1 && ( - adown.contains ? - adown.contains( bup ) : - a.compareDocumentPosition && a.compareDocumentPosition( bup ) & 16 - ) ); - } : - function( a, b ) { - if ( b ) { - while ( ( b = b.parentNode ) ) { - if ( b === a ) { - return true; - } - } - } - return false; - }; - - /* Sorting - ---------------------------------------------------------------------- */ - - // Document order sorting - sortOrder = hasCompare ? - function( a, b ) { - - // Flag for duplicate removal - if ( a === b ) { - hasDuplicate = true; - return 0; - } - - // Sort on method existence if only one input has compareDocumentPosition - var compare = !a.compareDocumentPosition - !b.compareDocumentPosition; - if ( compare ) { - return compare; - } - - // Calculate position if both inputs belong to the same document - // Support: IE 11+, Edge 17 - 18+ - // IE/Edge sometimes throw a "Permission denied" error when strict-comparing - // two documents; shallow comparisons work. - // eslint-disable-next-line eqeqeq - compare = ( a.ownerDocument || a ) == ( b.ownerDocument || b ) ? - a.compareDocumentPosition( b ) : - - // Otherwise we know they are disconnected - 1; - - // Disconnected nodes - if ( compare & 1 || - ( !support.sortDetached && b.compareDocumentPosition( a ) === compare ) ) { - - // Choose the first element that is related to our preferred document - // Support: IE 11+, Edge 17 - 18+ - // IE/Edge sometimes throw a "Permission denied" error when strict-comparing - // two documents; shallow comparisons work. 
- // eslint-disable-next-line eqeqeq - if ( a == document || a.ownerDocument == preferredDoc && - contains( preferredDoc, a ) ) { - return -1; - } - - // Support: IE 11+, Edge 17 - 18+ - // IE/Edge sometimes throw a "Permission denied" error when strict-comparing - // two documents; shallow comparisons work. - // eslint-disable-next-line eqeqeq - if ( b == document || b.ownerDocument == preferredDoc && - contains( preferredDoc, b ) ) { - return 1; - } - - // Maintain original order - return sortInput ? - ( indexOf( sortInput, a ) - indexOf( sortInput, b ) ) : - 0; - } - - return compare & 4 ? -1 : 1; - } : - function( a, b ) { - - // Exit early if the nodes are identical - if ( a === b ) { - hasDuplicate = true; - return 0; - } - - var cur, - i = 0, - aup = a.parentNode, - bup = b.parentNode, - ap = [ a ], - bp = [ b ]; - - // Parentless nodes are either documents or disconnected - if ( !aup || !bup ) { - - // Support: IE 11+, Edge 17 - 18+ - // IE/Edge sometimes throw a "Permission denied" error when strict-comparing - // two documents; shallow comparisons work. - /* eslint-disable eqeqeq */ - return a == document ? -1 : - b == document ? 1 : - /* eslint-enable eqeqeq */ - aup ? -1 : - bup ? 1 : - sortInput ? - ( indexOf( sortInput, a ) - indexOf( sortInput, b ) ) : - 0; - - // If the nodes are siblings, we can do a quick check - } else if ( aup === bup ) { - return siblingCheck( a, b ); - } - - // Otherwise we need full lists of their ancestors for comparison - cur = a; - while ( ( cur = cur.parentNode ) ) { - ap.unshift( cur ); - } - cur = b; - while ( ( cur = cur.parentNode ) ) { - bp.unshift( cur ); - } - - // Walk down the tree looking for a discrepancy - while ( ap[ i ] === bp[ i ] ) { - i++; - } - - return i ? 
- - // Do a sibling check if the nodes have a common ancestor - siblingCheck( ap[ i ], bp[ i ] ) : - - // Otherwise nodes in our document sort first - // Support: IE 11+, Edge 17 - 18+ - // IE/Edge sometimes throw a "Permission denied" error when strict-comparing - // two documents; shallow comparisons work. - /* eslint-disable eqeqeq */ - ap[ i ] == preferredDoc ? -1 : - bp[ i ] == preferredDoc ? 1 : - /* eslint-enable eqeqeq */ - 0; - }; - - return document; -}; - -Sizzle.matches = function( expr, elements ) { - return Sizzle( expr, null, null, elements ); -}; - -Sizzle.matchesSelector = function( elem, expr ) { - setDocument( elem ); - - if ( support.matchesSelector && documentIsHTML && - !nonnativeSelectorCache[ expr + " " ] && - ( !rbuggyMatches || !rbuggyMatches.test( expr ) ) && - ( !rbuggyQSA || !rbuggyQSA.test( expr ) ) ) { - - try { - var ret = matches.call( elem, expr ); - - // IE 9's matchesSelector returns false on disconnected nodes - if ( ret || support.disconnectedMatch || - - // As well, disconnected nodes are said to be in a document - // fragment in IE 9 - elem.document && elem.document.nodeType !== 11 ) { - return ret; - } - } catch ( e ) { - nonnativeSelectorCache( expr, true ); - } - } - - return Sizzle( expr, document, null, [ elem ] ).length > 0; -}; - -Sizzle.contains = function( context, elem ) { - - // Set document vars if needed - // Support: IE 11+, Edge 17 - 18+ - // IE/Edge sometimes throw a "Permission denied" error when strict-comparing - // two documents; shallow comparisons work. - // eslint-disable-next-line eqeqeq - if ( ( context.ownerDocument || context ) != document ) { - setDocument( context ); - } - return contains( context, elem ); -}; - -Sizzle.attr = function( elem, name ) { - - // Set document vars if needed - // Support: IE 11+, Edge 17 - 18+ - // IE/Edge sometimes throw a "Permission denied" error when strict-comparing - // two documents; shallow comparisons work. 
- // eslint-disable-next-line eqeqeq - if ( ( elem.ownerDocument || elem ) != document ) { - setDocument( elem ); - } - - var fn = Expr.attrHandle[ name.toLowerCase() ], - - // Don't get fooled by Object.prototype properties (jQuery #13807) - val = fn && hasOwn.call( Expr.attrHandle, name.toLowerCase() ) ? - fn( elem, name, !documentIsHTML ) : - undefined; - - return val !== undefined ? - val : - support.attributes || !documentIsHTML ? - elem.getAttribute( name ) : - ( val = elem.getAttributeNode( name ) ) && val.specified ? - val.value : - null; -}; - -Sizzle.escape = function( sel ) { - return ( sel + "" ).replace( rcssescape, fcssescape ); -}; - -Sizzle.error = function( msg ) { - throw new Error( "Syntax error, unrecognized expression: " + msg ); -}; - -/** - * Document sorting and removing duplicates - * @param {ArrayLike} results - */ -Sizzle.uniqueSort = function( results ) { - var elem, - duplicates = [], - j = 0, - i = 0; - - // Unless we *know* we can detect duplicates, assume their presence - hasDuplicate = !support.detectDuplicates; - sortInput = !support.sortStable && results.slice( 0 ); - results.sort( sortOrder ); - - if ( hasDuplicate ) { - while ( ( elem = results[ i++ ] ) ) { - if ( elem === results[ i ] ) { - j = duplicates.push( i ); - } - } - while ( j-- ) { - results.splice( duplicates[ j ], 1 ); - } - } - - // Clear input after sorting to release objects - // See https://github.com/jquery/sizzle/pull/225 - sortInput = null; - - return results; -}; - -/** - * Utility function for retrieving the text value of an array of DOM nodes - * @param {Array|Element} elem - */ -getText = Sizzle.getText = function( elem ) { - var node, - ret = "", - i = 0, - nodeType = elem.nodeType; - - if ( !nodeType ) { - - // If no nodeType, this is expected to be an array - while ( ( node = elem[ i++ ] ) ) { - - // Do not traverse comment nodes - ret += getText( node ); - } - } else if ( nodeType === 1 || nodeType === 9 || nodeType === 11 ) { - - // Use textContent 
for elements - // innerText usage removed for consistency of new lines (jQuery #11153) - if ( typeof elem.textContent === "string" ) { - return elem.textContent; - } else { - - // Traverse its children - for ( elem = elem.firstChild; elem; elem = elem.nextSibling ) { - ret += getText( elem ); - } - } - } else if ( nodeType === 3 || nodeType === 4 ) { - return elem.nodeValue; - } - - // Do not include comment or processing instruction nodes - - return ret; -}; - -Expr = Sizzle.selectors = { - - // Can be adjusted by the user - cacheLength: 50, - - createPseudo: markFunction, - - match: matchExpr, - - attrHandle: {}, - - find: {}, - - relative: { - ">": { dir: "parentNode", first: true }, - " ": { dir: "parentNode" }, - "+": { dir: "previousSibling", first: true }, - "~": { dir: "previousSibling" } - }, - - preFilter: { - "ATTR": function( match ) { - match[ 1 ] = match[ 1 ].replace( runescape, funescape ); - - // Move the given value to match[3] whether quoted or unquoted - match[ 3 ] = ( match[ 3 ] || match[ 4 ] || - match[ 5 ] || "" ).replace( runescape, funescape ); - - if ( match[ 2 ] === "~=" ) { - match[ 3 ] = " " + match[ 3 ] + " "; - } - - return match.slice( 0, 4 ); - }, - - "CHILD": function( match ) { - - /* matches from matchExpr["CHILD"] - 1 type (only|nth|...) - 2 what (child|of-type) - 3 argument (even|odd|\d*|\d*n([+-]\d+)?|...) - 4 xn-component of xn+y argument ([+-]?\d*n|) - 5 sign of xn-component - 6 x of xn-component - 7 sign of y-component - 8 y of y-component - */ - match[ 1 ] = match[ 1 ].toLowerCase(); - - if ( match[ 1 ].slice( 0, 3 ) === "nth" ) { - - // nth-* requires argument - if ( !match[ 3 ] ) { - Sizzle.error( match[ 0 ] ); - } - - // numeric x and y parameters for Expr.filter.CHILD - // remember that false/true cast respectively to 0/1 - match[ 4 ] = +( match[ 4 ] ? 
- match[ 5 ] + ( match[ 6 ] || 1 ) : - 2 * ( match[ 3 ] === "even" || match[ 3 ] === "odd" ) ); - match[ 5 ] = +( ( match[ 7 ] + match[ 8 ] ) || match[ 3 ] === "odd" ); - - // other types prohibit arguments - } else if ( match[ 3 ] ) { - Sizzle.error( match[ 0 ] ); - } - - return match; - }, - - "PSEUDO": function( match ) { - var excess, - unquoted = !match[ 6 ] && match[ 2 ]; - - if ( matchExpr[ "CHILD" ].test( match[ 0 ] ) ) { - return null; - } - - // Accept quoted arguments as-is - if ( match[ 3 ] ) { - match[ 2 ] = match[ 4 ] || match[ 5 ] || ""; - - // Strip excess characters from unquoted arguments - } else if ( unquoted && rpseudo.test( unquoted ) && - - // Get excess from tokenize (recursively) - ( excess = tokenize( unquoted, true ) ) && - - // advance to the next closing parenthesis - ( excess = unquoted.indexOf( ")", unquoted.length - excess ) - unquoted.length ) ) { - - // excess is a negative index - match[ 0 ] = match[ 0 ].slice( 0, excess ); - match[ 2 ] = unquoted.slice( 0, excess ); - } - - // Return only captures needed by the pseudo filter method (type and argument) - return match.slice( 0, 3 ); - } - }, - - filter: { - - "TAG": function( nodeNameSelector ) { - var nodeName = nodeNameSelector.replace( runescape, funescape ).toLowerCase(); - return nodeNameSelector === "*" ? 
- function() { - return true; - } : - function( elem ) { - return elem.nodeName && elem.nodeName.toLowerCase() === nodeName; - }; - }, - - "CLASS": function( className ) { - var pattern = classCache[ className + " " ]; - - return pattern || - ( pattern = new RegExp( "(^|" + whitespace + - ")" + className + "(" + whitespace + "|$)" ) ) && classCache( - className, function( elem ) { - return pattern.test( - typeof elem.className === "string" && elem.className || - typeof elem.getAttribute !== "undefined" && - elem.getAttribute( "class" ) || - "" - ); - } ); - }, - - "ATTR": function( name, operator, check ) { - return function( elem ) { - var result = Sizzle.attr( elem, name ); - - if ( result == null ) { - return operator === "!="; - } - if ( !operator ) { - return true; - } - - result += ""; - - /* eslint-disable max-len */ - - return operator === "=" ? result === check : - operator === "!=" ? result !== check : - operator === "^=" ? check && result.indexOf( check ) === 0 : - operator === "*=" ? check && result.indexOf( check ) > -1 : - operator === "$=" ? check && result.slice( -check.length ) === check : - operator === "~=" ? ( " " + result.replace( rwhitespace, " " ) + " " ).indexOf( check ) > -1 : - operator === "|=" ? result === check || result.slice( 0, check.length + 1 ) === check + "-" : - false; - /* eslint-enable max-len */ - - }; - }, - - "CHILD": function( type, what, _argument, first, last ) { - var simple = type.slice( 0, 3 ) !== "nth", - forward = type.slice( -4 ) !== "last", - ofType = what === "of-type"; - - return first === 1 && last === 0 ? - - // Shortcut for :nth-*(n) - function( elem ) { - return !!elem.parentNode; - } : - - function( elem, _context, xml ) { - var cache, uniqueCache, outerCache, node, nodeIndex, start, - dir = simple !== forward ? 
"nextSibling" : "previousSibling", - parent = elem.parentNode, - name = ofType && elem.nodeName.toLowerCase(), - useCache = !xml && !ofType, - diff = false; - - if ( parent ) { - - // :(first|last|only)-(child|of-type) - if ( simple ) { - while ( dir ) { - node = elem; - while ( ( node = node[ dir ] ) ) { - if ( ofType ? - node.nodeName.toLowerCase() === name : - node.nodeType === 1 ) { - - return false; - } - } - - // Reverse direction for :only-* (if we haven't yet done so) - start = dir = type === "only" && !start && "nextSibling"; - } - return true; - } - - start = [ forward ? parent.firstChild : parent.lastChild ]; - - // non-xml :nth-child(...) stores cache data on `parent` - if ( forward && useCache ) { - - // Seek `elem` from a previously-cached index - - // ...in a gzip-friendly way - node = parent; - outerCache = node[ expando ] || ( node[ expando ] = {} ); - - // Support: IE <9 only - // Defend against cloned attroperties (jQuery gh-1709) - uniqueCache = outerCache[ node.uniqueID ] || - ( outerCache[ node.uniqueID ] = {} ); - - cache = uniqueCache[ type ] || []; - nodeIndex = cache[ 0 ] === dirruns && cache[ 1 ]; - diff = nodeIndex && cache[ 2 ]; - node = nodeIndex && parent.childNodes[ nodeIndex ]; - - while ( ( node = ++nodeIndex && node && node[ dir ] || - - // Fallback to seeking `elem` from the start - ( diff = nodeIndex = 0 ) || start.pop() ) ) { - - // When found, cache indexes on `parent` and break - if ( node.nodeType === 1 && ++diff && node === elem ) { - uniqueCache[ type ] = [ dirruns, nodeIndex, diff ]; - break; - } - } - - } else { - - // Use previously-cached element index if available - if ( useCache ) { - - // ...in a gzip-friendly way - node = elem; - outerCache = node[ expando ] || ( node[ expando ] = {} ); - - // Support: IE <9 only - // Defend against cloned attroperties (jQuery gh-1709) - uniqueCache = outerCache[ node.uniqueID ] || - ( outerCache[ node.uniqueID ] = {} ); - - cache = uniqueCache[ type ] || []; - nodeIndex = cache[ 0 
] === dirruns && cache[ 1 ]; - diff = nodeIndex; - } - - // xml :nth-child(...) - // or :nth-last-child(...) or :nth(-last)?-of-type(...) - if ( diff === false ) { - - // Use the same loop as above to seek `elem` from the start - while ( ( node = ++nodeIndex && node && node[ dir ] || - ( diff = nodeIndex = 0 ) || start.pop() ) ) { - - if ( ( ofType ? - node.nodeName.toLowerCase() === name : - node.nodeType === 1 ) && - ++diff ) { - - // Cache the index of each encountered element - if ( useCache ) { - outerCache = node[ expando ] || - ( node[ expando ] = {} ); - - // Support: IE <9 only - // Defend against cloned attroperties (jQuery gh-1709) - uniqueCache = outerCache[ node.uniqueID ] || - ( outerCache[ node.uniqueID ] = {} ); - - uniqueCache[ type ] = [ dirruns, diff ]; - } - - if ( node === elem ) { - break; - } - } - } - } - } - - // Incorporate the offset, then check against cycle size - diff -= last; - return diff === first || ( diff % first === 0 && diff / first >= 0 ); - } - }; - }, - - "PSEUDO": function( pseudo, argument ) { - - // pseudo-class names are case-insensitive - // http://www.w3.org/TR/selectors/#pseudo-classes - // Prioritize by case sensitivity in case custom pseudos are added with uppercase letters - // Remember that setFilters inherits from pseudos - var args, - fn = Expr.pseudos[ pseudo ] || Expr.setFilters[ pseudo.toLowerCase() ] || - Sizzle.error( "unsupported pseudo: " + pseudo ); - - // The user may use createPseudo to indicate that - // arguments are needed to create the filter function - // just as Sizzle does - if ( fn[ expando ] ) { - return fn( argument ); - } - - // But maintain support for old signatures - if ( fn.length > 1 ) { - args = [ pseudo, pseudo, "", argument ]; - return Expr.setFilters.hasOwnProperty( pseudo.toLowerCase() ) ? 
- markFunction( function( seed, matches ) { - var idx, - matched = fn( seed, argument ), - i = matched.length; - while ( i-- ) { - idx = indexOf( seed, matched[ i ] ); - seed[ idx ] = !( matches[ idx ] = matched[ i ] ); - } - } ) : - function( elem ) { - return fn( elem, 0, args ); - }; - } - - return fn; - } - }, - - pseudos: { - - // Potentially complex pseudos - "not": markFunction( function( selector ) { - - // Trim the selector passed to compile - // to avoid treating leading and trailing - // spaces as combinators - var input = [], - results = [], - matcher = compile( selector.replace( rtrim, "$1" ) ); - - return matcher[ expando ] ? - markFunction( function( seed, matches, _context, xml ) { - var elem, - unmatched = matcher( seed, null, xml, [] ), - i = seed.length; - - // Match elements unmatched by `matcher` - while ( i-- ) { - if ( ( elem = unmatched[ i ] ) ) { - seed[ i ] = !( matches[ i ] = elem ); - } - } - } ) : - function( elem, _context, xml ) { - input[ 0 ] = elem; - matcher( input, null, xml, results ); - - // Don't keep the element (issue #299) - input[ 0 ] = null; - return !results.pop(); - }; - } ), - - "has": markFunction( function( selector ) { - return function( elem ) { - return Sizzle( selector, elem ).length > 0; - }; - } ), - - "contains": markFunction( function( text ) { - text = text.replace( runescape, funescape ); - return function( elem ) { - return ( elem.textContent || getText( elem ) ).indexOf( text ) > -1; - }; - } ), - - // "Whether an element is represented by a :lang() selector - // is based solely on the element's language value - // being equal to the identifier C, - // or beginning with the identifier C immediately followed by "-". - // The matching of C against the element's language value is performed case-insensitively. - // The identifier C does not have to be a valid language name." 
- // http://www.w3.org/TR/selectors/#lang-pseudo - "lang": markFunction( function( lang ) { - - // lang value must be a valid identifier - if ( !ridentifier.test( lang || "" ) ) { - Sizzle.error( "unsupported lang: " + lang ); - } - lang = lang.replace( runescape, funescape ).toLowerCase(); - return function( elem ) { - var elemLang; - do { - if ( ( elemLang = documentIsHTML ? - elem.lang : - elem.getAttribute( "xml:lang" ) || elem.getAttribute( "lang" ) ) ) { - - elemLang = elemLang.toLowerCase(); - return elemLang === lang || elemLang.indexOf( lang + "-" ) === 0; - } - } while ( ( elem = elem.parentNode ) && elem.nodeType === 1 ); - return false; - }; - } ), - - // Miscellaneous - "target": function( elem ) { - var hash = window.location && window.location.hash; - return hash && hash.slice( 1 ) === elem.id; - }, - - "root": function( elem ) { - return elem === docElem; - }, - - "focus": function( elem ) { - return elem === document.activeElement && - ( !document.hasFocus || document.hasFocus() ) && - !!( elem.type || elem.href || ~elem.tabIndex ); - }, - - // Boolean properties - "enabled": createDisabledPseudo( false ), - "disabled": createDisabledPseudo( true ), - - "checked": function( elem ) { - - // In CSS3, :checked should return both checked and selected elements - // http://www.w3.org/TR/2011/REC-css3-selectors-20110929/#checked - var nodeName = elem.nodeName.toLowerCase(); - return ( nodeName === "input" && !!elem.checked ) || - ( nodeName === "option" && !!elem.selected ); - }, - - "selected": function( elem ) { - - // Accessing this property makes selected-by-default - // options in Safari work properly - if ( elem.parentNode ) { - // eslint-disable-next-line no-unused-expressions - elem.parentNode.selectedIndex; - } - - return elem.selected === true; - }, - - // Contents - "empty": function( elem ) { - - // http://www.w3.org/TR/selectors/#empty-pseudo - // :empty is negated by element (1) or content nodes (text: 3; cdata: 4; entity ref: 5), - // but 
not by others (comment: 8; processing instruction: 7; etc.) - // nodeType < 6 works because attributes (2) do not appear as children - for ( elem = elem.firstChild; elem; elem = elem.nextSibling ) { - if ( elem.nodeType < 6 ) { - return false; - } - } - return true; - }, - - "parent": function( elem ) { - return !Expr.pseudos[ "empty" ]( elem ); - }, - - // Element/input types - "header": function( elem ) { - return rheader.test( elem.nodeName ); - }, - - "input": function( elem ) { - return rinputs.test( elem.nodeName ); - }, - - "button": function( elem ) { - var name = elem.nodeName.toLowerCase(); - return name === "input" && elem.type === "button" || name === "button"; - }, - - "text": function( elem ) { - var attr; - return elem.nodeName.toLowerCase() === "input" && - elem.type === "text" && - - // Support: IE<8 - // New HTML5 attribute values (e.g., "search") appear with elem.type === "text" - ( ( attr = elem.getAttribute( "type" ) ) == null || - attr.toLowerCase() === "text" ); - }, - - // Position-in-collection - "first": createPositionalPseudo( function() { - return [ 0 ]; - } ), - - "last": createPositionalPseudo( function( _matchIndexes, length ) { - return [ length - 1 ]; - } ), - - "eq": createPositionalPseudo( function( _matchIndexes, length, argument ) { - return [ argument < 0 ? argument + length : argument ]; - } ), - - "even": createPositionalPseudo( function( matchIndexes, length ) { - var i = 0; - for ( ; i < length; i += 2 ) { - matchIndexes.push( i ); - } - return matchIndexes; - } ), - - "odd": createPositionalPseudo( function( matchIndexes, length ) { - var i = 1; - for ( ; i < length; i += 2 ) { - matchIndexes.push( i ); - } - return matchIndexes; - } ), - - "lt": createPositionalPseudo( function( matchIndexes, length, argument ) { - var i = argument < 0 ? - argument + length : - argument > length ? 
- length : - argument; - for ( ; --i >= 0; ) { - matchIndexes.push( i ); - } - return matchIndexes; - } ), - - "gt": createPositionalPseudo( function( matchIndexes, length, argument ) { - var i = argument < 0 ? argument + length : argument; - for ( ; ++i < length; ) { - matchIndexes.push( i ); - } - return matchIndexes; - } ) - } -}; - -Expr.pseudos[ "nth" ] = Expr.pseudos[ "eq" ]; - -// Add button/input type pseudos -for ( i in { radio: true, checkbox: true, file: true, password: true, image: true } ) { - Expr.pseudos[ i ] = createInputPseudo( i ); -} -for ( i in { submit: true, reset: true } ) { - Expr.pseudos[ i ] = createButtonPseudo( i ); -} - -// Easy API for creating new setFilters -function setFilters() {} -setFilters.prototype = Expr.filters = Expr.pseudos; -Expr.setFilters = new setFilters(); - -tokenize = Sizzle.tokenize = function( selector, parseOnly ) { - var matched, match, tokens, type, - soFar, groups, preFilters, - cached = tokenCache[ selector + " " ]; - - if ( cached ) { - return parseOnly ? 
0 : cached.slice( 0 ); - } - - soFar = selector; - groups = []; - preFilters = Expr.preFilter; - - while ( soFar ) { - - // Comma and first run - if ( !matched || ( match = rcomma.exec( soFar ) ) ) { - if ( match ) { - - // Don't consume trailing commas as valid - soFar = soFar.slice( match[ 0 ].length ) || soFar; - } - groups.push( ( tokens = [] ) ); - } - - matched = false; - - // Combinators - if ( ( match = rcombinators.exec( soFar ) ) ) { - matched = match.shift(); - tokens.push( { - value: matched, - - // Cast descendant combinators to space - type: match[ 0 ].replace( rtrim, " " ) - } ); - soFar = soFar.slice( matched.length ); - } - - // Filters - for ( type in Expr.filter ) { - if ( ( match = matchExpr[ type ].exec( soFar ) ) && ( !preFilters[ type ] || - ( match = preFilters[ type ]( match ) ) ) ) { - matched = match.shift(); - tokens.push( { - value: matched, - type: type, - matches: match - } ); - soFar = soFar.slice( matched.length ); - } - } - - if ( !matched ) { - break; - } - } - - // Return the length of the invalid excess - // if we're just parsing - // Otherwise, throw an error or return tokens - return parseOnly ? - soFar.length : - soFar ? - Sizzle.error( selector ) : - - // Cache the tokens - tokenCache( selector, groups ).slice( 0 ); -}; - -function toSelector( tokens ) { - var i = 0, - len = tokens.length, - selector = ""; - for ( ; i < len; i++ ) { - selector += tokens[ i ].value; - } - return selector; -} - -function addCombinator( matcher, combinator, base ) { - var dir = combinator.dir, - skip = combinator.next, - key = skip || dir, - checkNonElements = base && key === "parentNode", - doneName = done++; - - return combinator.first ? 
- - // Check against closest ancestor/preceding element - function( elem, context, xml ) { - while ( ( elem = elem[ dir ] ) ) { - if ( elem.nodeType === 1 || checkNonElements ) { - return matcher( elem, context, xml ); - } - } - return false; - } : - - // Check against all ancestor/preceding elements - function( elem, context, xml ) { - var oldCache, uniqueCache, outerCache, - newCache = [ dirruns, doneName ]; - - // We can't set arbitrary data on XML nodes, so they don't benefit from combinator caching - if ( xml ) { - while ( ( elem = elem[ dir ] ) ) { - if ( elem.nodeType === 1 || checkNonElements ) { - if ( matcher( elem, context, xml ) ) { - return true; - } - } - } - } else { - while ( ( elem = elem[ dir ] ) ) { - if ( elem.nodeType === 1 || checkNonElements ) { - outerCache = elem[ expando ] || ( elem[ expando ] = {} ); - - // Support: IE <9 only - // Defend against cloned attroperties (jQuery gh-1709) - uniqueCache = outerCache[ elem.uniqueID ] || - ( outerCache[ elem.uniqueID ] = {} ); - - if ( skip && skip === elem.nodeName.toLowerCase() ) { - elem = elem[ dir ] || elem; - } else if ( ( oldCache = uniqueCache[ key ] ) && - oldCache[ 0 ] === dirruns && oldCache[ 1 ] === doneName ) { - - // Assign to newCache so results back-propagate to previous elements - return ( newCache[ 2 ] = oldCache[ 2 ] ); - } else { - - // Reuse newcache so results back-propagate to previous elements - uniqueCache[ key ] = newCache; - - // A match means we're done; a fail means we have to keep checking - if ( ( newCache[ 2 ] = matcher( elem, context, xml ) ) ) { - return true; - } - } - } - } - } - return false; - }; -} - -function elementMatcher( matchers ) { - return matchers.length > 1 ? 
- function( elem, context, xml ) { - var i = matchers.length; - while ( i-- ) { - if ( !matchers[ i ]( elem, context, xml ) ) { - return false; - } - } - return true; - } : - matchers[ 0 ]; -} - -function multipleContexts( selector, contexts, results ) { - var i = 0, - len = contexts.length; - for ( ; i < len; i++ ) { - Sizzle( selector, contexts[ i ], results ); - } - return results; -} - -function condense( unmatched, map, filter, context, xml ) { - var elem, - newUnmatched = [], - i = 0, - len = unmatched.length, - mapped = map != null; - - for ( ; i < len; i++ ) { - if ( ( elem = unmatched[ i ] ) ) { - if ( !filter || filter( elem, context, xml ) ) { - newUnmatched.push( elem ); - if ( mapped ) { - map.push( i ); - } - } - } - } - - return newUnmatched; -} - -function setMatcher( preFilter, selector, matcher, postFilter, postFinder, postSelector ) { - if ( postFilter && !postFilter[ expando ] ) { - postFilter = setMatcher( postFilter ); - } - if ( postFinder && !postFinder[ expando ] ) { - postFinder = setMatcher( postFinder, postSelector ); - } - return markFunction( function( seed, results, context, xml ) { - var temp, i, elem, - preMap = [], - postMap = [], - preexisting = results.length, - - // Get initial elements from seed or context - elems = seed || multipleContexts( - selector || "*", - context.nodeType ? [ context ] : context, - [] - ), - - // Prefilter to get matcher input, preserving a map for seed-results synchronization - matcherIn = preFilter && ( seed || !selector ) ? - condense( elems, preMap, preFilter, context, xml ) : - elems, - - matcherOut = matcher ? - - // If we have a postFinder, or filtered seed, or non-seed postFilter or preexisting results, - postFinder || ( seed ? preFilter : preexisting || postFilter ) ? 
- - // ...intermediate processing is necessary - [] : - - // ...otherwise use results directly - results : - matcherIn; - - // Find primary matches - if ( matcher ) { - matcher( matcherIn, matcherOut, context, xml ); - } - - // Apply postFilter - if ( postFilter ) { - temp = condense( matcherOut, postMap ); - postFilter( temp, [], context, xml ); - - // Un-match failing elements by moving them back to matcherIn - i = temp.length; - while ( i-- ) { - if ( ( elem = temp[ i ] ) ) { - matcherOut[ postMap[ i ] ] = !( matcherIn[ postMap[ i ] ] = elem ); - } - } - } - - if ( seed ) { - if ( postFinder || preFilter ) { - if ( postFinder ) { - - // Get the final matcherOut by condensing this intermediate into postFinder contexts - temp = []; - i = matcherOut.length; - while ( i-- ) { - if ( ( elem = matcherOut[ i ] ) ) { - - // Restore matcherIn since elem is not yet a final match - temp.push( ( matcherIn[ i ] = elem ) ); - } - } - postFinder( null, ( matcherOut = [] ), temp, xml ); - } - - // Move matched elements from seed to results to keep them synchronized - i = matcherOut.length; - while ( i-- ) { - if ( ( elem = matcherOut[ i ] ) && - ( temp = postFinder ? indexOf( seed, elem ) : preMap[ i ] ) > -1 ) { - - seed[ temp ] = !( results[ temp ] = elem ); - } - } - } - - // Add elements to results, through postFinder if defined - } else { - matcherOut = condense( - matcherOut === results ? - matcherOut.splice( preexisting, matcherOut.length ) : - matcherOut - ); - if ( postFinder ) { - postFinder( null, results, matcherOut, xml ); - } else { - push.apply( results, matcherOut ); - } - } - } ); -} - -function matcherFromTokens( tokens ) { - var checkContext, matcher, j, - len = tokens.length, - leadingRelative = Expr.relative[ tokens[ 0 ].type ], - implicitRelative = leadingRelative || Expr.relative[ " " ], - i = leadingRelative ? 
1 : 0, - - // The foundational matcher ensures that elements are reachable from top-level context(s) - matchContext = addCombinator( function( elem ) { - return elem === checkContext; - }, implicitRelative, true ), - matchAnyContext = addCombinator( function( elem ) { - return indexOf( checkContext, elem ) > -1; - }, implicitRelative, true ), - matchers = [ function( elem, context, xml ) { - var ret = ( !leadingRelative && ( xml || context !== outermostContext ) ) || ( - ( checkContext = context ).nodeType ? - matchContext( elem, context, xml ) : - matchAnyContext( elem, context, xml ) ); - - // Avoid hanging onto element (issue #299) - checkContext = null; - return ret; - } ]; - - for ( ; i < len; i++ ) { - if ( ( matcher = Expr.relative[ tokens[ i ].type ] ) ) { - matchers = [ addCombinator( elementMatcher( matchers ), matcher ) ]; - } else { - matcher = Expr.filter[ tokens[ i ].type ].apply( null, tokens[ i ].matches ); - - // Return special upon seeing a positional matcher - if ( matcher[ expando ] ) { - - // Find the next relative operator (if any) for proper handling - j = ++i; - for ( ; j < len; j++ ) { - if ( Expr.relative[ tokens[ j ].type ] ) { - break; - } - } - return setMatcher( - i > 1 && elementMatcher( matchers ), - i > 1 && toSelector( - - // If the preceding token was a descendant combinator, insert an implicit any-element `*` - tokens - .slice( 0, i - 1 ) - .concat( { value: tokens[ i - 2 ].type === " " ? 
"*" : "" } ) - ).replace( rtrim, "$1" ), - matcher, - i < j && matcherFromTokens( tokens.slice( i, j ) ), - j < len && matcherFromTokens( ( tokens = tokens.slice( j ) ) ), - j < len && toSelector( tokens ) - ); - } - matchers.push( matcher ); - } - } - - return elementMatcher( matchers ); -} - -function matcherFromGroupMatchers( elementMatchers, setMatchers ) { - var bySet = setMatchers.length > 0, - byElement = elementMatchers.length > 0, - superMatcher = function( seed, context, xml, results, outermost ) { - var elem, j, matcher, - matchedCount = 0, - i = "0", - unmatched = seed && [], - setMatched = [], - contextBackup = outermostContext, - - // We must always have either seed elements or outermost context - elems = seed || byElement && Expr.find[ "TAG" ]( "*", outermost ), - - // Use integer dirruns iff this is the outermost matcher - dirrunsUnique = ( dirruns += contextBackup == null ? 1 : Math.random() || 0.1 ), - len = elems.length; - - if ( outermost ) { - - // Support: IE 11+, Edge 17 - 18+ - // IE/Edge sometimes throw a "Permission denied" error when strict-comparing - // two documents; shallow comparisons work. - // eslint-disable-next-line eqeqeq - outermostContext = context == document || context || outermost; - } - - // Add elements passing elementMatchers directly to results - // Support: IE<9, Safari - // Tolerate NodeList properties (IE: "length"; Safari: ) matching elements by id - for ( ; i !== len && ( elem = elems[ i ] ) != null; i++ ) { - if ( byElement && elem ) { - j = 0; - - // Support: IE 11+, Edge 17 - 18+ - // IE/Edge sometimes throw a "Permission denied" error when strict-comparing - // two documents; shallow comparisons work. 
- // eslint-disable-next-line eqeqeq - if ( !context && elem.ownerDocument != document ) { - setDocument( elem ); - xml = !documentIsHTML; - } - while ( ( matcher = elementMatchers[ j++ ] ) ) { - if ( matcher( elem, context || document, xml ) ) { - results.push( elem ); - break; - } - } - if ( outermost ) { - dirruns = dirrunsUnique; - } - } - - // Track unmatched elements for set filters - if ( bySet ) { - - // They will have gone through all possible matchers - if ( ( elem = !matcher && elem ) ) { - matchedCount--; - } - - // Lengthen the array for every element, matched or not - if ( seed ) { - unmatched.push( elem ); - } - } - } - - // `i` is now the count of elements visited above, and adding it to `matchedCount` - // makes the latter nonnegative. - matchedCount += i; - - // Apply set filters to unmatched elements - // NOTE: This can be skipped if there are no unmatched elements (i.e., `matchedCount` - // equals `i`), unless we didn't visit _any_ elements in the above loop because we have - // no element matchers and no seed. - // Incrementing an initially-string "0" `i` allows `i` to remain a string only in that - // case, which will result in a "00" `matchedCount` that differs from `i` but is also - // numerically zero. 
- if ( bySet && i !== matchedCount ) { - j = 0; - while ( ( matcher = setMatchers[ j++ ] ) ) { - matcher( unmatched, setMatched, context, xml ); - } - - if ( seed ) { - - // Reintegrate element matches to eliminate the need for sorting - if ( matchedCount > 0 ) { - while ( i-- ) { - if ( !( unmatched[ i ] || setMatched[ i ] ) ) { - setMatched[ i ] = pop.call( results ); - } - } - } - - // Discard index placeholder values to get only actual matches - setMatched = condense( setMatched ); - } - - // Add matches to results - push.apply( results, setMatched ); - - // Seedless set matches succeeding multiple successful matchers stipulate sorting - if ( outermost && !seed && setMatched.length > 0 && - ( matchedCount + setMatchers.length ) > 1 ) { - - Sizzle.uniqueSort( results ); - } - } - - // Override manipulation of globals by nested matchers - if ( outermost ) { - dirruns = dirrunsUnique; - outermostContext = contextBackup; - } - - return unmatched; - }; - - return bySet ? - markFunction( superMatcher ) : - superMatcher; -} - -compile = Sizzle.compile = function( selector, match /* Internal Use Only */ ) { - var i, - setMatchers = [], - elementMatchers = [], - cached = compilerCache[ selector + " " ]; - - if ( !cached ) { - - // Generate a function of recursive functions that can be used to check each element - if ( !match ) { - match = tokenize( selector ); - } - i = match.length; - while ( i-- ) { - cached = matcherFromTokens( match[ i ] ); - if ( cached[ expando ] ) { - setMatchers.push( cached ); - } else { - elementMatchers.push( cached ); - } - } - - // Cache the compiled function - cached = compilerCache( - selector, - matcherFromGroupMatchers( elementMatchers, setMatchers ) - ); - - // Save selector and tokenization - cached.selector = selector; - } - return cached; -}; - -/** - * A low-level selection function that works with Sizzle's compiled - * selector functions - * @param {String|Function} selector A selector or a pre-compiled - * selector function built 
with Sizzle.compile - * @param {Element} context - * @param {Array} [results] - * @param {Array} [seed] A set of elements to match against - */ -select = Sizzle.select = function( selector, context, results, seed ) { - var i, tokens, token, type, find, - compiled = typeof selector === "function" && selector, - match = !seed && tokenize( ( selector = compiled.selector || selector ) ); - - results = results || []; - - // Try to minimize operations if there is only one selector in the list and no seed - // (the latter of which guarantees us context) - if ( match.length === 1 ) { - - // Reduce context if the leading compound selector is an ID - tokens = match[ 0 ] = match[ 0 ].slice( 0 ); - if ( tokens.length > 2 && ( token = tokens[ 0 ] ).type === "ID" && - context.nodeType === 9 && documentIsHTML && Expr.relative[ tokens[ 1 ].type ] ) { - - context = ( Expr.find[ "ID" ]( token.matches[ 0 ] - .replace( runescape, funescape ), context ) || [] )[ 0 ]; - if ( !context ) { - return results; - - // Precompiled matchers will still verify ancestry, so step up a level - } else if ( compiled ) { - context = context.parentNode; - } - - selector = selector.slice( tokens.shift().value.length ); - } - - // Fetch a seed set for right-to-left matching - i = matchExpr[ "needsContext" ].test( selector ) ? 
0 : tokens.length; - while ( i-- ) { - token = tokens[ i ]; - - // Abort if we hit a combinator - if ( Expr.relative[ ( type = token.type ) ] ) { - break; - } - if ( ( find = Expr.find[ type ] ) ) { - - // Search, expanding context for leading sibling combinators - if ( ( seed = find( - token.matches[ 0 ].replace( runescape, funescape ), - rsibling.test( tokens[ 0 ].type ) && testContext( context.parentNode ) || - context - ) ) ) { - - // If seed is empty or no tokens remain, we can return early - tokens.splice( i, 1 ); - selector = seed.length && toSelector( tokens ); - if ( !selector ) { - push.apply( results, seed ); - return results; - } - - break; - } - } - } - } - - // Compile and execute a filtering function if one is not provided - // Provide `match` to avoid retokenization if we modified the selector above - ( compiled || compile( selector, match ) )( - seed, - context, - !documentIsHTML, - results, - !context || rsibling.test( selector ) && testContext( context.parentNode ) || context - ); - return results; -}; - -// One-time assignments - -// Sort stability -support.sortStable = expando.split( "" ).sort( sortOrder ).join( "" ) === expando; - -// Support: Chrome 14-35+ -// Always assume duplicates if they aren't passed to the comparison function -support.detectDuplicates = !!hasDuplicate; - -// Initialize against the default document -setDocument(); - -// Support: Webkit<537.32 - Safari 6.0.3/Chrome 25 (fixed in Chrome 27) -// Detached nodes confoundingly follow *each other* -support.sortDetached = assert( function( el ) { - - // Should return 1, but returns 4 (following) - return el.compareDocumentPosition( document.createElement( "fieldset" ) ) & 1; -} ); - -// Support: IE<8 -// Prevent attribute/property "interpolation" -// https://msdn.microsoft.com/en-us/library/ms536429%28VS.85%29.aspx -if ( !assert( function( el ) { - el.innerHTML = ""; - return el.firstChild.getAttribute( "href" ) === "#"; -} ) ) { - addHandle( "type|href|height|width", function( 
elem, name, isXML ) { - if ( !isXML ) { - return elem.getAttribute( name, name.toLowerCase() === "type" ? 1 : 2 ); - } - } ); -} - -// Support: IE<9 -// Use defaultValue in place of getAttribute("value") -if ( !support.attributes || !assert( function( el ) { - el.innerHTML = ""; - el.firstChild.setAttribute( "value", "" ); - return el.firstChild.getAttribute( "value" ) === ""; -} ) ) { - addHandle( "value", function( elem, _name, isXML ) { - if ( !isXML && elem.nodeName.toLowerCase() === "input" ) { - return elem.defaultValue; - } - } ); -} - -// Support: IE<9 -// Use getAttributeNode to fetch booleans when getAttribute lies -if ( !assert( function( el ) { - return el.getAttribute( "disabled" ) == null; -} ) ) { - addHandle( booleans, function( elem, name, isXML ) { - var val; - if ( !isXML ) { - return elem[ name ] === true ? name.toLowerCase() : - ( val = elem.getAttributeNode( name ) ) && val.specified ? - val.value : - null; - } - } ); -} - -return Sizzle; - -} )( window ); - - - -jQuery.find = Sizzle; -jQuery.expr = Sizzle.selectors; - -// Deprecated -jQuery.expr[ ":" ] = jQuery.expr.pseudos; -jQuery.uniqueSort = jQuery.unique = Sizzle.uniqueSort; -jQuery.text = Sizzle.getText; -jQuery.isXMLDoc = Sizzle.isXML; -jQuery.contains = Sizzle.contains; -jQuery.escapeSelector = Sizzle.escape; - - - - -var dir = function( elem, dir, until ) { - var matched = [], - truncate = until !== undefined; - - while ( ( elem = elem[ dir ] ) && elem.nodeType !== 9 ) { - if ( elem.nodeType === 1 ) { - if ( truncate && jQuery( elem ).is( until ) ) { - break; - } - matched.push( elem ); - } - } - return matched; -}; - - -var siblings = function( n, elem ) { - var matched = []; - - for ( ; n; n = n.nextSibling ) { - if ( n.nodeType === 1 && n !== elem ) { - matched.push( n ); - } - } - - return matched; -}; - - -var rneedsContext = jQuery.expr.match.needsContext; - - - -function nodeName( elem, name ) { - - return elem.nodeName && elem.nodeName.toLowerCase() === name.toLowerCase(); - 
-}; -var rsingleTag = ( /^<([a-z][^\/\0>:\x20\t\r\n\f]*)[\x20\t\r\n\f]*\/?>(?:<\/\1>|)$/i ); - - - -// Implement the identical functionality for filter and not -function winnow( elements, qualifier, not ) { - if ( isFunction( qualifier ) ) { - return jQuery.grep( elements, function( elem, i ) { - return !!qualifier.call( elem, i, elem ) !== not; - } ); - } - - // Single element - if ( qualifier.nodeType ) { - return jQuery.grep( elements, function( elem ) { - return ( elem === qualifier ) !== not; - } ); - } - - // Arraylike of elements (jQuery, arguments, Array) - if ( typeof qualifier !== "string" ) { - return jQuery.grep( elements, function( elem ) { - return ( indexOf.call( qualifier, elem ) > -1 ) !== not; - } ); - } - - // Filtered directly for both simple and complex selectors - return jQuery.filter( qualifier, elements, not ); -} - -jQuery.filter = function( expr, elems, not ) { - var elem = elems[ 0 ]; - - if ( not ) { - expr = ":not(" + expr + ")"; - } - - if ( elems.length === 1 && elem.nodeType === 1 ) { - return jQuery.find.matchesSelector( elem, expr ) ? [ elem ] : []; - } - - return jQuery.find.matches( expr, jQuery.grep( elems, function( elem ) { - return elem.nodeType === 1; - } ) ); -}; - -jQuery.fn.extend( { - find: function( selector ) { - var i, ret, - len = this.length, - self = this; - - if ( typeof selector !== "string" ) { - return this.pushStack( jQuery( selector ).filter( function() { - for ( i = 0; i < len; i++ ) { - if ( jQuery.contains( self[ i ], this ) ) { - return true; - } - } - } ) ); - } - - ret = this.pushStack( [] ); - - for ( i = 0; i < len; i++ ) { - jQuery.find( selector, self[ i ], ret ); - } - - return len > 1 ? 
jQuery.uniqueSort( ret ) : ret; - }, - filter: function( selector ) { - return this.pushStack( winnow( this, selector || [], false ) ); - }, - not: function( selector ) { - return this.pushStack( winnow( this, selector || [], true ) ); - }, - is: function( selector ) { - return !!winnow( - this, - - // If this is a positional/relative selector, check membership in the returned set - // so $("p:first").is("p:last") won't return true for a doc with two "p". - typeof selector === "string" && rneedsContext.test( selector ) ? - jQuery( selector ) : - selector || [], - false - ).length; - } -} ); - - -// Initialize a jQuery object - - -// A central reference to the root jQuery(document) -var rootjQuery, - - // A simple way to check for HTML strings - // Prioritize #id over to avoid XSS via location.hash (#9521) - // Strict HTML recognition (#11290: must start with <) - // Shortcut simple #id case for speed - rquickExpr = /^(?:\s*(<[\w\W]+>)[^>]*|#([\w-]+))$/, - - init = jQuery.fn.init = function( selector, context, root ) { - var match, elem; - - // HANDLE: $(""), $(null), $(undefined), $(false) - if ( !selector ) { - return this; - } - - // Method init() accepts an alternate rootjQuery - // so migrate can support jQuery.sub (gh-2101) - root = root || rootjQuery; - - // Handle HTML strings - if ( typeof selector === "string" ) { - if ( selector[ 0 ] === "<" && - selector[ selector.length - 1 ] === ">" && - selector.length >= 3 ) { - - // Assume that strings that start and end with <> are HTML and skip the regex check - match = [ null, selector, null ]; - - } else { - match = rquickExpr.exec( selector ); - } - - // Match html or make sure no context is specified for #id - if ( match && ( match[ 1 ] || !context ) ) { - - // HANDLE: $(html) -> $(array) - if ( match[ 1 ] ) { - context = context instanceof jQuery ? 
context[ 0 ] : context; - - // Option to run scripts is true for back-compat - // Intentionally let the error be thrown if parseHTML is not present - jQuery.merge( this, jQuery.parseHTML( - match[ 1 ], - context && context.nodeType ? context.ownerDocument || context : document, - true - ) ); - - // HANDLE: $(html, props) - if ( rsingleTag.test( match[ 1 ] ) && jQuery.isPlainObject( context ) ) { - for ( match in context ) { - - // Properties of context are called as methods if possible - if ( isFunction( this[ match ] ) ) { - this[ match ]( context[ match ] ); - - // ...and otherwise set as attributes - } else { - this.attr( match, context[ match ] ); - } - } - } - - return this; - - // HANDLE: $(#id) - } else { - elem = document.getElementById( match[ 2 ] ); - - if ( elem ) { - - // Inject the element directly into the jQuery object - this[ 0 ] = elem; - this.length = 1; - } - return this; - } - - // HANDLE: $(expr, $(...)) - } else if ( !context || context.jquery ) { - return ( context || root ).find( selector ); - - // HANDLE: $(expr, context) - // (which is just equivalent to: $(context).find(expr) - } else { - return this.constructor( context ).find( selector ); - } - - // HANDLE: $(DOMElement) - } else if ( selector.nodeType ) { - this[ 0 ] = selector; - this.length = 1; - return this; - - // HANDLE: $(function) - // Shortcut for document ready - } else if ( isFunction( selector ) ) { - return root.ready !== undefined ? 
- root.ready( selector ) : - - // Execute immediately if ready is not present - selector( jQuery ); - } - - return jQuery.makeArray( selector, this ); - }; - -// Give the init function the jQuery prototype for later instantiation -init.prototype = jQuery.fn; - -// Initialize central reference -rootjQuery = jQuery( document ); - - -var rparentsprev = /^(?:parents|prev(?:Until|All))/, - - // Methods guaranteed to produce a unique set when starting from a unique set - guaranteedUnique = { - children: true, - contents: true, - next: true, - prev: true - }; - -jQuery.fn.extend( { - has: function( target ) { - var targets = jQuery( target, this ), - l = targets.length; - - return this.filter( function() { - var i = 0; - for ( ; i < l; i++ ) { - if ( jQuery.contains( this, targets[ i ] ) ) { - return true; - } - } - } ); - }, - - closest: function( selectors, context ) { - var cur, - i = 0, - l = this.length, - matched = [], - targets = typeof selectors !== "string" && jQuery( selectors ); - - // Positional selectors never match, since there's no _selection_ context - if ( !rneedsContext.test( selectors ) ) { - for ( ; i < l; i++ ) { - for ( cur = this[ i ]; cur && cur !== context; cur = cur.parentNode ) { - - // Always skip document fragments - if ( cur.nodeType < 11 && ( targets ? - targets.index( cur ) > -1 : - - // Don't pass non-elements to Sizzle - cur.nodeType === 1 && - jQuery.find.matchesSelector( cur, selectors ) ) ) { - - matched.push( cur ); - break; - } - } - } - } - - return this.pushStack( matched.length > 1 ? jQuery.uniqueSort( matched ) : matched ); - }, - - // Determine the position of an element within the set - index: function( elem ) { - - // No argument, return index in parent - if ( !elem ) { - return ( this[ 0 ] && this[ 0 ].parentNode ) ? 
this.first().prevAll().length : -1; - } - - // Index in selector - if ( typeof elem === "string" ) { - return indexOf.call( jQuery( elem ), this[ 0 ] ); - } - - // Locate the position of the desired element - return indexOf.call( this, - - // If it receives a jQuery object, the first element is used - elem.jquery ? elem[ 0 ] : elem - ); - }, - - add: function( selector, context ) { - return this.pushStack( - jQuery.uniqueSort( - jQuery.merge( this.get(), jQuery( selector, context ) ) - ) - ); - }, - - addBack: function( selector ) { - return this.add( selector == null ? - this.prevObject : this.prevObject.filter( selector ) - ); - } -} ); - -function sibling( cur, dir ) { - while ( ( cur = cur[ dir ] ) && cur.nodeType !== 1 ) {} - return cur; -} - -jQuery.each( { - parent: function( elem ) { - var parent = elem.parentNode; - return parent && parent.nodeType !== 11 ? parent : null; - }, - parents: function( elem ) { - return dir( elem, "parentNode" ); - }, - parentsUntil: function( elem, _i, until ) { - return dir( elem, "parentNode", until ); - }, - next: function( elem ) { - return sibling( elem, "nextSibling" ); - }, - prev: function( elem ) { - return sibling( elem, "previousSibling" ); - }, - nextAll: function( elem ) { - return dir( elem, "nextSibling" ); - }, - prevAll: function( elem ) { - return dir( elem, "previousSibling" ); - }, - nextUntil: function( elem, _i, until ) { - return dir( elem, "nextSibling", until ); - }, - prevUntil: function( elem, _i, until ) { - return dir( elem, "previousSibling", until ); - }, - siblings: function( elem ) { - return siblings( ( elem.parentNode || {} ).firstChild, elem ); - }, - children: function( elem ) { - return siblings( elem.firstChild ); - }, - contents: function( elem ) { - if ( elem.contentDocument != null && - - // Support: IE 11+ - // elements with no `data` attribute has an object - // `contentDocument` with a `null` prototype. 
- getProto( elem.contentDocument ) ) { - - return elem.contentDocument; - } - - // Support: IE 9 - 11 only, iOS 7 only, Android Browser <=4.3 only - // Treat the template element as a regular one in browsers that - // don't support it. - if ( nodeName( elem, "template" ) ) { - elem = elem.content || elem; - } - - return jQuery.merge( [], elem.childNodes ); - } -}, function( name, fn ) { - jQuery.fn[ name ] = function( until, selector ) { - var matched = jQuery.map( this, fn, until ); - - if ( name.slice( -5 ) !== "Until" ) { - selector = until; - } - - if ( selector && typeof selector === "string" ) { - matched = jQuery.filter( selector, matched ); - } - - if ( this.length > 1 ) { - - // Remove duplicates - if ( !guaranteedUnique[ name ] ) { - jQuery.uniqueSort( matched ); - } - - // Reverse order for parents* and prev-derivatives - if ( rparentsprev.test( name ) ) { - matched.reverse(); - } - } - - return this.pushStack( matched ); - }; -} ); -var rnothtmlwhite = ( /[^\x20\t\r\n\f]+/g ); - - - -// Convert String-formatted options into Object-formatted ones -function createOptions( options ) { - var object = {}; - jQuery.each( options.match( rnothtmlwhite ) || [], function( _, flag ) { - object[ flag ] = true; - } ); - return object; -} - -/* - * Create a callback list using the following parameters: - * - * options: an optional list of space-separated options that will change how - * the callback list behaves or a more traditional option object - * - * By default a callback list will act like an event callback list and can be - * "fired" multiple times. 
- * - * Possible options: - * - * once: will ensure the callback list can only be fired once (like a Deferred) - * - * memory: will keep track of previous values and will call any callback added - * after the list has been fired right away with the latest "memorized" - * values (like a Deferred) - * - * unique: will ensure a callback can only be added once (no duplicate in the list) - * - * stopOnFalse: interrupt callings when a callback returns false - * - */ -jQuery.Callbacks = function( options ) { - - // Convert options from String-formatted to Object-formatted if needed - // (we check in cache first) - options = typeof options === "string" ? - createOptions( options ) : - jQuery.extend( {}, options ); - - var // Flag to know if list is currently firing - firing, - - // Last fire value for non-forgettable lists - memory, - - // Flag to know if list was already fired - fired, - - // Flag to prevent firing - locked, - - // Actual callback list - list = [], - - // Queue of execution data for repeatable lists - queue = [], - - // Index of currently firing callback (modified by add/remove as needed) - firingIndex = -1, - - // Fire callbacks - fire = function() { - - // Enforce single-firing - locked = locked || options.once; - - // Execute callbacks for all pending executions, - // respecting firingIndex overrides and runtime changes - fired = firing = true; - for ( ; queue.length; firingIndex = -1 ) { - memory = queue.shift(); - while ( ++firingIndex < list.length ) { - - // Run callback and check for early termination - if ( list[ firingIndex ].apply( memory[ 0 ], memory[ 1 ] ) === false && - options.stopOnFalse ) { - - // Jump to end and forget the data so .add doesn't re-fire - firingIndex = list.length; - memory = false; - } - } - } - - // Forget the data if we're done with it - if ( !options.memory ) { - memory = false; - } - - firing = false; - - // Clean up if we're done firing for good - if ( locked ) { - - // Keep an empty list if we have data for future 
add calls - if ( memory ) { - list = []; - - // Otherwise, this object is spent - } else { - list = ""; - } - } - }, - - // Actual Callbacks object - self = { - - // Add a callback or a collection of callbacks to the list - add: function() { - if ( list ) { - - // If we have memory from a past run, we should fire after adding - if ( memory && !firing ) { - firingIndex = list.length - 1; - queue.push( memory ); - } - - ( function add( args ) { - jQuery.each( args, function( _, arg ) { - if ( isFunction( arg ) ) { - if ( !options.unique || !self.has( arg ) ) { - list.push( arg ); - } - } else if ( arg && arg.length && toType( arg ) !== "string" ) { - - // Inspect recursively - add( arg ); - } - } ); - } )( arguments ); - - if ( memory && !firing ) { - fire(); - } - } - return this; - }, - - // Remove a callback from the list - remove: function() { - jQuery.each( arguments, function( _, arg ) { - var index; - while ( ( index = jQuery.inArray( arg, list, index ) ) > -1 ) { - list.splice( index, 1 ); - - // Handle firing indexes - if ( index <= firingIndex ) { - firingIndex--; - } - } - } ); - return this; - }, - - // Check if a given callback is in the list. - // If no argument is given, return whether or not list has callbacks attached. - has: function( fn ) { - return fn ? 
- jQuery.inArray( fn, list ) > -1 : - list.length > 0; - }, - - // Remove all callbacks from the list - empty: function() { - if ( list ) { - list = []; - } - return this; - }, - - // Disable .fire and .add - // Abort any current/pending executions - // Clear all callbacks and values - disable: function() { - locked = queue = []; - list = memory = ""; - return this; - }, - disabled: function() { - return !list; - }, - - // Disable .fire - // Also disable .add unless we have memory (since it would have no effect) - // Abort any pending executions - lock: function() { - locked = queue = []; - if ( !memory && !firing ) { - list = memory = ""; - } - return this; - }, - locked: function() { - return !!locked; - }, - - // Call all callbacks with the given context and arguments - fireWith: function( context, args ) { - if ( !locked ) { - args = args || []; - args = [ context, args.slice ? args.slice() : args ]; - queue.push( args ); - if ( !firing ) { - fire(); - } - } - return this; - }, - - // Call all the callbacks with the given arguments - fire: function() { - self.fireWith( this, arguments ); - return this; - }, - - // To know if the callbacks have already been called at least once - fired: function() { - return !!fired; - } - }; - - return self; -}; - - -function Identity( v ) { - return v; -} -function Thrower( ex ) { - throw ex; -} - -function adoptValue( value, resolve, reject, noValue ) { - var method; - - try { - - // Check for promise aspect first to privilege synchronous behavior - if ( value && isFunction( ( method = value.promise ) ) ) { - method.call( value ).done( resolve ).fail( reject ); - - // Other thenables - } else if ( value && isFunction( ( method = value.then ) ) ) { - method.call( value, resolve, reject ); - - // Other non-thenables - } else { - - // Control `resolve` arguments by letting Array#slice cast boolean `noValue` to integer: - // * false: [ value ].slice( 0 ) => resolve( value ) - // * true: [ value ].slice( 1 ) => resolve() - 
resolve.apply( undefined, [ value ].slice( noValue ) ); - } - - // For Promises/A+, convert exceptions into rejections - // Since jQuery.when doesn't unwrap thenables, we can skip the extra checks appearing in - // Deferred#then to conditionally suppress rejection. - } catch ( value ) { - - // Support: Android 4.0 only - // Strict mode functions invoked without .call/.apply get global-object context - reject.apply( undefined, [ value ] ); - } -} - -jQuery.extend( { - - Deferred: function( func ) { - var tuples = [ - - // action, add listener, callbacks, - // ... .then handlers, argument index, [final state] - [ "notify", "progress", jQuery.Callbacks( "memory" ), - jQuery.Callbacks( "memory" ), 2 ], - [ "resolve", "done", jQuery.Callbacks( "once memory" ), - jQuery.Callbacks( "once memory" ), 0, "resolved" ], - [ "reject", "fail", jQuery.Callbacks( "once memory" ), - jQuery.Callbacks( "once memory" ), 1, "rejected" ] - ], - state = "pending", - promise = { - state: function() { - return state; - }, - always: function() { - deferred.done( arguments ).fail( arguments ); - return this; - }, - "catch": function( fn ) { - return promise.then( null, fn ); - }, - - // Keep pipe for back-compat - pipe: function( /* fnDone, fnFail, fnProgress */ ) { - var fns = arguments; - - return jQuery.Deferred( function( newDefer ) { - jQuery.each( tuples, function( _i, tuple ) { - - // Map tuples (progress, done, fail) to arguments (done, fail, progress) - var fn = isFunction( fns[ tuple[ 4 ] ] ) && fns[ tuple[ 4 ] ]; - - // deferred.progress(function() { bind to newDefer or newDefer.notify }) - // deferred.done(function() { bind to newDefer or newDefer.resolve }) - // deferred.fail(function() { bind to newDefer or newDefer.reject }) - deferred[ tuple[ 1 ] ]( function() { - var returned = fn && fn.apply( this, arguments ); - if ( returned && isFunction( returned.promise ) ) { - returned.promise() - .progress( newDefer.notify ) - .done( newDefer.resolve ) - .fail( newDefer.reject ); - } 
else { - newDefer[ tuple[ 0 ] + "With" ]( - this, - fn ? [ returned ] : arguments - ); - } - } ); - } ); - fns = null; - } ).promise(); - }, - then: function( onFulfilled, onRejected, onProgress ) { - var maxDepth = 0; - function resolve( depth, deferred, handler, special ) { - return function() { - var that = this, - args = arguments, - mightThrow = function() { - var returned, then; - - // Support: Promises/A+ section 2.3.3.3.3 - // https://promisesaplus.com/#point-59 - // Ignore double-resolution attempts - if ( depth < maxDepth ) { - return; - } - - returned = handler.apply( that, args ); - - // Support: Promises/A+ section 2.3.1 - // https://promisesaplus.com/#point-48 - if ( returned === deferred.promise() ) { - throw new TypeError( "Thenable self-resolution" ); - } - - // Support: Promises/A+ sections 2.3.3.1, 3.5 - // https://promisesaplus.com/#point-54 - // https://promisesaplus.com/#point-75 - // Retrieve `then` only once - then = returned && - - // Support: Promises/A+ section 2.3.4 - // https://promisesaplus.com/#point-64 - // Only check objects and functions for thenability - ( typeof returned === "object" || - typeof returned === "function" ) && - returned.then; - - // Handle a returned thenable - if ( isFunction( then ) ) { - - // Special processors (notify) just wait for resolution - if ( special ) { - then.call( - returned, - resolve( maxDepth, deferred, Identity, special ), - resolve( maxDepth, deferred, Thrower, special ) - ); - - // Normal processors (resolve) also hook into progress - } else { - - // ...and disregard older resolution values - maxDepth++; - - then.call( - returned, - resolve( maxDepth, deferred, Identity, special ), - resolve( maxDepth, deferred, Thrower, special ), - resolve( maxDepth, deferred, Identity, - deferred.notifyWith ) - ); - } - - // Handle all other returned values - } else { - - // Only substitute handlers pass on context - // and multiple values (non-spec behavior) - if ( handler !== Identity ) { - that = 
undefined; - args = [ returned ]; - } - - // Process the value(s) - // Default process is resolve - ( special || deferred.resolveWith )( that, args ); - } - }, - - // Only normal processors (resolve) catch and reject exceptions - process = special ? - mightThrow : - function() { - try { - mightThrow(); - } catch ( e ) { - - if ( jQuery.Deferred.exceptionHook ) { - jQuery.Deferred.exceptionHook( e, - process.stackTrace ); - } - - // Support: Promises/A+ section 2.3.3.3.4.1 - // https://promisesaplus.com/#point-61 - // Ignore post-resolution exceptions - if ( depth + 1 >= maxDepth ) { - - // Only substitute handlers pass on context - // and multiple values (non-spec behavior) - if ( handler !== Thrower ) { - that = undefined; - args = [ e ]; - } - - deferred.rejectWith( that, args ); - } - } - }; - - // Support: Promises/A+ section 2.3.3.3.1 - // https://promisesaplus.com/#point-57 - // Re-resolve promises immediately to dodge false rejection from - // subsequent errors - if ( depth ) { - process(); - } else { - - // Call an optional hook to record the stack, in case of exception - // since it's otherwise lost when execution goes async - if ( jQuery.Deferred.getStackHook ) { - process.stackTrace = jQuery.Deferred.getStackHook(); - } - window.setTimeout( process ); - } - }; - } - - return jQuery.Deferred( function( newDefer ) { - - // progress_handlers.add( ... ) - tuples[ 0 ][ 3 ].add( - resolve( - 0, - newDefer, - isFunction( onProgress ) ? - onProgress : - Identity, - newDefer.notifyWith - ) - ); - - // fulfilled_handlers.add( ... ) - tuples[ 1 ][ 3 ].add( - resolve( - 0, - newDefer, - isFunction( onFulfilled ) ? - onFulfilled : - Identity - ) - ); - - // rejected_handlers.add( ... ) - tuples[ 2 ][ 3 ].add( - resolve( - 0, - newDefer, - isFunction( onRejected ) ? 
- onRejected : - Thrower - ) - ); - } ).promise(); - }, - - // Get a promise for this deferred - // If obj is provided, the promise aspect is added to the object - promise: function( obj ) { - return obj != null ? jQuery.extend( obj, promise ) : promise; - } - }, - deferred = {}; - - // Add list-specific methods - jQuery.each( tuples, function( i, tuple ) { - var list = tuple[ 2 ], - stateString = tuple[ 5 ]; - - // promise.progress = list.add - // promise.done = list.add - // promise.fail = list.add - promise[ tuple[ 1 ] ] = list.add; - - // Handle state - if ( stateString ) { - list.add( - function() { - - // state = "resolved" (i.e., fulfilled) - // state = "rejected" - state = stateString; - }, - - // rejected_callbacks.disable - // fulfilled_callbacks.disable - tuples[ 3 - i ][ 2 ].disable, - - // rejected_handlers.disable - // fulfilled_handlers.disable - tuples[ 3 - i ][ 3 ].disable, - - // progress_callbacks.lock - tuples[ 0 ][ 2 ].lock, - - // progress_handlers.lock - tuples[ 0 ][ 3 ].lock - ); - } - - // progress_handlers.fire - // fulfilled_handlers.fire - // rejected_handlers.fire - list.add( tuple[ 3 ].fire ); - - // deferred.notify = function() { deferred.notifyWith(...) } - // deferred.resolve = function() { deferred.resolveWith(...) } - // deferred.reject = function() { deferred.rejectWith(...) } - deferred[ tuple[ 0 ] ] = function() { - deferred[ tuple[ 0 ] + "With" ]( this === deferred ? undefined : this, arguments ); - return this; - }; - - // deferred.notifyWith = list.fireWith - // deferred.resolveWith = list.fireWith - // deferred.rejectWith = list.fireWith - deferred[ tuple[ 0 ] + "With" ] = list.fireWith; - } ); - - // Make the deferred a promise - promise.promise( deferred ); - - // Call given func if any - if ( func ) { - func.call( deferred, deferred ); - } - - // All done! 
- return deferred; - }, - - // Deferred helper - when: function( singleValue ) { - var - - // count of uncompleted subordinates - remaining = arguments.length, - - // count of unprocessed arguments - i = remaining, - - // subordinate fulfillment data - resolveContexts = Array( i ), - resolveValues = slice.call( arguments ), - - // the master Deferred - master = jQuery.Deferred(), - - // subordinate callback factory - updateFunc = function( i ) { - return function( value ) { - resolveContexts[ i ] = this; - resolveValues[ i ] = arguments.length > 1 ? slice.call( arguments ) : value; - if ( !( --remaining ) ) { - master.resolveWith( resolveContexts, resolveValues ); - } - }; - }; - - // Single- and empty arguments are adopted like Promise.resolve - if ( remaining <= 1 ) { - adoptValue( singleValue, master.done( updateFunc( i ) ).resolve, master.reject, - !remaining ); - - // Use .then() to unwrap secondary thenables (cf. gh-3000) - if ( master.state() === "pending" || - isFunction( resolveValues[ i ] && resolveValues[ i ].then ) ) { - - return master.then(); - } - } - - // Multiple arguments are aggregated like Promise.all array elements - while ( i-- ) { - adoptValue( resolveValues[ i ], updateFunc( i ), master.reject ); - } - - return master.promise(); - } -} ); - - -// These usually indicate a programmer mistake during development, -// warn about them ASAP rather than swallowing them by default. 
-var rerrorNames = /^(Eval|Internal|Range|Reference|Syntax|Type|URI)Error$/; - -jQuery.Deferred.exceptionHook = function( error, stack ) { - - // Support: IE 8 - 9 only - // Console exists when dev tools are open, which can happen at any time - if ( window.console && window.console.warn && error && rerrorNames.test( error.name ) ) { - window.console.warn( "jQuery.Deferred exception: " + error.message, error.stack, stack ); - } -}; - - - - -jQuery.readyException = function( error ) { - window.setTimeout( function() { - throw error; - } ); -}; - - - - -// The deferred used on DOM ready -var readyList = jQuery.Deferred(); - -jQuery.fn.ready = function( fn ) { - - readyList - .then( fn ) - - // Wrap jQuery.readyException in a function so that the lookup - // happens at the time of error handling instead of callback - // registration. - .catch( function( error ) { - jQuery.readyException( error ); - } ); - - return this; -}; - -jQuery.extend( { - - // Is the DOM ready to be used? Set to true once it occurs. - isReady: false, - - // A counter to track how many items to wait for before - // the ready event fires. See #6781 - readyWait: 1, - - // Handle when the DOM is ready - ready: function( wait ) { - - // Abort if there are pending holds or we're already ready - if ( wait === true ? 
--jQuery.readyWait : jQuery.isReady ) { - return; - } - - // Remember that the DOM is ready - jQuery.isReady = true; - - // If a normal DOM Ready event fired, decrement, and wait if need be - if ( wait !== true && --jQuery.readyWait > 0 ) { - return; - } - - // If there are functions bound, to execute - readyList.resolveWith( document, [ jQuery ] ); - } -} ); - -jQuery.ready.then = readyList.then; - -// The ready event handler and self cleanup method -function completed() { - document.removeEventListener( "DOMContentLoaded", completed ); - window.removeEventListener( "load", completed ); - jQuery.ready(); -} - -// Catch cases where $(document).ready() is called -// after the browser event has already occurred. -// Support: IE <=9 - 10 only -// Older IE sometimes signals "interactive" too soon -if ( document.readyState === "complete" || - ( document.readyState !== "loading" && !document.documentElement.doScroll ) ) { - - // Handle it asynchronously to allow scripts the opportunity to delay ready - window.setTimeout( jQuery.ready ); - -} else { - - // Use the handy event callback - document.addEventListener( "DOMContentLoaded", completed ); - - // A fallback to window.onload, that will always work - window.addEventListener( "load", completed ); -} - - - - -// Multifunctional method to get and set values of a collection -// The value/s can optionally be executed if it's a function -var access = function( elems, fn, key, value, chainable, emptyGet, raw ) { - var i = 0, - len = elems.length, - bulk = key == null; - - // Sets many values - if ( toType( key ) === "object" ) { - chainable = true; - for ( i in key ) { - access( elems, fn, i, key[ i ], true, emptyGet, raw ); - } - - // Sets one value - } else if ( value !== undefined ) { - chainable = true; - - if ( !isFunction( value ) ) { - raw = true; - } - - if ( bulk ) { - - // Bulk operations run against the entire set - if ( raw ) { - fn.call( elems, value ); - fn = null; - - // ...except when executing function 
values - } else { - bulk = fn; - fn = function( elem, _key, value ) { - return bulk.call( jQuery( elem ), value ); - }; - } - } - - if ( fn ) { - for ( ; i < len; i++ ) { - fn( - elems[ i ], key, raw ? - value : - value.call( elems[ i ], i, fn( elems[ i ], key ) ) - ); - } - } - } - - if ( chainable ) { - return elems; - } - - // Gets - if ( bulk ) { - return fn.call( elems ); - } - - return len ? fn( elems[ 0 ], key ) : emptyGet; -}; - - -// Matches dashed string for camelizing -var rmsPrefix = /^-ms-/, - rdashAlpha = /-([a-z])/g; - -// Used by camelCase as callback to replace() -function fcamelCase( _all, letter ) { - return letter.toUpperCase(); -} - -// Convert dashed to camelCase; used by the css and data modules -// Support: IE <=9 - 11, Edge 12 - 15 -// Microsoft forgot to hump their vendor prefix (#9572) -function camelCase( string ) { - return string.replace( rmsPrefix, "ms-" ).replace( rdashAlpha, fcamelCase ); -} -var acceptData = function( owner ) { - - // Accepts only: - // - Node - // - Node.ELEMENT_NODE - // - Node.DOCUMENT_NODE - // - Object - // - Any - return owner.nodeType === 1 || owner.nodeType === 9 || !( +owner.nodeType ); -}; - - - - -function Data() { - this.expando = jQuery.expando + Data.uid++; -} - -Data.uid = 1; - -Data.prototype = { - - cache: function( owner ) { - - // Check if the owner object already has a cache - var value = owner[ this.expando ]; - - // If not, create one - if ( !value ) { - value = {}; - - // We can accept data for non-element nodes in modern browsers, - // but we should not, see #8335. - // Always return an empty object. 
- if ( acceptData( owner ) ) { - - // If it is a node unlikely to be stringify-ed or looped over - // use plain assignment - if ( owner.nodeType ) { - owner[ this.expando ] = value; - - // Otherwise secure it in a non-enumerable property - // configurable must be true to allow the property to be - // deleted when data is removed - } else { - Object.defineProperty( owner, this.expando, { - value: value, - configurable: true - } ); - } - } - } - - return value; - }, - set: function( owner, data, value ) { - var prop, - cache = this.cache( owner ); - - // Handle: [ owner, key, value ] args - // Always use camelCase key (gh-2257) - if ( typeof data === "string" ) { - cache[ camelCase( data ) ] = value; - - // Handle: [ owner, { properties } ] args - } else { - - // Copy the properties one-by-one to the cache object - for ( prop in data ) { - cache[ camelCase( prop ) ] = data[ prop ]; - } - } - return cache; - }, - get: function( owner, key ) { - return key === undefined ? - this.cache( owner ) : - - // Always use camelCase key (gh-2257) - owner[ this.expando ] && owner[ this.expando ][ camelCase( key ) ]; - }, - access: function( owner, key, value ) { - - // In cases where either: - // - // 1. No key was specified - // 2. A string key was specified, but no value provided - // - // Take the "read" path and allow the get method to determine - // which value to return, respectively either: - // - // 1. The entire cache object - // 2. The data stored at the key - // - if ( key === undefined || - ( ( key && typeof key === "string" ) && value === undefined ) ) { - - return this.get( owner, key ); - } - - // When the key is not a string, or both a key and value - // are specified, set or extend (existing objects) with either: - // - // 1. An object of properties - // 2. 
A key and value - // - this.set( owner, key, value ); - - // Since the "set" path can have two possible entry points - // return the expected data based on which path was taken[*] - return value !== undefined ? value : key; - }, - remove: function( owner, key ) { - var i, - cache = owner[ this.expando ]; - - if ( cache === undefined ) { - return; - } - - if ( key !== undefined ) { - - // Support array or space separated string of keys - if ( Array.isArray( key ) ) { - - // If key is an array of keys... - // We always set camelCase keys, so remove that. - key = key.map( camelCase ); - } else { - key = camelCase( key ); - - // If a key with the spaces exists, use it. - // Otherwise, create an array by matching non-whitespace - key = key in cache ? - [ key ] : - ( key.match( rnothtmlwhite ) || [] ); - } - - i = key.length; - - while ( i-- ) { - delete cache[ key[ i ] ]; - } - } - - // Remove the expando if there's no more data - if ( key === undefined || jQuery.isEmptyObject( cache ) ) { - - // Support: Chrome <=35 - 45 - // Webkit & Blink performance suffers when deleting properties - // from DOM nodes, so set to undefined instead - // https://bugs.chromium.org/p/chromium/issues/detail?id=378607 (bug restricted) - if ( owner.nodeType ) { - owner[ this.expando ] = undefined; - } else { - delete owner[ this.expando ]; - } - } - }, - hasData: function( owner ) { - var cache = owner[ this.expando ]; - return cache !== undefined && !jQuery.isEmptyObject( cache ); - } -}; -var dataPriv = new Data(); - -var dataUser = new Data(); - - - -// Implementation Summary -// -// 1. Enforce API surface and semantic compatibility with 1.9.x branch -// 2. Improve the module's maintainability by reducing the storage -// paths to a single mechanism. -// 3. Use the same single mechanism to support "private" and "user" data. -// 4. _Never_ expose "private" data to user code (TODO: Drop _data, _removeData) -// 5. Avoid exposing implementation details on user objects (eg. 
expando properties) -// 6. Provide a clear path for implementation upgrade to WeakMap in 2014 - -var rbrace = /^(?:\{[\w\W]*\}|\[[\w\W]*\])$/, - rmultiDash = /[A-Z]/g; - -function getData( data ) { - if ( data === "true" ) { - return true; - } - - if ( data === "false" ) { - return false; - } - - if ( data === "null" ) { - return null; - } - - // Only convert to a number if it doesn't change the string - if ( data === +data + "" ) { - return +data; - } - - if ( rbrace.test( data ) ) { - return JSON.parse( data ); - } - - return data; -} - -function dataAttr( elem, key, data ) { - var name; - - // If nothing was found internally, try to fetch any - // data from the HTML5 data-* attribute - if ( data === undefined && elem.nodeType === 1 ) { - name = "data-" + key.replace( rmultiDash, "-$&" ).toLowerCase(); - data = elem.getAttribute( name ); - - if ( typeof data === "string" ) { - try { - data = getData( data ); - } catch ( e ) {} - - // Make sure we set the data so it isn't changed later - dataUser.set( elem, key, data ); - } else { - data = undefined; - } - } - return data; -} - -jQuery.extend( { - hasData: function( elem ) { - return dataUser.hasData( elem ) || dataPriv.hasData( elem ); - }, - - data: function( elem, name, data ) { - return dataUser.access( elem, name, data ); - }, - - removeData: function( elem, name ) { - dataUser.remove( elem, name ); - }, - - // TODO: Now that all calls to _data and _removeData have been replaced - // with direct calls to dataPriv methods, these can be deprecated. 
- _data: function( elem, name, data ) { - return dataPriv.access( elem, name, data ); - }, - - _removeData: function( elem, name ) { - dataPriv.remove( elem, name ); - } -} ); - -jQuery.fn.extend( { - data: function( key, value ) { - var i, name, data, - elem = this[ 0 ], - attrs = elem && elem.attributes; - - // Gets all values - if ( key === undefined ) { - if ( this.length ) { - data = dataUser.get( elem ); - - if ( elem.nodeType === 1 && !dataPriv.get( elem, "hasDataAttrs" ) ) { - i = attrs.length; - while ( i-- ) { - - // Support: IE 11 only - // The attrs elements can be null (#14894) - if ( attrs[ i ] ) { - name = attrs[ i ].name; - if ( name.indexOf( "data-" ) === 0 ) { - name = camelCase( name.slice( 5 ) ); - dataAttr( elem, name, data[ name ] ); - } - } - } - dataPriv.set( elem, "hasDataAttrs", true ); - } - } - - return data; - } - - // Sets multiple values - if ( typeof key === "object" ) { - return this.each( function() { - dataUser.set( this, key ); - } ); - } - - return access( this, function( value ) { - var data; - - // The calling jQuery object (element matches) is not empty - // (and therefore has an element appears at this[ 0 ]) and the - // `value` parameter was not undefined. An empty jQuery object - // will result in `undefined` for elem = this[ 0 ] which will - // throw an exception if an attempt to read a data cache is made. - if ( elem && value === undefined ) { - - // Attempt to get data from the cache - // The key will always be camelCased in Data - data = dataUser.get( elem, key ); - if ( data !== undefined ) { - return data; - } - - // Attempt to "discover" the data in - // HTML5 custom data-* attrs - data = dataAttr( elem, key ); - if ( data !== undefined ) { - return data; - } - - // We tried really hard, but the data doesn't exist. - return; - } - - // Set the data... 
- this.each( function() { - - // We always store the camelCased key - dataUser.set( this, key, value ); - } ); - }, null, value, arguments.length > 1, null, true ); - }, - - removeData: function( key ) { - return this.each( function() { - dataUser.remove( this, key ); - } ); - } -} ); - - -jQuery.extend( { - queue: function( elem, type, data ) { - var queue; - - if ( elem ) { - type = ( type || "fx" ) + "queue"; - queue = dataPriv.get( elem, type ); - - // Speed up dequeue by getting out quickly if this is just a lookup - if ( data ) { - if ( !queue || Array.isArray( data ) ) { - queue = dataPriv.access( elem, type, jQuery.makeArray( data ) ); - } else { - queue.push( data ); - } - } - return queue || []; - } - }, - - dequeue: function( elem, type ) { - type = type || "fx"; - - var queue = jQuery.queue( elem, type ), - startLength = queue.length, - fn = queue.shift(), - hooks = jQuery._queueHooks( elem, type ), - next = function() { - jQuery.dequeue( elem, type ); - }; - - // If the fx queue is dequeued, always remove the progress sentinel - if ( fn === "inprogress" ) { - fn = queue.shift(); - startLength--; - } - - if ( fn ) { - - // Add a progress sentinel to prevent the fx queue from being - // automatically dequeued - if ( type === "fx" ) { - queue.unshift( "inprogress" ); - } - - // Clear up the last queue stop function - delete hooks.stop; - fn.call( elem, next, hooks ); - } - - if ( !startLength && hooks ) { - hooks.empty.fire(); - } - }, - - // Not public - generate a queueHooks object, or return the current one - _queueHooks: function( elem, type ) { - var key = type + "queueHooks"; - return dataPriv.get( elem, key ) || dataPriv.access( elem, key, { - empty: jQuery.Callbacks( "once memory" ).add( function() { - dataPriv.remove( elem, [ type + "queue", key ] ); - } ) - } ); - } -} ); - -jQuery.fn.extend( { - queue: function( type, data ) { - var setter = 2; - - if ( typeof type !== "string" ) { - data = type; - type = "fx"; - setter--; - } - - if ( 
arguments.length < setter ) { - return jQuery.queue( this[ 0 ], type ); - } - - return data === undefined ? - this : - this.each( function() { - var queue = jQuery.queue( this, type, data ); - - // Ensure a hooks for this queue - jQuery._queueHooks( this, type ); - - if ( type === "fx" && queue[ 0 ] !== "inprogress" ) { - jQuery.dequeue( this, type ); - } - } ); - }, - dequeue: function( type ) { - return this.each( function() { - jQuery.dequeue( this, type ); - } ); - }, - clearQueue: function( type ) { - return this.queue( type || "fx", [] ); - }, - - // Get a promise resolved when queues of a certain type - // are emptied (fx is the type by default) - promise: function( type, obj ) { - var tmp, - count = 1, - defer = jQuery.Deferred(), - elements = this, - i = this.length, - resolve = function() { - if ( !( --count ) ) { - defer.resolveWith( elements, [ elements ] ); - } - }; - - if ( typeof type !== "string" ) { - obj = type; - type = undefined; - } - type = type || "fx"; - - while ( i-- ) { - tmp = dataPriv.get( elements[ i ], type + "queueHooks" ); - if ( tmp && tmp.empty ) { - count++; - tmp.empty.add( resolve ); - } - } - resolve(); - return defer.promise( obj ); - } -} ); -var pnum = ( /[+-]?(?:\d*\.|)\d+(?:[eE][+-]?\d+|)/ ).source; - -var rcssNum = new RegExp( "^(?:([+-])=|)(" + pnum + ")([a-z%]*)$", "i" ); - - -var cssExpand = [ "Top", "Right", "Bottom", "Left" ]; - -var documentElement = document.documentElement; - - - - var isAttached = function( elem ) { - return jQuery.contains( elem.ownerDocument, elem ); - }, - composed = { composed: true }; - - // Support: IE 9 - 11+, Edge 12 - 18+, iOS 10.0 - 10.2 only - // Check attachment across shadow DOM boundaries when possible (gh-3504) - // Support: iOS 10.0-10.2 only - // Early iOS 10 versions support `attachShadow` but not `getRootNode`, - // leading to errors. We need to check for `getRootNode`. 
- if ( documentElement.getRootNode ) { - isAttached = function( elem ) { - return jQuery.contains( elem.ownerDocument, elem ) || - elem.getRootNode( composed ) === elem.ownerDocument; - }; - } -var isHiddenWithinTree = function( elem, el ) { - - // isHiddenWithinTree might be called from jQuery#filter function; - // in that case, element will be second argument - elem = el || elem; - - // Inline style trumps all - return elem.style.display === "none" || - elem.style.display === "" && - - // Otherwise, check computed style - // Support: Firefox <=43 - 45 - // Disconnected elements can have computed display: none, so first confirm that elem is - // in the document. - isAttached( elem ) && - - jQuery.css( elem, "display" ) === "none"; - }; - - - -function adjustCSS( elem, prop, valueParts, tween ) { - var adjusted, scale, - maxIterations = 20, - currentValue = tween ? - function() { - return tween.cur(); - } : - function() { - return jQuery.css( elem, prop, "" ); - }, - initial = currentValue(), - unit = valueParts && valueParts[ 3 ] || ( jQuery.cssNumber[ prop ] ? "" : "px" ), - - // Starting value computation is required for potential unit mismatches - initialInUnit = elem.nodeType && - ( jQuery.cssNumber[ prop ] || unit !== "px" && +initial ) && - rcssNum.exec( jQuery.css( elem, prop ) ); - - if ( initialInUnit && initialInUnit[ 3 ] !== unit ) { - - // Support: Firefox <=54 - // Halve the iteration target value to prevent interference from CSS upper bounds (gh-2144) - initial = initial / 2; - - // Trust units reported by jQuery.css - unit = unit || initialInUnit[ 3 ]; - - // Iteratively approximate from a nonzero starting point - initialInUnit = +initial || 1; - - while ( maxIterations-- ) { - - // Evaluate and update our best guess (doubling guesses that zero out). - // Finish if the scale equals or crosses 1 (making the old*new product non-positive). 
- jQuery.style( elem, prop, initialInUnit + unit ); - if ( ( 1 - scale ) * ( 1 - ( scale = currentValue() / initial || 0.5 ) ) <= 0 ) { - maxIterations = 0; - } - initialInUnit = initialInUnit / scale; - - } - - initialInUnit = initialInUnit * 2; - jQuery.style( elem, prop, initialInUnit + unit ); - - // Make sure we update the tween properties later on - valueParts = valueParts || []; - } - - if ( valueParts ) { - initialInUnit = +initialInUnit || +initial || 0; - - // Apply relative offset (+=/-=) if specified - adjusted = valueParts[ 1 ] ? - initialInUnit + ( valueParts[ 1 ] + 1 ) * valueParts[ 2 ] : - +valueParts[ 2 ]; - if ( tween ) { - tween.unit = unit; - tween.start = initialInUnit; - tween.end = adjusted; - } - } - return adjusted; -} - - -var defaultDisplayMap = {}; - -function getDefaultDisplay( elem ) { - var temp, - doc = elem.ownerDocument, - nodeName = elem.nodeName, - display = defaultDisplayMap[ nodeName ]; - - if ( display ) { - return display; - } - - temp = doc.body.appendChild( doc.createElement( nodeName ) ); - display = jQuery.css( temp, "display" ); - - temp.parentNode.removeChild( temp ); - - if ( display === "none" ) { - display = "block"; - } - defaultDisplayMap[ nodeName ] = display; - - return display; -} - -function showHide( elements, show ) { - var display, elem, - values = [], - index = 0, - length = elements.length; - - // Determine new display value for elements that need to change - for ( ; index < length; index++ ) { - elem = elements[ index ]; - if ( !elem.style ) { - continue; - } - - display = elem.style.display; - if ( show ) { - - // Since we force visibility upon cascade-hidden elements, an immediate (and slow) - // check is required in this first loop unless we have a nonempty display value (either - // inline or about-to-be-restored) - if ( display === "none" ) { - values[ index ] = dataPriv.get( elem, "display" ) || null; - if ( !values[ index ] ) { - elem.style.display = ""; - } - } - if ( elem.style.display === "" && 
isHiddenWithinTree( elem ) ) { - values[ index ] = getDefaultDisplay( elem ); - } - } else { - if ( display !== "none" ) { - values[ index ] = "none"; - - // Remember what we're overwriting - dataPriv.set( elem, "display", display ); - } - } - } - - // Set the display of the elements in a second loop to avoid constant reflow - for ( index = 0; index < length; index++ ) { - if ( values[ index ] != null ) { - elements[ index ].style.display = values[ index ]; - } - } - - return elements; -} - -jQuery.fn.extend( { - show: function() { - return showHide( this, true ); - }, - hide: function() { - return showHide( this ); - }, - toggle: function( state ) { - if ( typeof state === "boolean" ) { - return state ? this.show() : this.hide(); - } - - return this.each( function() { - if ( isHiddenWithinTree( this ) ) { - jQuery( this ).show(); - } else { - jQuery( this ).hide(); - } - } ); - } -} ); -var rcheckableType = ( /^(?:checkbox|radio)$/i ); - -var rtagName = ( /<([a-z][^\/\0>\x20\t\r\n\f]*)/i ); - -var rscriptType = ( /^$|^module$|\/(?:java|ecma)script/i ); - - - -( function() { - var fragment = document.createDocumentFragment(), - div = fragment.appendChild( document.createElement( "div" ) ), - input = document.createElement( "input" ); - - // Support: Android 4.0 - 4.3 only - // Check state lost if the name is set (#11217) - // Support: Windows Web Apps (WWA) - // `name` and `type` must use .setAttribute for WWA (#14901) - input.setAttribute( "type", "radio" ); - input.setAttribute( "checked", "checked" ); - input.setAttribute( "name", "t" ); - - div.appendChild( input ); - - // Support: Android <=4.1 only - // Older WebKit doesn't clone checked state correctly in fragments - support.checkClone = div.cloneNode( true ).cloneNode( true ).lastChild.checked; - - // Support: IE <=11 only - // Make sure textarea (and checkbox) defaultValue is properly cloned - div.innerHTML = ""; - support.noCloneChecked = !!div.cloneNode( true ).lastChild.defaultValue; - - // Support: IE 
<=9 only - // IE <=9 replaces "; - support.option = !!div.lastChild; -} )(); - - -// We have to close these tags to support XHTML (#13200) -var wrapMap = { - - // XHTML parsers do not magically insert elements in the - // same way that tag soup parsers do. So we cannot shorten - // this by omitting or other required elements. - thead: [ 1, "", "
" ], - col: [ 2, "", "
" ], - tr: [ 2, "", "
" ], - td: [ 3, "", "
" ], - - _default: [ 0, "", "" ] -}; - -wrapMap.tbody = wrapMap.tfoot = wrapMap.colgroup = wrapMap.caption = wrapMap.thead; -wrapMap.th = wrapMap.td; - -// Support: IE <=9 only -if ( !support.option ) { - wrapMap.optgroup = wrapMap.option = [ 1, "" ]; -} - - -function getAll( context, tag ) { - - // Support: IE <=9 - 11 only - // Use typeof to avoid zero-argument method invocation on host objects (#15151) - var ret; - - if ( typeof context.getElementsByTagName !== "undefined" ) { - ret = context.getElementsByTagName( tag || "*" ); - - } else if ( typeof context.querySelectorAll !== "undefined" ) { - ret = context.querySelectorAll( tag || "*" ); - - } else { - ret = []; - } - - if ( tag === undefined || tag && nodeName( context, tag ) ) { - return jQuery.merge( [ context ], ret ); - } - - return ret; -} - - -// Mark scripts as having already been evaluated -function setGlobalEval( elems, refElements ) { - var i = 0, - l = elems.length; - - for ( ; i < l; i++ ) { - dataPriv.set( - elems[ i ], - "globalEval", - !refElements || dataPriv.get( refElements[ i ], "globalEval" ) - ); - } -} - - -var rhtml = /<|&#?\w+;/; - -function buildFragment( elems, context, scripts, selection, ignored ) { - var elem, tmp, tag, wrap, attached, j, - fragment = context.createDocumentFragment(), - nodes = [], - i = 0, - l = elems.length; - - for ( ; i < l; i++ ) { - elem = elems[ i ]; - - if ( elem || elem === 0 ) { - - // Add nodes directly - if ( toType( elem ) === "object" ) { - - // Support: Android <=4.0 only, PhantomJS 1 only - // push.apply(_, arraylike) throws on ancient WebKit - jQuery.merge( nodes, elem.nodeType ? 
[ elem ] : elem ); - - // Convert non-html into a text node - } else if ( !rhtml.test( elem ) ) { - nodes.push( context.createTextNode( elem ) ); - - // Convert html into DOM nodes - } else { - tmp = tmp || fragment.appendChild( context.createElement( "div" ) ); - - // Deserialize a standard representation - tag = ( rtagName.exec( elem ) || [ "", "" ] )[ 1 ].toLowerCase(); - wrap = wrapMap[ tag ] || wrapMap._default; - tmp.innerHTML = wrap[ 1 ] + jQuery.htmlPrefilter( elem ) + wrap[ 2 ]; - - // Descend through wrappers to the right content - j = wrap[ 0 ]; - while ( j-- ) { - tmp = tmp.lastChild; - } - - // Support: Android <=4.0 only, PhantomJS 1 only - // push.apply(_, arraylike) throws on ancient WebKit - jQuery.merge( nodes, tmp.childNodes ); - - // Remember the top-level container - tmp = fragment.firstChild; - - // Ensure the created nodes are orphaned (#12392) - tmp.textContent = ""; - } - } - } - - // Remove wrapper from fragment - fragment.textContent = ""; - - i = 0; - while ( ( elem = nodes[ i++ ] ) ) { - - // Skip elements already in the context collection (trac-4087) - if ( selection && jQuery.inArray( elem, selection ) > -1 ) { - if ( ignored ) { - ignored.push( elem ); - } - continue; - } - - attached = isAttached( elem ); - - // Append to fragment - tmp = getAll( fragment.appendChild( elem ), "script" ); - - // Preserve script evaluation history - if ( attached ) { - setGlobalEval( tmp ); - } - - // Capture executables - if ( scripts ) { - j = 0; - while ( ( elem = tmp[ j++ ] ) ) { - if ( rscriptType.test( elem.type || "" ) ) { - scripts.push( elem ); - } - } - } - } - - return fragment; -} - - -var - rkeyEvent = /^key/, - rmouseEvent = /^(?:mouse|pointer|contextmenu|drag|drop)|click/, - rtypenamespace = /^([^.]*)(?:\.(.+)|)/; - -function returnTrue() { - return true; -} - -function returnFalse() { - return false; -} - -// Support: IE <=9 - 11+ -// focus() and blur() are asynchronous, except when they are no-op. 
-// So expect focus to be synchronous when the element is already active, -// and blur to be synchronous when the element is not already active. -// (focus and blur are always synchronous in other supported browsers, -// this just defines when we can count on it). -function expectSync( elem, type ) { - return ( elem === safeActiveElement() ) === ( type === "focus" ); -} - -// Support: IE <=9 only -// Accessing document.activeElement can throw unexpectedly -// https://bugs.jquery.com/ticket/13393 -function safeActiveElement() { - try { - return document.activeElement; - } catch ( err ) { } -} - -function on( elem, types, selector, data, fn, one ) { - var origFn, type; - - // Types can be a map of types/handlers - if ( typeof types === "object" ) { - - // ( types-Object, selector, data ) - if ( typeof selector !== "string" ) { - - // ( types-Object, data ) - data = data || selector; - selector = undefined; - } - for ( type in types ) { - on( elem, type, selector, data, types[ type ], one ); - } - return elem; - } - - if ( data == null && fn == null ) { - - // ( types, fn ) - fn = selector; - data = selector = undefined; - } else if ( fn == null ) { - if ( typeof selector === "string" ) { - - // ( types, selector, fn ) - fn = data; - data = undefined; - } else { - - // ( types, data, fn ) - fn = data; - data = selector; - selector = undefined; - } - } - if ( fn === false ) { - fn = returnFalse; - } else if ( !fn ) { - return elem; - } - - if ( one === 1 ) { - origFn = fn; - fn = function( event ) { - - // Can use an empty set, since event contains the info - jQuery().off( event ); - return origFn.apply( this, arguments ); - }; - - // Use same guid so caller can remove using origFn - fn.guid = origFn.guid || ( origFn.guid = jQuery.guid++ ); - } - return elem.each( function() { - jQuery.event.add( this, types, fn, data, selector ); - } ); -} - -/* - * Helper functions for managing events -- not part of the public interface. 
- * Props to Dean Edwards' addEvent library for many of the ideas. - */ -jQuery.event = { - - global: {}, - - add: function( elem, types, handler, data, selector ) { - - var handleObjIn, eventHandle, tmp, - events, t, handleObj, - special, handlers, type, namespaces, origType, - elemData = dataPriv.get( elem ); - - // Only attach events to objects that accept data - if ( !acceptData( elem ) ) { - return; - } - - // Caller can pass in an object of custom data in lieu of the handler - if ( handler.handler ) { - handleObjIn = handler; - handler = handleObjIn.handler; - selector = handleObjIn.selector; - } - - // Ensure that invalid selectors throw exceptions at attach time - // Evaluate against documentElement in case elem is a non-element node (e.g., document) - if ( selector ) { - jQuery.find.matchesSelector( documentElement, selector ); - } - - // Make sure that the handler has a unique ID, used to find/remove it later - if ( !handler.guid ) { - handler.guid = jQuery.guid++; - } - - // Init the element's event structure and main handler, if this is the first - if ( !( events = elemData.events ) ) { - events = elemData.events = Object.create( null ); - } - if ( !( eventHandle = elemData.handle ) ) { - eventHandle = elemData.handle = function( e ) { - - // Discard the second event of a jQuery.event.trigger() and - // when an event is called after a page has unloaded - return typeof jQuery !== "undefined" && jQuery.event.triggered !== e.type ? - jQuery.event.dispatch.apply( elem, arguments ) : undefined; - }; - } - - // Handle multiple events separated by a space - types = ( types || "" ).match( rnothtmlwhite ) || [ "" ]; - t = types.length; - while ( t-- ) { - tmp = rtypenamespace.exec( types[ t ] ) || []; - type = origType = tmp[ 1 ]; - namespaces = ( tmp[ 2 ] || "" ).split( "." 
).sort(); - - // There *must* be a type, no attaching namespace-only handlers - if ( !type ) { - continue; - } - - // If event changes its type, use the special event handlers for the changed type - special = jQuery.event.special[ type ] || {}; - - // If selector defined, determine special event api type, otherwise given type - type = ( selector ? special.delegateType : special.bindType ) || type; - - // Update special based on newly reset type - special = jQuery.event.special[ type ] || {}; - - // handleObj is passed to all event handlers - handleObj = jQuery.extend( { - type: type, - origType: origType, - data: data, - handler: handler, - guid: handler.guid, - selector: selector, - needsContext: selector && jQuery.expr.match.needsContext.test( selector ), - namespace: namespaces.join( "." ) - }, handleObjIn ); - - // Init the event handler queue if we're the first - if ( !( handlers = events[ type ] ) ) { - handlers = events[ type ] = []; - handlers.delegateCount = 0; - - // Only use addEventListener if the special events handler returns false - if ( !special.setup || - special.setup.call( elem, data, namespaces, eventHandle ) === false ) { - - if ( elem.addEventListener ) { - elem.addEventListener( type, eventHandle ); - } - } - } - - if ( special.add ) { - special.add.call( elem, handleObj ); - - if ( !handleObj.handler.guid ) { - handleObj.handler.guid = handler.guid; - } - } - - // Add to the element's handler list, delegates in front - if ( selector ) { - handlers.splice( handlers.delegateCount++, 0, handleObj ); - } else { - handlers.push( handleObj ); - } - - // Keep track of which events have ever been used, for event optimization - jQuery.event.global[ type ] = true; - } - - }, - - // Detach an event or set of events from an element - remove: function( elem, types, handler, selector, mappedTypes ) { - - var j, origCount, tmp, - events, t, handleObj, - special, handlers, type, namespaces, origType, - elemData = dataPriv.hasData( elem ) && dataPriv.get( 
elem ); - - if ( !elemData || !( events = elemData.events ) ) { - return; - } - - // Once for each type.namespace in types; type may be omitted - types = ( types || "" ).match( rnothtmlwhite ) || [ "" ]; - t = types.length; - while ( t-- ) { - tmp = rtypenamespace.exec( types[ t ] ) || []; - type = origType = tmp[ 1 ]; - namespaces = ( tmp[ 2 ] || "" ).split( "." ).sort(); - - // Unbind all events (on this namespace, if provided) for the element - if ( !type ) { - for ( type in events ) { - jQuery.event.remove( elem, type + types[ t ], handler, selector, true ); - } - continue; - } - - special = jQuery.event.special[ type ] || {}; - type = ( selector ? special.delegateType : special.bindType ) || type; - handlers = events[ type ] || []; - tmp = tmp[ 2 ] && - new RegExp( "(^|\\.)" + namespaces.join( "\\.(?:.*\\.|)" ) + "(\\.|$)" ); - - // Remove matching events - origCount = j = handlers.length; - while ( j-- ) { - handleObj = handlers[ j ]; - - if ( ( mappedTypes || origType === handleObj.origType ) && - ( !handler || handler.guid === handleObj.guid ) && - ( !tmp || tmp.test( handleObj.namespace ) ) && - ( !selector || selector === handleObj.selector || - selector === "**" && handleObj.selector ) ) { - handlers.splice( j, 1 ); - - if ( handleObj.selector ) { - handlers.delegateCount--; - } - if ( special.remove ) { - special.remove.call( elem, handleObj ); - } - } - } - - // Remove generic event handler if we removed something and no more handlers exist - // (avoids potential for endless recursion during removal of special event handlers) - if ( origCount && !handlers.length ) { - if ( !special.teardown || - special.teardown.call( elem, namespaces, elemData.handle ) === false ) { - - jQuery.removeEvent( elem, type, elemData.handle ); - } - - delete events[ type ]; - } - } - - // Remove data and the expando if it's no longer used - if ( jQuery.isEmptyObject( events ) ) { - dataPriv.remove( elem, "handle events" ); - } - }, - - dispatch: function( nativeEvent ) { - - 
var i, j, ret, matched, handleObj, handlerQueue, - args = new Array( arguments.length ), - - // Make a writable jQuery.Event from the native event object - event = jQuery.event.fix( nativeEvent ), - - handlers = ( - dataPriv.get( this, "events" ) || Object.create( null ) - )[ event.type ] || [], - special = jQuery.event.special[ event.type ] || {}; - - // Use the fix-ed jQuery.Event rather than the (read-only) native event - args[ 0 ] = event; - - for ( i = 1; i < arguments.length; i++ ) { - args[ i ] = arguments[ i ]; - } - - event.delegateTarget = this; - - // Call the preDispatch hook for the mapped type, and let it bail if desired - if ( special.preDispatch && special.preDispatch.call( this, event ) === false ) { - return; - } - - // Determine handlers - handlerQueue = jQuery.event.handlers.call( this, event, handlers ); - - // Run delegates first; they may want to stop propagation beneath us - i = 0; - while ( ( matched = handlerQueue[ i++ ] ) && !event.isPropagationStopped() ) { - event.currentTarget = matched.elem; - - j = 0; - while ( ( handleObj = matched.handlers[ j++ ] ) && - !event.isImmediatePropagationStopped() ) { - - // If the event is namespaced, then each handler is only invoked if it is - // specially universal or its namespaces are a superset of the event's. 
- if ( !event.rnamespace || handleObj.namespace === false || - event.rnamespace.test( handleObj.namespace ) ) { - - event.handleObj = handleObj; - event.data = handleObj.data; - - ret = ( ( jQuery.event.special[ handleObj.origType ] || {} ).handle || - handleObj.handler ).apply( matched.elem, args ); - - if ( ret !== undefined ) { - if ( ( event.result = ret ) === false ) { - event.preventDefault(); - event.stopPropagation(); - } - } - } - } - } - - // Call the postDispatch hook for the mapped type - if ( special.postDispatch ) { - special.postDispatch.call( this, event ); - } - - return event.result; - }, - - handlers: function( event, handlers ) { - var i, handleObj, sel, matchedHandlers, matchedSelectors, - handlerQueue = [], - delegateCount = handlers.delegateCount, - cur = event.target; - - // Find delegate handlers - if ( delegateCount && - - // Support: IE <=9 - // Black-hole SVG instance trees (trac-13180) - cur.nodeType && - - // Support: Firefox <=42 - // Suppress spec-violating clicks indicating a non-primary pointer button (trac-3861) - // https://www.w3.org/TR/DOM-Level-3-Events/#event-type-click - // Support: IE 11 only - // ...but not arrow key "clicks" of radio inputs, which can have `button` -1 (gh-2343) - !( event.type === "click" && event.button >= 1 ) ) { - - for ( ; cur !== this; cur = cur.parentNode || this ) { - - // Don't check non-elements (#13208) - // Don't process clicks on disabled elements (#6911, #8165, #11382, #11764) - if ( cur.nodeType === 1 && !( event.type === "click" && cur.disabled === true ) ) { - matchedHandlers = []; - matchedSelectors = {}; - for ( i = 0; i < delegateCount; i++ ) { - handleObj = handlers[ i ]; - - // Don't conflict with Object.prototype properties (#13203) - sel = handleObj.selector + " "; - - if ( matchedSelectors[ sel ] === undefined ) { - matchedSelectors[ sel ] = handleObj.needsContext ? 
- jQuery( sel, this ).index( cur ) > -1 : - jQuery.find( sel, this, null, [ cur ] ).length; - } - if ( matchedSelectors[ sel ] ) { - matchedHandlers.push( handleObj ); - } - } - if ( matchedHandlers.length ) { - handlerQueue.push( { elem: cur, handlers: matchedHandlers } ); - } - } - } - } - - // Add the remaining (directly-bound) handlers - cur = this; - if ( delegateCount < handlers.length ) { - handlerQueue.push( { elem: cur, handlers: handlers.slice( delegateCount ) } ); - } - - return handlerQueue; - }, - - addProp: function( name, hook ) { - Object.defineProperty( jQuery.Event.prototype, name, { - enumerable: true, - configurable: true, - - get: isFunction( hook ) ? - function() { - if ( this.originalEvent ) { - return hook( this.originalEvent ); - } - } : - function() { - if ( this.originalEvent ) { - return this.originalEvent[ name ]; - } - }, - - set: function( value ) { - Object.defineProperty( this, name, { - enumerable: true, - configurable: true, - writable: true, - value: value - } ); - } - } ); - }, - - fix: function( originalEvent ) { - return originalEvent[ jQuery.expando ] ? - originalEvent : - new jQuery.Event( originalEvent ); - }, - - special: { - load: { - - // Prevent triggered image.load events from bubbling to window.load - noBubble: true - }, - click: { - - // Utilize native event to ensure correct state for checkable inputs - setup: function( data ) { - - // For mutual compressibility with _default, replace `this` access with a local var. - // `|| data` is dead code meant only to preserve the variable through minification. - var el = this || data; - - // Claim the first handler - if ( rcheckableType.test( el.type ) && - el.click && nodeName( el, "input" ) ) { - - // dataPriv.set( el, "click", ... 
) - leverageNative( el, "click", returnTrue ); - } - - // Return false to allow normal processing in the caller - return false; - }, - trigger: function( data ) { - - // For mutual compressibility with _default, replace `this` access with a local var. - // `|| data` is dead code meant only to preserve the variable through minification. - var el = this || data; - - // Force setup before triggering a click - if ( rcheckableType.test( el.type ) && - el.click && nodeName( el, "input" ) ) { - - leverageNative( el, "click" ); - } - - // Return non-false to allow normal event-path propagation - return true; - }, - - // For cross-browser consistency, suppress native .click() on links - // Also prevent it if we're currently inside a leveraged native-event stack - _default: function( event ) { - var target = event.target; - return rcheckableType.test( target.type ) && - target.click && nodeName( target, "input" ) && - dataPriv.get( target, "click" ) || - nodeName( target, "a" ); - } - }, - - beforeunload: { - postDispatch: function( event ) { - - // Support: Firefox 20+ - // Firefox doesn't alert if the returnValue field is not set. - if ( event.result !== undefined && event.originalEvent ) { - event.originalEvent.returnValue = event.result; - } - } - } - } -}; - -// Ensure the presence of an event listener that handles manually-triggered -// synthetic events by interrupting progress until reinvoked in response to -// *native* events that it fires directly, ensuring that state changes have -// already occurred before other listeners are invoked. 
-function leverageNative( el, type, expectSync ) { - - // Missing expectSync indicates a trigger call, which must force setup through jQuery.event.add - if ( !expectSync ) { - if ( dataPriv.get( el, type ) === undefined ) { - jQuery.event.add( el, type, returnTrue ); - } - return; - } - - // Register the controller as a special universal handler for all event namespaces - dataPriv.set( el, type, false ); - jQuery.event.add( el, type, { - namespace: false, - handler: function( event ) { - var notAsync, result, - saved = dataPriv.get( this, type ); - - if ( ( event.isTrigger & 1 ) && this[ type ] ) { - - // Interrupt processing of the outer synthetic .trigger()ed event - // Saved data should be false in such cases, but might be a leftover capture object - // from an async native handler (gh-4350) - if ( !saved.length ) { - - // Store arguments for use when handling the inner native event - // There will always be at least one argument (an event object), so this array - // will not be confused with a leftover capture object. - saved = slice.call( arguments ); - dataPriv.set( this, type, saved ); - - // Trigger the native event and capture its result - // Support: IE <=9 - 11+ - // focus() and blur() are asynchronous - notAsync = expectSync( this, type ); - this[ type ](); - result = dataPriv.get( this, type ); - if ( saved !== result || notAsync ) { - dataPriv.set( this, type, false ); - } else { - result = {}; - } - if ( saved !== result ) { - - // Cancel the outer synthetic event - event.stopImmediatePropagation(); - event.preventDefault(); - return result.value; - } - - // If this is an inner synthetic event for an event with a bubbling surrogate - // (focus or blur), assume that the surrogate already propagated from triggering the - // native event and prevent that from happening again here. - // This technically gets the ordering wrong w.r.t. 
to `.trigger()` (in which the - // bubbling surrogate propagates *after* the non-bubbling base), but that seems - // less bad than duplication. - } else if ( ( jQuery.event.special[ type ] || {} ).delegateType ) { - event.stopPropagation(); - } - - // If this is a native event triggered above, everything is now in order - // Fire an inner synthetic event with the original arguments - } else if ( saved.length ) { - - // ...and capture the result - dataPriv.set( this, type, { - value: jQuery.event.trigger( - - // Support: IE <=9 - 11+ - // Extend with the prototype to reset the above stopImmediatePropagation() - jQuery.extend( saved[ 0 ], jQuery.Event.prototype ), - saved.slice( 1 ), - this - ) - } ); - - // Abort handling of the native event - event.stopImmediatePropagation(); - } - } - } ); -} - -jQuery.removeEvent = function( elem, type, handle ) { - - // This "if" is needed for plain objects - if ( elem.removeEventListener ) { - elem.removeEventListener( type, handle ); - } -}; - -jQuery.Event = function( src, props ) { - - // Allow instantiation without the 'new' keyword - if ( !( this instanceof jQuery.Event ) ) { - return new jQuery.Event( src, props ); - } - - // Event object - if ( src && src.type ) { - this.originalEvent = src; - this.type = src.type; - - // Events bubbling up the document may have been marked as prevented - // by a handler lower down the tree; reflect the correct value. - this.isDefaultPrevented = src.defaultPrevented || - src.defaultPrevented === undefined && - - // Support: Android <=2.3 only - src.returnValue === false ? - returnTrue : - returnFalse; - - // Create target properties - // Support: Safari <=6 - 7 only - // Target should not be a text node (#504, #13143) - this.target = ( src.target && src.target.nodeType === 3 ) ? 
- src.target.parentNode : - src.target; - - this.currentTarget = src.currentTarget; - this.relatedTarget = src.relatedTarget; - - // Event type - } else { - this.type = src; - } - - // Put explicitly provided properties onto the event object - if ( props ) { - jQuery.extend( this, props ); - } - - // Create a timestamp if incoming event doesn't have one - this.timeStamp = src && src.timeStamp || Date.now(); - - // Mark it as fixed - this[ jQuery.expando ] = true; -}; - -// jQuery.Event is based on DOM3 Events as specified by the ECMAScript Language Binding -// https://www.w3.org/TR/2003/WD-DOM-Level-3-Events-20030331/ecma-script-binding.html -jQuery.Event.prototype = { - constructor: jQuery.Event, - isDefaultPrevented: returnFalse, - isPropagationStopped: returnFalse, - isImmediatePropagationStopped: returnFalse, - isSimulated: false, - - preventDefault: function() { - var e = this.originalEvent; - - this.isDefaultPrevented = returnTrue; - - if ( e && !this.isSimulated ) { - e.preventDefault(); - } - }, - stopPropagation: function() { - var e = this.originalEvent; - - this.isPropagationStopped = returnTrue; - - if ( e && !this.isSimulated ) { - e.stopPropagation(); - } - }, - stopImmediatePropagation: function() { - var e = this.originalEvent; - - this.isImmediatePropagationStopped = returnTrue; - - if ( e && !this.isSimulated ) { - e.stopImmediatePropagation(); - } - - this.stopPropagation(); - } -}; - -// Includes all common event props including KeyEvent and MouseEvent specific props -jQuery.each( { - altKey: true, - bubbles: true, - cancelable: true, - changedTouches: true, - ctrlKey: true, - detail: true, - eventPhase: true, - metaKey: true, - pageX: true, - pageY: true, - shiftKey: true, - view: true, - "char": true, - code: true, - charCode: true, - key: true, - keyCode: true, - button: true, - buttons: true, - clientX: true, - clientY: true, - offsetX: true, - offsetY: true, - pointerId: true, - pointerType: true, - screenX: true, - screenY: true, - 
targetTouches: true, - toElement: true, - touches: true, - - which: function( event ) { - var button = event.button; - - // Add which for key events - if ( event.which == null && rkeyEvent.test( event.type ) ) { - return event.charCode != null ? event.charCode : event.keyCode; - } - - // Add which for click: 1 === left; 2 === middle; 3 === right - if ( !event.which && button !== undefined && rmouseEvent.test( event.type ) ) { - if ( button & 1 ) { - return 1; - } - - if ( button & 2 ) { - return 3; - } - - if ( button & 4 ) { - return 2; - } - - return 0; - } - - return event.which; - } -}, jQuery.event.addProp ); - -jQuery.each( { focus: "focusin", blur: "focusout" }, function( type, delegateType ) { - jQuery.event.special[ type ] = { - - // Utilize native event if possible so blur/focus sequence is correct - setup: function() { - - // Claim the first handler - // dataPriv.set( this, "focus", ... ) - // dataPriv.set( this, "blur", ... ) - leverageNative( this, type, expectSync ); - - // Return false to allow normal processing in the caller - return false; - }, - trigger: function() { - - // Force setup before trigger - leverageNative( this, type ); - - // Return non-false to allow normal event-path propagation - return true; - }, - - delegateType: delegateType - }; -} ); - -// Create mouseenter/leave events using mouseover/out and event-time checks -// so that event delegation works in jQuery. -// Do the same for pointerenter/pointerleave and pointerover/pointerout -// -// Support: Safari 7 only -// Safari sends mouseenter too often; see: -// https://bugs.chromium.org/p/chromium/issues/detail?id=470258 -// for the description of the bug (it existed in older Chrome versions as well). 
-jQuery.each( { - mouseenter: "mouseover", - mouseleave: "mouseout", - pointerenter: "pointerover", - pointerleave: "pointerout" -}, function( orig, fix ) { - jQuery.event.special[ orig ] = { - delegateType: fix, - bindType: fix, - - handle: function( event ) { - var ret, - target = this, - related = event.relatedTarget, - handleObj = event.handleObj; - - // For mouseenter/leave call the handler if related is outside the target. - // NB: No relatedTarget if the mouse left/entered the browser window - if ( !related || ( related !== target && !jQuery.contains( target, related ) ) ) { - event.type = handleObj.origType; - ret = handleObj.handler.apply( this, arguments ); - event.type = fix; - } - return ret; - } - }; -} ); - -jQuery.fn.extend( { - - on: function( types, selector, data, fn ) { - return on( this, types, selector, data, fn ); - }, - one: function( types, selector, data, fn ) { - return on( this, types, selector, data, fn, 1 ); - }, - off: function( types, selector, fn ) { - var handleObj, type; - if ( types && types.preventDefault && types.handleObj ) { - - // ( event ) dispatched jQuery.Event - handleObj = types.handleObj; - jQuery( types.delegateTarget ).off( - handleObj.namespace ? - handleObj.origType + "." + handleObj.namespace : - handleObj.origType, - handleObj.selector, - handleObj.handler - ); - return this; - } - if ( typeof types === "object" ) { - - // ( types-object [, selector] ) - for ( type in types ) { - this.off( type, selector, types[ type ] ); - } - return this; - } - if ( selector === false || typeof selector === "function" ) { - - // ( types [, fn] ) - fn = selector; - selector = undefined; - } - if ( fn === false ) { - fn = returnFalse; - } - return this.each( function() { - jQuery.event.remove( this, types, fn, selector ); - } ); - } -} ); - - -var - - // Support: IE <=10 - 11, Edge 12 - 13 only - // In IE/Edge using regex groups here causes severe slowdowns. 
- // See https://connect.microsoft.com/IE/feedback/details/1736512/ - rnoInnerhtml = /\s*$/g; - -// Prefer a tbody over its parent table for containing new rows -function manipulationTarget( elem, content ) { - if ( nodeName( elem, "table" ) && - nodeName( content.nodeType !== 11 ? content : content.firstChild, "tr" ) ) { - - return jQuery( elem ).children( "tbody" )[ 0 ] || elem; - } - - return elem; -} - -// Replace/restore the type attribute of script elements for safe DOM manipulation -function disableScript( elem ) { - elem.type = ( elem.getAttribute( "type" ) !== null ) + "/" + elem.type; - return elem; -} -function restoreScript( elem ) { - if ( ( elem.type || "" ).slice( 0, 5 ) === "true/" ) { - elem.type = elem.type.slice( 5 ); - } else { - elem.removeAttribute( "type" ); - } - - return elem; -} - -function cloneCopyEvent( src, dest ) { - var i, l, type, pdataOld, udataOld, udataCur, events; - - if ( dest.nodeType !== 1 ) { - return; - } - - // 1. Copy private data: events, handlers, etc. - if ( dataPriv.hasData( src ) ) { - pdataOld = dataPriv.get( src ); - events = pdataOld.events; - - if ( events ) { - dataPriv.remove( dest, "handle events" ); - - for ( type in events ) { - for ( i = 0, l = events[ type ].length; i < l; i++ ) { - jQuery.event.add( dest, type, events[ type ][ i ] ); - } - } - } - } - - // 2. Copy user data - if ( dataUser.hasData( src ) ) { - udataOld = dataUser.access( src ); - udataCur = jQuery.extend( {}, udataOld ); - - dataUser.set( dest, udataCur ); - } -} - -// Fix IE bugs, see support tests -function fixInput( src, dest ) { - var nodeName = dest.nodeName.toLowerCase(); - - // Fails to persist the checked state of a cloned checkbox or radio button. 
- if ( nodeName === "input" && rcheckableType.test( src.type ) ) { - dest.checked = src.checked; - - // Fails to return the selected option to the default selected state when cloning options - } else if ( nodeName === "input" || nodeName === "textarea" ) { - dest.defaultValue = src.defaultValue; - } -} - -function domManip( collection, args, callback, ignored ) { - - // Flatten any nested arrays - args = flat( args ); - - var fragment, first, scripts, hasScripts, node, doc, - i = 0, - l = collection.length, - iNoClone = l - 1, - value = args[ 0 ], - valueIsFunction = isFunction( value ); - - // We can't cloneNode fragments that contain checked, in WebKit - if ( valueIsFunction || - ( l > 1 && typeof value === "string" && - !support.checkClone && rchecked.test( value ) ) ) { - return collection.each( function( index ) { - var self = collection.eq( index ); - if ( valueIsFunction ) { - args[ 0 ] = value.call( this, index, self.html() ); - } - domManip( self, args, callback, ignored ); - } ); - } - - if ( l ) { - fragment = buildFragment( args, collection[ 0 ].ownerDocument, false, collection, ignored ); - first = fragment.firstChild; - - if ( fragment.childNodes.length === 1 ) { - fragment = first; - } - - // Require either new content or an interest in ignored elements to invoke the callback - if ( first || ignored ) { - scripts = jQuery.map( getAll( fragment, "script" ), disableScript ); - hasScripts = scripts.length; - - // Use the original fragment for the last item - // instead of the first because it can end up - // being emptied incorrectly in certain situations (#8070). 
- for ( ; i < l; i++ ) { - node = fragment; - - if ( i !== iNoClone ) { - node = jQuery.clone( node, true, true ); - - // Keep references to cloned scripts for later restoration - if ( hasScripts ) { - - // Support: Android <=4.0 only, PhantomJS 1 only - // push.apply(_, arraylike) throws on ancient WebKit - jQuery.merge( scripts, getAll( node, "script" ) ); - } - } - - callback.call( collection[ i ], node, i ); - } - - if ( hasScripts ) { - doc = scripts[ scripts.length - 1 ].ownerDocument; - - // Reenable scripts - jQuery.map( scripts, restoreScript ); - - // Evaluate executable scripts on first document insertion - for ( i = 0; i < hasScripts; i++ ) { - node = scripts[ i ]; - if ( rscriptType.test( node.type || "" ) && - !dataPriv.access( node, "globalEval" ) && - jQuery.contains( doc, node ) ) { - - if ( node.src && ( node.type || "" ).toLowerCase() !== "module" ) { - - // Optional AJAX dependency, but won't run scripts if not present - if ( jQuery._evalUrl && !node.noModule ) { - jQuery._evalUrl( node.src, { - nonce: node.nonce || node.getAttribute( "nonce" ) - }, doc ); - } - } else { - DOMEval( node.textContent.replace( rcleanScript, "" ), node, doc ); - } - } - } - } - } - } - - return collection; -} - -function remove( elem, selector, keepData ) { - var node, - nodes = selector ? 
jQuery.filter( selector, elem ) : elem, - i = 0; - - for ( ; ( node = nodes[ i ] ) != null; i++ ) { - if ( !keepData && node.nodeType === 1 ) { - jQuery.cleanData( getAll( node ) ); - } - - if ( node.parentNode ) { - if ( keepData && isAttached( node ) ) { - setGlobalEval( getAll( node, "script" ) ); - } - node.parentNode.removeChild( node ); - } - } - - return elem; -} - -jQuery.extend( { - htmlPrefilter: function( html ) { - return html; - }, - - clone: function( elem, dataAndEvents, deepDataAndEvents ) { - var i, l, srcElements, destElements, - clone = elem.cloneNode( true ), - inPage = isAttached( elem ); - - // Fix IE cloning issues - if ( !support.noCloneChecked && ( elem.nodeType === 1 || elem.nodeType === 11 ) && - !jQuery.isXMLDoc( elem ) ) { - - // We eschew Sizzle here for performance reasons: https://jsperf.com/getall-vs-sizzle/2 - destElements = getAll( clone ); - srcElements = getAll( elem ); - - for ( i = 0, l = srcElements.length; i < l; i++ ) { - fixInput( srcElements[ i ], destElements[ i ] ); - } - } - - // Copy the events from the original to the clone - if ( dataAndEvents ) { - if ( deepDataAndEvents ) { - srcElements = srcElements || getAll( elem ); - destElements = destElements || getAll( clone ); - - for ( i = 0, l = srcElements.length; i < l; i++ ) { - cloneCopyEvent( srcElements[ i ], destElements[ i ] ); - } - } else { - cloneCopyEvent( elem, clone ); - } - } - - // Preserve script evaluation history - destElements = getAll( clone, "script" ); - if ( destElements.length > 0 ) { - setGlobalEval( destElements, !inPage && getAll( elem, "script" ) ); - } - - // Return the cloned set - return clone; - }, - - cleanData: function( elems ) { - var data, elem, type, - special = jQuery.event.special, - i = 0; - - for ( ; ( elem = elems[ i ] ) !== undefined; i++ ) { - if ( acceptData( elem ) ) { - if ( ( data = elem[ dataPriv.expando ] ) ) { - if ( data.events ) { - for ( type in data.events ) { - if ( special[ type ] ) { - jQuery.event.remove( 
elem, type ); - - // This is a shortcut to avoid jQuery.event.remove's overhead - } else { - jQuery.removeEvent( elem, type, data.handle ); - } - } - } - - // Support: Chrome <=35 - 45+ - // Assign undefined instead of using delete, see Data#remove - elem[ dataPriv.expando ] = undefined; - } - if ( elem[ dataUser.expando ] ) { - - // Support: Chrome <=35 - 45+ - // Assign undefined instead of using delete, see Data#remove - elem[ dataUser.expando ] = undefined; - } - } - } - } -} ); - -jQuery.fn.extend( { - detach: function( selector ) { - return remove( this, selector, true ); - }, - - remove: function( selector ) { - return remove( this, selector ); - }, - - text: function( value ) { - return access( this, function( value ) { - return value === undefined ? - jQuery.text( this ) : - this.empty().each( function() { - if ( this.nodeType === 1 || this.nodeType === 11 || this.nodeType === 9 ) { - this.textContent = value; - } - } ); - }, null, value, arguments.length ); - }, - - append: function() { - return domManip( this, arguments, function( elem ) { - if ( this.nodeType === 1 || this.nodeType === 11 || this.nodeType === 9 ) { - var target = manipulationTarget( this, elem ); - target.appendChild( elem ); - } - } ); - }, - - prepend: function() { - return domManip( this, arguments, function( elem ) { - if ( this.nodeType === 1 || this.nodeType === 11 || this.nodeType === 9 ) { - var target = manipulationTarget( this, elem ); - target.insertBefore( elem, target.firstChild ); - } - } ); - }, - - before: function() { - return domManip( this, arguments, function( elem ) { - if ( this.parentNode ) { - this.parentNode.insertBefore( elem, this ); - } - } ); - }, - - after: function() { - return domManip( this, arguments, function( elem ) { - if ( this.parentNode ) { - this.parentNode.insertBefore( elem, this.nextSibling ); - } - } ); - }, - - empty: function() { - var elem, - i = 0; - - for ( ; ( elem = this[ i ] ) != null; i++ ) { - if ( elem.nodeType === 1 ) { - - // 
Prevent memory leaks - jQuery.cleanData( getAll( elem, false ) ); - - // Remove any remaining nodes - elem.textContent = ""; - } - } - - return this; - }, - - clone: function( dataAndEvents, deepDataAndEvents ) { - dataAndEvents = dataAndEvents == null ? false : dataAndEvents; - deepDataAndEvents = deepDataAndEvents == null ? dataAndEvents : deepDataAndEvents; - - return this.map( function() { - return jQuery.clone( this, dataAndEvents, deepDataAndEvents ); - } ); - }, - - html: function( value ) { - return access( this, function( value ) { - var elem = this[ 0 ] || {}, - i = 0, - l = this.length; - - if ( value === undefined && elem.nodeType === 1 ) { - return elem.innerHTML; - } - - // See if we can take a shortcut and just use innerHTML - if ( typeof value === "string" && !rnoInnerhtml.test( value ) && - !wrapMap[ ( rtagName.exec( value ) || [ "", "" ] )[ 1 ].toLowerCase() ] ) { - - value = jQuery.htmlPrefilter( value ); - - try { - for ( ; i < l; i++ ) { - elem = this[ i ] || {}; - - // Remove element nodes and prevent memory leaks - if ( elem.nodeType === 1 ) { - jQuery.cleanData( getAll( elem, false ) ); - elem.innerHTML = value; - } - } - - elem = 0; - - // If using innerHTML throws an exception, use the fallback method - } catch ( e ) {} - } - - if ( elem ) { - this.empty().append( value ); - } - }, null, value, arguments.length ); - }, - - replaceWith: function() { - var ignored = []; - - // Make the changes, replacing each non-ignored context element with the new content - return domManip( this, arguments, function( elem ) { - var parent = this.parentNode; - - if ( jQuery.inArray( this, ignored ) < 0 ) { - jQuery.cleanData( getAll( this ) ); - if ( parent ) { - parent.replaceChild( elem, this ); - } - } - - // Force callback invocation - }, ignored ); - } -} ); - -jQuery.each( { - appendTo: "append", - prependTo: "prepend", - insertBefore: "before", - insertAfter: "after", - replaceAll: "replaceWith" -}, function( name, original ) { - jQuery.fn[ name ] = 
function( selector ) { - var elems, - ret = [], - insert = jQuery( selector ), - last = insert.length - 1, - i = 0; - - for ( ; i <= last; i++ ) { - elems = i === last ? this : this.clone( true ); - jQuery( insert[ i ] )[ original ]( elems ); - - // Support: Android <=4.0 only, PhantomJS 1 only - // .get() because push.apply(_, arraylike) throws on ancient WebKit - push.apply( ret, elems.get() ); - } - - return this.pushStack( ret ); - }; -} ); -var rnumnonpx = new RegExp( "^(" + pnum + ")(?!px)[a-z%]+$", "i" ); - -var getStyles = function( elem ) { - - // Support: IE <=11 only, Firefox <=30 (#15098, #14150) - // IE throws on elements created in popups - // FF meanwhile throws on frame elements through "defaultView.getComputedStyle" - var view = elem.ownerDocument.defaultView; - - if ( !view || !view.opener ) { - view = window; - } - - return view.getComputedStyle( elem ); - }; - -var swap = function( elem, options, callback ) { - var ret, name, - old = {}; - - // Remember the old values, and insert the new ones - for ( name in options ) { - old[ name ] = elem.style[ name ]; - elem.style[ name ] = options[ name ]; - } - - ret = callback.call( elem ); - - // Revert the old values - for ( name in options ) { - elem.style[ name ] = old[ name ]; - } - - return ret; -}; - - -var rboxStyle = new RegExp( cssExpand.join( "|" ), "i" ); - - - -( function() { - - // Executing both pixelPosition & boxSizingReliable tests require only one layout - // so they're executed at the same time to save the second computation. 
- function computeStyleTests() { - - // This is a singleton, we need to execute it only once - if ( !div ) { - return; - } - - container.style.cssText = "position:absolute;left:-11111px;width:60px;" + - "margin-top:1px;padding:0;border:0"; - div.style.cssText = - "position:relative;display:block;box-sizing:border-box;overflow:scroll;" + - "margin:auto;border:1px;padding:1px;" + - "width:60%;top:1%"; - documentElement.appendChild( container ).appendChild( div ); - - var divStyle = window.getComputedStyle( div ); - pixelPositionVal = divStyle.top !== "1%"; - - // Support: Android 4.0 - 4.3 only, Firefox <=3 - 44 - reliableMarginLeftVal = roundPixelMeasures( divStyle.marginLeft ) === 12; - - // Support: Android 4.0 - 4.3 only, Safari <=9.1 - 10.1, iOS <=7.0 - 9.3 - // Some styles come back with percentage values, even though they shouldn't - div.style.right = "60%"; - pixelBoxStylesVal = roundPixelMeasures( divStyle.right ) === 36; - - // Support: IE 9 - 11 only - // Detect misreporting of content dimensions for box-sizing:border-box elements - boxSizingReliableVal = roundPixelMeasures( divStyle.width ) === 36; - - // Support: IE 9 only - // Detect overflow:scroll screwiness (gh-3699) - // Support: Chrome <=64 - // Don't get tricked when zoom affects offsetWidth (gh-4029) - div.style.position = "absolute"; - scrollboxSizeVal = roundPixelMeasures( div.offsetWidth / 3 ) === 12; - - documentElement.removeChild( container ); - - // Nullify the div so it wouldn't be stored in the memory and - // it will also be a sign that checks already performed - div = null; - } - - function roundPixelMeasures( measure ) { - return Math.round( parseFloat( measure ) ); - } - - var pixelPositionVal, boxSizingReliableVal, scrollboxSizeVal, pixelBoxStylesVal, - reliableTrDimensionsVal, reliableMarginLeftVal, - container = document.createElement( "div" ), - div = document.createElement( "div" ); - - // Finish early in limited (non-browser) environments - if ( !div.style ) { - return; - } - - 
// Support: IE <=9 - 11 only - // Style of cloned element affects source element cloned (#8908) - div.style.backgroundClip = "content-box"; - div.cloneNode( true ).style.backgroundClip = ""; - support.clearCloneStyle = div.style.backgroundClip === "content-box"; - - jQuery.extend( support, { - boxSizingReliable: function() { - computeStyleTests(); - return boxSizingReliableVal; - }, - pixelBoxStyles: function() { - computeStyleTests(); - return pixelBoxStylesVal; - }, - pixelPosition: function() { - computeStyleTests(); - return pixelPositionVal; - }, - reliableMarginLeft: function() { - computeStyleTests(); - return reliableMarginLeftVal; - }, - scrollboxSize: function() { - computeStyleTests(); - return scrollboxSizeVal; - }, - - // Support: IE 9 - 11+, Edge 15 - 18+ - // IE/Edge misreport `getComputedStyle` of table rows with width/height - // set in CSS while `offset*` properties report correct values. - // Behavior in IE 9 is more subtle than in newer versions & it passes - // some versions of this test; make sure not to make it pass there! 
- reliableTrDimensions: function() { - var table, tr, trChild, trStyle; - if ( reliableTrDimensionsVal == null ) { - table = document.createElement( "table" ); - tr = document.createElement( "tr" ); - trChild = document.createElement( "div" ); - - table.style.cssText = "position:absolute;left:-11111px"; - tr.style.height = "1px"; - trChild.style.height = "9px"; - - documentElement - .appendChild( table ) - .appendChild( tr ) - .appendChild( trChild ); - - trStyle = window.getComputedStyle( tr ); - reliableTrDimensionsVal = parseInt( trStyle.height ) > 3; - - documentElement.removeChild( table ); - } - return reliableTrDimensionsVal; - } - } ); -} )(); - - -function curCSS( elem, name, computed ) { - var width, minWidth, maxWidth, ret, - - // Support: Firefox 51+ - // Retrieving style before computed somehow - // fixes an issue with getting wrong values - // on detached elements - style = elem.style; - - computed = computed || getStyles( elem ); - - // getPropertyValue is needed for: - // .css('filter') (IE 9 only, #12537) - // .css('--customProperty) (#3144) - if ( computed ) { - ret = computed.getPropertyValue( name ) || computed[ name ]; - - if ( ret === "" && !isAttached( elem ) ) { - ret = jQuery.style( elem, name ); - } - - // A tribute to the "awesome hack by Dean Edwards" - // Android Browser returns percentage for some values, - // but width seems to be reliably pixels. - // This is against the CSSOM draft spec: - // https://drafts.csswg.org/cssom/#resolved-values - if ( !support.pixelBoxStyles() && rnumnonpx.test( ret ) && rboxStyle.test( name ) ) { - - // Remember the original values - width = style.width; - minWidth = style.minWidth; - maxWidth = style.maxWidth; - - // Put in the new values to get a computed value out - style.minWidth = style.maxWidth = style.width = ret; - ret = computed.width; - - // Revert the changed values - style.width = width; - style.minWidth = minWidth; - style.maxWidth = maxWidth; - } - } - - return ret !== undefined ? 
- - // Support: IE <=9 - 11 only - // IE returns zIndex value as an integer. - ret + "" : - ret; -} - - -function addGetHookIf( conditionFn, hookFn ) { - - // Define the hook, we'll check on the first run if it's really needed. - return { - get: function() { - if ( conditionFn() ) { - - // Hook not needed (or it's not possible to use it due - // to missing dependency), remove it. - delete this.get; - return; - } - - // Hook needed; redefine it so that the support test is not executed again. - return ( this.get = hookFn ).apply( this, arguments ); - } - }; -} - - -var cssPrefixes = [ "Webkit", "Moz", "ms" ], - emptyStyle = document.createElement( "div" ).style, - vendorProps = {}; - -// Return a vendor-prefixed property or undefined -function vendorPropName( name ) { - - // Check for vendor prefixed names - var capName = name[ 0 ].toUpperCase() + name.slice( 1 ), - i = cssPrefixes.length; - - while ( i-- ) { - name = cssPrefixes[ i ] + capName; - if ( name in emptyStyle ) { - return name; - } - } -} - -// Return a potentially-mapped jQuery.cssProps or vendor prefixed property -function finalPropName( name ) { - var final = jQuery.cssProps[ name ] || vendorProps[ name ]; - - if ( final ) { - return final; - } - if ( name in emptyStyle ) { - return name; - } - return vendorProps[ name ] = vendorPropName( name ) || name; -} - - -var - - // Swappable if display is none or starts with table - // except "table", "table-cell", or "table-caption" - // See here for display values: https://developer.mozilla.org/en-US/docs/CSS/display - rdisplayswap = /^(none|table(?!-c[ea]).+)/, - rcustomProp = /^--/, - cssShow = { position: "absolute", visibility: "hidden", display: "block" }, - cssNormalTransform = { - letterSpacing: "0", - fontWeight: "400" - }; - -function setPositiveNumber( _elem, value, subtract ) { - - // Any relative (+/-) values have already been - // normalized at this point - var matches = rcssNum.exec( value ); - return matches ? 
- - // Guard against undefined "subtract", e.g., when used as in cssHooks - Math.max( 0, matches[ 2 ] - ( subtract || 0 ) ) + ( matches[ 3 ] || "px" ) : - value; -} - -function boxModelAdjustment( elem, dimension, box, isBorderBox, styles, computedVal ) { - var i = dimension === "width" ? 1 : 0, - extra = 0, - delta = 0; - - // Adjustment may not be necessary - if ( box === ( isBorderBox ? "border" : "content" ) ) { - return 0; - } - - for ( ; i < 4; i += 2 ) { - - // Both box models exclude margin - if ( box === "margin" ) { - delta += jQuery.css( elem, box + cssExpand[ i ], true, styles ); - } - - // If we get here with a content-box, we're seeking "padding" or "border" or "margin" - if ( !isBorderBox ) { - - // Add padding - delta += jQuery.css( elem, "padding" + cssExpand[ i ], true, styles ); - - // For "border" or "margin", add border - if ( box !== "padding" ) { - delta += jQuery.css( elem, "border" + cssExpand[ i ] + "Width", true, styles ); - - // But still keep track of it otherwise - } else { - extra += jQuery.css( elem, "border" + cssExpand[ i ] + "Width", true, styles ); - } - - // If we get here with a border-box (content + padding + border), we're seeking "content" or - // "padding" or "margin" - } else { - - // For "content", subtract padding - if ( box === "content" ) { - delta -= jQuery.css( elem, "padding" + cssExpand[ i ], true, styles ); - } - - // For "content" or "padding", subtract border - if ( box !== "margin" ) { - delta -= jQuery.css( elem, "border" + cssExpand[ i ] + "Width", true, styles ); - } - } - } - - // Account for positive content-box scroll gutter when requested by providing computedVal - if ( !isBorderBox && computedVal >= 0 ) { - - // offsetWidth/offsetHeight is a rounded sum of content, padding, scroll gutter, and border - // Assuming integer scroll gutter, subtract the rest and round down - delta += Math.max( 0, Math.ceil( - elem[ "offset" + dimension[ 0 ].toUpperCase() + dimension.slice( 1 ) ] - - computedVal - - delta - - 
extra - - 0.5 - - // If offsetWidth/offsetHeight is unknown, then we can't determine content-box scroll gutter - // Use an explicit zero to avoid NaN (gh-3964) - ) ) || 0; - } - - return delta; -} - -function getWidthOrHeight( elem, dimension, extra ) { - - // Start with computed style - var styles = getStyles( elem ), - - // To avoid forcing a reflow, only fetch boxSizing if we need it (gh-4322). - // Fake content-box until we know it's needed to know the true value. - boxSizingNeeded = !support.boxSizingReliable() || extra, - isBorderBox = boxSizingNeeded && - jQuery.css( elem, "boxSizing", false, styles ) === "border-box", - valueIsBorderBox = isBorderBox, - - val = curCSS( elem, dimension, styles ), - offsetProp = "offset" + dimension[ 0 ].toUpperCase() + dimension.slice( 1 ); - - // Support: Firefox <=54 - // Return a confounding non-pixel value or feign ignorance, as appropriate. - if ( rnumnonpx.test( val ) ) { - if ( !extra ) { - return val; - } - val = "auto"; - } - - - // Support: IE 9 - 11 only - // Use offsetWidth/offsetHeight for when box sizing is unreliable. - // In those cases, the computed value can be trusted to be border-box. - if ( ( !support.boxSizingReliable() && isBorderBox || - - // Support: IE 10 - 11+, Edge 15 - 18+ - // IE/Edge misreport `getComputedStyle` of table rows with width/height - // set in CSS while `offset*` properties report correct values. - // Interestingly, in some cases IE 9 doesn't suffer from this issue. 
- !support.reliableTrDimensions() && nodeName( elem, "tr" ) || - - // Fall back to offsetWidth/offsetHeight when value is "auto" - // This happens for inline elements with no explicit setting (gh-3571) - val === "auto" || - - // Support: Android <=4.1 - 4.3 only - // Also use offsetWidth/offsetHeight for misreported inline dimensions (gh-3602) - !parseFloat( val ) && jQuery.css( elem, "display", false, styles ) === "inline" ) && - - // Make sure the element is visible & connected - elem.getClientRects().length ) { - - isBorderBox = jQuery.css( elem, "boxSizing", false, styles ) === "border-box"; - - // Where available, offsetWidth/offsetHeight approximate border box dimensions. - // Where not available (e.g., SVG), assume unreliable box-sizing and interpret the - // retrieved value as a content box dimension. - valueIsBorderBox = offsetProp in elem; - if ( valueIsBorderBox ) { - val = elem[ offsetProp ]; - } - } - - // Normalize "" and auto - val = parseFloat( val ) || 0; - - // Adjust for the element's box model - return ( val + - boxModelAdjustment( - elem, - dimension, - extra || ( isBorderBox ? "border" : "content" ), - valueIsBorderBox, - styles, - - // Provide the current computed size to request scroll gutter calculation (gh-3589) - val - ) - ) + "px"; -} - -jQuery.extend( { - - // Add in style property hooks for overriding the default - // behavior of getting and setting a style property - cssHooks: { - opacity: { - get: function( elem, computed ) { - if ( computed ) { - - // We should always get a number back from opacity - var ret = curCSS( elem, "opacity" ); - return ret === "" ? 
"1" : ret; - } - } - } - }, - - // Don't automatically add "px" to these possibly-unitless properties - cssNumber: { - "animationIterationCount": true, - "columnCount": true, - "fillOpacity": true, - "flexGrow": true, - "flexShrink": true, - "fontWeight": true, - "gridArea": true, - "gridColumn": true, - "gridColumnEnd": true, - "gridColumnStart": true, - "gridRow": true, - "gridRowEnd": true, - "gridRowStart": true, - "lineHeight": true, - "opacity": true, - "order": true, - "orphans": true, - "widows": true, - "zIndex": true, - "zoom": true - }, - - // Add in properties whose names you wish to fix before - // setting or getting the value - cssProps: {}, - - // Get and set the style property on a DOM Node - style: function( elem, name, value, extra ) { - - // Don't set styles on text and comment nodes - if ( !elem || elem.nodeType === 3 || elem.nodeType === 8 || !elem.style ) { - return; - } - - // Make sure that we're working with the right name - var ret, type, hooks, - origName = camelCase( name ), - isCustomProp = rcustomProp.test( name ), - style = elem.style; - - // Make sure that we're working with the right name. We don't - // want to query the value if it is a CSS custom property - // since they are user-defined. 
- if ( !isCustomProp ) { - name = finalPropName( origName ); - } - - // Gets hook for the prefixed version, then unprefixed version - hooks = jQuery.cssHooks[ name ] || jQuery.cssHooks[ origName ]; - - // Check if we're setting a value - if ( value !== undefined ) { - type = typeof value; - - // Convert "+=" or "-=" to relative numbers (#7345) - if ( type === "string" && ( ret = rcssNum.exec( value ) ) && ret[ 1 ] ) { - value = adjustCSS( elem, name, ret ); - - // Fixes bug #9237 - type = "number"; - } - - // Make sure that null and NaN values aren't set (#7116) - if ( value == null || value !== value ) { - return; - } - - // If a number was passed in, add the unit (except for certain CSS properties) - // The isCustomProp check can be removed in jQuery 4.0 when we only auto-append - // "px" to a few hardcoded values. - if ( type === "number" && !isCustomProp ) { - value += ret && ret[ 3 ] || ( jQuery.cssNumber[ origName ] ? "" : "px" ); - } - - // background-* props affect original clone's values - if ( !support.clearCloneStyle && value === "" && name.indexOf( "background" ) === 0 ) { - style[ name ] = "inherit"; - } - - // If a hook was provided, use that value, otherwise just set the specified value - if ( !hooks || !( "set" in hooks ) || - ( value = hooks.set( elem, value, extra ) ) !== undefined ) { - - if ( isCustomProp ) { - style.setProperty( name, value ); - } else { - style[ name ] = value; - } - } - - } else { - - // If a hook was provided get the non-computed value from there - if ( hooks && "get" in hooks && - ( ret = hooks.get( elem, false, extra ) ) !== undefined ) { - - return ret; - } - - // Otherwise just get the value from the style object - return style[ name ]; - } - }, - - css: function( elem, name, extra, styles ) { - var val, num, hooks, - origName = camelCase( name ), - isCustomProp = rcustomProp.test( name ); - - // Make sure that we're working with the right name. 
We don't - // want to modify the value if it is a CSS custom property - // since they are user-defined. - if ( !isCustomProp ) { - name = finalPropName( origName ); - } - - // Try prefixed name followed by the unprefixed name - hooks = jQuery.cssHooks[ name ] || jQuery.cssHooks[ origName ]; - - // If a hook was provided get the computed value from there - if ( hooks && "get" in hooks ) { - val = hooks.get( elem, true, extra ); - } - - // Otherwise, if a way to get the computed value exists, use that - if ( val === undefined ) { - val = curCSS( elem, name, styles ); - } - - // Convert "normal" to computed value - if ( val === "normal" && name in cssNormalTransform ) { - val = cssNormalTransform[ name ]; - } - - // Make numeric if forced or a qualifier was provided and val looks numeric - if ( extra === "" || extra ) { - num = parseFloat( val ); - return extra === true || isFinite( num ) ? num || 0 : val; - } - - return val; - } -} ); - -jQuery.each( [ "height", "width" ], function( _i, dimension ) { - jQuery.cssHooks[ dimension ] = { - get: function( elem, computed, extra ) { - if ( computed ) { - - // Certain elements can have dimension info if we invisibly show them - // but it must have a current display style that would benefit - return rdisplayswap.test( jQuery.css( elem, "display" ) ) && - - // Support: Safari 8+ - // Table columns in Safari have non-zero offsetWidth & zero - // getBoundingClientRect().width unless display is changed. - // Support: IE <=11 only - // Running getBoundingClientRect on a disconnected node - // in IE throws an error. - ( !elem.getClientRects().length || !elem.getBoundingClientRect().width ) ? - swap( elem, cssShow, function() { - return getWidthOrHeight( elem, dimension, extra ); - } ) : - getWidthOrHeight( elem, dimension, extra ); - } - }, - - set: function( elem, value, extra ) { - var matches, - styles = getStyles( elem ), - - // Only read styles.position if the test has a chance to fail - // to avoid forcing a reflow. 
- scrollboxSizeBuggy = !support.scrollboxSize() && - styles.position === "absolute", - - // To avoid forcing a reflow, only fetch boxSizing if we need it (gh-3991) - boxSizingNeeded = scrollboxSizeBuggy || extra, - isBorderBox = boxSizingNeeded && - jQuery.css( elem, "boxSizing", false, styles ) === "border-box", - subtract = extra ? - boxModelAdjustment( - elem, - dimension, - extra, - isBorderBox, - styles - ) : - 0; - - // Account for unreliable border-box dimensions by comparing offset* to computed and - // faking a content-box to get border and padding (gh-3699) - if ( isBorderBox && scrollboxSizeBuggy ) { - subtract -= Math.ceil( - elem[ "offset" + dimension[ 0 ].toUpperCase() + dimension.slice( 1 ) ] - - parseFloat( styles[ dimension ] ) - - boxModelAdjustment( elem, dimension, "border", false, styles ) - - 0.5 - ); - } - - // Convert to pixels if value adjustment is needed - if ( subtract && ( matches = rcssNum.exec( value ) ) && - ( matches[ 3 ] || "px" ) !== "px" ) { - - elem.style[ dimension ] = value; - value = jQuery.css( elem, dimension ); - } - - return setPositiveNumber( elem, value, subtract ); - } - }; -} ); - -jQuery.cssHooks.marginLeft = addGetHookIf( support.reliableMarginLeft, - function( elem, computed ) { - if ( computed ) { - return ( parseFloat( curCSS( elem, "marginLeft" ) ) || - elem.getBoundingClientRect().left - - swap( elem, { marginLeft: 0 }, function() { - return elem.getBoundingClientRect().left; - } ) - ) + "px"; - } - } -); - -// These hooks are used by animate to expand properties -jQuery.each( { - margin: "", - padding: "", - border: "Width" -}, function( prefix, suffix ) { - jQuery.cssHooks[ prefix + suffix ] = { - expand: function( value ) { - var i = 0, - expanded = {}, - - // Assumes a single number if not a string - parts = typeof value === "string" ? 
value.split( " " ) : [ value ]; - - for ( ; i < 4; i++ ) { - expanded[ prefix + cssExpand[ i ] + suffix ] = - parts[ i ] || parts[ i - 2 ] || parts[ 0 ]; - } - - return expanded; - } - }; - - if ( prefix !== "margin" ) { - jQuery.cssHooks[ prefix + suffix ].set = setPositiveNumber; - } -} ); - -jQuery.fn.extend( { - css: function( name, value ) { - return access( this, function( elem, name, value ) { - var styles, len, - map = {}, - i = 0; - - if ( Array.isArray( name ) ) { - styles = getStyles( elem ); - len = name.length; - - for ( ; i < len; i++ ) { - map[ name[ i ] ] = jQuery.css( elem, name[ i ], false, styles ); - } - - return map; - } - - return value !== undefined ? - jQuery.style( elem, name, value ) : - jQuery.css( elem, name ); - }, name, value, arguments.length > 1 ); - } -} ); - - -function Tween( elem, options, prop, end, easing ) { - return new Tween.prototype.init( elem, options, prop, end, easing ); -} -jQuery.Tween = Tween; - -Tween.prototype = { - constructor: Tween, - init: function( elem, options, prop, end, easing, unit ) { - this.elem = elem; - this.prop = prop; - this.easing = easing || jQuery.easing._default; - this.options = options; - this.start = this.now = this.cur(); - this.end = end; - this.unit = unit || ( jQuery.cssNumber[ prop ] ? "" : "px" ); - }, - cur: function() { - var hooks = Tween.propHooks[ this.prop ]; - - return hooks && hooks.get ? 
- hooks.get( this ) : - Tween.propHooks._default.get( this ); - }, - run: function( percent ) { - var eased, - hooks = Tween.propHooks[ this.prop ]; - - if ( this.options.duration ) { - this.pos = eased = jQuery.easing[ this.easing ]( - percent, this.options.duration * percent, 0, 1, this.options.duration - ); - } else { - this.pos = eased = percent; - } - this.now = ( this.end - this.start ) * eased + this.start; - - if ( this.options.step ) { - this.options.step.call( this.elem, this.now, this ); - } - - if ( hooks && hooks.set ) { - hooks.set( this ); - } else { - Tween.propHooks._default.set( this ); - } - return this; - } -}; - -Tween.prototype.init.prototype = Tween.prototype; - -Tween.propHooks = { - _default: { - get: function( tween ) { - var result; - - // Use a property on the element directly when it is not a DOM element, - // or when there is no matching style property that exists. - if ( tween.elem.nodeType !== 1 || - tween.elem[ tween.prop ] != null && tween.elem.style[ tween.prop ] == null ) { - return tween.elem[ tween.prop ]; - } - - // Passing an empty string as a 3rd parameter to .css will automatically - // attempt a parseFloat and fallback to a string if the parse fails. - // Simple values such as "10px" are parsed to Float; - // complex values such as "rotate(1rad)" are returned as-is. - result = jQuery.css( tween.elem, tween.prop, "" ); - - // Empty strings, null, undefined and "auto" are converted to 0. - return !result || result === "auto" ? 0 : result; - }, - set: function( tween ) { - - // Use step hook for back compat. - // Use cssHook if its there. - // Use .style if available and use plain properties where available. 
- if ( jQuery.fx.step[ tween.prop ] ) { - jQuery.fx.step[ tween.prop ]( tween ); - } else if ( tween.elem.nodeType === 1 && ( - jQuery.cssHooks[ tween.prop ] || - tween.elem.style[ finalPropName( tween.prop ) ] != null ) ) { - jQuery.style( tween.elem, tween.prop, tween.now + tween.unit ); - } else { - tween.elem[ tween.prop ] = tween.now; - } - } - } -}; - -// Support: IE <=9 only -// Panic based approach to setting things on disconnected nodes -Tween.propHooks.scrollTop = Tween.propHooks.scrollLeft = { - set: function( tween ) { - if ( tween.elem.nodeType && tween.elem.parentNode ) { - tween.elem[ tween.prop ] = tween.now; - } - } -}; - -jQuery.easing = { - linear: function( p ) { - return p; - }, - swing: function( p ) { - return 0.5 - Math.cos( p * Math.PI ) / 2; - }, - _default: "swing" -}; - -jQuery.fx = Tween.prototype.init; - -// Back compat <1.8 extension point -jQuery.fx.step = {}; - - - - -var - fxNow, inProgress, - rfxtypes = /^(?:toggle|show|hide)$/, - rrun = /queueHooks$/; - -function schedule() { - if ( inProgress ) { - if ( document.hidden === false && window.requestAnimationFrame ) { - window.requestAnimationFrame( schedule ); - } else { - window.setTimeout( schedule, jQuery.fx.interval ); - } - - jQuery.fx.tick(); - } -} - -// Animations created synchronously will run synchronously -function createFxNow() { - window.setTimeout( function() { - fxNow = undefined; - } ); - return ( fxNow = Date.now() ); -} - -// Generate parameters to create a standard animation -function genFx( type, includeWidth ) { - var which, - i = 0, - attrs = { height: type }; - - // If we include width, step value is 1 to do all cssExpand values, - // otherwise step value is 2 to skip over Left and Right - includeWidth = includeWidth ? 
1 : 0; - for ( ; i < 4; i += 2 - includeWidth ) { - which = cssExpand[ i ]; - attrs[ "margin" + which ] = attrs[ "padding" + which ] = type; - } - - if ( includeWidth ) { - attrs.opacity = attrs.width = type; - } - - return attrs; -} - -function createTween( value, prop, animation ) { - var tween, - collection = ( Animation.tweeners[ prop ] || [] ).concat( Animation.tweeners[ "*" ] ), - index = 0, - length = collection.length; - for ( ; index < length; index++ ) { - if ( ( tween = collection[ index ].call( animation, prop, value ) ) ) { - - // We're done with this property - return tween; - } - } -} - -function defaultPrefilter( elem, props, opts ) { - var prop, value, toggle, hooks, oldfire, propTween, restoreDisplay, display, - isBox = "width" in props || "height" in props, - anim = this, - orig = {}, - style = elem.style, - hidden = elem.nodeType && isHiddenWithinTree( elem ), - dataShow = dataPriv.get( elem, "fxshow" ); - - // Queue-skipping animations hijack the fx hooks - if ( !opts.queue ) { - hooks = jQuery._queueHooks( elem, "fx" ); - if ( hooks.unqueued == null ) { - hooks.unqueued = 0; - oldfire = hooks.empty.fire; - hooks.empty.fire = function() { - if ( !hooks.unqueued ) { - oldfire(); - } - }; - } - hooks.unqueued++; - - anim.always( function() { - - // Ensure the complete handler is called before this completes - anim.always( function() { - hooks.unqueued--; - if ( !jQuery.queue( elem, "fx" ).length ) { - hooks.empty.fire(); - } - } ); - } ); - } - - // Detect show/hide animations - for ( prop in props ) { - value = props[ prop ]; - if ( rfxtypes.test( value ) ) { - delete props[ prop ]; - toggle = toggle || value === "toggle"; - if ( value === ( hidden ? 
"hide" : "show" ) ) { - - // Pretend to be hidden if this is a "show" and - // there is still data from a stopped show/hide - if ( value === "show" && dataShow && dataShow[ prop ] !== undefined ) { - hidden = true; - - // Ignore all other no-op show/hide data - } else { - continue; - } - } - orig[ prop ] = dataShow && dataShow[ prop ] || jQuery.style( elem, prop ); - } - } - - // Bail out if this is a no-op like .hide().hide() - propTween = !jQuery.isEmptyObject( props ); - if ( !propTween && jQuery.isEmptyObject( orig ) ) { - return; - } - - // Restrict "overflow" and "display" styles during box animations - if ( isBox && elem.nodeType === 1 ) { - - // Support: IE <=9 - 11, Edge 12 - 15 - // Record all 3 overflow attributes because IE does not infer the shorthand - // from identically-valued overflowX and overflowY and Edge just mirrors - // the overflowX value there. - opts.overflow = [ style.overflow, style.overflowX, style.overflowY ]; - - // Identify a display type, preferring old show/hide data over the CSS cascade - restoreDisplay = dataShow && dataShow.display; - if ( restoreDisplay == null ) { - restoreDisplay = dataPriv.get( elem, "display" ); - } - display = jQuery.css( elem, "display" ); - if ( display === "none" ) { - if ( restoreDisplay ) { - display = restoreDisplay; - } else { - - // Get nonempty value(s) by temporarily forcing visibility - showHide( [ elem ], true ); - restoreDisplay = elem.style.display || restoreDisplay; - display = jQuery.css( elem, "display" ); - showHide( [ elem ] ); - } - } - - // Animate inline elements as inline-block - if ( display === "inline" || display === "inline-block" && restoreDisplay != null ) { - if ( jQuery.css( elem, "float" ) === "none" ) { - - // Restore the original display value at the end of pure show/hide animations - if ( !propTween ) { - anim.done( function() { - style.display = restoreDisplay; - } ); - if ( restoreDisplay == null ) { - display = style.display; - restoreDisplay = display === "none" ? 
"" : display; - } - } - style.display = "inline-block"; - } - } - } - - if ( opts.overflow ) { - style.overflow = "hidden"; - anim.always( function() { - style.overflow = opts.overflow[ 0 ]; - style.overflowX = opts.overflow[ 1 ]; - style.overflowY = opts.overflow[ 2 ]; - } ); - } - - // Implement show/hide animations - propTween = false; - for ( prop in orig ) { - - // General show/hide setup for this element animation - if ( !propTween ) { - if ( dataShow ) { - if ( "hidden" in dataShow ) { - hidden = dataShow.hidden; - } - } else { - dataShow = dataPriv.access( elem, "fxshow", { display: restoreDisplay } ); - } - - // Store hidden/visible for toggle so `.stop().toggle()` "reverses" - if ( toggle ) { - dataShow.hidden = !hidden; - } - - // Show elements before animating them - if ( hidden ) { - showHide( [ elem ], true ); - } - - /* eslint-disable no-loop-func */ - - anim.done( function() { - - /* eslint-enable no-loop-func */ - - // The final step of a "hide" animation is actually hiding the element - if ( !hidden ) { - showHide( [ elem ] ); - } - dataPriv.remove( elem, "fxshow" ); - for ( prop in orig ) { - jQuery.style( elem, prop, orig[ prop ] ); - } - } ); - } - - // Per-property setup - propTween = createTween( hidden ? 
dataShow[ prop ] : 0, prop, anim ); - if ( !( prop in dataShow ) ) { - dataShow[ prop ] = propTween.start; - if ( hidden ) { - propTween.end = propTween.start; - propTween.start = 0; - } - } - } -} - -function propFilter( props, specialEasing ) { - var index, name, easing, value, hooks; - - // camelCase, specialEasing and expand cssHook pass - for ( index in props ) { - name = camelCase( index ); - easing = specialEasing[ name ]; - value = props[ index ]; - if ( Array.isArray( value ) ) { - easing = value[ 1 ]; - value = props[ index ] = value[ 0 ]; - } - - if ( index !== name ) { - props[ name ] = value; - delete props[ index ]; - } - - hooks = jQuery.cssHooks[ name ]; - if ( hooks && "expand" in hooks ) { - value = hooks.expand( value ); - delete props[ name ]; - - // Not quite $.extend, this won't overwrite existing keys. - // Reusing 'index' because we have the correct "name" - for ( index in value ) { - if ( !( index in props ) ) { - props[ index ] = value[ index ]; - specialEasing[ index ] = easing; - } - } - } else { - specialEasing[ name ] = easing; - } - } -} - -function Animation( elem, properties, options ) { - var result, - stopped, - index = 0, - length = Animation.prefilters.length, - deferred = jQuery.Deferred().always( function() { - - // Don't match elem in the :animated selector - delete tick.elem; - } ), - tick = function() { - if ( stopped ) { - return false; - } - var currentTime = fxNow || createFxNow(), - remaining = Math.max( 0, animation.startTime + animation.duration - currentTime ), - - // Support: Android 2.3 only - // Archaic crash bug won't allow us to use `1 - ( 0.5 || 0 )` (#12497) - temp = remaining / animation.duration || 0, - percent = 1 - temp, - index = 0, - length = animation.tweens.length; - - for ( ; index < length; index++ ) { - animation.tweens[ index ].run( percent ); - } - - deferred.notifyWith( elem, [ animation, percent, remaining ] ); - - // If there's more to do, yield - if ( percent < 1 && length ) { - return 
remaining; - } - - // If this was an empty animation, synthesize a final progress notification - if ( !length ) { - deferred.notifyWith( elem, [ animation, 1, 0 ] ); - } - - // Resolve the animation and report its conclusion - deferred.resolveWith( elem, [ animation ] ); - return false; - }, - animation = deferred.promise( { - elem: elem, - props: jQuery.extend( {}, properties ), - opts: jQuery.extend( true, { - specialEasing: {}, - easing: jQuery.easing._default - }, options ), - originalProperties: properties, - originalOptions: options, - startTime: fxNow || createFxNow(), - duration: options.duration, - tweens: [], - createTween: function( prop, end ) { - var tween = jQuery.Tween( elem, animation.opts, prop, end, - animation.opts.specialEasing[ prop ] || animation.opts.easing ); - animation.tweens.push( tween ); - return tween; - }, - stop: function( gotoEnd ) { - var index = 0, - - // If we are going to the end, we want to run all the tweens - // otherwise we skip this part - length = gotoEnd ? 
animation.tweens.length : 0; - if ( stopped ) { - return this; - } - stopped = true; - for ( ; index < length; index++ ) { - animation.tweens[ index ].run( 1 ); - } - - // Resolve when we played the last frame; otherwise, reject - if ( gotoEnd ) { - deferred.notifyWith( elem, [ animation, 1, 0 ] ); - deferred.resolveWith( elem, [ animation, gotoEnd ] ); - } else { - deferred.rejectWith( elem, [ animation, gotoEnd ] ); - } - return this; - } - } ), - props = animation.props; - - propFilter( props, animation.opts.specialEasing ); - - for ( ; index < length; index++ ) { - result = Animation.prefilters[ index ].call( animation, elem, props, animation.opts ); - if ( result ) { - if ( isFunction( result.stop ) ) { - jQuery._queueHooks( animation.elem, animation.opts.queue ).stop = - result.stop.bind( result ); - } - return result; - } - } - - jQuery.map( props, createTween, animation ); - - if ( isFunction( animation.opts.start ) ) { - animation.opts.start.call( elem, animation ); - } - - // Attach callbacks from options - animation - .progress( animation.opts.progress ) - .done( animation.opts.done, animation.opts.complete ) - .fail( animation.opts.fail ) - .always( animation.opts.always ); - - jQuery.fx.timer( - jQuery.extend( tick, { - elem: elem, - anim: animation, - queue: animation.opts.queue - } ) - ); - - return animation; -} - -jQuery.Animation = jQuery.extend( Animation, { - - tweeners: { - "*": [ function( prop, value ) { - var tween = this.createTween( prop, value ); - adjustCSS( tween.elem, prop, rcssNum.exec( value ), tween ); - return tween; - } ] - }, - - tweener: function( props, callback ) { - if ( isFunction( props ) ) { - callback = props; - props = [ "*" ]; - } else { - props = props.match( rnothtmlwhite ); - } - - var prop, - index = 0, - length = props.length; - - for ( ; index < length; index++ ) { - prop = props[ index ]; - Animation.tweeners[ prop ] = Animation.tweeners[ prop ] || []; - Animation.tweeners[ prop ].unshift( callback ); - } - }, - 
- prefilters: [ defaultPrefilter ], - - prefilter: function( callback, prepend ) { - if ( prepend ) { - Animation.prefilters.unshift( callback ); - } else { - Animation.prefilters.push( callback ); - } - } -} ); - -jQuery.speed = function( speed, easing, fn ) { - var opt = speed && typeof speed === "object" ? jQuery.extend( {}, speed ) : { - complete: fn || !fn && easing || - isFunction( speed ) && speed, - duration: speed, - easing: fn && easing || easing && !isFunction( easing ) && easing - }; - - // Go to the end state if fx are off - if ( jQuery.fx.off ) { - opt.duration = 0; - - } else { - if ( typeof opt.duration !== "number" ) { - if ( opt.duration in jQuery.fx.speeds ) { - opt.duration = jQuery.fx.speeds[ opt.duration ]; - - } else { - opt.duration = jQuery.fx.speeds._default; - } - } - } - - // Normalize opt.queue - true/undefined/null -> "fx" - if ( opt.queue == null || opt.queue === true ) { - opt.queue = "fx"; - } - - // Queueing - opt.old = opt.complete; - - opt.complete = function() { - if ( isFunction( opt.old ) ) { - opt.old.call( this ); - } - - if ( opt.queue ) { - jQuery.dequeue( this, opt.queue ); - } - }; - - return opt; -}; - -jQuery.fn.extend( { - fadeTo: function( speed, to, easing, callback ) { - - // Show any hidden elements after setting opacity to 0 - return this.filter( isHiddenWithinTree ).css( "opacity", 0 ).show() - - // Animate to the value specified - .end().animate( { opacity: to }, speed, easing, callback ); - }, - animate: function( prop, speed, easing, callback ) { - var empty = jQuery.isEmptyObject( prop ), - optall = jQuery.speed( speed, easing, callback ), - doAnimation = function() { - - // Operate on a copy of prop so per-property easing won't be lost - var anim = Animation( this, jQuery.extend( {}, prop ), optall ); - - // Empty animations, or finishing resolves immediately - if ( empty || dataPriv.get( this, "finish" ) ) { - anim.stop( true ); - } - }; - doAnimation.finish = doAnimation; - - return empty || optall.queue 
=== false ? - this.each( doAnimation ) : - this.queue( optall.queue, doAnimation ); - }, - stop: function( type, clearQueue, gotoEnd ) { - var stopQueue = function( hooks ) { - var stop = hooks.stop; - delete hooks.stop; - stop( gotoEnd ); - }; - - if ( typeof type !== "string" ) { - gotoEnd = clearQueue; - clearQueue = type; - type = undefined; - } - if ( clearQueue ) { - this.queue( type || "fx", [] ); - } - - return this.each( function() { - var dequeue = true, - index = type != null && type + "queueHooks", - timers = jQuery.timers, - data = dataPriv.get( this ); - - if ( index ) { - if ( data[ index ] && data[ index ].stop ) { - stopQueue( data[ index ] ); - } - } else { - for ( index in data ) { - if ( data[ index ] && data[ index ].stop && rrun.test( index ) ) { - stopQueue( data[ index ] ); - } - } - } - - for ( index = timers.length; index--; ) { - if ( timers[ index ].elem === this && - ( type == null || timers[ index ].queue === type ) ) { - - timers[ index ].anim.stop( gotoEnd ); - dequeue = false; - timers.splice( index, 1 ); - } - } - - // Start the next in the queue if the last step wasn't forced. - // Timers currently will call their complete callbacks, which - // will dequeue but only if they were gotoEnd. - if ( dequeue || !gotoEnd ) { - jQuery.dequeue( this, type ); - } - } ); - }, - finish: function( type ) { - if ( type !== false ) { - type = type || "fx"; - } - return this.each( function() { - var index, - data = dataPriv.get( this ), - queue = data[ type + "queue" ], - hooks = data[ type + "queueHooks" ], - timers = jQuery.timers, - length = queue ? 
queue.length : 0; - - // Enable finishing flag on private data - data.finish = true; - - // Empty the queue first - jQuery.queue( this, type, [] ); - - if ( hooks && hooks.stop ) { - hooks.stop.call( this, true ); - } - - // Look for any active animations, and finish them - for ( index = timers.length; index--; ) { - if ( timers[ index ].elem === this && timers[ index ].queue === type ) { - timers[ index ].anim.stop( true ); - timers.splice( index, 1 ); - } - } - - // Look for any animations in the old queue and finish them - for ( index = 0; index < length; index++ ) { - if ( queue[ index ] && queue[ index ].finish ) { - queue[ index ].finish.call( this ); - } - } - - // Turn off finishing flag - delete data.finish; - } ); - } -} ); - -jQuery.each( [ "toggle", "show", "hide" ], function( _i, name ) { - var cssFn = jQuery.fn[ name ]; - jQuery.fn[ name ] = function( speed, easing, callback ) { - return speed == null || typeof speed === "boolean" ? - cssFn.apply( this, arguments ) : - this.animate( genFx( name, true ), speed, easing, callback ); - }; -} ); - -// Generate shortcuts for custom animations -jQuery.each( { - slideDown: genFx( "show" ), - slideUp: genFx( "hide" ), - slideToggle: genFx( "toggle" ), - fadeIn: { opacity: "show" }, - fadeOut: { opacity: "hide" }, - fadeToggle: { opacity: "toggle" } -}, function( name, props ) { - jQuery.fn[ name ] = function( speed, easing, callback ) { - return this.animate( props, speed, easing, callback ); - }; -} ); - -jQuery.timers = []; -jQuery.fx.tick = function() { - var timer, - i = 0, - timers = jQuery.timers; - - fxNow = Date.now(); - - for ( ; i < timers.length; i++ ) { - timer = timers[ i ]; - - // Run the timer and safely remove it when done (allowing for external removal) - if ( !timer() && timers[ i ] === timer ) { - timers.splice( i--, 1 ); - } - } - - if ( !timers.length ) { - jQuery.fx.stop(); - } - fxNow = undefined; -}; - -jQuery.fx.timer = function( timer ) { - jQuery.timers.push( timer ); - 
jQuery.fx.start(); -}; - -jQuery.fx.interval = 13; -jQuery.fx.start = function() { - if ( inProgress ) { - return; - } - - inProgress = true; - schedule(); -}; - -jQuery.fx.stop = function() { - inProgress = null; -}; - -jQuery.fx.speeds = { - slow: 600, - fast: 200, - - // Default speed - _default: 400 -}; - - -// Based off of the plugin by Clint Helfers, with permission. -// https://web.archive.org/web/20100324014747/http://blindsignals.com/index.php/2009/07/jquery-delay/ -jQuery.fn.delay = function( time, type ) { - time = jQuery.fx ? jQuery.fx.speeds[ time ] || time : time; - type = type || "fx"; - - return this.queue( type, function( next, hooks ) { - var timeout = window.setTimeout( next, time ); - hooks.stop = function() { - window.clearTimeout( timeout ); - }; - } ); -}; - - -( function() { - var input = document.createElement( "input" ), - select = document.createElement( "select" ), - opt = select.appendChild( document.createElement( "option" ) ); - - input.type = "checkbox"; - - // Support: Android <=4.3 only - // Default value for a checkbox should be "on" - support.checkOn = input.value !== ""; - - // Support: IE <=11 only - // Must access selectedIndex to make default options select - support.optSelected = opt.selected; - - // Support: IE <=11 only - // An input loses its value after becoming a radio - input = document.createElement( "input" ); - input.value = "t"; - input.type = "radio"; - support.radioValue = input.value === "t"; -} )(); - - -var boolHook, - attrHandle = jQuery.expr.attrHandle; - -jQuery.fn.extend( { - attr: function( name, value ) { - return access( this, jQuery.attr, name, value, arguments.length > 1 ); - }, - - removeAttr: function( name ) { - return this.each( function() { - jQuery.removeAttr( this, name ); - } ); - } -} ); - -jQuery.extend( { - attr: function( elem, name, value ) { - var ret, hooks, - nType = elem.nodeType; - - // Don't get/set attributes on text, comment and attribute nodes - if ( nType === 3 || nType === 8 || 
nType === 2 ) { - return; - } - - // Fallback to prop when attributes are not supported - if ( typeof elem.getAttribute === "undefined" ) { - return jQuery.prop( elem, name, value ); - } - - // Attribute hooks are determined by the lowercase version - // Grab necessary hook if one is defined - if ( nType !== 1 || !jQuery.isXMLDoc( elem ) ) { - hooks = jQuery.attrHooks[ name.toLowerCase() ] || - ( jQuery.expr.match.bool.test( name ) ? boolHook : undefined ); - } - - if ( value !== undefined ) { - if ( value === null ) { - jQuery.removeAttr( elem, name ); - return; - } - - if ( hooks && "set" in hooks && - ( ret = hooks.set( elem, value, name ) ) !== undefined ) { - return ret; - } - - elem.setAttribute( name, value + "" ); - return value; - } - - if ( hooks && "get" in hooks && ( ret = hooks.get( elem, name ) ) !== null ) { - return ret; - } - - ret = jQuery.find.attr( elem, name ); - - // Non-existent attributes return null, we normalize to undefined - return ret == null ? undefined : ret; - }, - - attrHooks: { - type: { - set: function( elem, value ) { - if ( !support.radioValue && value === "radio" && - nodeName( elem, "input" ) ) { - var val = elem.value; - elem.setAttribute( "type", value ); - if ( val ) { - elem.value = val; - } - return value; - } - } - } - }, - - removeAttr: function( elem, value ) { - var name, - i = 0, - - // Attribute names can contain non-HTML whitespace characters - // https://html.spec.whatwg.org/multipage/syntax.html#attributes-2 - attrNames = value && value.match( rnothtmlwhite ); - - if ( attrNames && elem.nodeType === 1 ) { - while ( ( name = attrNames[ i++ ] ) ) { - elem.removeAttribute( name ); - } - } - } -} ); - -// Hooks for boolean attributes -boolHook = { - set: function( elem, value, name ) { - if ( value === false ) { - - // Remove boolean attributes when set to false - jQuery.removeAttr( elem, name ); - } else { - elem.setAttribute( name, name ); - } - return name; - } -}; - -jQuery.each( 
jQuery.expr.match.bool.source.match( /\w+/g ), function( _i, name ) { - var getter = attrHandle[ name ] || jQuery.find.attr; - - attrHandle[ name ] = function( elem, name, isXML ) { - var ret, handle, - lowercaseName = name.toLowerCase(); - - if ( !isXML ) { - - // Avoid an infinite loop by temporarily removing this function from the getter - handle = attrHandle[ lowercaseName ]; - attrHandle[ lowercaseName ] = ret; - ret = getter( elem, name, isXML ) != null ? - lowercaseName : - null; - attrHandle[ lowercaseName ] = handle; - } - return ret; - }; -} ); - - - - -var rfocusable = /^(?:input|select|textarea|button)$/i, - rclickable = /^(?:a|area)$/i; - -jQuery.fn.extend( { - prop: function( name, value ) { - return access( this, jQuery.prop, name, value, arguments.length > 1 ); - }, - - removeProp: function( name ) { - return this.each( function() { - delete this[ jQuery.propFix[ name ] || name ]; - } ); - } -} ); - -jQuery.extend( { - prop: function( elem, name, value ) { - var ret, hooks, - nType = elem.nodeType; - - // Don't get/set properties on text, comment and attribute nodes - if ( nType === 3 || nType === 8 || nType === 2 ) { - return; - } - - if ( nType !== 1 || !jQuery.isXMLDoc( elem ) ) { - - // Fix name and attach hooks - name = jQuery.propFix[ name ] || name; - hooks = jQuery.propHooks[ name ]; - } - - if ( value !== undefined ) { - if ( hooks && "set" in hooks && - ( ret = hooks.set( elem, value, name ) ) !== undefined ) { - return ret; - } - - return ( elem[ name ] = value ); - } - - if ( hooks && "get" in hooks && ( ret = hooks.get( elem, name ) ) !== null ) { - return ret; - } - - return elem[ name ]; - }, - - propHooks: { - tabIndex: { - get: function( elem ) { - - // Support: IE <=9 - 11 only - // elem.tabIndex doesn't always return the - // correct value when it hasn't been explicitly set - // https://web.archive.org/web/20141116233347/http://fluidproject.org/blog/2008/01/09/getting-setting-and-removing-tabindex-values-with-javascript/ - // Use 
proper attribute retrieval(#12072) - var tabindex = jQuery.find.attr( elem, "tabindex" ); - - if ( tabindex ) { - return parseInt( tabindex, 10 ); - } - - if ( - rfocusable.test( elem.nodeName ) || - rclickable.test( elem.nodeName ) && - elem.href - ) { - return 0; - } - - return -1; - } - } - }, - - propFix: { - "for": "htmlFor", - "class": "className" - } -} ); - -// Support: IE <=11 only -// Accessing the selectedIndex property -// forces the browser to respect setting selected -// on the option -// The getter ensures a default option is selected -// when in an optgroup -// eslint rule "no-unused-expressions" is disabled for this code -// since it considers such accessions noop -if ( !support.optSelected ) { - jQuery.propHooks.selected = { - get: function( elem ) { - - /* eslint no-unused-expressions: "off" */ - - var parent = elem.parentNode; - if ( parent && parent.parentNode ) { - parent.parentNode.selectedIndex; - } - return null; - }, - set: function( elem ) { - - /* eslint no-unused-expressions: "off" */ - - var parent = elem.parentNode; - if ( parent ) { - parent.selectedIndex; - - if ( parent.parentNode ) { - parent.parentNode.selectedIndex; - } - } - } - }; -} - -jQuery.each( [ - "tabIndex", - "readOnly", - "maxLength", - "cellSpacing", - "cellPadding", - "rowSpan", - "colSpan", - "useMap", - "frameBorder", - "contentEditable" -], function() { - jQuery.propFix[ this.toLowerCase() ] = this; -} ); - - - - - // Strip and collapse whitespace according to HTML spec - // https://infra.spec.whatwg.org/#strip-and-collapse-ascii-whitespace - function stripAndCollapse( value ) { - var tokens = value.match( rnothtmlwhite ) || []; - return tokens.join( " " ); - } - - -function getClass( elem ) { - return elem.getAttribute && elem.getAttribute( "class" ) || ""; -} - -function classesToArray( value ) { - if ( Array.isArray( value ) ) { - return value; - } - if ( typeof value === "string" ) { - return value.match( rnothtmlwhite ) || []; - } - return []; -} - 
-jQuery.fn.extend( { - addClass: function( value ) { - var classes, elem, cur, curValue, clazz, j, finalValue, - i = 0; - - if ( isFunction( value ) ) { - return this.each( function( j ) { - jQuery( this ).addClass( value.call( this, j, getClass( this ) ) ); - } ); - } - - classes = classesToArray( value ); - - if ( classes.length ) { - while ( ( elem = this[ i++ ] ) ) { - curValue = getClass( elem ); - cur = elem.nodeType === 1 && ( " " + stripAndCollapse( curValue ) + " " ); - - if ( cur ) { - j = 0; - while ( ( clazz = classes[ j++ ] ) ) { - if ( cur.indexOf( " " + clazz + " " ) < 0 ) { - cur += clazz + " "; - } - } - - // Only assign if different to avoid unneeded rendering. - finalValue = stripAndCollapse( cur ); - if ( curValue !== finalValue ) { - elem.setAttribute( "class", finalValue ); - } - } - } - } - - return this; - }, - - removeClass: function( value ) { - var classes, elem, cur, curValue, clazz, j, finalValue, - i = 0; - - if ( isFunction( value ) ) { - return this.each( function( j ) { - jQuery( this ).removeClass( value.call( this, j, getClass( this ) ) ); - } ); - } - - if ( !arguments.length ) { - return this.attr( "class", "" ); - } - - classes = classesToArray( value ); - - if ( classes.length ) { - while ( ( elem = this[ i++ ] ) ) { - curValue = getClass( elem ); - - // This expression is here for better compressibility (see addClass) - cur = elem.nodeType === 1 && ( " " + stripAndCollapse( curValue ) + " " ); - - if ( cur ) { - j = 0; - while ( ( clazz = classes[ j++ ] ) ) { - - // Remove *all* instances - while ( cur.indexOf( " " + clazz + " " ) > -1 ) { - cur = cur.replace( " " + clazz + " ", " " ); - } - } - - // Only assign if different to avoid unneeded rendering. 
- finalValue = stripAndCollapse( cur ); - if ( curValue !== finalValue ) { - elem.setAttribute( "class", finalValue ); - } - } - } - } - - return this; - }, - - toggleClass: function( value, stateVal ) { - var type = typeof value, - isValidValue = type === "string" || Array.isArray( value ); - - if ( typeof stateVal === "boolean" && isValidValue ) { - return stateVal ? this.addClass( value ) : this.removeClass( value ); - } - - if ( isFunction( value ) ) { - return this.each( function( i ) { - jQuery( this ).toggleClass( - value.call( this, i, getClass( this ), stateVal ), - stateVal - ); - } ); - } - - return this.each( function() { - var className, i, self, classNames; - - if ( isValidValue ) { - - // Toggle individual class names - i = 0; - self = jQuery( this ); - classNames = classesToArray( value ); - - while ( ( className = classNames[ i++ ] ) ) { - - // Check each className given, space separated list - if ( self.hasClass( className ) ) { - self.removeClass( className ); - } else { - self.addClass( className ); - } - } - - // Toggle whole class name - } else if ( value === undefined || type === "boolean" ) { - className = getClass( this ); - if ( className ) { - - // Store className if set - dataPriv.set( this, "__className__", className ); - } - - // If the element has a class name or if we're passed `false`, - // then remove the whole classname (if there was one, the above saved it). - // Otherwise bring back whatever was previously saved (if anything), - // falling back to the empty string if nothing was stored. - if ( this.setAttribute ) { - this.setAttribute( "class", - className || value === false ? 
- "" : - dataPriv.get( this, "__className__" ) || "" - ); - } - } - } ); - }, - - hasClass: function( selector ) { - var className, elem, - i = 0; - - className = " " + selector + " "; - while ( ( elem = this[ i++ ] ) ) { - if ( elem.nodeType === 1 && - ( " " + stripAndCollapse( getClass( elem ) ) + " " ).indexOf( className ) > -1 ) { - return true; - } - } - - return false; - } -} ); - - - - -var rreturn = /\r/g; - -jQuery.fn.extend( { - val: function( value ) { - var hooks, ret, valueIsFunction, - elem = this[ 0 ]; - - if ( !arguments.length ) { - if ( elem ) { - hooks = jQuery.valHooks[ elem.type ] || - jQuery.valHooks[ elem.nodeName.toLowerCase() ]; - - if ( hooks && - "get" in hooks && - ( ret = hooks.get( elem, "value" ) ) !== undefined - ) { - return ret; - } - - ret = elem.value; - - // Handle most common string cases - if ( typeof ret === "string" ) { - return ret.replace( rreturn, "" ); - } - - // Handle cases where value is null/undef or number - return ret == null ? "" : ret; - } - - return; - } - - valueIsFunction = isFunction( value ); - - return this.each( function( i ) { - var val; - - if ( this.nodeType !== 1 ) { - return; - } - - if ( valueIsFunction ) { - val = value.call( this, i, jQuery( this ).val() ); - } else { - val = value; - } - - // Treat null/undefined as ""; convert numbers to string - if ( val == null ) { - val = ""; - - } else if ( typeof val === "number" ) { - val += ""; - - } else if ( Array.isArray( val ) ) { - val = jQuery.map( val, function( value ) { - return value == null ? "" : value + ""; - } ); - } - - hooks = jQuery.valHooks[ this.type ] || jQuery.valHooks[ this.nodeName.toLowerCase() ]; - - // If set returns undefined, fall back to normal setting - if ( !hooks || !( "set" in hooks ) || hooks.set( this, val, "value" ) === undefined ) { - this.value = val; - } - } ); - } -} ); - -jQuery.extend( { - valHooks: { - option: { - get: function( elem ) { - - var val = jQuery.find.attr( elem, "value" ); - return val != null ? 
- val : - - // Support: IE <=10 - 11 only - // option.text throws exceptions (#14686, #14858) - // Strip and collapse whitespace - // https://html.spec.whatwg.org/#strip-and-collapse-whitespace - stripAndCollapse( jQuery.text( elem ) ); - } - }, - select: { - get: function( elem ) { - var value, option, i, - options = elem.options, - index = elem.selectedIndex, - one = elem.type === "select-one", - values = one ? null : [], - max = one ? index + 1 : options.length; - - if ( index < 0 ) { - i = max; - - } else { - i = one ? index : 0; - } - - // Loop through all the selected options - for ( ; i < max; i++ ) { - option = options[ i ]; - - // Support: IE <=9 only - // IE8-9 doesn't update selected after form reset (#2551) - if ( ( option.selected || i === index ) && - - // Don't return options that are disabled or in a disabled optgroup - !option.disabled && - ( !option.parentNode.disabled || - !nodeName( option.parentNode, "optgroup" ) ) ) { - - // Get the specific value for the option - value = jQuery( option ).val(); - - // We don't need an array for one selects - if ( one ) { - return value; - } - - // Multi-Selects return an array - values.push( value ); - } - } - - return values; - }, - - set: function( elem, value ) { - var optionSet, option, - options = elem.options, - values = jQuery.makeArray( value ), - i = options.length; - - while ( i-- ) { - option = options[ i ]; - - /* eslint-disable no-cond-assign */ - - if ( option.selected = - jQuery.inArray( jQuery.valHooks.option.get( option ), values ) > -1 - ) { - optionSet = true; - } - - /* eslint-enable no-cond-assign */ - } - - // Force browsers to behave consistently when non-matching value is set - if ( !optionSet ) { - elem.selectedIndex = -1; - } - return values; - } - } - } -} ); - -// Radios and checkboxes getter/setter -jQuery.each( [ "radio", "checkbox" ], function() { - jQuery.valHooks[ this ] = { - set: function( elem, value ) { - if ( Array.isArray( value ) ) { - return ( elem.checked = 
jQuery.inArray( jQuery( elem ).val(), value ) > -1 ); - } - } - }; - if ( !support.checkOn ) { - jQuery.valHooks[ this ].get = function( elem ) { - return elem.getAttribute( "value" ) === null ? "on" : elem.value; - }; - } -} ); - - - - -// Return jQuery for attributes-only inclusion - - -support.focusin = "onfocusin" in window; - - -var rfocusMorph = /^(?:focusinfocus|focusoutblur)$/, - stopPropagationCallback = function( e ) { - e.stopPropagation(); - }; - -jQuery.extend( jQuery.event, { - - trigger: function( event, data, elem, onlyHandlers ) { - - var i, cur, tmp, bubbleType, ontype, handle, special, lastElement, - eventPath = [ elem || document ], - type = hasOwn.call( event, "type" ) ? event.type : event, - namespaces = hasOwn.call( event, "namespace" ) ? event.namespace.split( "." ) : []; - - cur = lastElement = tmp = elem = elem || document; - - // Don't do events on text and comment nodes - if ( elem.nodeType === 3 || elem.nodeType === 8 ) { - return; - } - - // focus/blur morphs to focusin/out; ensure we're not firing them right now - if ( rfocusMorph.test( type + jQuery.event.triggered ) ) { - return; - } - - if ( type.indexOf( "." ) > -1 ) { - - // Namespaced trigger; create a regexp to match event type in handle() - namespaces = type.split( "." ); - type = namespaces.shift(); - namespaces.sort(); - } - ontype = type.indexOf( ":" ) < 0 && "on" + type; - - // Caller can pass in a jQuery.Event object, Object, or just an event type string - event = event[ jQuery.expando ] ? - event : - new jQuery.Event( type, typeof event === "object" && event ); - - // Trigger bitmask: & 1 for native handlers; & 2 for jQuery (always true) - event.isTrigger = onlyHandlers ? 2 : 3; - event.namespace = namespaces.join( "." ); - event.rnamespace = event.namespace ? 
- new RegExp( "(^|\\.)" + namespaces.join( "\\.(?:.*\\.|)" ) + "(\\.|$)" ) : - null; - - // Clean up the event in case it is being reused - event.result = undefined; - if ( !event.target ) { - event.target = elem; - } - - // Clone any incoming data and prepend the event, creating the handler arg list - data = data == null ? - [ event ] : - jQuery.makeArray( data, [ event ] ); - - // Allow special events to draw outside the lines - special = jQuery.event.special[ type ] || {}; - if ( !onlyHandlers && special.trigger && special.trigger.apply( elem, data ) === false ) { - return; - } - - // Determine event propagation path in advance, per W3C events spec (#9951) - // Bubble up to document, then to window; watch for a global ownerDocument var (#9724) - if ( !onlyHandlers && !special.noBubble && !isWindow( elem ) ) { - - bubbleType = special.delegateType || type; - if ( !rfocusMorph.test( bubbleType + type ) ) { - cur = cur.parentNode; - } - for ( ; cur; cur = cur.parentNode ) { - eventPath.push( cur ); - tmp = cur; - } - - // Only add window if we got to document (e.g., not plain obj or detached DOM) - if ( tmp === ( elem.ownerDocument || document ) ) { - eventPath.push( tmp.defaultView || tmp.parentWindow || window ); - } - } - - // Fire handlers on the event path - i = 0; - while ( ( cur = eventPath[ i++ ] ) && !event.isPropagationStopped() ) { - lastElement = cur; - event.type = i > 1 ? 
- bubbleType : - special.bindType || type; - - // jQuery handler - handle = ( - dataPriv.get( cur, "events" ) || Object.create( null ) - )[ event.type ] && - dataPriv.get( cur, "handle" ); - if ( handle ) { - handle.apply( cur, data ); - } - - // Native handler - handle = ontype && cur[ ontype ]; - if ( handle && handle.apply && acceptData( cur ) ) { - event.result = handle.apply( cur, data ); - if ( event.result === false ) { - event.preventDefault(); - } - } - } - event.type = type; - - // If nobody prevented the default action, do it now - if ( !onlyHandlers && !event.isDefaultPrevented() ) { - - if ( ( !special._default || - special._default.apply( eventPath.pop(), data ) === false ) && - acceptData( elem ) ) { - - // Call a native DOM method on the target with the same name as the event. - // Don't do default actions on window, that's where global variables be (#6170) - if ( ontype && isFunction( elem[ type ] ) && !isWindow( elem ) ) { - - // Don't re-trigger an onFOO event when we call its FOO() method - tmp = elem[ ontype ]; - - if ( tmp ) { - elem[ ontype ] = null; - } - - // Prevent re-triggering of the same event, since we already bubbled it above - jQuery.event.triggered = type; - - if ( event.isPropagationStopped() ) { - lastElement.addEventListener( type, stopPropagationCallback ); - } - - elem[ type ](); - - if ( event.isPropagationStopped() ) { - lastElement.removeEventListener( type, stopPropagationCallback ); - } - - jQuery.event.triggered = undefined; - - if ( tmp ) { - elem[ ontype ] = tmp; - } - } - } - } - - return event.result; - }, - - // Piggyback on a donor event to simulate a different one - // Used only for `focus(in | out)` events - simulate: function( type, elem, event ) { - var e = jQuery.extend( - new jQuery.Event(), - event, - { - type: type, - isSimulated: true - } - ); - - jQuery.event.trigger( e, null, elem ); - } - -} ); - -jQuery.fn.extend( { - - trigger: function( type, data ) { - return this.each( function() { - 
jQuery.event.trigger( type, data, this ); - } ); - }, - triggerHandler: function( type, data ) { - var elem = this[ 0 ]; - if ( elem ) { - return jQuery.event.trigger( type, data, elem, true ); - } - } -} ); - - -// Support: Firefox <=44 -// Firefox doesn't have focus(in | out) events -// Related ticket - https://bugzilla.mozilla.org/show_bug.cgi?id=687787 -// -// Support: Chrome <=48 - 49, Safari <=9.0 - 9.1 -// focus(in | out) events fire after focus & blur events, -// which is spec violation - http://www.w3.org/TR/DOM-Level-3-Events/#events-focusevent-event-order -// Related ticket - https://bugs.chromium.org/p/chromium/issues/detail?id=449857 -if ( !support.focusin ) { - jQuery.each( { focus: "focusin", blur: "focusout" }, function( orig, fix ) { - - // Attach a single capturing handler on the document while someone wants focusin/focusout - var handler = function( event ) { - jQuery.event.simulate( fix, event.target, jQuery.event.fix( event ) ); - }; - - jQuery.event.special[ fix ] = { - setup: function() { - - // Handle: regular nodes (via `this.ownerDocument`), window - // (via `this.document`) & document (via `this`). 
- var doc = this.ownerDocument || this.document || this, - attaches = dataPriv.access( doc, fix ); - - if ( !attaches ) { - doc.addEventListener( orig, handler, true ); - } - dataPriv.access( doc, fix, ( attaches || 0 ) + 1 ); - }, - teardown: function() { - var doc = this.ownerDocument || this.document || this, - attaches = dataPriv.access( doc, fix ) - 1; - - if ( !attaches ) { - doc.removeEventListener( orig, handler, true ); - dataPriv.remove( doc, fix ); - - } else { - dataPriv.access( doc, fix, attaches ); - } - } - }; - } ); -} -var location = window.location; - -var nonce = { guid: Date.now() }; - -var rquery = ( /\?/ ); - - - -// Cross-browser xml parsing -jQuery.parseXML = function( data ) { - var xml; - if ( !data || typeof data !== "string" ) { - return null; - } - - // Support: IE 9 - 11 only - // IE throws on parseFromString with invalid input. - try { - xml = ( new window.DOMParser() ).parseFromString( data, "text/xml" ); - } catch ( e ) { - xml = undefined; - } - - if ( !xml || xml.getElementsByTagName( "parsererror" ).length ) { - jQuery.error( "Invalid XML: " + data ); - } - return xml; -}; - - -var - rbracket = /\[\]$/, - rCRLF = /\r?\n/g, - rsubmitterTypes = /^(?:submit|button|image|reset|file)$/i, - rsubmittable = /^(?:input|select|textarea|keygen)/i; - -function buildParams( prefix, obj, traditional, add ) { - var name; - - if ( Array.isArray( obj ) ) { - - // Serialize array item. - jQuery.each( obj, function( i, v ) { - if ( traditional || rbracket.test( prefix ) ) { - - // Treat each array item as a scalar. - add( prefix, v ); - - } else { - - // Item is non-scalar (array or object), encode its numeric index. - buildParams( - prefix + "[" + ( typeof v === "object" && v != null ? i : "" ) + "]", - v, - traditional, - add - ); - } - } ); - - } else if ( !traditional && toType( obj ) === "object" ) { - - // Serialize object item. 
- for ( name in obj ) { - buildParams( prefix + "[" + name + "]", obj[ name ], traditional, add ); - } - - } else { - - // Serialize scalar item. - add( prefix, obj ); - } -} - -// Serialize an array of form elements or a set of -// key/values into a query string -jQuery.param = function( a, traditional ) { - var prefix, - s = [], - add = function( key, valueOrFunction ) { - - // If value is a function, invoke it and use its return value - var value = isFunction( valueOrFunction ) ? - valueOrFunction() : - valueOrFunction; - - s[ s.length ] = encodeURIComponent( key ) + "=" + - encodeURIComponent( value == null ? "" : value ); - }; - - if ( a == null ) { - return ""; - } - - // If an array was passed in, assume that it is an array of form elements. - if ( Array.isArray( a ) || ( a.jquery && !jQuery.isPlainObject( a ) ) ) { - - // Serialize the form elements - jQuery.each( a, function() { - add( this.name, this.value ); - } ); - - } else { - - // If traditional, encode the "old" way (the way 1.3.2 or older - // did it), otherwise encode params recursively. - for ( prefix in a ) { - buildParams( prefix, a[ prefix ], traditional, add ); - } - } - - // Return the resulting serialization - return s.join( "&" ); -}; - -jQuery.fn.extend( { - serialize: function() { - return jQuery.param( this.serializeArray() ); - }, - serializeArray: function() { - return this.map( function() { - - // Can add propHook for "elements" to filter or add form elements - var elements = jQuery.prop( this, "elements" ); - return elements ? 
jQuery.makeArray( elements ) : this; - } ) - .filter( function() { - var type = this.type; - - // Use .is( ":disabled" ) so that fieldset[disabled] works - return this.name && !jQuery( this ).is( ":disabled" ) && - rsubmittable.test( this.nodeName ) && !rsubmitterTypes.test( type ) && - ( this.checked || !rcheckableType.test( type ) ); - } ) - .map( function( _i, elem ) { - var val = jQuery( this ).val(); - - if ( val == null ) { - return null; - } - - if ( Array.isArray( val ) ) { - return jQuery.map( val, function( val ) { - return { name: elem.name, value: val.replace( rCRLF, "\r\n" ) }; - } ); - } - - return { name: elem.name, value: val.replace( rCRLF, "\r\n" ) }; - } ).get(); - } -} ); - - -var - r20 = /%20/g, - rhash = /#.*$/, - rantiCache = /([?&])_=[^&]*/, - rheaders = /^(.*?):[ \t]*([^\r\n]*)$/mg, - - // #7653, #8125, #8152: local protocol detection - rlocalProtocol = /^(?:about|app|app-storage|.+-extension|file|res|widget):$/, - rnoContent = /^(?:GET|HEAD)$/, - rprotocol = /^\/\//, - - /* Prefilters - * 1) They are useful to introduce custom dataTypes (see ajax/jsonp.js for an example) - * 2) These are called: - * - BEFORE asking for a transport - * - AFTER param serialization (s.data is a string if s.processData is true) - * 3) key is the dataType - * 4) the catchall symbol "*" can be used - * 5) execution will start with transport dataType and THEN continue down to "*" if needed - */ - prefilters = {}, - - /* Transports bindings - * 1) key is the dataType - * 2) the catchall symbol "*" can be used - * 3) selection will start with transport dataType and THEN go to "*" if needed - */ - transports = {}, - - // Avoid comment-prolog char sequence (#10098); must appease lint and evade compression - allTypes = "*/".concat( "*" ), - - // Anchor tag for parsing the document origin - originAnchor = document.createElement( "a" ); - originAnchor.href = location.href; - -// Base "constructor" for jQuery.ajaxPrefilter and jQuery.ajaxTransport -function 
addToPrefiltersOrTransports( structure ) { - - // dataTypeExpression is optional and defaults to "*" - return function( dataTypeExpression, func ) { - - if ( typeof dataTypeExpression !== "string" ) { - func = dataTypeExpression; - dataTypeExpression = "*"; - } - - var dataType, - i = 0, - dataTypes = dataTypeExpression.toLowerCase().match( rnothtmlwhite ) || []; - - if ( isFunction( func ) ) { - - // For each dataType in the dataTypeExpression - while ( ( dataType = dataTypes[ i++ ] ) ) { - - // Prepend if requested - if ( dataType[ 0 ] === "+" ) { - dataType = dataType.slice( 1 ) || "*"; - ( structure[ dataType ] = structure[ dataType ] || [] ).unshift( func ); - - // Otherwise append - } else { - ( structure[ dataType ] = structure[ dataType ] || [] ).push( func ); - } - } - } - }; -} - -// Base inspection function for prefilters and transports -function inspectPrefiltersOrTransports( structure, options, originalOptions, jqXHR ) { - - var inspected = {}, - seekingTransport = ( structure === transports ); - - function inspect( dataType ) { - var selected; - inspected[ dataType ] = true; - jQuery.each( structure[ dataType ] || [], function( _, prefilterOrFactory ) { - var dataTypeOrTransport = prefilterOrFactory( options, originalOptions, jqXHR ); - if ( typeof dataTypeOrTransport === "string" && - !seekingTransport && !inspected[ dataTypeOrTransport ] ) { - - options.dataTypes.unshift( dataTypeOrTransport ); - inspect( dataTypeOrTransport ); - return false; - } else if ( seekingTransport ) { - return !( selected = dataTypeOrTransport ); - } - } ); - return selected; - } - - return inspect( options.dataTypes[ 0 ] ) || !inspected[ "*" ] && inspect( "*" ); -} - -// A special extend for ajax options -// that takes "flat" options (not to be deep extended) -// Fixes #9887 -function ajaxExtend( target, src ) { - var key, deep, - flatOptions = jQuery.ajaxSettings.flatOptions || {}; - - for ( key in src ) { - if ( src[ key ] !== undefined ) { - ( flatOptions[ key ] ? 
target : ( deep || ( deep = {} ) ) )[ key ] = src[ key ]; - } - } - if ( deep ) { - jQuery.extend( true, target, deep ); - } - - return target; -} - -/* Handles responses to an ajax request: - * - finds the right dataType (mediates between content-type and expected dataType) - * - returns the corresponding response - */ -function ajaxHandleResponses( s, jqXHR, responses ) { - - var ct, type, finalDataType, firstDataType, - contents = s.contents, - dataTypes = s.dataTypes; - - // Remove auto dataType and get content-type in the process - while ( dataTypes[ 0 ] === "*" ) { - dataTypes.shift(); - if ( ct === undefined ) { - ct = s.mimeType || jqXHR.getResponseHeader( "Content-Type" ); - } - } - - // Check if we're dealing with a known content-type - if ( ct ) { - for ( type in contents ) { - if ( contents[ type ] && contents[ type ].test( ct ) ) { - dataTypes.unshift( type ); - break; - } - } - } - - // Check to see if we have a response for the expected dataType - if ( dataTypes[ 0 ] in responses ) { - finalDataType = dataTypes[ 0 ]; - } else { - - // Try convertible dataTypes - for ( type in responses ) { - if ( !dataTypes[ 0 ] || s.converters[ type + " " + dataTypes[ 0 ] ] ) { - finalDataType = type; - break; - } - if ( !firstDataType ) { - firstDataType = type; - } - } - - // Or just use first one - finalDataType = finalDataType || firstDataType; - } - - // If we found a dataType - // We add the dataType to the list if needed - // and return the corresponding response - if ( finalDataType ) { - if ( finalDataType !== dataTypes[ 0 ] ) { - dataTypes.unshift( finalDataType ); - } - return responses[ finalDataType ]; - } -} - -/* Chain conversions given the request and the original response - * Also sets the responseXXX fields on the jqXHR instance - */ -function ajaxConvert( s, response, jqXHR, isSuccess ) { - var conv2, current, conv, tmp, prev, - converters = {}, - - // Work with a copy of dataTypes in case we need to modify it for conversion - dataTypes = 
s.dataTypes.slice(); - - // Create converters map with lowercased keys - if ( dataTypes[ 1 ] ) { - for ( conv in s.converters ) { - converters[ conv.toLowerCase() ] = s.converters[ conv ]; - } - } - - current = dataTypes.shift(); - - // Convert to each sequential dataType - while ( current ) { - - if ( s.responseFields[ current ] ) { - jqXHR[ s.responseFields[ current ] ] = response; - } - - // Apply the dataFilter if provided - if ( !prev && isSuccess && s.dataFilter ) { - response = s.dataFilter( response, s.dataType ); - } - - prev = current; - current = dataTypes.shift(); - - if ( current ) { - - // There's only work to do if current dataType is non-auto - if ( current === "*" ) { - - current = prev; - - // Convert response if prev dataType is non-auto and differs from current - } else if ( prev !== "*" && prev !== current ) { - - // Seek a direct converter - conv = converters[ prev + " " + current ] || converters[ "* " + current ]; - - // If none found, seek a pair - if ( !conv ) { - for ( conv2 in converters ) { - - // If conv2 outputs current - tmp = conv2.split( " " ); - if ( tmp[ 1 ] === current ) { - - // If prev can be converted to accepted input - conv = converters[ prev + " " + tmp[ 0 ] ] || - converters[ "* " + tmp[ 0 ] ]; - if ( conv ) { - - // Condense equivalence converters - if ( conv === true ) { - conv = converters[ conv2 ]; - - // Otherwise, insert the intermediate dataType - } else if ( converters[ conv2 ] !== true ) { - current = tmp[ 0 ]; - dataTypes.unshift( tmp[ 1 ] ); - } - break; - } - } - } - } - - // Apply converter (if not an equivalence) - if ( conv !== true ) { - - // Unless errors are allowed to bubble, catch and return them - if ( conv && s.throws ) { - response = conv( response ); - } else { - try { - response = conv( response ); - } catch ( e ) { - return { - state: "parsererror", - error: conv ? 
e : "No conversion from " + prev + " to " + current - }; - } - } - } - } - } - } - - return { state: "success", data: response }; -} - -jQuery.extend( { - - // Counter for holding the number of active queries - active: 0, - - // Last-Modified header cache for next request - lastModified: {}, - etag: {}, - - ajaxSettings: { - url: location.href, - type: "GET", - isLocal: rlocalProtocol.test( location.protocol ), - global: true, - processData: true, - async: true, - contentType: "application/x-www-form-urlencoded; charset=UTF-8", - - /* - timeout: 0, - data: null, - dataType: null, - username: null, - password: null, - cache: null, - throws: false, - traditional: false, - headers: {}, - */ - - accepts: { - "*": allTypes, - text: "text/plain", - html: "text/html", - xml: "application/xml, text/xml", - json: "application/json, text/javascript" - }, - - contents: { - xml: /\bxml\b/, - html: /\bhtml/, - json: /\bjson\b/ - }, - - responseFields: { - xml: "responseXML", - text: "responseText", - json: "responseJSON" - }, - - // Data converters - // Keys separate source (or catchall "*") and destination types with a single space - converters: { - - // Convert anything to text - "* text": String, - - // Text to html (true = no transformation) - "text html": true, - - // Evaluate text as a json expression - "text json": JSON.parse, - - // Parse text as xml - "text xml": jQuery.parseXML - }, - - // For options that shouldn't be deep extended: - // you can add your own custom options here if - // and when you create one that shouldn't be - // deep extended (see ajaxExtend) - flatOptions: { - url: true, - context: true - } - }, - - // Creates a full fledged settings object into target - // with both ajaxSettings and settings fields. - // If target is omitted, writes into ajaxSettings. - ajaxSetup: function( target, settings ) { - return settings ? 
- - // Building a settings object - ajaxExtend( ajaxExtend( target, jQuery.ajaxSettings ), settings ) : - - // Extending ajaxSettings - ajaxExtend( jQuery.ajaxSettings, target ); - }, - - ajaxPrefilter: addToPrefiltersOrTransports( prefilters ), - ajaxTransport: addToPrefiltersOrTransports( transports ), - - // Main method - ajax: function( url, options ) { - - // If url is an object, simulate pre-1.5 signature - if ( typeof url === "object" ) { - options = url; - url = undefined; - } - - // Force options to be an object - options = options || {}; - - var transport, - - // URL without anti-cache param - cacheURL, - - // Response headers - responseHeadersString, - responseHeaders, - - // timeout handle - timeoutTimer, - - // Url cleanup var - urlAnchor, - - // Request state (becomes false upon send and true upon completion) - completed, - - // To know if global events are to be dispatched - fireGlobals, - - // Loop variable - i, - - // uncached part of the url - uncached, - - // Create the final options object - s = jQuery.ajaxSetup( {}, options ), - - // Callbacks context - callbackContext = s.context || s, - - // Context for global events is callbackContext if it is a DOM node or jQuery collection - globalEventContext = s.context && - ( callbackContext.nodeType || callbackContext.jquery ) ? 
- jQuery( callbackContext ) : - jQuery.event, - - // Deferreds - deferred = jQuery.Deferred(), - completeDeferred = jQuery.Callbacks( "once memory" ), - - // Status-dependent callbacks - statusCode = s.statusCode || {}, - - // Headers (they are sent all at once) - requestHeaders = {}, - requestHeadersNames = {}, - - // Default abort message - strAbort = "canceled", - - // Fake xhr - jqXHR = { - readyState: 0, - - // Builds headers hashtable if needed - getResponseHeader: function( key ) { - var match; - if ( completed ) { - if ( !responseHeaders ) { - responseHeaders = {}; - while ( ( match = rheaders.exec( responseHeadersString ) ) ) { - responseHeaders[ match[ 1 ].toLowerCase() + " " ] = - ( responseHeaders[ match[ 1 ].toLowerCase() + " " ] || [] ) - .concat( match[ 2 ] ); - } - } - match = responseHeaders[ key.toLowerCase() + " " ]; - } - return match == null ? null : match.join( ", " ); - }, - - // Raw string - getAllResponseHeaders: function() { - return completed ? responseHeadersString : null; - }, - - // Caches the header - setRequestHeader: function( name, value ) { - if ( completed == null ) { - name = requestHeadersNames[ name.toLowerCase() ] = - requestHeadersNames[ name.toLowerCase() ] || name; - requestHeaders[ name ] = value; - } - return this; - }, - - // Overrides response content-type header - overrideMimeType: function( type ) { - if ( completed == null ) { - s.mimeType = type; - } - return this; - }, - - // Status-dependent callbacks - statusCode: function( map ) { - var code; - if ( map ) { - if ( completed ) { - - // Execute the appropriate callbacks - jqXHR.always( map[ jqXHR.status ] ); - } else { - - // Lazy-add the new callbacks in a way that preserves old ones - for ( code in map ) { - statusCode[ code ] = [ statusCode[ code ], map[ code ] ]; - } - } - } - return this; - }, - - // Cancel the request - abort: function( statusText ) { - var finalText = statusText || strAbort; - if ( transport ) { - transport.abort( finalText ); - } - done( 
0, finalText ); - return this; - } - }; - - // Attach deferreds - deferred.promise( jqXHR ); - - // Add protocol if not provided (prefilters might expect it) - // Handle falsy url in the settings object (#10093: consistency with old signature) - // We also use the url parameter if available - s.url = ( ( url || s.url || location.href ) + "" ) - .replace( rprotocol, location.protocol + "//" ); - - // Alias method option to type as per ticket #12004 - s.type = options.method || options.type || s.method || s.type; - - // Extract dataTypes list - s.dataTypes = ( s.dataType || "*" ).toLowerCase().match( rnothtmlwhite ) || [ "" ]; - - // A cross-domain request is in order when the origin doesn't match the current origin. - if ( s.crossDomain == null ) { - urlAnchor = document.createElement( "a" ); - - // Support: IE <=8 - 11, Edge 12 - 15 - // IE throws exception on accessing the href property if url is malformed, - // e.g. http://example.com:80x/ - try { - urlAnchor.href = s.url; - - // Support: IE <=8 - 11 only - // Anchor's host property isn't correctly set when s.url is relative - urlAnchor.href = urlAnchor.href; - s.crossDomain = originAnchor.protocol + "//" + originAnchor.host !== - urlAnchor.protocol + "//" + urlAnchor.host; - } catch ( e ) { - - // If there is an error parsing the URL, assume it is crossDomain, - // it can be rejected by the transport if it is invalid - s.crossDomain = true; - } - } - - // Convert data if not already a string - if ( s.data && s.processData && typeof s.data !== "string" ) { - s.data = jQuery.param( s.data, s.traditional ); - } - - // Apply prefilters - inspectPrefiltersOrTransports( prefilters, s, options, jqXHR ); - - // If request was aborted inside a prefilter, stop there - if ( completed ) { - return jqXHR; - } - - // We can fire global events as of now if asked to - // Don't fire events if jQuery.event is undefined in an AMD-usage scenario (#15118) - fireGlobals = jQuery.event && s.global; - - // Watch for a new set of 
requests - if ( fireGlobals && jQuery.active++ === 0 ) { - jQuery.event.trigger( "ajaxStart" ); - } - - // Uppercase the type - s.type = s.type.toUpperCase(); - - // Determine if request has content - s.hasContent = !rnoContent.test( s.type ); - - // Save the URL in case we're toying with the If-Modified-Since - // and/or If-None-Match header later on - // Remove hash to simplify url manipulation - cacheURL = s.url.replace( rhash, "" ); - - // More options handling for requests with no content - if ( !s.hasContent ) { - - // Remember the hash so we can put it back - uncached = s.url.slice( cacheURL.length ); - - // If data is available and should be processed, append data to url - if ( s.data && ( s.processData || typeof s.data === "string" ) ) { - cacheURL += ( rquery.test( cacheURL ) ? "&" : "?" ) + s.data; - - // #9682: remove data so that it's not used in an eventual retry - delete s.data; - } - - // Add or update anti-cache param if needed - if ( s.cache === false ) { - cacheURL = cacheURL.replace( rantiCache, "$1" ); - uncached = ( rquery.test( cacheURL ) ? "&" : "?" ) + "_=" + ( nonce.guid++ ) + - uncached; - } - - // Put hash and anti-cache on the URL that will be requested (gh-1732) - s.url = cacheURL + uncached; - - // Change '%20' to '+' if this is encoded form body content (gh-2658) - } else if ( s.data && s.processData && - ( s.contentType || "" ).indexOf( "application/x-www-form-urlencoded" ) === 0 ) { - s.data = s.data.replace( r20, "+" ); - } - - // Set the If-Modified-Since and/or If-None-Match header, if in ifModified mode. 
- if ( s.ifModified ) { - if ( jQuery.lastModified[ cacheURL ] ) { - jqXHR.setRequestHeader( "If-Modified-Since", jQuery.lastModified[ cacheURL ] ); - } - if ( jQuery.etag[ cacheURL ] ) { - jqXHR.setRequestHeader( "If-None-Match", jQuery.etag[ cacheURL ] ); - } - } - - // Set the correct header, if data is being sent - if ( s.data && s.hasContent && s.contentType !== false || options.contentType ) { - jqXHR.setRequestHeader( "Content-Type", s.contentType ); - } - - // Set the Accepts header for the server, depending on the dataType - jqXHR.setRequestHeader( - "Accept", - s.dataTypes[ 0 ] && s.accepts[ s.dataTypes[ 0 ] ] ? - s.accepts[ s.dataTypes[ 0 ] ] + - ( s.dataTypes[ 0 ] !== "*" ? ", " + allTypes + "; q=0.01" : "" ) : - s.accepts[ "*" ] - ); - - // Check for headers option - for ( i in s.headers ) { - jqXHR.setRequestHeader( i, s.headers[ i ] ); - } - - // Allow custom headers/mimetypes and early abort - if ( s.beforeSend && - ( s.beforeSend.call( callbackContext, jqXHR, s ) === false || completed ) ) { - - // Abort if not done already and return - return jqXHR.abort(); - } - - // Aborting is no longer a cancellation - strAbort = "abort"; - - // Install callbacks on deferreds - completeDeferred.add( s.complete ); - jqXHR.done( s.success ); - jqXHR.fail( s.error ); - - // Get transport - transport = inspectPrefiltersOrTransports( transports, s, options, jqXHR ); - - // If no transport, we auto-abort - if ( !transport ) { - done( -1, "No Transport" ); - } else { - jqXHR.readyState = 1; - - // Send global event - if ( fireGlobals ) { - globalEventContext.trigger( "ajaxSend", [ jqXHR, s ] ); - } - - // If request was aborted inside ajaxSend, stop there - if ( completed ) { - return jqXHR; - } - - // Timeout - if ( s.async && s.timeout > 0 ) { - timeoutTimer = window.setTimeout( function() { - jqXHR.abort( "timeout" ); - }, s.timeout ); - } - - try { - completed = false; - transport.send( requestHeaders, done ); - } catch ( e ) { - - // Rethrow post-completion 
exceptions - if ( completed ) { - throw e; - } - - // Propagate others as results - done( -1, e ); - } - } - - // Callback for when everything is done - function done( status, nativeStatusText, responses, headers ) { - var isSuccess, success, error, response, modified, - statusText = nativeStatusText; - - // Ignore repeat invocations - if ( completed ) { - return; - } - - completed = true; - - // Clear timeout if it exists - if ( timeoutTimer ) { - window.clearTimeout( timeoutTimer ); - } - - // Dereference transport for early garbage collection - // (no matter how long the jqXHR object will be used) - transport = undefined; - - // Cache response headers - responseHeadersString = headers || ""; - - // Set readyState - jqXHR.readyState = status > 0 ? 4 : 0; - - // Determine if successful - isSuccess = status >= 200 && status < 300 || status === 304; - - // Get response data - if ( responses ) { - response = ajaxHandleResponses( s, jqXHR, responses ); - } - - // Use a noop converter for missing script - if ( !isSuccess && jQuery.inArray( "script", s.dataTypes ) > -1 ) { - s.converters[ "text script" ] = function() {}; - } - - // Convert no matter what (that way responseXXX fields are always set) - response = ajaxConvert( s, response, jqXHR, isSuccess ); - - // If successful, handle type chaining - if ( isSuccess ) { - - // Set the If-Modified-Since and/or If-None-Match header, if in ifModified mode. 
- if ( s.ifModified ) { - modified = jqXHR.getResponseHeader( "Last-Modified" ); - if ( modified ) { - jQuery.lastModified[ cacheURL ] = modified; - } - modified = jqXHR.getResponseHeader( "etag" ); - if ( modified ) { - jQuery.etag[ cacheURL ] = modified; - } - } - - // if no content - if ( status === 204 || s.type === "HEAD" ) { - statusText = "nocontent"; - - // if not modified - } else if ( status === 304 ) { - statusText = "notmodified"; - - // If we have data, let's convert it - } else { - statusText = response.state; - success = response.data; - error = response.error; - isSuccess = !error; - } - } else { - - // Extract error from statusText and normalize for non-aborts - error = statusText; - if ( status || !statusText ) { - statusText = "error"; - if ( status < 0 ) { - status = 0; - } - } - } - - // Set data for the fake xhr object - jqXHR.status = status; - jqXHR.statusText = ( nativeStatusText || statusText ) + ""; - - // Success/Error - if ( isSuccess ) { - deferred.resolveWith( callbackContext, [ success, statusText, jqXHR ] ); - } else { - deferred.rejectWith( callbackContext, [ jqXHR, statusText, error ] ); - } - - // Status-dependent callbacks - jqXHR.statusCode( statusCode ); - statusCode = undefined; - - if ( fireGlobals ) { - globalEventContext.trigger( isSuccess ? "ajaxSuccess" : "ajaxError", - [ jqXHR, s, isSuccess ? 
success : error ] ); - } - - // Complete - completeDeferred.fireWith( callbackContext, [ jqXHR, statusText ] ); - - if ( fireGlobals ) { - globalEventContext.trigger( "ajaxComplete", [ jqXHR, s ] ); - - // Handle the global AJAX counter - if ( !( --jQuery.active ) ) { - jQuery.event.trigger( "ajaxStop" ); - } - } - } - - return jqXHR; - }, - - getJSON: function( url, data, callback ) { - return jQuery.get( url, data, callback, "json" ); - }, - - getScript: function( url, callback ) { - return jQuery.get( url, undefined, callback, "script" ); - } -} ); - -jQuery.each( [ "get", "post" ], function( _i, method ) { - jQuery[ method ] = function( url, data, callback, type ) { - - // Shift arguments if data argument was omitted - if ( isFunction( data ) ) { - type = type || callback; - callback = data; - data = undefined; - } - - // The url can be an options object (which then must have .url) - return jQuery.ajax( jQuery.extend( { - url: url, - type: method, - dataType: type, - data: data, - success: callback - }, jQuery.isPlainObject( url ) && url ) ); - }; -} ); - -jQuery.ajaxPrefilter( function( s ) { - var i; - for ( i in s.headers ) { - if ( i.toLowerCase() === "content-type" ) { - s.contentType = s.headers[ i ] || ""; - } - } -} ); - - -jQuery._evalUrl = function( url, options, doc ) { - return jQuery.ajax( { - url: url, - - // Make this explicit, since user can override this through ajaxSetup (#11264) - type: "GET", - dataType: "script", - cache: true, - async: false, - global: false, - - // Only evaluate the response if it is successful (gh-4126) - // dataFilter is not invoked for failure responses, so using it instead - // of the default converter is kludgy but it works. 
- converters: { - "text script": function() {} - }, - dataFilter: function( response ) { - jQuery.globalEval( response, options, doc ); - } - } ); -}; - - -jQuery.fn.extend( { - wrapAll: function( html ) { - var wrap; - - if ( this[ 0 ] ) { - if ( isFunction( html ) ) { - html = html.call( this[ 0 ] ); - } - - // The elements to wrap the target around - wrap = jQuery( html, this[ 0 ].ownerDocument ).eq( 0 ).clone( true ); - - if ( this[ 0 ].parentNode ) { - wrap.insertBefore( this[ 0 ] ); - } - - wrap.map( function() { - var elem = this; - - while ( elem.firstElementChild ) { - elem = elem.firstElementChild; - } - - return elem; - } ).append( this ); - } - - return this; - }, - - wrapInner: function( html ) { - if ( isFunction( html ) ) { - return this.each( function( i ) { - jQuery( this ).wrapInner( html.call( this, i ) ); - } ); - } - - return this.each( function() { - var self = jQuery( this ), - contents = self.contents(); - - if ( contents.length ) { - contents.wrapAll( html ); - - } else { - self.append( html ); - } - } ); - }, - - wrap: function( html ) { - var htmlIsFunction = isFunction( html ); - - return this.each( function( i ) { - jQuery( this ).wrapAll( htmlIsFunction ? 
html.call( this, i ) : html ); - } ); - }, - - unwrap: function( selector ) { - this.parent( selector ).not( "body" ).each( function() { - jQuery( this ).replaceWith( this.childNodes ); - } ); - return this; - } -} ); - - -jQuery.expr.pseudos.hidden = function( elem ) { - return !jQuery.expr.pseudos.visible( elem ); -}; -jQuery.expr.pseudos.visible = function( elem ) { - return !!( elem.offsetWidth || elem.offsetHeight || elem.getClientRects().length ); -}; - - - - -jQuery.ajaxSettings.xhr = function() { - try { - return new window.XMLHttpRequest(); - } catch ( e ) {} -}; - -var xhrSuccessStatus = { - - // File protocol always yields status code 0, assume 200 - 0: 200, - - // Support: IE <=9 only - // #1450: sometimes IE returns 1223 when it should be 204 - 1223: 204 - }, - xhrSupported = jQuery.ajaxSettings.xhr(); - -support.cors = !!xhrSupported && ( "withCredentials" in xhrSupported ); -support.ajax = xhrSupported = !!xhrSupported; - -jQuery.ajaxTransport( function( options ) { - var callback, errorCallback; - - // Cross domain only allowed if supported through XMLHttpRequest - if ( support.cors || xhrSupported && !options.crossDomain ) { - return { - send: function( headers, complete ) { - var i, - xhr = options.xhr(); - - xhr.open( - options.type, - options.url, - options.async, - options.username, - options.password - ); - - // Apply custom fields if provided - if ( options.xhrFields ) { - for ( i in options.xhrFields ) { - xhr[ i ] = options.xhrFields[ i ]; - } - } - - // Override mime type if needed - if ( options.mimeType && xhr.overrideMimeType ) { - xhr.overrideMimeType( options.mimeType ); - } - - // X-Requested-With header - // For cross-domain requests, seeing as conditions for a preflight are - // akin to a jigsaw puzzle, we simply never set it to be sure. - // (it can always be set on a per-request basis or even using ajaxSetup) - // For same-domain requests, won't change header if already provided. 
- if ( !options.crossDomain && !headers[ "X-Requested-With" ] ) { - headers[ "X-Requested-With" ] = "XMLHttpRequest"; - } - - // Set headers - for ( i in headers ) { - xhr.setRequestHeader( i, headers[ i ] ); - } - - // Callback - callback = function( type ) { - return function() { - if ( callback ) { - callback = errorCallback = xhr.onload = - xhr.onerror = xhr.onabort = xhr.ontimeout = - xhr.onreadystatechange = null; - - if ( type === "abort" ) { - xhr.abort(); - } else if ( type === "error" ) { - - // Support: IE <=9 only - // On a manual native abort, IE9 throws - // errors on any property access that is not readyState - if ( typeof xhr.status !== "number" ) { - complete( 0, "error" ); - } else { - complete( - - // File: protocol always yields status 0; see #8605, #14207 - xhr.status, - xhr.statusText - ); - } - } else { - complete( - xhrSuccessStatus[ xhr.status ] || xhr.status, - xhr.statusText, - - // Support: IE <=9 only - // IE9 has no XHR2 but throws on binary (trac-11426) - // For XHR2 non-text, let the caller handle it (gh-2498) - ( xhr.responseType || "text" ) !== "text" || - typeof xhr.responseText !== "string" ? 
- { binary: xhr.response } : - { text: xhr.responseText }, - xhr.getAllResponseHeaders() - ); - } - } - }; - }; - - // Listen to events - xhr.onload = callback(); - errorCallback = xhr.onerror = xhr.ontimeout = callback( "error" ); - - // Support: IE 9 only - // Use onreadystatechange to replace onabort - // to handle uncaught aborts - if ( xhr.onabort !== undefined ) { - xhr.onabort = errorCallback; - } else { - xhr.onreadystatechange = function() { - - // Check readyState before timeout as it changes - if ( xhr.readyState === 4 ) { - - // Allow onerror to be called first, - // but that will not handle a native abort - // Also, save errorCallback to a variable - // as xhr.onerror cannot be accessed - window.setTimeout( function() { - if ( callback ) { - errorCallback(); - } - } ); - } - }; - } - - // Create the abort callback - callback = callback( "abort" ); - - try { - - // Do send the request (this may raise an exception) - xhr.send( options.hasContent && options.data || null ); - } catch ( e ) { - - // #14683: Only rethrow if this hasn't been notified as an error yet - if ( callback ) { - throw e; - } - } - }, - - abort: function() { - if ( callback ) { - callback(); - } - } - }; - } -} ); - - - - -// Prevent auto-execution of scripts when no explicit dataType was provided (See gh-2432) -jQuery.ajaxPrefilter( function( s ) { - if ( s.crossDomain ) { - s.contents.script = false; - } -} ); - -// Install script dataType -jQuery.ajaxSetup( { - accepts: { - script: "text/javascript, application/javascript, " + - "application/ecmascript, application/x-ecmascript" - }, - contents: { - script: /\b(?:java|ecma)script\b/ - }, - converters: { - "text script": function( text ) { - jQuery.globalEval( text ); - return text; - } - } -} ); - -// Handle cache's special case and crossDomain -jQuery.ajaxPrefilter( "script", function( s ) { - if ( s.cache === undefined ) { - s.cache = false; - } - if ( s.crossDomain ) { - s.type = "GET"; - } -} ); - -// Bind script tag hack 
transport -jQuery.ajaxTransport( "script", function( s ) { - - // This transport only deals with cross domain or forced-by-attrs requests - if ( s.crossDomain || s.scriptAttrs ) { - var script, callback; - return { - send: function( _, complete ) { - script = jQuery( " - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Hardware agnostic training (preparation)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Hardware agnostic training (preparation)

-

To train on CPU/GPU/TPU without changing your code, we need to build a few good habits :)

-
-
-

Delete .cuda() or .to() calls

-

Delete any calls to .cuda() or .to(device).

-
# before lightning
-def forward(self, x):
-    x = x.cuda(0)
-    layer_1.cuda(0)
-    x_hat = layer_1(x)
-
-
-# after lightning
-def forward(self, x):
-    x_hat = layer_1(x)
-
-
-
-
-
-

Init tensors using type_as and register_buffer

-

When you need to create a new tensor, use type_as. -This will make your code scale to any arbitrary number of GPUs or TPUs with Lightning.

-
# before lightning
-def forward(self, x):
-    z = torch.Tensor(2, 3)
-    z = z.cuda(0)
-
-
-# with lightning
-def forward(self, x):
-    z = torch.Tensor(2, 3)
-    z = z.type_as(x)
-
-
-

The LightningModule knows what device it is on. You can access the reference via self.device. -Sometimes it is necessary to store tensors as module attributes. However, if they are not parameters, they will -remain on the CPU even if the module gets moved to a new device. To prevent that and remain device agnostic, -register the tensor as a buffer in your module’s __init__ method with register_buffer().

-
class LitModel(LightningModule):
-    def __init__(self):
-        ...
-        self.register_buffer("sigma", torch.eye(3))
-        # you can now access self.sigma anywhere in your module
-
-
-
-
-
-

Remove samplers

-

DistributedSampler is automatically handled by Lightning.

-

See replace_sampler_ddp for more information.

-
-
-
-

Synchronize validation and test logging

-

When running in distributed mode, we have to ensure that the validation and test step logging calls are synchronized across processes. -This is done by adding sync_dist=True to all self.log calls in the validation and test step. -This ensures that each GPU worker has the same behaviour when tracking model checkpoints, which is important for later downstream tasks such as testing the best checkpoint across all workers. -The sync_dist option can also be used in logging calls during the step methods, but be aware that this can lead to significant communication overhead and slow down your training.

-

Note: if you use any built-in metrics or custom metrics that use TorchMetrics, these do not need to be updated and are automatically handled for you.

-
def validation_step(self, batch, batch_idx):
-    x, y = batch
-    logits = self(x)
-    loss = self.loss(logits, y)
-    # Add sync_dist=True to sync logging across all GPU workers (may have performance impact)
-    self.log("validation_loss", loss, on_step=True, on_epoch=True, sync_dist=True)
-
-
-def test_step(self, batch, batch_idx):
-    x, y = batch
-    logits = self(x)
-    loss = self.loss(logits, y)
-    # Add sync_dist=True to sync logging across all GPU workers (may have performance impact)
-    self.log("test_loss", loss, on_step=True, on_epoch=True, sync_dist=True)
-
-
-

It is possible to perform some computation manually and log the reduced result on rank 0 as follows:

-
def test_step(self, batch, batch_idx):
-    x, y = batch
-    tensors = self(x)
-    return tensors
-
-
-def test_epoch_end(self, outputs):
-    mean = torch.mean(self.all_gather(outputs))
-
-    # When logging only on rank 0, don't forget to add
-    # ``rank_zero_only=True`` to avoid deadlocks on synchronization.
-    if self.trainer.is_global_zero:
-        self.log("my_reduced_metric", mean, rank_zero_only=True)
-
-
-
-
-
-

Make models pickleable

-

It’s very likely your code is already pickleable, -in which case no change is necessary. -However, if you run a distributed model and get the following error:

-
self._launch(process_obj)
-File "/net/software/local/python/3.6.5/lib/python3.6/multiprocessing/popen_spawn_posix.py", line 47,
-in _launch reduction.dump(process_obj, fp)
-File "/net/software/local/python/3.6.5/lib/python3.6/multiprocessing/reduction.py", line 60, in dump
-ForkingPickler(file, protocol).dump(obj)
-_pickle.PicklingError: Can't pickle <function <lambda> at 0x2b599e088ae8>:
-attribute lookup <lambda> on __main__ failed
-
-
-

This means something in your model definition, transforms, optimizer, dataloader or callbacks cannot be pickled, and the following code will fail:

-
import pickle
-
-pickle.dump(some_object)
-
-
-

This is a limitation of using multiple processes for distributed training within PyTorch. -To fix this issue, find the piece of code that cannot be pickled. The end of the stack trace -is usually helpful. -For example, in the stack trace shown here, there seems to be a lambda function somewhere in the code -which cannot be pickled.

-
self._launch(process_obj)
-File "/net/software/local/python/3.6.5/lib/python3.6/multiprocessing/popen_spawn_posix.py", line 47,
-in _launch reduction.dump(process_obj, fp)
-File "/net/software/local/python/3.6.5/lib/python3.6/multiprocessing/reduction.py", line 60, in dump
-ForkingPickler(file, protocol).dump(obj)
-_pickle.PicklingError: Can't pickle [THIS IS THE THING TO FIND AND DELETE]:
-attribute lookup <lambda> on __main__ failed
-
-
-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright (c) 2018-2022, William Falcon et al. - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/accelerators/gpu.html b/docs/accelerators/gpu.html deleted file mode 100644 index 64b6384..0000000 --- a/docs/accelerators/gpu.html +++ /dev/null @@ -1,761 +0,0 @@ - - - - - - - - - - - - - - Accelerator: GPU training — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Accelerator: GPU training
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
- - -
- -
-
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/accelerators/gpu_advanced.html b/docs/accelerators/gpu_advanced.html deleted file mode 100644 index dcccce2..0000000 --- a/docs/accelerators/gpu_advanced.html +++ /dev/null @@ -1,692 +0,0 @@ - - - - - - - - - - - - - - GPU training (Advanced) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • GPU training (Advanced)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

GPU training (Advanced)

-

Audience: Users looking to scale massive models (ie: 1 Trillion parameters).

-
-

For experts pushing the state-of-the-art in model development, Lightning offers various techniques to enable Trillion+ parameter-scale models.

-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- -
- -
-
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/accelerators/gpu_basic.html b/docs/accelerators/gpu_basic.html deleted file mode 100644 index bf93504..0000000 --- a/docs/accelerators/gpu_basic.html +++ /dev/null @@ -1,802 +0,0 @@ - - - - - - - - - - - - - - GPU training (Basic) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • GPU training (Basic)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

GPU training (Basic)

-

Audience: Users looking to save money and run large models faster using single or multiple GPUs.

-
-
-

What is a GPU?

-

A Graphics Processing Unit (GPU) is a specialized hardware accelerator designed to speed up mathematical computations used in gaming and deep learning.

-
-
-
-

Train on 1 GPU

-

Make sure you’re running on a machine with at least one GPU. There’s no need to specify any NVIDIA flags -as Lightning will do it for you.

-
trainer = Trainer(accelerator="gpu", devices=1)
-
-
-
-
-
-

Train on multiple GPUs

-

To use multiple GPUs, set the number of devices in the Trainer or the index of the GPUs.

-
trainer = Trainer(accelerator="gpu", devices=4)
-
-
-
-

Choosing GPU devices

-

You can select the GPU devices using ranges, a list of indices or a string containing -a comma separated list of GPU ids:

-
# DEFAULT (int) specifies how many GPUs to use per node
-Trainer(accelerator="gpu", devices=k)
-
-# Above is equivalent to
-Trainer(accelerator="gpu", devices=list(range(k)))
-
-# Specify which GPUs to use (don't use when running on cluster)
-Trainer(accelerator="gpu", devices=[0, 1])
-
-# Equivalent using a string
-Trainer(accelerator="gpu", devices="0, 1")
-
-# To use all available GPUs put -1 or '-1'
-# equivalent to list(range(torch.cuda.device_count()))
-Trainer(accelerator="gpu", devices=-1)
-
-
-

The table below lists examples of possible input formats and how they are interpreted by Lightning.

- ------ - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -

devices

Type

Parsed

Meaning

3

int

[0, 1, 2]

first 3 GPUs

-1

int

[0, 1, 2, …]

all available GPUs

[0]

list

[0]

GPU 0

[1, 3]

list

[1, 3]

GPUs 1 and 3

“3”

str

[0, 1, 2]

first 3 GPUs

“1, 3”

str

[1, 3]

GPUs 1 and 3

“-1”

str

[0, 1, 2, …]

all available GPUs

-
-

Note

-

When specifying number of devices as an integer devices=k, setting the trainer flag -auto_select_gpus=True will automatically help you find k GPUs that are not -occupied by other processes. This is especially useful when GPUs are configured -to be in “exclusive mode”, such that only one process at a time can access them. -For more details see the trainer guide.

-
-
-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/accelerators/gpu_expert.html b/docs/accelerators/gpu_expert.html deleted file mode 100644 index 6fb1e99..0000000 --- a/docs/accelerators/gpu_expert.html +++ /dev/null @@ -1,887 +0,0 @@ - - - - - - - - - - - - - - GPU training (Expert) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • GPU training (Expert)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

GPU training (Expert)

-

Audience: Experts creating new scaling techniques such as Deepspeed or FSDP

-
-

Lightning enables experts focused on researching new ways of optimizing distributed training/inference strategies to create new strategies and plug them into Lightning.

-

For example, Lightning worked closely with the Microsoft team to develop a Deepspeed integration and with the Facebook(Meta) team to develop an FSDP integration.

-
-
-
-

Strategy Registry

-
-

Warning

-

The Strategy Registry is experimental and subject to change.

-
-

Lightning includes a registry that holds information about Training strategies and allows for the registration of new custom strategies.

-

The Strategies are assigned strings that identify them, such as “ddp”, “deepspeed_stage_2_offload”, and so on. -The registry also returns the optional description and parameters for initialising the Strategy that were defined during registration.

-
# Training with the DDP Strategy with `find_unused_parameters` as False
-trainer = Trainer(strategy="ddp_find_unused_parameters_false", accelerator="gpu", devices=4)
-
-# Training with DeepSpeed ZeRO Stage 3 and CPU Offload
-trainer = Trainer(strategy="deepspeed_stage_3_offload", accelerator="gpu", devices=3)
-
-# Training with the TPU Spawn Strategy with `debug` as True
-trainer = Trainer(strategy="tpu_spawn_debug", accelerator="tpu", devices=8)
-
-
-

Additionally, you can pass your custom registered training strategies to the strategy argument.

-
from pytorch_lightning.strategies import DDPStrategy, StrategyRegistry, CheckpointIO
-
-
-class CustomCheckpointIO(CheckpointIO):
-    def save_checkpoint(self, checkpoint: Dict[str, Any], path: Union[str, Path]) -> None:
-        ...
-
-    def load_checkpoint(self, path: Union[str, Path]) -> Dict[str, Any]:
-        ...
-
-
-custom_checkpoint_io = CustomCheckpointIO()
-
-# Register the DDP Strategy with your custom CheckpointIO plugin
-StrategyRegistry.register(
-    "ddp_custom_checkpoint_io",
-    DDPStrategy,
-    description="DDP Strategy with custom checkpoint io plugin",
-    checkpoint_io=custom_checkpoint_io,
-)
-
-trainer = Trainer(strategy="ddp_custom_checkpoint_io", accelerator="gpu", devices=2)
-
-
-
-
-
orphan
-

-
-
-

What is a Strategy?

-

Strategy controls the model distribution across training, evaluation, and prediction to be used by the Trainer. It can be controlled by passing a strategy -alias ("ddp", "ddp_spawn", "deepspeed" and so on) or a custom strategy instance to the strategy parameter of the Trainer.

-

The Strategy in PyTorch Lightning handles the following responsibilities:

-
    -
  • Launch and teardown of training processes (if applicable).

  • -
  • Setup communication between processes (NCCL, GLOO, MPI, and so on).

  • -
  • Provide a unified communication interface for reduction, broadcast, and so on.

  • -
  • Owns the LightningModule

  • -
  • Handles/owns optimizers and schedulers.

  • -
-

Strategy also manages the accelerator, precision, and checkpointing plugins.

-Illustration of the Strategy as a composition of the Accelerator and several plugins -

We expose Strategies mainly for expert users that want to extend Lightning for new hardware support or new distributed backends (e.g. a backend not yet supported by PyTorch itself).

-
-
-
-

Enable Different Strategies

-
# Training with the DistributedDataParallel strategy on 4 GPUs
-trainer = Trainer(strategy="ddp", accelerator="gpu", devices=4)
-
-# Training with the custom DistributedDataParallel strategy on 4 GPUs
-trainer = Trainer(strategy=DDPStrategy(...), accelerator="gpu", devices=4)
-
-# Training with the DDP Spawn strategy using auto accelerator selection
-trainer = Trainer(strategy="ddp_spawn", accelerator="auto", devices=4)
-
-# Training with the DeepSpeed strategy on available GPUs
-trainer = Trainer(strategy="deepspeed", accelerator="gpu", devices="auto")
-
-# Training with the DDP strategy using 3 CPU processes
-trainer = Trainer(strategy="ddp", accelerator="cpu", devices=3)
-
-# Training with the DDP Spawn strategy on 8 TPU cores
-trainer = Trainer(strategy="ddp_spawn", accelerator="tpu", devices=8)
-
-# Training with the default IPU strategy on 8 IPUs
-trainer = Trainer(accelerator="ipu", devices=8)
-
-
-
-
-
-

Create a Custom Strategy

-

Expert users may choose to extend an existing strategy by overriding its methods.

-
from pytorch_lightning.strategies import DDPStrategy
-
-
-class CustomDDPStrategy(DDPStrategy):
-    def configure_ddp(self):
-        self.model = MyCustomDistributedDataParallel(
-            self.model,
-            device_ids=...,
-        )
-
-
-

or by subclassing the base class Strategy to create new ones. These custom strategies -can then be passed into the Trainer directly via the strategy parameter.

-
# custom plugins
-trainer = Trainer(strategy=CustomDDPStrategy())
-
-# fully custom accelerator and plugins
-accelerator = MyAccelerator()
-precision_plugin = MyPrecisionPlugin()
-training_strategy = CustomDDPStrategy(accelerator=accelerator, precision_plugin=precision_plugin)
-trainer = Trainer(strategy=training_strategy)
-
-
-

The complete list of built-in strategies is listed below.

-
-
-
-

Available Training Strategies

- ---- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -

BaguaStrategy

Strategy for training using the Bagua library, with advanced distributed training algorithms and system optimizations.

DDP2Strategy

DDP2 behaves like DP in one node, but synchronization across nodes behaves like in DDP.

DDPFullyShardedStrategy

Plugin for Fully Sharded Data Parallel provided by FairScale.

DDPShardedStrategy

Optimizer and gradient sharded training provided by FairScale.

DDPSpawnShardedStrategy

Optimizer sharded training provided by FairScale.

DDPSpawnStrategy

Spawns processes using the torch.multiprocessing.spawn() method and joins processes after training finishes.

DDPStrategy

Strategy for multi-process single-device training on one or multiple nodes.

DataParallelStrategy

Implements data-parallel training in a single process, i.e., the model gets replicated to each device and each gets a split of the data.

DeepSpeedStrategy

Provides capabilities to run training using the DeepSpeed library, with training optimizations for large billion parameter models.

HorovodStrategy

Plugin for Horovod distributed training integration.

HPUParallelStrategy

Strategy for distributed training on multiple HPU devices.

IPUStrategy

Plugin for training on IPU devices.

ParallelStrategy

Plugin for training with multiple processes in parallel.

SingleDeviceStrategy

Strategy that handles communication on a single device.

SingleHPUStrategy

Strategy for training on single HPU device.

SingleTPUStrategy

Strategy for training on a single TPU device.

Strategy

Base class for all strategies that change the behaviour of the training, validation and test- loop.

TPUSpawnStrategy

Strategy for training multiple TPU devices using the torch_xla.distributed.xla_multiprocessing.spawn() method.

-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/accelerators/gpu_faq.html b/docs/accelerators/gpu_faq.html deleted file mode 100644 index acbcd6f..0000000 --- a/docs/accelerators/gpu_faq.html +++ /dev/null @@ -1,766 +0,0 @@ - - - - - - - - - - - - - - GPU training (FAQ) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • GPU training (FAQ)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

GPU training (FAQ)

-
-

How should I adjust the learning rate when using multiple devices?

-

When using distributed training make sure to modify your learning rate according to your effective -batch size.

-

Let’s say you have a batch size of 7 in your dataloader.

-
class LitModel(LightningModule):
-    def train_dataloader(self):
-        return Dataset(..., batch_size=7)
-
-
-

In DDP, DDP_SPAWN, Deepspeed, DDP_SHARDED, or Horovod your effective batch size will be 7 * devices * num_nodes.

-
# effective batch size = 7 * 8
-Trainer(accelerator="gpu", devices=8, strategy="ddp")
-Trainer(accelerator="gpu", devices=8, strategy="ddp_spawn")
-Trainer(accelerator="gpu", devices=8, strategy="ddp_sharded")
-Trainer(accelerator="gpu", devices=8, strategy="horovod")
-
-# effective batch size = 7 * 8 * 10
-Trainer(accelerator="gpu", devices=8, num_nodes=10, strategy="ddp")
-Trainer(accelerator="gpu", devices=8, num_nodes=10, strategy="ddp_spawn")
-Trainer(accelerator="gpu", devices=8, num_nodes=10, strategy="ddp_sharded")
-Trainer(accelerator="gpu", devices=8, num_nodes=10, strategy="horovod")
-
-
-

In DDP2 or DP, your effective batch size will be 7 * num_nodes. -The reason is that the full batch is visible to all GPUs on the node when using DDP2.

-
# effective batch size = 7
-Trainer(accelerator="gpu", devices=8, strategy="ddp2")
-Trainer(accelerator="gpu", devices=8, strategy="dp")
-
-# effective batch size = 7 * 10
-Trainer(accelerator="gpu", devices=8, num_nodes=10, strategy="ddp2")
-Trainer(accelerator="gpu", devices=8, strategy="dp")
-
-
-
-

Note

-

Huge batch sizes are actually really bad for convergence. Check out: -Accurate, Large Minibatch SGD: Training ImageNet in 1 Hour

-
-
-
-
-

How do I use multiple GPUs on Jupyter or Colab notebooks?

-

To use multiple GPUs on notebooks, use the DP mode.

-
Trainer(accelerator="gpu", devices=4, strategy="dp")
-
-
-

If you want to use other strategies, please launch your training via the command-shell.

-
-

Note

-

Learn how to access a cloud machine with multiple GPUs in this guide.

-
-
-
- -
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/accelerators/gpu_intermediate.html b/docs/accelerators/gpu_intermediate.html deleted file mode 100644 index 4792c6d..0000000 --- a/docs/accelerators/gpu_intermediate.html +++ /dev/null @@ -1,1205 +0,0 @@ - - - - - - - - - - - - - - GPU training (Intermediate) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • GPU training (Intermediate)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

GPU training (Intermediate)

-

Audience: Users looking to train across machines or experiment with different scaling techniques.

-
-
-

Distributed Training strategies

-

Lightning supports multiple ways of doing distributed training.

-
-

-
-
    -
  • Data Parallel (strategy='dp') (multiple-gpus, 1 machine)

  • -
  • DistributedDataParallel (strategy='ddp') (multiple-gpus across many machines (python script based)).

  • -
  • DistributedDataParallel (strategy='ddp_spawn') (multiple-gpus across many machines (spawn based)).

  • -
  • DistributedDataParallel 2 (strategy='ddp2') (DP in a machine, DDP across machines).

  • -
  • Horovod (strategy='horovod') (multi-machine, multi-gpu, configured at runtime)

  • -
  • Bagua (strategy='bagua') (multiple-gpus across many machines with advanced training algorithms)

  • -
-
-

Note

-

If you request multiple GPUs or nodes without setting a mode, DDP Spawn will be automatically used.

-
-

For a deeper understanding of what Lightning is doing, feel free to read this -guide.

-
-

Data Parallel

-

DataParallel (DP) splits a batch across k GPUs. -That is, if you have a batch of 32 and use DP with 2 GPUs, each GPU will process 16 samples, -after which the root node will aggregate the results.

-
-

Warning

-

DP use is discouraged by PyTorch and Lightning. State is not maintained on the replicas created by the -DataParallel wrapper and you may see errors or misbehavior if you assign state to the module -in the forward() or *_step() methods. For the same reason we cannot fully support -Manual Optimization with DP. Use DDP which is more stable and at least 3x faster.

-
-
-

Warning

-

DP only supports scattering and gathering primitive collections of tensors like lists, dicts, etc. -Therefore the transfer_batch_to_device() hook does not apply in -this mode and if you have overridden it, it will not be called.

-
-
# train on 2 GPUs (using DP mode)
-trainer = Trainer(accelerator="gpu", devices=2, strategy="dp")
-
-
-
-
-

Distributed Data Parallel

-

DistributedDataParallel (DDP) works as follows:

-
    -
  1. Each GPU across each node gets its own process.

  2. -
  3. Each GPU gets visibility into a subset of the overall dataset. It will only ever see that subset.

  4. -
  5. Each process inits the model.

  6. -
  7. Each process performs a full forward and backward pass in parallel.

  8. -
  9. The gradients are synced and averaged across all processes.

  10. -
  11. Each process updates its optimizer.

  12. -
-
# train on 8 GPUs (same machine (ie: node))
-trainer = Trainer(accelerator="gpu", devices=8, strategy="ddp")
-
-# train on 32 GPUs (4 nodes)
-trainer = Trainer(accelerator="gpu", devices=8, strategy="ddp", num_nodes=4)
-
-
-

This Lightning implementation of DDP calls your script under the hood multiple times with the correct environment -variables:

-
# example for 3 GPUs DDP
-MASTER_ADDR=localhost MASTER_PORT=random() WORLD_SIZE=3 NODE_RANK=0 LOCAL_RANK=0 python my_file.py --accelerator 'gpu' --devices 3 --etc
-MASTER_ADDR=localhost MASTER_PORT=random() WORLD_SIZE=3 NODE_RANK=1 LOCAL_RANK=0 python my_file.py --accelerator 'gpu' --devices 3 --etc
-MASTER_ADDR=localhost MASTER_PORT=random() WORLD_SIZE=3 NODE_RANK=2 LOCAL_RANK=0 python my_file.py --accelerator 'gpu' --devices 3 --etc
-
-
-

We use DDP this way because ddp_spawn has a few limitations (due to Python and PyTorch):

-
    -
  1. Since .spawn() trains the model in subprocesses, the model on the main process does not get updated.

  2. -
  3. Dataloader(num_workers=N), where N is large, bottlenecks training with DDP… ie: it will be VERY slow or won’t work at all. This is a PyTorch limitation.

  4. -
  5. Forces everything to be picklable.

  6. -
-

There are cases in which it is NOT possible to use DDP. Examples are:

-
    -
  • Jupyter Notebook, Google COLAB, Kaggle, etc.

  • -
  • You have a nested script without a root package

  • -
-

In these situations you should use dp or ddp_spawn instead.

-
-
-

Distributed Data Parallel 2

-

In certain cases, it’s advantageous to use all batches on the same machine instead of a subset. -For instance, you might want to compute an NCE loss where it pays to have more negative samples.

-

In this case, we can use DDP2 which behaves like DP in a machine and DDP across nodes. DDP2 does the following:

-
    -
  1. Copies a subset of the data to each node.

  2. -
  3. Inits a model on each node.

  4. -
  5. Runs a forward and backward pass using DP.

  6. -
  7. Syncs gradients across nodes.

  8. -
  9. Applies the optimizer updates.

  10. -
-
# train on 32 GPUs (4 nodes)
-trainer = Trainer(accelerator="gpu", devices=8, strategy="ddp2", num_nodes=4)
-
-
-
-
-

Distributed Data Parallel Spawn

-

ddp_spawn is exactly like ddp except that it uses .spawn to start the training processes.

-
-

Warning

-

It is STRONGLY recommended to use DDP for speed and performance.

-
-
mp.spawn(self.ddp_train, nprocs=self.num_processes, args=(model,))
-
-
-

If your script does not support being called from the command line (ie: it is nested without a root -project module) you can use the following method:

-
# train on 8 GPUs (same machine (ie: node))
-trainer = Trainer(accelerator="gpu", devices=8, strategy="ddp_spawn")
-
-
-

We STRONGLY discourage this use because it has limitations (due to Python and PyTorch):

-
    -
  1. The model you pass in will not update. Please save a checkpoint and restore from there.

  2. -
  3. Set Dataloader(num_workers=0) or it will bottleneck training.

  4. -
-

ddp is MUCH faster than ddp_spawn. We recommend that you do the following:

-
    -
  1. Install a top-level module for your project using setup.py

  2. -
-
# setup.py
-#!/usr/bin/env python
-
-from setuptools import setup, find_packages
-
-setup(
-    name="src",
-    version="0.0.1",
-    description="Describe Your Cool Project",
-    author="",
-    author_email="",
-    url="https://github.com/YourSeed",  # REPLACE WITH YOUR OWN GITHUB PROJECT LINK
-    install_requires=["pytorch-lightning"],
-    packages=find_packages(),
-)
-
-
-
    -
  1. Set up your project like so:

  2. -
-
/project
-    /src
-        some_file.py
-        /or_a_folder
-    setup.py
-
-
-
    -
  1. Install as a root-level package

  2. -
-
cd /project
-pip install -e .
-
-
-

You can then call your scripts anywhere

-
cd /project/src
-python some_file.py --accelerator 'gpu' --devices 8 --strategy 'ddp'
-
-
-
-
-

Horovod

-

Horovod allows the same training script to be used for single-GPU, -multi-GPU, and multi-node training.

-

Like Distributed Data Parallel, every process in Horovod operates on a single GPU with a fixed -subset of the data. Gradients are averaged across all GPUs in parallel during the backward pass, -then synchronously applied before beginning the next step.

-

The number of worker processes is configured by a driver application (horovodrun or mpirun). In -the training script, Horovod will detect the number of workers from the environment, and automatically -scale the learning rate to compensate for the increased total batch size.

-

Horovod can be configured in the training script to run with any number of GPUs / processes as follows:

-
# train Horovod on GPU (number of GPUs / machines provided on command-line)
-trainer = Trainer(strategy="horovod", accelerator="gpu", devices=1)
-
-# train Horovod on CPU (number of processes / machines provided on command-line)
-trainer = Trainer(strategy="horovod")
-
-
-

When starting the training job, the driver application will then be used to specify the total -number of worker processes:

-
# run training with 4 GPUs on a single machine
-horovodrun -np 4 python train.py
-
-# run training with 8 GPUs on two machines (4 GPUs each)
-horovodrun -np 8 -H hostname1:4,hostname2:4 python train.py
-
-
-

See the official Horovod documentation for details -on installation and performance tuning.

-
-
-

Bagua

-

Bagua is a deep learning training acceleration framework which supports -multiple advanced distributed training algorithms including:

-
    -
  • Gradient AllReduce for centralized synchronous communication, where gradients are averaged among all workers.

  • -
  • Decentralized SGD for decentralized synchronous communication, where each worker exchanges data with one or a few specific workers.

  • -
  • ByteGrad and QAdam for low precision communication, where data is compressed into low precision before communication.

  • -
  • Asynchronous Model Average for asynchronous communication, where workers are not required to be synchronized in the same iteration in a lock-step style.

  • -
-

By default, Bagua uses the Gradient AllReduce algorithm, which is also the algorithm implemented in Distributed Data Parallel and Horovod, -but Bagua can usually produce a higher training throughput due to its backend written in Rust.

-
# train on 4 GPUs (using Bagua mode)
-trainer = Trainer(strategy="bagua", accelerator="gpu", devices=4)
-
-
-

By specifying the algorithm in the BaguaStrategy, you can select more advanced training algorithms featured by Bagua:

-
# train on 4 GPUs, using Bagua Gradient AllReduce algorithm
-trainer = Trainer(
-    strategy=BaguaStrategy(algorithm="gradient_allreduce"),
-    accelerator="gpu",
-    devices=4,
-)
-
-# train on 4 GPUs, using Bagua ByteGrad algorithm
-trainer = Trainer(
-    strategy=BaguaStrategy(algorithm="bytegrad"),
-    accelerator="gpu",
-    devices=4,
-)
-
-# train on 4 GPUs, using Bagua Decentralized SGD
-trainer = Trainer(
-    strategy=BaguaStrategy(algorithm="decentralized"),
-    accelerator="gpu",
-    devices=4,
-)
-
-# train on 4 GPUs, using Bagua Low Precision Decentralized SGD
-trainer = Trainer(
-    strategy=BaguaStrategy(algorithm="low_precision_decentralized"),
-    accelerator="gpu",
-    devices=4,
-)
-
-# train on 4 GPUs, using Asynchronous Model Average algorithm, with a synchronization interval of 100ms
-trainer = Trainer(
-    strategy=BaguaStrategy(algorithm="async", sync_interval_ms=100),
-    accelerator="gpu",
-    devices=4,
-)
-
-
-

To use QAdam, we need to initialize -QAdamOptimizer first:

-
from pytorch_lightning.strategies import BaguaStrategy
-from bagua.torch_api.algorithms.q_adam import QAdamOptimizer
-
-
-class MyModel(pl.LightningModule):
-    ...
-
-    def configure_optimizers(self):
-        # initialize QAdam Optimizer
-        return QAdamOptimizer(self.parameters(), lr=0.05, warmup_steps=100)
-
-
-model = MyModel()
-trainer = Trainer(
-    accelerator="gpu",
-    devices=4,
-    strategy=BaguaStrategy(algorithm="qadam"),
-)
-trainer.fit(model)
-
-
-

Bagua relies on its own launcher to schedule jobs. -Below, find examples using bagua.distributed.launch which follows torch.distributed.launch API:

-
# start training with 8 GPUs on a single node
-python -m bagua.distributed.launch --nproc_per_node=8 train.py
-
-
-

If the ssh service is available with passwordless login on each node, you can launch the distributed job on a -single node with baguarun, which has a similar syntax to mpirun. When starting the job, baguarun will -automatically spawn new processes on each of the training nodes listed in the --host_list option, where each node -is described as an IP address followed by an SSH port.

-
# Run on node1 (or node2) to start training on two nodes (node1 and node2), 8 GPUs per node
-baguarun --host_list hostname1:ssh_port1,hostname2:ssh_port2 --nproc_per_node=8 --master_port=port1 train.py
-
-
-
-

Note

-

You can also start training in the same way as Distributed Data Parallel. However, system optimizations like -Bagua-Net and -Performance autotuning can only be enabled through bagua -launcher. It is worth noting that with Bagua-Net, Distributed Data Parallel can also achieve -better performance without modifying the training script.

-
-

See Bagua Tutorials for more details on installation and advanced features.

-
-
-

DP/DDP2 caveats

-

In DP and DDP2 each GPU within a machine sees a portion of a batch. -DP and ddp2 roughly do the following:

-
def distributed_forward(batch, model):
-    batch = torch.Tensor(32, 8)
-    gpu_0_batch = batch[:8]
-    gpu_1_batch = batch[8:16]
-    gpu_2_batch = batch[16:24]
-    gpu_3_batch = batch[24:]
-
-    y_0 = model_copy_gpu_0(gpu_0_batch)
-    y_1 = model_copy_gpu_1(gpu_1_batch)
-    y_2 = model_copy_gpu_2(gpu_2_batch)
-    y_3 = model_copy_gpu_3(gpu_3_batch)
-
-    return [y_0, y_1, y_2, y_3]
-
-
-

So, when Lightning calls any of the training_step, validation_step, test_step -you will only be operating on one of those pieces.

-
# the batch here is a portion of the FULL batch
-def training_step(self, batch, batch_idx):
-    y_0 = batch
-
-
-

For most metrics, this doesn’t really matter. However, if you want -to add something to your computational graph (like softmax) -using all batch parts you can use the training_step_end step.

-
def training_step_end(self, outputs):
-    # only use when  on dp
-    outputs = torch.cat(outputs, dim=1)
-    softmax = softmax(outputs, dim=1)
-    out = softmax.mean()
-    return out
-
-
-

In pseudocode, the full sequence is:

-
# get data
-batch = next(dataloader)
-
-# copy model and data to each gpu
-batch_splits = split_batch(batch, num_gpus)
-models = copy_model_to_gpus(model)
-
-# in parallel, operate on each batch chunk
-all_results = []
-for gpu_num in gpus:
-    batch_split = batch_splits[gpu_num]
-    gpu_model = models[gpu_num]
-    out = gpu_model(batch_split)
-    all_results.append(out)
-
-# use the full batch for something like softmax
-full_out = model.training_step_end(all_results)
-
-
-

To illustrate why this is needed, let’s look at DataParallel

-
def training_step(self, batch, batch_idx):
-    x, y = batch
-    y_hat = self(batch)
-
-    # on dp or ddp2 if we did softmax now it would be wrong
-    # because batch is actually a piece of the full batch
-    return y_hat
-
-
-def training_step_end(self, step_output):
-    # step_output has outputs of each part of the batch
-
-    # do softmax here
-    outputs = torch.cat(outputs, dim=1)
-    softmax = softmax(outputs, dim=1)
-    out = softmax.mean()
-
-    return out
-
-
-

If training_step_end is defined it will be called regardless of TPU, DP, DDP, etc… which means -it will behave the same regardless of the backend.

-

Validation and test step have the same option when using DP.

-
def validation_step_end(self, step_output):
-    ...
-
-
-def test_step_end(self, step_output):
-    ...
-
-
-
-
-

Distributed and 16-bit precision

-

Due to an issue with Apex and DataParallel (PyTorch and NVIDIA issue), Lightning does -not allow combining 16-bit precision with DP training. We tried to get this to work, but it’s an issue on their end.

-

Below are the possible configurations we support.

- -------- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -

1 GPU

1+ GPUs

DP

DDP

16-bit

command

Y

Trainer(accelerator=”gpu”, devices=1)

Y

Y

Trainer(accelerator=”gpu”, devices=1, precision=16)

Y

Y

Trainer(accelerator=”gpu”, devices=k, strategy=’dp’)

Y

Y

Trainer(accelerator=”gpu”, devices=k, strategy=’ddp’)

Y

Y

Y

Trainer(accelerator=”gpu”, devices=k, strategy=’ddp’, precision=16)

-
-
-

Implement Your Own Distributed (DDP) training

-

If you need your own way to init PyTorch DDP you can override pytorch_lightning.strategies.ddp.DDPStrategy.init_dist_connection().

-

If you also need to use your own DDP implementation, override pytorch_lightning.strategies.ddp.DDPStrategy.configure_ddp().

-
-
-
-
-

Torch Distributed Elastic

-

Lightning supports the use of Torch Distributed Elastic to enable fault-tolerant and elastic distributed job scheduling. To use it, specify the ‘ddp’ or ‘ddp2’ backend and the number of GPUs you want to use in the trainer.

-
Trainer(accelerator="gpu", devices=8, strategy="ddp")
-
-
-

To launch a fault-tolerant job, run the following on all nodes.

-
python -m torch.distributed.run
-        --nnodes=NUM_NODES
-        --nproc_per_node=TRAINERS_PER_NODE
-        --rdzv_id=JOB_ID
-        --rdzv_backend=c10d
-        --rdzv_endpoint=HOST_NODE_ADDR
-        YOUR_LIGHTNING_TRAINING_SCRIPT.py (--arg1 ... train script args...)
-
-
-

To launch an elastic job, run the following on at least MIN_SIZE nodes and at most MAX_SIZE nodes.

-
python -m torch.distributed.run
-        --nnodes=MIN_SIZE:MAX_SIZE
-        --nproc_per_node=TRAINERS_PER_NODE
-        --rdzv_id=JOB_ID
-        --rdzv_backend=c10d
-        --rdzv_endpoint=HOST_NODE_ADDR
-        YOUR_LIGHTNING_TRAINING_SCRIPT.py (--arg1 ... train script args...)
-
-
-

See the official Torch Distributed Elastic documentation for details -on installation and more use cases.

-
-
-

Optimize multi-machine communication

-

By default, Lightning will select the nccl backend over gloo when running on GPUs. -Find more information about PyTorch’s supported backends here.

-

Lightning allows explicitly specifying the backend via the process_group_backend constructor argument on the relevant Strategy classes. By default, Lightning will select the appropriate process group backend based on the hardware used.

-
from pytorch_lightning.strategies import DDPStrategy
-
-# Explicitly specify the process group backend if you choose to
-ddp = DDPStrategy(process_group_backend="nccl")
-
-# Configure the strategy on the Trainer
-trainer = Trainer(strategy=ddp, accelerator="gpu", devices=8)
-
-
-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/accelerators/hpu.html b/docs/accelerators/hpu.html deleted file mode 100644 index 767c74b..0000000 --- a/docs/accelerators/hpu.html +++ /dev/null @@ -1,731 +0,0 @@ - - - - - - - - - - - - - - Accelerator: HPU training — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Accelerator: HPU training
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
- - -
-
- - - - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- -
- -
-
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/accelerators/hpu_basic.html b/docs/accelerators/hpu_basic.html deleted file mode 100644 index ee508e5..0000000 --- a/docs/accelerators/hpu_basic.html +++ /dev/null @@ -1,757 +0,0 @@ - - - - - - - - - - - - - - Accelerator: HPU training — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Accelerator: HPU training
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Accelerator: HPU training

-

Audience: Users looking to save money and run large models faster using single or multiple Gaudi devices.

-
-
-

What is an HPU?

-

Habana® Gaudi® AI Processor (HPU) training processors are built on a heterogeneous architecture with a cluster of fully programmable Tensor Processing Cores (TPC) along with its associated development tools and libraries, and a configurable Matrix Math engine.

-

The TPC core is a VLIW SIMD processor with an instruction set and hardware tailored to serve training workloads efficiently. -The Gaudi memory architecture includes on-die SRAM and local memories in each TPC. -Gaudi is the first DL training processor that has integrated RDMA over Converged Ethernet (RoCE v2) engines on-chip.

-

On the software side, the PyTorch Habana bridge interfaces between the framework and SynapseAI software stack to enable the execution of deep learning models on the Habana Gaudi device.

-

Gaudi offers a substantial price/performance advantage – so you get to do more deep learning training while spending less.

-

For more information, check out Gaudi Architecture and Gaudi Developer Docs.

-
-
-
-

Run on 1 Gaudi

-

To enable PyTorch Lightning to utilize the HPU accelerator, simply provide accelerator="hpu" parameter to the Trainer class.

-
trainer = Trainer(accelerator="hpu", devices=1)
-
-
-
-
-
-

Run on multiple Gaudis

-

The devices=8 and accelerator="hpu" parameters to the Trainer class enable the Habana accelerator for distributed training with 8 Gaudis. -It uses HPUParallelStrategy internally, which is based on the DDP strategy with the addition of Habana’s collective communication library (HCCL) to support scale-up within a node and scale-out across multiple nodes.

-
trainer = Trainer(devices=8, accelerator="hpu")
-
-
-
-
-
-

Select Gaudis automatically

-

Lightning can automatically detect the number of Gaudi devices to run on. This setting is enabled by default if the devices argument is missing.

-
# equivalent
-trainer = Trainer(accelerator="hpu")
-trainer = Trainer(accelerator="hpu", devices="auto")
-
-
-
-
-
-

How to access HPUs

-

To use HPUs, you must have access to a system with HPU devices.

-
-

AWS

-

You can either use Gaudi-based AWS EC2 DL1 instances or Supermicro X12 Gaudi server to get access to HPUs.

-

Check out the Get Started Guide with AWS and Habana.

-
-
-
-
-

Known limitations

-
    -
  • Multiple optimizers are not supported.

  • -
  • Habana dataloader is not supported.

  • -
  • DeviceStatsMonitor is not supported.

  • -
-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/accelerators/hpu_intermediate.html b/docs/accelerators/hpu_intermediate.html deleted file mode 100644 index 1ab7684..0000000 --- a/docs/accelerators/hpu_intermediate.html +++ /dev/null @@ -1,744 +0,0 @@ - - - - - - - - - - - - - - Accelerator: HPU training — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Accelerator: HPU training
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Accelerator: HPU training

-

Audience: Gaudi chip users looking to save memory and scale models with mixed-precision training.

-
-
-

Enable Mixed Precision

-

Lightning also allows mixed precision training with HPUs. -By default, HPU training will use 32-bit precision. To enable mixed precision, set the precision flag.

-
trainer = Trainer(devices=1, accelerator="hpu", precision=16)
-
-
-
-
-
-

Customize Mixed Precision

-

Internally, HPUPrecisionPlugin uses the Habana Mixed Precision (HMP) package to enable mixed precision training.

-

You can execute the ops in FP32 or BF16 precision. The HMP package modifies the Python operators to add the appropriate cast operations for the arguments before execution. -The default settings let users enable mixed precision training easily with minimal code.

-

In addition to the default settings in HMP, users also have the option of overriding these defaults and providing their own -BF16 and FP32 operator lists by passing them as parameters to HPUPrecisionPlugin.

-

The below snippet shows an example model using MNIST with a single Habana Gaudi device and making use of HMP by overriding the default parameters. -This enables advanced users to provide their own BF16 and FP32 operator list instead of using the HMP defaults.

-
import pytorch_lightning as pl
-from pytorch_lightning.plugins import HPUPrecisionPlugin
-
-# Initialize a trainer with HPU accelerator for HPU strategy for single device,
-# with mixed precision using overridden HMP settings
-trainer = pl.Trainer(
-    accelerator="hpu",
-    devices=1,
-    # Optional Habana mixed precision params to be set
-    # Checkout `pl_examples/hpu_examples/simple_mnist/ops_bf16_mnist.txt` for the format
-    plugins=[
-        HPUPrecisionPlugin(
-            precision=16,
-            opt_level="O1",
-            verbose=False,
-            bf16_file_path="ops_bf16_mnist.txt",
-            fp32_file_path="ops_fp32_mnist.txt",
-        )
-    ],
-)
-
-# Init our model
-model = LitClassifier()
-# Init the data
-dm = MNISTDataModule(batch_size=batch_size)
-
-# Train the model ⚡
-trainer.fit(model, datamodule=dm)
-
-
-

For more details, please refer to PyTorch Mixed Precision Training on Gaudi.

-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/accelerators/ipu.html b/docs/accelerators/ipu.html deleted file mode 100644 index e7964d4..0000000 --- a/docs/accelerators/ipu.html +++ /dev/null @@ -1,741 +0,0 @@ - - - - - - - - - - - - - - Accelerator: IPU training — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Accelerator: IPU training
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
- - -
-
- - - - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- -
- -
-
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/accelerators/ipu_advanced.html b/docs/accelerators/ipu_advanced.html deleted file mode 100644 index 6a91759..0000000 --- a/docs/accelerators/ipu_advanced.html +++ /dev/null @@ -1,811 +0,0 @@ - - - - - - - - - - - - - - Accelerator: IPU training — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Accelerator: IPU training
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Accelerator: IPU training

-

Audience: Users looking to customize IPU training for massive models.

-
-
-

Advanced IPU options

-

IPUs provide further optimizations to speed up training. By using the IPUStrategy we can set the device_iterations, which controls the number of iterations run directly on the IPU devices before returning to the host. Increasing the number of on-device iterations will improve throughput, as there is less device to host communication required.

-
-

Note

-

When using model parallelism, it is a hard requirement to increase the number of device iterations to ensure we fully saturate the devices via micro-batching. See Model parallelism for more information.

-
-
import pytorch_lightning as pl
-from pytorch_lightning.strategies import IPUStrategy
-
-model = MyLightningModule()
-trainer = pl.Trainer(accelerator="ipu", devices=8, strategy=IPUStrategy(device_iterations=32))
-trainer.fit(model)
-
-
-

Note that by default we return the last device iteration loss. You can override this by passing in your own poptorch.Options and setting the AnchorMode as described in the PopTorch documentation.

-
import poptorch
-import pytorch_lightning as pl
-from pytorch_lightning.strategies import IPUStrategy
-
-model = MyLightningModule()
-inference_opts = poptorch.Options()
-inference_opts.deviceIterations(32)
-
-training_opts = poptorch.Options()
-training_opts.anchorMode(poptorch.AnchorMode.All)
-training_opts.deviceIterations(32)
-
-trainer = Trainer(
-    accelerator="ipu", devices=8, strategy=IPUStrategy(inference_opts=inference_opts, training_opts=training_opts)
-)
-trainer.fit(model)
-
-
-

You can also override all options by passing the poptorch.Options to the plugin. See PopTorch options documentation for more information.

-
-
-
-

Model parallelism

-

Due to the IPU architecture, larger models should be parallelized across IPUs by design. Currently PopTorch provides the capabilities via annotations as described in parallel execution strategies.

-

Below is an example using the block annotation in a LightningModule.

-
-

Note

-

Currently, when using model parallelism we do not infer the number of IPUs required for you. This is done via the annotations themselves. If you specify 4 different IDs when defining Blocks, this means your model will be split onto 4 different IPUs.

-

This is also mutually exclusive with the Trainer flag. In other words, if your model is split onto 2 IPUs and you set Trainer(accelerator="ipu", devices=4) this will require 8 IPUs in total: data parallelism will be used to replicate the two-IPU model 4 times.

-

When pipelining the model, you must also increase device_iterations to ensure the devices are fully saturated with data, i.e., while one device in the model pipeline processes a batch of data, another device can start on the next batch. For example, if the model is split onto 4 IPUs, we require device_iterations to be at least 4.

-
-
import pytorch_lightning as pl
-import poptorch
-
-
-class MyLightningModule(pl.LightningModule):
-    def __init__(self):
-        super().__init__()
-        # This will place layer1, layer2+layer3, layer4, softmax on different IPUs at runtime.
-        # BeginBlock will start a new id for all layers within this block
-        self.layer1 = poptorch.BeginBlock(torch.nn.Linear(5, 10), ipu_id=0)
-
-        # This layer starts a new block,
-        # adding subsequent layers to this current block at runtime
-        # till the next block has been declared
-        self.layer2 = poptorch.BeginBlock(torch.nn.Linear(10, 5), ipu_id=1)
-        self.layer3 = torch.nn.Linear(5, 5)
-
-        # Create new blocks
-        self.layer4 = poptorch.BeginBlock(torch.nn.Linear(5, 5), ipu_id=2)
-        self.softmax = poptorch.BeginBlock(torch.nn.Softmax(dim=1), ipu_id=3)
-
-    ...
-
-
-model = MyLightningModule()
-trainer = pl.Trainer(accelerator="ipu", devices=8, strategy=IPUStrategy(device_iterations=20))
-trainer.fit(model)
-
-
-

You can also use the block context manager within the forward function, or any of the step functions.

-
import pytorch_lightning as pl
-import poptorch
-
-
-class MyLightningModule(pl.LightningModule):
-    def __init__(self):
-        super().__init__()
-        self.layer1 = torch.nn.Linear(5, 10)
-        self.layer2 = torch.nn.Linear(10, 5)
-        self.layer3 = torch.nn.Linear(5, 5)
-        self.layer4 = torch.nn.Linear(5, 5)
-
-        self.act = torch.nn.ReLU()
-        self.softmax = torch.nn.Softmax(dim=1)
-
-    def forward(self, x):
-
-        with poptorch.Block(ipu_id=0):
-            x = self.act(self.layer1(x))
-
-        with poptorch.Block(ipu_id=1):
-            x = self.act(self.layer2(x))
-
-        with poptorch.Block(ipu_id=2):
-            x = self.act(self.layer3(x))
-            x = self.act(self.layer4(x))
-
-        with poptorch.Block(ipu_id=3):
-            x = self.softmax(x)
-        return x
-
-    ...
-
-
-model = MyLightningModule()
-trainer = pl.Trainer(accelerator="ipu", devices=8, strategy=IPUStrategy(device_iterations=20))
-trainer.fit(model)
-
-
-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/accelerators/ipu_basic.html b/docs/accelerators/ipu_basic.html deleted file mode 100644 index bf22ee9..0000000 --- a/docs/accelerators/ipu_basic.html +++ /dev/null @@ -1,742 +0,0 @@ - - - - - - - - - - - - - - Accelerator: IPU training — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Accelerator: IPU training
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Accelerator: IPU training

-

Audience: Users looking to save money and run large models faster using single or multiple IPU devices.

-
-
-

What is an IPU?

-

The Graphcore Intelligence Processing Unit (IPU), built for Artificial Intelligence and Machine Learning, consists of many individual cores, called tiles, allowing highly parallel computation. Due to the high bandwidth between tiles, IPUs facilitate machine learning loads where parallelization is essential. Because computation is heavily parallelized,

-

IPUs operate in a different way to conventional accelerators such as CPU/GPUs. IPUs do not require large batch sizes for maximum parallelization, can provide optimizations across the compiled graph and rely on model parallelism to fully utilize tiles for larger models.

-

IPUs are used to build IPU-PODs, rack-based systems of IPU-Machines for larger workloads. See the IPU Architecture for more information.

-

See the Graphcore Glossary for the definitions of other IPU-specific terminology.

-
-

Note

-

IPU support is experimental and a work in progress (see Known limitations). If you run into any problems, please leave an issue.

-
-
-
-
-

Run on 1 IPU

-

To use a single IPU, set the accelerator and devices argument.

-
trainer = pl.Trainer(accelerator="ipu", devices=1)
-
-
-
-
-
-

Run on multiple IPUs

-

To use multiple IPUs, set devices to a number that is a power of 2 (e.g., 2, 4, 8, 16, …).

-
trainer = pl.Trainer(accelerator="ipu", devices=8)
-
-
-
-
-
-

How to access IPUs

-

To use IPUs you must have access to a system with IPU devices. To get access see get started.

-

You must ensure that the IPU system has enabled the PopART and Poplar packages from the SDK. Instructions are in the Get Started guide for your IPU system, on the Graphcore documents portal.

-
-
-
-

Known limitations

-

Currently, there are some known limitations that are being addressed in the near future to make the experience seamless when moving between different devices.

-

Please see the MNIST example which displays most of the limitations and how to overcome them till they are resolved.

-
    -
  • self.log is not supported in the training_step, validation_step, test_step or predict_step. This is due to the step function being traced and sent to the IPU devices. We’re actively working on fixing this

  • -
  • Multiple optimizers are not supported. training_step only supports returning one loss from the training_step function as a result

  • -
  • Since the step functions are traced, branching logic or any form of primitive values are traced into constants. Be mindful as this could lead to errors in your custom code

  • -
  • Clipping gradients is not supported

  • -
-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/accelerators/ipu_intermediate.html b/docs/accelerators/ipu_intermediate.html deleted file mode 100644 index 246fd36..0000000 --- a/docs/accelerators/ipu_intermediate.html +++ /dev/null @@ -1,739 +0,0 @@ - - - - - - - - - - - - - - Accelerator: IPU training — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Accelerator: IPU training
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Accelerator: IPU training

-

Audience: IPU users looking to increase performance via mixed precision and analysis tools.

-
-
-

Mixed precision & 16 bit precision

-

Lightning also supports training in mixed precision with IPUs. -By default, IPU training will use 32-bit precision. To enable mixed precision, -set the precision flag.

-
-

Note

-

Currently there is no dynamic scaling of the loss with mixed precision training.

-
-
import pytorch_lightning as pl
-
-model = MyLightningModule()
-trainer = pl.Trainer(accelerator="ipu", devices=8, precision=16)
-trainer.fit(model)
-
-
-

You can also use pure 16-bit training, where the weights are also in 16-bit precision.

-
import pytorch_lightning as pl
-from pytorch_lightning.strategies import IPUStrategy
-
-model = MyLightningModule()
-model = model.half()
-trainer = pl.Trainer(accelerator="ipu", devices=8, precision=16)
-trainer.fit(model)
-
-
-
-
-
-

PopVision Graph Analyser

-
-PopVision Graph Analyser -
-

Lightning supports integration with the PopVision Graph Analyser Tool. This helps to look at utilization of IPU devices and provides helpful metrics during the lifecycle of your trainer. Once you have gained access, the PopVision Graph Analyser Tool can be downloaded via the GraphCore download website.

-

Lightning supports dumping all reports to a directory to open using the tool.

-
import pytorch_lightning as pl
-from pytorch_lightning.strategies import IPUStrategy
-
-model = MyLightningModule()
-trainer = pl.Trainer(accelerator="ipu", devices=8, strategy=IPUStrategy(autoreport_dir="report_dir/"))
-trainer.fit(model)
-
-
-

This will dump all reports to report_dir/ which can then be opened using the Graph Analyser Tool, see Opening Reports.

-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/accelerators/tpu.html b/docs/accelerators/tpu.html deleted file mode 100644 index 7bed7d0..0000000 --- a/docs/accelerators/tpu.html +++ /dev/null @@ -1,751 +0,0 @@ - - - - - - - - - - - - - - Accelerator: TPU training — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Accelerator: TPU training
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
- - -
-
- - - - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- -
- -
-
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/accelerators/tpu_advanced.html b/docs/accelerators/tpu_advanced.html deleted file mode 100644 index c24e042..0000000 --- a/docs/accelerators/tpu_advanced.html +++ /dev/null @@ -1,748 +0,0 @@ - - - - - - - - - - - - - - TPU training (Advanced) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • TPU training (Advanced)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

TPU training (Advanced)

-

Audience: Users looking to apply advanced performance techniques to TPU training.

-
-
-

Weight Sharing/Tying

-

Weight Tying/Sharing is a technique wherein the module weights are shared among two or more layers. -This is a common method to reduce memory consumption and is utilized in many state-of-the-art -architectures today.

-

PyTorch XLA requires these weights to be tied/shared after moving the model -to the TPU device. To support this requirement, Lightning provides a model hook which is -called after the model is moved to the device. Any weights that need to be tied should -be tied in the on_post_move_to_device model hook. This will ensure that the weights -among the modules are shared and not copied.

-

PyTorch Lightning has an inbuilt check which verifies that the model parameter lengths -match once the model is moved to the device. If the lengths do not match Lightning -throws a warning message.

-

Example:

-
from pytorch_lightning.core.lightning import LightningModule
-from torch import nn
-from pytorch_lightning.trainer.trainer import Trainer
-
-
-class WeightSharingModule(LightningModule):
-    def __init__(self):
-        super().__init__()
-        self.layer_1 = nn.Linear(32, 10, bias=False)
-        self.layer_2 = nn.Linear(10, 32, bias=False)
-        self.layer_3 = nn.Linear(32, 10, bias=False)
-        # TPU shared weights are copied independently
-        # on the XLA device and this line won't have any effect.
-        # However, it works fine for CPU and GPU.
-        self.layer_3.weight = self.layer_1.weight
-
-    def forward(self, x):
-        x = self.layer_1(x)
-        x = self.layer_2(x)
-        x = self.layer_3(x)
-        return x
-
-    def on_post_move_to_device(self):
-        # Weights shared after the model has been moved to TPU Device
-        self.layer_3.weight = self.layer_1.weight
-
-
-model = WeightSharingModule()
-trainer = Trainer(max_epochs=1, accelerator="tpu", devices=8)
-
-
-

See XLA Documentation

-
-
-
-

XLA

-

XLA is the library that interfaces PyTorch with the TPUs. -For more information check out XLA.

-

Guide for troubleshooting XLA

-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/accelerators/tpu_basic.html b/docs/accelerators/tpu_basic.html deleted file mode 100644 index 1acb332..0000000 --- a/docs/accelerators/tpu_basic.html +++ /dev/null @@ -1,896 +0,0 @@ - - - - - - - - - - - - - - TPU training (Basic) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • TPU training (Basic)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

TPU training (Basic)

-

Audience: Users looking to train on single or multiple TPU cores.

-
-
-

-
-

Lightning supports running on TPUs. At this moment, TPUs are available -on Google Cloud (GCP), Google Colab and Kaggle Environments. For more information on TPUs -watch this video.

-
-
-

What is a TPU?

-

Tensor Processing Unit (TPU) is an AI accelerator application-specific integrated circuit (ASIC) developed by Google specifically for neural networks.

-

A TPU has 8 cores where each core is optimized for 128x128 matrix multiplies. In general, a single TPU is about as fast as 5 V100 GPUs!

-

A TPU pod hosts many TPUs on it. Currently, TPU v3 Pod has up to 2048 TPU cores and 32 TiB of memory! -You can request a full pod from Google cloud or a “slice” which gives you -some subset of those 2048 cores.

-
-
-
-

Run on 1 TPU core

-

Enable the following Trainer arguments to run on 1 TPU.

-
trainer = Trainer(accelerator="tpu", devices=1)
-
-
-
-
-
-

Run on multiple TPU cores

-

For multiple TPU cores, change the value of the devices flag.

-
trainer = Trainer(accelerator="tpu", devices=8)
-
-
-
-
-
-

Run on a specific TPU core

-

To run on a specific core, specify the index of the TPU core.

-
trainer = pl.Trainer(accelerator="tpu", devices=[5])
-
-
-

This example runs on the 5th core, not on five cores.

-
-
-
-

How to access TPUs

-

To access TPUs, there are three main ways.

-
-

Google Colab

-

Colab is like a jupyter notebook with a free GPU or TPU -hosted on GCP.

-

To get a TPU on colab, follow these steps:

-
    -
  1. Go to https://colab.research.google.com/.

  2. -
  3. Click “new notebook” (bottom right of pop-up).

  4. -
  5. Click runtime > change runtime settings. Select Python 3, and hardware accelerator “TPU”. -This will give you a TPU with 8 cores.

  6. -
  7. Next, insert this code into the first cell and execute. -This will install the xla library that interfaces between PyTorch and the TPU.

    -
    !pip install cloud-tpu-client==0.10 https://storage.googleapis.com/tpu-pytorch/wheels/torch_xla-1.9-cp37-cp37m-linux_x86_64.whl
    -
    -
    -
  8. -
  9. Once the above is done, install PyTorch Lightning.

    -
    !pip install pytorch-lightning
    -
    -
    -
  10. -
  11. Then set up your LightningModule as normal.

  12. -
-
-
-

Google Cloud (GCP)

-

?

-
-
-

Kaggle

-

For starting Kaggle projects with TPUs, refer to this kernel.

-
-
-
-
-

Optimize Performance

-

The TPU was designed for specific workloads and operations to carry out large volumes of matrix multiplication, -convolution operations and other commonly used ops in applied deep learning. -The specialization makes it a strong choice for NLP tasks, sequential convolutional networks, and under low precision operation. -There are cases in which training on TPUs is slower when compared with GPUs, for possible reasons listed:

-
    -
  • Too small batch size.

  • -
  • Explicit evaluation of tensors during training, e.g. tensor.item()

  • -
  • Tensor shapes (e.g. model inputs) change often during training.

  • -
  • Limited resources when using TPUs with PyTorch Link

  • -
  • XLA Graph compilation during the initial steps Reference

  • -
  • Some tensor ops are not fully supported on TPU, or not supported at all. These operations will be performed on CPU (context switch).

  • -
  • PyTorch integration is still experimental. Some performance bottlenecks may simply be the result of unfinished implementation.

  • -
-

The official PyTorch XLA performance guide -has more detailed information on how PyTorch code can be optimized for TPU. In particular, the -metrics report allows -one to identify operations that lead to context switching.

-
-
-
-

FAQ

-

XLA configuration is missing

-
File "/usr/local/lib/python3.8/dist-packages/torch_xla/core/xla_model.py", line 18, in <lambda>
-    _DEVICES = xu.LazyProperty(lambda: torch_xla._XLAC._xla_get_devices())
-RuntimeError: tensorflow/compiler/xla/xla_client/computation_client.cc:273 : Missing XLA configuration
-Traceback (most recent call last):
-...
-File "/home/kaushikbokka/pytorch-lightning/pytorch_lightning/utilities/device_parser.py", line 125, in parse_tpu_cores
-    raise MisconfigurationException('No TPU devices were found.')
-pytorch_lightning.utilities.exceptions.MisconfigurationException: No TPU devices were found.
-
-
-

This means the system is missing XLA configuration. You would need to set up XRT TPU device configuration.

-

For TPUVM architecture, you could set it in your terminal by:

-
export XRT_TPU_CONFIG="localservice;0;localhost:51011"
-
-
-

And for the old TPU + 2VM architecture, you could set it by:

-
export TPU_IP_ADDRESS=10.39.209.42  # You could get the IP Address in the GCP TPUs section
-export XRT_TPU_CONFIG="tpu_worker;0;$TPU_IP_ADDRESS:8470"
-
-
-
-

How to clear up the programs using TPUs in the background

-
lsof -w /lib/libtpu.so | grep "python" |  awk '{print $2}' | xargs -r kill -9
-
-
-

Sometimes, there can still be old programs running on the TPUs, which would make the TPUs unavailable to use. You could use the above command in the terminal to kill the running processes.

-
-

Replication issue

-
File "/usr/local/lib/python3.6/dist-packages/torch_xla/core/xla_model.py", line 200, in set_replication
-    replication_devices = xla_replication_devices(devices)
-File "/usr/local/lib/python3.6/dist-packages/torch_xla/core/xla_model.py", line 187, in xla_replication_devices
-    .format(len(local_devices), len(kind_devices)))
-RuntimeError: Cannot replicate if number of devices (1) is different from 8
-
-
-

This error is raised when the XLA device is called outside the spawn process. Internally in TPUSpawn Strategy for training on multiple tpu cores, we use XLA’s xmp.spawn. -Don’t use xm.xla_device() while working on Lightning + TPUs!

-
-

Unsupported datatype transfer to TPU

-
File "/usr/local/lib/python3.8/dist-packages/torch_xla/utils/utils.py", line 205, in _for_each_instance_rewrite
-    v = _for_each_instance_rewrite(result.__dict__[k], select_fn, fn, rwmap)
-File "/usr/local/lib/python3.8/dist-packages/torch_xla/utils/utils.py", line 206, in _for_each_instance_rewrite
-    result.__dict__[k] = v
-TypeError: 'mappingproxy' object does not support item assignment
-
-
-

PyTorch XLA only supports Tensor objects for CPU to TPU data transfer. This might cause issues if the user tries to send non-tensor objects through the DataLoader or when saving states.

-
-

Using `tpu_spawn_debug` Strategy alias

-
import pytorch_lightning as pl
-
-my_model = MyLightningModule()
-trainer = pl.Trainer(accelerator="tpu", devices=8, strategy="tpu_spawn_debug")
-trainer.fit(my_model)
-
-
-

Example Metrics report:

-
Metric: CompileTime
-    TotalSamples: 202
-    Counter: 06m09s401ms746.001us
-    ValueRate: 778ms572.062us / second
-    Rate: 0.425201 / second
-    Percentiles: 1%=001ms32.778us; 5%=001ms61.283us; 10%=001ms79.236us; 20%=001ms110.973us; 50%=001ms228.773us; 80%=001ms339.183us; 90%=001ms434.305us; 95%=002ms921.063us; 99%=21s102ms853.173us
-
-
-

A lot of PyTorch operations aren’t lowered to XLA, which could lead to significant slowdown of the training process. -These operations are moved to the CPU memory and evaluated, and then the results are transferred back to the XLA device(s). -By using the tpu_spawn_debug Strategy, users could create a metrics report to diagnose issues.

-

The report includes things like (XLA Reference):

-
    -
  • how many times we issue XLA compilations and time spent on issuing.

  • -
  • how many times we execute and time spent on execution

  • -
  • how many device data handles we create/destroy etc.

  • -
-
-

TPU Pod Training Startup script

-

All TPU VMs in a Pod setup are required to access the model code and data. -One easy way to achieve this is to use the following startup script when creating the TPU VM pod. -It will perform the data downloading on all TPU VMs. Note that you need to export the corresponding environment variables following the instruction in Create TPU Node.

-
gcloud alpha compute tpus tpu-vm create ${TPU_NAME} --zone ${ZONE} --project ${PROJECT_ID} --accelerator-type v3-32 --version ${RUNTIME_VERSION} --metadata startup-script=setup.py
-
-
-

Then users could ssh to any TPU worker, e.g. worker 0, check if data/model downloading is finished and -start the training after generating the ssh-keys to ssh between VM workers on a pod:

-
python3 -m torch_xla.distributed.xla_dist --tpu=$TPU_NAME -- python3 train.py --max_epochs=5 --batch_size=32
-
-
-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/accelerators/tpu_faq.html b/docs/accelerators/tpu_faq.html deleted file mode 100644 index b65e83b..0000000 --- a/docs/accelerators/tpu_faq.html +++ /dev/null @@ -1,896 +0,0 @@ - - - - - - - - - - - - - - TPU training (Basic) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • TPU training (Basic)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

TPU training (Basic)

-

Audience: Users looking to train on single or multiple TPU cores.

-
-
-

-
-

Lightning supports running on TPUs. At this moment, TPUs are available -on Google Cloud (GCP), Google Colab and Kaggle Environments. For more information on TPUs -watch this video.

-
-
-

What is a TPU?

-

Tensor Processing Unit (TPU) is an AI accelerator application-specific integrated circuit (ASIC) developed by Google specifically for neural networks.

-

A TPU has 8 cores where each core is optimized for 128x128 matrix multiplies. In general, a single TPU is about as fast as 5 V100 GPUs!

-

A TPU pod hosts many TPUs on it. Currently, TPU v3 Pod has up to 2048 TPU cores and 32 TiB of memory! -You can request a full pod from Google cloud or a “slice” which gives you -some subset of those 2048 cores.

-
-
-
-

Run on 1 TPU core

-

Enable the following Trainer arguments to run on 1 TPU.

-
trainer = Trainer(accelerator="tpu", devices=1)
-
-
-
-
-
-

Run on multiple TPU cores

-

For multiple TPU cores, change the value of the devices flag.

-
trainer = Trainer(accelerator="tpu", devices=8)
-
-
-
-
-
-

Run on a specific TPU core

-

To run on a specific core, specify the index of the TPU core.

-
trainer = pl.Trainer(accelerator="tpu", devices=[5])
-
-
-

This example runs on the 5th core, not on five cores.

-
-
-
-

How to access TPUs

-

To access TPUs, there are three main ways.

-
-

Google Colab

-

Colab is like a Jupyter notebook with a free GPU or TPU -hosted on GCP.

-

To get a TPU on colab, follow these steps:

-
    -
  1. Go to https://colab.research.google.com/.

  2. -
  3. Click “new notebook” (bottom right of pop-up).

  4. -
  5. Click runtime > change runtime settings. Select Python 3, and hardware accelerator “TPU”. -This will give you a TPU with 8 cores.

  6. -
  7. Next, insert this code into the first cell and execute. -This will install the xla library that interfaces between PyTorch and the TPU.

    -
    !pip install cloud-tpu-client==0.10 https://storage.googleapis.com/tpu-pytorch/wheels/torch_xla-1.9-cp37-cp37m-linux_x86_64.whl
    -
    -
    -
  8. -
  9. Once the above is done, install PyTorch Lightning.

    -
    !pip install pytorch-lightning
    -
    -
    -
  10. -
  11. Then set up your LightningModule as normal.

  12. -
-
-
-

Google Cloud (GCP)

-

?

-
-
-

Kaggle

-

For starting Kaggle projects with TPUs, refer to this kernel.

-
-
-
-
-

Optimize Performance

-

The TPU was designed for specific workloads and operations to carry out large volumes of matrix multiplication, -convolution operations and other commonly used ops in applied deep learning. -The specialization makes it a strong choice for NLP tasks, sequential convolutional networks, and under low precision operation. -There are cases in which training on TPUs is slower when compared with GPUs, for possible reasons listed:

-
    -
  • Too small batch size.

  • -
  • Explicit evaluation of tensors during training, e.g. tensor.item()

  • -
  • Tensor shapes (e.g. model inputs) change often during training.

  • -
  • Limited resources when using TPUs with PyTorch Link

  • -
  • XLA Graph compilation during the initial steps Reference

  • -
  • Some tensor ops are not fully supported on TPU, or not supported at all. These operations will be performed on CPU (context switch).

  • -
  • PyTorch integration is still experimental. Some performance bottlenecks may simply be the result of unfinished implementation.

  • -
-

The official PyTorch XLA performance guide -has more detailed information on how PyTorch code can be optimized for TPU. In particular, the -metrics report allows -one to identify operations that lead to context switching.

-
-
-
-

FAQ

-

XLA configuration is missing

-
File "/usr/local/lib/python3.8/dist-packages/torch_xla/core/xla_model.py", line 18, in <lambda>
-    _DEVICES = xu.LazyProperty(lambda: torch_xla._XLAC._xla_get_devices())
-RuntimeError: tensorflow/compiler/xla/xla_client/computation_client.cc:273 : Missing XLA configuration
-Traceback (most recent call last):
-...
-File "/home/kaushikbokka/pytorch-lightning/pytorch_lightning/utilities/device_parser.py", line 125, in parse_tpu_cores
-    raise MisconfigurationException('No TPU devices were found.')
-pytorch_lightning.utilities.exceptions.MisconfigurationException: No TPU devices were found.
-
-
-

This means the system is missing XLA configuration. You would need to set up XRT TPU device configuration.

-

For TPUVM architecture, you could set it in your terminal by:

-
export XRT_TPU_CONFIG="localservice;0;localhost:51011"
-
-
-

And for the old TPU + 2VM architecture, you could set it by:

-
export TPU_IP_ADDRESS=10.39.209.42  # You could get the IP Address in the GCP TPUs section
-export XRT_TPU_CONFIG="tpu_worker;0;$TPU_IP_ADDRESS:8470"
-
-
-
-

How to clear up the programs using TPUs in the background

-
lsof -w /lib/libtpu.so | grep "python" |  awk '{print $2}' | xargs -r kill -9
-
-
-

Sometimes, there can still be old programs running on the TPUs, which would make the TPUs unavailable to use. You could use the above command in the terminal to kill the running processes.

-
-

Replication issue

-
File "/usr/local/lib/python3.6/dist-packages/torch_xla/core/xla_model.py", line 200, in set_replication
-    replication_devices = xla_replication_devices(devices)
-File "/usr/local/lib/python3.6/dist-packages/torch_xla/core/xla_model.py", line 187, in xla_replication_devices
-    .format(len(local_devices), len(kind_devices)))
-RuntimeError: Cannot replicate if number of devices (1) is different from 8
-
-
-

This error is raised when the XLA device is called outside the spawn process. Internally in TPUSpawn Strategy for training on multiple tpu cores, we use XLA’s xmp.spawn. -Don’t use xm.xla_device() while working on Lightning + TPUs!

-
-

Unsupported datatype transfer to TPU

-
File "/usr/local/lib/python3.8/dist-packages/torch_xla/utils/utils.py", line 205, in _for_each_instance_rewrite
-    v = _for_each_instance_rewrite(result.__dict__[k], select_fn, fn, rwmap)
-File "/usr/local/lib/python3.8/dist-packages/torch_xla/utils/utils.py", line 206, in _for_each_instance_rewrite
-    result.__dict__[k] = v
-TypeError: 'mappingproxy' object does not support item assignment
-
-
-

PyTorch XLA only supports Tensor objects for CPU to TPU data transfer. This might cause issues if the user tries to send non-tensor objects through the DataLoader or when saving states.

-
-

Using `tpu_spawn_debug` Strategy alias

-
import pytorch_lightning as pl
-
-my_model = MyLightningModule()
-trainer = pl.Trainer(accelerator="tpu", devices=8, strategy="tpu_spawn_debug")
-trainer.fit(my_model)
-
-
-

Example Metrics report:

-
Metric: CompileTime
-    TotalSamples: 202
-    Counter: 06m09s401ms746.001us
-    ValueRate: 778ms572.062us / second
-    Rate: 0.425201 / second
-    Percentiles: 1%=001ms32.778us; 5%=001ms61.283us; 10%=001ms79.236us; 20%=001ms110.973us; 50%=001ms228.773us; 80%=001ms339.183us; 90%=001ms434.305us; 95%=002ms921.063us; 99%=21s102ms853.173us
-
-
-

A lot of PyTorch operations aren’t lowered to XLA, which could lead to significant slowdown of the training process. -These operations are moved to the CPU memory and evaluated, and then the results are transferred back to the XLA device(s). -By using the tpu_spawn_debug Strategy, users could create a metrics report to diagnose issues.

-

The report includes things like (XLA Reference):

-
    -
  • how many times we issue XLA compilations and time spent on issuing.

  • -
  • how many times we execute and time spent on execution

  • -
  • how many device data handles we create/destroy etc.

  • -
-
-

TPU Pod Training Startup script

-

All TPU VMs in a Pod setup are required to access the model code and data. -One easy way to achieve this is to use the following startup script when creating the TPU VM pod. -It will perform the data downloading on all TPU VMs. Note that you need to export the corresponding environment variables following the instruction in Create TPU Node.

-
gcloud alpha compute tpus tpu-vm create ${TPU_NAME} --zone ${ZONE} --project ${PROJECT_ID} --accelerator-type v3-32 --version ${RUNTIME_VERSION} --metadata startup-script=setup.py
-
-
-

Then users could ssh to any TPU worker, e.g. worker 0, check if data/model downloading is finished and -start the training after generating the ssh-keys to ssh between VM workers on a pod:

-
python3 -m torch_xla.distributed.xla_dist --tpu=$TPU_NAME -- python3 train.py --max_epochs=5 --batch_size=32
-
-
-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/accelerators/tpu_intermediate.html b/docs/accelerators/tpu_intermediate.html deleted file mode 100644 index 3e76dda..0000000 --- a/docs/accelerators/tpu_intermediate.html +++ /dev/null @@ -1,788 +0,0 @@ - - - - - - - - - - - - - - TPU training (Intermediate) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • TPU training (Intermediate)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

TPU training (Intermediate)

-

Audience: Users looking to use cloud TPUs.

-
-
-

DistributedSamplers

-

Lightning automatically inserts the correct samplers - no need to do this yourself!

-

Usually, with TPUs (and DDP), you would need to define a DistributedSampler to move the right -chunk of data to the appropriate TPU. As mentioned, this is not needed in Lightning

-
-

Note

-

Don’t add distributedSamplers. Lightning does this automatically

-
-

If for some reason you still need to, this is how to construct the sampler -for TPU use

-
import torch_xla.core.xla_model as xm
-
-
-def train_dataloader(self):
-    dataset = MNIST(os.getcwd(), train=True, download=True, transform=transforms.ToTensor())
-
-    # required for TPU support
-    sampler = None
-    if use_tpu:
-        sampler = torch.utils.data.distributed.DistributedSampler(
-            dataset, num_replicas=xm.xrt_world_size(), rank=xm.get_ordinal(), shuffle=True
-        )
-
-    loader = DataLoader(dataset, sampler=sampler, batch_size=32)
-
-    return loader
-
-
-

Configure the number of TPU cores in the trainer. You can only choose 1 or 8. -To use a full TPU pod skip to the TPU pod section.

-
import pytorch_lightning as pl
-
-my_model = MyLightningModule()
-trainer = pl.Trainer(accelerator="tpu", devices=8)
-trainer.fit(my_model)
-
-
-

That’s it! Your model will train on all 8 TPU cores.

-
-
-
-

Distributed Backend with TPU

-

The accelerator option used for GPUs does not apply to TPUs. -TPUs work in DDP mode by default (distributing over each core)

-
-
-
-

TPU VM

-

Lightning supports training on the new Cloud TPU VMs. -Previously, we needed separate VMs to connect to the TPU machines, but as -Cloud TPU VMs run on the TPU Host machines, it allows direct SSH access -for the users. Hence, this architecture upgrade leads to cheaper and significantly -better performance and usability while working with TPUs.

-

The TPUVMs come pre-installed with latest versions of PyTorch and PyTorch XLA. -After connecting to the VM and before running your Lightning code, you would need -to set the XRT TPU device configuration.

-
$ export XRT_TPU_CONFIG="localservice;0;localhost:51011"
-
-
-

You could learn more about the Cloud TPU VM architecture here

-
-
-
-

TPU Pod

-

To train on more than 8 cores, your code actually doesn’t change! -All you need to do is submit the following command:

-
$ python -m torch_xla.distributed.xla_dist
---tpu=$TPU_POD_NAME
---conda-env=torch-xla-nightly
--- python /usr/share/torch-xla-1.8.1/pytorch/xla/test/test_train_imagenet.py --fake_data
-
-
-

See this guide -on how to set up the instance groups and VMs needed to run TPU Pods.

-
-
-
-

16 bit precision

-

Lightning also supports training in 16-bit precision with TPUs. -By default, TPU training will use 32-bit precision. To enable 16-bit, -set the 16-bit flag.

-
import pytorch_lightning as pl
-
-my_model = MyLightningModule()
-trainer = pl.Trainer(accelerator="tpu", devices=8, precision=16)
-trainer.fit(my_model)
-
-
-

Under the hood the xla library will use the bfloat16 type.

-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/advanced/model_parallel.html b/docs/advanced/model_parallel.html deleted file mode 100644 index 4d9d962..0000000 --- a/docs/advanced/model_parallel.html +++ /dev/null @@ -1,1477 +0,0 @@ - - - - - - - - - - - - - - Train 1 trillion+ parameter models — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Train 1 trillion+ parameter models
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Train 1 trillion+ parameter models

-

When training large models, fitting larger batch sizes, or trying to increase throughput using multi-GPU compute, Lightning provides advanced optimized distributed training strategies to support these cases and offer substantial improvements in memory usage.

-

In many cases these strategies are some flavour of model parallelism; however, we only introduce concepts at a high level to get you started. Refer to the FairScale documentation for more information about model parallelism.

-

Note that some of the extreme memory saving configurations will affect the speed of training. This Speed/Memory trade-off in most cases can be adjusted.

-

Some of these memory-efficient strategies rely on offloading onto other forms of memory, such as CPU RAM or NVMe. This means you can even see memory benefits on a single GPU, using a strategy such as DeepSpeed ZeRO Stage 3 Offload.

-

Check out this amazing video explaining model parallelism and how it works behind the scenes:

-
-

Choosing an Advanced Distributed GPU Strategy

-

If you would like to stick with PyTorch DDP, see DDP Optimizations.

-

Unlike DistributedDataParallel (DDP) where the maximum trainable model size and batch size do not change with respect to the number of GPUs, memory-optimized strategies can accommodate bigger models and larger batches as more GPUs are used. This means as you scale up the number of GPUs, you can reach the number of model parameters you’d like to train.

-

There are many considerations when choosing a strategy as described below. In addition, check out the visualization of various strategy benchmarks using minGPT here.

-
-

Pre-training vs Fine-tuning

-

When fine-tuning, we often use an order of magnitude less data compared to pre-training a model. This is important when choosing a distributed strategy as usually for pre-training, we are compute-bound. -This means we cannot sacrifice throughput as much as if we were fine-tuning, because in fine-tuning the data requirement is smaller.

-

Overall:

- -

For example when using 128 GPUs, you can pre-train large 10 to 20 Billion parameter models using DeepSpeed ZeRO Stage 2 without having to take a performance hit with more advanced optimized multi-gpu strategy.

-

But for fine-tuning a model, you can reach 10 to 20 Billion parameter models using DeepSpeed ZeRO Stage 3 Offload on a single GPU. This does come with a significant throughput hit, which needs to be weighed accordingly.

-
-
-

When Shouldn’t I use an Optimized Distributed Strategy?

-

Sharding techniques help when model sizes are fairly large; roughly 500M+ parameters is where we’ve seen benefits. However, in the following cases, we recommend sticking to ordinary distributed strategies: -* When your model is small (ResNet50 of around 80M Parameters), unless you are using unusually large batch sizes or inputs. -* Due to high distributed communication between devices, if running on a slow network/interconnect, the training might be much slower than expected and then it’s up to you to determine the tradeoff here.

-
-
-
-
-

Sharded Training

-

Lightning integration of optimizer sharded training provided by FairScale. -The technique can be found within DeepSpeed ZeRO and -ZeRO-2, -however the implementation is built from the ground up to be PyTorch compatible and standalone. -Sharded Training allows you to maintain GPU scaling efficiency, whilst reducing memory overhead drastically. In short, expect near-normal linear scaling (if your network allows), and significantly reduced memory usage when training large models.

-

Sharded Training still utilizes Data Parallel Training under the hood, except optimizer states and gradients are sharded across GPUs. -This means the memory overhead per GPU is lower, as each GPU only has to maintain a partition of your optimizer state and gradients.

-

The benefits vary by model and parameter sizes, but we’ve recorded up to a 63% memory reduction per GPU allowing us to double our model sizes. Because of efficient communication, -these benefits in multi-GPU setups are almost free and throughput scales well with multi-node setups.

-

It is highly recommended to use Sharded Training in multi-GPU environments where memory is limited, or where training larger models is beneficial (500M+ parameter models). -A technical note: as batch size scales, storing activations for the backwards pass becomes the bottleneck in training. As a result, sharding optimizer state and gradients becomes less impactful. -Use FairScale Activation Checkpointing to see even more benefit at the cost of some throughput.

-

To use Sharded Training, you need to first install FairScale using the command below.

-
pip install fairscale
-
-
-
# train using Sharded DDP
-trainer = Trainer(strategy="ddp_sharded")
-
-
-

Sharded Training can work across all DDP variants by adding the additional --strategy ddp_sharded flag via command line using a PyTorch Lightning script.

-

Internally we re-initialize your optimizers and shard them across your machines and processes. We handle all communication using PyTorch distributed, so no code changes are required.

-
-
-
-

Fully Sharded Training

-
-

Warning

-

Fully Sharded Training is in beta and the API is subject to change. Please create an issue if you run into any issues.

-
-

Fully Sharded shards optimizer state, gradients and parameters across data parallel workers. This allows you to fit much larger models onto multiple GPUs into memory.

-

Fully Sharded Training alleviates the need to worry about balancing layers onto specific devices using some form of pipe parallelism, and optimizes for distributed communication with minimal effort.

-
-

Shard Parameters to Reach 10+ Billion Parameters

-

To reach larger parameter sizes and be memory efficient, we have to shard parameters. There are various ways to enable this.

-
-

Note

-

Currently Fully Sharded Training relies on the user to wrap the model with Fully Sharded within the LightningModule. -This means you must create a single model that is treated as a torch.nn.Module within the LightningModule. -This is a limitation of Fully Sharded Training that will be resolved in the future.

-
-
-
-

Enabling Module Sharding for Maximum Memory Efficiency

-

To activate parameter sharding, you must wrap your model using provided wrap or auto_wrap functions as described below. Internally in Lightning, we enable a context manager around the configure_sharded_model function to make sure the wrap and auto_wrap parameters are passed correctly.

-

When not using Fully Sharded these wrap functions are a no-op. This means once the changes have been made, there is no need to remove the changes for other strategies.

-

auto_wrap will recursively wrap Module within the LightningModule with nested Fully Sharded Wrappers, -signalling that we’d like to partition these modules across data parallel devices, discarding the full weights when not required (information here).

-

auto_wrap can have varying level of success based on the complexity of your model. Auto Wrap does not support models with shared parameters.

-

wrap will simply wrap the module with a Fully Sharded Parallel class with the correct parameters from the Lightning context manager.

-

Below is an example of using both wrap and auto_wrap to create your model.

-
import torch
-import torch.nn as nn
-import pytorch_lightning as pl
-from pytorch_lightning import Trainer
-from fairscale.nn import checkpoint_wrapper, auto_wrap, wrap
-
-
-class MyModel(pl.LightningModule):
-    def __init__(self):
-        super().__init__()
-        self.linear_layer = nn.Linear(32, 32)
-        self.block = nn.Sequential(nn.Linear(32, 32), nn.ReLU())
-        self.final_block = nn.Sequential(nn.Linear(32, 32), nn.ReLU())
-
-    def configure_sharded_model(self):
-        # modules are sharded across processes
-        # as soon as they are wrapped with ``wrap`` or ``auto_wrap``.
-        # During the forward/backward passes, weights get synced across processes
-        # and de-allocated once computation is complete, saving memory.
-
-        # Wraps the layer in a Fully Sharded Wrapper automatically
-        linear_layer = wrap(self.linear_layer)
-
-        # Wraps the module recursively
-        # based on a minimum number of parameters (default 100M parameters)
-        block = auto_wrap(self.block)
-
-        # For best memory efficiency,
-        # add FairScale activation checkpointing
-        final_block = auto_wrap(checkpoint_wrapper(self.final_block))
-        self.model = nn.Sequential(linear_layer, nn.ReLU(), block, final_block)
-
-    def configure_optimizers(self):
-        return torch.optim.AdamW(self.model.parameters())
-
-
-model = MyModel()
-trainer = Trainer(accelerator="gpu", devices=4, strategy="fsdp", precision=16)
-trainer.fit(model)
-
-trainer.test()
-trainer.predict()
-
-
-
-
-
-
-

FairScale Activation Checkpointing

-

Activation checkpointing frees activations from memory as soon as they are not needed during the forward pass. They are then re-computed for the backwards pass as needed. Activation checkpointing is very useful when you have intermediate layers that produce large activations.

-

FairScale’s checkpointing wrapper also handles batch norm layers correctly, unlike the PyTorch implementation, ensuring stats are tracked correctly due to the multiple forward passes.

-

This saves memory when training larger models; however, it requires wrapping the modules you’d like to use activation checkpointing on. See here for more information.

-
-

Warning

-

Do not wrap the entire model with activation checkpointing. This is not the intended usage of activation checkpointing, and will lead to failures as seen in this discussion.

-
-
from pytorch_lightning import Trainer
-from fairscale.nn import checkpoint_wrapper
-
-
-class MyModel(pl.LightningModule):
-    def __init__(self):
-        super().__init__()
-        # Wrap layers using checkpoint_wrapper
-        self.block_1 = checkpoint_wrapper(nn.Sequential(nn.Linear(32, 32), nn.ReLU()))
-        self.block_2 = nn.Linear(32, 2)
-
-
-
-
-

DeepSpeed

-
-

Note

-

The DeepSpeed strategy is in beta and the API is subject to change. Please create an issue if you run into any issues.

-
-

DeepSpeed is a deep learning training optimization library, providing the means to train massive billion parameter models at scale. -Using the DeepSpeed strategy, we were able to train model sizes of 10 Billion parameters and above, with a lot of useful information in this benchmark and the DeepSpeed docs. -DeepSpeed also offers lower level training optimizations, and efficient optimizers such as 1-bit Adam. We recommend using DeepSpeed in environments where speed and memory optimizations are important (such as training large billion parameter models).

-

Below is a summary of all the configurations of DeepSpeed.

-
    -
  • DeepSpeed ZeRO Stage 1 - Shard optimizer states, remains at speed parity with DDP whilst providing memory improvement

  • -
  • DeepSpeed ZeRO Stage 2 - Shard optimizer states and gradients, remains at speed parity with DDP whilst providing even more memory improvement

  • -
  • DeepSpeed ZeRO Stage 2 Offload - Offload optimizer states and gradients to CPU. Increases distributed communication volume and GPU-CPU device transfer, but provides significant memory improvement

  • -
  • DeepSpeed ZeRO Stage 3 - Shard optimizer states, gradients, parameters and optionally activations. Increases distributed communication volume, but provides even more memory improvement

  • -
  • DeepSpeed ZeRO Stage 3 Offload - Offload optimizer states, gradients, parameters and optionally activations to CPU. Increases distributed communication volume and GPU-CPU device transfer, but even more significant memory improvement.

  • -
  • DeepSpeed Activation Checkpointing - Free activations after forward pass. Increases computation, but provides memory improvement for all stages.

  • -
-

To use DeepSpeed, you first need to install DeepSpeed using the commands below.

-
pip install deepspeed
-
-
-

If you run into an issue with the install or later in training, ensure that the CUDA version of the PyTorch you’ve installed matches your locally installed CUDA (you can see which one has been recognized by running nvcc --version).

-
-

Note

-

DeepSpeed currently only supports single optimizer, single scheduler within the training loop.

-

When saving a checkpoint we rely on DeepSpeed which saves a directory containing the model and various components.

-
-
-

DeepSpeed ZeRO Stage 1

-

DeepSpeed ZeRO Stage 1 partitions your optimizer states (Stage 1) across your GPUs to reduce memory.

-

It is recommended to skip Stage 1 and use Stage 2, which comes with larger memory improvements and still remains efficient. Stage 1 is useful to pair with certain optimizations such as Torch ORT.

-
from pytorch_lightning import Trainer
-
-model = MyModel()
-trainer = Trainer(accelerator="gpu", devices=4, strategy="deepspeed_stage_1", precision=16)
-trainer.fit(model)
-
-
-
-
-

DeepSpeed ZeRO Stage 2

-

DeepSpeed ZeRO Stage 2 partitions your optimizer states (Stage 1) and your gradients (Stage 2) across your GPUs to reduce memory. In most cases, this is more efficient or at parity with DDP, primarily due to the optimized custom communications written by the DeepSpeed team. -As a result, benefits can also be seen on a single GPU. Do note that the default bucket sizes allocate around 3.6GB of VRAM to use during distributed communications, which can be tweaked when instantiating the strategy described in a few sections below.

-
from pytorch_lightning import Trainer
-
-model = MyModel()
-trainer = Trainer(accelerator="gpu", devices=4, strategy="deepspeed_stage_2", precision=16)
-trainer.fit(model)
-
-
-
python train.py --strategy deepspeed_stage_2 --precision 16 --accelerator 'gpu' --devices 4
-
-
-
-
-

DeepSpeed ZeRO Stage 2 Offload

-

Below we show an example of running ZeRO-Offload. ZeRO-Offload leverages the host CPU to offload optimizer memory/computation, reducing the overall memory consumption.

-
from pytorch_lightning import Trainer
-
-model = MyModel()
-trainer = Trainer(accelerator="gpu", devices=4, strategy="deepspeed_stage_2_offload", precision=16)
-trainer.fit(model)
-
-
-

This can also be done via the command line using a PyTorch Lightning script:

-
python train.py --strategy deepspeed_stage_2_offload --precision 16 --accelerator 'gpu' --devices 4
-
-
-

You can also modify the ZeRO-Offload parameters via the strategy as below.

-
from pytorch_lightning import Trainer
-from pytorch_lightning.strategies import DeepSpeedStrategy
-
-model = MyModel()
-trainer = Trainer(
-    accelerator="gpu",
-    devices=4,
-    strategy=DeepSpeedStrategy(offload_optimizer=True, allgather_bucket_size=5e8, reduce_bucket_size=5e8),
-    precision=16,
-)
-trainer.fit(model)
-
-
-
-

Note

-

We suggest tuning the allgather_bucket_size parameter and reduce_bucket_size parameter to find optimum parameters based on your model size. -These control how large a buffer we limit the model to using when reducing gradients/gathering updated parameters. Smaller values will use less memory, at the cost of speed.

-

DeepSpeed allocates a reduce buffer size multiplied by 1.5x so take that into consideration when tweaking the parameters.

-

The strategy sets a reasonable default of 2e8, which should work for most low VRAM GPUs (less than 7GB), allocating roughly 3.6GB of VRAM as buffer. Higher VRAM GPUs should aim for values around 5e8.

-
-

For even more speed benefit, DeepSpeed offers an optimized CPU version of ADAM called DeepSpeedCPUAdam to run the offloaded computation, which is faster than the standard PyTorch implementation.

-
import pytorch_lightning
-from pytorch_lightning import Trainer
-from deepspeed.ops.adam import DeepSpeedCPUAdam
-
-
-class MyModel(pl.LightningModule):
-    ...
-
-    def configure_optimizers(self):
-        # DeepSpeedCPUAdam provides 5x to 7x speedup over torch.optim.adam(w)
-        return DeepSpeedCPUAdam(self.parameters())
-
-
-model = MyModel()
-trainer = Trainer(accelerator="gpu", devices=4, strategy="deepspeed_stage_2_offload", precision=16)
-trainer.fit(model)
-
-
-
-
-

DeepSpeed ZeRO Stage 3

-

DeepSpeed ZeRO Stage 3 shards the optimizer states, gradients and the model parameters (also optionally activations). Sharding model parameters and activations comes with an increase in distributed communication, however allows you to scale your models massively from one GPU to multiple GPUs. -The DeepSpeed team report the ability to fine-tune models with over 40B parameters on a single GPU and over 2 Trillion parameters on 512 GPUs. For more information we suggest checking the DeepSpeed ZeRO-3 Offload documentation.

-

We’ve run benchmarks for all these features and provided a simple example of how they work in Lightning, which you can see at minGPT.

-

To reach the highest memory efficiency or model size, you must:

-
    -
  1. Use the DeepSpeed strategy with the stage 3 parameter

  2. -
  3. Use CPU Offloading to offload weights to CPU, plus have a reasonable amount of CPU RAM to offload onto

  4. -
  5. Use DeepSpeed Activation Checkpointing to shard activations

  6. -
-

Below we describe how to enable all of these to see benefit. With all these improvements we reached 45 Billion parameters training a GPT model on 8 GPUs with ~1TB of CPU RAM available.

-

Also please have a look at our DeepSpeed ZeRO Stage 3 Tips which contains a lot of helpful information when configuring your own models.

-
-

Note

-

When saving a model using DeepSpeed and Stage 3, model states and optimizer states will be saved in separate sharded states (based on the world size). See Collating Single File Checkpoint for DeepSpeed ZeRO Stage 3 to obtain a single checkpoint file.

-
-
from pytorch_lightning import Trainer
-from deepspeed.ops.adam import FusedAdam
-
-
-class MyModel(pl.LightningModule):
-    ...
-
-    def configure_optimizers(self):
-        return FusedAdam(self.parameters())
-
-
-model = MyModel()
-trainer = Trainer(accelerator="gpu", devices=4, strategy="deepspeed_stage_3", precision=16)
-trainer.fit(model)
-
-trainer.test()
-trainer.predict()
-
-
-

You can also use the Lightning Trainer to run predict or evaluate with DeepSpeed once the model has been trained.

-
from pytorch_lightning import Trainer
-
-
-class MyModel(pl.LightningModule):
-    ...
-
-
-model = MyModel()
-trainer = Trainer(accelerator="gpu", devices=4, strategy="deepspeed_stage_3", precision=16)
-trainer.test(ckpt_path="my_saved_deepspeed_checkpoint.ckpt")
-
-
-
-
-

Shard Model Instantly to Reduce Initialization Time/Memory

-

When instantiating really large models, it is sometimes necessary to shard the model layers instantly.

-

This is the case if layers may not fit in a single machine’s CPU or GPU memory, but would fit once sharded across multiple machines. -We expose a hook such that layers initialized within it are sharded instantly on a per-layer basis, allowing you to instantly shard models.

-

This reduces the time taken to initialize very large models, and ensures we do not run out of memory when instantiating larger models. For more information you can refer to the DeepSpeed docs for Constructing Massive Models.

-
import torch.nn as nn
-from pytorch_lightning import Trainer
-from deepspeed.ops.adam import FusedAdam
-
-
-class MyModel(pl.LightningModule):
-    ...
-
-    def configure_sharded_model(self):
-        # Created within sharded model context, modules are instantly sharded across processes
-        # as soon as they are made.
-        self.block = nn.Sequential(nn.Linear(32, 32), nn.ReLU())
-
-    def configure_optimizers(self):
-        return FusedAdam(self.parameters())
-
-
-model = MyModel()
-trainer = Trainer(accelerator="gpu", devices=4, strategy="deepspeed_stage_3", precision=16)
-trainer.fit(model)
-
-trainer.test()
-trainer.predict()
-
-
-
-
-

DeepSpeed ZeRO Stage 3 Offload

-

DeepSpeed ZeRO Stage 3 Offload offloads optimizer state and gradients to the host CPU to reduce memory usage, as ZeRO Stage 2 Offload does, but additionally allows you to offload the parameters as well for even more memory savings.

-
-

Note

-

When saving a model using DeepSpeed and Stage 3, model states and optimizer states will be saved in separate sharded states (based on the world size). See Collating Single File Checkpoint for DeepSpeed ZeRO Stage 3 to obtain a single checkpoint file.

-
-
from pytorch_lightning import Trainer
-from pytorch_lightning.strategies import DeepSpeedStrategy
-
-# Enable CPU Offloading
-model = MyModel()
-trainer = Trainer(accelerator="gpu", devices=4, strategy="deepspeed_stage_3_offload", precision=16)
-trainer.fit(model)
-
-# Enable CPU Offloading, and offload parameters to CPU
-model = MyModel()
-trainer = Trainer(
-    accelerator="gpu",
-    devices=4,
-    strategy=DeepSpeedStrategy(
-        stage=3,
-        offload_optimizer=True,
-        offload_parameters=True,
-    ),
-    precision=16,
-)
-trainer.fit(model)
-
-
-
-
-

DeepSpeed Infinity (NVMe Offloading)

-

Additionally, DeepSpeed supports offloading to NVMe drives for even larger models, utilizing the large memory space found in NVMes. DeepSpeed reports the ability to fine-tune 1 Trillion+ parameters using NVMe Offloading on one 8 GPU machine. Below shows how to enable this, assuming the NVMe drive is mounted in a directory called /local_nvme.

-
from pytorch_lightning import Trainer
-from pytorch_lightning.strategies import DeepSpeedStrategy
-
-# Enable CPU Offloading
-model = MyModel()
-trainer = Trainer(accelerator="gpu", devices=4, strategy="deepspeed_stage_3_offload", precision=16)
-trainer.fit(model)
-
-# Enable NVMe Offloading, and offload parameters and optimizer state to NVMe
-model = MyModel()
-trainer = Trainer(
-    accelerator="gpu",
-    devices=4,
-    strategy=DeepSpeedStrategy(
-        stage=3,
-        offload_optimizer=True,
-        offload_parameters=True,
-        remote_device="nvme",
-        offload_params_device="nvme",
-        offload_optimizer_device="nvme",
-        nvme_path="/local_nvme",
-    ),
-    precision=16,
-)
-trainer.fit(model)
-
-
-

When offloading to NVMe you may notice that the speed is slow. There are parameters that need to be tuned based on the drives that you are using. Running the aio_bench_perf_sweep.py script can help you to find optimum parameters. See the issue for more information on how to parse the information.

-
-
-

DeepSpeed Activation Checkpointing

-

Activation checkpointing frees activations from memory as soon as they are not needed during the forward pass. -They are then re-computed for the backwards pass as needed.

-

Activation checkpointing is very useful when you have intermediate layers that produce large activations.

-

This saves memory when training larger models, however requires using a checkpoint function to run modules as shown below.

-
-

Warning

-

Ensure to not wrap the entire model with activation checkpointing. This is not the intended usage of activation checkpointing, and will lead to failures as seen in this discussion.

-
-
from pytorch_lightning import Trainer
-import deepspeed
-
-
-class MyModel(LightningModule):
-    ...
-
-    def __init__(self):
-        super().__init__()
-        self.block_1 = nn.Sequential(nn.Linear(32, 32), nn.ReLU())
-        self.block_2 = torch.nn.Linear(32, 2)
-
-    def forward(self, x):
-        # Use the DeepSpeed checkpointing function instead of calling the module directly
-        # checkpointing self.block_1 means the activations are deleted after use,
-        # and re-calculated during the backward passes
-        x = deepspeed.checkpointing.checkpoint(self.block_1, x)
-        return self.block_2(x)
-
-
-
from pytorch_lightning import Trainer
-from pytorch_lightning.strategies import DeepSpeedStrategy
-import deepspeed
-
-
-class MyModel(pl.LightningModule):
-    ...
-
-    def configure_sharded_model(self):
-        self.block_1 = nn.Sequential(nn.Linear(32, 32), nn.ReLU())
-        self.block_2 = torch.nn.Linear(32, 2)
-
-    def forward(self, x):
-        # Use the DeepSpeed checkpointing function instead of calling the module directly
-        x = deepspeed.checkpointing.checkpoint(self.block_1, x)
-        return self.block_2(x)
-
-
-model = MyModel()
-
-trainer = Trainer(accelerator="gpu", devices=4, strategy="deepspeed_stage_3_offload", precision=16)
-
-# Enable CPU Activation Checkpointing
-trainer = Trainer(
-    accelerator="gpu",
-    devices=4,
-    strategy=DeepSpeedStrategy(
-        stage=3,
-        offload_optimizer=True,  # Enable CPU Offloading
-        cpu_checkpointing=True,  # (Optional) offload activations to CPU
-    ),
-    precision=16,
-)
-trainer.fit(model)
-
-
-
-
-

DeepSpeed ZeRO Stage 3 Tips

-

Here is some helpful information when setting up DeepSpeed ZeRO Stage 3 with Lightning.

-
    -
  • If you’re using Adam or AdamW, ensure to use FusedAdam or DeepSpeedCPUAdam (for CPU Offloading) rather than the default torch optimizers as they come with large speed benefits

  • -
  • Treat your GPU/CPU memory as one large pool. In some cases, you may not want to offload certain things (like activations) to provide even more space to offload model parameters

  • -
  • When offloading to the CPU, make sure to bump up the batch size as GPU memory will be freed

  • -
  • We also support sharded checkpointing. By passing save_full_weights=False to the DeepSpeedStrategy, we’ll save shards of the model which allows you to save extremely large models. However to load the model and run test/validation/predict you must use the Trainer object.

  • -
-
-
-

Collating Single File Checkpoint for DeepSpeed ZeRO Stage 3

-

After training using ZeRO Stage 3, you’ll notice that your checkpoints are a directory of sharded model and optimizer states. If you’d like to collate a single file from the checkpoint directory please use the below command, which handles all the Lightning states additionally when collating the file.

-
from pytorch_lightning.utilities.deepspeed import convert_zero_checkpoint_to_fp32_state_dict
-
-# lightning deepspeed has saved a directory instead of a file
-save_path = "lightning_logs/version_0/checkpoints/epoch=0-step=0.ckpt/"
-output_path = "lightning_model.pt"
-convert_zero_checkpoint_to_fp32_state_dict(save_path, output_path)
-
-
-
-

Warning

-

This single file checkpoint does not include the optimizer/lr-scheduler states. This means we cannot restore training via the trainer.fit(ckpt_path=) call. Ensure to keep the sharded checkpoint directory if this is required.

-
-
-
-

Custom DeepSpeed Config

-

In some cases you may want to define your own DeepSpeed Config, to access all parameters defined. We’ve exposed most of the important parameters, however, there may be debugging parameters to enable. Also, DeepSpeed allows the use of custom DeepSpeed optimizers and schedulers defined within a config file that is supported.

-
-

Note

-

All strategy default parameters will be ignored when a config object is passed. -All compatible arguments can be seen in the DeepSpeed docs.

-
-
from pytorch_lightning import Trainer
-from pytorch_lightning.strategies import DeepSpeedStrategy
-
-deepspeed_config = {
-    "zero_allow_untested_optimizer": True,
-    "optimizer": {
-        "type": "OneBitAdam",
-        "params": {
-            "lr": 3e-5,
-            "betas": [0.998, 0.999],
-            "eps": 1e-5,
-            "weight_decay": 1e-9,
-            "cuda_aware": True,
-        },
-    },
-    "scheduler": {
-        "type": "WarmupLR",
-        "params": {
-            "last_batch_iteration": -1,
-            "warmup_min_lr": 0,
-            "warmup_max_lr": 3e-5,
-            "warmup_num_steps": 100,
-        },
-    },
-    "zero_optimization": {
-        "stage": 2,  # Enable Stage 2 ZeRO (Optimizer/Gradient state partitioning)
-        "offload_optimizer": True,  # Enable Offloading optimizer state/calculation to the host CPU
-        "contiguous_gradients": True,  # Reduce gradient fragmentation.
-        "overlap_comm": True,  # Overlap reduce/backward operation of gradients for speed.
-        "allgather_bucket_size": 2e8,  # Number of elements to all gather at once.
-        "reduce_bucket_size": 2e8,  # Number of elements we reduce/allreduce at once.
-    },
-}
-
-model = MyModel()
-trainer = Trainer(accelerator="gpu", devices=4, strategy=DeepSpeedStrategy(config=deepspeed_config), precision=16)
-trainer.fit(model)
-
-
-

We support taking the config as a json formatted file:

-
from pytorch_lightning import Trainer
-from pytorch_lightning.strategies import DeepSpeedStrategy
-
-model = MyModel()
-trainer = Trainer(
-    accelerator="gpu", devices=4, strategy=DeepSpeedStrategy(config="/path/to/deepspeed_config.json"), precision=16
-)
-trainer.fit(model)
-
-
-

You can also use an environment variable via your PyTorch Lightning script:

-
PL_DEEPSPEED_CONFIG_PATH=/path/to/deepspeed_config.json python train.py --strategy deepspeed
-
-
-
-
-
-
-

DDP Optimizations

-
-

When Using DDP Strategies, Set find_unused_parameters=False

-

By default, we have set find_unused_parameters=True for compatibility reasons that have been observed in the past (refer to the discussion for more details). -When enabled, it can result in a performance hit and can be disabled in most cases. Read more about it here.

-
-

Tip

-

It applies to all DDP strategies that support find_unused_parameters as input.

-
-
from pytorch_lightning.strategies import DDPStrategy
-
-trainer = pl.Trainer(
-    accelerator="gpu",
-    devices=2,
-    strategy=DDPStrategy(find_unused_parameters=False),
-)
-
-
-
from pytorch_lightning.strategies import DDPSpawnStrategy
-
-trainer = pl.Trainer(
-    accelerator="gpu",
-    devices=2,
-    strategy=DDPSpawnStrategy(find_unused_parameters=False),
-)
-
-
-
-
-

DDP Static Graph

-

DDP static graph assumes that your model -employs the same set of used/unused parameters in every iteration, so that it can deterministically know the flow of -training and apply special optimizations during runtime.

-
-

Note

-

DDP static graph support requires PyTorch>=1.11.0

-
-
from pytorch_lightning import Trainer
-from pytorch_lightning.strategies import DDPStrategy
-
-trainer = Trainer(devices=4, strategy=DDPStrategy(static_graph=True))
-
-
-
-
-

When Using DDP on a Multi-node Cluster, Set NCCL Parameters

-

NCCL is the NVIDIA Collective Communications Library that is used by PyTorch to handle communication across nodes and GPUs. There are reported benefits in terms of speedups when adjusting NCCL parameters as seen in this issue. In the issue, we see a 30% speed improvement when training the Transformer XLM-RoBERTa and a 15% improvement in training with Detectron2.

-

NCCL parameters can be adjusted via environment variables.

-
-

Note

-

AWS and GCP already set default values for these on their clusters. This is typically useful for custom cluster setups.

-
- -
export NCCL_NSOCKS_PERTHREAD=4
-export NCCL_SOCKET_NTHREADS=2
-
-
-
-
-

Gradients as Bucket View

-

Enabling gradient_as_bucket_view=True in the DDPStrategy will make gradients views point to different offsets of the allreduce communication buckets. See DistributedDataParallel for more information.

-

This can reduce peak memory usage and improve throughput: the saved memory is equal to the total gradient memory, and it removes the need to copy gradients to the allreduce communication buckets.

-
-

Note

-

When gradient_as_bucket_view=True you cannot call detach_() on gradients. If hitting such errors, please fix it by referring to the zero_grad() function in torch/optim/optimizer.py as a solution (source).

-
-
from pytorch_lightning import Trainer
-from pytorch_lightning.strategies import DDPStrategy
-
-model = MyModel()
-trainer = Trainer(accelerator="gpu", devices=4, strategy=DDPStrategy(gradient_as_bucket_view=True))
-trainer.fit(model)
-
-
-
-
-

DDP Communication Hooks

-

DDP Communication hooks is an interface to control how gradients are communicated across workers, overriding the standard allreduce in DistributedDataParallel. This allows you to enable performance improving communication hooks when using multiple nodes.

-

Enable FP16 Compress Hook for multi-node throughput improvement:

-
from pytorch_lightning import Trainer
-from pytorch_lightning.strategies import DDPStrategy
-from torch.distributed.algorithms.ddp_comm_hooks import default_hooks as default
-
-model = MyModel()
-trainer = Trainer(accelerator="gpu", devices=4, strategy=DDPStrategy(ddp_comm_hook=default.fp16_compress_hook))
-trainer.fit(model)
-
-
-

Enable PowerSGD for multi-node throughput improvement:

-
-

Note

-

PowerSGD typically requires extra memory of the same size as the model’s gradients to enable error feedback, which can compensate for biased compressed communication and improve accuracy (source).

-
-
from pytorch_lightning import Trainer
-from pytorch_lightning.strategies import DDPStrategy
-from torch.distributed.algorithms.ddp_comm_hooks import powerSGD_hook as powerSGD
-
-model = MyModel()
-trainer = Trainer(
-    accelerator="gpu",
-    devices=4,
-    strategy=DDPStrategy(
-        ddp_comm_state=powerSGD.PowerSGDState(
-            process_group=None,
-            matrix_approximation_rank=1,
-            start_powerSGD_iter=5000,
-        ),
-        ddp_comm_hook=powerSGD.powerSGD_hook,
-    ),
-)
-trainer.fit(model)
-
-
-

Combine hooks for accumulated benefit:

-
-

Note

-

DDP communication wrappers support requires PyTorch>=1.9.0

-
-
from pytorch_lightning import Trainer
-from pytorch_lightning.strategies import DDPStrategy
-from torch.distributed.algorithms.ddp_comm_hooks import (
-    default_hooks as default,
-    powerSGD_hook as powerSGD,
-)
-
-model = MyModel()
-trainer = Trainer(
-    accelerator="gpu",
-    devices=4,
-    strategy=DDPStrategy(
-        ddp_comm_state=powerSGD.PowerSGDState(
-            process_group=None,
-            matrix_approximation_rank=1,
-            start_powerSGD_iter=5000,
-        ),
-        ddp_comm_hook=powerSGD.powerSGD_hook,
-        ddp_comm_wrapper=default.fp16_compress_wrapper,
-    ),
-)
-trainer.fit(model)
-
-
-

When using Post-localSGD, you must also pass model_averaging_period to allow for model parameter averaging:

-
-

Note

-

Post-localSGD support requires PyTorch>=1.10.0

-
-
from pytorch_lightning import Trainer
-from pytorch_lightning.strategies import DDPStrategy
-from torch.distributed.algorithms.ddp_comm_hooks import post_localSGD_hook as post_localSGD
-
-model = MyModel()
-trainer = Trainer(
-    accelerator="gpu",
-    devices=4,
-    strategy=DDPStrategy(
-        ddp_comm_state=post_localSGD.PostLocalSGDState(
-            process_group=None,
-            subgroup=None,
-            start_localSGD_iter=8,
-        ),
-        ddp_comm_hook=post_localSGD.post_localSGD_hook,
-        model_averaging_period=4,
-    ),
-)
-trainer.fit(model)
-
-
-
-
-
- - -
- -
-
- - - - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/advanced/pruning_quantization.html b/docs/advanced/pruning_quantization.html deleted file mode 100644 index 98e8cf4..0000000 --- a/docs/advanced/pruning_quantization.html +++ /dev/null @@ -1,795 +0,0 @@ - - - - - - - - - - - - - - Pruning and Quantization — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Pruning and Quantization
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Pruning and Quantization

-

Pruning and Quantization are techniques to compress model size for deployment, allowing inference speed up and energy saving without significant accuracy losses.

-
-

Pruning

-
-

Warning

-

Pruning is in beta and subject to change.

-
-

Pruning is a technique which focuses on eliminating some of the model weights to reduce the model size and decrease inference requirements.

-

Pruning has been shown to achieve significant efficiency improvements while minimizing the drop in model performance (prediction quality). Model pruning is recommended for cloud endpoints, deploying models on edge devices, or mobile inference (among others).

-

To enable pruning during training in Lightning, simply pass in the ModelPruning callback to the Lightning Trainer. PyTorch’s native pruning implementation is used under the hood.

-

This callback supports multiple pruning functions: pass any torch.nn.utils.prune function as a string to select which weights to prune (random_unstructured, RandomStructured, etc) or implement your own by subclassing BasePruningMethod.

-
from pytorch_lightning.callbacks import ModelPruning
-
-# set the amount to be the fraction of parameters to prune
-trainer = Trainer(callbacks=[ModelPruning("l1_unstructured", amount=0.5)])
-
-
-

You can also perform iterative pruning, apply the lottery ticket hypothesis, and more!

-
def compute_amount(epoch):
-    # the sum of all returned values needs to be smaller than 1
-    if epoch == 10:
-        return 0.5
-
-    elif epoch == 50:
-        return 0.25
-
-    elif 75 < epoch < 99:
-        return 0.01
-
-
-# the amount can also be a callable
-trainer = Trainer(callbacks=[ModelPruning("l1_unstructured", amount=compute_amount)])
-
-
-
-
-

Quantization

-
-

Warning

-

Quantization is in beta and subject to change.

-
-

Model quantization is another performance optimization technique that allows speeding up inference and decreasing memory requirements by performing computations and storing tensors at lower bitwidths (such as INT8 or FLOAT16) than floating-point precision. This is particularly beneficial during model deployment.

-

Quantization Aware Training (QAT) mimics the effects of quantization during training: The computations are carried-out in floating-point precision but the subsequent quantization effect is taken into account. The weights and activations are quantized into lower precision only for inference, when training is completed.

-

Quantization is useful when it is required to serve large models on machines with limited memory, or when there’s a need to switch between models and reducing the I/O time is important. For example, switching between monolingual speech recognition models across multiple languages.

-

Lightning includes QuantizationAwareTraining callback (using PyTorch’s native quantization, read more here), which allows creating fully quantized models (compatible with torchscript).

-
from pytorch_lightning.callbacks import QuantizationAwareTraining
-
-
-class RegressionModel(LightningModule):
-    def __init__(self):
-        super().__init__()
-        self.layer_0 = nn.Linear(16, 64)
-        self.layer_0a = torch.nn.ReLU()
-        self.layer_1 = nn.Linear(64, 64)
-        self.layer_1a = torch.nn.ReLU()
-        self.layer_end = nn.Linear(64, 1)
-
-    def forward(self, x):
-        x = self.layer_0(x)
-        x = self.layer_0a(x)
-        x = self.layer_1(x)
-        x = self.layer_1a(x)
-        x = self.layer_end(x)
-        return x
-
-
-trainer = Trainer(callbacks=[QuantizationAwareTraining()])
-qmodel = RegressionModel()
-trainer.fit(qmodel, ...)
-
-batch = iter(my_dataloader()).next()
-qmodel(qmodel.quant(batch[0]))
-
-tsmodel = qmodel.to_torchscript()
-tsmodel(tsmodel.quant(batch[0]))
-
-
-

You can further customize the callback:

-
qcb = QuantizationAwareTraining(
-    # specification of quant estimation quality
-    observer_type="histogram",
-    # specify which layers shall be merged together to increase efficiency
-    modules_to_fuse=[(f"layer_{i}", f"layer_{i}a") for i in range(2)],
-    # make your model compatible with all original input/outputs, in such case the model is wrapped in a shell with entry/exit layers.
-    input_compatible=True,
-)
-
-batch = iter(my_dataloader()).next()
-qmodel(batch[0])
-
-
-
-
- - -
- -
-
- - - - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/advanced/strategy_registry.html b/docs/advanced/strategy_registry.html deleted file mode 100644 index 408b974..0000000 --- a/docs/advanced/strategy_registry.html +++ /dev/null @@ -1,741 +0,0 @@ - - - - - - - - - - - - - - Strategy Registry — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Strategy Registry
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Strategy Registry

-
-

Warning

-

The Strategy Registry is experimental and subject to change.

-
-

Lightning includes a registry that holds information about Training strategies and allows for the registration of new custom strategies.

-

The Strategies are assigned strings that identify them, such as “ddp”, “deepspeed_stage_2_offload”, and so on. -It also returns the optional description and parameters for initialising the Strategy that were defined during registration.

-
# Training with the DDP Strategy with `find_unused_parameters` as False
-trainer = Trainer(strategy="ddp_find_unused_parameters_false", accelerator="gpu", devices=4)
-
-# Training with DeepSpeed ZeRO Stage 3 and CPU Offload
-trainer = Trainer(strategy="deepspeed_stage_3_offload", accelerator="gpu", devices=3)
-
-# Training with the TPU Spawn Strategy with `debug` as True
-trainer = Trainer(strategy="tpu_spawn_debug", accelerator="tpu", devices=8)
-
-
-

Additionally, you can pass your custom registered training strategies to the strategy argument.

-
from pytorch_lightning.strategies import DDPStrategy, StrategyRegistry, CheckpointIO
-
-
-class CustomCheckpointIO(CheckpointIO):
-    def save_checkpoint(self, checkpoint: Dict[str, Any], path: Union[str, Path]) -> None:
-        ...
-
-    def load_checkpoint(self, path: Union[str, Path]) -> Dict[str, Any]:
-        ...
-
-
-custom_checkpoint_io = CustomCheckpointIO()
-
-# Register the DDP Strategy with your custom CheckpointIO plugin
-StrategyRegistry.register(
-    "ddp_custom_checkpoint_io",
-    DDPStrategy,
-    description="DDP Strategy with custom checkpoint io plugin",
-    checkpoint_io=custom_checkpoint_io,
-)
-
-trainer = Trainer(strategy="ddp_custom_checkpoint_io", accelerator="gpu", devices=2)
-
-
-
- - -
- -
-
- - - - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- -
-
- -
-
-
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/advanced/training_tricks.html b/docs/advanced/training_tricks.html deleted file mode 100644 index cfd9cdf..0000000 --- a/docs/advanced/training_tricks.html +++ /dev/null @@ -1,1063 +0,0 @@ - - - - - - - - - - - - - - Effective Training Techniques — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Effective Training Techniques
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Effective Training Techniques

-

Lightning implements various techniques to help during training that can help make the training smoother.

-
-
-

Accumulate Gradients

-

Accumulated gradients run K small batches of size N before doing an optimizer step. The effect is a large effective batch size of size KxN, where N is the batch size. -Internally it doesn’t stack up the batches and do a forward pass; rather, it accumulates the gradients for K batches and then does an optimizer.step to make sure the -effective batch size is increased but there is no memory overhead.

-
-

Warning

-

When using distributed training, e.g. DDP with, let’s say, P devices, each device accumulates independently, i.e. it stores the gradients -after each loss.backward() and doesn’t sync the gradients across the devices until we call optimizer.step(). So for each accumulation -step, the effective batch size on each device will remain N*K but right before the optimizer.step(), the gradient sync will make the effective -batch size P*N*K. For DP, since the batch is split across devices, the final effective batch size will be N*K.

-
-
-

See also

-

Trainer

-
-
# DEFAULT (ie: no accumulated grads)
-trainer = Trainer(accumulate_grad_batches=1)
-
-# Accumulate gradients for 7 batches
-trainer = Trainer(accumulate_grad_batches=7)
-
-
-

You can set different values for it at different epochs by passing a dictionary, where the key represents the epoch at which the value for gradient accumulation -should be updated.

-
# till 5th epoch, it will accumulate every 8 batches. From 5th epoch
-# till 9th epoch it will accumulate every 4 batches and after that no accumulation
-# will happen. Note that you need to use zero-indexed epoch keys here
-trainer = Trainer(accumulate_grad_batches={0: 8, 4: 4, 8: 1})
-
-
-

Or, you can create custom GradientAccumulationScheduler

-
from pytorch_lightning.callbacks import GradientAccumulationScheduler
-
-
-# till 5th epoch, it will accumulate every 8 batches. From 5th epoch
-# till 9th epoch it will accumulate every 4 batches and after that no accumulation
-# will happen. Note that you need to use zero-indexed epoch keys here
-accumulator = GradientAccumulationScheduler(scheduling={0: 8, 4: 4, 8: 1})
-trainer = Trainer(callbacks=accumulator)
-
-
-
-
-
-

Gradient Clipping

-

Gradient clipping can be enabled to avoid exploding gradients. By default, this will clip the gradient norm by calling -torch.nn.utils.clip_grad_norm_() computed over all model parameters together. -If the Trainer’s gradient_clip_algorithm is set to 'value' ('norm' by default), this will use -torch.nn.utils.clip_grad_value_() for each parameter instead.

-
-

Note

-

If using mixed precision, the gradient_clip_val does not need to be changed as the gradients are unscaled -before applying the clipping function.

-
-
-

See also

-

Trainer

-
-
# DEFAULT (ie: don't clip)
-trainer = Trainer(gradient_clip_val=0)
-
-# clip gradients' global norm to <=0.5 using gradient_clip_algorithm='norm' by default
-trainer = Trainer(gradient_clip_val=0.5)
-
-# clip gradients' maximum magnitude to <=0.5
-trainer = Trainer(gradient_clip_val=0.5, gradient_clip_algorithm="value")
-
-
-

Read more about Configuring Gradient Clipping for advanced use-cases.

-
-
-
-

Stochastic Weight Averaging

-

Stochastic Weight Averaging (SWA) can make your models generalize better at virtually no additional cost. -This can be used with both non-trained and trained models. The SWA procedure smooths the loss landscape thus making -it harder to end up in a local minimum during optimization.

-

For a more detailed explanation of SWA and how it works, -read this post by the PyTorch team.

-
-

See also

-

The StochasticWeightAveraging callback

-
-
# Enable Stochastic Weight Averaging using the callback
-trainer = Trainer(callbacks=[StochasticWeightAveraging(swa_lrs=1e-2)])
-
-
-
-
-
-

Batch Size Finder

-

Auto-scaling of batch size can be enabled to find the largest batch size that fits into -memory. Large batch size often yields a better estimation of the gradients, but may also result in -longer training time. Inspired by https://github.com/BlackHC/toma.

-
-

See also

-

Trainer

-
-
# DEFAULT (ie: don't scale batch size automatically)
-trainer = Trainer(auto_scale_batch_size=None)
-
-# Autoscale batch size
-trainer = Trainer(auto_scale_batch_size=None | "power" | "binsearch")
-
-# Find the batch size
-trainer.tune(model)
-
-
-

Currently, this feature supports two modes: 'power' scaling and 'binsearch' -scaling. In 'power' scaling, the algorithm starts from a batch size of 1 and keeps doubling -the batch size until an out-of-memory (OOM) error is encountered. Setting the -argument to 'binsearch' will initially also try doubling the batch size until -it encounters an OOM, after which it will do a binary search that will finetune the -batch size. Additionally, it should be noted that the batch size scaler cannot -search for batch sizes larger than the size of the training dataset.

-
-

Note

-

This feature expects that a batch_size field is either located as a model attribute -i.e. model.batch_size or as a field in your hparams i.e. model.hparams.batch_size. -Similarly it can work with datamodules too. The field should exist and will be updated by -the results of this algorithm. Additionally, your train_dataloader() method should depend -on this field for this feature to work i.e.

-
# using LightningModule
-class LitModel(LightningModule):
-    def __init__(self, batch_size):
-        super().__init__()
-        self.save_hyperparameters()
-        # or
-        self.batch_size = batch_size
-
-    def train_dataloader(self):
-        return DataLoader(train_dataset, batch_size=self.batch_size | self.hparams.batch_size)
-
-
-trainer = Trainer(...)
-model = LitModel(batch_size=32)
-trainer.tune(model)
-
-# using LightningDataModule
-class LitDataModule(LightningDataModule):
-    def __init__(self, batch_size):
-        super().__init__()
-        self.save_hyperparameters()
-        # or
-        self.batch_size = batch_size
-
-    def train_dataloader(self):
-        return DataLoader(train_dataset, batch_size=self.batch_size | self.hparams.batch_size)
-
-
-trainer = Trainer(...)
-model = MyModel()
-datamodule = LitDataModule(batch_size=32)
-trainer.tune(model, datamodule=datamodule)
-
-
-
-
-

Warning

-

Due to the constraints listed above, this feature does NOT work when passing dataloaders directly -to .fit().

-
-

The scaling algorithm has a number of parameters that the user can control by -invoking the scale_batch_size() method:

-
# Use default in trainer construction
-trainer = Trainer()
-tuner = Tuner(trainer)
-
-# Invoke method
-new_batch_size = tuner.scale_batch_size(model, *extra_parameters_here)
-
-# Override old batch size (this is done automatically)
-model.hparams.batch_size = new_batch_size
-
-# Fit as normal
-trainer.fit(model)
-
-
-
-
The algorithm in short works by:
    -
  1. Dumping the current state of the model and trainer

  2. -
  3. -
    Iteratively until convergence or maximum number of tries max_trials (default 25) has been reached:
      -
    • Call fit() method of trainer. This evaluates steps_per_trial (default 3) number of -optimization steps. Each training step can trigger an OOM error if the tensors -(training batch, weights, gradients, etc.) allocated during the steps have a -too large memory footprint.

    • -
    • If an OOM error is encountered, decrease batch size else increase it. -How much the batch size is increased/decreased is determined by the chosen -strategy.

    • -
    -
    -
    -
  4. -
  5. The found batch size is saved to either model.batch_size or model.hparams.batch_size

  6. -
  7. Restore the initial state of model and trainer

  8. -
-
-
-
-

Warning

-

Batch size finder is not yet supported for DDP or any of its variations, it is coming soon.

-
-
-
-
-

Learning Rate Finder

-
-

-
-

For training deep neural networks, selecting a good learning rate is essential -for both better performance and faster convergence. Even optimizers such as -Adam that are self-adjusting the learning rate can benefit from more optimal -choices.

-

To reduce the amount of guesswork concerning choosing a good initial learning -rate, a learning rate finder can be used. As described in this paper -a learning rate finder does a small run where the learning rate is increased -after each processed batch and the corresponding loss is logged. The result of -this is a lr vs. loss plot that can be used as guidance for choosing an optimal -initial learning rate.

-
-

Warning

-

For the moment, this feature only works with models having a single optimizer. -LR Finder support for DDP and any of its variations is not implemented yet. It is coming soon.

-
-
-

Using Lightning’s built-in LR finder

-

To enable the learning rate finder, your lightning module needs to -have a learning_rate or lr attribute (or as a field in your hparams i.e. -hparams.learning_rate or hparams.lr). Then, set Trainer(auto_lr_find=True) -during trainer construction, and then call trainer.tune(model) to run the LR finder. -The suggested learning_rate will be written to the console and will be automatically -set to your lightning module, which can be accessed -via self.learning_rate or self.lr.

-
-

See also

-

trainer.tune.

-
-
class LitModel(LightningModule):
-    def __init__(self, learning_rate):
-        super().__init__()
-        self.learning_rate = learning_rate
-        self.model = Model(...)
-
-    def configure_optimizers(self):
-        return Adam(self.parameters(), lr=(self.lr or self.learning_rate))
-
-
-model = LitModel()
-
-# finds learning rate automatically
-# sets hparams.lr or hparams.learning_rate to that learning rate
-trainer = Trainer(auto_lr_find=True)
-
-trainer.tune(model)
-
-
-

If your model is using an arbitrary value instead of self.lr or self.learning_rate, set that value as auto_lr_find:

-
model = LitModel()
-
-# to set to your own hparams.my_value
-trainer = Trainer(auto_lr_find="my_value")
-
-trainer.tune(model)
-
-
-

You can also inspect the results of the learning rate finder or just play around -with the parameters of the algorithm. This can be done by invoking the -lr_find() method. A typical example of this would look like:

-
model = MyModelClass(hparams)
-trainer = Trainer()
-
-# Run learning rate finder
-lr_finder = trainer.tuner.lr_find(model)
-
-# Results can be found in
-print(lr_finder.results)
-
-# Plot with
-fig = lr_finder.plot(suggest=True)
-fig.show()
-
-# Pick point based on plot, or get suggestion
-new_lr = lr_finder.suggestion()
-
-# update hparams of the model
-model.hparams.lr = new_lr
-
-# Fit model
-trainer.fit(model)
-
-
-

The figure produced by lr_finder.plot() should look something like the figure -below. It is recommended to not pick the learning rate that achieves the lowest -loss, but instead something in the middle of the sharpest downward slope (red point). -This is the point returned by lr_finder.suggestion().

-
-../_images/lr_finder.png -
-
-
-
-
-

Advanced GPU Optimizations

-

When training on single or multiple GPU machines, Lightning offers a host of advanced optimizations to improve throughput, memory efficiency, and model scaling. -Refer to Advanced GPU Optimized Training for more details.

-
-
-
-

Sharing Datasets Across Process Boundaries

-

The LightningDataModule class provides an organized way to decouple data loading from training logic, with prepare_data() being used for downloading and pre-processing the dataset on a single process, and setup() loading the pre-processed data for each process individually:

-
class MNISTDataModule(pl.LightningDataModule):
-    def prepare_data(self):
-        MNIST(self.data_dir, download=True)
-
-    def setup(self, stage: Optional[str] = None):
-        self.mnist = MNIST(self.data_dir)
-
-    def train_loader(self):
-        return DataLoader(self.mnist, batch_size=128)
-
-
-

However, for in-memory datasets, that means that each process will hold a (redundant) replica of the dataset in memory, which may be impractical when using many processes while utilizing datasets that nearly fit into CPU memory, as the memory consumption will scale up linearly with the number of processes. -For example, when training Graph Neural Networks, a common strategy is to load the entire graph into CPU memory for fast access to the entire graph structure and its features, and to then perform neighbor sampling to obtain mini-batches that fit onto the GPU.

-

A simple way to prevent redundant dataset replicas is to rely on torch.multiprocessing to share the data automatically between spawned processes via shared memory. -For this, all data pre-loading should be done on the main process inside DataModule.__init__(). As a result, all tensor-data will get automatically shared when using the DDPSpawnStrategy strategy.

-
-

Warning

-

torch.multiprocessing will send a handle of each individual tensor to other processes. -In order to prevent any errors due to too many open file handles, try to reduce the number of tensors to share, e.g., by stacking your data into a single tensor.

-
-
class MNISTDataModule(pl.LightningDataModule):
-    def __init__(self, data_dir: str):
-        self.mnist = MNIST(data_dir, download=True, transform=T.ToTensor())
-
-    def train_loader(self):
-        return DataLoader(self.mnist, batch_size=128)
-
-
-model = Model(...)
-datamodule = MNISTDataModule("data/MNIST")
-
-trainer = Trainer(accelerator="gpu", devices=2, strategy="ddp_spawn")
-trainer.fit(model, datamodule)
-
-
-

See the graph-level and node-level prediction examples in PyTorch Geometric for practical use-cases.

-
-
- - -
- -
-
- - - - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/advanced/transfer_learning.html b/docs/advanced/transfer_learning.html deleted file mode 100644 index 1ae0896..0000000 --- a/docs/advanced/transfer_learning.html +++ /dev/null @@ -1,811 +0,0 @@ - - - - - - - - - - - - - - Transfer Learning — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Transfer Learning
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Transfer Learning

-

Audience: Users looking to use pretrained models with Lightning.

-
-
-

Use any PyTorch nn.Module

-

Any model that is a PyTorch nn.Module can be used with Lightning (because LightningModules are nn.Modules also).

-
-
-
-

Use a pretrained LightningModule

-

Let’s use the AutoEncoder as a feature extractor in a separate model.

-
class Encoder(torch.nn.Module):
-    ...
-
-
-class AutoEncoder(LightningModule):
-    def __init__(self):
-        self.encoder = Encoder()
-        self.decoder = Decoder()
-
-
-class CIFAR10Classifier(LightningModule):
-    def __init__(self):
-        # init the pretrained LightningModule
-        self.feature_extractor = AutoEncoder.load_from_checkpoint(PATH)
-        self.feature_extractor.freeze()
-
-        # the autoencoder outputs a 100-dim representation and CIFAR-10 has 10 classes
-        self.classifier = nn.Linear(100, 10)
-
-    def forward(self, x):
-        representations = self.feature_extractor(x)
-        x = self.classifier(representations)
-        ...
-
-
-

We used our pretrained Autoencoder (a LightningModule) for transfer learning!

-
-
-
-

Example: Imagenet (Computer Vision)

-
import torchvision.models as models
-
-
-class ImagenetTransferLearning(LightningModule):
-    def __init__(self):
-        super().__init__()
-
-        # init a pretrained resnet
-        backbone = models.resnet50(pretrained=True)
-        num_filters = backbone.fc.in_features
-        layers = list(backbone.children())[:-1]
-        self.feature_extractor = nn.Sequential(*layers)
-
-        # use the pretrained model to classify cifar-10 (10 image classes)
-        num_target_classes = 10
-        self.classifier = nn.Linear(num_filters, num_target_classes)
-
-    def forward(self, x):
-        self.feature_extractor.eval()
-        with torch.no_grad():
-            representations = self.feature_extractor(x).flatten(1)
-        x = self.classifier(representations)
-        ...
-
-
-

Finetune

-
model = ImagenetTransferLearning()
-trainer = Trainer()
-trainer.fit(model)
-
-
-

And use it to predict your data of interest

-
model = ImagenetTransferLearning.load_from_checkpoint(PATH)
-model.freeze()
-
-x = some_images_from_cifar10()
-predictions = model(x)
-
-
-

We used a pretrained model on imagenet, finetuned on CIFAR-10 to predict on CIFAR-10. -In the non-academic world we would finetune on a tiny dataset you have and predict on your dataset.

-
-
-
-

Example: BERT (NLP)

-

Lightning is completely agnostic to what’s used for transfer learning so long -as it is a torch.nn.Module subclass.

-

Here’s a model that uses Huggingface transformers.

-
class BertMNLIFinetuner(LightningModule):
-    def __init__(self):
-        super().__init__()
-
-        self.bert = BertModel.from_pretrained("bert-base-cased", output_attentions=True)
-        self.W = nn.Linear(bert.config.hidden_size, 3)
-        self.num_classes = 3
-
-    def forward(self, input_ids, attention_mask, token_type_ids):
-
-        h, _, attn = self.bert(input_ids=input_ids, attention_mask=attention_mask, token_type_ids=token_type_ids)
-
-        h_cls = h[:, 0]
-        logits = self.W(h_cls)
-        return logits, attn
-
-
-
-
- - -
- -
-
- - - - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/benchmarking/benchmarks.html b/docs/benchmarking/benchmarks.html deleted file mode 100644 index 9e91cbd..0000000 --- a/docs/benchmarking/benchmarks.html +++ /dev/null @@ -1,701 +0,0 @@ - - - - - - - - - - - - - - Benchmark with vanilla PyTorch — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Benchmark with vanilla PyTorch
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Benchmark with vanilla PyTorch

-

In this section we set grounds for comparison between vanilla PyTorch and PT Lightning for most common scenarios.

-
-

Time comparison

-

We run regular benchmarks against the vanilla PyTorch training loop with an RNN and a simple MNIST classifier as part of our CI. -On average, for the simple MNIST CNN classifier we are only about 0.06s slower per epoch; see the detailed chart below.

-
-Speed parity to vanilla PT, created on 2020-12-16 -
-

Learn more about reproducible benchmarking from the PyTorch Reproducibility Guide.

-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/cli/lightning_cli.html b/docs/cli/lightning_cli.html deleted file mode 100644 index 9a471e8..0000000 --- a/docs/cli/lightning_cli.html +++ /dev/null @@ -1,784 +0,0 @@ - - - - - - - - - - - - - - Eliminate config boilerplate — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Eliminate config boilerplate
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
- - - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/cli/lightning_cli_advanced.html b/docs/cli/lightning_cli_advanced.html deleted file mode 100644 index 04d3fb4..0000000 --- a/docs/cli/lightning_cli_advanced.html +++ /dev/null @@ -1,778 +0,0 @@ - - - - - - - - - - - - - - Eliminate config boilerplate (Advanced) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Eliminate config boilerplate (Advanced)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Eliminate config boilerplate (Advanced)

-

Audience: Users looking to modularize their code for a professional project.

-

Pre-reqs: You must have read (Control it all from the CLI).

-
-
-

What is a yaml config file?

-

A yaml is a standard configuration file that describes parameters for sections of a program. It is a common tool in engineering, and it has recently started to gain popularity in machine learning.

-
# file.yaml
-car:
-    max_speed:100
-    max_passengers:2
-plane:
-    fuel_capacity: 50
-class_3:
-    option_1: 'x'
-    option_2: 'y'
-
-
-
-
- -
-
-

Write a config yaml from the CLI

-

To have a copy of the configuration that produced this model, save a yaml file from the --print_config outputs:

-
python main.py fit --model.learning_rate 0.001 --print_config > config.yaml
-
-
-
-
-
-

Run from a single yaml

-

To run from a yaml, pass a yaml produced with --print_config to the --config argument:

-
python main.py fit --config config.yaml
-
-
-

when using a yaml to run, you can still pass in inline arguments

-
python main.py fit --config config.yaml --trainer.max_epochs 100
-
-
-
-
-
-

Compose yaml files

-

For production or complex research projects it’s advisable to have each object in its own config file. To compose all the configs, pass them all inline:

-
$ python trainer.py fit --config trainer.yaml --config datamodules.yaml --config models.yaml ...
-
-
-

The configs will be parsed sequentially. Let’s say we have two configs with the same args:

-
# trainer.yaml
-trainer:
-    num_epochs: 10
-
-
-# trainer_2.yaml
-trainer:
-    num_epochs: 20
-
-
-

the ones from the last config will be used (num_epochs = 20) in this case:

-
$ python trainer.py fit --config trainer.yaml --config trainer_2.yaml
-
-
-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/cli/lightning_cli_advanced_2.html b/docs/cli/lightning_cli_advanced_2.html deleted file mode 100644 index fb799af..0000000 --- a/docs/cli/lightning_cli_advanced_2.html +++ /dev/null @@ -1,815 +0,0 @@ - - - - - - - - - - - - - - Eliminate config boilerplate (Advanced) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Eliminate config boilerplate (Advanced)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Eliminate config boilerplate (Advanced)

-
-

Customize arguments by command

-

To customize arguments by subcommand, pass the config before the subcommand:

-
$ python main.py [before] [subcommand] [after]
-$ python main.py  ...         fit       ...
-
-
-

For example, here we set the Trainer argument [max_steps = 100] for the full training routine and [max_epochs = 10] for testing:

-
# config1.yaml
-fit:
-    trainer:
-        max_steps: 100
-test:
-    trainer:
-        max_epochs: 10
-
-
-

now you can toggle this behavior by subcommand:

-
# full routine with max_steps = 100
-$ python main.py --config config1.yaml fit
-
-# test only with max_epochs = 10
-$ python main.py --config config1.yaml test
-
-
-
-
-
-

Use groups of options

-

Groups of options can also be given as independent config files:

-
$ python trainer.py fit --trainer trainer.yaml --model model.yaml --data data.yaml [...]
-
-
-
-
-
-

Run from cloud yaml configs

-

For certain enterprise workloads, Lightning CLI supports running from hosted configs:

-
$ python trainer.py [subcommand] --config s3://bucket/config.yaml
-
-
-

For more options, refer to Remote filesystems.

-
-
-
-

Use a config via environment variables

-

For certain CI/CD systems, it’s useful to pass in config files as environment variables:

-
$ python trainer.py fit --trainer "$TRAINER_CONFIG" --model "$MODEL_CONFIG" [...]
-
-
-
-
-
-

Run from environment variables directly

-

The Lightning CLI can convert every possible CLI flag into an environment variable. To enable this, set the env_parse argument:

-
LightningCLI(env_parse=True)
-
-
-

now use the --help CLI flag with any subcommand:

-
$ python main.py fit --help
-
-
-

which will show you ALL possible environment variables you can now set:

-
usage: main.py [options] fit [-h] [-c CONFIG]
-                            [--trainer.max_epochs MAX_EPOCHS] [--trainer.min_epochs MIN_EPOCHS]
-                            [--trainer.max_steps MAX_STEPS] [--trainer.min_steps MIN_STEPS]
-                            ...
-                            [--ckpt_path CKPT_PATH]
-
-optional arguments:
-...
---model CONFIG        Path to a configuration file.
---model.out_dim OUT_DIM
-                        (type: int, default: 10)
---model.learning_rate LEARNING_RATE
-                        (type: float, default: 0.02)
-
-
-

now you can customize the behavior via environment variables:

-
# set the options via env vars
-$ export LEARNING_RATE=0.01
-$ export OUT_DIM=5
-
-$ python main.py fit
-
-
-
-
-
-

Set default config files

-

To set a path to a config file of defaults, use the default_config_files argument:

-
cli = LightningCLI(MyModel, MyDataModule, parser_kwargs={"default_config_files": ["my_cli_defaults.yaml"]})
-
-
-

or if you want defaults per subcommand:

-
cli = LightningCLI(MyModel, MyDataModule, parser_kwargs={"fit": {"default_config_files": ["my_fit_defaults.yaml"]}})
-
-
-

For more configuration options, refer to the ArgumentParser API documentation.

-
-
-
-

Enable variable interpolation

-

In certain cases where multiple configs need to share variables, consider using variable interpolation. Variable interpolation -allows you to add variables to your yaml configs like so:

-
model:
-  encoder_layers: 12
-  decoder_layers:
-  - ${model.encoder_layers}
-  - 4
-
-
-

To enable variable interpolation, first install omegaconf:

-
pip install omegaconf
-
-
-

Once this is installed, the Lightning CLI will automatically handle variables in yaml files:

-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/cli/lightning_cli_advanced_3.html b/docs/cli/lightning_cli_advanced_3.html deleted file mode 100644 index cd317c9..0000000 --- a/docs/cli/lightning_cli_advanced_3.html +++ /dev/null @@ -1,1004 +0,0 @@ - - - - - - - - - - - - - - Instantiation only mode — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Instantiation only mode
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Instantiation only mode

-

The CLI is designed to start fitting with minimal code changes. On class instantiation, the CLI will automatically -call the trainer function associated to the subcommand provided so you don’t have to do it. -To avoid this, you can set the following argument:

-
cli = LightningCLI(MyModel, run=False)  # True by default
-# you'll have to call fit yourself:
-cli.trainer.fit(cli.model)
-
-
-

In this mode, there are no subcommands added to the parser. -This can be useful to implement custom logic without having to subclass the CLI, but still using the CLI’s instantiation -and argument parsing capabilities.

-
-
-

Subclass registration

-

To use shorthand notation, the options need to be registered beforehand. This can be easily done with:

-
LightningCLI(auto_registry=True)  # False by default
-
-
-

which will register all subclasses of torch.optim.Optimizer, torch.optim.lr_scheduler._LRScheduler, -LightningModule, -LightningDataModule, Callback, and -LightningLoggerBase across all imported modules. This includes those in your own -code.

-

Alternatively, if this is left unset, only the subclasses defined in PyTorch’s torch.optim.Optimizer, -torch.optim.lr_scheduler._LRScheduler and Lightning’s Callback and -LightningLoggerBase subclasses will be registered.

-

In subsequent sections, we will go over adding specific classes to specific registries as well as how to use -shorthand notation.

-
-
-

Trainer Callbacks and arguments with class type

-

A very important argument of the Trainer class is the callbacks. In -contrast to other more simple arguments which just require numbers or strings, callbacks expects a list of -instances of subclasses of Callback. To specify this kind of argument in a config -file, each callback must be given as a dictionary including a class_path entry with an import path of the class, -and optionally an init_args entry with arguments required to instantiate it. Therefore, a simple configuration -file example that defines a couple of callbacks is the following:

-
trainer:
-  callbacks:
-    - class_path: pytorch_lightning.callbacks.EarlyStopping
-      init_args:
-        patience: 5
-    - class_path: pytorch_lightning.callbacks.LearningRateMonitor
-      init_args:
-        ...
-
-
-

Similar to the callbacks, any arguments in Trainer and user extended -LightningModule and -LightningDataModule classes that have as type hint a class can be configured -the same way using class_path and init_args.

-

For callbacks in particular, Lightning simplifies the command line so that only -the Callback name is required. -The argument’s order matters and the user needs to pass the arguments in the following way.

-
$ python ... \
-    --trainer.callbacks={CALLBACK_1_NAME} \
-    --trainer.callbacks.{CALLBACK_1_ARGS_1}=... \
-    --trainer.callbacks.{CALLBACK_1_ARGS_2}=... \
-    ...
-    --trainer.callbacks={CALLBACK_N_NAME} \
-    --trainer.callbacks.{CALLBACK_N_ARGS_1}=... \
-    ...
-
-
-

Here is an example:

-
$ python ... \
-    --trainer.callbacks=EarlyStopping \
-    --trainer.callbacks.patience=5 \
-    --trainer.callbacks=LearningRateMonitor \
-    --trainer.callbacks.logging_interval=epoch
-
-
-

Lightning provides a mechanism for you to add your own callbacks and benefit from the command line simplification -as described above:

-
from pytorch_lightning.utilities.cli import CALLBACK_REGISTRY
-
-
-@CALLBACK_REGISTRY
-class CustomCallback(Callback):
-    ...
-
-
-cli = LightningCLI(...)
-
-
-
$  python ... --trainer.callbacks=CustomCallback ...
-
-
-
-

Note

-

This shorthand notation is only supported in the shell and not inside a configuration file. The configuration file -generated by calling the previous command with --print_config will have the class_path notation.

-
trainer:
-  callbacks:
-    - class_path: your_class_path.CustomCallback
-      init_args:
-        ...
-
-
-
-
-

Tip

-

--trainer.logger also supports shorthand notation and a LOGGER_REGISTRY is available to register custom -Loggers.

-
-
-
-

Multiple models and/or datasets

-

Additionally, the tool can be configured such that a model and/or a datamodule is -specified by an import path and init arguments. For example, with a tool implemented as:

-
cli = LightningCLI(MyModelBaseClass, MyDataModuleBaseClass, subclass_mode_model=True, subclass_mode_data=True)
-
-
-

A possible config file could be as follows:

-
model:
-  class_path: mycode.mymodels.MyModel
-  init_args:
-    decoder_layers:
-    - 2
-    - 4
-    encoder_layers: 12
-data:
-  class_path: mycode.mydatamodules.MyDataModule
-  init_args:
-    ...
-trainer:
-  callbacks:
-    - class_path: pytorch_lightning.callbacks.EarlyStopping
-      init_args:
-        patience: 5
-    ...
-
-
-

Only model classes that are a subclass of MyModelBaseClass would be allowed, and similarly only subclasses of -MyDataModuleBaseClass. If as base classes LightningModule and -LightningDataModule are given, then the tool would allow any lightning -module and data module.

-
-

Tip

-

Note that with the subclass modes the --help option does not show information for a specific subclass. To -get help for a subclass the options --model.help and --data.help can be used, followed by the -desired class path. Similarly --print_config does not include the settings for a particular subclass. To -include them the class path should be given before the --print_config option. Examples for both help and -print config are:

-
$ python trainer.py fit --model.help mycode.mymodels.MyModel
-$ python trainer.py fit --model mycode.mymodels.MyModel --print_config
-
-
-
-
-
-

Models with multiple submodules

-

Many use cases require several modules, each with its own configurable options. One possible way to handle this -with LightningCLI is to implement a single module that takes each of the submodules as an init parameter. Since the init -parameters have a class as their type, in the configuration these would be specified with class_path and -init_args entries. For instance, a model could be implemented as:

-
class MyMainModel(LightningModule):
-    def __init__(self, encoder: nn.Module, decoder: nn.Module):
-        """Example encoder-decoder submodules model
-
-        Args:
-            encoder: Instance of a module for encoding
-            decoder: Instance of a module for decoding
-        """
-        super().__init__()
-        self.encoder = encoder
-        self.decoder = decoder
-
-
-

If the CLI is implemented as LightningCLI(MyMainModel) the configuration would be as follows:

-
model:
-  encoder:
-    class_path: mycode.myencoders.MyEncoder
-    init_args:
-      ...
-  decoder:
-    class_path: mycode.mydecoders.MyDecoder
-    init_args:
-      ...
-
-
-

It is also possible to combine subclass_mode_model=True and submodules, thereby having two levels of -class_path.

-
-
-

Class type defaults

-

The support for classes as type hints allows to try many possibilities with the same CLI. This is a useful feature, but -it can make it tempting to use an instance of a class as a default. For example:

-
class MyMainModel(LightningModule):
-    def __init__(
-        self,
-        backbone: torch.nn.Module = MyModel(encoder_layers=24),  # BAD PRACTICE!
-    ):
-        super().__init__()
-        self.backbone = backbone
-
-
-

Normally classes are mutable as it is in this case. The instance of MyModel would be created the moment that the -module that defines MyMainModel is first imported. This means that the default of backbone will be -initialized before the CLI class runs seed_everything making it non-reproducible. Furthermore, if -MyMainModel is used more than once in the same Python process and the backbone parameter is not -overridden, the same instance would be used in multiple places which very likely is not what the developer intended. -Having an instance as default also makes it impossible to generate the complete config file since for arbitrary classes -it is not known which arguments were used to instantiate it.

-

A good solution to these problems is to not have a default or set the default to a special value (e.g. a -string) which would be checked in the init and instantiated accordingly. If a class parameter has no default and the CLI -is subclassed then a default can be set as follows:

-
default_backbone = {
-    "class_path": "import.path.of.MyModel",
-    "init_args": {
-        "encoder_layers": 24,
-    },
-}
-
-
-class MyLightningCLI(LightningCLI):
-    def add_arguments_to_parser(self, parser):
-        parser.set_defaults({"model.backbone": default_backbone})
-
-
-

A more compact version that avoids writing a dictionary would be:

-
from jsonargparse import lazy_instance
-
-
-class MyLightningCLI(LightningCLI):
-    def add_arguments_to_parser(self, parser):
-        parser.set_defaults({"model.backbone": lazy_instance(MyModel, encoder_layers=24)})
-
-
-
-
-

Optimizers

-

If you will not be changing the class, you can manually add the arguments for specific optimizers and/or -learning rate schedulers by subclassing the CLI. This has the advantage of providing the proper help message for those -classes. The following code snippet shows how to implement it:

-
class MyLightningCLI(LightningCLI):
-    def add_arguments_to_parser(self, parser):
-        parser.add_optimizer_args(torch.optim.Adam)
-        parser.add_lr_scheduler_args(torch.optim.lr_scheduler.ExponentialLR)
-
-
-

With this, in the config the optimizer and lr_scheduler groups would accept all of the options for the -given classes, in this example Adam and ExponentialLR. -Therefore, the config file would be structured like:

-
optimizer:
-  lr: 0.01
-lr_scheduler:
-  gamma: 0.2
-model:
-  ...
-trainer:
-  ...
-
-
-

Where the arguments can be passed directly through command line without specifying the class. For example:

-
$ python trainer.py fit --optimizer.lr=0.01 --lr_scheduler.gamma=0.2
-
-
-

The automatic implementation of configure_optimizers can be disabled by linking the configuration group. An -example can be when one wants to add support for multiple optimizers:

-
from pytorch_lightning.utilities.cli import instantiate_class
-
-
-class MyModel(LightningModule):
-    def __init__(self, optimizer1_init: dict, optimizer2_init: dict):
-        super().__init__()
-        self.optimizer1_init = optimizer1_init
-        self.optimizer2_init = optimizer2_init
-
-    def configure_optimizers(self):
-        optimizer1 = instantiate_class(self.parameters(), self.optimizer1_init)
-        optimizer2 = instantiate_class(self.parameters(), self.optimizer2_init)
-        return [optimizer1, optimizer2]
-
-
-class MyLightningCLI(LightningCLI):
-    def add_arguments_to_parser(self, parser):
-        parser.add_optimizer_args(
-            OPTIMIZER_REGISTRY.classes, nested_key="gen_optimizer", link_to="model.optimizer1_init"
-        )
-        parser.add_optimizer_args(
-            OPTIMIZER_REGISTRY.classes, nested_key="gen_discriminator", link_to="model.optimizer2_init"
-        )
-
-
-cli = MyLightningCLI(MyModel)
-
-
-

The value given to optimizer*_init will always be a dictionary including class_path and -init_args entries. The function instantiate_class() -takes care of importing the class defined in class_path and instantiating it using some positional arguments, -in this case self.parameters(), and the init_args. -Any number of optimizers and learning rate schedulers can be added when using link_to.

-

With shorthand notation:

-
$ python trainer.py fit \
-    --gen_optimizer=Adam \
-    --gen_optimizer.lr=0.01 \
-    --gen_discriminator=AdamW \
-    --gen_discriminator.lr=0.0001
-
-
-

You can also pass the class path directly, for example, if the optimizer hasn’t been registered to the -OPTIMIZER_REGISTRY:

-
$ python trainer.py fit \
-    --gen_optimizer.class_path=torch.optim.Adam \
-    --gen_optimizer.init_args.lr=0.01 \
-    --gen_discriminator.class_path=torch.optim.AdamW \
-    --gen_discriminator.init_args.lr=0.0001
-
-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/cli/lightning_cli_expert.html b/docs/cli/lightning_cli_expert.html deleted file mode 100644 index 1d4599e..0000000 --- a/docs/cli/lightning_cli_expert.html +++ /dev/null @@ -1,870 +0,0 @@ - - - - - - - - - - - - - - Eliminate config boilerplate (Advanced) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Eliminate config boilerplate (Advanced)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Eliminate config boilerplate (Advanced)

-

Audience: Users who already understand the LightningCLI and want to customize it.

-
-
-

Customize the LightningCLI

-

The init parameters of the LightningCLI class can be used to customize some -things, namely: the description of the tool, enabling parsing of environment variables and additional arguments to -instantiate the trainer and configuration parser.

-

Nevertheless, the init arguments are not enough for many use cases. For this reason the class is designed so that it can be -extended to customize different parts of the command line tool. The argument parser class used by -LightningCLI is -LightningArgumentParser which is an extension of Python’s argparse, thus -adding arguments can be done using the add_argument() method. In contrast to argparse it has additional methods to -add arguments, for example add_class_arguments() adds all arguments from the init of a class, though requiring -parameters to have type hints. For more details about this please refer to the respective documentation.

-

The LightningCLI class has the -add_arguments_to_parser() method which can be implemented to include -more arguments. After parsing, the configuration is stored in the config attribute of the class instance. The -LightningCLI class also has two methods that can be used to run code before -and after the trainer runs: before_<subcommand> and after_<subcommand>. -A realistic example for these would be to send an email before and after the execution. -The code for the fit subcommand would be something like:

-
class MyLightningCLI(LightningCLI):
-    def add_arguments_to_parser(self, parser):
-        parser.add_argument("--notification_email", default="will@email.com")
-
-    def before_fit(self):
-        send_email(address=self.config["notification_email"], message="trainer.fit starting")
-
-    def after_fit(self):
-        send_email(address=self.config["notification_email"], message="trainer.fit finished")
-
-
-cli = MyLightningCLI(MyModel)
-
-
-

Note that the config object self.config is a dictionary whose keys are global options or groups of options. It -has the same structure as the yaml format described previously. This means for instance that the parameters used for -instantiating the trainer class can be found in self.config['fit']['trainer'].

-
-

Tip

-

Have a look at the LightningCLI class API reference to learn about other -methods that can be extended to customize a CLI.

-
-
-
-
-

Configure forced callbacks

-

As explained previously, any Lightning callback can be added by passing it through command line or -including it in the config via class_path and init_args entries.

-

However, certain callbacks MUST be coupled with a model so they are always present and configurable. -This can be implemented as follows:

-
from pytorch_lightning.callbacks import EarlyStopping
-
-
-class MyLightningCLI(LightningCLI):
-    def add_arguments_to_parser(self, parser):
-        parser.add_lightning_class_args(EarlyStopping, "my_early_stopping")
-        parser.set_defaults({"my_early_stopping.monitor": "val_loss", "my_early_stopping.patience": 5})
-
-
-cli = MyLightningCLI(MyModel)
-
-
-

To change the configuration of the EarlyStopping in the config it would be:

-
model:
-  ...
-trainer:
-  ...
-my_early_stopping:
-  patience: 5
-
-
-
-

Note

-

The example above overrides a default in add_arguments_to_parser. This is included to show that defaults can -be changed if needed. However, note that overriding of defaults in the source code is not intended to be used to -store the best hyperparameters for a task after experimentation. To ease reproducibility the source code should be -stable. It is better practice to store the best hyperparameters for a task in a configuration file independent from -the source code.

-
-
-
-
-

Class type defaults

-

The support for classes as type hints allows to try many possibilities with the same CLI. This is a useful feature, but -it can make it tempting to use an instance of a class as a default. For example:

-
class MyMainModel(LightningModule):
-    def __init__(
-        self,
-        backbone: torch.nn.Module = MyModel(encoder_layers=24),  # BAD PRACTICE!
-    ):
-        super().__init__()
-        self.backbone = backbone
-
-
-

Normally classes are mutable as it is in this case. The instance of MyModel would be created the moment that the -module that defines MyMainModel is first imported. This means that the default of backbone will be -initialized before the CLI class runs seed_everything making it non-reproducible. Furthermore, if -MyMainModel is used more than once in the same Python process and the backbone parameter is not -overridden, the same instance would be used in multiple places which very likely is not what the developer intended. -Having an instance as default also makes it impossible to generate the complete config file since for arbitrary classes -it is not known which arguments were used to instantiate it.

-

A good solution to these problems is to not have a default or set the default to a special value (e.g. a -string) which would be checked in the init and instantiated accordingly. If a class parameter has no default and the CLI -is subclassed then a default can be set as follows:

-
default_backbone = {
-    "class_path": "import.path.of.MyModel",
-    "init_args": {
-        "encoder_layers": 24,
-    },
-}
-
-
-class MyLightningCLI(LightningCLI):
-    def add_arguments_to_parser(self, parser):
-        parser.set_defaults({"model.backbone": default_backbone})
-
-
-

A more compact version that avoids writing a dictionary would be:

-
from jsonargparse import lazy_instance
-
-
-class MyLightningCLI(LightningCLI):
-    def add_arguments_to_parser(self, parser):
-        parser.set_defaults({"model.backbone": lazy_instance(MyModel, encoder_layers=24)})
-
-
-
-
-
-

Connect two config files

-

Another case in which it might be desired to extend LightningCLI is that the -model and data module depend on a common parameter. For example in some cases both classes require to know the -batch_size. It is a burden and error prone giving the same value twice in a config file. To avoid this the -parser can be configured so that a value is only given once and then propagated accordingly. With a tool implemented -like shown below, the batch_size only has to be provided in the data section of the config.

-
class MyLightningCLI(LightningCLI):
-    def add_arguments_to_parser(self, parser):
-        parser.link_arguments("data.batch_size", "model.batch_size")
-
-
-cli = MyLightningCLI(MyModel, MyDataModule)
-
-
-

The linking of arguments is observed in the help of the tool, which for this example would look like:

-
$ python trainer.py fit --help
-  ...
-    --data.batch_size BATCH_SIZE
-                          Number of samples in a batch (type: int, default: 8)
-
-  Linked arguments:
-    model.batch_size <-- data.batch_size
-                          Number of samples in a batch (type: int)
-
-
-

Sometimes a parameter value is only available after class instantiation. An example could be that your model requires -the number of classes to instantiate its fully connected layer (for a classification task) but the value is not -available until the data module has been instantiated. The code below illustrates how to address this.

-
class MyLightningCLI(LightningCLI):
-    def add_arguments_to_parser(self, parser):
-        parser.link_arguments("data.num_classes", "model.num_classes", apply_on="instantiate")
-
-
-cli = MyLightningCLI(MyClassModel, MyDataModule)
-
-
-

Instantiation links are used to automatically determine the order of instantiation, in this case data first.

-
-

Tip

-

The linking of arguments can be used for more complex cases. For example to derive a value via a function that takes -multiple settings as input. For more details have a look at the API of link_arguments.

-
-

The linking of arguments is intended for things that are meant to be non-configurable. This improves the CLI user -experience since it avoids the need for providing more parameters. A related concept is -variable interpolation which, in contrast, keeps things configurable.

-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/cli/lightning_cli_faq.html b/docs/cli/lightning_cli_faq.html deleted file mode 100644 index 2f48f3a..0000000 --- a/docs/cli/lightning_cli_faq.html +++ /dev/null @@ -1,768 +0,0 @@ - - - - - - - - - - - - - - Eliminate config boilerplate (expert) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Eliminate config boilerplate (expert)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Eliminate config boilerplate (expert)

-
-

Troubleshooting

-

The standard behavior for CLIs, when they fail, is to terminate the process with a non-zero exit code and a short message -to hint the user about the cause. This is problematic while developing the CLI since there is no information to track -down the root of the problem. A simple change in the instantiation of the LightningCLI can be used such that when -there is a failure an exception is raised and the full stack trace printed.

-
cli = LightningCLI(MyModel, parser_kwargs={"error_handler": None})
-
-
-
-

Note

-

When asking about problems and reporting issues please set the error_handler to None and include the stack -trace in your description. With this, it is more likely for people to help out identifying the cause without needing -to create a reproducible script.

-
-
-
-
-

Reproducibility with the LightningCLI

-

The topic of reproducibility is complex and it is impossible to guarantee reproducibility by just providing a class that -people can use in unexpected ways. Nevertheless, the LightningCLI tries to -give a framework and recommendations to make reproducibility simpler.

-

When an experiment is run, it is good practice to use a stable version of the source code, either being a released -package or at least a commit of some version controlled repository. For each run of a CLI the config file is -automatically saved including all settings. This is useful to figure out what was done for a particular run without -requiring to look at the source code. If by mistake the exact version of the source code is lost or some defaults -changed, having the full config means that most of the information is preserved.

-

The class is targeted at implementing CLIs because running a command from a shell provides a separation with the Python -source code. Ideally the CLI would be placed in your path as part of the installation of a stable package, instead of -running from a clone of a repository that could have uncommitted local modifications. Creating installable packages that -include CLIs is out of the scope of this document. This is mentioned only as a teaser for people who would strive for -the best practices possible.

-

For every CLI implemented, users are encouraged to learn how to run it by reading the documentation printed with the ---help option and use the --print_config option to guide the writing of config files. A few more details -that might not be clear by only reading the help are the following.

-

LightningCLI is based on argparse and as such follows the same argument style -as many POSIX command line tools. Long options are prefixed with two dashes and their corresponding values should be -separated from them by a space or an equal sign, as --option value or --option=value. Command line options -are parsed from left to right, therefore if a setting appears multiple times the rightmost value will override -the previous ones. If a class has an init parameter that is required (i.e. no default value), it is given as ---option which makes it explicit and more readable instead of relying on positional arguments.

-
-
-
-

What is a subcommand?

-

A subcommand is the action the LightningCLI applies to the script:

-
python main.py [subcommand]
-
-
-

See the potential subcommands with:

-
python main.py --help
-
-
-

which prints:

-
...
-
-fit                 Runs the full optimization routine.
-validate            Perform one evaluation epoch over the validation set.
-test                Perform one evaluation epoch over the test set.
-predict             Run inference on your data.
-tune                Runs routines to tune hyperparameters before training.
-
-
-

Use a subcommand as follows:

-
python main.py fit
-python main.py test
-
-
-
-
-
-

What is the CLI?

-

CLI is short for commandline interface. Use your terminal to enter these commands.

-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/cli/lightning_cli_intermediate.html b/docs/cli/lightning_cli_intermediate.html deleted file mode 100644 index b81f240..0000000 --- a/docs/cli/lightning_cli_intermediate.html +++ /dev/null @@ -1,862 +0,0 @@ - - - - - - - - - - - - - - Eliminate config boilerplate (Intermediate) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Eliminate config boilerplate (Intermediate)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Eliminate config boilerplate (Intermediate)

-

Audience: Users who want advanced modularity via the commandline interface (CLI).

-

Pre-reqs: You must already understand how to use a commandline and LightningDataModule.

-
-
-

What is config boilerplate?

-

As Lightning projects grow in complexity it becomes desirable to enable full customizability from the commandline (CLI) so you can -change any hyperparameters without changing your code:

-
# Mix and match anything
-$ python main.py --command fit --model.learning_rate 0.02
-$ python main.py --command fit --model.learning_rate 0.01 --trainer.fast_dev_run True
-
-
-

This is what the Lightning CLI enables. Without the Lightning CLI, you usually end up with a TON of boilerplate that looks like this:

-
from argparse import ArgumentParser
-
-if __name__ == "__main__":
-    parser = ArgumentParser()
-    parser.add_argument("--learning_rate_1", default=0.02)
-    parser.add_argument("--learning_rate_2", default=0.03)
-    parser.add_argument("--model", default="cnn")
-    parser.add_argument("--command", default="fit")
-    parser.add_argument("--run_fast", default=True)
-    ...
-    # add 100 more of these
-    ...
-
-    args = parser.parse_args()
-
-    if args.model == "cnn":
-        model = ConvNet(learning_rate=args.learning_rate_1)
-    elif args.model == "transformer":
-        model = Transformer(learning_rate=args.learning_rate_2)
-    trainer = Trainer(fast_dev_run=args.run_fast)
-    ...
-
-    if args.command == "fit":
-        trainer.fit()
-    elif args.command == "test":
-        ...
-
-
-

This kind of boilerplate is unsustainable as projects grow in complexity.

-
-
-
-

Enable the Lightning CLI

-

To enable the Lightning CLI install the extras:

-
pip install pytorch-lightning[extra]
-
-
-

If the above fails, install only jsonargparse:

-
pip install -U jsonargparse[signatures]
-
-
-
-
-
-

Connect a model to the CLI

-

The simplest way to control a model with the CLI is to wrap it in the LightningCLI object:

-
# main.py
-
-import torch
-from pytorch_lightning.utilities.cli import LightningCLI
-from pytorch_lightning import LightningModule, demos
-
-
-class DemoModel(LightningModule):
-    def __init__(self, out_dim: int = 10, learning_rate: float = 0.02):
-        super().__init__()
-        self.l1 = torch.nn.Linear(32, out_dim)
-        self.learning_rate = learning_rate
-
-    def forward(self, x):
-        return torch.relu(self.l1(x.view(x.size(0), -1)))
-
-    def training_step(self, batch, batch_nb):
-        x = batch
-        x = self(x)
-        loss = x.sum()
-        return loss
-
-    def configure_optimizers(self):
-        return torch.optim.Adam(self.parameters(), lr=self.learning_rate)
-
-
-cli = LightningCLI(DemoModel, demos.BoringDataModule)
-# don't call fit!!
-
-
-

Now your model can be managed via the CLI. To see the available commands type:

-
$ python main.py --help
-
-
-

Which prints out:

-
usage: a.py [-h] [-c CONFIG] [--print_config [={comments,skip_null,skip_default}+]]
-        {fit,validate,test,predict,tune} ...
-
-pytorch-lightning trainer command line tool
-
-optional arguments:
--h, --help            Show this help message and exit.
--c CONFIG, --config CONFIG
-                        Path to a configuration file in json or yaml format.
---print_config [={comments,skip_null,skip_default}+]
-                        Print configuration and exit.
-
-subcommands:
-For more details of each subcommand add it as argument followed by --help.
-
-{fit,validate,test,predict,tune}
-    fit                 Runs the full optimization routine.
-    validate            Perform one evaluation epoch over the validation set.
-    test                Perform one evaluation epoch over the test set.
-    predict             Run inference on your data.
-    tune                Runs routines to tune hyperparameters before training.
-
-
-

The message tells us that we have a few available subcommands:

-
python main.py [subcommand]
-
-
-

which you can use depending on your use case:

-
$ python main.py fit
-$ python main.py validate
-$ python main.py test
-$ python main.py predict
-$ python main.py tune
-
-
-
-
-
-

Train a model with the CLI

-

To run the full training routine (train, val, test), use the subcommand fit:

-
python main.py fit
-
-
-

View all available options with the --help command:

-
usage: main.py [options] fit [-h] [-c CONFIG]
-                            [--seed_everything SEED_EVERYTHING] [--trainer CONFIG]
-                            ...
-                            [--ckpt_path CKPT_PATH]
-    --trainer.logger LOGGER
-
-optional arguments:
-<class '__main__.DemoModel'>:
-    --model.out_dim OUT_DIM
-                            (type: int, default: 10)
-    --model.learning_rate LEARNING_RATE
-                            (type: float, default: 0.02)
-<class 'pytorch_lightning.demos.boring_classes.BoringDataModule'>:
---data CONFIG         Path to a configuration file.
---data.data_dir DATA_DIR
-                        (type: str, default: ./)
-
-
-

With the Lightning CLI enabled, you can now change the parameters without touching your code:

-
# change the out dimensions
-python main.py fit --model.out_dim 30
-
-# change the learning_rate also
-python main.py fit --model.out_dim 10 --model.learning_rate 0.1
-
-# change trainer and data arguments too
-python main.py fit --model.out_dim 2 --model.learning_rate 0.1 --data.data_dir '~/' --trainer.logger False
-
-
-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/cli/lightning_cli_intermediate_2.html b/docs/cli/lightning_cli_intermediate_2.html deleted file mode 100644 index 3c176d9..0000000 --- a/docs/cli/lightning_cli_intermediate_2.html +++ /dev/null @@ -1,900 +0,0 @@ - - - - - - - - - - - - - - Eliminate config boilerplate (intermediate) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Eliminate config boilerplate (intermediate)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Eliminate config boilerplate (intermediate)

-

Audience: Users who have multiple models and datasets per project.

-

Pre-reqs: You must have read (Control it all from the CLI).

-
-
-

Why do I want to mix models and datasets?

-

Lightning projects usually begin with one model and one dataset. As the project grows in complexity and you introduce more models and more datasets, it becomes desirable -to mix any model with any dataset directly from the commandline without changing your code.

-
# Mix and match anything
-$ python main.py fit --model=GAN --data=MNIST
-$ python main.py fit --model=Transformer --data=MNIST
-
-
-

This is what the Lightning CLI enables. Otherwise, this kind of configuration requires a significant amount of boilerplate that often looks like this:

-
# choose model
-if args.model == "gan":
-    model = GAN(args.feat_dim)
-elif args.model == "transformer":
-    model = Transformer(args.feat_dim)
-...
-
-# choose datamodule
-if args.data == "MNIST":
-    datamodule = MNIST()
-elif args.data == "imagenet":
-    datamodule = Imagenet()
-...
-
-# mix them!
-trainer.fit(model, datamodule)
-
-
-
-
-
-

Register LightningModules

-

Connect models across different files with the MODEL_REGISTRY to make them available from the CLI:

-
# main.py
-
-from pytorch_lightning import demos
-from pytorch_lightning.utilities import cli as pl_cli
-
-
-@pl_cli.MODEL_REGISTRY
-class Model1(demos.DemoModel):
-    def configure_optimizers(self):
-        print("⚡", "using Model1", "⚡")
-        return super().configure_optimizers()
-
-
-@pl_cli.MODEL_REGISTRY
-class Model2(demos.DemoModel):
-    def configure_optimizers(self):
-        print("⚡", "using Model2", "⚡")
-        return super().configure_optimizers()
-
-
-cli = pl_cli.LightningCLI(datamodule_class=demos.BoringDataModule)
-
-
-

Now you can choose between any model from the CLI:

-
# use Model1
-python main.py fit --model Model1
-
-# use Model2
-python main.py fit --model Model2
-
-
-
-
-
-

Register DataModules

-

Connect DataModules across different files with the DATAMODULE_REGISTRY to make them available from the CLI:

-
# main.py
-import torch
-from pytorch_lightning.utilities import cli as pl_cli
-from pytorch_lightning import demos
-
-
-@pl_cli.DATAMODULE_REGISTRY
-class FakeDataset1(demos.BoringDataModule):
-    def train_dataloader(self):
-        print("⚡", "using FakeDataset1", "⚡")
-        return torch.utils.data.DataLoader(self.random_train)
-
-
-@pl_cli.DATAMODULE_REGISTRY
-class FakeDataset2(demos.BoringDataModule):
-    def train_dataloader(self):
-        print("⚡", "using FakeDataset2", "⚡")
-        return torch.utils.data.DataLoader(self.random_train)
-
-
-cli = pl_cli.LightningCLI(demos.DemoModel)
-
-
-

Now you can choose between any dataset at runtime:

-
# use FakeDataset1
-python main.py fit --data FakeDataset1
-
-# use FakeDataset2
-python main.py fit --data FakeDataset2
-
-
-
-
-
-

Register optimizers

-

Connect optimizers with the OPTIMIZER_REGISTRY to make them available from the CLI:

-
# main.py
-import torch
-from pytorch_lightning.utilities import cli as pl_cli
-from pytorch_lightning import demos
-
-
-@pl_cli.OPTIMIZER_REGISTRY
-class LitAdam(torch.optim.Adam):
-    def step(self, closure):
-        print("⚡", "using LitAdam", "⚡")
-        super().step(closure)
-
-
-@pl_cli.OPTIMIZER_REGISTRY
-class FancyAdam(torch.optim.Adam):
-    def step(self, closure):
-        print("⚡", "using FancyAdam", "⚡")
-        super().step(closure)
-
-
-cli = pl_cli.LightningCLI(demos.DemoModel, demos.BoringDataModule)
-
-
-

Now you can choose between any optimizer at runtime:

-
# use LitAdam
-python main.py fit --optimizer LitAdam
-
-# use FancyAdam
-python main.py fit --optimizer FancyAdam
-
-
-

Bonus: If you need only 1 optimizer, the Lightning CLI already works out of the box with any Optimizer from torch.optim:

-
python main.py fit --optimizer AdamW
-
-
-

If the optimizer you want needs other arguments, add them via the CLI (no need to change your code)!

-
python main.py fit --optimizer SGD --optimizer.lr=0.01
-
-
-
-
-
-

Register LR schedulers

-

Connect learning rate schedulers with the LR_SCHEDULER_REGISTRY to make them available from the CLI:

-
# main.py
-import torch
-from pytorch_lightning.utilities import cli as pl_cli
-from pytorch_lightning import demos
-
-
-@pl_cli.LR_SCHEDULER_REGISTRY
-class LitLRScheduler(torch.optim.lr_scheduler.CosineAnnealingLR):
-    def step(self):
-        print("⚡", "using LitLRScheduler", "⚡")
-        super().step()
-
-
-cli = pl_cli.LightningCLI(demos.DemoModel, demos.BoringDataModule)
-
-
-

Now you can choose between any learning rate scheduler at runtime:

-
# LitLRScheduler
-python main.py fit --lr_scheduler LitLRScheduler
-
-
-

Bonus: If you need only 1 LRScheduler, the Lightning CLI already works out of the box with any LRScheduler from torch.optim:

-
python main.py fit --lr_scheduler CosineAnnealingLR
-python main.py fit --lr_scheduler LinearLR
-...
-
-
-

If the scheduler you want needs other arguments, add them via the CLI (no need to change your code)!

-
python main.py fit --lr_scheduler=ReduceLROnPlateau --lr_scheduler.monitor=epoch
-
-
-
-
-
-

Register from any package

-

A shortcut to register many classes from a package is to use the register_classes method. Here we register all optimizers from the torch.optim library:

-
import torch
-from pytorch_lightning.utilities import cli as pl_cli
-from pytorch_lightning import demos
-
-# add all PyTorch optimizers!
-pl_cli.OPTIMIZER_REGISTRY.register_classes(module=torch.optim, base_cls=torch.optim.Optimizer)
-
-cli = pl_cli.LightningCLI(demos.DemoModel, demos.BoringDataModule)
-
-
-

Now use any of the optimizers in the torch.optim library:

-
python main.py fit --optimizer AdamW
-
-
-

This method is supported by all the registry classes.

-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/clouds/cloud_training.html b/docs/clouds/cloud_training.html deleted file mode 100644 index 9084678..0000000 --- a/docs/clouds/cloud_training.html +++ /dev/null @@ -1,760 +0,0 @@ - - - - - - - - - - - - - - Train on the cloud — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Train on the cloud
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Train on the cloud

-

Audience: Users who want to develop and train models on the cloud (public cloud, private cloud or onprem clusters).

-
-
-
-
-

Grid.ai is the official cloud training solution for PyTorch Lightning. Grid is designed to support researcher workloads at both academic labs and major companies.

-
-
- - -
- -
-
- - - - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- -
-
- -
-
-
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/clouds/cloud_training_intermediate.html b/docs/clouds/cloud_training_intermediate.html deleted file mode 100644 index f968b8b..0000000 --- a/docs/clouds/cloud_training_intermediate.html +++ /dev/null @@ -1,688 +0,0 @@ - - - - - - - - - - - - - - Train on the cloud (intermediate) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Train on the cloud (intermediate)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Train on the cloud (intermediate)

-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/clouds/cluster.html b/docs/clouds/cluster.html deleted file mode 100644 index 5c6673e..0000000 --- a/docs/clouds/cluster.html +++ /dev/null @@ -1,741 +0,0 @@ - - - - - - - - - - - - - - Run on an on-prem cluster — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Run on an on-prem cluster
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
- - -
-
- - - - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- -
- -
-
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/clouds/cluster_advanced.html b/docs/clouds/cluster_advanced.html deleted file mode 100644 index b6d898f..0000000 --- a/docs/clouds/cluster_advanced.html +++ /dev/null @@ -1,882 +0,0 @@ - - - - - - - - - - - - - - Run on an on-prem cluster (advanced) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Run on an on-prem cluster (advanced)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Run on an on-prem cluster (advanced)

-
-
-

Run on a SLURM managed cluster

-

Lightning automates the details behind training on a SLURM-powered cluster. In contrast to the general purpose -cluster above, the user does not start the jobs manually on each node and instead submits it to SLURM which -schedules the resources and time for which the job is allowed to run.

-
-
-
-

Design your training script

-

To train a model using multiple nodes, do the following:

-
    -
  1. Design your LightningModule (no need to add anything specific here).

  2. -
  3. Enable DDP in the trainer

    -
    # train on 32 GPUs across 4 nodes
    -trainer = Trainer(accelerator="gpu", devices=8, num_nodes=4, strategy="ddp")
    -
    -
    -
  4. -
  5. It’s a good idea to structure your training script like this:

    -
    # train.py
    -def main(hparams):
    -    model = LightningTemplateModel(hparams)
    -
    -    trainer = Trainer(accelerator="gpu", devices=8, num_nodes=4, strategy="ddp")
    -
    -    trainer.fit(model)
    -
    -
    -if __name__ == "__main__":
    -    root_dir = os.path.dirname(os.path.realpath(__file__))
    -    parser = ArgumentParser(add_help=False)
    -    hyperparams = parser.parse_args()
    -
    -    # TRAIN
    -    main(hyperparams)
    -
    -
    -
  6. -
  7. Create the appropriate SLURM job:

    -
    # (submit.sh)
    -#!/bin/bash -l
    -
    -# SLURM SUBMIT SCRIPT
    -#SBATCH --nodes=4
    -#SBATCH --gres=gpu:8
    -#SBATCH --ntasks-per-node=8
    -#SBATCH --mem=0
    -#SBATCH --time=0-02:00:00
    -
    -# activate conda env
    -source activate $1
    -
    -# debugging flags (optional)
    -export NCCL_DEBUG=INFO
    -export PYTHONFAULTHANDLER=1
    -
    -# on your cluster you might need these:
    -# set the network interface
    -# export NCCL_SOCKET_IFNAME=^docker0,lo
    -
    -# might need the latest CUDA
    -# module load NCCL/2.4.7-1-cuda.10.0
    -
    -# run script from above
    -srun python3 train.py
    -
    -
    -
  8. -
  9. If you want auto-resubmit (read below), add this line to the submit.sh script

    -
    #SBATCH --signal=SIGUSR1@90
    -
    -
    -
  10. -
  11. Submit the SLURM job

    -
    sbatch submit.sh
    -
    -
    -
  12. -
-
-
-
-

Enable auto wall-time resubmissions

-

When you use Lightning in a SLURM cluster, it automatically detects when it is about -to run into the wall time and does the following:

-
    -
  1. Saves a temporary checkpoint.

  2. -
  3. Requeues the job.

  4. -
  5. When the job starts, it loads the temporary checkpoint.

  6. -
-

To get this behavior make sure to add the correct signal to your SLURM script

-
# 90 seconds before training ends
-#SBATCH --signal=SIGUSR1@90
-
-
-

If auto-resubmit is not desired, it can be turned off in the SLURMEnvironment plugin:

-
from pytorch_lightning.plugins.environments import SLURMEnvironment
-
-trainer = Trainer(plugins=[SLURMEnvironment(auto_requeue=False)])
-
-
-
-
-
-

Build your SLURM script

-

Instead of manually building SLURM scripts, you can use the -SlurmCluster object -to do this for you. The SlurmCluster can also run a grid search if you pass -in a HyperOptArgumentParser.

-

Here is an example where you run a grid search of 9 combinations of hyperparameters. -See also the multi-node examples -here.

-
# grid search 3 values of learning rate and 3 values of number of layers for your net
-# this generates 9 experiments (lr=1e-3, layers=16), (lr=1e-3, layers=32),
-# (lr=1e-3, layers=64), ... (lr=1e-1, layers=64)
-parser = HyperOptArgumentParser(strategy="grid_search", add_help=False)
-parser.opt_list("--learning_rate", default=0.001, type=float, options=[1e-3, 1e-2, 1e-1], tunable=True)
-parser.opt_list("--layers", default=1, type=float, options=[16, 32, 64], tunable=True)
-hyperparams = parser.parse_args()
-
-# Slurm cluster submits 9 jobs, each with a set of hyperparams
-cluster = SlurmCluster(
-    hyperparam_optimizer=hyperparams,
-    log_path="/some/path/to/save",
-)
-
-# OPTIONAL FLAGS WHICH MAY BE CLUSTER DEPENDENT
-# which interface your nodes use for communication
-cluster.add_command("export NCCL_SOCKET_IFNAME=^docker0,lo")
-
-# see the output of the NCCL connection process
-# NCCL is how the nodes talk to each other
-cluster.add_command("export NCCL_DEBUG=INFO")
-
-# setting a main port here is a good idea.
-cluster.add_command("export MASTER_PORT=%r" % PORT)
-
-# ************** DON'T FORGET THIS ***************
-# MUST load the latest NCCL version
-cluster.load_modules(["NCCL/2.4.7-1-cuda.10.0"])
-
-# configure cluster
-cluster.per_experiment_nb_nodes = 12
-cluster.per_experiment_nb_gpus = 8
-
-cluster.add_slurm_cmd(cmd="ntasks-per-node", value=8, comment="1 task per gpu")
-
-# submit a script with 9 combinations of hyper params
-# (lr=1e-3, layers=16), (lr=1e-3, layers=32), (lr=1e-3, layers=64), ... (lr=1e-1, layers=64)
-cluster.optimize_parallel_cluster_gpu(
-    main, nb_trials=9, job_name="name_for_squeue"  # how many permutations of the grid search to run
-)
-
-
-

The other option is that you generate scripts on your own via a bash command or use our -native solution.

-
-
-
-

Get help

-

Setting up a cluster for distributed training is not trivial. Lightning offers lightning-grid which allows you to configure a cluster easily and run experiments via the CLI and web UI.

-

Try it out for free today:

-
- - -
- -
-
- - - - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/clouds/cluster_expert.html b/docs/clouds/cluster_expert.html deleted file mode 100644 index c0f6f39..0000000 --- a/docs/clouds/cluster_expert.html +++ /dev/null @@ -1,750 +0,0 @@ - - - - - - - - - - - - - - Run on an on-prem cluster (expert) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Run on an on-prem cluster (expert)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Run on an on-prem cluster (expert)

-
-
-

Integrate your own cluster

-

Lightning provides an interface for providing your own definition of a cluster environment. It mainly consists of -parsing the right environment variables to access information such as world size, global and local rank (process id), -and node rank (node id). Here is an example of a custom -ClusterEnvironment:

-
import os
-from pytorch_lightning.plugins.environments import ClusterEnvironment
-
-
-class MyClusterEnvironment(ClusterEnvironment):
-    @property
-    def creates_processes_externally(self) -> bool:
-        """Return True if the cluster is managed (you don't launch processes yourself)"""
-        return True
-
-    def world_size(self) -> int:
-        return int(os.environ["WORLD_SIZE"])
-
-    def global_rank(self) -> int:
-        return int(os.environ["RANK"])
-
-    def local_rank(self) -> int:
-        return int(os.environ["LOCAL_RANK"])
-
-    def node_rank(self) -> int:
-        return int(os.environ["NODE_RANK"])
-
-    def main_address(self) -> str:
-        return os.environ["MASTER_ADDRESS"]
-
-    def main_port(self) -> int:
-        return int(os.environ["MASTER_PORT"])
-
-
-trainer = Trainer(plugins=[MyClusterEnvironment()])
-
-
-
-
-
-

Get help

-

Setting up a cluster for distributed training is not trivial. Lightning offers lightning-grid which allows you to configure a cluster easily and run experiments via the CLI and web UI.

-

Try it out for free today:

-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/clouds/cluster_intermediate_1.html b/docs/clouds/cluster_intermediate_1.html deleted file mode 100644 index 4de1950..0000000 --- a/docs/clouds/cluster_intermediate_1.html +++ /dev/null @@ -1,767 +0,0 @@ - - - - - - - - - - - - - - Run on an on-prem cluster (intermediate) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Run on an on-prem cluster (intermediate)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Run on an on-prem cluster (intermediate)

-

Audience: Users who need to run on an academic or enterprise private cluster.

-
-
-

Set up the cluster

-

This guide shows how to run a training job on a general purpose cluster. We recommend that beginners try this method -first because it requires the least amount of configuration and changes to the code. -To set up a multi-node computing cluster you need:

-
    -
  1. Multiple computers with PyTorch Lightning installed

  2. -
  3. Network connectivity between them with firewall rules that allow traffic flow on a specified MASTER_PORT.

  4. -
  5. Defined environment variables on each node required for the PyTorch Lightning multi-node distributed training

  6. -
-

PyTorch Lightning follows the design of the PyTorch distributed communication package and requires the following environment variables to be defined on each node:

-
    -
  • MASTER_PORT - required; has to be a free port on machine with NODE_RANK 0

  • -
  • MASTER_ADDR - required (except for NODE_RANK 0); address of NODE_RANK 0 node

  • -
  • WORLD_SIZE - required; how many nodes are in the cluster

  • -
  • NODE_RANK - required; id of the node in the cluster

  • -
-
-
-
-

Set up the training script

-

To train a model using multiple nodes, do the following:

-
    -
  1. Design your LightningModule (no need to add anything specific here).

  2. -
  3. Enable DDP in the trainer

    -
    # train on 32 GPUs across 4 nodes
    -trainer = Trainer(accelerator="gpu", devices=8, num_nodes=4, strategy="ddp")
    -
    -
    -
  4. -
-
-
-
-

Submit a job to the cluster

-

To submit a training job to the cluster you need to run the same training script on each node of the cluster. -This means that you need to:

-
    -
  1. Copy all third-party libraries to each node (usually means - distribute requirements.txt file and install it).

  2. -
  3. Copy all your import dependencies and the script itself to each node.

  4. -
  5. Run the script on each node.

  6. -
-
-
-
-

Debug on a cluster

-

When running in DDP mode, some errors in your code can show up as an NCCL issue. -Set the NCCL_DEBUG=INFO environment variable to see the ACTUAL error.

-
NCCL_DEBUG=INFO python train.py ...
-
-
-
-
-
-

Get help

-

Setting up a cluster for distributed training is not trivial. Lightning offers lightning-grid which allows you to configure a cluster easily and run experiments via the CLI and web UI.

-

Try it out for free today:

-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/clouds/cluster_intermediate_2.html b/docs/clouds/cluster_intermediate_2.html deleted file mode 100644 index 0e99257..0000000 --- a/docs/clouds/cluster_intermediate_2.html +++ /dev/null @@ -1,744 +0,0 @@ - - - - - - - - - - - - - - Run on an on-prem cluster (intermediate) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Run on an on-prem cluster (intermediate)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Run on an on-prem cluster (intermediate)

-
-

Run with TorchDistributed

-

Torch Distributed Run provides helper functions to setup distributed environment variables from the PyTorch distributed communication package that need to be defined on each node.

-

Once the script is set up as described in Training Script Setup, you can run the command below across your nodes to start multi-node training.

-

Like a custom cluster, you have to ensure that there is network connectivity between the nodes with firewall rules that allow traffic flow on a specified MASTER_PORT.

-

Finally, you’ll need to decide which node you’d like to be the main node (MASTER_ADDR), and the ranks of each node (NODE_RANK).

-

For example:

-
    -
  • MASTER_ADDR 10.10.10.16

  • -
  • MASTER_PORT 29500

  • -
  • NODE_RANK 0 for the first node, 1 for the second node

  • -
-

Run the below command with the appropriate variables set on each node.

-
python -m torch.distributed.run
-    --nnodes=2 # number of nodes you'd like to run with
-    --master_addr <MASTER_ADDR>
-    --master_port <MASTER_PORT>
-    --node_rank <NODE_RANK>
-    train.py (--arg1 ... train script args...)
-
-
-
-

Note

-

torch.distributed.run assumes that you’d like to spawn a process per GPU if GPU devices are found on the node. This can be adjusted with --nproc_per_node.

-
-
-
-
-

Get help

-

Setting up a cluster for distributed training is not trivial. Lightning offers lightning-grid which allows you to configure a cluster easily and run experiments via the CLI and web UI.

-

Try it out for free today:

-
- - -
- -
-
- - - - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/clouds/fault_tolerant_training.html b/docs/clouds/fault_tolerant_training.html deleted file mode 100644 index 93e7376..0000000 --- a/docs/clouds/fault_tolerant_training.html +++ /dev/null @@ -1,732 +0,0 @@ - - - - - - - - - - - - - - Fault-tolerant Training — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Fault-tolerant Training
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
- - -
-
- - - - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- -
- -
-
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/clouds/fault_tolerant_training_basic.html b/docs/clouds/fault_tolerant_training_basic.html deleted file mode 100644 index 2c0dc20..0000000 --- a/docs/clouds/fault_tolerant_training_basic.html +++ /dev/null @@ -1,725 +0,0 @@ - - - - - - - - - - - - - - Fault-tolerant Training (basic) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Fault-tolerant Training (basic)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Fault-tolerant Training (basic)

-

Audience: Users who want to run on the cloud or a cluster environment.

-

Pre-requisites: Users must have first read Run on the cloud (basic)

-
-
-

What is fault-tolerant training?

-

When developing models on the cloud or cluster environments, you may be forced to restart from scratch in the event of a software or hardware failure (i.e., a fault). Lightning models can run fault-proof.

-

With Fault Tolerant Training, when Trainer.fit() fails in the middle of an epoch during training or validation, -Lightning will restart exactly where it failed, and everything will be restored (down to the batch it was on even if the dataset was shuffled).

-
-

Warning

-

Fault-tolerant Training is currently an experimental feature within Lightning.

-
-
-
-
-

Use fault-tolerance to save money on cloud training

-

Cloud providers offer pre-emptible machines which can be priced as low as 1/10th the cost but can be shut-down automatically at any time. -Because fault-tolerant training can automatically recover from an interruption, you can train models for many weeks/months at a time for the pre-emptible prices.

-

To easily run on the cloud with fault-tolerance with lightning-grid, use the following arguments:

-
grid run --use_spot --auto_resume lightning_script.py
-
-
-

The --use_spot argument enables cheap preemptible pricing (but the machines can be interrupted). -If the machine is interrupted, the --auto_resume argument automatically restarts the machine.

-

As long as you are running a script that runs a lightning model, the model will restore itself and handle all the details of fault tolerance.

-
-
-
-

Cost

-

Lightning (via lightning-grid) provides access to cloud machines to the community for free. However, you must buy credits on lightning-grid which are used to pay the cloud providers on your behalf.

-

If you want to run on your own AWS account and pay the cloud provider directly, please contact our onprem team: mailto:onprem@pytorchlightning.ai

-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/clouds/fault_tolerant_training_expert.html b/docs/clouds/fault_tolerant_training_expert.html deleted file mode 100644 index 92149d6..0000000 --- a/docs/clouds/fault_tolerant_training_expert.html +++ /dev/null @@ -1,714 +0,0 @@ - - - - - - - - - - - - - - Fault-tolerant Training (expert) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Fault-tolerant Training (expert)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Fault-tolerant Training (expert)

-

Audience: Experts looking to enable and handle their own fault-tolerance.

-

Pre-requisites: Users must have first read Fault-tolerant Training (basic)

-
-
-

Enable fault-tolerant behavior anywhere

-

To enable fault tolerance on your own cloud or cluster environment enable the PL_FAULT_TOLERANT_TRAINING environment variable:

-
PL_FAULT_TOLERANT_TRAINING=1 python script.py
-
-
-

Although Lightning will now be fault-tolerant, you’ll have to handle all the nuances of making sure the models are automatically restarted.

-
-

Note

-

This complexity is already handled for you if you use lightning-grid.

-
-
-
-
-

Enable fault-tolerant behavior on your own cluster

-

The simplest way to enable fault-tolerant behavior is to enable lightning-grid to work on your on-prem cluster or cloud environment which will handle all the nuances of fault-tolerant training at scale.

-

Email us to connect with your own cloud account:

-

mailto:onprem@pytorchlightning.ai

-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/clouds/fault_tolerant_training_faq.html b/docs/clouds/fault_tolerant_training_faq.html deleted file mode 100644 index d4d8190..0000000 --- a/docs/clouds/fault_tolerant_training_faq.html +++ /dev/null @@ -1,816 +0,0 @@ - - - - - - - - - - - - - - Fault-tolerant Training (FAQ) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Fault-tolerant Training (FAQ)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Fault-tolerant Training (FAQ)

-
-

How do I use iterable datasets?

-

To support fault-tolerance, you will need to use and expose a sampler within your dataset.

-

For example, the following implementation for an iterable dataset sub-classing IterableDataset won’t be supported.

-
from torch.utils.data import IterableDataset, DataLoader
-
-
-# does not support fault tolerance training!
-class RandomIterableDataset(IterableDataset):
-    def __init__(self, size: int, count: int):
-        self.count = count
-        self.size = size
-
-    def __iter__(self):
-        for _ in range(self.count):
-            yield torch.randn(self.size)
-
-
-

There are two primary reasons why Lightning can’t support the previous implementation.

-
    -
  • Lightning cannot infer what you are iterating over, making it difficult to restart training. Lightning Fault Tolerant Training requires a Sampler to be used to encapsulate the fetching logic, requiring both the sampler and an iterator to be made available as attributes within the dataset, so Lightning can access them to track progress.

  • -
  • Implementing the __next__ method is required as it separates iterator creation from its consumption, which is essential for Lightning to wrap the iterator before it is consumed.

  • -
-

If your iterable dataset is implemented in the following way, everything should work as expected.

-
import torch
-from torch.utils.data import IterableDataset, DataLoader
-
-
-class RandomIterableDataset(IterableDataset):
-    def __init__(self, size: int, length: int):
-        self.data = torch.randn(length, size)
-
-        # expose the sampler as an attribute
-        self.sampler = RandomSampler(range(length))
-
-    def __iter__(self) -> "RandomIterableDataset":
-        # expose the generator from the sampler as an attribute
-        # the ``sampler_iter`` will be wrapped by Lightning to ensure
-        # we can capture random seeds and iteration count for fast-forward samplers
-        # while restarting.
-        self.sampler_iter = iter(self.sampler)
-        return self
-
-    def __next__(self) -> torch.Tensor:
-        # call next on the iterator and get the associated data.
-        # the logic here can become more complex but the sampler
-        # should be the central piece for fetching the next sample
-        index = next(self.sampler_iter)
-        return self.data[index]
-
-
-
-
-
-

How do I use multiple dataloaders?

-

If you are using multiple training dataloaders, Lightning won’t be able to restore the random state properly.

-
class LitModel(LightningModule):
-    def train_dataloader(self):
-        loader_a = torch.utils.data.DataLoader(range(8), batch_size=4)
-        loader_b = torch.utils.data.DataLoader(range(16), batch_size=4)
-        return {"loader_a": loader_a, "loader_b": loader_b}
-
-    def training_step(self, batch, batch_idx):
-        # access the data in the same format as the collection of dataloaders.
-        # dict, list are supported.
-        loader_a = batch["loader_a"]
-        loader_b = batch["loader_b"]
-
-
-

If you believe this to be useful, please open a feature request.

-
-
-
-

What are the performance impacts?

-

Fault-tolerant Training was tested on common and worst-case scenarios in order to measure the impact of the internal state tracking on the total training time. -On tiny models like the BoringModel and RandomDataset -which have virtually no data loading and processing overhead, we noticed up to 50% longer training time with fault tolerance enabled. -In this worst-case scenario, fault tolerance adds an overhead that is noticeable in comparison to the compute time for dataloading itself. -However, for more realistic training workloads where data loading and preprocessing are more expensive, the constant overhead that fault tolerance adds becomes less noticeable or not noticeable at all. -For example, when training with ResNet50 on CIFAR 10 we have observed a 0.5% to 1% increase in training time depending on batch size or number of workers.

-

More detailed benchmarks will be shared in the future.

-
-

Note

-

The extra time is coming from several parts:

-
    -
  • Capturing the iteration count + random states for each sample within each DataLoader worker and passing them through the data_queue

  • -
  • Extra logic to handle / store the dataloader’s states from each batch.

  • -
-
-
-
-
-

What happens to my shuffled dataset?

-

If you are using a single map-based dataset by sub-classing Dataset, everything should work as expected.

-
from torch.utils.data import Dataset, DataLoader
-
-
-class RandomDataset(Dataset):
-    def __init__(self, size: int, length: int):
-        self.len = length
-        self.data = torch.randn(length, size)
-
-    def __getitem__(self, index):
-        return self.data[index]
-
-    def __len__(self):
-        return self.len
-
-
-
-
-
-

What parts are fault-tolerant?

-

Lightning keeps track of the following state updates during training:

-
    -
  • Sampler indices and random states across multiple processes and workers: This enables restoring random transforms and batch fetching to the exact state as it was right before the failure.

  • -
  • Optimizers, learning rate schedulers, callbacks, etc.

  • -
  • Loop progression

  • -
  • Logging internal states such that metric reductions on epoch end are not getting affected by the failure and model selection can continue as expected.

  • -
-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/clouds/grid_costs.html b/docs/clouds/grid_costs.html deleted file mode 100644 index cdacaae..0000000 --- a/docs/clouds/grid_costs.html +++ /dev/null @@ -1,690 +0,0 @@ - - - - - - - - - - - - - - Cost — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- - - - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Cost

-

Lightning (via lightning-grid) provides access to cloud machines to the community for free. However, you must buy credits on lightning-grid which are used to pay the cloud providers on your behalf.

-

If you want to run on your own AWS account and pay the cloud provider directly, please contact our onprem team: mailto:onprem@pytorchlightning.ai

-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- -
-
-
- - -
-
-
-
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/clouds/run_advanced.html b/docs/clouds/run_advanced.html deleted file mode 100644 index da84b2f..0000000 --- a/docs/clouds/run_advanced.html +++ /dev/null @@ -1,784 +0,0 @@ - - - - - - - - - - - - - - Train on the cloud (advanced) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Train on the cloud (advanced)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Train on the cloud (advanced)

-

Audience: Anyone looking to train a model on the cloud in the background

-
-
-

What is background training?

-

Background training lets you train models in the background without you needing to interact with the machine. As the model trains you can monitor its progress via Tensorboard or an experiment manager of your choice.

-
-
-
-

0: Install lightning-grid

-

First, navigate to https://platform.grid.ai to create a free account.

-

Next, install lightning-grid and log in

-
pip install lightning-grid
-grid login
-
-
-
-
-
-

1: Create a dataset

-

Create a datastore which optimizes your datasets for training at scale on the cloud.

-

First, let’s download a dummy dataset we created.

-
# download
-curl https://pl-flash-data.s3.amazonaws.com/cifar5.zip -o cifar5.zip
-
-# unzip
-unzip cifar5.zip
-
-
-

Now create the datastore

-
grid datastore create cifar5/ --name cifar5
-
-
-

Now your dataset is ready to be used for training on the cloud!

-
-

Note

-

In some research workflows, your model script ALSO downloads the dataset. If the dataset is only a few GBs this is fine. Otherwise we recommend you create a Datastore.

-
-
-
-
-

2: Choose the model to run

-

You can run any python script in the background. For this example, we’ll use a simple classifier:

-

Clone the code to your machine:

-
-

Note

-

Code repositories can be as complicated as needed. This is just a simple demo.

-
-
-
-
-

3: Run on the cloud

-

To run this model on the cloud, use the grid run command which has two parts:

-
grid run [run args] file.py [file args]
-
-
-

To attach the datastore cifar5 to the cifar5.py file use the following command:

-
# command | the datastore to use   |  the model  | argument to the model
-grid run --datastore_name cifar5 cifar5.py --data_dir /datastores/cifar5
-
-
-
-
-
-

4: Monitor and manage

-

Now that your model is running in the background you can monitor and manage it here.

-

You can also monitor its progress on the command line:

-
grid status
-
-
-
-
-
-

Next Steps

-

Here are the recommended next steps depending on your workflow.

-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/clouds/run_basic.html b/docs/clouds/run_basic.html deleted file mode 100644 index cf898e9..0000000 --- a/docs/clouds/run_basic.html +++ /dev/null @@ -1,788 +0,0 @@ - - - - - - - - - - - - - - Train on the cloud (intermediate) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Train on the cloud (intermediate)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Train on the cloud (intermediate)

-

Audience: Anyone looking to train a model on the cloud in the background

-
-
-

What is background training?

-

Background training lets you train models in the background without you needing to interact with the machine. As the model trains you can monitor its progress via Tensorboard or an experiment manager of your choice.

-
-
-
-

0: Install lightning-grid

-

First, navigate to https://platform.grid.ai to create a free account.

-

Next, install lightning-grid and log in

-
pip install lightning-grid
-grid login
-
-# Login successful. Welcome to Grid.
-
-
-
-
-
-

1: Create a dataset

-

Create a datastore which optimizes your datasets for training at scale on the cloud. Datastores can be created from all sorts of sources such as .zip and .tar links, local files/folders and even s3 buckets.

-

Let’s create a datastore from this .zip file

-
grid datastore create https://pl-flash-data.s3.amazonaws.com/tinycifar5.zip --name cifar5
-
-
-

Now your dataset is ready to be used for training on the cloud!

-
-

Note

-

In some research workflows, your model script ALSO downloads the dataset. If the dataset is only a few GBs this is fine. Otherwise we recommend you create a Datastore.

-
-
-
-
-

2: Choose the model to run

-

You can run any python script in the background. For this example, we’ll use a simple classifier:

-

Clone the code to your machine:

-
git clone https://github.com/williamFalcon/cifar5-simple.git
-cd cifar5-simple
-
-
-
-

Note

-

Code repositories can be as complicated as needed. This is just a simple demo.

-
-
-
-
-

3: Run on the cloud

-

To run this model on the cloud with the attached datastore, use the grid run command:

-
grid run --datastore_name cifar5 cifar5.py --data_dir /datastores/cifar5
-
-
-

The grid command has two parts: the [run args] and the [file args].

-
grid run [run args] file.py [file args]
-
-
-
-
-
-

4: Monitor and manage

-

Now that your model is running in the background, monitor and manage it here.

-

You can also monitor its progress on the command line:

-
grid status
-
-
-
-
-
-

Cost

-

Lightning (via lightning-grid) provides access to cloud machines to the community for free. However, you must buy credits on lightning-grid which are used to pay the cloud providers on your behalf.

-

If you want to run on your own AWS account and pay the cloud provider directly, please contact our onprem team: mailto:onprem@pytorchlightning.ai

-
-
-
-

Next Steps

-

Here are the recommended next steps depending on your workflow.

-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/clouds/run_expert.html b/docs/clouds/run_expert.html deleted file mode 100644 index c8b4a71..0000000 --- a/docs/clouds/run_expert.html +++ /dev/null @@ -1,717 +0,0 @@ - - - - - - - - - - - - - - Train on the cloud (expert) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Train on the cloud (expert)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Train on the cloud (expert)

-

Audience: Corporate or academic users who want to run on their Company or University private cloud account.

-
-
-

Run on your own cloud or cluster

-

If you have access to a corporate or academic cluster, you can simply submit jobs that run Lightning models and lightning will automatically work. -Please refer to Clusters guide for more information.

-
-
-
-

Run on your own cloud (hassle free)

-

Cluster training can get complicated once you start doing multi-node training, fault-tolerant training or sweeps. -If you’d prefer to not deal with any of the hassles of running on your own cloud environments, lightning-grid enables University and Enterprise customers to run on the cloud with their own credentials or even onprem.

-

These are some of the benefits of running via lightning-grid:

-
    -
  • create datasets optimized for scale

  • -
  • fully configurable on-prem deployment

  • -
  • SOC-2 compliance (in-progress) (ETA Q3 2022)

  • -
  • micro cost optimizations everywhere (which add up)

  • -
  • built-in fault tolerance

  • -
  • enabled collaboration for teams and enterprises

  • -
-

Contact our sales support engineering team so we can help you set up Grid with your own cloud credentials.

-

Email us to connect with your own cloud account:

-

mailto:onprem@pytorchlightning.ai.

-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/clouds/run_intermediate.html b/docs/clouds/run_intermediate.html deleted file mode 100644 index 92c88bd..0000000 --- a/docs/clouds/run_intermediate.html +++ /dev/null @@ -1,900 +0,0 @@ - - - - - - - - - - - - - - Train on the cloud (intermediate) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Train on the cloud (intermediate)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Train on the cloud (intermediate)

-

Audience: User looking to run many models at once

-
-
-

What is a sweep?

-

A sweep is the term given to running the same model multiple times with different hyperparameters to find the one that performs the best (according to your definition of performance).

-

Let’s say I have a python script that trains a Lightning model to classify images. We run this file like so:

-
grid run file.py --batch_size 8
-
-
-

With such a model, I would be interested in knowing how it performs with different batch sizes. In this case, I’m going to train many versions of this model.

-
# run 4 models in parallel
-grid run file.py --batch_size 8
-grid run file.py --batch_size 16
-grid run file.py --batch_size 32
-grid run file.py --batch_size 64
-
-
-

Now I can see how my model performs according to the batch size, and based on time and cost I can pick my “best” model:

- - ------ - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
Training speed vs cost

Batch size

classification accuracy (%)

training time

cost

8

0.80

5 minutes

$0.15

16

0.85

10 minutes

$0.30

32

0.90

30 minutes

$0.50

64

0.95

60 minutes

$1.01

-
-
-
-

Start a Sweep

-

First, recall that in the previous tutorial we ran a single model using this command:

-
grid run --datastore_name cifar5 cifar5.py --data_dir /datastores/cifar5
-
-
-

Now we’re going to run that same model 4 different times, each with a different batch size:

-
grid run --datastore_name cifar5 cifar5.py --data_dir /datastores/cifar5 --batch_size 8
-grid run --datastore_name cifar5 cifar5.py --data_dir /datastores/cifar5 --batch_size 16
-grid run --datastore_name cifar5 cifar5.py --data_dir /datastores/cifar5 --batch_size 32
-grid run --datastore_name cifar5 cifar5.py --data_dir /datastores/cifar5 --batch_size 64
-
-
-

Grid has a special syntax based on python that gives you shortcuts for sweeps. The shortcut for the above commands is:

-
grid run --datastore_name cifar5 cifar5.py --data_dir /datastores/cifar5 --batch_size "[8, 16, 32, 64]"
-
-
-
-
-
-

Syntax Shortcuts

-
-

List

-
grid run file.py --batch_size "[8, 16, 32, 64]"
-
-
-

equivalent to:

-
grid run file.py --batch_size 8
-grid run file.py --batch_size 16
-grid run file.py --batch_size 32
-grid run file.py --batch_size 64
-
-
-
-
-
-

Range

-
grid run file.py --batch_size "range(1, 10, 2)"
-
-
-

equivalent to:

-
grid run file.py --batch_size 1
-grid run file.py --batch_size 3
-grid run file.py --batch_size 5
-grid run file.py --batch_size 7
-grid run file.py --batch_size 9
-
-
-

-
-
-

String list

-
grid run file.py --model_backbone "['resnet18', 'transformer', 'resnet50']"
-
-
-

equivalent to:

-
grid run file.py --model_backbone 'resnet18'
-grid run file.py --model_backbone 'transformer'
-grid run file.py --model_backbone 'resnet50'
-
-
-
-
-
-

Sampling

-
grid run file.py --learning_rate "uniform(1e-5, 1e-1, 3)"
-
-
-

equivalent to:

-
grid run file.py --learning_rate 0.03977392
-grid run file.py --learning_rate 0.04835479
-grid run file.py --learning_rate 0.05200016
-
-
-
-
-
-
-

Sweep strategies

-

Models often have dozens of hyperparameters. We usually don’t run all combinations because it would be prohibitively expensive. Grid supports two strategies:

-
- -
- -
-
-
-

Next Steps

-

Here are the recommended next steps depending on your workflow.

-
- - -
- -
-
- - - - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/clouds/session_basic.html b/docs/clouds/session_basic.html deleted file mode 100644 index 5ce689c..0000000 --- a/docs/clouds/session_basic.html +++ /dev/null @@ -1,788 +0,0 @@ - - - - - - - - - - - - - - Train on the cloud (basic) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Train on the cloud (basic)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Train on the cloud (basic)

-

Audience: Anyone looking to train across many machines at once on the cloud.

-
-
-

Why do I need cloud training?

-

Training on the cloud is a cost effective way to train your models faster by allowing you to access powerful GPU machines.

-

For example, if your model takes 10 days to train on a CPU machine, here’s how cloud training can speed up your training time:

- - ----- - - - - - - - - - - - - - - - - - - - - - - - - -
Training speed vs cost

Machine type

Training time

Cost (AWS 1 M60 GPU)

CPU

10 days

$12.00

1 GPU

2 days

$11.52

2 GPU

1 day

$20.64

4 GPU

12 hours

$19.08

-
-
-
-

Start a cloud machine in < 1 minute

-

Lightning has a native cloud solution with various products (lightning-grid) designed for researchers and ML practitioners in industry. -To start an interactive machine simply go to Lightning Grid to create a free account, then start a new Grid Session.

-

A Grid Session is an interactive machine with 1-16 GPUs per machine.

-Start a Grid Session in a few seconds -
-
-
-

Open the Jupyter Notebook

-

Once the Session starts, open a Jupyter notebook.

-
-
-
-

Clone and run your model

-

On the Jupyter page you can use a Notebook, or clone your code and run it via the CLI.

-
-
-
-

Cost

-

Lightning (via lightning-grid) provides access to cloud machines to the community for free. However, you must buy credits on lightning-grid which are used to pay the cloud providers on your behalf.

-

If you want to run on your own AWS account and pay the cloud provider directly, please contact our onprem team: mailto:onprem@pytorchlightning.ai

-
-
-
-

Next Steps

-

Here are the recommended next steps depending on your workflow.

-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/clouds/session_intermediate.html b/docs/clouds/session_intermediate.html deleted file mode 100644 index b9eb1dd..0000000 --- a/docs/clouds/session_intermediate.html +++ /dev/null @@ -1,689 +0,0 @@ - - - - - - - - - - - - - - Train on the cloud (basic) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Train on the cloud (basic)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Train on the cloud (basic)

-

Audience: Anyone looking to train across many machines at once on the cloud.

-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- -
- -
-
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/common/checkpointing.html b/docs/common/checkpointing.html deleted file mode 100644 index 1a0cdb8..0000000 --- a/docs/common/checkpointing.html +++ /dev/null @@ -1,754 +0,0 @@ - - - - - - - - - - - - - - Checkpointing — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- - - - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
- - -
-
- - - - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- -
-
-
- - -
-
-
-
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/common/checkpointing_advanced.html b/docs/common/checkpointing_advanced.html deleted file mode 100644 index aee1421..0000000 --- a/docs/common/checkpointing_advanced.html +++ /dev/null @@ -1,762 +0,0 @@ - - - - - - - - - - - - - - Checkpointing (advanced) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Checkpointing (advanced)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Checkpointing (advanced)

-
-

Cloud checkpoints

-

Lightning is integrated with the major remote file systems including local filesystems and several cloud storage providers such as -S3 on AWS, GCS on Google Cloud, -or ADL on Azure.

-

PyTorch Lightning uses fsspec internally to handle all filesystem operations.

-
-
-

Save a cloud checkpoint

-

To save to a remote filesystem, prepend a protocol like “s3://” to the root_dir used for writing and reading model data.

-
# `default_root_dir` is the default path used for logs and checkpoints
-trainer = Trainer(default_root_dir="s3://my_bucket/data/")
-trainer.fit(model)
-
-
-
-
-
-

Resume training from a cloud checkpoint

-

To resume training from a cloud checkpoint use a cloud url.

-
trainer = Trainer(default_root_dir=tmpdir, max_steps=3)
-trainer.fit(model, ckpt_path="s3://my_bucket/ckpts/classifier.ckpt")
-
-
-

PyTorch Lightning uses fsspec internally to handle all filesystem operations.

-
-
-
-
-

Modularize your checkpoints

-

Checkpoints can also save the state of datamodules and callbacks.

-
-
-
-

Modify a checkpoint anywhere

-

When you need to change the components of a checkpoint before saving or loading, use the on_save_checkpoint() and on_load_checkpoint() of your LightningModule.

-
class LitModel(pl.LightningModule):
-    def on_save_checkpoint(self, checkpoint):
-        checkpoint["something_cool_i_want_to_save"] = my_cool_pickable_object
-
-    def on_load_checkpoint(self, checkpoint):
-        my_cool_pickable_object = checkpoint["something_cool_i_want_to_save"]
-
-
-

Use the above approach when you need to couple this behavior to your LightningModule for reproducibility reasons. Otherwise, Callbacks also have the on_save_checkpoint() and on_load_checkpoint() which you should use instead:

-
class LitCallback(pl.Callback):
-    def on_save_checkpoint(self, checkpoint):
-        checkpoint["something_cool_i_want_to_save"] = my_cool_pickable_object
-
-    def on_load_checkpoint(self, checkpoint):
-        my_cool_pickable_object = checkpoint["something_cool_i_want_to_save"]
-
-
-
-
- - -
- -
-
- - - - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/common/checkpointing_basic.html b/docs/common/checkpointing_basic.html deleted file mode 100644 index 85e04b0..0000000 --- a/docs/common/checkpointing_basic.html +++ /dev/null @@ -1,845 +0,0 @@ - - - - - - - - - - - - - - Checkpointing (basic) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Checkpointing (basic)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Checkpointing (basic)

-

Audience: All users

-
-
-

What is a checkpoint?

-

When a model is training, the performance changes as it continues to see more data. It is a best practice to save the state of a model throughout the training process. This gives you a version of the model, a checkpoint, at each key point during the development of the model. Once training has completed, use the checkpoint that corresponds to the best performance you found during the training process.

-

Checkpoints also enable your training to resume from where it was in case the training process is interrupted.

-

PyTorch Lightning checkpoints are fully usable in plain PyTorch.

-
-
-
-

Contents of a checkpoint

-

A Lightning checkpoint contains a dump of the model’s entire internal state. Unlike plain PyTorch, Lightning saves everything you need to restore a model even in the most complex distributed training environments.

-

Inside a Lightning checkpoint you’ll find:

-
    -
  • 16-bit scaling factor (if using 16-bit precision training)

  • -
  • Current epoch

  • -
  • Global step

  • -
  • LightningModule’s state_dict

  • -
  • State of all optimizers

  • -
  • State of all learning rate schedulers

  • -
  • State of all callbacks (for stateful callbacks)

  • -
  • State of datamodule (for stateful datamodules)

  • -
  • The hyperparameters used for that model if passed in as hparams (argparse.Namespace)

  • -
  • State of Loops (if using Fault-Tolerant training)

  • -
-
-
-
-

Save a checkpoint

-

Lightning automatically saves a checkpoint for you in your current working directory, with the state of your last training epoch. This makes sure you can resume training in case it was interrupted.

-
# simply by using the Trainer you get automatic checkpointing
-trainer = Trainer()
-
-
-

To change the checkpoint path use the default_root_dir argument:

-
# saves checkpoints to 'some/path/' at every epoch end
-trainer = Trainer(default_root_dir="some/path/")
-
-
-
-
-
-

LightningModule from checkpoint

-

To load a LightningModule along with its weights and hyperparameters use the following method:

-
model = MyLightningModule.load_from_checkpoint("/path/to/checkpoint.ckpt")
-
-# disable randomness, dropout, etc...
-model.eval()
-
-# predict with the model
-y_hat = model(x)
-
-
-
-
-

Save hyperparameters

-

The LightningModule allows you to automatically save all the hyperparameters passed to init simply by calling self.save_hyperparameters().

-
class MyLightningModule(LightningModule):
-    def __init__(self, learning_rate, another_parameter, *args, **kwargs):
-        super().__init__()
-        self.save_hyperparameters()
-
-
-

The hyperparameters are saved to the “hyper_parameters” key in the checkpoint

-
checkpoint = torch.load(checkpoint, map_location=lambda storage, loc: storage)
-print(checkpoint["hyper_parameters"])
-# {"learning_rate": the_value, "another_parameter": the_other_value}
-
-
-

The LightningModule also has access to the Hyperparameters

-
model = MyLightningModule.load_from_checkpoint("/path/to/checkpoint.ckpt")
-print(model.learning_rate)
-
-
-
-
-
-

Initialize with other parameters

-

If you used the self.save_hyperparameters() method in the init of the LightningModule, you can initialize the model with different hyperparameters.

-
# if you train and save the model like this it will use these values when loading
-# the weights. But you can overwrite this
-LitModel(in_dim=32, out_dim=10)
-
-# uses in_dim=32, out_dim=10
-model = LitModel.load_from_checkpoint(PATH)
-
-# uses in_dim=128, out_dim=10
-model = LitModel.load_from_checkpoint(PATH, in_dim=128, out_dim=10)
-
-
-
-
-
-
-

nn.Module from checkpoint

-

Lightning checkpoints are fully compatible with plain torch nn.Modules.

-
checkpoint = torch.load(CKPT_PATH)
-print(checkpoint.keys())
-
-
-

For example, let’s pretend we created a LightningModule like so:

-
class Encoder(nn.Module):
-    ...
-
-
-class Decoder(nn.Module):
-    ...
-
-
-class Autoencoder(pl.LightningModule):
-    def __init__(self, encoder, decoder, *args, **kwargs):
-        ...
-
-
-autoencoder = Autoencoder(Encoder(), Decoder())
-
-
-

Once the autoencoder has trained, pull out the relevant weights for your torch nn.Module:

-
checkpoint = torch.load(CKPT_PATH)
-encoder_weights = checkpoint["encoder"]
-decoder_weights = checkpoint["decoder"]
-
-
-
-
-
-

Disable checkpointing

-

You can disable checkpointing by passing:

-
trainer = Trainer(enable_checkpointing=False)
-
-
-
-
-
-

Resume training state

-

If you don’t just want to load weights, but instead restore the full training, do the following:

-
model = LitModel()
-trainer = Trainer()
-
-# automatically restores model, epoch, step, LR schedulers, apex, etc...
-trainer.fit(model, ckpt_path="some/path/to/my_checkpoint.ckpt")
-
-
-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/common/checkpointing_expert.html b/docs/common/checkpointing_expert.html deleted file mode 100644 index e046d52..0000000 --- a/docs/common/checkpointing_expert.html +++ /dev/null @@ -1,774 +0,0 @@ - - - - - - - - - - - - - - Checkpointing (expert) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Checkpointing (expert)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Checkpointing (expert)

-

TODO: I don’t understand this…

-
-

Customize Checkpointing

-
-

Warning

-

The Checkpoint IO API is experimental and subject to change.

-
-

Lightning supports modifying the checkpointing save/load functionality through the CheckpointIO. This encapsulates the save/load logic -that is managed by the Strategy. CheckpointIO is different from on_save_checkpoint() -and on_load_checkpoint() methods as it determines how the checkpoint is saved/loaded to storage rather than -what’s saved in the checkpoint.

-
-
-

Built-in Checkpoint IO Plugins

- - ---- - - - - - - - - - - - - - -
Built-in Checkpoint IO Plugins

Plugin

Description

TorchCheckpointIO

CheckpointIO that utilizes torch.save() and torch.load() to save and load checkpoints -respectively, common for most use cases.

XLACheckpointIO

CheckpointIO that utilizes xm.save() to save checkpoints for TPU training strategies.

-
-
-

Custom Checkpoint IO Plugin

-

CheckpointIO can be extended to include your custom save/load functionality to and from a path. The CheckpointIO object can be passed to either a Trainer directly or a Strategy as shown below:

-
from pytorch_lightning import Trainer
-from pytorch_lightning.callbacks import ModelCheckpoint
-from pytorch_lightning.plugins import CheckpointIO
-from pytorch_lightning.strategies import SingleDeviceStrategy
-
-
-class CustomCheckpointIO(CheckpointIO):
-    def save_checkpoint(self, checkpoint, path, storage_options=None):
-        ...
-
-    def load_checkpoint(self, path, storage_options=None):
-        ...
-
-    def remove_checkpoint(self, path):
-        ...
-
-
-custom_checkpoint_io = CustomCheckpointIO()
-
-# Either pass into the Trainer object
-model = MyModel()
-trainer = Trainer(
-    plugins=[custom_checkpoint_io],
-    callbacks=ModelCheckpoint(save_last=True),
-)
-trainer.fit(model)
-
-# or pass into Strategy
-model = MyModel()
-device = torch.device("cpu")
-trainer = Trainer(
-    strategy=SingleDeviceStrategy(device, checkpoint_io=custom_checkpoint_io),
-    callbacks=ModelCheckpoint(save_last=True),
-)
-trainer.fit(model)
-
-
-
-

Note

-

Some TrainingTypePlugins like DeepSpeedStrategy do not support custom CheckpointIO as checkpointing logic is not modifiable.

-
-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/common/checkpointing_intermediate.html b/docs/common/checkpointing_intermediate.html deleted file mode 100644 index 16b8ce7..0000000 --- a/docs/common/checkpointing_intermediate.html +++ /dev/null @@ -1,865 +0,0 @@ - - - - - - - - - - - - - - Checkpointing (intermediate) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Checkpointing (intermediate)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Checkpointing (intermediate)

-

Audience: Users looking to customize the checkpointing behavior

-
-
-

Modify checkpointing behavior

-

For fine-grained control over checkpointing behavior, use the ModelCheckpoint object

-
from pytorch_lightning.callbacks import ModelCheckpoint
-
-checkpoint_callback = ModelCheckpoint(dirpath="my/path/", save_top_k=2, monitor="val_loss")
-trainer = Trainer(callbacks=[checkpoint_callback])
-trainer.fit(model)
-checkpoint_callback.best_model_path
-
-
-

Any value that has been logged via self.log in the LightningModule can be monitored.

-
class LitModel(pl.LightningModule):
-    def training_step(self, batch, batch_idx):
-        self.log("my_metric", x)
-
-
-# 'my_metric' is now able to be monitored
-checkpoint_callback = ModelCheckpoint(monitor="my_metric")
-
-
-
-
-
-

Save checkpoints by condition

-

To save checkpoints based on a (when/which/what/where) condition (for example when the validation_loss is lower) modify the ModelCheckpoint properties.

-
-

When

-
    -
  • When using iterative training which doesn’t have an epoch, you can checkpoint at every N training steps by specifying every_n_train_steps=N.

  • -
  • You can also control the interval of epochs between checkpoints using every_n_epochs, to avoid slowdowns.

  • -
  • You can checkpoint at a regular time interval using train_time_interval argument independent of the steps or epochs.

  • -
  • In case you are monitoring a training metric, we’d suggest using save_on_train_epoch_end=True to ensure the required metric is being accumulated correctly for creating a checkpoint.

  • -
-
-
-

Which

-
    -
  • You can save the last checkpoint when training ends using save_last argument.

  • -
  • You can save top-K and last-K checkpoints by configuring the monitor and save_top_k argument.

  • -
-
-

-
-
-
from pytorch_lightning.callbacks import ModelCheckpoint
-
-
-# saves top-K checkpoints based on "val_loss" metric
-checkpoint_callback = ModelCheckpoint(
-    save_top_k=10,
-    monitor="val_loss",
-    mode="min",
-    dirpath="my/path/",
-    filename="sample-mnist-{epoch:02d}-{val_loss:.2f}",
-)
-
-# saves last-K checkpoints based on "global_step" metric
-# make sure you log it inside your LightningModule
-checkpoint_callback = ModelCheckpoint(
-    save_top_k=10,
-    monitor="global_step",
-    mode="max",
-    dirpath="my/path/",
-    filename="sample-mnist-{epoch:02d}-{global_step}",
-)
-
-
-
-
    -
  • You can customize the checkpointing behavior to monitor any quantity of your training or validation steps. For example, if you want to update your checkpoints based on your validation loss:

  • -
-
-

-
-
-
from pytorch_lightning.callbacks import ModelCheckpoint
-
-
-class LitAutoEncoder(LightningModule):
-    def validation_step(self, batch, batch_idx):
-        x, y = batch
-        y_hat = self.backbone(x)
-
-        # 1. calculate loss
-        loss = F.cross_entropy(y_hat, y)
-
-        # 2. log val_loss
-        self.log("val_loss", loss)
-
-
-# 3. Init ModelCheckpoint callback, monitoring "val_loss"
-checkpoint_callback = ModelCheckpoint(monitor="val_loss")
-
-# 4. Add your callback to the callbacks list
-trainer = Trainer(callbacks=[checkpoint_callback])
-
-
-
-
-
-

What

-
    -
  • By default, the ModelCheckpoint callback saves model weights, optimizer states, etc., but in case you have limited disk space or just need the model weights to be saved you can specify save_weights_only=True.

  • -
-
-
-

Where

-
    -
  • It gives you the ability to specify the dirpath and filename for your checkpoints. Filename can also be dynamic so you can inject the metrics that are being logged using log().

  • -
-
-

-
-
-
from pytorch_lightning.callbacks import ModelCheckpoint
-
-
-# saves a file like: my/path/sample-mnist-epoch=02-val_loss=0.32.ckpt
-checkpoint_callback = ModelCheckpoint(
-    dirpath="my/path/",
-    filename="sample-mnist-{epoch:02d}-{val_loss:.2f}",
-)
-
-
-
-
-

-
-

The ModelCheckpoint callback is very robust and should cover 99% of the use-cases. If you find a use-case that is not configured yet, feel free to open an issue with a feature request on GitHub -and the Lightning Team will be happy to integrate/help integrate it.

-
-
-
-
-

Save checkpoints manually

-

You can manually save checkpoints and restore your model from the checkpointed state using save_checkpoint() -and load_from_checkpoint().

-
model = MyLightningModule(hparams)
-trainer.fit(model)
-trainer.save_checkpoint("example.ckpt")
-
-# load the checkpoint later as normal
-new_model = MyLightningModule.load_from_checkpoint(checkpoint_path="example.ckpt")
-
-
-
-

Manual saving with distributed training

-

In distributed training cases where a model is running across many machines, Lightning ensures that only one checkpoint is saved instead of a model per machine. This requires no code changes as seen below:

-
trainer = Trainer(strategy="ddp")
-model = MyLightningModule(hparams)
-trainer.fit(model)
-# Saves only on the main process
-trainer.save_checkpoint("example.ckpt")
-
-
-

Not using save_checkpoint() can lead to unexpected behavior and potential deadlock. Using other saving functions will result in all devices attempting to save the checkpoint. As a result, we highly recommend using the Trainer’s save functionality. -If using custom saving functions cannot be avoided, we recommend using the rank_zero_only() decorator to ensure saving occurs only on the main process. Note that this will only work if all ranks hold the exact same state and won’t work when using -model parallel distributed strategies such as deepspeed or sharded training.

-
-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/common/child_modules.html b/docs/common/child_modules.html deleted file mode 100644 index 130f1e0..0000000 --- a/docs/common/child_modules.html +++ /dev/null @@ -1,747 +0,0 @@ - - - - - - - - - - - - - - <no title> — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- - - - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -

Research projects tend to test different approaches to the same dataset. -This is very easy to do in Lightning with inheritance.

-

For example, imagine we now want to train an AutoEncoder to use as a feature extractor for images. -The only things that change in the LitAutoEncoder model are the init, forward, training, validation and test step.

-
class Encoder(torch.nn.Module):
-    ...
-
-
-class Decoder(torch.nn.Module):
-    ...
-
-
-class AutoEncoder(torch.nn.Module):
-    def __init__(self):
-        super().__init__()
-        self.encoder = Encoder()
-        self.decoder = Decoder()
-
-    def forward(self, x):
-        return self.decoder(self.encoder(x))
-
-
-class LitAutoEncoder(LightningModule):
-    def __init__(self, auto_encoder):
-        super().__init__()
-        self.auto_encoder = auto_encoder
-        self.metric = torch.nn.MSELoss()
-
-    def forward(self, x):
-        return self.auto_encoder.encoder(x)
-
-    def training_step(self, batch, batch_idx):
-        x, _ = batch
-        x_hat = self.auto_encoder(x)
-        loss = self.metric(x, x_hat)
-        return loss
-
-    def validation_step(self, batch, batch_idx):
-        self._shared_eval(batch, batch_idx, "val")
-
-    def test_step(self, batch, batch_idx):
-        self._shared_eval(batch, batch_idx, "test")
-
-    def _shared_eval(self, batch, batch_idx, prefix):
-        x, _ = batch
-        x_hat = self.auto_encoder(x)
-        loss = self.metric(x, x_hat)
-        self.log(f"{prefix}_loss", loss)
-
-
-

and we can train this using the Trainer:

-
auto_encoder = AutoEncoder()
-lightning_module = LitAutoEncoder(auto_encoder)
-trainer = Trainer()
-trainer.fit(lightning_module, train_dataloader, val_dataloader)
-
-
-

And remember that the forward method should define the practical use of a LightningModule. -In this case, we want to use the LitAutoEncoder to extract image representations:

-
some_images = torch.Tensor(32, 1, 28, 28)
-representations = lightning_module(some_images)
-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- -
-
-
-
    -
- -
-
-
-
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/common/console_logs.html b/docs/common/console_logs.html deleted file mode 100644 index ba90330..0000000 --- a/docs/common/console_logs.html +++ /dev/null @@ -1,721 +0,0 @@ - - - - - - - - - - - - - - Console logging — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- - - - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Console logging

-

Audience: Engineers looking to capture more visible logs.

-
-
-

Enable console logs

-

Lightning logs useful information about the training process and user warnings to the console. -You can retrieve the Lightning console logger and change it to your liking. For example, adjust the logging level -or redirect output for certain modules to log files:

-
import logging
-
-# configure logging at the root level of Lightning
-logging.getLogger("pytorch_lightning").setLevel(logging.ERROR)
-
-# configure logging on module level, redirect to file
-logger = logging.getLogger("pytorch_lightning.core")
-logger.addHandler(logging.FileHandler("core.log"))
-
-
-

Read more about custom Python logging here.

-
-
- - -
- -
-
- - - - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- -
- -
-
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/common/early_stopping.html b/docs/common/early_stopping.html deleted file mode 100644 index bf3584a..0000000 --- a/docs/common/early_stopping.html +++ /dev/null @@ -1,775 +0,0 @@ - - - - - - - - - - - - - - Early Stopping — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- - - - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Early Stopping

-
-

Stopping an Epoch Early

-

You can stop and skip the rest of the current epoch early by overriding on_train_batch_start() to return -1 when some condition is met.

-

If you do this repeatedly, for every epoch you had originally requested, then this will stop your entire training.

-
-
-

EarlyStopping Callback

-

The EarlyStopping callback can be used to monitor a metric and stop the training when no improvement is observed.

-

To enable it:

-
    -
  • Import EarlyStopping callback.

  • -
  • Log the metric you want to monitor using log() method.

  • -
  • Init the callback, and set monitor to the logged metric of your choice.

  • -
  • Set the mode based on the metric that needs to be monitored.

  • -
  • Pass the EarlyStopping callback to the Trainer callbacks flag.

  • -
-
from pytorch_lightning.callbacks.early_stopping import EarlyStopping
-
-
-class LitModel(LightningModule):
-    def validation_step(self, batch, batch_idx):
-        loss = ...
-        self.log("val_loss", loss)
-
-
-model = LitModel()
-trainer = Trainer(callbacks=[EarlyStopping(monitor="val_loss", mode="min")])
-trainer.fit(model)
-
-
-

You can customize the callback’s behaviour by changing its parameters.

-
early_stop_callback = EarlyStopping(monitor="val_accuracy", min_delta=0.00, patience=3, verbose=False, mode="max")
-trainer = Trainer(callbacks=[early_stop_callback])
-
-
-

Additional parameters that stop training at extreme points:

-
    -
  • stopping_threshold: Stops training immediately once the monitored quantity reaches this threshold. -It is useful when we know that going beyond a certain optimal value does not further benefit us.

  • -
  • divergence_threshold: Stops training as soon as the monitored quantity becomes worse than this threshold. -When reaching a value this bad, we believe the model cannot recover anymore and it is better to stop early and run with different initial conditions.

  • -
  • check_finite: When turned on, it stops training if the monitored metric becomes NaN or infinite.

  • -
  • check_on_train_epoch_end: When turned on, it checks the metric at the end of a training epoch. Use this only when you are monitoring any metric logged within -training-specific hooks on epoch-level.

  • -
-

In case you need early stopping in a different part of training, subclass EarlyStopping -and change where it is called:

-
class MyEarlyStopping(EarlyStopping):
-    def on_validation_end(self, trainer, pl_module):
-        # override this to disable early stopping at the end of val loop
-        pass
-
-    def on_train_end(self, trainer, pl_module):
-        # instead, do it at the end of training loop
-        self._run_early_stopping_check(trainer)
-
-
-
-

Note

-

The EarlyStopping callback runs -at the end of every validation epoch by default. However, the frequency of validation -can be modified by setting various parameters in the Trainer, -for example check_val_every_n_epoch -and val_check_interval. -It must be noted that the patience parameter counts the number of -validation checks with no improvement, and not the number of training epochs. -Therefore, with parameters check_val_every_n_epoch=10 and patience=3, the trainer -will perform at least 40 training epochs before being stopped.

-
-
-
- - -
- -
-
- - - - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/common/evaluation.html b/docs/common/evaluation.html deleted file mode 100644 index c4ee553..0000000 --- a/docs/common/evaluation.html +++ /dev/null @@ -1,721 +0,0 @@ - - - - - - - - - - - - - - Add validation and test datasets — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Add validation and test datasets
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
- - -
-
- - - - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/common/evaluation_basic.html b/docs/common/evaluation_basic.html deleted file mode 100644 index f9e097e..0000000 --- a/docs/common/evaluation_basic.html +++ /dev/null @@ -1,808 +0,0 @@ - - - - - - - - - - - - - - Validate and test a model (basic) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Validate and test a model (basic)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Validate and test a model (basic)

-

Audience: Users who want to add a validation loop to avoid overfitting

-
-
-

Add a test loop

-

To make sure a model can generalize to an unseen dataset (ie: to publish a paper or in a production environment) a dataset is normally split into two parts, the train split and the test split.

-

The test set is NOT used during training, it is ONLY used once the model has been trained to see how the model will do in the real-world.

-
-
-

Find the train and test splits

-

Datasets come with two splits. Refer to the dataset documentation to find the train and test splits.

-
import torch.utils.data as data
-from torchvision import datasets
-
-# Load data sets
-train_set = datasets.MNIST(root="MNIST", download=True, train=True)
-test_set = datasets.MNIST(root="MNIST", download=True, train=False)
-
-
-
-
-
-

Define the test loop

-

To add a test loop, implement the test_step method of the LightningModule

-
class LitAutoEncoder(pl.LightningModule):
-    def training_step(self, batch, batch_idx):
-        ...
-
-    def test_step(self, batch, batch_idx):
-        # this is the test loop
-        x, y = batch
-        x = x.view(x.size(0), -1)
-        z = self.encoder(x)
-        x_hat = self.decoder(z)
-        test_loss = F.mse_loss(x_hat, x)
-        self.log("test_loss", test_loss)
-
-
-
-
-
-

Train with the test loop

-

Once the model has finished training, call .test

-
from torch.utils.data import DataLoader
-
-# initialize the Trainer
-trainer = Trainer()
-
-# test the model
-trainer.test(model, dataloaders=DataLoader(test_set))
-
-
-
-
-
-
-

Add a validation loop

-

During training, it’s common practice to use a small portion of the train split to determine when the model has finished training.

-
-
-

Split the training data

-

As a rule of thumb, we use 20% of the training set as the validation set. This number varies from dataset to dataset.

-
# use 20% of training data for validation
-train_set_size = int(len(train_set) * 0.8)
-valid_set_size = len(train_set) - train_set_size
-
-# split the train set into two
-seed = torch.Generator().manual_seed(42)
-train_set, valid_set = data.random_split(train_set, [train_set_size, valid_set_size], generator=seed)
-
-
-
-
-
-

Define the validation loop

-

To add a validation loop, implement the validation_step method of the LightningModule

-
class LitAutoEncoder(pl.LightningModule):
-    def training_step(self, batch, batch_idx):
-        ...
-
-    def validation_step(self, batch, batch_idx):
-        # this is the validation loop
-        x, y = batch
-        x = x.view(x.size(0), -1)
-        z = self.encoder(x)
-        x_hat = self.decoder(z)
-        test_loss = F.mse_loss(x_hat, x)
-        self.log("val_loss", test_loss)
-
-
-
-
-
-

Train with the validation loop

-

To run the validation loop, pass in the validation set to .fit

-
from torch.utils.data import DataLoader
-
-train_set = DataLoader(train_set)
-val_set = DataLoader(val_set)
-
-# train with both splits
-trainer = Trainer()
-trainer.fit(model, train_set, val_set)
-
-
-
-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/common/evaluation_intermediate.html b/docs/common/evaluation_intermediate.html deleted file mode 100644 index eb3640d..0000000 --- a/docs/common/evaluation_intermediate.html +++ /dev/null @@ -1,878 +0,0 @@ - - - - - - - - - - - - - - Validate and test a model (intermediate) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Validate and test a model (intermediate)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Validate and test a model (intermediate)

-

During and after training we need a way to evaluate our models to make sure they are not overfitting while training and -generalize well on unseen or real-world data. There are generally 2 stages of evaluation: validation and testing. To some -degree they serve the same purpose, to make sure models work on real data but they have some practical differences.

-

Validation is usually done during training, traditionally after each training epoch. It can be used for hyperparameter optimization or tracking model performance during training. -It’s a part of the training process.

-

Testing is usually done once we are satisfied with the training and only with the best model selected from the validation metrics.

-

Let’s see how these can be performed with Lightning.

-
-

Testing

-

Lightning allows the user to test their models with any compatible test dataloaders. This can be done before/after training -and is completely agnostic to fit() call. The logic used here is defined under -test_step().

-

Testing is performed using the Trainer object’s .test() method.

-
-
-Trainer.test(model=None, dataloaders=None, ckpt_path=None, verbose=True, datamodule=None)[source]
-

Perform one evaluation epoch over the test set. -It’s separated from fit to make sure you never run on your test set until you want to.

-
-
Parameters
-
    -
  • model (Optional[LightningModule]) – The model to test.

  • -
  • dataloaders (Union[DataLoader, Sequence[DataLoader], LightningDataModule, None]) – A torch.utils.data.DataLoader or a sequence of them, -or a LightningDataModule specifying test samples.

  • -
  • ckpt_path (Optional[str]) – Either best or path to the checkpoint you wish to test. -If None and the model instance was passed, use the current weights. -Otherwise, the best model checkpoint from the previous trainer.fit call will be loaded -if a checkpoint callback is configured.

  • -
  • verbose (bool) – If True, prints the test results.

  • -
  • datamodule (Optional[LightningDataModule]) – An instance of LightningDataModule.

  • -
-
-
Return type
-

List[Dict[str, float]]

-
-
Returns
-

List of dictionaries with metrics logged during the test phase, e.g., in model- or callback hooks -like test_step(), -test_epoch_end(), etc. -The length of the list corresponds to the number of test dataloaders used.

-
-
-
- -
-

Test after Fit

-

To run the test set after training completes, use this method.

-
# run full training
-trainer.fit(model)
-
-# (1) load the best checkpoint automatically (lightning tracks this for you)
-trainer.test(ckpt_path="best")
-
-# (2) test using a specific checkpoint
-trainer.test(ckpt_path="/path/to/my_checkpoint.ckpt")
-
-# (3) test with an explicit model (will use this model and not load a checkpoint)
-trainer.test(model)
-
-
-
-

Warning

-

It is recommended to test with Trainer(devices=1) since distributed strategies such as DDP -use DistributedSampler internally, which replicates some samples to -make sure all devices have same batch size in case of uneven inputs. This is helpful to make sure -benchmarking for research papers is done the right way.

-
-
-
-

Test Multiple Models

-

You can run the test set on multiple models using the same trainer instance.

-
model1 = LitModel()
-model2 = GANModel()
-
-trainer = Trainer()
-trainer.test(model1)
-trainer.test(model2)
-
-
-
-
-

Test Pre-Trained Model

-

To run the test set on a pre-trained model, use this method.

-
model = MyLightningModule.load_from_checkpoint(
-    checkpoint_path="/path/to/pytorch_checkpoint.ckpt",
-    hparams_file="/path/to/test_tube/experiment/version/hparams.yaml",
-    map_location=None,
-)
-
-# init trainer with whatever options
-trainer = Trainer(...)
-
-# test (pass in the model)
-trainer.test(model)
-
-
-

In this case, the options you pass to trainer will be used when -running the test set (ie: 16-bit, dp, ddp, etc…)

-
-
-

Test with Additional DataLoaders

-

You can still run inference on a test dataset even if the test_dataloader() method hasn’t been -defined within your lightning module instance. This would be the case when your test data -is not available at the time your model was declared.

-
# setup your data loader
-test_dataloader = DataLoader(...)
-
-# test (pass in the loader)
-trainer.test(dataloaders=test_dataloader)
-
-
-

You can either pass in a single dataloader or a list of them. This optional named -parameter can be used in conjunction with any of the above use cases. Additionally, -you can also pass in a datamodule that has overridden the -test_dataloader method.

-
class MyDataModule(pl.LightningDataModule):
-    ...
-
-    def test_dataloader(self):
-        return DataLoader(...)
-
-
-# setup your datamodule
-dm = MyDataModule(...)
-
-# test (pass in datamodule)
-trainer.test(datamodule=dm)
-
-
-
-
-
-
-

Validation

-

Lightning allows the user to validate their models with any compatible val dataloaders. This can be done before/after training. -The logic associated with the validation is defined within the validation_step().

-

Apart from this, .validate has the same API as .test; they rely on validation_step() and test_step(), respectively.

-
-

Note

-

The .validate method uses the same validation logic that is used for the validation happening within the -fit() call.

-
-
-

Warning

-

When using trainer.validate(), it is recommended to use Trainer(devices=1) since distributed strategies such as DDP -use DistributedSampler internally, which replicates some samples to -make sure all devices have the same batch size in case of uneven inputs. This is helpful to make sure -benchmarking for research papers is done the right way.

-
-
-
-Trainer.validate(model=None, dataloaders=None, ckpt_path=None, verbose=True, datamodule=None)[source]
-

Perform one evaluation epoch over the validation set.

-
-
Parameters
-
    -
  • model (Optional[LightningModule]) – The model to validate.

  • -
  • dataloaders (Union[DataLoader, Sequence[DataLoader], LightningDataModule, None]) – A torch.utils.data.DataLoader or a sequence of them, -or a LightningDataModule specifying validation samples.

  • -
  • ckpt_path (Optional[str]) – Either best or path to the checkpoint you wish to validate. -If None and the model instance was passed, use the current weights. -Otherwise, the best model checkpoint from the previous trainer.fit call will be loaded -if a checkpoint callback is configured.

  • -
  • verbose (bool) – If True, prints the validation results.

  • -
  • datamodule (Optional[LightningDataModule]) – An instance of LightningDataModule.

  • -
-
-
Return type
-

List[Dict[str, float]]

-
-
Returns
-

List of dictionaries with metrics logged during the validation phase, e.g., in model- or callback hooks -like validation_step(), -validation_epoch_end(), etc. -The length of the list corresponds to the number of validation dataloaders used.

-
-
-
- -
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/common/gradient_accumulation.html b/docs/common/gradient_accumulation.html deleted file mode 100644 index f8d6505..0000000 --- a/docs/common/gradient_accumulation.html +++ /dev/null @@ -1,724 +0,0 @@ - - - - - - - - - - - - - - <no title> — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- - - - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -

Accumulated gradients run K small batches of size N before doing an optimizer step. The effect is a large effective batch size of KxN, where N is the batch size. -Internally, it doesn’t stack up the batches and do a single forward pass; rather, it accumulates the gradients for K batches and then does an optimizer.step, so that the -effective batch size is increased but there is no memory overhead.

-
-

Warning

-

When using distributed training, e.g. DDP with, let’s say, P devices, each device accumulates independently, i.e. it stores the gradients -after each loss.backward() and doesn’t sync the gradients across the devices until we call optimizer.step(). So for each accumulation -step, the effective batch size on each device will remain N*K, but right before the optimizer.step(), the gradient sync will make the effective -batch size P*N*K. For DP, since the batch is split across devices, the final effective batch size will be N*K.

-
-
-

See also

-

Trainer

-
-
# DEFAULT (ie: no accumulated grads)
-trainer = Trainer(accumulate_grad_batches=1)
-
-# Accumulate gradients for 7 batches
-trainer = Trainer(accumulate_grad_batches=7)
-
-
-

You can set different values for it at different epochs by passing a dictionary, where the key represents the epoch at which the value for gradient accumulation -should be updated.

-
# till 5th epoch, it will accumulate every 8 batches. From 5th epoch
-# till 9th epoch it will accumulate every 4 batches and after that no accumulation
-# will happen. Note that you need to use zero-indexed epoch keys here
-trainer = Trainer(accumulate_grad_batches={0: 8, 4: 4, 8: 1})
-
-
-

Or, you can create custom GradientAccumulationScheduler

-
from pytorch_lightning.callbacks import GradientAccumulationScheduler
-
-
-# till 5th epoch, it will accumulate every 8 batches. From 5th epoch
-# till 9th epoch it will accumulate every 4 batches and after that no accumulation
-# will happen. Note that you need to use zero-indexed epoch keys here
-accumulator = GradientAccumulationScheduler(scheduling={0: 8, 4: 4, 8: 1})
-trainer = Trainer(callbacks=accumulator)
-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- -
-
-
-
    -
- -
-
-
-
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/common/hyperparameters.html b/docs/common/hyperparameters.html deleted file mode 100644 index 19b0173..0000000 --- a/docs/common/hyperparameters.html +++ /dev/null @@ -1,944 +0,0 @@ - - - - - - - - - - - - - - Configure hyperparameters from the CLI — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Configure hyperparameters from the CLI
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Configure hyperparameters from the CLI

-

Lightning has utilities to interact seamlessly with the command line ArgumentParser -and plays well with the hyperparameter optimization framework of your choice.

-
-
-

ArgumentParser

-

Lightning is designed to augment a lot of the functionality of the built-in Python ArgumentParser

-
from argparse import ArgumentParser
-
-parser = ArgumentParser()
-parser.add_argument("--layer_1_dim", type=int, default=128)
-args = parser.parse_args()
-
-
-

This allows you to call your program like so:

-
python trainer.py --layer_1_dim 64
-
-
-
-
-
-

Argparser Best Practices

-

It is best practice to layer your arguments in three sections.

-
    -
  1. Trainer args (accelerator, devices, num_nodes, etc…)

  2. -
  3. Model specific arguments (layer_dim, num_layers, learning_rate, etc…)

  4. -
  5. Program arguments (data_path, cluster_email, etc…)

  6. -
-
-

-
-

We can do this as follows. First, in your LightningModule, define the arguments -specific to that module. Remember that data splits or data paths may also be specific to -a module (i.e.: if your project has a model that trains on Imagenet and another on CIFAR-10).

-
class LitModel(LightningModule):
-    @staticmethod
-    def add_model_specific_args(parent_parser):
-        parser = parent_parser.add_argument_group("LitModel")
-        parser.add_argument("--encoder_layers", type=int, default=12)
-        parser.add_argument("--data_path", type=str, default="/some/path")
-        return parent_parser
-
-
-

Now in your main trainer file, add the Trainer args, the program args, and add the model args

-
# ----------------
-# trainer_main.py
-# ----------------
-from argparse import ArgumentParser
-
-parser = ArgumentParser()
-
-# add PROGRAM level args
-parser.add_argument("--conda_env", type=str, default="some_name")
-parser.add_argument("--notification_email", type=str, default="will@email.com")
-
-# add model specific args
-parser = LitModel.add_model_specific_args(parser)
-
-# add all the available trainer options to argparse
-# ie: now --accelerator --devices --num_nodes ... --fast_dev_run all work in the cli
-parser = Trainer.add_argparse_args(parser)
-
-args = parser.parse_args()
-
-
-

Now you can run your program like so:

-
python trainer_main.py --accelerator 'gpu' --devices 2 --num_nodes 2 --conda_env 'my_env' --encoder_layers 12
-
-
-

Finally, make sure to start the training like so:

-
# init the trainer like this
-trainer = Trainer.from_argparse_args(args, early_stopping_callback=...)
-
-# NOT like this
-trainer = Trainer(accelerator=hparams.accelerator, devices=hparams.devices, ...)
-
-# init the model with Namespace directly
-model = LitModel(args)
-
-# or init the model with all the key-value pairs
-dict_args = vars(args)
-model = LitModel(**dict_args)
-
-
-
-
-
-

LightningModule hyperparameters

-

Often times we train many versions of a model. You might share that model or come back to it a few months later -at which point it is very useful to know how that model was trained (i.e.: what learning rate, neural network, etc…).

-

Lightning has a standardized way of saving the information for you in checkpoints and YAML files. The goal here is to -improve readability and reproducibility.

-
-

save_hyperparameters

-

Use save_hyperparameters() within your -LightningModule’s __init__ method. -It will enable Lightning to store all the provided arguments under the self.hparams attribute. -These hyperparameters will also be stored within the model checkpoint, which simplifies model re-instantiation after training.

-
class LitMNIST(LightningModule):
-    def __init__(self, layer_1_dim=128, learning_rate=1e-2):
-        super().__init__()
-        # call this to save (layer_1_dim=128, learning_rate=1e-2) to the checkpoint
-        self.save_hyperparameters()
-
-        # equivalent
-        self.save_hyperparameters("layer_1_dim", "learning_rate")
-
-        # Now possible to access layer_1_dim from hparams
-        self.hparams.layer_1_dim
-
-
-

In addition, loggers that support it will automatically log the contents of self.hparams.

-
-
-

Excluding hyperparameters

-

By default, every parameter of the __init__ method will be considered a hyperparameter to the LightningModule. -However, sometimes some parameters need to be excluded from saving, for example when they are not serializable. -Those parameters should be provided back when reloading the LightningModule. -In this case, exclude them explicitly:

-
class LitMNIST(LightningModule):
-    def __init__(self, loss_fx, generator_network, layer_1_dim=128):
-        super().__init__()
-        self.layer_1_dim = layer_1_dim
-        self.loss_fx = loss_fx
-
-        # call this to save only (layer_1_dim=128) to the checkpoint
-        self.save_hyperparameters("layer_1_dim")
-
-        # equivalent
-        self.save_hyperparameters(ignore=["loss_fx", "generator_network"])
-
-
-
-
-

load_from_checkpoint

-

LightningModules that have hyperparameters automatically saved with save_hyperparameters() -can conveniently be loaded and instantiated directly from a checkpoint with load_from_checkpoint():

-
# to load specify the other args
-model = LitMNIST.load_from_checkpoint(PATH, loss_fx=torch.nn.SomeOtherLoss, generator_network=MyGenerator())
-
-
-

If parameters were excluded, they need to be provided at the time of loading:

-
# the excluded parameters were `loss_fx` and `generator_network`
-model = LitMNIST.load_from_checkpoint(PATH, loss_fx=torch.nn.SomeOtherLoss, generator_network=MyGenerator())
-
-
-
-
-
-
-

Trainer args

-

To recap, add ALL possible trainer flags to the argparser and init the Trainer this way

-
parser = ArgumentParser()
-parser = Trainer.add_argparse_args(parser)
-hparams = parser.parse_args()
-
-trainer = Trainer.from_argparse_args(hparams)
-
-# or if you need to pass in callbacks
-trainer = Trainer.from_argparse_args(hparams, enable_checkpointing=..., callbacks=[...])
-
-
-
-
-
-

Multiple Lightning Modules

-

We often have multiple Lightning Modules where each one has different arguments. Instead of -polluting the main.py file, the LightningModule lets you define arguments for each one.

-
class LitMNIST(LightningModule):
-    def __init__(self, layer_1_dim, **kwargs):
-        super().__init__()
-        self.layer_1 = nn.Linear(28 * 28, layer_1_dim)
-
-    @staticmethod
-    def add_model_specific_args(parent_parser):
-        parser = parent_parser.add_argument_group("LitMNIST")
-        parser.add_argument("--layer_1_dim", type=int, default=128)
-        return parent_parser
-
-
-
class GoodGAN(LightningModule):
-    def __init__(self, encoder_layers, **kwargs):
-        super().__init__()
-        self.encoder = Encoder(layers=encoder_layers)
-
-    @staticmethod
-    def add_model_specific_args(parent_parser):
-        parser = parent_parser.add_argument_group("GoodGAN")
-        parser.add_argument("--encoder_layers", type=int, default=12)
-        return parent_parser
-
-
-

Now we can allow each model to inject the arguments it needs in the main.py

-
def main(args):
-    dict_args = vars(args)
-
-    # pick model
-    if args.model_name == "gan":
-        model = GoodGAN(**dict_args)
-    elif args.model_name == "mnist":
-        model = LitMNIST(**dict_args)
-
-    trainer = Trainer.from_argparse_args(args)
-    trainer.fit(model)
-
-
-if __name__ == "__main__":
-    parser = ArgumentParser()
-    parser = Trainer.add_argparse_args(parser)
-
-    # figure out which model to use
-    parser.add_argument("--model_name", type=str, default="gan", help="gan or mnist")
-
-    # THIS LINE IS KEY TO PULL THE MODEL NAME
-    temp_args, _ = parser.parse_known_args()
-
-    # let the model add what it wants
-    if temp_args.model_name == "gan":
-        parser = GoodGAN.add_model_specific_args(parser)
-    elif temp_args.model_name == "mnist":
-        parser = LitMNIST.add_model_specific_args(parser)
-
-    args = parser.parse_args()
-
-    # train
-    main(args)
-
-
-

and now we can train MNIST or the GAN using the command line interface!

-
$ python main.py --model_name gan --encoder_layers 24
-$ python main.py --model_name mnist --layer_1_dim 128
-
-
-
-
- - -
- -
-
- - - - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/common/lightning_module.html b/docs/common/lightning_module.html deleted file mode 100644 index 1041cd4..0000000 --- a/docs/common/lightning_module.html +++ /dev/null @@ -1,4988 +0,0 @@ - - - - - - - - - - - - - - LightningModule — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- - - - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

LightningModule

-

A LightningModule organizes your PyTorch code into 6 sections:

-
    -
  • Computations (init).

  • -
  • Train Loop (training_step)

  • -
  • Validation Loop (validation_step)

  • -
  • Test Loop (test_step)

  • -
  • Prediction Loop (predict_step)

  • -
  • Optimizers and LR Schedulers (configure_optimizers)

  • -
-
-

-
-
-

-
-

Notice a few things.

-
    -
  1. It is the SAME code.

  2. -
  3. The PyTorch code IS NOT abstracted - just organized.

  4. -
  5. All the other code that’s not in the LightningModule -has been automated for you by the Trainer.

  6. -
-
-

-
-
-
net = Net()
-trainer = Trainer()
-trainer.fit(net)
-
-
-
-
    -
  1. There are no .cuda() or .to(device) calls required. Lightning does these for you.

  2. -
-
-

-
-
-
# don't do in Lightning
-x = torch.Tensor(2, 3)
-x = x.cuda()
-x = x.to(device)
-
-# do this instead
-x = x  # leave it alone!
-
-# or to init a new tensor
-new_x = torch.Tensor(2, 3)
-new_x = new_x.type_as(x)
-
-
-
-
    -
  1. When running under a distributed strategy, Lightning handles the distributed sampler for you by default.

  2. -
-
-

-
-
-
# Don't do in Lightning...
-data = MNIST(...)
-sampler = DistributedSampler(data)
-DataLoader(data, sampler=sampler)
-
-# do this instead
-data = MNIST(...)
-DataLoader(data)
-
-
-
-
    -
  1. A LightningModule is a torch.nn.Module but with added functionality. Use it as such!

  2. -
-
-

-
-
-
net = Net.load_from_checkpoint(PATH)
-net.freeze()
-out = net(x)
-
-
-
-

Thus, to use Lightning, you just need to organize your code, which takes about 30 minutes -(and let’s be real, you probably should do it anyway).

-
-
-

Starter Example

-

Here are the only required methods.

-
import pytorch_lightning as pl
-import torch.nn as nn
-import torch.nn.functional as F
-
-
-class LitModel(pl.LightningModule):
-    def __init__(self):
-        super().__init__()
-        self.l1 = nn.Linear(28 * 28, 10)
-
-    def forward(self, x):
-        return torch.relu(self.l1(x.view(x.size(0), -1)))
-
-    def training_step(self, batch, batch_idx):
-        x, y = batch
-        y_hat = self(x)
-        loss = F.cross_entropy(y_hat, y)
-        return loss
-
-    def configure_optimizers(self):
-        return torch.optim.Adam(self.parameters(), lr=0.02)
-
-
-

Which you can train by doing:

-
train_loader = DataLoader(MNIST(os.getcwd(), download=True, transform=transforms.ToTensor()))
-trainer = pl.Trainer(max_epochs=1)
-model = LitModel()
-
-trainer.fit(model, train_dataloaders=train_loader)
-
-
-

The LightningModule has many convenience methods, but the core ones you need to know about are:

- ---- - - - - - - - - - - - - - - - - - - - - - - - - - - - - -

Name

Description

init

Define computations here

forward

Use for inference only (separate from training_step)

training_step

the complete training loop

validation_step

the complete validation loop

test_step

the complete test loop

predict_step

the complete prediction loop

configure_optimizers

define optimizers and LR schedulers

-
-
-
-

Training

-
-

Training Loop

-

To activate the training loop, override the training_step() method.

-
class LitClassifier(pl.LightningModule):
-    def __init__(self, model):
-        super().__init__()
-        self.model = model
-
-    def training_step(self, batch, batch_idx):
-        x, y = batch
-        y_hat = self.model(x)
-        loss = F.cross_entropy(y_hat, y)
-        return loss
-
-
-

Under the hood, Lightning does the following (pseudocode):

-
# put model in train mode and enable gradient calculation
-model.train()
-torch.set_grad_enabled(True)
-
-outs = []
-for batch_idx, batch in enumerate(train_dataloader):
-    loss = training_step(batch, batch_idx)
-    outs.append(loss.detach())
-
-    # clear gradients
-    optimizer.zero_grad()
-
-    # backward
-    loss.backward()
-
-    # update parameters
-    optimizer.step()
-
-
-
-
-

Train Epoch-level Metrics

-

If you want to calculate epoch-level metrics and log them, use log().

-
def training_step(self, batch, batch_idx):
-    x, y = batch
-    y_hat = self.model(x)
-    loss = F.cross_entropy(y_hat, y)
-
-    # logs metrics for each training_step,
-    # and the average across the epoch, to the progress bar and logger
-    self.log("train_loss", loss, on_step=True, on_epoch=True, prog_bar=True, logger=True)
-    return loss
-
-
-

The log() method automatically reduces the -requested metrics across a complete epoch and devices. Here’s the pseudocode of what it does under the hood:

-
outs = []
-for batch_idx, batch in enumerate(train_dataloader):
-    # forward
-    loss = training_step(batch, batch_idx)
-    outs.append(loss)
-
-    # clear gradients
-    optimizer.zero_grad()
-
-    # backward
-    loss.backward()
-
-    # update parameters
-    optimizer.step()
-
-epoch_metric = torch.mean(torch.stack([x for x in outs]))
-
-
-
-
-

Train Epoch-level Operations

-

If you need to do something with all the outputs of each training_step(), -override the training_epoch_end() method.

-
def training_step(self, batch, batch_idx):
-    x, y = batch
-    y_hat = self.model(x)
-    loss = F.cross_entropy(y_hat, y)
-    preds = ...
-    return {"loss": loss, "other_stuff": preds}
-
-
-def training_epoch_end(self, training_step_outputs):
-    all_preds = torch.stack(training_step_outputs)
-    ...
-
-
-

The matching pseudocode is:

-
outs = []
-for batch_idx, batch in enumerate(train_dataloader):
-    # forward
-    loss = training_step(batch, batch_idx)
-    outs.append(loss)
-
-    # clear gradients
-    optimizer.zero_grad()
-
-    # backward
-    loss.backward()
-
-    # update parameters
-    optimizer.step()
-
-training_epoch_end(outs)
-
-
-
-
-

Training with DataParallel

-

When training using a strategy that splits data from each batch across GPUs, sometimes you might -need to aggregate them on the main GPU for processing (DP, or DDP2).

-

In this case, implement the training_step_end() -method which will have outputs from all the devices and you can accumulate to get the effective results.

-
def training_step(self, batch, batch_idx):
-    x, y = batch
-    y_hat = self.model(x)
-    loss = F.cross_entropy(y_hat, y)
-    pred = ...
-    return {"loss": loss, "pred": pred}
-
-
-def training_step_end(self, batch_parts):
-    # predictions from each GPU
-    predictions = batch_parts["pred"]
-    # losses from each GPU
-    losses = batch_parts["loss"]
-
-    gpu_0_prediction = predictions[0]
-    gpu_1_prediction = predictions[1]
-
-    # do something with both outputs
-    return (losses[0] + losses[1]) / 2
-
-
-def training_epoch_end(self, training_step_outputs):
-    for out in training_step_outputs:
-        ...
-
-
-

Here is the Lightning training pseudo-code for DP:

-
outs = []
-for batch_idx, train_batch in enumerate(train_dataloader):
-    batches = split_batch(train_batch)
-    dp_outs = []
-    for sub_batch in batches:
-        # 1
-        dp_out = training_step(sub_batch, batch_idx)
-        dp_outs.append(dp_out)
-
-    # 2
-    out = training_step_end(dp_outs)
-    outs.append(out)
-
-# do something with the outputs for all batches
-# 3
-training_epoch_end(outs)
-
-
-
-
-
-
-

Validation

-
-

Validation Loop

-

To activate the validation loop while training, override the validation_step() method.

-
class LitModel(pl.LightningModule):
-    def validation_step(self, batch, batch_idx):
-        x, y = batch
-        y_hat = self.model(x)
-        loss = F.cross_entropy(y_hat, y)
-        self.log("val_loss", loss)
-
-
-

Under the hood, Lightning does the following (pseudocode):

-
# ...
-for batch_idx, batch in enumerate(train_dataloader):
-    loss = model.training_step(batch, batch_idx)
-    loss.backward()
-    # ...
-
-    if validate_at_some_point:
-        # disable grads + batchnorm + dropout
-        torch.set_grad_enabled(False)
-        model.eval()
-
-        # ----------------- VAL LOOP ---------------
-        for val_batch_idx, val_batch in enumerate(val_dataloader):
-            val_out = model.validation_step(val_batch, val_batch_idx)
-        # ----------------- VAL LOOP ---------------
-
-        # enable grads + batchnorm + dropout
-        torch.set_grad_enabled(True)
-        model.train()
-
-
-

You can also run just the validation loop on your validation dataloaders by overriding validation_step() -and calling validate().

-
model = Model()
-trainer = Trainer()
-trainer.validate(model)
-
-
-
-

Note

-

It is recommended to validate on a single device to ensure each sample/batch gets evaluated exactly once. -This is helpful to make sure benchmarking for research papers is done the right way. Otherwise, in a -multi-device setting, samples could be duplicated when DistributedSampler -is used, e.g. with strategy="ddp". It replicates some samples on some devices to make sure all devices have -the same batch size in case of uneven inputs.

-
-
-
-

Validation Epoch-level Metrics

-

If you need to do something with all the outputs of each validation_step(), -override the validation_epoch_end() method. Note that this method is called before training_epoch_end().

-
def validation_step(self, batch, batch_idx):
-    x, y = batch
-    y_hat = self.model(x)
-    loss = F.cross_entropy(y_hat, y)
-    pred = ...
-    return pred
-
-
-def validation_epoch_end(self, validation_step_outputs):
-    all_preds = torch.stack(validation_step_outputs)
-    ...
-
-
-
-
-

Validating with DataParallel

-

When training using a strategy that splits data from each batch across GPUs, sometimes you might -need to aggregate them on the main GPU for processing (DP, or DDP2).

-

In this case, implement the validation_step_end() -method which will have outputs from all the devices and you can accumulate to get the effective results.

-
def validation_step(self, batch, batch_idx):
-    x, y = batch
-    y_hat = self.model(x)
-    loss = F.cross_entropy(y_hat, y)
-    pred = ...
-    return {"loss": loss, "pred": pred}
-
-
-def validation_step_end(self, batch_parts):
-    # predictions from each GPU
-    predictions = batch_parts["pred"]
-    # losses from each GPU
-    losses = batch_parts["loss"]
-
-    gpu_0_prediction = predictions[0]
-    gpu_1_prediction = predictions[1]
-
-    # do something with both outputs
-    return (losses[0] + losses[1]) / 2
-
-
-def validation_epoch_end(self, validation_step_outputs):
-    for out in validation_step_outputs:
-        ...
-
-
-

Here is the Lightning validation pseudo-code for DP:

-
outs = []
-for batch in dataloader:
-    batches = split_batch(batch)
-    dp_outs = []
-    for sub_batch in batches:
-        # 1
-        dp_out = validation_step(sub_batch)
-        dp_outs.append(dp_out)
-
-    # 2
-    out = validation_step_end(dp_outs)
-    outs.append(out)
-
-# do something with the outputs for all batches
-# 3
-validation_epoch_end(outs)
-
-
-
-
-
-
-

Testing

-
-

Test Loop

-

The process for enabling a test loop is the same as the process for enabling a validation loop. Please refer to -the section above for details. For this you need to override the test_step() method.

-

The only difference is that the test loop is only called when test() is used.

-
model = Model()
-trainer = Trainer()
-trainer.fit(model)
-
-# automatically loads the best weights for you
-trainer.test(model)
-
-
-

There are two ways to call test():

-
# call after training
-trainer = Trainer()
-trainer.fit(model)
-
-# automatically auto-loads the best weights from the previous run
-trainer.test(dataloaders=test_dataloader)
-
-# or call with pretrained model
-model = MyLightningModule.load_from_checkpoint(PATH)
-trainer = Trainer()
-trainer.test(model, dataloaders=test_dataloader)
-
-
-
-

Note

-

It is recommended to test on a single device to ensure each sample/batch gets evaluated exactly once. -This is helpful to make sure benchmarking for research papers is done the right way. Otherwise, in a -multi-device setting, samples could be duplicated when DistributedSampler -is used, e.g. with strategy="ddp". It replicates some samples on some devices to make sure all devices have -the same batch size in case of uneven inputs.

-
-
-
-
-
-

Inference

-
-

Prediction Loop

-

By default, the predict_step() method runs the -forward() method. In order to customize this behaviour, -simply override the predict_step() method.

-

For the example let’s override predict_step and try out Monte Carlo Dropout:

-
class LitMCdropoutModel(pl.LightningModule):
-    def __init__(self, model, mc_iteration):
-        super().__init__()
-        self.model = model
-        self.dropout = nn.Dropout()
-        self.mc_iteration = mc_iteration
-
-    def predict_step(self, batch, batch_idx):
-        # enable Monte Carlo Dropout
-        self.dropout.train()
-
-        # take average of `self.mc_iteration` iterations
-        pred = torch.vstack([self.dropout(self.model(x)).unsqueeze(0) for _ in range(self.mc_iteration)]).mean(dim=0)
-        return pred
-
-
-

Under the hood, Lightning does the following (pseudocode):

-
# disable grads + batchnorm + dropout
-torch.set_grad_enabled(False)
-model.eval()
-all_preds = []
-
-for batch_idx, batch in enumerate(predict_dataloader):
-    pred = model.predict_step(batch, batch_idx)
-    all_preds.append(pred)
-
-
-

There are two ways to call predict():

-
# call after training
-trainer = Trainer()
-trainer.fit(model)
-
-# automatically auto-loads the best weights from the previous run
-predictions = trainer.predict(dataloaders=predict_dataloader)
-
-# or call with pretrained model
-model = MyLightningModule.load_from_checkpoint(PATH)
-trainer = Trainer()
-predictions = trainer.predict(model, dataloaders=test_dataloader)
-
-
-
-
-

Inference in Research

-

If you want to perform inference with the system, you can add a forward method to the LightningModule.

-
-

Note

-

When using forward, you are responsible for calling eval() and using the no_grad() context manager.

-
-
class Autoencoder(pl.LightningModule):
-    def forward(self, x):
-        return self.decoder(x)
-
-
-model = Autoencoder()
-model.eval()
-with torch.no_grad():
-    reconstruction = model(embedding)
-
-
-

The advantage of adding a forward is that in complex systems, you can do a much more involved inference procedure, -such as text generation:

-
class Seq2Seq(pl.LightningModule):
-    def forward(self, x):
-        embeddings = self(x)
-        hidden_states = self.encoder(embeddings)
-        for h in hidden_states:
-            # decode
-            ...
-        return decoded
-
-
-

In the case where you want to scale your inference, you should be using -predict_step().

-
class Autoencoder(pl.LightningModule):
-    def forward(self, x):
-        return self.decoder(x)
-
-    def predict_step(self, batch, batch_idx, dataloader_idx=0):
-        # this calls forward
-        return self(batch)
-
-
-data_module = ...
-model = Autoencoder()
-trainer = Trainer(accelerator="gpu", devices=2)
-trainer.predict(model, data_module)
-
-
-
-
-

Inference in Production

-

For cases like production, you might want to iterate different models inside a LightningModule.

-
from torchmetrics.functional import accuracy
-
-
-class ClassificationTask(pl.LightningModule):
-    def __init__(self, model):
-        super().__init__()
-        self.model = model
-
-    def training_step(self, batch, batch_idx):
-        x, y = batch
-        y_hat = self.model(x)
-        loss = F.cross_entropy(y_hat, y)
-        return loss
-
-    def validation_step(self, batch, batch_idx):
-        loss, acc = self._shared_eval_step(batch, batch_idx)
-        metrics = {"val_acc": acc, "val_loss": loss}
-        self.log_dict(metrics)
-        return metrics
-
-    def test_step(self, batch, batch_idx):
-        loss, acc = self._shared_eval_step(batch, batch_idx)
-        metrics = {"test_acc": acc, "test_loss": loss}
-        self.log_dict(metrics)
-        return metrics
-
-    def _shared_eval_step(self, batch, batch_idx):
-        x, y = batch
-        y_hat = self.model(x)
-        loss = F.cross_entropy(y_hat, y)
-        acc = accuracy(y_hat, y)
-        return loss, acc
-
-    def predict_step(self, batch, batch_idx, dataloader_idx=0):
-        x, y = batch
-        y_hat = self.model(x)
-        return y_hat
-
-    def configure_optimizers(self):
-        return torch.optim.Adam(self.model.parameters(), lr=0.02)
-
-
-

Then pass in any arbitrary model to be fit with this task

-
for model in [resnet50(), vgg16(), BidirectionalRNN()]:
-    task = ClassificationTask(model)
-
-    trainer = Trainer(accelerator="gpu", devices=2)
-    trainer.fit(task, train_dataloaders=train_dataloader, val_dataloaders=val_dataloader)
-
-
-

Tasks can be arbitrarily complex such as implementing GAN training, self-supervised or even RL.

-
class GANTask(pl.LightningModule):
-    def __init__(self, generator, discriminator):
-        super().__init__()
-        self.generator = generator
-        self.discriminator = discriminator
-
-    ...
-
-
-

When used like this, the model can be separated from the Task and thus used in production without needing to keep it in -a LightningModule.

-

The following example shows how you can run inference in the Python runtime:

-
task = ClassificationTask(model)
-trainer = Trainer(accelerator="gpu", devices=2)
-trainer.fit(task, train_dataloader, val_dataloader)
-trainer.save_checkpoint("best_model.ckpt")
-
-# use model after training or load weights and drop into the production system
-model = ClassificationTask.load_from_checkpoint("best_model.ckpt")
-x = ...
-model.eval()
-with torch.no_grad():
-    y_hat = model(x)
-
-
-

Check out Inference in Production guide to learn about the possible ways to perform inference in production.

-
-
-
-
-

Child Modules

-

Research projects tend to test different approaches to the same dataset. -This is very easy to do in Lightning with inheritance.

-

For example, imagine we now want to train an AutoEncoder to use as a feature extractor for images. -The only things that change in the LitAutoEncoder model are the init, forward, training, validation and test step.

-
class Encoder(torch.nn.Module):
-    ...
-
-
-class Decoder(torch.nn.Module):
-    ...
-
-
-class AutoEncoder(torch.nn.Module):
-    def __init__(self):
-        super().__init__()
-        self.encoder = Encoder()
-        self.decoder = Decoder()
-
-    def forward(self, x):
-        return self.decoder(self.encoder(x))
-
-
-class LitAutoEncoder(LightningModule):
-    def __init__(self, auto_encoder):
-        super().__init__()
-        self.auto_encoder = auto_encoder
-        self.metric = torch.nn.MSELoss()
-
-    def forward(self, x):
-        return self.auto_encoder.encoder(x)
-
-    def training_step(self, batch, batch_idx):
-        x, _ = batch
-        x_hat = self.auto_encoder(x)
-        loss = self.metric(x, x_hat)
-        return loss
-
-    def validation_step(self, batch, batch_idx):
-        self._shared_eval(batch, batch_idx, "val")
-
-    def test_step(self, batch, batch_idx):
-        self._shared_eval(batch, batch_idx, "test")
-
-    def _shared_eval(self, batch, batch_idx, prefix):
-        x, _ = batch
-        x_hat = self.auto_encoder(x)
-        loss = self.metric(x, x_hat)
-        self.log(f"{prefix}_loss", loss)
-
-
-

and we can train this using the Trainer:

-
auto_encoder = AutoEncoder()
-lightning_module = LitAutoEncoder(auto_encoder)
-trainer = Trainer()
-trainer.fit(lightning_module, train_dataloader, val_dataloader)
-
-
-

And remember that the forward method should define the practical use of a LightningModule. -In this case, we want to use the LitAutoEncoder to extract image representations:

-
some_images = torch.Tensor(32, 1, 28, 28)
-representations = lightning_module(some_images)
-
-
-
-
-
-

LightningModule API

-
-

Methods

-
-

all_gather

-
-
-LightningModule.all_gather(data, group=None, sync_grads=False)[source]
-

Allows users to call self.all_gather() from the LightningModule, thus making the all_gather operation -accelerator agnostic. all_gather is a function provided by accelerators to gather a tensor from several -distributed processes.

-
-
Parameters
-
    -
  • data (Union[Tensor, Dict, List, Tuple]) – int, float, tensor of shape (batch, …), or a (possibly nested) collection thereof.

  • -
  • group (Optional[Any]) – the process group to gather results from. Defaults to all processes (world)

  • -
  • sync_grads (bool) – flag that allows users to synchronize gradients for the all_gather operation

  • -
-
-
Returns
-

A tensor of shape (world_size, batch, …), or if the input was a collection -the output will also be a collection with tensors of this shape.

-
-
-
- -
-
-

configure_callbacks

-
-
-LightningModule.configure_callbacks()[source]
-

Configure model-specific callbacks. When the model gets attached, e.g., when .fit() or .test() -gets called, the list or a callback returned here will be merged with the list of callbacks passed to the -Trainer’s callbacks argument. If a callback returned here has the same type as one or several callbacks -already present in the Trainer’s callbacks list, it will take priority and replace them. In addition, -Lightning will make sure ModelCheckpoint callbacks -run last.

-
-
Return type
-

Union[Sequence[Callback], Callback]

-
-
Returns
-

A callback or a list of callbacks which will extend the list of callbacks in the Trainer.

-
-
-

Example:

-
def configure_callbacks(self):
-    early_stop = EarlyStopping(monitor="val_acc", mode="max")
-    checkpoint = ModelCheckpoint(monitor="val_loss")
-    return [early_stop, checkpoint]
-
-
-
-

Note

-

Certain callback methods like on_init_start() -will never be invoked on the new callbacks returned here.

-
-
- -
-
-

configure_optimizers

-
-
-LightningModule.configure_optimizers()[source]
-

Choose what optimizers and learning-rate schedulers to use in your optimization. -Normally you’d need one. But in the case of GANs or similar you might have multiple.

-
-
Returns
-

Any of these 6 options.

-
    -
  • Single optimizer.

  • -
  • List or Tuple of optimizers.

  • -
  • Two lists - The first list has multiple optimizers, and the second has multiple LR schedulers -(or multiple lr_scheduler_config).

  • -
  • Dictionary, with an "optimizer" key, and (optionally) a "lr_scheduler" -key whose value is a single LR scheduler or lr_scheduler_config.

  • -
  • Tuple of dictionaries as described above, with an optional "frequency" key.

  • -
  • None - Fit will run without any optimizer.

  • -
-

-
-
-

The lr_scheduler_config is a dictionary which contains the scheduler and its associated configuration. -The default configuration is shown below.

-
lr_scheduler_config = {
-    # REQUIRED: The scheduler instance
-    "scheduler": lr_scheduler,
-    # The unit of the scheduler's step size, could also be 'step'.
-    # 'epoch' updates the scheduler on epoch end whereas 'step'
-    # updates it after an optimizer update.
-    "interval": "epoch",
-    # How many epochs/steps should pass between calls to
-    # `scheduler.step()`. 1 corresponds to updating the learning
-    # rate after every epoch/step.
-    "frequency": 1,
-    # Metric to monitor for schedulers like `ReduceLROnPlateau`
-    "monitor": "val_loss",
-    # If set to `True`, will enforce that the value specified in 'monitor'
-    # is available when the scheduler is updated, thus stopping
-    # training if not found. If set to `False`, it will only produce a warning
-    "strict": True,
-    # If using the `LearningRateMonitor` callback to monitor the
-    # learning rate progress, this keyword can be used to specify
-    # a custom logged name
-    "name": None,
-}
-
-
-

When there are schedulers in which the .step() method is conditioned on a value, such as the -torch.optim.lr_scheduler.ReduceLROnPlateau scheduler, Lightning requires that the -lr_scheduler_config contains the keyword "monitor" set to the metric name that the scheduler -should be conditioned on.

-
# The ReduceLROnPlateau scheduler requires a monitor
-def configure_optimizers(self):
-    optimizer = Adam(...)
-    return {
-        "optimizer": optimizer,
-        "lr_scheduler": {
-            "scheduler": ReduceLROnPlateau(optimizer, ...),
-            "monitor": "metric_to_track",
-            "frequency": "indicates how often the metric is updated"
-            # If "monitor" references validation metrics, then "frequency" should be set to a
-            # multiple of "trainer.check_val_every_n_epoch".
-        },
-    }
-
-
-# In the case of two optimizers, only one using the ReduceLROnPlateau scheduler
-def configure_optimizers(self):
-    optimizer1 = Adam(...)
-    optimizer2 = SGD(...)
-    scheduler1 = ReduceLROnPlateau(optimizer1, ...)
-    scheduler2 = LambdaLR(optimizer2, ...)
-    return (
-        {
-            "optimizer": optimizer1,
-            "lr_scheduler": {
-                "scheduler": scheduler1,
-                "monitor": "metric_to_track",
-            },
-        },
-        {"optimizer": optimizer2, "lr_scheduler": scheduler2},
-    )
-
-
-

Metrics can be made available to monitor by simply logging it using -self.log('metric_to_track', metric_val) in your LightningModule.

-
-

Note

-

The frequency value specified in a dict along with the optimizer key is an int corresponding -to the number of sequential batches optimized with the specific optimizer. -It should be given to none or to all of the optimizers. -There is a difference between passing multiple optimizers in a list, -and passing multiple optimizers in dictionaries with a frequency of 1:

-
-
    -
  • In the former case, all optimizers will operate on the given batch in each optimization step.

  • -
  • In the latter, only one optimizer will operate on the given batch at every step.

  • -
-
-

This is different from the frequency value specified in the lr_scheduler_config mentioned above.

-
def configure_optimizers(self):
-    optimizer_one = torch.optim.SGD(self.model.parameters(), lr=0.01)
-    optimizer_two = torch.optim.SGD(self.model.parameters(), lr=0.01)
-    return [
-        {"optimizer": optimizer_one, "frequency": 5},
-        {"optimizer": optimizer_two, "frequency": 10},
-    ]
-
-
-

In this example, the first optimizer will be used for the first 5 steps, -the second optimizer for the next 10 steps and that cycle will continue. -If an LR scheduler is specified for an optimizer using the lr_scheduler key in the above dict, -the scheduler will only be updated when its optimizer is being used.

-
-

Examples:

-
# most cases. no learning rate scheduler
-def configure_optimizers(self):
-    return Adam(self.parameters(), lr=1e-3)
-
-# multiple optimizer case (e.g.: GAN)
-def configure_optimizers(self):
-    gen_opt = Adam(self.model_gen.parameters(), lr=0.01)
-    dis_opt = Adam(self.model_dis.parameters(), lr=0.02)
-    return gen_opt, dis_opt
-
-# example with learning rate schedulers
-def configure_optimizers(self):
-    gen_opt = Adam(self.model_gen.parameters(), lr=0.01)
-    dis_opt = Adam(self.model_dis.parameters(), lr=0.02)
-    dis_sch = CosineAnnealing(dis_opt, T_max=10)
-    return [gen_opt, dis_opt], [dis_sch]
-
-# example with step-based learning rate schedulers
-# each optimizer has its own scheduler
-def configure_optimizers(self):
-    gen_opt = Adam(self.model_gen.parameters(), lr=0.01)
-    dis_opt = Adam(self.model_dis.parameters(), lr=0.02)
-    gen_sch = {
-        'scheduler': ExponentialLR(gen_opt, 0.99),
-        'interval': 'step'  # called after each training step
-    }
-    dis_sch = CosineAnnealing(dis_opt, T_max=10) # called every epoch
-    return [gen_opt, dis_opt], [gen_sch, dis_sch]
-
-# example with optimizer frequencies
-# see training procedure in `Improved Training of Wasserstein GANs`, Algorithm 1
-# https://arxiv.org/abs/1704.00028
-def configure_optimizers(self):
-    gen_opt = Adam(self.model_gen.parameters(), lr=0.01)
-    dis_opt = Adam(self.model_dis.parameters(), lr=0.02)
-    n_critic = 5
-    return (
-        {'optimizer': dis_opt, 'frequency': n_critic},
-        {'optimizer': gen_opt, 'frequency': 1}
-    )
-
-
-
-

Note

-

Some things to know:

-
    -
  • Lightning calls .backward() and .step() on each optimizer and learning rate scheduler as needed.

  • -
  • If you use 16-bit precision (precision=16), Lightning will automatically handle the optimizers.

  • -
  • If you use multiple optimizers, training_step() will have an additional optimizer_idx parameter.

  • -
  • If you use torch.optim.LBFGS, Lightning handles the closure function automatically for you.

  • -
  • If you use multiple optimizers, gradients will be calculated only for the parameters of current optimizer -at each training step.

  • -
  • If you need to control how often those optimizers step or override the default .step() schedule, -override the optimizer_step() hook.

  • -
-
-
- -
-
-

forward

-
-
-LightningModule.forward(*args, **kwargs)[source]
-

Same as torch.nn.Module.forward().

-
-
Parameters
-
    -
  • *args – Whatever you decide to pass into the forward method.

  • -
  • **kwargs – Keyword arguments are also possible.

  • -
-
-
Return type
-

Any

-
-
Returns
-

Your model’s output

-
-
-
- -
-
-

freeze

-
-
-LightningModule.freeze()[source]
-

Freeze all params for inference.

-

Example:

-
model = MyLightningModule(...)
-model.freeze()
-
-
-
-
Return type
-

None

-
-
-
- -
-
-

log

-
-
-LightningModule.log(name, value, prog_bar=False, logger=True, on_step=None, on_epoch=None, reduce_fx='mean', enable_graph=False, sync_dist=False, sync_dist_group=None, add_dataloader_idx=True, batch_size=None, metric_attribute=None, rank_zero_only=False)[source]
-

Log a key, value pair.

-

Example:

-
self.log('train_loss', loss)
-
-
-

The default behavior per hook is documented here: Automatic Logging.

-
-
Parameters
-
    -
  • name (str) – key to log.

  • -
  • value (Union[Metric, Tensor, int, float, Mapping[str, Union[Metric, Tensor, int, float]]]) – value to log. Can be a float, Tensor, Metric, or a dictionary of the former.

  • -
  • prog_bar (bool) – if True logs to the progress bar.

  • -
  • logger (bool) – if True logs to the logger.

  • -
  • on_step (Optional[bool]) – if True logs at this step. The default value is determined by the hook. -See Automatic Logging for details.

  • -
  • on_epoch (Optional[bool]) – if True logs epoch accumulated metrics. The default value is determined by the hook. -See Automatic Logging for details.

  • -
  • reduce_fx (Union[str, Callable]) – reduction function over step values for end of epoch. torch.mean() by default.

  • -
  • enable_graph (bool) – if True, will not auto detach the graph.

  • -
  • sync_dist (bool) – if True, reduces the metric across devices. Use with care as this may lead to a significant -communication overhead.

  • -
  • sync_dist_group (Optional[Any]) – the DDP group to sync across.

  • -
  • add_dataloader_idx (bool) – if True, appends the index of the current dataloader to -the name (when using multiple dataloaders). If False, user needs to give unique names for -each dataloader to not mix the values.

  • -
  • batch_size (Optional[int]) – Current batch_size. This will be directly inferred from the loaded batch, -but for some data structures you might need to explicitly provide it.

  • -
  • metric_attribute (Optional[str]) – To restore the metric state, Lightning requires the reference of the -torchmetrics.Metric in your model. This is found automatically if it is a model attribute.

  • -
  • rank_zero_only (bool) – Whether the value will be logged only on rank 0. This will prevent synchronization which -would produce a deadlock as not all processes would perform this log call.

  • -
-
-
Return type
-

None

-
-
-
- -
-
-

log_dict

-
-
-LightningModule.log_dict(dictionary, prog_bar=False, logger=True, on_step=None, on_epoch=None, reduce_fx='mean', enable_graph=False, sync_dist=False, sync_dist_group=None, add_dataloader_idx=True, batch_size=None, rank_zero_only=False)[source]
-

Log a dictionary of values at once.

-

Example:

-
values = {'loss': loss, 'acc': acc, ..., 'metric_n': metric_n}
-self.log_dict(values)
-
-
-
-
Parameters
-
    -
  • dictionary (Mapping[str, Union[Metric, Tensor, int, float, Mapping[str, Union[Metric, Tensor, int, float]]]]) – key value pairs. -The values can be a float, Tensor, Metric, or a dictionary of the former.

  • -
  • prog_bar (bool) – if True logs to the progress bar.

  • -
  • logger (bool) – if True logs to the logger.

  • -
  • on_step (Optional[bool]) – if True logs at this step. -None auto-logs for training_step but not validation/test_step. -The default value is determined by the hook. -See Automatic Logging for details.

  • -
  • on_epoch (Optional[bool]) – if True logs epoch accumulated metrics. -None auto-logs for val/test step but not training_step. -The default value is determined by the hook. -See Automatic Logging for details.

  • -
  • reduce_fx (Union[str, Callable]) – reduction function over step values for end of epoch. torch.mean() by default.

  • -
  • enable_graph (bool) – if True, will not auto-detach the graph

  • -
  • sync_dist (bool) – if True, reduces the metric across GPUs/TPUs. Use with care as this may lead to a significant -communication overhead.

  • -
  • sync_dist_group (Optional[Any]) – the ddp group to sync across.

  • -
  • add_dataloader_idx (bool) – if True, appends the index of the current dataloader to -the name (when using multiple). If False, user needs to give unique names for -each dataloader to not mix values.

  • -
  • batch_size (Optional[int]) – Current batch size. This will be directly inferred from the loaded batch, -but for some data structures you might need to explicitly provide it.

  • -
  • rank_zero_only (bool) – Whether the value will be logged only on rank 0. This will prevent synchronization which -would produce a deadlock as not all processes would perform this log call.

  • -
-
-
Return type
-

None

-
-
-
- -
-
-

lr_schedulers

-
-
-LightningModule.lr_schedulers()[source]
-

Returns the learning rate scheduler(s) that are being used during training. Useful for manual -optimization.

-
-
Return type
-

Union[_LRScheduler, ReduceLROnPlateau, List[Union[_LRScheduler, ReduceLROnPlateau]], None]

-
-
Returns
-

A single scheduler, or a list of schedulers in case multiple ones are present, or None if no -schedulers were returned in configure_optimizers().

-
-
-
- -
-
-

manual_backward

-
-
-LightningModule.manual_backward(loss, *args, **kwargs)[source]
-

Call this directly from your training_step() when doing optimizations manually. By using this, -Lightning can ensure that all the proper scaling gets applied when using mixed precision.

-

See manual optimization for more examples.

-

Example:

-
def training_step(...):
-    opt = self.optimizers()
-    loss = ...
-    opt.zero_grad()
-    # automatically applies scaling, etc...
-    self.manual_backward(loss)
-    opt.step()
-
-
-
-
Parameters
-
    -
  • loss (Tensor) – The tensor on which to compute gradients. Must have a graph attached.

  • -
  • *args – Additional positional arguments to be forwarded to backward()

  • -
  • **kwargs – Additional keyword arguments to be forwarded to backward()

  • -
-
-
Return type
-

None

-
-
-
- -
-
-

optimizers

-
-
-LightningModule.optimizers(use_pl_optimizer: Literal[True] = True) Union[pytorch_lightning.core.optimizer.LightningOptimizer, List[pytorch_lightning.core.optimizer.LightningOptimizer]][source]
-
-LightningModule.optimizers(use_pl_optimizer: Literal[False]) Union[torch.optim.optimizer.Optimizer, List[torch.optim.optimizer.Optimizer]]
-
-LightningModule.optimizers(use_pl_optimizer: bool) Union[torch.optim.optimizer.Optimizer, pytorch_lightning.core.optimizer.LightningOptimizer, List[torch.optim.optimizer.Optimizer], List[pytorch_lightning.core.optimizer.LightningOptimizer]]
-

Returns the optimizer(s) that are being used during training. Useful for manual optimization.

-
-
Parameters
-

use_pl_optimizer (bool) – If True, will wrap the optimizer(s) in a -LightningOptimizer for automatic handling of precision and -profiling.

-
-
Return type
-

Union[Optimizer, LightningOptimizer, List[Optimizer], List[LightningOptimizer]]

-
-
Returns
-

A single optimizer, or a list of optimizers in case multiple ones are present.

-
-
-
- -
-
-

print

-
-
-LightningModule.print(*args, **kwargs)[source]
-

Prints only from process 0. Use this in any distributed mode to log only once.

-
-
Parameters
-
    -
  • *args – The thing to print. The same as for Python’s built-in print function.

  • -
  • **kwargs – The same as for Python’s built-in print function.

  • -
-
-
-

Example:

-
def forward(self, x):
-    self.print(x, 'in forward')
-
-
-
-
Return type
-

None

-
-
-
- -
-
-

predict_step

-
-
-LightningModule.predict_step(batch, batch_idx, dataloader_idx=0)[source]
-

Step function called during predict(). By default, it -calls forward(). Override to add any processing -logic.

-

The predict_step() is used -to scale inference on multi-devices.

-

To prevent an OOM error, it is possible to use BasePredictionWriter -callback to write the predictions to disk or database after each batch or on epoch end.

-

The BasePredictionWriter should be used while using a spawn -based accelerator. This happens for Trainer(strategy="ddp_spawn") -or training on 8 TPU cores with Trainer(accelerator="tpu", devices=8) as predictions won’t be returned.

-

Example

-
class MyModel(LightningModule):
-
-    def predict_step(self, batch, batch_idx, dataloader_idx=0):
-        return self(batch)
-
-dm = ...
-model = MyModel()
-trainer = Trainer(accelerator="gpu", devices=2)
-predictions = trainer.predict(model, dm)
-
-
-
-
Parameters
-
    -
  • batch (Any) – Current batch.

  • -
  • batch_idx (int) – Index of current batch.

  • -
  • dataloader_idx (int) – Index of the current dataloader.

  • -
-
-
Return type
-

Any

-
-
Returns
-

Predicted output

-
-
-
- -
-
-

save_hyperparameters

-
-
-LightningModule.save_hyperparameters(*args, ignore=None, frame=None, logger=True)
-

Save arguments to hparams attribute.

-
-
Parameters
-
    -
  • args (Any) – single object of dict, NameSpace or OmegaConf -or string names or arguments from class __init__

  • -
  • ignore (Union[Sequence[str], str, None]) – an argument name or a list of argument names from -class __init__ to be ignored

  • -
  • frame (Optional[frame]) – a frame object. Default is None

  • -
  • logger (bool) – Whether to send the hyperparameters to the logger. Default: True

  • -
-
-
-
-
Example::
>>> class ManuallyArgsModel(HyperparametersMixin):
-...     def __init__(self, arg1, arg2, arg3):
-...         super().__init__()
-...         # manually assign arguments
-...         self.save_hyperparameters('arg1', 'arg3')
-...     def forward(self, *args, **kwargs):
-...         ...
->>> model = ManuallyArgsModel(1, 'abc', 3.14)
->>> model.hparams
-"arg1": 1
-"arg3": 3.14
-
-
-
>>> class AutomaticArgsModel(HyperparametersMixin):
-...     def __init__(self, arg1, arg2, arg3):
-...         super().__init__()
-...         # equivalent automatic
-...         self.save_hyperparameters()
-...     def forward(self, *args, **kwargs):
-...         ...
->>> model = AutomaticArgsModel(1, 'abc', 3.14)
->>> model.hparams
-"arg1": 1
-"arg2": abc
-"arg3": 3.14
-
-
-
>>> class SingleArgModel(HyperparametersMixin):
-...     def __init__(self, params):
-...         super().__init__()
-...         # manually assign single argument
-...         self.save_hyperparameters(params)
-...     def forward(self, *args, **kwargs):
-...         ...
->>> model = SingleArgModel(Namespace(p1=1, p2='abc', p3=3.14))
->>> model.hparams
-"p1": 1
-"p2": abc
-"p3": 3.14
-
-
-
>>> class ManuallyArgsModel(HyperparametersMixin):
-...     def __init__(self, arg1, arg2, arg3):
-...         super().__init__()
-...         # pass argument(s) to ignore as a string or in a list
-...         self.save_hyperparameters(ignore='arg2')
-...     def forward(self, *args, **kwargs):
-...         ...
->>> model = ManuallyArgsModel(1, 'abc', 3.14)
->>> model.hparams
-"arg1": 1
-"arg3": 3.14
-
-
-
-
-
-
Return type
-

None

-
-
-
- -
-
-

toggle_optimizer

-
-
-LightningModule.toggle_optimizer(optimizer, optimizer_idx)[source]
-

Makes sure only the gradients of the current optimizer’s parameters are calculated in the training step -to prevent dangling gradients in multiple-optimizer setup.

-

This is only called automatically when automatic optimization is enabled and multiple optimizers are used. -It works with untoggle_optimizer() to make sure param_requires_grad_state is properly reset.

-
-
Parameters
-
    -
  • optimizer (Union[Optimizer, LightningOptimizer]) – The optimizer to toggle.

  • -
  • optimizer_idx (int) – The index of the optimizer to toggle.

  • -
-
-
Return type
-

None

-
-
-
- -
-
-

test_step

-
-
-LightningModule.test_step(*args, **kwargs)[source]
-

Operates on a single batch of data from the test set. -In this step you’d normally generate examples or calculate anything of interest -such as accuracy.

-
# the pseudocode for these calls
-test_outs = []
-for test_batch in test_data:
-    out = test_step(test_batch)
-    test_outs.append(out)
-test_epoch_end(test_outs)
-
-
-
-
Parameters
-
    -
  • batch – The output of your DataLoader.

  • -
  • batch_idx – The index of this batch.

  • -
  • dataloader_idx – The index of the dataloader that produced this batch. -(only if multiple test dataloaders used).

  • -
-
-
Return type
-

Union[Tensor, Dict[str, Any], None]

-
-
Returns
-

Any of.

-
-
    -
  • Any object or value

  • -
  • None - Testing will skip to the next batch

  • -
-
-

-
-
-
# if you have one test dataloader:
-def test_step(self, batch, batch_idx):
-    ...
-
-
-# if you have multiple test dataloaders:
-def test_step(self, batch, batch_idx, dataloader_idx=0):
-    ...
-
-
-

Examples:

-
# CASE 1: A single test dataset
-def test_step(self, batch, batch_idx):
-    x, y = batch
-
-    # implement your own
-    out = self(x)
-    loss = self.loss(out, y)
-
-    # log 6 example images
-    # or generated text... or whatever
-    sample_imgs = x[:6]
-    grid = torchvision.utils.make_grid(sample_imgs)
-    self.logger.experiment.add_image('example_images', grid, 0)
-
-    # calculate acc
-    labels_hat = torch.argmax(out, dim=1)
-    test_acc = torch.sum(y == labels_hat).item() / (len(y) * 1.0)
-
-    # log the outputs!
-    self.log_dict({'test_loss': loss, 'test_acc': test_acc})
-
-
-

If you pass in multiple test dataloaders, test_step() will have an additional argument. We recommend -setting the default value of 0 so that you can quickly switch between single and multiple dataloaders.

-
# CASE 2: multiple test dataloaders
-def test_step(self, batch, batch_idx, dataloader_idx=0):
-    # dataloader_idx tells you which dataset this is.
-    ...
-
-
-
-

Note

-

If you don’t need to test you don’t need to implement this method.

-
-
-

Note

-

When the test_step() is called, the model has been put in eval mode and -PyTorch gradients have been disabled. At the end of the test epoch, the model goes back -to training mode and gradients are enabled.

-
-
- -
-
-

test_step_end

-
-
-LightningModule.test_step_end(*args, **kwargs)[source]
-

Use this when testing with dp or ddp2 because test_step() will operate on only part of the batch. -However, this is still optional and only needed for things like softmax or NCE loss.

-
-

Note

-

If you later switch to ddp or some other mode, this will still be called -so that you don’t have to change your code.

-
-
# pseudocode
-sub_batches = split_batches_for_dp(batch)
-step_output = [test_step(sub_batch) for sub_batch in sub_batches]
-test_step_end(step_output)
-
-
-
-
Parameters
-

step_output – What you return in test_step() for each batch part.

-
-
Return type
-

Union[Tensor, Dict[str, Any], None]

-
-
Returns
-

None or anything

-
-
-
# WITHOUT test_step_end
-# if used in DP or DDP2, this batch is 1/num_gpus large
-def test_step(self, batch, batch_idx):
-    # batch is 1/num_gpus big
-    x, y = batch
-
-    out = self(x)
-    loss = self.softmax(out)
-    self.log("test_loss", loss)
-
-
-# --------------
-# with test_step_end to do softmax over the full batch
-def test_step(self, batch, batch_idx):
-    # batch is 1/num_gpus big
-    x, y = batch
-
-    out = self.encoder(x)
-    return out
-
-
-def test_step_end(self, output_results):
-    # this out is now the full size of the batch
-    all_test_step_outs = output_results.out
-    loss = nce_loss(all_test_step_outs)
-    self.log("test_loss", loss)
-
-
-
-

See also

-

See the Multi GPU Training guide for more details.

-
-
- -
-
-

test_epoch_end

-
-
-LightningModule.test_epoch_end(outputs)[source]
-

Called at the end of a test epoch with the output of all test steps.

-
# the pseudocode for these calls
-test_outs = []
-for test_batch in test_data:
-    out = test_step(test_batch)
-    test_outs.append(out)
-test_epoch_end(test_outs)
-
-
-
-
Parameters
-

outputs (Union[List[Union[Tensor, Dict[str, Any]]], List[List[Union[Tensor, Dict[str, Any]]]]]) – List of outputs you defined in test_step_end(), or if there -are multiple dataloaders, a list containing a list of outputs for each dataloader

-
-
Return type
-

None

-
-
Returns
-

None

-
-
-
-

Note

-

If you didn’t define a test_step(), this won’t be called.

-
-

Examples

-

With a single dataloader:

-
def test_epoch_end(self, outputs):
-    # do something with the outputs of all test batches
-    all_test_preds = test_step_outputs.predictions
-
-    some_result = calc_all_results(all_test_preds)
-    self.log(some_result)
-
-
-

With multiple dataloaders, outputs will be a list of lists. The outer list contains -one entry per dataloader, while the inner list contains the individual outputs of -each test step for that dataloader.

-
def test_epoch_end(self, outputs):
-    final_value = 0
-    for dataloader_outputs in outputs:
-        for test_step_out in dataloader_outputs:
-            # do something
-            final_value += test_step_out
-
-    self.log("final_metric", final_value)
-
-
-
- -
-
-

to_onnx

-
-
-LightningModule.to_onnx(file_path, input_sample=None, **kwargs)[source]
-

Saves the model in ONNX format.

-
-
Parameters
-
    -
  • file_path (Union[str, Path]) – The path of the file the onnx model should be saved to.

  • -
  • input_sample (Optional[Any]) – An input for tracing. Default: None (Use self.example_input_array)

  • -
  • **kwargs – Will be passed to torch.onnx.export function.

  • -
-
-
-

Example

-
>>> class SimpleModel(LightningModule):
-...     def __init__(self):
-...         super().__init__()
-...         self.l1 = torch.nn.Linear(in_features=64, out_features=4)
-...
-...     def forward(self, x):
-...         return torch.relu(self.l1(x.view(x.size(0), -1)))
-
-
-
>>> with tempfile.NamedTemporaryFile(suffix='.onnx', delete=False) as tmpfile:
-...     model = SimpleModel()
-...     input_sample = torch.randn((1, 64))
-...     model.to_onnx(tmpfile.name, input_sample, export_params=True)
-...     os.path.isfile(tmpfile.name)
-True
-
-
-
- -
-
-

to_torchscript

-
-
-LightningModule.to_torchscript(file_path=None, method='script', example_inputs=None, **kwargs)[source]
-

By default compiles the whole model to a ScriptModule. If you want to use tracing, -please provide the argument method='trace' and make sure that either the example_inputs argument is -provided, or the model has example_input_array set. If you would like to customize the modules that -are scripted you should override this method. In case you want to return multiple modules, we recommend -using a dictionary.

-
-
Parameters
-
    -
  • file_path (Union[str, Path, None]) – Path where to save the torchscript. Default: None (no file saved).

  • -
  • method (Optional[str]) – Whether to use TorchScript’s script or trace method. Default: ‘script’

  • -
  • example_inputs (Optional[Any]) – An input to be used to do tracing when method is set to ‘trace’. -Default: None (uses example_input_array)

  • -
  • **kwargs – Additional arguments that will be passed to the torch.jit.script() or -torch.jit.trace() function.

  • -
-
-
-
-

Note

-
    -
  • Requires the implementation of the -forward() method.

  • -
  • The exported script will be set to evaluation mode.

  • -
  • It is recommended that you install the latest supported version of PyTorch -to use this feature without limitations. See also the torch.jit -documentation for supported features.

  • -
-
-

Example

-
>>> class SimpleModel(LightningModule):
-...     def __init__(self):
-...         super().__init__()
-...         self.l1 = torch.nn.Linear(in_features=64, out_features=4)
-...
-...     def forward(self, x):
-...         return torch.relu(self.l1(x.view(x.size(0), -1)))
-...
->>> model = SimpleModel()
->>> model.to_torchscript(file_path="model.pt")  
->>> os.path.isfile("model.pt")  
->>> torch.jit.save(model.to_torchscript(file_path="model_trace.pt", method='trace', 
-...                                     example_inputs=torch.randn(1, 64)))  
->>> os.path.isfile("model_trace.pt")  
-True
-
-
-
-
Return type
-

Union[ScriptModule, Dict[str, ScriptModule]]

-
-
Returns
-

This LightningModule as a torchscript, regardless of whether file_path is -defined or not.

-
-
-
- -
-
-

training_step

-
-
-LightningModule.training_step(*args, **kwargs)[source]
-

Here you compute and return the training loss and some additional metrics, e.g. for -the progress bar or logger.

-
-
Parameters
-
    -
  • batch (Tensor | (Tensor, …) | [Tensor, …]) – The output of your DataLoader. A tensor, tuple or list.

  • -
  • batch_idx (int) – Integer displaying index of this batch

  • -
  • optimizer_idx (int) – When using multiple optimizers, this argument will also be present.

  • -
  • hiddens (Any) – Passed in if -truncated_bptt_steps > 0.

  • -
-
-
Return type
-

Union[Tensor, Dict[str, Any]]

-
-
Returns
-

Any of:

-
    -
  • Tensor - The loss tensor

  • -
  • dict - A dictionary. Can include any keys, but must include the key 'loss'

  • -
  • -
    None - Training will skip to the next batch. This is only for automatic optimization.

    This is not supported for multi-GPU, TPU, IPU, or DeepSpeed.

    -
    -
    -
  • -
-

-
-
-

In this step you’d normally do the forward pass and calculate the loss for a batch. -You can also do fancier things like multiple forward passes or something model specific.

-

Example:

-
def training_step(self, batch, batch_idx):
-    x, y, z = batch
-    out = self.encoder(x)
-    loss = self.loss(out, x)
-    return loss
-
-
-

If you define multiple optimizers, this step will be called with an additional -optimizer_idx parameter.

-
# Multiple optimizers (e.g.: GANs)
-def training_step(self, batch, batch_idx, optimizer_idx):
-    if optimizer_idx == 0:
-        # do training_step with encoder
-        ...
-    if optimizer_idx == 1:
-        # do training_step with decoder
-        ...
-
-
-

If you add truncated back propagation through time you will also get an additional -argument with the hidden states of the previous step.

-
# Truncated back-propagation through time
-def training_step(self, batch, batch_idx, hiddens):
-    # hiddens are the hidden states from the previous truncated backprop step
-    out, hiddens = self.lstm(data, hiddens)
-    loss = ...
-    return {"loss": loss, "hiddens": hiddens}
-
-
-
-

Note

-

The loss value shown in the progress bar is smoothed (averaged) over the last values, -so it differs from the actual loss returned in train/validation step.

-
-
- -
-
-

training_step_end

-
-
-LightningModule.training_step_end(step_output)[source]
-

Use this when training with dp or ddp2 because training_step() will operate on only part of the -batch. However, this is still optional and only needed for things like softmax or NCE loss.

-
-

Note

-

If you later switch to ddp or some other mode, this will still be called -so that you don’t have to change your code.

-
-
# pseudocode
-sub_batches = split_batches_for_dp(batch)
-step_output = [training_step(sub_batch) for sub_batch in sub_batches]
-training_step_end(step_output)
-
-
-
-
Parameters
-

step_output (Union[Tensor, Dict[str, Any]]) – What you return in training_step for each batch part.

-
-
Return type
-

Union[Tensor, Dict[str, Any]]

-
-
Returns
-

Anything

-
-
-

When using dp/ddp2 distributed backends, only a portion of the batch is inside the training_step:

-
def training_step(self, batch, batch_idx):
-    # batch is 1/num_gpus big
-    x, y = batch
-
-    out = self(x)
-
-    # softmax uses only a portion of the batch in the denominator
-    loss = self.softmax(out)
-    loss = nce_loss(loss)
-    return loss
-
-
-

If you wish to do something with all the parts of the batch, then use this method to do it:

-
def training_step(self, batch, batch_idx):
-    # batch is 1/num_gpus big
-    x, y = batch
-
-    out = self.encoder(x)
-    return {"pred": out}
-
-
-def training_step_end(self, training_step_outputs):
-    gpu_0_pred = training_step_outputs[0]["pred"]
-    gpu_1_pred = training_step_outputs[1]["pred"]
-    gpu_n_pred = training_step_outputs[n]["pred"]
-
-    # this softmax now uses the full batch
-    loss = nce_loss([gpu_0_pred, gpu_1_pred, gpu_n_pred])
-    return loss
-
-
-
-

See also

-

See the accelerators/gpu:Multi GPU Training guide for more details.

-
-
- -
-
-

training_epoch_end

-
-
-LightningModule.training_epoch_end(outputs)[source]
-

Called at the end of the training epoch with the outputs of all training steps. Use this in case you -need to do something with all the outputs returned by training_step().

-
# the pseudocode for these calls
-train_outs = []
-for train_batch in train_data:
-    out = training_step(train_batch)
-    train_outs.append(out)
-training_epoch_end(train_outs)
-
-
-
-
Parameters
-

outputs (List[Union[Tensor, Dict[str, Any]]]) – List of outputs you defined in training_step(). If there are multiple optimizers or when -using truncated_bptt_steps > 0, the lists have the dimensions -(n_batches, tbptt_steps, n_optimizers). Dimensions of length 1 are squeezed.

-
-
Return type
-

None

-
-
Returns
-

None

-
-
-
-

Note

-

If this method is not overridden, this won’t be called.

-
-
def training_epoch_end(self, training_step_outputs):
-    # do something with all training_step outputs
-    for out in training_step_outputs:
-        ...
-
-
-
- -
-
-

unfreeze

-
-
-LightningModule.unfreeze()[source]
-

Unfreeze all parameters for training.

-
model = MyLightningModule(...)
-model.unfreeze()
-
-
-
-
Return type
-

None

-
-
-
- -
-
-

untoggle_optimizer

-
-
-LightningModule.untoggle_optimizer(optimizer_idx)[source]
-

Resets the state of required gradients that were toggled with toggle_optimizer().

-

This is only called automatically when automatic optimization is enabled and multiple optimizers are used.

-
-
Parameters
-

optimizer_idx (int) – The index of the optimizer to untoggle.

-
-
Return type
-

None

-
-
-
- -
-
-

validation_step

-
-
-LightningModule.validation_step(*args, **kwargs)[source]
-

Operates on a single batch of data from the validation set. -In this step you might generate examples or calculate anything of interest, like accuracy.

-
# the pseudocode for these calls
-val_outs = []
-for val_batch in val_data:
-    out = validation_step(val_batch)
-    val_outs.append(out)
-validation_epoch_end(val_outs)
-
-
-
-
Parameters
-
    -
  • batch – The output of your DataLoader.

  • -
  • batch_idx – The index of this batch.

  • -
  • dataloader_idx – The index of the dataloader that produced this batch. -(only if multiple val dataloaders used)

  • -
-
-
Return type
-

Union[Tensor, Dict[str, Any], None]

-
-
Returns
-

    -
  • Any object or value

  • -
  • None - Validation will skip to the next batch

  • -
-

-
-
-
# pseudocode of order
-val_outs = []
-for val_batch in val_data:
-    out = validation_step(val_batch)
-    if defined("validation_step_end"):
-        out = validation_step_end(out)
-    val_outs.append(out)
-val_outs = validation_epoch_end(val_outs)
-
-
-
# if you have one val dataloader:
-def validation_step(self, batch, batch_idx):
-    ...
-
-
-# if you have multiple val dataloaders:
-def validation_step(self, batch, batch_idx, dataloader_idx=0):
-    ...
-
-
-

Examples:

-
# CASE 1: A single validation dataset
-def validation_step(self, batch, batch_idx):
-    x, y = batch
-
-    # implement your own
-    out = self(x)
-    loss = self.loss(out, y)
-
-    # log 6 example images
-    # or generated text... or whatever
-    sample_imgs = x[:6]
-    grid = torchvision.utils.make_grid(sample_imgs)
-    self.logger.experiment.add_image('example_images', grid, 0)
-
-    # calculate acc
-    labels_hat = torch.argmax(out, dim=1)
-    val_acc = torch.sum(y == labels_hat).item() / (len(y) * 1.0)
-
-    # log the outputs!
-    self.log_dict({'val_loss': loss, 'val_acc': val_acc})
-
-
-

If you pass in multiple val dataloaders, validation_step() will have an additional argument. We recommend -setting the default value of 0 so that you can quickly switch between single and multiple dataloaders.

-
# CASE 2: multiple validation dataloaders
-def validation_step(self, batch, batch_idx, dataloader_idx=0):
-    # dataloader_idx tells you which dataset this is.
-    ...
-
-
-
-

Note

-

If you don’t need to validate you don’t need to implement this method.

-
-
-

Note

-

When the validation_step() is called, the model has been put in eval mode -and PyTorch gradients have been disabled. At the end of validation, -the model goes back to training mode and gradients are enabled.

-
-
- -
-
-

validation_step_end

-
-
-LightningModule.validation_step_end(*args, **kwargs)[source]
-

Use this when validating with dp or ddp2 because validation_step() will operate on only part of -the batch. However, this is still optional and only needed for things like softmax or NCE loss.

-
-

Note

-

If you later switch to ddp or some other mode, this will still be called -so that you don’t have to change your code.

-
-
# pseudocode
-sub_batches = split_batches_for_dp(batch)
-step_output = [validation_step(sub_batch) for sub_batch in sub_batches]
-validation_step_end(step_output)
-
-
-
-
Parameters
-

step_output – What you return in validation_step() for each batch part.

-
-
Return type
-

Union[Tensor, Dict[str, Any], None]

-
-
Returns
-

None or anything

-
-
-
# WITHOUT validation_step_end
-# if used in DP or DDP2, this batch is 1/num_gpus large
-def validation_step(self, batch, batch_idx):
-    # batch is 1/num_gpus big
-    x, y = batch
-
-    out = self.encoder(x)
-    loss = self.softmax(out)
-    loss = nce_loss(loss)
-    self.log("val_loss", loss)
-
-
-# --------------
-# with validation_step_end to do softmax over the full batch
-def validation_step(self, batch, batch_idx):
-    # batch is 1/num_gpus big
-    x, y = batch
-
-    out = self(x)
-    return out
-
-
-def validation_step_end(self, val_step_outputs):
-    for out in val_step_outputs:
-        ...
-
-
-
-

See also

-

See the accelerators/gpu:Multi GPU Training guide for more details.

-
-
- -
-
-

validation_epoch_end

-
-
-LightningModule.validation_epoch_end(outputs)[source]
-

Called at the end of the validation epoch with the outputs of all validation steps.

-
# the pseudocode for these calls
-val_outs = []
-for val_batch in val_data:
-    out = validation_step(val_batch)
-    val_outs.append(out)
-validation_epoch_end(val_outs)
-
-
-
-
Parameters
-

outputs (Union[List[Union[Tensor, Dict[str, Any]]], List[List[Union[Tensor, Dict[str, Any]]]]]) – List of outputs you defined in validation_step(), or if there -are multiple dataloaders, a list containing a list of outputs for each dataloader.

-
-
Return type
-

None

-
-
Returns
-

None

-
-
-
-

Note

-

If you didn’t define a validation_step(), this won’t be called.

-
-

Examples

-

With a single dataloader:

-
def validation_epoch_end(self, val_step_outputs):
-    for out in val_step_outputs:
-        ...
-
-
-

With multiple dataloaders, outputs will be a list of lists. The outer list contains -one entry per dataloader, while the inner list contains the individual outputs of -each validation step for that dataloader.

-
def validation_epoch_end(self, outputs):
-    for dataloader_output_result in outputs:
-        dataloader_outs = dataloader_output_result.dataloader_i_outputs
-
-    self.log("final_metric", final_value)
-
-
-
- -
-
-
-
-

Properties

-

These are properties available in a LightningModule.

-
-

current_epoch

-

The number of epochs run.

-
def training_step(self, batch, batch_idx):
-    if self.current_epoch == 0:
-        ...
-
-
-
-
-

device

-

The device the module is on. Use it to keep your code device agnostic.

-
def training_step(self, batch, batch_idx):
-    z = torch.rand(2, 3, device=self.device)
-
-
-
-
-

global_rank

-

The global_rank is the index of the current process across all nodes and devices. -Lightning will perform some operations such as logging, weight checkpointing only when global_rank=0. You -usually do not need to use this property, but it is useful to know how to access it if needed.

-
def training_step(self, batch, batch_idx):
-    if self.global_rank == 0:
-        # do something only once across all the nodes
-        ...
-
-
-
-
-

global_step

-

The number of optimizer steps taken (does not reset each epoch). -This includes multiple optimizers and TBPTT steps (if enabled).

-
def training_step(self, batch, batch_idx):
-    self.logger.experiment.log_image(..., step=self.global_step)
-
-
-
-
-

hparams

-

The arguments passed through LightningModule.__init__() and saved by calling -save_hyperparameters() can be accessed through the hparams attribute.

-
def __init__(self, learning_rate):
-    self.save_hyperparameters()
-
-
-def configure_optimizers(self):
-    return Adam(self.parameters(), lr=self.hparams.learning_rate)
-
-
-
-
-

logger

-

The current logger being used (tensorboard or other supported logger)

-
def training_step(self, batch, batch_idx):
-    # the generic logger (same no matter if tensorboard or other supported logger)
-    self.logger
-
-    # the particular logger
-    tensorboard_logger = self.logger.experiment
-
-
-
-
-

loggers

-

The list of loggers currently being used by the Trainer.

-
def training_step(self, batch, batch_idx):
-    # List of Logger objects
-    loggers = self.loggers
-    for logger in loggers:
-        logger.log_metrics({"foo": 1.0})
-
-
-
-
-

local_rank

-

The local_rank is the index of the current process across all the devices for the current node. -You usually do not need to use this property, but it is useful to know how to access it if needed. -For example, if using 10 machines (or nodes), the GPU at index 0 on each machine has local_rank = 0.

-
def training_step(self, batch, batch_idx):
-    if self.local_rank == 0:
-        # do something only once across each node
-        ...
-
-
-
-
-

precision

-

The type of precision used:

-
def training_step(self, batch, batch_idx):
-    if self.precision == 16:
-        ...
-
-
-
-
-

trainer

-

Pointer to the trainer

-
def training_step(self, batch, batch_idx):
-    max_steps = self.trainer.max_steps
-    any_flag = self.trainer.any_flag
-
-
-
-
-

prepare_data_per_node

-

If set to True will call prepare_data() on LOCAL_RANK=0 for every node. -If set to False will only call from NODE_RANK=0, LOCAL_RANK=0.

-
class LitModel(LightningModule):
-    def __init__(self):
-        super().__init__()
-        self.prepare_data_per_node = True
-
-
-
-
-

automatic_optimization

-

When set to False, Lightning does not automate the optimization process. This means you are responsible for handling -your optimizers. However, we do take care of precision and any accelerators used.

-

See manual optimization for details.

-
def __init__(self):
-    self.automatic_optimization = False
-
-
-def training_step(self, batch, batch_idx):
-    opt = self.optimizers(use_pl_optimizer=True)
-
-    loss = ...
-    opt.zero_grad()
-    self.manual_backward(loss)
-    opt.step()
-
-
-

This is recommended only if using 2+ optimizers AND if you know how to perform the optimization procedure properly. Note -that automatic optimization can still be used with multiple optimizers by relying on the optimizer_idx parameter. -Manual optimization is most useful for research topics like reinforcement learning, sparse coding, and GAN research.

-
def __init__(self):
-    self.automatic_optimization = False
-
-
-def training_step(self, batch, batch_idx):
-    # access your optimizers with use_pl_optimizer=False. Default is True
-    opt_a, opt_b = self.optimizers(use_pl_optimizer=True)
-
-    gen_loss = ...
-    opt_a.zero_grad()
-    self.manual_backward(gen_loss)
-    opt_a.step()
-
-    disc_loss = ...
-    opt_b.zero_grad()
-    self.manual_backward(disc_loss)
-    opt_b.step()
-
-
-
-
-

example_input_array

-

Set and access example_input_array, which basically represents a single batch.

-
def __init__(self):
-    self.example_input_array = ...
-    self.generator = ...
-
-
-def on_train_epoch_end(self):
-    # generate some images using the example_input_array
-    gen_images = self.generator(self.example_input_array)
-
-
-
-
-

truncated_bptt_steps

-

Truncated Backpropagation Through Time (TBPTT) performs backpropagation every k steps of -a much longer sequence. This is made possible by passing training batches -split along the time dimension into splits of size k to the -training_step. In order to keep the same forward propagation behavior, all -hidden states should be kept in-between each time-dimension split.

-

If this is enabled, your batches will automatically get truncated -and the Trainer will apply Truncated Backprop to it.

-

(Williams et al. “An efficient gradient-based algorithm for on-line training of -recurrent network trajectories.”)

-

Tutorial

-
from pytorch_lightning import LightningModule
-
-
-class MyModel(LightningModule):
-    def __init__(self, input_size, hidden_size, num_layers):
-        super().__init__()
-        # batch_first has to be set to True
-        self.lstm = nn.LSTM(
-            input_size=input_size,
-            hidden_size=hidden_size,
-            num_layers=num_layers,
-            batch_first=True,
-        )
-
-        ...
-
-        # Important: This property activates truncated backpropagation through time
-        # Setting this value to 2 splits the batch into sequences of size 2
-        self.truncated_bptt_steps = 2
-
-    # Truncated back-propagation through time
-    def training_step(self, batch, batch_idx, hiddens):
-        x, y = batch
-
-        # the training step must be updated to accept a ``hiddens`` argument
-        # hiddens are the hiddens from the previous truncated backprop step
-        out, hiddens = self.lstm(x, hiddens)
-
-        ...
-
-        return {"loss": ..., "hiddens": hiddens}
-
-
-

Lightning takes care of splitting your batch along the time-dimension. It is -assumed to be the second dimension of your batches. Therefore, in the -example above, we have set batch_first=True.

-
# we use the second as the time dimension
-# (batch, time, ...)
-sub_batch = batch[0, 0:t, ...]
-
-
-

To modify how the batch is split, -override the pytorch_lightning.core.lightning.LightningModule.tbptt_split_batch() method:

-
class LitMNIST(LightningModule):
-    def tbptt_split_batch(self, batch, split_size):
-        # do your own splitting on the batch
-        return splits
-
-
-
-
-
-
-

Hooks

-

This is the pseudocode to describe the structure of fit(). -The inputs and outputs of each function are not represented for simplicity. Please check each function’s API reference -for more information.

-
def fit(self):
-    if global_rank == 0:
-        # prepare data is called on GLOBAL_ZERO only
-        prepare_data()
-
-    configure_callbacks()
-
-    with parallel(devices):
-        # devices can be GPUs, TPUs, ...
-        train_on_device(model)
-
-
-def train_on_device(model):
-    # called PER DEVICE
-    on_fit_start()
-    setup("fit")
-    configure_optimizers()
-
-    # the sanity check runs here
-
-    on_train_start()
-    for epoch in epochs:
-        fit_loop()
-    on_train_end()
-
-    on_fit_end()
-    teardown("fit")
-
-
-def fit_loop():
-    on_train_epoch_start()
-
-    for batch in train_dataloader():
-        on_train_batch_start()
-
-        on_before_batch_transfer()
-        transfer_batch_to_device()
-        on_after_batch_transfer()
-
-        training_step()
-
-        on_before_zero_grad()
-        optimizer_zero_grad()
-
-        on_before_backward()
-        backward()
-        on_after_backward()
-
-        on_before_optimizer_step()
-        configure_gradient_clipping()
-        optimizer_step()
-
-        on_train_batch_end()
-
-        if should_check_val:
-            val_loop()
-    # end training epoch
-    training_epoch_end()
-
-    on_train_epoch_end()
-
-
-def val_loop():
-    on_validation_model_eval()  # calls `model.eval()`
-    torch.set_grad_enabled(False)
-
-    on_validation_start()
-    on_validation_epoch_start()
-
-    val_outs = []
-    for batch_idx, batch in enumerate(val_dataloader()):
-        on_validation_batch_start(batch, batch_idx)
-
-        batch = on_before_batch_transfer(batch)
-        batch = transfer_batch_to_device(batch)
-        batch = on_after_batch_transfer(batch)
-
-        out = validation_step(batch, batch_idx)
-
-        on_validation_batch_end(batch, batch_idx)
-        val_outs.append(out)
-
-    validation_epoch_end(val_outs)
-
-    on_validation_epoch_end()
-    on_validation_end()
-
-    # set up for train
-    on_validation_model_train()  # calls `model.train()`
-    torch.set_grad_enabled(True)
-
-
-
-

backward

-
-
-LightningModule.backward(loss, optimizer, optimizer_idx, *args, **kwargs)[source]
-

Called to perform backward on the loss returned in training_step(). Override this hook with your -own implementation if you need to.

-
-
Parameters
-
    -
  • loss (Tensor) – The loss tensor returned by training_step(). If gradient accumulation is used, the loss here -holds the normalized value (scaled by 1 / accumulation steps).

  • -
  • optimizer (Optional[Optimizer]) – Current optimizer being used. None if using manual optimization.

  • -
  • optimizer_idx (Optional[int]) – Index of the current optimizer being used. None if using manual optimization.

  • -
-
-
-

Example:

-
def backward(self, loss, optimizer, optimizer_idx):
-    loss.backward()
-
-
-
-
Return type
-

None

-
-
-
- -
-
-

on_before_backward

-
-
-LightningModule.on_before_backward(loss)
-

Called before loss.backward().

-
-
Parameters
-

loss (Tensor) – Loss divided by number of batches for gradient accumulation and scaled if using native AMP.

-
-
Return type
-

None

-
-
-
- -
-
-

on_after_backward

-
-
-LightningModule.on_after_backward()
-

Called after loss.backward() and before optimizers are stepped.

-
-

Note

-

If using native AMP, the gradients will not be unscaled at this point. -Use the on_before_optimizer_step if you need the unscaled gradients.

-
-
-
Return type
-

None

-
-
-
- -
-
-

on_before_zero_grad

-
-
-LightningModule.on_before_zero_grad(optimizer)
-

Called after training_step() and before optimizer.zero_grad().

-

Called in the training loop after taking an optimizer step and before zeroing grads. -Good place to inspect weight information with weights updated.

-

This is where it is called:

-
for optimizer in optimizers:
-    out = training_step(...)
-
-    model.on_before_zero_grad(optimizer) # < ---- called here
-    optimizer.zero_grad()
-
-    backward()
-
-
-
-
Parameters
-

optimizer (Optimizer) – The optimizer for which grads should be zeroed.

-
-
Return type
-

None

-
-
-
- -
-
-

on_fit_start

-
-
-LightningModule.on_fit_start()
-

Called at the very beginning of fit.

-

If on DDP it is called on every process

-
-
Return type
-

None

-
-
-
- -
-
-

on_fit_end

-
-
-LightningModule.on_fit_end()
-

Called at the very end of fit.

-

If on DDP it is called on every process

-
-
Return type
-

None

-
-
-
- -
-
-

on_load_checkpoint

-
-
-LightningModule.on_load_checkpoint(checkpoint)
-

Called by Lightning to restore your model. -If you saved something with on_save_checkpoint() this is your chance to restore this.

-
-
Parameters
-

checkpoint (Dict[str, Any]) – Loaded checkpoint

-
-
-

Example:

-
def on_load_checkpoint(self, checkpoint):
-    # 99% of the time you don't need to implement this method
-    self.something_cool_i_want_to_save = checkpoint['something_cool_i_want_to_save']
-
-
-
-

Note

-

Lightning auto-restores global step, epoch, and train state including amp scaling. -There is no need for you to restore anything regarding training.

-
-
-
Return type
-

None

-
-
-
- -
-
-

on_save_checkpoint

-
-
-LightningModule.on_save_checkpoint(checkpoint)
-

Called by Lightning when saving a checkpoint to give you a chance to store anything -else you might want to save.

-
-
Parameters
-

checkpoint (Dict[str, Any]) – The full checkpoint dictionary before it gets dumped to a file. -Implementations of this hook can insert additional data into this dictionary.

-
-
-

Example:

-
def on_save_checkpoint(self, checkpoint):
-    # 99% of use cases you don't need to implement this method
-    checkpoint['something_cool_i_want_to_save'] = my_cool_pickable_object
-
-
-
-

Note

-

Lightning saves all aspects of training (epoch, global step, etc…) -including amp scaling. -There is no need for you to store anything about training.

-
-
-
Return type
-

None

-
-
-
- -
-
-

load_from_checkpoint

-
-
-classmethod LightningModule.load_from_checkpoint(checkpoint_path, map_location=None, hparams_file=None, strict=True, **kwargs)
-

Primary way of loading a model from a checkpoint. When Lightning saves a checkpoint -it stores the arguments passed to __init__ in the checkpoint under "hyper_parameters".

-

Any arguments specified through **kwargs will override args stored in "hyper_parameters".

-
-
Parameters
-
    -
  • checkpoint_path (Union[str, IO]) – Path to checkpoint. This can also be a URL, or file-like object

  • -
  • map_location (Union[Dict[str, str], str, device, int, Callable, None]) – If your checkpoint saved a GPU model and you now load on CPUs -or a different number of GPUs, use this to map to the new setup. -The behaviour is the same as in torch.load().

  • -
  • hparams_file (Optional[str]) –

    Optional path to a .yaml file with hierarchical structure -as in this example:

    -
    drop_prob: 0.2
    -dataloader:
    -    batch_size: 32
    -
    -
    -

    You most likely won’t need this since Lightning will always save the hyperparameters -to the checkpoint. -However, if your checkpoint weights don’t have the hyperparameters saved, -use this method to pass in a .yaml file with the hparams you’d like to use. -These will be converted into a dict and passed into your -LightningModule for use.

    -

    If your model’s hparams argument is Namespace -and .yaml file has hierarchical structure, you need to refactor your model to treat -hparams as dict.

    -

  • -
  • strict (bool) – Whether to strictly enforce that the keys in checkpoint_path match the keys -returned by this module’s state dict.

  • -
  • kwargs – Any extra keyword args needed to init the model. Can also be used to override saved -hyperparameter values.

  • -
-
-
Returns
-

LightningModule instance with loaded weights and hyperparameters (if available).

-
-
-
-

Note

-

load_from_checkpoint is a class method. You should use your LightningModule -class to call it instead of the LightningModule instance.

-
-

Example:

-
# load weights without mapping ...
-model = MyLightningModule.load_from_checkpoint('path/to/checkpoint.ckpt')
-
-# or load weights mapping all weights from GPU 1 to GPU 0 ...
-map_location = {'cuda:1':'cuda:0'}
-model = MyLightningModule.load_from_checkpoint(
-    'path/to/checkpoint.ckpt',
-    map_location=map_location
-)
-
-# or load weights and hyperparameters from separate files.
-model = MyLightningModule.load_from_checkpoint(
-    'path/to/checkpoint.ckpt',
-    hparams_file='/path/to/hparams_file.yaml'
-)
-
-# override some of the params with new values
-model = MyLightningModule.load_from_checkpoint(
-    PATH,
-    num_layers=128,
-    pretrained_ckpt_path=NEW_PATH,
-)
-
-# predict
-pretrained_model.eval()
-pretrained_model.freeze()
-y_hat = pretrained_model(x)
-
-
-
- -
-
-

on_hpc_save

-
-
-LightningModule.on_hpc_save(checkpoint)
-

Hook to do whatever you need right before Slurm manager saves the model.

-
-
Parameters
-

checkpoint (Dict[str, Any]) – A dictionary in which you can save variables to save in a checkpoint. -Contents need to be pickleable.

-
-
-
-

Deprecated since version v1.6: This method is deprecated in v1.6 and will be removed in v1.8. -Please use LightningModule.on_save_checkpoint instead.

-
-
-
Return type
-

None

-
-
-
- -
-
-

on_hpc_load

-
-
-LightningModule.on_hpc_load(checkpoint)
-

Hook to do whatever you need right before Slurm manager loads the model.

-
-
Parameters
-

checkpoint (Dict[str, Any]) – A dictionary with variables from the checkpoint.

-
-
-
-

Deprecated since version v1.6: This method is deprecated in v1.6 and will be removed in v1.8. -Please use LightningModule.on_load_checkpoint instead.

-
-
-
Return type
-

None

-
-
-
- -
-
-

on_train_start

-
-
-LightningModule.on_train_start()
-

Called at the beginning of training after sanity check.

-
-
Return type
-

None

-
-
-
- -
-
-

on_train_end

-
-
-LightningModule.on_train_end()
-

Called at the end of training before logger experiment is closed.

-
-
Return type
-

None

-
-
-
- -
-
-

on_validation_start

-
-
-LightningModule.on_validation_start()
-

Called at the beginning of validation.

-
-
Return type
-

None

-
-
-
- -
-
-

on_validation_end

-
-
-LightningModule.on_validation_end()
-

Called at the end of validation.

-
-
Return type
-

None

-
-
-
- -
-
-

on_test_batch_start

-
-
-LightningModule.on_test_batch_start(batch, batch_idx, dataloader_idx)
-

Called in the test loop before anything happens for that batch.

-
-
Parameters
-
    -
  • batch (Any) – The batched data as it is returned by the test DataLoader.

  • -
  • batch_idx (int) – the index of the batch

  • -
  • dataloader_idx (int) – the index of the dataloader

  • -
-
-
Return type
-

None

-
-
-
- -
-
-

on_test_batch_end

-
-
-LightningModule.on_test_batch_end(outputs, batch, batch_idx, dataloader_idx)
-

Called in the test loop after the batch.

-
-
Parameters
-
    -
  • outputs (Union[Tensor, Dict[str, Any], None]) – The outputs of test_step_end(test_step(x))

  • -
  • batch (Any) – The batched data as it is returned by the test DataLoader.

  • -
  • batch_idx (int) – the index of the batch

  • -
  • dataloader_idx (int) – the index of the dataloader

  • -
-
-
Return type
-

None

-
-
-
- -
-
-

on_test_epoch_start

-
-
-LightningModule.on_test_epoch_start()
-

Called in the test loop at the very beginning of the epoch.

-
-
Return type
-

None

-
-
-
- -
-
-

on_test_epoch_end

-
-
-LightningModule.on_test_epoch_end()
-

Called in the test loop at the very end of the epoch.

-
-
Return type
-

None

-
-
-
- -
-
-

on_test_start

-
-
-LightningModule.on_test_start()
-

Called at the beginning of testing.

-
-
Return type
-

None

-
-
-
- -
-
-

on_test_end

-
-
-LightningModule.on_test_end()
-

Called at the end of testing.

-
-
Return type
-

None

-
-
-
- -
-
-

on_predict_batch_start

-
-
-LightningModule.on_predict_batch_start(batch, batch_idx, dataloader_idx)
-

Called in the predict loop before anything happens for that batch.

-
-
Parameters
-
    -
  • batch (Any) – The batched data as it is returned by the test DataLoader.

  • -
  • batch_idx (int) – the index of the batch

  • -
  • dataloader_idx (int) – the index of the dataloader

  • -
-
-
Return type
-

None

-
-
-
- -
-
-

on_predict_batch_end

-
-
-LightningModule.on_predict_batch_end(outputs, batch, batch_idx, dataloader_idx)
-

Called in the predict loop after the batch.

-
-
Parameters
-
    -
  • outputs (Optional[Any]) – The outputs of predict_step_end(test_step(x))

  • -
  • batch (Any) – The batched data as it is returned by the test DataLoader.

  • -
  • batch_idx (int) – the index of the batch

  • -
  • dataloader_idx (int) – the index of the dataloader

  • -
-
-
Return type
-

None

-
-
-
- -
-
-

on_predict_epoch_start

-
-
-LightningModule.on_predict_epoch_start()
-

Called at the beginning of predicting.

-
-
Return type
-

None

-
-
-
- -
-
-

on_predict_epoch_end

-
-
-LightningModule.on_predict_epoch_end(results)
-

Called at the end of predicting.

-
-
Return type
-

None

-
-
-
- -
-
-

on_predict_start

-
-
-LightningModule.on_predict_start()
-

Called at the beginning of predicting.

-
-
Return type
-

None

-
-
-
- -
-
-

on_predict_end

-
-
-LightningModule.on_predict_end()
-

Called at the end of predicting.

-
-
Return type
-

None

-
-
-
- -
-
-

on_train_batch_start

-
-
-LightningModule.on_train_batch_start(batch, batch_idx, unused=0)
-

Called in the training loop before anything happens for that batch.

-

If you return -1 here, you will skip training for the rest of the current epoch.

-
-
Parameters
-
    -
  • batch (Any) – The batched data as it is returned by the training DataLoader.

  • -
  • batch_idx (int) – the index of the batch

  • -
  • unused (int) – Deprecated argument. Will be removed in v1.7.

  • -
-
-
Return type
-

Optional[int]

-
-
-
- -
-
-

on_train_batch_end

-
-
-LightningModule.on_train_batch_end(outputs, batch, batch_idx, unused=0)
-

Called in the training loop after the batch.

-
-
Parameters
-
    -
  • outputs (Union[Tensor, Dict[str, Any]]) – The outputs of training_step_end(training_step(x))

  • -
  • batch (Any) – The batched data as it is returned by the training DataLoader.

  • -
  • batch_idx (int) – the index of the batch

  • -
  • unused (int) – Deprecated argument. Will be removed in v1.7.

  • -
-
-
Return type
-

None

-
-
-
- -
-
-

on_train_epoch_start

-
-
-LightningModule.on_train_epoch_start()
-

Called in the training loop at the very beginning of the epoch.

-
-
Return type
-

None

-
-
-
- -
-
-

on_train_epoch_end

-
-
-LightningModule.on_train_epoch_end()
-

Called in the training loop at the very end of the epoch.

-

To access all batch outputs at the end of the epoch, either:

-
    -
  1. Implement training_epoch_end in the LightningModule OR

  2. -
  3. Cache data across steps on the attribute(s) of the LightningModule and access them in this hook

  4. -
-
-
Return type
-

None

-
-
-
- -
-
-

on_validation_batch_start

-
-
-LightningModule.on_validation_batch_start(batch, batch_idx, dataloader_idx)
-

Called in the validation loop before anything happens for that batch.

-
-
Parameters
-
    -
  • batch (Any) – The batched data as it is returned by the validation DataLoader.

  • -
  • batch_idx (int) – the index of the batch

  • -
  • dataloader_idx (int) – the index of the dataloader

  • -
-
-
Return type
-

None

-
-
-
- -
-
-

on_validation_batch_end

-
-
-LightningModule.on_validation_batch_end(outputs, batch, batch_idx, dataloader_idx)
-

Called in the validation loop after the batch.

-
-
Parameters
-
    -
  • outputs (Union[Tensor, Dict[str, Any], None]) – The outputs of validation_step_end(validation_step(x))

  • -
  • batch (Any) – The batched data as it is returned by the validation DataLoader.

  • -
  • batch_idx (int) – the index of the batch

  • -
  • dataloader_idx (int) – the index of the dataloader

  • -
-
-
Return type
-

None

-
-
-
- -
-
-

on_validation_epoch_start

-
-
-LightningModule.on_validation_epoch_start()
-

Called in the validation loop at the very beginning of the epoch.

-
-
Return type
-

None

-
-
-
- -
-
-

on_validation_epoch_end

-
-
-LightningModule.on_validation_epoch_end()
-

Called in the validation loop at the very end of the epoch.

-
-
Return type
-

None

-
-
-
- -
-
-

on_post_move_to_device

-
-
-LightningModule.on_post_move_to_device()
-

Called in the parameter_validation decorator after -to() is called. This is a good place to tie weights between -modules after moving them to a device. Can be used when training models with weight sharing properties on -TPU.

-

Addresses the handling of shared weights on TPU: -https://github.com/pytorch/xla/blob/master/TROUBLESHOOTING.md#xla-tensor-quirks

-

Example:

-
def on_post_move_to_device(self):
-    self.decoder.weight = self.encoder.weight
-
-
-
-
Return type
-

None

-
-
-
- -
-
-

configure_sharded_model

-
-
-LightningModule.configure_sharded_model()
-

Hook to create modules in a distributed-aware context. This is useful when using sharded plugins, -where we’d like to shard the model instantly, which is useful for extremely large models which can save -memory and initialization time.

-

This hook is called during each of fit/val/test/predict stages in the same process, so ensure that -the implementation of this hook is idempotent.

-
-
Return type
-

None

-
-
-
- -
-
-

on_validation_model_eval

-
-
-LightningModule.on_validation_model_eval()
-

Sets the model to eval during the val loop.

-
-
Return type
-

None

-
-
-
- -
-
-

on_validation_model_train

-
-
-LightningModule.on_validation_model_train()
-

Sets the model to train during the val loop.

-
-
Return type
-

None

-
-
-
- -
-
-

on_test_model_eval

-
-
-LightningModule.on_test_model_eval()
-

Sets the model to eval during the test loop.

-
-
Return type
-

None

-
-
-
- -
-
-

on_test_model_train

-
-
-LightningModule.on_test_model_train()
-

Sets the model to train during the test loop.

-
-
Return type
-

None

-
-
-
- -
-
-

on_before_optimizer_step

-
-
-LightningModule.on_before_optimizer_step(optimizer, optimizer_idx)
-

Called before optimizer.step().

-

If using gradient accumulation, the hook is called once the gradients have been accumulated. -See: accumulate_grad_batches.

-

If using native AMP, the loss will be unscaled before calling this hook. -See these docs -for more information on the scaling of gradients.

-

If clipping gradients, the gradients will not have been clipped yet.

-
-
Parameters
-
    -
  • optimizer (Optimizer) – Current optimizer being used.

  • -
  • optimizer_idx (int) – Index of the current optimizer being used.

  • -
-
-
-

Example:

-
def on_before_optimizer_step(self, optimizer, optimizer_idx):
-    # example to inspect gradient information in tensorboard
-    if self.trainer.global_step % 25 == 0:  # don't make the tf file huge
-        for k, v in self.named_parameters():
-            self.logger.experiment.add_histogram(
-                tag=k, values=v.grad, global_step=self.trainer.global_step
-            )
-
-
-
-
Return type
-

None

-
-
-
- -
-
-

configure_gradient_clipping

-
-
-LightningModule.configure_gradient_clipping(optimizer, optimizer_idx, gradient_clip_val=None, gradient_clip_algorithm=None)[source]
-

Perform gradient clipping for the optimizer parameters. Called before optimizer_step().

-
-
Parameters
-
    -
  • optimizer (Optimizer) – Current optimizer being used.

  • -
  • optimizer_idx (int) – Index of the current optimizer being used.

  • -
  • gradient_clip_val (Union[int, float, None]) – The value at which to clip gradients. By default value passed in Trainer -will be available here.

  • -
  • gradient_clip_algorithm (Optional[str]) – The gradient clipping algorithm to use. By default value -passed in Trainer will be available here.

  • -
-
-
-

Example:

-
# Perform gradient clipping on gradients associated with discriminator (optimizer_idx=1) in GAN
-def configure_gradient_clipping(self, optimizer, optimizer_idx, gradient_clip_val, gradient_clip_algorithm):
-    if optimizer_idx == 1:
-        # Lightning will handle the gradient clipping
-        self.clip_gradients(
-            optimizer,
-            gradient_clip_val=gradient_clip_val,
-            gradient_clip_algorithm=gradient_clip_algorithm
-        )
-    else:
-        # implement your own custom logic to clip gradients for generator (optimizer_idx=0)
-
-
-
- -
-
-

optimizer_step

-
-
-LightningModule.optimizer_step(epoch, batch_idx, optimizer, optimizer_idx=0, optimizer_closure=None, on_tpu=False, using_native_amp=False, using_lbfgs=False)[source]
-

Override this method to adjust the default way the Trainer calls -each optimizer.

-

By default, Lightning calls step() and zero_grad() as shown in the example once per optimizer. -This method (and zero_grad()) won’t be called during the accumulation phase when -Trainer(accumulate_grad_batches != 1). Overriding this hook has no benefit with manual optimization.

-
-
Parameters
-
    -
  • epoch (int) – Current epoch

  • -
  • batch_idx (int) – Index of current batch

  • -
  • optimizer (Union[Optimizer, LightningOptimizer]) – A PyTorch optimizer

  • -
  • optimizer_idx (int) – If you used multiple optimizers, this indexes into that list.

  • -
  • optimizer_closure (Optional[Callable[[], Any]]) – The optimizer closure. This closure must be executed as it includes the -calls to training_step(), optimizer.zero_grad(), and backward().

  • -
  • on_tpu (bool) – True if TPU backward is required

  • -
  • using_native_amp (bool) – True if using native amp

  • -
  • using_lbfgs (bool) – True if the matching optimizer is torch.optim.LBFGS

  • -
-
-
-

Examples:

-
# DEFAULT
-def optimizer_step(self, epoch, batch_idx, optimizer, optimizer_idx,
-                   optimizer_closure, on_tpu, using_native_amp, using_lbfgs):
-    optimizer.step(closure=optimizer_closure)
-
-# Alternating schedule for optimizer steps (i.e.: GANs)
-def optimizer_step(self, epoch, batch_idx, optimizer, optimizer_idx,
-                   optimizer_closure, on_tpu, using_native_amp, using_lbfgs):
-    # update generator opt every step
-    if optimizer_idx == 0:
-        optimizer.step(closure=optimizer_closure)
-
-    # update discriminator opt every 2 steps
-    if optimizer_idx == 1:
-        if (batch_idx + 1) % 2 == 0 :
-            optimizer.step(closure=optimizer_closure)
-        else:
-            # call the closure by itself to run `training_step` + `backward` without an optimizer step
-            optimizer_closure()
-
-    # ...
-    # add as many optimizers as you want
-
-
-

Here’s another example showing how to use this for more advanced things such as -learning rate warm-up:

-
# learning rate warm-up
-def optimizer_step(
-    self,
-    epoch,
-    batch_idx,
-    optimizer,
-    optimizer_idx,
-    optimizer_closure,
-    on_tpu,
-    using_native_amp,
-    using_lbfgs,
-):
-    # update params
-    optimizer.step(closure=optimizer_closure)
-
-    # manually warm up lr without a scheduler
-    if self.trainer.global_step < 500:
-        lr_scale = min(1.0, float(self.trainer.global_step + 1) / 500.0)
-        for pg in optimizer.param_groups:
-            pg["lr"] = lr_scale * self.learning_rate
-
-
-
-
Return type
-

None

-
-
-
- -
-
-

optimizer_zero_grad

-
-
-LightningModule.optimizer_zero_grad(epoch, batch_idx, optimizer, optimizer_idx)[source]
-

Override this method to change the default behaviour of optimizer.zero_grad().

-
-
Parameters
-
    -
  • epoch (int) – Current epoch

  • -
  • batch_idx (int) – Index of current batch

  • -
  • optimizer (Optimizer) – A PyTorch optimizer

  • -
  • optimizer_idx (int) – If you used multiple optimizers this indexes into that list.

  • -
-
-
-

Examples:

-
# DEFAULT
-def optimizer_zero_grad(self, epoch, batch_idx, optimizer, optimizer_idx):
-    optimizer.zero_grad()
-
-# Set gradients to `None` instead of zero to improve performance.
-def optimizer_zero_grad(self, epoch, batch_idx, optimizer, optimizer_idx):
-    optimizer.zero_grad(set_to_none=True)
-
-
-

See torch.optim.Optimizer.zero_grad() for the explanation of the above example.

-
- -
-
-

prepare_data

-
-
-LightningModule.prepare_data()
-

Use this to download and prepare data. Downloading and saving data with multiple processes (distributed -settings) will result in corrupted data. Lightning ensures this method is called only within a single -process, so you can safely add your downloading logic within.

-
-

Warning

-

DO NOT set state to the model (use setup instead) -since this is NOT called on every device

-
-

Example:

-
def prepare_data(self):
-    # good
-    download_data()
-    tokenize()
-    etc()
-
-    # bad
-    self.split = data_split
-    self.some_state = some_other_state()
-
-
-

In DDP prepare_data can be called in two ways (using Trainer(prepare_data_per_node)):

-
    -
  1. Once per node. This is the default and is only called on LOCAL_RANK=0.

  2. -
  3. Once in total. Only called on GLOBAL_RANK=0.

  4. -
-

See prepare_data_per_node.

-

Example:

-
# DEFAULT
-# called once per node on LOCAL_RANK=0 of that node
-Trainer(prepare_data_per_node=True)
-
-# call on GLOBAL_RANK=0 (great for shared file systems)
-Trainer(prepare_data_per_node=False)
-
-
-

This is called before requesting the dataloaders:

-
model.prepare_data()
-initialize_distributed()
-model.setup(stage)
-model.train_dataloader()
-model.val_dataloader()
-model.test_dataloader()
-
-
-
-
Return type
-

None

-
-
-
- -
-
-

setup

-
-
-LightningModule.setup(stage=None)
-

Called at the beginning of fit (train + validate), validate, test, or predict. This is a good hook when -you need to build models dynamically or adjust something about them. This hook is called on every process -when using DDP.

-
-
Parameters
-

stage (Optional[str]) – either 'fit', 'validate', 'test', or 'predict'

-
-
-

Example:

-
class LitModel(...):
-    def __init__(self):
-        self.l1 = None
-
-    def prepare_data(self):
-        download_data()
-        tokenize()
-
-        # don't do this
-        self.something = else
-
-    def setup(self, stage):
-        data = load_data(...)
-        self.l1 = nn.Linear(28, data.num_classes)
-
-
-
-
Return type
-

None

-
-
-
- -
-
-

tbptt_split_batch

-
-
-LightningModule.tbptt_split_batch(batch, split_size)[source]
-

When using truncated backpropagation through time, each batch must be split along the -time dimension. Lightning handles this by default, but for custom behavior override -this function.

-
-
Parameters
-
    -
  • batch (Any) – Current batch

  • -
  • split_size (int) – The size of the split

  • -
-
-
Return type
-

List[Any]

-
-
Returns
-

List of batch splits. Each split will be passed to training_step() to enable truncated -back propagation through time. The default implementation splits root level Tensors and -Sequences at dim=1 (i.e. time dim). It assumes that each time dim is the same length.

-
-
-

Examples:

-
def tbptt_split_batch(self, batch, split_size):
-    splits = []
-    for t in range(0, time_dims[0], split_size):
-        batch_split = []
-        for i, x in enumerate(batch):
-            if isinstance(x, torch.Tensor):
-                split_x = x[:, t:t + split_size]
-            elif isinstance(x, collections.Sequence):
-                split_x = [None] * len(x)
-                for batch_idx in range(len(x)):
-                  split_x[batch_idx] = x[batch_idx][t:t + split_size]
-            batch_split.append(split_x)
-        splits.append(batch_split)
-    return splits
-
-
-
-

Note

-

Called in the training loop after -on_train_batch_start() -if truncated_bptt_steps > 0. -Each returned batch split is passed separately to training_step().

-
-
- -
-
-

teardown

-
-
-LightningModule.teardown(stage=None)
-

Called at the end of fit (train + validate), validate, test, or predict.

-
-
Parameters
-

stage (Optional[str]) – either 'fit', 'validate', 'test', or 'predict'

-
-
Return type
-

None

-
-
-
- -
-
-

train_dataloader

-
-
-LightningModule.train_dataloader()
-

Implement one or more PyTorch DataLoaders for training.

-
-
Return type
-

Union[DataLoader, Sequence[DataLoader], Sequence[Sequence[DataLoader]], Sequence[Dict[str, DataLoader]], Dict[str, DataLoader], Dict[str, Dict[str, DataLoader]], Dict[str, Sequence[DataLoader]]]

-
-
Returns
-

A collection of torch.utils.data.DataLoader specifying training samples. -In the case of multiple dataloaders, please see this section.

-
-
-

The dataloader you return will not be reloaded unless you set -reload_dataloaders_every_n_epochs to -a positive integer.

-

For data processing use the following pattern:

-
-
    -
  • download in prepare_data()

  • -
  • process and split in setup()

  • -
-
-

However, the above are only necessary for distributed processing.

-
-

Warning

-

do not assign state in prepare_data

-
-
    -
  • fit()

  • -
  • prepare_data()

  • -
  • setup()

  • -
-
-

Note

-

Lightning adds the correct sampler for distributed and arbitrary hardware. -There is no need to set it yourself.

-
-

Example:

-
# single dataloader
-def train_dataloader(self):
-    transform = transforms.Compose([transforms.ToTensor(),
-                                    transforms.Normalize((0.5,), (1.0,))])
-    dataset = MNIST(root='/path/to/mnist/', train=True, transform=transform,
-                    download=True)
-    loader = torch.utils.data.DataLoader(
-        dataset=dataset,
-        batch_size=self.batch_size,
-        shuffle=True
-    )
-    return loader
-
-# multiple dataloaders, return as list
-def train_dataloader(self):
-    mnist = MNIST(...)
-    cifar = CIFAR(...)
-    mnist_loader = torch.utils.data.DataLoader(
-        dataset=mnist, batch_size=self.batch_size, shuffle=True
-    )
-    cifar_loader = torch.utils.data.DataLoader(
-        dataset=cifar, batch_size=self.batch_size, shuffle=True
-    )
-    # each batch will be a list of tensors: [batch_mnist, batch_cifar]
-    return [mnist_loader, cifar_loader]
-
-# multiple dataloader, return as dict
-def train_dataloader(self):
-    mnist = MNIST(...)
-    cifar = CIFAR(...)
-    mnist_loader = torch.utils.data.DataLoader(
-        dataset=mnist, batch_size=self.batch_size, shuffle=True
-    )
-    cifar_loader = torch.utils.data.DataLoader(
-        dataset=cifar, batch_size=self.batch_size, shuffle=True
-    )
-    # each batch will be a dict of tensors: {'mnist': batch_mnist, 'cifar': batch_cifar}
-    return {'mnist': mnist_loader, 'cifar': cifar_loader}
-
-
-
- -
-
-

val_dataloader

-
-
-LightningModule.val_dataloader()
-

Implement one or multiple PyTorch DataLoaders for validation.

-

The dataloader you return will not be reloaded unless you set -reload_dataloaders_every_n_epochs to -a positive integer.

-

It’s recommended that all data downloads and preparation happen in prepare_data().

-
    -
  • fit()

  • -
  • validate()

  • -
  • prepare_data()

  • -
  • setup()

  • -
-
-

Note

-

Lightning adds the correct sampler for distributed and arbitrary hardware. -There is no need to set it yourself.

-
-
-
Return type
-

Union[DataLoader, Sequence[DataLoader]]

-
-
Returns
-

A torch.utils.data.DataLoader or a sequence of them specifying validation samples.

-
-
-

Examples:

-
def val_dataloader(self):
-    transform = transforms.Compose([transforms.ToTensor(),
-                                    transforms.Normalize((0.5,), (1.0,))])
-    dataset = MNIST(root='/path/to/mnist/', train=False,
-                    transform=transform, download=True)
-    loader = torch.utils.data.DataLoader(
-        dataset=dataset,
-        batch_size=self.batch_size,
-        shuffle=False
-    )
-
-    return loader
-
-# can also return multiple dataloaders
-def val_dataloader(self):
-    return [loader_a, loader_b, ..., loader_n]
-
-
-
-

Note

-

If you don’t need a validation dataset and a validation_step(), you don’t need to -implement this method.

-
-
-

Note

-

In the case where you return multiple validation dataloaders, the validation_step() -will have an argument dataloader_idx which matches the order here.

-
-
- -
-
-

test_dataloader

-
-
-LightningModule.test_dataloader()
-

Implement one or multiple PyTorch DataLoaders for testing.

-

For data processing use the following pattern:

-
-
    -
  • download in prepare_data()

  • -
  • process and split in setup()

  • -
-
-

However, the above are only necessary for distributed processing.

-
-

Warning

-

do not assign state in prepare_data

-
-
    -
  • test()

  • -
  • prepare_data()

  • -
  • setup()

  • -
-
-

Note

-

Lightning adds the correct sampler for distributed and arbitrary hardware. -There is no need to set it yourself.

-
-
-
Return type
-

Union[DataLoader, Sequence[DataLoader]]

-
-
Returns
-

A torch.utils.data.DataLoader or a sequence of them specifying testing samples.

-
-
-

Example:

-
def test_dataloader(self):
-    transform = transforms.Compose([transforms.ToTensor(),
-                                    transforms.Normalize((0.5,), (1.0,))])
-    dataset = MNIST(root='/path/to/mnist/', train=False, transform=transform,
-                    download=True)
-    loader = torch.utils.data.DataLoader(
-        dataset=dataset,
-        batch_size=self.batch_size,
-        shuffle=False
-    )
-
-    return loader
-
-# can also return multiple dataloaders
-def test_dataloader(self):
-    return [loader_a, loader_b, ..., loader_n]
-
-
-
-

Note

-

If you don’t need a test dataset and a test_step(), you don’t need to implement -this method.

-
-
-

Note

-

In the case where you return multiple test dataloaders, the test_step() -will have an argument dataloader_idx which matches the order here.

-
-
- -
-
-

predict_dataloader

-
-
-LightningModule.predict_dataloader()
-

Implement one or multiple PyTorch DataLoaders for prediction.

-

It’s recommended that all data downloads and preparation happen in prepare_data().

-
    -
  • predict()

  • -
  • prepare_data()

  • -
  • setup()

  • -
-
-

Note

-

Lightning adds the correct sampler for distributed and arbitrary hardware. -There is no need to set it yourself.

-
-
-
Return type
-

Union[DataLoader, Sequence[DataLoader]]

-
-
Returns
-

A torch.utils.data.DataLoader or a sequence of them specifying prediction samples.

-
-
-
-

Note

-

In the case where you return multiple prediction dataloaders, the predict_step() -will have an argument dataloader_idx which matches the order here.

-
-
- -
-
-

on_train_dataloader

-
-
-LightningModule.on_train_dataloader()
-

Called before requesting the train dataloader.

-
-

Deprecated since version v1.5: on_train_dataloader() is deprecated and will be removed in v1.7.0. -Please use train_dataloader() directly.

-
-
-
Return type
-

None

-
-
-
- -
-
-

on_val_dataloader

-
-
-LightningModule.on_val_dataloader()
-

Called before requesting the val dataloader.

-
-

Deprecated since version v1.5: on_val_dataloader() is deprecated and will be removed in v1.7.0. -Please use val_dataloader() directly.

-
-
-
Return type
-

None

-
-
-
- -
-
-

on_test_dataloader

-
-
-LightningModule.on_test_dataloader()
-

Called before requesting the test dataloader.

-
-

Deprecated since version v1.5: on_test_dataloader() is deprecated and will be removed in v1.7.0. -Please use test_dataloader() directly.

-
-
-
Return type
-

None

-
-
-
- -
-
-

on_predict_dataloader

-
-
-LightningModule.on_predict_dataloader()
-

Called before requesting the predict dataloader.

-
-

Deprecated since version v1.5: on_predict_dataloader() is deprecated and will be removed in v1.7.0. -Please use predict_dataloader() directly.

-
-
-
Return type
-

None

-
-
-
- -
-
-

transfer_batch_to_device

-
-
-LightningModule.transfer_batch_to_device(batch, device, dataloader_idx)
-

Override this hook if your DataLoader returns tensors wrapped in a custom -data structure.

-

The data types listed below (and any arbitrary nesting of them) are supported out of the box:

-
    -
  • torch.Tensor or anything that implements .to(…)

  • -
  • list

  • -
  • dict

  • -
  • tuple

  • -
  • torchtext.data.batch.Batch

  • -
-

For anything else, you need to define how the data is moved to the target device (CPU, GPU, TPU, …).

-
-

Note

-

This hook should only transfer the data and not modify it, nor should it move the data to -any other device than the one passed in as argument (unless you know what you are doing). -To check the current state of execution of this hook you can use -self.trainer.training/testing/validating/predicting so that you can -add different logic as per your requirement.

-
-
-

Note

-

This hook only runs on single GPU training and DDP (no data-parallel). -Data-Parallel support will come in the near future.

-
-
-
Parameters
-
    -
  • batch (Any) – A batch of data that needs to be transferred to a new device.

  • -
  • device (device) – The target device as defined in PyTorch.

  • -
  • dataloader_idx (int) – The index of the dataloader to which the batch belongs.

  • -
-
-
Return type
-

Any

-
-
Returns
-

A reference to the data on the new device.

-
-
-

Example:

-
def transfer_batch_to_device(self, batch, device, dataloader_idx):
-    if isinstance(batch, CustomBatch):
-        # move all tensors in your custom data structure to the device
-        batch.samples = batch.samples.to(device)
-        batch.targets = batch.targets.to(device)
-    elif dataloader_idx == 0:
-        # skip device transfer for the first dataloader or anything you wish
-        pass
-    else:
-        batch = super().transfer_batch_to_device(data, device, dataloader_idx)
-    return batch
-
-
-
-
Raises
-

MisconfigurationException – If using data-parallel, Trainer(strategy='dp').

-
-
-
-

See also

-
    -
  • move_data_to_device()

  • -
  • apply_to_collection()

  • -
-
-
- -
-
-

on_before_batch_transfer

-
-
-LightningModule.on_before_batch_transfer(batch, dataloader_idx)
-

Override to alter or apply batch augmentations to your batch before it is transferred to the device.

-
-

Note

-

To check the current state of execution of this hook you can use -self.trainer.training/testing/validating/predicting so that you can -add different logic as per your requirement.

-
-
-

Note

-

This hook only runs on single GPU training and DDP (no data-parallel). -Data-Parallel support will come in the near future.

-
-
-
Parameters
-
    -
  • batch (Any) – A batch of data that needs to be altered or augmented.

  • -
  • dataloader_idx (int) – The index of the dataloader to which the batch belongs.

  • -
-
-
Return type
-

Any

-
-
Returns
-

A batch of data

-
-
-

Example:

-
def on_before_batch_transfer(self, batch, dataloader_idx):
-    batch['x'] = transforms(batch['x'])
-    return batch
-
-
-
-
Raises
-

MisconfigurationException – If using data-parallel, Trainer(strategy='dp').

-
-
-
-

See also

-
    -
  • on_after_batch_transfer()

  • -
  • transfer_batch_to_device()

  • -
-
-
- -
-
-

on_after_batch_transfer

-
-
-LightningModule.on_after_batch_transfer(batch, dataloader_idx)
-

Override to alter or apply batch augmentations to your batch after it is transferred to the device.

-
-

Note

-

To check the current state of execution of this hook you can use -self.trainer.training/testing/validating/predicting so that you can -add different logic as per your requirement.

-
-
-

Note

-

This hook only runs on single GPU training and DDP (no data-parallel). -Data-Parallel support will come in the near future.

-
-
-
Parameters
-
    -
  • batch (Any) – A batch of data that needs to be altered or augmented.

  • -
  • dataloader_idx (int) – The index of the dataloader to which the batch belongs.

  • -
-
-
Return type
-

Any

-
-
Returns
-

A batch of data

-
-
-

Example:

-
def on_after_batch_transfer(self, batch, dataloader_idx):
-    batch['x'] = gpu_transforms(batch['x'])
-    return batch
-
-
-
-
Raises
-

MisconfigurationException – If using data-parallel, Trainer(strategy='dp').

-
-
-
-

See also

-
    -
  • on_before_batch_transfer()

  • -
  • transfer_batch_to_device()

  • -
-
-
- -
-
-

add_to_queue

-
-
-LightningModule.add_to_queue(queue)[source]
-

Appends the trainer.callback_metrics dictionary to the given queue. To avoid issues with memory -sharing, we cast the data to numpy.

-
-
Parameters
-

queue (_FakeQueue) – the instance of the queue to append the data.

-
-
-
-

Deprecated since version v1.5: This method was deprecated in v1.5 and will be removed in v1.7.

-
-
-
Return type
-

None

-
-
-
- -
-
-

get_from_queue

-
-
-LightningModule.get_from_queue(queue)[source]
-

Retrieve the trainer.callback_metrics dictionary from the given queue. To preserve consistency, -we cast back the data to torch.Tensor.

-
-
Parameters
-

queue (_FakeQueue) – the instance of the queue from where to get the data.

-
-
-
-

Deprecated since version v1.5: This method was deprecated in v1.5 and will be removed in v1.7.

-
-
-
Return type
-

None

-
-
-
- -
-
-
-
- - -
- -
-
- - - - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- -
-
-
- - -
-
-
-
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/common/optimization.html b/docs/common/optimization.html deleted file mode 100644 index 428d7b8..0000000 --- a/docs/common/optimization.html +++ /dev/null @@ -1,1296 +0,0 @@ - - - - - - - - - - - - - - Optimization — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- - - - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Optimization

-

Lightning offers two modes for managing the optimization process:

-
    -
  • Manual Optimization

  • -
  • Automatic Optimization

  • -
-

For the majority of research cases, automatic optimization will do the right thing for you and it is what most -users should use.

-

For advanced/expert users who want to do esoteric optimization schedules or techniques, use manual optimization.

-
-
-

Manual Optimization

-

For advanced research topics like reinforcement learning, sparse coding, or GAN research, it may be desirable to -manually manage the optimization process.

-

This is only recommended for experts who need ultimate flexibility. -Lightning will handle only accelerator, precision and strategy logic. -The users are left with optimizer.zero_grad(), gradient accumulation, model toggling, etc.

-

To manually optimize, do the following:

-
    -
  • Set self.automatic_optimization=False in your LightningModule’s __init__.

  • -
  • Use the following functions and call them manually:

    -
      -
    • self.optimizers() to access your optimizers (one or multiple)

    • -
    • optimizer.zero_grad() to clear the gradients from the previous training step

    • -
    • self.manual_backward(loss) instead of loss.backward()

    • -
    • optimizer.step() to update your model parameters

    • -
    -
  • -
-

Here is a minimal example of manual optimization.

-
from pytorch_lightning import LightningModule
-
-
-class MyModel(LightningModule):
-    def __init__(self):
-        super().__init__()
-        # Important: This property activates manual optimization.
-        self.automatic_optimization = False
-
-    def training_step(self, batch, batch_idx):
-        opt = self.optimizers()
-        opt.zero_grad()
-        loss = self.compute_loss(batch)
-        self.manual_backward(loss)
-        opt.step()
-
-
-
-

Warning

-

Before 1.2, optimizer.step() was calling optimizer.zero_grad() internally. -From 1.2, it is left to the user’s expertise.

-
-
-

Tip

-

Be careful where you call optimizer.zero_grad(), or your model won’t converge. -It is good practice to call optimizer.zero_grad() before self.manual_backward(loss).

-
-
-

Access your Own Optimizer

-

The provided optimizer is a LightningOptimizer object wrapping your own optimizer -configured in your configure_optimizers(). You can access your own optimizer -with optimizer.optimizer. However, if you use your own optimizer to perform a step, Lightning won’t be able to -support accelerators, precision and profiling for you.

-
class Model(LightningModule):
-    def __init__(self):
-        super().__init__()
-        self.automatic_optimization = False
-        ...
-
-    def training_step(self, batch, batch_idx):
-        optimizer = self.optimizers()
-
-        # `optimizer` is a `LightningOptimizer` wrapping the optimizer.
-        # To access it, do the following.
-        # However, it won't work on TPU, AMP, etc...
-        optimizer = optimizer.optimizer
-        ...
-
-
-
-
-

Gradient Accumulation

-

You can accumulate gradients over batches similarly to accumulate_grad_batches argument in -Trainer for automatic optimization. To perform gradient accumulation with one optimizer -after every N steps, you can do as such.

-
def __init__(self):
-    super().__init__()
-    self.automatic_optimization = False
-
-
-def training_step(self, batch, batch_idx):
-    opt = self.optimizers()
-
-    loss = self.compute_loss(batch)
-    self.manual_backward(loss)
-
-    # accumulate gradients of N batches
-    if (batch_idx + 1) % N == 0:
-        opt.step()
-        opt.zero_grad()
-
-
-
-
-

Use Multiple Optimizers (like GANs)

-

Here is an example training a simple GAN with multiple optimizers using manual optimization.

-
import torch
-from torch import Tensor
-from pytorch_lightning import LightningModule
-
-
-class SimpleGAN(LightningModule):
-    def __init__(self):
-        super().__init__()
-        self.G = Generator()
-        self.D = Discriminator()
-
-        # Important: This property activates manual optimization.
-        self.automatic_optimization = False
-
-    def sample_z(self, n) -> Tensor:
-        sample = self._Z.sample((n,))
-        return sample
-
-    def sample_G(self, n) -> Tensor:
-        z = self.sample_z(n)
-        return self.G(z)
-
-    def training_step(self, batch, batch_idx):
-        # Implementation follows the PyTorch tutorial:
-        # https://pytorch.org/tutorials/beginner/dcgan_faces_tutorial.html
-        g_opt, d_opt = self.optimizers()
-
-        X, _ = batch
-        batch_size = X.shape[0]
-
-        real_label = torch.ones((batch_size, 1), device=self.device)
-        fake_label = torch.zeros((batch_size, 1), device=self.device)
-
-        g_X = self.sample_G(batch_size)
-
-        ##########################
-        # Optimize Discriminator #
-        ##########################
-        d_x = self.D(X)
-        errD_real = self.criterion(d_x, real_label)
-
-        d_z = self.D(g_X.detach())
-        errD_fake = self.criterion(d_z, fake_label)
-
-        errD = errD_real + errD_fake
-
-        d_opt.zero_grad()
-        self.manual_backward(errD)
-        d_opt.step()
-
-        ######################
-        # Optimize Generator #
-        ######################
-        d_z = self.D(g_X)
-        errG = self.criterion(d_z, real_label)
-
-        g_opt.zero_grad()
-        self.manual_backward(errG)
-        g_opt.step()
-
-        self.log_dict({"g_loss": errG, "d_loss": errD}, prog_bar=True)
-
-    def configure_optimizers(self):
-        g_opt = torch.optim.Adam(self.G.parameters(), lr=1e-5)
-        d_opt = torch.optim.Adam(self.D.parameters(), lr=1e-5)
-        return g_opt, d_opt
-
-
-
-
-

Learning Rate Scheduling

-

Every optimizer you use can be paired with any -Learning Rate Scheduler. Please see the -documentation of configure_optimizers() for all the available options

-

You can call lr_scheduler.step() at arbitrary intervals. -Use self.lr_schedulers() in your LightningModule to access any learning rate schedulers -defined in your configure_optimizers().

-
-

Warning

-
    -
  • Before v1.3, Lightning automatically called lr_scheduler.step() in both automatic and manual optimization. From -1.3, lr_scheduler.step() is now for the user to call at arbitrary intervals.

  • -
  • Note that the lr_scheduler_config keys, such as "frequency" and "interval", will be ignored even if they are provided in -your configure_optimizers() during manual optimization.

  • -
-
-

Here is an example calling lr_scheduler.step() every step.

-
# step every batch
-def __init__(self):
-    super().__init__()
-    self.automatic_optimization = False
-
-
-def training_step(self, batch, batch_idx):
-    # do forward, backward, and optimization
-    ...
-
-    # single scheduler
-    sch = self.lr_schedulers()
-    sch.step()
-
-    # multiple schedulers
-    sch1, sch2 = self.lr_schedulers()
-    sch1.step()
-    sch2.step()
-
-
-

If you want to call lr_scheduler.step() every N steps/epochs, do the following.

-
def __init__(self):
-    super().__init__()
-    self.automatic_optimization = False
-
-
-def training_step(self, batch, batch_idx):
-    # do forward, backward, and optimization
-    ...
-
-    sch = self.lr_schedulers()
-
-    # step every N batches
-    if (batch_idx + 1) % N == 0:
-        sch.step()
-
-    # step every N epochs
-    if self.trainer.is_last_batch and (self.trainer.current_epoch + 1) % N == 0:
-        sch.step()
-
-
-

If you want to call schedulers that require a metric value after each epoch, consider doing the following:

-
def __init__(self):
-    super().__init__()
-    self.automatic_optimization = False
-
-
-def training_epoch_end(self, outputs):
-    sch = self.lr_schedulers()
-
-    # If the selected scheduler is a ReduceLROnPlateau scheduler.
-    if isinstance(sch, torch.optim.lr_scheduler.ReduceLROnPlateau):
-        sch.step(self.trainer.callback_metrics["loss"])
-
-
-
-
-

Use Closure for LBFGS-like Optimizers

-

It is a good practice to provide the optimizer with a closure function that performs a forward, zero_grad and -backward of your model. It is optional for most optimizers, but makes your code compatible if you switch to an -optimizer which requires a closure, such as LBFGS.

-

See the PyTorch docs for more about the closure.

-

Here is an example using a closure function.

-
def __init__(self):
-    super().__init__()
-    self.automatic_optimization = False
-
-
-def configure_optimizers(self):
-    return torch.optim.LBFGS(...)
-
-
-def training_step(self, batch, batch_idx):
-    opt = self.optimizers()
-
-    def closure():
-        loss = self.compute_loss(batch)
-        opt.zero_grad()
-        self.manual_backward(loss)
-        return loss
-
-    opt.step(closure=closure)
-
-
-
-

Warning

-

The LBFGS optimizer is not supported for apex AMP, native AMP, IPUs, or DeepSpeed.

-
-
-
-
-
-

Automatic Optimization

-

With Lightning, most users don’t have to think about when to call .zero_grad(), .backward() and .step() -since Lightning automates that for you.

-

Under the hood, Lightning does the following:

-
for epoch in epochs:
-    for batch in data:
-
-        def closure():
-            loss = model.training_step(batch, batch_idx, ...)
-            optimizer.zero_grad()
-            loss.backward()
-            return loss
-
-        optimizer.step(closure)
-
-    lr_scheduler.step()
-
-
-

In the case of multiple optimizers, Lightning does the following:

-
for epoch in epochs:
-    for batch in data:
-        for opt in optimizers:
-
-            def closure():
-                loss = model.training_step(batch, batch_idx, optimizer_idx)
-                opt.zero_grad()
-                loss.backward()
-                return loss
-
-            opt.step(closure)
-
-    for lr_scheduler in lr_schedulers:
-        lr_scheduler.step()
-
-
-

As can be seen in the code snippet above, Lightning defines a closure with training_step(), optimizer.zero_grad() -and loss.backward() for the optimization. This mechanism is in place to support optimizers which operate on the -output of the closure (e.g. the loss) or need to call the closure several times (e.g. LBFGS).

-
-

Warning

-

Before v1.2.2, Lightning internally called backward, step and zero_grad, in that order. -From v1.2.2, the order is changed to zero_grad, backward and step.

-
-
-

Gradient Accumulation

-

Accumulated gradients run K small batches of size N before doing an optimizer step. The effect is a large effective batch size of KxN, where N is the batch size. -Internally, it doesn’t stack up the batches and do a single forward pass; rather, it accumulates the gradients for K batches and then does an optimizer.step, so that the -effective batch size is increased but there is no memory overhead.

-
-

Warning

-

When using distributed training, e.g. DDP, with, let’s say, P devices, each device accumulates independently, i.e. it stores the gradients -after each loss.backward() and doesn’t sync the gradients across the devices until we call optimizer.step(). So for each accumulation -step, the effective batch size on each device will remain N*K, but right before the optimizer.step(), the gradient sync will make the effective -batch size P*N*K. For DP, since the batch is split across devices, the final effective batch size will be N*K.

-
-
-

See also

-

Trainer

-
-
# DEFAULT (ie: no accumulated grads)
-trainer = Trainer(accumulate_grad_batches=1)
-
-# Accumulate gradients for 7 batches
-trainer = Trainer(accumulate_grad_batches=7)
-
-
-

You can set different values for it at different epochs by passing a dictionary, where the key represents the epoch at which the value for gradient accumulation -should be updated.

-
# till 5th epoch, it will accumulate every 8 batches. From 5th epoch
-# till 9th epoch it will accumulate every 4 batches and after that no accumulation
-# will happen. Note that you need to use zero-indexed epoch keys here
-trainer = Trainer(accumulate_grad_batches={0: 8, 4: 4, 8: 1})
-
-
-

Or, you can create custom GradientAccumulationScheduler

-
from pytorch_lightning.callbacks import GradientAccumulationScheduler
-
-
-# till 5th epoch, it will accumulate every 8 batches. From 5th epoch
-# till 9th epoch it will accumulate every 4 batches and after that no accumulation
-# will happen. Note that you need to use zero-indexed epoch keys here
-accumulator = GradientAccumulationScheduler(scheduling={0: 8, 4: 4, 8: 1})
-trainer = Trainer(callbacks=accumulator)
-
-
-
-
-

Use Multiple Optimizers (like GANs)

-

To use multiple optimizers (optionally with learning rate schedulers), return two or more optimizers from -configure_optimizers().

-
# two optimizers, no schedulers
-def configure_optimizers(self):
-    return Adam(...), SGD(...)
-
-
-# two optimizers, one scheduler for adam only
-def configure_optimizers(self):
-    opt1 = Adam(...)
-    opt2 = SGD(...)
-    optimizers = [opt1, opt2]
-    lr_schedulers = {"scheduler": ReduceLROnPlateau(opt1, ...), "monitor": "metric_to_track"}
-    return optimizers, lr_schedulers
-
-
-# two optimizers, two schedulers
-def configure_optimizers(self):
-    opt1 = Adam(...)
-    opt2 = SGD(...)
-    return [opt1, opt2], [StepLR(opt1, ...), OneCycleLR(opt2, ...)]
-
-
-

Under the hood, Lightning will call each optimizer sequentially:

-
for epoch in epochs:
-    for batch in data:
-        for opt in optimizers:
-            loss = train_step(batch, batch_idx, optimizer_idx)
-            opt.zero_grad()
-            loss.backward()
-            opt.step()
-
-    for lr_scheduler in lr_schedulers:
-        lr_scheduler.step()
-
-
-
-
-

Step Optimizers at Arbitrary Intervals

-

To do more interesting things with your optimizers such as learning rate warm-up or odd scheduling, -override the optimizer_step() function.

-
-

Warning

-

If you are overriding this method, make sure that you pass the optimizer_closure parameter to -optimizer.step() function as shown in the examples because training_step(), optimizer.zero_grad(), -loss.backward() are called in the closure function.

-
-

For example, here we step optimizer A every batch and optimizer B every 2 batches.

-
# Alternating schedule for optimizer steps (e.g. GANs)
-def optimizer_step(
-    self,
-    epoch,
-    batch_idx,
-    optimizer,
-    optimizer_idx,
-    optimizer_closure,
-    on_tpu=False,
-    using_native_amp=False,
-    using_lbfgs=False,
-):
-    # update generator every step
-    if optimizer_idx == 0:
-        optimizer.step(closure=optimizer_closure)
-
-    # update discriminator every 2 steps
-    if optimizer_idx == 1:
-        if (batch_idx + 1) % 2 == 0:
-            # the closure (which includes the `training_step`) will be executed by `optimizer.step`
-            optimizer.step(closure=optimizer_closure)
-        else:
-            # call the closure by itself to run `training_step` + `backward` without an optimizer step
-            optimizer_closure()
-
-    # ...
-    # add as many optimizers as you want
-
-
-

Here we add a manual learning rate warm-up without an lr scheduler.

-
# learning rate warm-up
-def optimizer_step(
-    self,
-    epoch,
-    batch_idx,
-    optimizer,
-    optimizer_idx,
-    optimizer_closure,
-    on_tpu=False,
-    using_native_amp=False,
-    using_lbfgs=False,
-):
-    # update params
-    optimizer.step(closure=optimizer_closure)
-
-    # warm up the learning rate over the first 500 steps
-    if self.trainer.global_step < 500:
-        lr_scale = min(1.0, float(self.trainer.global_step + 1) / 500.0)
-        for pg in optimizer.param_groups:
-            pg["lr"] = lr_scale * self.hparams.learning_rate
-
-
-
-
-

Access your Own Optimizer

-

The provided optimizer is a LightningOptimizer object wrapping your own optimizer -configured in your configure_optimizers(). -You can access your own optimizer with optimizer.optimizer. However, if you use your own optimizer -to perform a step, Lightning won’t be able to support accelerators, precision and profiling for you.

-
# function hook in LightningModule
-def optimizer_step(
-    self,
-    epoch,
-    batch_idx,
-    optimizer,
-    optimizer_idx,
-    optimizer_closure,
-    on_tpu=False,
-    using_native_amp=False,
-    using_lbfgs=False,
-):
-    optimizer.step(closure=optimizer_closure)
-
-
-# `optimizer` is a `LightningOptimizer` wrapping the optimizer.
-# To access it, do the following.
-# However, it won't work on TPU, AMP, etc...
-def optimizer_step(
-    self,
-    epoch,
-    batch_idx,
-    optimizer,
-    optimizer_idx,
-    optimizer_closure,
-    on_tpu=False,
-    using_native_amp=False,
-    using_lbfgs=False,
-):
-    optimizer = optimizer.optimizer
-    optimizer.step(closure=optimizer_closure)
-
-
-
-
-
-

Bring your own Custom Learning Rate Schedulers

-

Lightning allows using custom learning rate schedulers that aren’t available in PyTorch natively. -One good example is Timm Schedulers. When using custom learning rate schedulers -relying on a different API from Native PyTorch ones, you should override the lr_scheduler_step() with your desired logic. -If you are using native PyTorch schedulers, there is no need to override this hook since Lightning will handle it automatically by default.

-
from timm.scheduler import TanhLRScheduler
-
-
-def configure_optimizers(self):
-    optimizer = ...
-    scheduler = TanhLRScheduler(optimizer, ...)
-    return [optimizer], [{"scheduler": scheduler, "interval": "epoch"}]
-
-
-def lr_scheduler_step(self, scheduler, optimizer_idx, metric):
-    scheduler.step(epoch=self.current_epoch)  # timm's scheduler needs the epoch value
-
-
-
-
-

Configure Gradient Clipping

-

To configure custom gradient clipping, consider overriding -the configure_gradient_clipping() method. -Attributes gradient_clip_val and gradient_clip_algorithm from Trainer will be passed in the -respective arguments here and Lightning will handle gradient clipping for you. In case you want to set -different values for your arguments of your choice and let Lightning handle the gradient clipping, you can -use the inbuilt clip_gradients() method and pass -the arguments along with your optimizer.

-
-

Warning

-

Make sure to not override clip_gradients() -method. If you want to customize gradient clipping, consider using -configure_gradient_clipping() method.

-
-

For example, here we will apply gradient clipping only to the gradients associated with optimizer A.

-
def configure_gradient_clipping(self, optimizer, optimizer_idx, gradient_clip_val, gradient_clip_algorithm):
-    if optimizer_idx == 0:
-        # Lightning will handle the gradient clipping
-        self.clip_gradients(
-            optimizer, gradient_clip_val=gradient_clip_val, gradient_clip_algorithm=gradient_clip_algorithm
-        )
-
-
-

Here we configure gradient clipping differently for optimizer B.

-
def configure_gradient_clipping(self, optimizer, optimizer_idx, gradient_clip_val, gradient_clip_algorithm):
-    if optimizer_idx == 0:
-        # Lightning will handle the gradient clipping
-        self.clip_gradients(
-            optimizer, gradient_clip_val=gradient_clip_val, gradient_clip_algorithm=gradient_clip_algorithm
-        )
-    elif optimizer_idx == 1:
-        self.clip_gradients(
-            optimizer, gradient_clip_val=gradient_clip_val * 2, gradient_clip_algorithm=gradient_clip_algorithm
-        )
-
-
-
-
-

Total Stepping Batches

-

You can use the built-in trainer property estimated_stepping_batches to compute -the total number of stepping batches for the complete training. The property is computed taking the gradient accumulation factor and -distributed setting into consideration so you don’t have to derive it manually. One good example where this can be helpful is when using the -OneCycleLR scheduler, which requires pre-computed total_steps during initialization.

-
def configure_optimizers(self):
-    optimizer = ...
-    scheduler = torch.optim.lr_scheduler.OneCycleLR(
-        optimizer, max_lr=1e-3, total_steps=self.trainer.estimated_stepping_batches
-    )
-    return [optimizer], [scheduler]
-
-
-
-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/common/precision.html b/docs/common/precision.html deleted file mode 100644 index 0b8d6b3..0000000 --- a/docs/common/precision.html +++ /dev/null @@ -1,731 +0,0 @@ - - - - - - - - - - - - - - N-Bit Precision — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- - - - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
- - -
-
- - - - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- -
-
-
- - -
-
-
-
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/common/precision_basic.html b/docs/common/precision_basic.html deleted file mode 100644 index 209922e..0000000 --- a/docs/common/precision_basic.html +++ /dev/null @@ -1,776 +0,0 @@ - - - - - - - - - - - - - - N-Bit Precision (Basic) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • N-Bit Precision (Basic)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

N-Bit Precision (Basic)

-

Audience: Users looking to train models faster and consume less memory.

-
-

If you’re looking to run models faster or consume less memory, consider tweaking the precision settings of your models.

-

Lower precision, such as 16-bit floating-point, requires less memory and enables training and deploying larger models. -Higher precision, such as the 64-bit floating-point, can be used for highly sensitive use-cases.

-
-
-

16-bit Precision

-

Use 16-bit precision to cut your memory consumption in half so that you can train and deploy larger models. If your GPUs are [Tensor Core] GPUs, you can also get a ~3x speed improvement. Half precision can sometimes lead to unstable training.

-
Trainer(precision=16)
-
-
-
-
-
-

32-bit Precision

-

32-bit precision is the default used across all models and research. This precision is known to be stable in contrast to lower precision settings.

-
Trainer(precision=32)
-
-
-
-
-
-

64-bit Precision

-

For certain scientific computations, 64-bit precision enables more accurate models. However, doubling the precision from 32 to 64 bit also doubles the memory requirements.

-
Trainer(precision=64)
-
-
-
-

Note

-

In deep learning, memory is always a bottleneck, especially when dealing with a large volume of data and with limited resources, -so it is recommended to use single precision for better speed. You can still use 64-bit precision if your particular use-case requires it.

-
-
-
-
-

Precision support by accelerator

- - ------- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
Precision with Accelerators

Precision

CPU

GPU

TPU

IPU

16

No

Yes

No

Yes

BFloat16

Yes

Yes

Yes

No

32

Yes

Yes

Yes

Yes

64

Yes

Yes

No

No

-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/common/precision_expert.html b/docs/common/precision_expert.html deleted file mode 100644 index fd1322b..0000000 --- a/docs/common/precision_expert.html +++ /dev/null @@ -1,709 +0,0 @@ - - - - - - - - - - - - - - N-Bit Precision (Expert) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • N-Bit Precision (Expert)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

N-Bit Precision (Expert)

-

Audience: Researchers looking to integrate their new precision techniques into Lightning.

-
-

Precision Plugins

-

You can also customize and pass your own Precision Plugin by subclassing the PrecisionPlugin class.

-
    -
  • Perform pre and post backward/optimizer step operations such as scaling gradients.

  • -
  • Provide context managers for forward, training_step, etc.

  • -
-
class CustomPrecisionPlugin(PrecisionPlugin):
-    precision = 16
-
-    ...
-
-
-trainer = Trainer(plugins=[CustomPrecisionPlugin()])
-
-
-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/common/precision_intermediate.html b/docs/common/precision_intermediate.html deleted file mode 100644 index 0fc0e78..0000000 --- a/docs/common/precision_intermediate.html +++ /dev/null @@ -1,800 +0,0 @@ - - - - - - - - - - - - - - N-Bit Precision (Intermediate) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • N-Bit Precision (Intermediate)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

N-Bit Precision (Intermediate)

-

Audience: Users looking to scale larger models or take advantage of optimized accelerators.

-
-
-

What is Mixed Precision?

-

PyTorch, like most deep learning frameworks, trains on 32-bit floating-point (FP32) arithmetic by default. However, many deep learning models do not require this to reach complete accuracy. By conducting -operations in half-precision format while keeping minimum information in single-precision to maintain as much information as possible in crucial areas of the network, mixed precision training delivers -significant computational speedup. Switching to mixed precision has resulted in considerable training speedups since the introduction of Tensor Cores in the Volta and Turing architectures. It combines -FP32 and lower-bit floating-points (such as FP16) to reduce memory footprint and increase performance during model training and evaluation. It accomplishes this by recognizing the steps that require -complete accuracy and employing a 32-bit floating-point for those steps only, while using a 16-bit floating-point for the rest. When compared to complete precision training, mixed precision training -delivers all of these benefits while ensuring that no task-specific accuracy is lost. [2].

-
-

Note

-

In some cases, it is essential to remain in FP32 for numerical stability, so keep this in mind when using mixed precision. -For example, when running scatter operations during the forward (such as torchpoint3d), computation must remain in FP32.

-
-
-

Warning

-

Do not cast anything to other dtypes manually using torch.autocast or tensor.half() when using native precision because -this can bring instability.

-
class LitModel(LightningModule):
-    def training_step(self, batch, batch_idx):
-        outs = self(batch)
-
-        a_float32 = torch.rand((8, 8), device=self.device, dtype=self.dtype)
-        b_float32 = torch.rand((8, 4), device=self.device, dtype=self.dtype)
-
-        # casting to float16 manually
-        with torch.autocast(device_type=self.device.type):
-            c_float16 = torch.mm(a_float32, b_float32)
-            target = self.layer(c_float16.flatten()[None])
-
-        # here outs is of type float32 and target is of type float16
-        loss = torch.mm(target @ outs).float()
-        return loss
-
-
-trainer = Trainer(accelerator="gpu", devices=1, precision=32)
-
-
-
-
-
-
-

FP16 Mixed Precision

-

In most cases, mixed precision uses FP16. Supported PyTorch operations automatically run in FP16, saving memory and improving throughput on the supported accelerators.

-
-

Note

-

When using TPUs, setting precision=16 will enable bfloat16, the only supported half precision type on TPUs.

-
-
Trainer(accelerator="gpu", devices=1, precision=16)
-
-
-
-

PyTorch Native

-

PyTorch 1.6 release introduced mixed precision functionality into their core as the AMP package, torch.cuda.amp. It is more flexible and intuitive compared to NVIDIA APEX. -Since computation happens in FP16, there is a chance of numerical instability during training. This is handled internally by a dynamic grad scaler which skips invalid steps and adjusts the scaler to ensure subsequent steps fall within a finite range. For more information see the autocast docs. -Lightning uses native amp by default with precision=16|"bf16". You can also set it using:

-
Trainer(precision=16, amp_backend="native")
-
-
-
-
-

NVIDIA APEX

-
-

Warning

-

We strongly recommend using the above native mixed precision rather than NVIDIA APEX unless you require more refined control.

-
-

NVIDIA APEX offers additional flexibility in setting mixed precision. This can be useful when trying out different precision configurations, such as keeping most of your weights in FP16 and running computation in FP16.

-
Trainer(accelerator="gpu", devices=1, amp_backend="apex", precision=16)
-
-
-

Set the NVIDIA optimization level via the trainer.

-
Trainer(accelerator="gpu", devices=1, amp_backend="apex", amp_level="O2", precision=16)
-
-
-
-
-
-
-

BFloat16 Mixed Precision

-
-

Warning

-

BFloat16 requires PyTorch 1.10 or later and is only supported with PyTorch Native AMP.

-

BFloat16 is also experimental and may not provide significant speedups or memory improvements, but it offers better numerical stability.

-

Do note for GPUs, the most significant benefits require Ampere based GPUs, such as A100s or 3090s.

-
-

BFloat16 Mixed precision is similar to FP16 mixed precision, however, it maintains more of the “dynamic range” that FP32 offers. This means it is able to provide better numerical stability than FP16 mixed precision. For more information, see this TPU performance blogpost.

-

Under the hood, we use torch.autocast with the dtype set to bfloat16, with no gradient scaling.

-
Trainer(accelerator="gpu", devices=1, precision="bf16")
-
-
-

It is also possible to use BFloat16 mixed precision on the CPU, relying on MKLDNN under the hood.

-
Trainer(precision="bf16")
-
-
-
-
-
-

8-bit Optimizer

-

It is possible to further reduce the precision using third-party libraries like bitsandbytes. Although -Lightning doesn’t support it out of the box yet, you can still use it by configuring it in your LightningModule and setting Trainer(precision=32).

-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/common/progress_bar.html b/docs/common/progress_bar.html deleted file mode 100644 index 07b626d..0000000 --- a/docs/common/progress_bar.html +++ /dev/null @@ -1,817 +0,0 @@ - - - - - - - - - - - - - - Customize the progress bar — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Customize the progress bar
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Customize the progress bar

-

Lightning supports two different types of progress bars (tqdm and rich). TQDMProgressBar is used by default, -but you can override it by passing a custom TQDMProgressBar or RichProgressBar to the callbacks argument of the Trainer.

-

You could also use the ProgressBarBase class to implement your own progress bar.

-
-
-

TQDMProgressBar

-

The TQDMProgressBar uses the tqdm library internally and is the default progress bar used by Lightning. -It prints to stdout and shows up to four different bars:

-
    -
  • sanity check progress: the progress during the sanity check run

  • -
  • main progress: shows training + validation progress combined. It also accounts for multiple validation runs during training when val_check_interval is used.

  • -
  • validation progress: only visible during validation; shows total progress over all validation datasets.

  • -
  • test progress: only active when testing; shows total progress over all test datasets.

  • -
-

For infinite datasets, the progress bar never ends.

-

You can update refresh_rate (rate (number of batches) at which the progress bar gets updated) for TQDMProgressBar by:

-
from pytorch_lightning.callbacks import TQDMProgressBar
-
-trainer = Trainer(callbacks=[TQDMProgressBar(refresh_rate=10)])
-
-
-

If you want to customize the default TQDMProgressBar used by Lightning, you can override -specific methods of the callback class and pass your custom implementation to the Trainer.

-
class LitProgressBar(TQDMProgressBar):
-    def init_validation_tqdm(self):
-        bar = super().init_validation_tqdm()
-        bar.set_description("running validation...")
-        return bar
-
-
-trainer = Trainer(callbacks=[LitProgressBar()])
-
-
-
-

See also

- -
-
-
-
-

RichProgressBar

-

Rich is a Python library for rich text and beautiful formatting in the terminal. -To use the RichProgressBar as your progress bar, first install the package:

-
pip install rich
-
-
-

Then configure the callback and pass it to the Trainer:

-
from pytorch_lightning.callbacks import RichProgressBar
-
-trainer = Trainer(callbacks=[RichProgressBar()])
-
-
-

Customize the theme for your RichProgressBar like this:

-
from pytorch_lightning.callbacks import RichProgressBar
-from pytorch_lightning.callbacks.progress.rich_progress import RichProgressBarTheme
-
-# create your own theme!
-progress_bar = RichProgressBar(
-    theme=RichProgressBarTheme(
-        description="green_yellow",
-        progress_bar="green1",
-        progress_bar_finished="green1",
-        progress_bar_pulse="#6206E0",
-        batch_progress="green_yellow",
-        time="grey82",
-        processing_speed="grey82",
-        metrics="grey82",
-    )
-)
-
-trainer = Trainer(callbacks=progress_bar)
-
-
-

You can customize the components used within RichProgressBar with ease by overriding the -configure_columns() method.

-
from rich.progress import TextColumn
-
-custom_column = TextColumn("[progress.description]Custom Rich Progress Bar!")
-
-
-class CustomRichProgressBar(RichProgressBar):
-    def configure_columns(self, trainer):
-        return [custom_column]
-
-
-progress_bar = CustomRichProgressBar()
-
-
-

If you wish for a new progress bar to be displayed at the end of every epoch, you should enable -RichProgressBar.leave by passing True:

-
from pytorch_lightning.callbacks import RichProgressBar
-
-trainer = Trainer(callbacks=[RichProgressBar(leave=True)])
-
-
-
-

See also

-
    -
  • RichProgressBar docs.

  • -
  • RichModelSummary docs to customize the model summary table.

  • -
  • Rich library.

  • -
-
-
-

Note

-

Progress bar is automatically enabled with the Trainer, and to disable it, one should do this:

-
trainer = Trainer(enable_progress_bar=False)
-
-
-
-
-
- - -
- -
-
- - - - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/common/remote_fs.html b/docs/common/remote_fs.html deleted file mode 100644 index a4ab5c6..0000000 --- a/docs/common/remote_fs.html +++ /dev/null @@ -1,739 +0,0 @@ - - - - - - - - - - - - - - Remote Filesystems — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Remote Filesystems
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Remote Filesystems

-

PyTorch Lightning enables working with data from a variety of filesystems, including local filesystems and several cloud storage providers such as -S3 on AWS, GCS on Google Cloud, -or ADL on Azure.

-

This applies to saving and loading checkpoints, as well as to logging. -Working with different filesystems can be accomplished by prepending a protocol like “s3://” to file paths for writing and reading data.

-
# `default_root_dir` is the default path used for logs and checkpoints
-trainer = Trainer(default_root_dir="s3://my_bucket/data/")
-trainer.fit(model)
-
-
-

You could pass custom paths to loggers for logging data.

-
from pytorch_lightning.loggers import TensorBoardLogger
-
-logger = TensorBoardLogger(save_dir="s3://my_bucket/logs/")
-
-trainer = Trainer(logger=logger)
-trainer.fit(model)
-
-
-

Additionally, you could also resume training with a checkpoint stored at a remote filesystem.

-
trainer = Trainer(default_root_dir=tmpdir, max_steps=3)
-trainer.fit(model, ckpt_path="s3://my_bucket/ckpts/classifier.ckpt")
-
-
-

PyTorch Lightning uses fsspec internally to handle all filesystem operations.

-

The most common filesystems supported by Lightning are:

-
    -
  • Local filesystem: file:// - It’s the default and doesn’t need any protocol to be used. It’s installed by default in Lightning.

  • -
  • Amazon S3: s3:// - Amazon S3 remote binary store, using the library s3fs. Run pip install fsspec[s3] to install it.

  • -
  • Google Cloud Storage: gcs:// or gs:// - Google Cloud Storage, using gcsfs. Run pip install fsspec[gcs] to install it.

  • -
  • Microsoft Azure Storage: adl://, abfs:// or az:// - Microsoft Azure Storage, using adlfs. Run pip install fsspec[adl] to install it.

  • -
  • Hadoop File System: hdfs:// - Hadoop Distributed File System. This uses PyArrow as the backend. Run pip install fsspec[hdfs] to install it.

  • -
-

You could learn more about the available filesystems with:

-
from fsspec.registry import known_implementations
-
-print(known_implementations)
-
-
-

You could also look into CheckpointIO Plugin for more details on how to customize saving and loading checkpoints.

-
- - -
- -
-
- - - - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- -
-
- -
-
-
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/common/trainer.html b/docs/common/trainer.html deleted file mode 100644 index 105919f..0000000 --- a/docs/common/trainer.html +++ /dev/null @@ -1,2689 +0,0 @@ - - - - - - - - - - - - - - Trainer — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- - - - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Trainer

-

Once you’ve organized your PyTorch code into a LightningModule, -the Trainer automates everything else.

-
-

-
-

This abstraction achieves the following:

-
    -
  1. You maintain control over all aspects via PyTorch code without an added abstraction.

  2. -
  3. The trainer uses best practices embedded by contributors and users -from top AI labs such as Facebook AI Research, NYU, MIT, Stanford, etc…

  4. -
  5. The trainer allows overriding any key part that you don’t want automated.

  6. -
-
-

-
-
-
-

Basic use

-

This is the basic use of the trainer:

-
model = MyLightningModule()
-
-trainer = Trainer()
-trainer.fit(model, train_dataloader, val_dataloader)
-
-
-
-
-
-

Under the hood

-

Under the hood, the Lightning Trainer handles the training loop details for you. Some examples include:

-
    -
  • Automatically enabling/disabling grads

  • -
  • Running the training, validation and test dataloaders

  • -
  • Calling the Callbacks at the appropriate times

  • -
  • Putting batches and computations on the correct devices

  • -
-

Here’s the pseudocode for what the trainer does under the hood (showing the train loop only)

-
# put model in train mode
-model.train()
-torch.set_grad_enabled(True)
-
-losses = []
-for batch in train_dataloader:
-    # calls hooks like this one
-    on_train_batch_start()
-
-    # train step
-    loss = training_step(batch)
-
-    # clear gradients
-    optimizer.zero_grad()
-
-    # backward
-    loss.backward()
-
-    # update parameters
-    optimizer.step()
-
-    losses.append(loss)
-
-
-
-
-
-

Trainer in Python scripts

-

In Python scripts, it’s recommended you use a main function to call the Trainer.

-
from argparse import ArgumentParser
-
-
-def main(hparams):
-    model = LightningModule()
-    trainer = Trainer(accelerator=hparams.accelerator, devices=hparams.devices)
-    trainer.fit(model)
-
-
-if __name__ == "__main__":
-    parser = ArgumentParser()
-    parser.add_argument("--accelerator", default=None)
-    parser.add_argument("--devices", default=None)
-    args = parser.parse_args()
-
-    main(args)
-
-
-

So you can run it like so:

-
python main.py --accelerator 'gpu' --devices 2
-
-
-
-

Note

-

Pro-tip: You don’t need to define all flags manually. Lightning can add them automatically

-
-
from argparse import ArgumentParser
-
-
-def main(args):
-    model = LightningModule()
-    trainer = Trainer.from_argparse_args(args)
-    trainer.fit(model)
-
-
-if __name__ == "__main__":
-    parser = ArgumentParser()
-    parser = Trainer.add_argparse_args(parser)
-    args = parser.parse_args()
-
-    main(args)
-
-
-

So you can run it like so:

-
python main.py --accelerator 'gpu' --devices 2 --max_steps 10 --limit_train_batches 10 --any_trainer_arg x
-
-
-
-

Note

-

If you want to stop a training run early, you can press “Ctrl + C” on your keyboard. -The trainer will catch the KeyboardInterrupt and attempt a graceful shutdown, including -running accelerator callback on_train_end to clean up memory. The trainer object will also set -an attribute interrupted to True in such cases. If you have a callback which shuts down compute -resources, for example, you can conditionally run the shutdown logic for only uninterrupted runs.

-
-
-
-
-

Validation

-

You can perform an evaluation epoch over the validation set, outside of the training loop, -using validate(). This might be -useful if you want to collect new metrics from a model right at its initialization -or after it has already been trained.

-
trainer.validate(dataloaders=val_dataloaders)
-
-
-
-
-
-

Testing

-

Once you’re done training, feel free to run the test set! -(Only right before publishing your paper or pushing to production)

-
trainer.test(dataloaders=test_dataloaders)
-
-
-
-
-
-

Reproducibility

-

To ensure full reproducibility from run to run you need to set seeds for pseudo-random generators, -and set the deterministic flag in the Trainer.

-

Example:

-
from pytorch_lightning import Trainer, seed_everything
-
-seed_everything(42, workers=True)
-# sets seeds for numpy, torch and python.random.
-model = Model()
-trainer = Trainer(deterministic=True)
-
-
-

By setting workers=True in seed_everything(), Lightning derives -unique seeds across all dataloader workers and processes for torch, numpy and stdlib -random number generators. When turned on, it ensures that e.g. data augmentations are not repeated across workers.

-
-
-
-

Trainer flags

-
-

accelerator

-

Supports passing different accelerator types ("cpu", "gpu", "tpu", "ipu", "auto") -as well as custom accelerator instances.

-
# CPU accelerator
-trainer = Trainer(accelerator="cpu")
-
-# Training with GPU Accelerator using 2 GPUs
-trainer = Trainer(devices=2, accelerator="gpu")
-
-# Training with TPU Accelerator using 8 tpu cores
-trainer = Trainer(devices=8, accelerator="tpu")
-
-# Training with GPU Accelerator using the DistributedDataParallel strategy
-trainer = Trainer(devices=4, accelerator="gpu", strategy="ddp")
-
-
-
-

Note

-

The "auto" option recognizes the machine you are on, and selects the respective Accelerator.

-
-
# If your machine has GPUs, it will use the GPU Accelerator for training
-trainer = Trainer(devices=2, accelerator="auto")
-
-
-

You can also modify hardware behavior by subclassing an existing accelerator to adjust for your needs.

-

Example:

-
class MyOwnAcc(CPUAccelerator):
-    ...
-
-Trainer(accelerator=MyOwnAcc())
-
-
-
-

Note

-

If the devices flag is not defined, it will assume devices to be "auto" and fetch the auto_device_count -from the accelerator.

-
# This is part of the built-in `GPUAccelerator`
-class GPUAccelerator(Accelerator):
-    """Accelerator for GPU devices."""
-
-    @staticmethod
-    def auto_device_count() -> int:
-        """Get the devices when set to auto."""
-        return torch.cuda.device_count()
-
-
-# Training with GPU Accelerator using total number of gpus available on the system
-Trainer(accelerator="gpu")
-
-
-
-
-

Warning

-

Passing training strategies (e.g., "ddp") to accelerator has been deprecated in v1.5.0 -and will be removed in v1.7.0. Please use the strategy argument instead.

-
-
-
-

accumulate_grad_batches

-
-

-
-

Accumulates grads every k batches or as set up in the dict. -Trainer also calls optimizer.step() for the last indivisible step number.

-
# default used by the Trainer (no accumulation)
-trainer = Trainer(accumulate_grad_batches=1)
-
-
-

Example:

-
# accumulate every 4 batches (effective batch size is batch*4)
-trainer = Trainer(accumulate_grad_batches=4)
-
-# no accumulation for epochs 1-4. accumulate 3 for epochs 5-10. accumulate 20 after that
-trainer = Trainer(accumulate_grad_batches={5: 3, 10: 20})
-
-
-
-
-

amp_backend

-
-

-
-

Use PyTorch AMP (‘native’), or NVIDIA apex (‘apex’).

-
# using PyTorch built-in AMP, default used by the Trainer
-trainer = Trainer(amp_backend="native")
-
-# using NVIDIA Apex
-trainer = Trainer(amp_backend="apex")
-
-
-
-
-

amp_level

-
-

-
-

The optimization level to use (O1, O2, etc…) -for 16-bit GPU precision (using NVIDIA apex under the hood).

-

Check the NVIDIA apex docs for the available levels.

-

Example:

-
# default used by the Trainer
-trainer = Trainer(amp_level='O2')
-
-
-
-
-

auto_scale_batch_size

-
-

-
-

Automatically tries to find the largest batch size that fits into memory, -before any training.

-
# default used by the Trainer (no scaling of batch size)
-trainer = Trainer(auto_scale_batch_size=None)
-
-# run batch size scaling, result overrides hparams.batch_size
-trainer = Trainer(auto_scale_batch_size="binsearch")
-
-# call tune to find the batch size
-trainer.tune(model)
-
-
-
-
-

auto_select_gpus

-
-

-
-

If enabled and devices is an integer, pick available GPUs automatically. -This is especially useful when GPUs are configured to be in “exclusive mode”, -such that only one process at a time can access them.

-

Example:

-
# no auto selection (picks first 2 GPUs on system, may fail if other process is occupying)
-trainer = Trainer(accelerator="gpu", devices=2, auto_select_gpus=False)
-
-# enable auto selection (will find two available GPUs on system)
-trainer = Trainer(accelerator="gpu", devices=2, auto_select_gpus=True)
-
-# specifies all GPUs regardless of its availability
-Trainer(accelerator="gpu", devices=-1, auto_select_gpus=False)
-
-# specifies all available GPUs (if only one GPU is not occupied, uses one gpu)
-Trainer(accelerator="gpu", devices=-1, auto_select_gpus=True)
-
-
-
-
-

auto_lr_find

-
-

-
-

Runs a learning rate finder algorithm (see this paper) -when calling trainer.tune(), to find optimal initial learning rate.

-
# default used by the Trainer (no learning rate finder)
-trainer = Trainer(auto_lr_find=False)
-
-
-

Example:

-
# run learning rate finder, results override hparams.learning_rate
-trainer = Trainer(auto_lr_find=True)
-
-# call tune to find the lr
-trainer.tune(model)
-
-
-

Example:

-
# run learning rate finder, results override hparams.my_lr_arg
-trainer = Trainer(auto_lr_find='my_lr_arg')
-
-# call tune to find the lr
-trainer.tune(model)
-
-
-
-

Note

-

See the learning rate finder guide.

-
-
-
-

benchmark

-
-

-
-

Defaults to True if deterministic is not set. -This flag sets the torch.backends.cudnn.benchmark flag. You can read more about its impact -here

-

This is likely to increase the speed of your system if your input sizes don’t change. However, if they do, then it -might make your system slower. The CUDNN auto-tuner will try to find the best algorithm for the hardware when a new -input size is encountered. Read more about it here.

-

Example:

-
# defaults to True if not deterministic (which is False by default)
-trainer = Trainer()
-
-# you can overwrite the value
-trainer = Trainer(benchmark=False)
-
-
-
-
-

deterministic

-
-

-
-

This flag sets the torch.backends.cudnn.deterministic flag. -Might make your system slower, but ensures reproducibility. -Also sets $HOROVOD_FUSION_THRESHOLD=0.

-

For more info check PyTorch docs.

-

Example:

-
# default used by the Trainer
-trainer = Trainer(deterministic=False)
-
-
-
-
-

callbacks

-
-

-
-

Add a list of Callback. Callbacks run sequentially in the order defined here -with the exception of ModelCheckpoint callbacks which run -after all others to ensure all states are saved to the checkpoints.

-
# a list of callbacks
-callbacks = [PrintCallback()]
-trainer = Trainer(callbacks=callbacks)
-
-
-

Example:

-
from pytorch_lightning.callbacks import Callback
-
-class PrintCallback(Callback):
-    def on_train_start(self, trainer, pl_module):
-        print("Training is started!")
-    def on_train_end(self, trainer, pl_module):
-        print("Training is done.")
-
-
-

Model-specific callbacks can also be added inside the LightningModule through -configure_callbacks(). -Callbacks returned in this hook will extend the list initially given to the Trainer argument, and replace -the trainer callbacks should there be two or more of the same type. -ModelCheckpoint callbacks always run last.

-
-
-

check_val_every_n_epoch

-
-

-
-

Check val every n train epochs.

-

Example:

-
# default used by the Trainer
-trainer = Trainer(check_val_every_n_epoch=1)
-
-# run val loop every 10 training epochs
-trainer = Trainer(check_val_every_n_epoch=10)
-
-
-
-
-

checkpoint_callback

-
-

Warning

-

checkpoint_callback has been deprecated in v1.5 and will be removed in v1.7. -To disable checkpointing, pass enable_checkpointing = False to the Trainer instead.

-
-
-
-

default_root_dir

-
-

-
-

Default path for logs and weights when no logger or -pytorch_lightning.callbacks.ModelCheckpoint callback passed. On -certain clusters you might want to separate where logs and checkpoints are -stored. If you don’t then use this argument for convenience. Paths can be local -paths or remote paths such as s3://bucket/path or ‘hdfs://path/’. Credentials -will need to be set up to use remote filepaths.

-
# default used by the Trainer
-trainer = Trainer(default_root_dir=os.getcwd())
-
-
-
-
-

devices

-

Number of devices to train on (int), which devices to train on (list or str), or "auto". -It will be mapped to either gpus, tpu_cores, num_processes or ipus, -based on the accelerator type ("cpu", "gpu", "tpu", "ipu", "auto").

-
# Training with CPU Accelerator using 2 processes
-trainer = Trainer(devices=2, accelerator="cpu")
-
-# Training with GPU Accelerator using GPUs 1 and 3
-trainer = Trainer(devices=[1, 3], accelerator="gpu")
-
-# Training with TPU Accelerator using 8 tpu cores
-trainer = Trainer(devices=8, accelerator="tpu")
-
-
-
-

Tip

-

The "auto" option recognizes the devices to train on, depending on the Accelerator being used.

-
-
# If your machine has GPUs, it will use all the available GPUs for training
-trainer = Trainer(devices="auto", accelerator="auto")
-
-# Training with CPU Accelerator using 1 process
-trainer = Trainer(devices="auto", accelerator="cpu")
-
-# Training with TPU Accelerator using 8 tpu cores
-trainer = Trainer(devices="auto", accelerator="tpu")
-
-# Training with IPU Accelerator using 4 ipus
-trainer = Trainer(devices="auto", accelerator="ipu")
-
-
-
-

Note

-

If the devices flag is not defined, it will assume devices to be "auto" and fetch the auto_device_count -from the accelerator.

-
# This is part of the built-in `GPUAccelerator`
-class GPUAccelerator(Accelerator):
-    """Accelerator for GPU devices."""
-
-    @staticmethod
-    def auto_device_count() -> int:
-        """Get the devices when set to auto."""
-        return torch.cuda.device_count()
-
-
-# Training with GPU Accelerator using total number of gpus available on the system
-Trainer(accelerator="gpu")
-
-
-
-
-
-

enable_checkpointing

-
-

-
-

By default Lightning saves a checkpoint for you in your current working directory, with the state of your last training epoch. -Checkpoints capture the exact value of all parameters used by a model. -To disable automatic checkpointing, set this to False.

-
# default used by Trainer, saves the most recent model to a single checkpoint after each epoch
-trainer = Trainer(enable_checkpointing=True)
-
-# turn off automatic checkpointing
-trainer = Trainer(enable_checkpointing=False)
-
-
-

You can override the default behavior by initializing the ModelCheckpoint -callback, and adding it to the callbacks list. -See Saving and Loading Checkpoints for how to customize checkpointing.

-
from pytorch_lightning.callbacks import ModelCheckpoint
-
-# Init ModelCheckpoint callback, monitoring 'val_loss'
-checkpoint_callback = ModelCheckpoint(monitor="val_loss")
-
-# Add your callback to the callbacks list
-trainer = Trainer(callbacks=[checkpoint_callback])
-
-
-
-
-

fast_dev_run

-
-

-
-

Runs n batch(es) of train, val and test if set to n (int), or 1 batch if set to True, -to find any bugs (i.e. a sort of unit test).

-

Under the hood the pseudocode looks like this when running fast_dev_run with a single batch:

-
# loading
-__init__()
-prepare_data
-
-# test training step
-training_batch = next(train_dataloader)
-training_step(training_batch)
-
-# test val step
-val_batch = next(val_dataloader)
-out = validation_step(val_batch)
-validation_epoch_end([out])
-
-
-
# default used by the Trainer
-trainer = Trainer(fast_dev_run=False)
-
-# runs 1 train, val, test batch and program ends
-trainer = Trainer(fast_dev_run=True)
-
-# runs 7 train, val, test batches and program ends
-trainer = Trainer(fast_dev_run=7)
-
-
-
-

Note

-

This argument is a bit different from limit_train/val/test_batches. Setting this argument will -disable tuner, checkpoint callbacks, early stopping callbacks, loggers and logger callbacks like -LearningRateLogger and runs for only 1 epoch. This must be used only for debugging purposes. -limit_train/val/test_batches only limits the number of batches and won’t disable anything.

-
-
-
-

flush_logs_every_n_steps

-
-

Warning

-

flush_logs_every_n_steps has been deprecated in v1.5 and will be removed in v1.7. -Please configure flushing directly in the logger instead.

-
-
-

-
-

Writes logs to disk this often.

-
# default used by the Trainer
-trainer = Trainer(flush_logs_every_n_steps=100)
-
-
-
-
See Also:
-
-
-
-
-

gpus

-
-

Warning

-

gpus=x has been deprecated in v1.7 and will be removed in v2.0. -Please use accelerator='gpu' and devices=x instead.

-
-
-

-
-
    -
  • Number of GPUs to train on (int)

  • -
  • or which GPUs to train on (list)

  • -
  • can handle strings

  • -
-
# default used by the Trainer (ie: train on CPU)
-trainer = Trainer(gpus=None)
-
-# equivalent
-trainer = Trainer(gpus=0)
-
-
-

Example:

-
# int: train on 2 gpus
-trainer = Trainer(gpus=2)
-
-# list: train on GPUs 1, 4 (by bus ordering)
-trainer = Trainer(gpus=[1, 4])
-trainer = Trainer(gpus='1, 4') # equivalent
-
-# -1: train on all gpus
-trainer = Trainer(gpus=-1)
-trainer = Trainer(gpus='-1') # equivalent
-
-# combine with num_nodes to train on multiple GPUs across nodes
-# uses 8 gpus in total
-trainer = Trainer(gpus=2, num_nodes=4)
-
-# train only on GPUs 1 and 4 across nodes
-trainer = Trainer(gpus=[1, 4], num_nodes=4)
-
-
-
-
See Also:
-
-
-
-
-

gradient_clip_val

-
-

-
-

Gradient clipping value

-
    -
  • 0 means don’t clip.

  • -
-
# default used by the Trainer
-trainer = Trainer(gradient_clip_val=0.0)
-
-
-
-
-

limit_train_batches

-
-

-
-

How much of training dataset to check. -Useful when debugging or testing something that happens at the end of an epoch.

-
# default used by the Trainer
-trainer = Trainer(limit_train_batches=1.0)
-
-
-

Example:

-
# default used by the Trainer
-trainer = Trainer(limit_train_batches=1.0)
-
-# run through only 25% of the training set each epoch
-trainer = Trainer(limit_train_batches=0.25)
-
-# run through only 10 batches of the training set each epoch
-trainer = Trainer(limit_train_batches=10)
-
-
-
-
-

limit_test_batches

-
-

-
-

How much of test dataset to check.

-
# default used by the Trainer
-trainer = Trainer(limit_test_batches=1.0)
-
-# run through only 25% of the test set each epoch
-trainer = Trainer(limit_test_batches=0.25)
-
-# run for only 10 batches
-trainer = Trainer(limit_test_batches=10)
-
-
-

In the case of multiple test dataloaders, the limit applies to each dataloader individually.

-
-
-

limit_val_batches

-
-

-
-

How much of validation dataset to check. -Useful when debugging or testing something that happens at the end of an epoch.

-
# default used by the Trainer
-trainer = Trainer(limit_val_batches=1.0)
-
-# run through only 25% of the validation set each epoch
-trainer = Trainer(limit_val_batches=0.25)
-
-# run for only 10 batches
-trainer = Trainer(limit_val_batches=10)
-
-
-

In the case of multiple validation dataloaders, the limit applies to each dataloader individually.

-
-
-

log_every_n_steps

-
-

-
-

How often to add logging rows (does not write to disk)

-
# default used by the Trainer
-trainer = Trainer(log_every_n_steps=50)
-
-
-
-
See Also:
-
-
-
-
-

logger

-
-

-
-

Logger (or iterable collection of loggers) for experiment tracking. A True value uses the default TensorBoardLogger shown below. False will disable logging.

-
from pytorch_lightning.loggers import TensorBoardLogger
-
-# default logger used by trainer
-logger = TensorBoardLogger(save_dir=os.getcwd(), version=1, name="lightning_logs")
-Trainer(logger=logger)
-
-
-
-
-

max_epochs

-
-

-
-

Stop training once this number of epochs is reached

-
# default used by the Trainer
-trainer = Trainer(max_epochs=1000)
-
-
-

If both max_epochs and max_steps aren’t specified, max_epochs will default to 1000. -To enable infinite training, set max_epochs = -1.

-
-
-

min_epochs

-
-

-
-

Force training for at least these many epochs

-
# default used by the Trainer
-trainer = Trainer(min_epochs=1)
-
-
-
-
-

max_steps

-
-

-
-

Stop training after this number of global steps. -Training will stop when either max_steps or max_epochs is reached (whichever comes first).

-
# Default (disabled)
-trainer = Trainer(max_steps=None)
-
-# Stop after 100 steps
-trainer = Trainer(max_steps=100)
-
-
-

If max_steps is not specified, max_epochs will be used instead (and max_epochs defaults to -1000 if max_epochs is not specified). To disable this default, set max_steps = -1.

-
-
-

min_steps

-
-

-
-

Force training for at least this number of global steps. -The Trainer will train the model for at least min_steps or min_epochs (whichever is reached later).

-
# Default (disabled)
-trainer = Trainer(min_steps=None)
-
-# Run at least for 100 steps (disable min_epochs)
-trainer = Trainer(min_steps=100, min_epochs=0)
-
-
-
-
-

max_time

-

Set the maximum amount of time for training. Training will get interrupted mid-epoch. -For customizable options use the Timer callback.

-
# Default (disabled)
-trainer = Trainer(max_time=None)
-
-# Stop after 12 hours of training or when reaching 10 epochs (string)
-trainer = Trainer(max_time="00:12:00:00", max_epochs=10)
-
-# Stop after 1 day and 5 hours (dict)
-trainer = Trainer(max_time={"days": 1, "hours": 5})
-
-
-

In case max_time is used together with min_steps or min_epochs, the min_* requirement -always has precedence.

-
-
-

num_nodes

-
-

-
-

Number of GPU nodes for distributed training.

-
# default used by the Trainer
-trainer = Trainer(num_nodes=1)
-
-# to train on 8 nodes
-trainer = Trainer(num_nodes=8)
-
-
-
-
-

num_processes

-
-

Warning

-

num_processes=x has been deprecated in v1.7 and will be removed in v2.0. -Please use accelerator='cpu' and devices=x instead.

-
-
-

-
-

Number of processes to train with. Automatically set to the number of GPUs -when using strategy="ddp". Set to a number greater than 1 when -using accelerator="cpu" and strategy="ddp" to mimic distributed training on a -machine without GPUs. This is useful for debugging, but will not provide -any speedup, since single-process Torch already makes efficient use of multiple -CPUs. While it would typically spawn subprocesses for training, setting -num_nodes > 1 and keeping num_processes = 1 runs training in the main -process.

-
# Simulate DDP for debugging on your GPU-less laptop
-trainer = Trainer(accelerator="cpu", strategy="ddp", num_processes=2)
-
-
-
-
-

num_sanity_val_steps

-
-

-
-

Sanity check runs n batches of val before starting the training routine. -This catches any bugs in your validation without having to wait for the first validation check. -The Trainer uses 2 steps by default. Turn it off or modify it here.

-
# default used by the Trainer
-trainer = Trainer(num_sanity_val_steps=2)
-
-# turn it off
-trainer = Trainer(num_sanity_val_steps=0)
-
-# check all validation data
-trainer = Trainer(num_sanity_val_steps=-1)
-
-
-

This option will reset the validation dataloader unless num_sanity_val_steps=0.

-
-
-

overfit_batches

-
-

-
-

Uses this much data of the training & validation set. -If the training & validation dataloaders have shuffle=True, Lightning will automatically disable it.

-

Useful for quickly debugging or trying to overfit on purpose.

-
# default used by the Trainer
-trainer = Trainer(overfit_batches=0.0)
-
-# use only 1% of the train & val set
-trainer = Trainer(overfit_batches=0.01)
-
-# overfit on 10 of the same batches
-trainer = Trainer(overfit_batches=10)
-
-
-
-
-

plugins

-
-

-
-

Plugins allow you to connect arbitrary backends, precision libraries, clusters etc. For example:

- -

To define your own behavior, subclass the relevant class and pass it in. Here’s an example linking up your own -ClusterEnvironment.

-
from pytorch_lightning.plugins.environments import ClusterEnvironment
-
-
-class MyCluster(ClusterEnvironment):
-    def main_address(self):
-        return your_main_address
-
-    def main_port(self):
-        return your_main_port
-
-    def world_size(self):
-        return the_world_size
-
-
-trainer = Trainer(plugins=[MyCluster()], ...)
-
-
-
-
-

precision

-
-

-
-

Lightning supports either double (64), float (32), bfloat16 (bf16), or half (16) precision training.

-

Half precision, or mixed precision, is the combined use of 32 and 16 bit floating points to reduce memory footprint during model training. This can result in improved performance, achieving +3X speedups on modern GPUs.

-
# default used by the Trainer
-trainer = Trainer(precision=32)
-
-# 16-bit precision
-trainer = Trainer(precision=16, accelerator="gpu", devices=1)  # works only on CUDA
-
-# bfloat16 precision
-trainer = Trainer(precision="bf16")
-
-# 64-bit precision
-trainer = Trainer(precision=64)
-
-
-
-

Note

-

When running on TPUs, torch.bfloat16 will be used but tensor printing will still show torch.float32.

-
- -
-
-

process_position

-
-

Warning

-

process_position has been deprecated in v1.5 and will be removed in v1.7. -Please pass TQDMProgressBar with process_position -directly to the Trainer’s callbacks argument instead.

-
-
-

-
-

Orders the progress bar. Useful when running multiple trainers on the same node.

-
# default used by the Trainer
-trainer = Trainer(process_position=0)
-
-
-
-

Note

-

This argument is ignored if a custom callback is passed to callbacks.

-
-
-
-

profiler

-
-

-
-

To profile individual steps during training and assist in identifying bottlenecks.

-

See the profiler documentation for more details.

-
from pytorch_lightning.profiler import SimpleProfiler, AdvancedProfiler
-
-# default used by the Trainer
-trainer = Trainer(profiler=None)
-
-# to profile standard training events, equivalent to `profiler=SimpleProfiler()`
-trainer = Trainer(profiler="simple")
-
-# advanced profiler for function-level stats, equivalent to `profiler=AdvancedProfiler()`
-trainer = Trainer(profiler="advanced")
-
-
-
-
-

enable_progress_bar

-

Whether to enable or disable the progress bar. Defaults to True.

-
# default used by the Trainer
-trainer = Trainer(enable_progress_bar=True)
-
-# disable progress bar
-trainer = Trainer(enable_progress_bar=False)
-
-
-
-
-

reload_dataloaders_every_n_epochs

-
-

-
-

Set to a positive integer to reload dataloaders every n epochs.

-
# if 0 (default)
-train_loader = model.train_dataloader()
-for epoch in epochs:
-    for batch in train_loader:
-        ...
-
-# if a positive integer
-for epoch in epochs:
-    if not epoch % reload_dataloaders_every_n_epochs:
-        train_loader = model.train_dataloader()
-    for batch in train_loader:
-        ...
-
-
-
-
-

replace_sampler_ddp

-
-

-
-

Enables auto adding of DistributedSampler. In PyTorch, you must use it in -distributed settings such as TPUs or multi-node. The sampler makes sure each GPU sees the appropriate part of your data. -By default it will add shuffle=True for train sampler and shuffle=False for val/test sampler. -If you want to customize it, you can set replace_sampler_ddp=False and add your own distributed sampler. -If replace_sampler_ddp=True and a distributed sampler was already added, -Lightning will not replace the existing one.

-
# default used by the Trainer
-trainer = Trainer(replace_sampler_ddp=True)
-
-
-

By setting to False, you have to add your own distributed sampler:

-
# in your LightningModule or LightningDataModule
-def train_dataloader(self):
-    # default used by the Trainer
-    sampler = torch.utils.data.distributed.DistributedSampler(dataset, shuffle=True)
-    dataloader = DataLoader(dataset, batch_size=32, sampler=sampler)
-    return dataloader
-
-
-
-

Note

-

For iterable datasets, we don’t do this automatically.

-
-
-
-

resume_from_checkpoint

-
-

Warning

-

resume_from_checkpoint is deprecated in v1.5 and will be removed in v2.0. -Please pass trainer.fit(ckpt_path="some/path/to/my_checkpoint.ckpt") instead.

-
-
-

-
-

To resume training from a specific checkpoint pass in the path here. If resuming from a mid-epoch -checkpoint, training will start from the beginning of the next epoch.

-
# default used by the Trainer
-trainer = Trainer(resume_from_checkpoint=None)
-
-# resume from a specific checkpoint
-trainer = Trainer(resume_from_checkpoint="some/path/to/my_checkpoint.ckpt")
-
-
-
-
-

strategy

-

Supports passing different training strategies with aliases (ddp, ddp_spawn, etc) as well as custom strategies.

-
# Training with the DistributedDataParallel strategy on 4 GPUs
-trainer = Trainer(strategy="ddp", accelerator="gpu", devices=4)
-
-# Training with the DDP Spawn strategy using 4 cpu processes
-trainer = Trainer(strategy="ddp_spawn", accelerator="cpu", devices=4)
-
-
-
-

Note

-

Additionally, you can pass your custom strategy to the strategy argument.

-
-
from pytorch_lightning.strategies import DDPStrategy
-
-
-class CustomDDPStrategy(DDPStrategy):
-    def configure_ddp(self):
-        self._model = MyCustomDistributedDataParallel(
-            self.model,
-            device_ids=...,
-        )
-
-
-trainer = Trainer(strategy=CustomDDPStrategy(), accelerator="gpu", devices=2)
-
-
-
-
See Also:
-
-
-
-
-

sync_batchnorm

-
-

-
-

Enable synchronization between batchnorm layers across all GPUs.

-
trainer = Trainer(sync_batchnorm=True)
-
-
-
-
-

track_grad_norm

-
-

-
-
    -
  • no tracking (-1)

  • -
  • Otherwise tracks that norm (2 for 2-norm)

  • -
-
# default used by the Trainer
-trainer = Trainer(track_grad_norm=-1)
-
-# track the 2-norm
-trainer = Trainer(track_grad_norm=2)
-
-
-
-
-

tpu_cores

-
-

Warning

-

tpu_cores=x has been deprecated in v1.7 and will be removed in v2.0. -Please use accelerator='tpu' and devices=x instead.

-
-
-

-
-
    -
  • How many TPU cores to train on (1 or 8).

  • -
  • Which TPU core to train on [1-8]

  • -
-

A single TPU v2 or v3 has 8 cores. A TPU pod has -up to 2048 cores. A slice of a POD means you get as many cores -as you request.

-

Your effective batch size is batch_size * total tpu cores.

-

This parameter can be either 1 or 8.

-

Example:

-
# your_trainer_file.py
-
-# default used by the Trainer (ie: train on CPU)
-trainer = Trainer(tpu_cores=None)
-
-# int: train on a single core
-trainer = Trainer(tpu_cores=1)
-
-# list: train on a single selected core
-trainer = Trainer(tpu_cores=[2])
-
-# int: train on all 8 cores
-trainer = Trainer(tpu_cores=8)
-
-# for 8+ cores must submit via xla script with
-# a max of 8 cores specified. The XLA script
-# will duplicate script onto each TPU in the POD
-trainer = Trainer(tpu_cores=8)
-
-
-

To train on more than 8 cores (ie: a POD), -submit this script using the xla_dist script.

-

Example:

-
python -m torch_xla.distributed.xla_dist
---tpu=$TPU_POD_NAME
---conda-env=torch-xla-nightly
---env=XLA_USE_BF16=1
--- python your_trainer_file.py
-
-
-
-
-

val_check_interval

-
-

-
-

How often within one training epoch to check the validation set. -Can specify as float or int.

-
    -
  • pass a float in the range [0.0, 1.0] to check after a fraction of the training epoch.

  • -
  • pass an int to check after a fixed number of training batches.

  • -
-
# default used by the Trainer
-trainer = Trainer(val_check_interval=1.0)
-
-# check validation set 4 times during a training epoch
-trainer = Trainer(val_check_interval=0.25)
-
-# check validation set every 1000 training batches
-# use this when using iterableDataset and your dataset has no length
-# (ie: production cases with streaming data)
-trainer = Trainer(val_check_interval=1000)
-
-
-
# Here is the computation to estimate the total number of batches seen within an epoch.
-
-# Find the total number of train batches
-total_train_batches = total_train_samples // (train_batch_size * world_size)
-
-# Compute how many times we will call validation during the training loop
-val_check_batch = max(1, int(total_train_batches * val_check_interval))
-val_checks_per_epoch = total_train_batches / val_check_batch
-
-# Find the total number of validation batches
-total_val_batches = total_val_samples // (val_batch_size * world_size)
-
-# Total number of batches run
-total_fit_batches = total_train_batches + total_val_batches
-
-
-
-
-

weights_save_path

-
-

Warning

-

weights_save_path has been deprecated in v1.6 and will be removed in v1.8. Please pass -dirpath directly to the ModelCheckpoint -callback.

-
-
-

-
-

Directory of where to save weights if specified.

-
# default used by the Trainer
-trainer = Trainer(weights_save_path=os.getcwd())
-
-# save to your custom path
-trainer = Trainer(weights_save_path="my/path")
-
-
-

Example:

-
# if checkpoint callback used, then overrides the weights path
-# **NOTE: this saves weights to some/path NOT my/path
-checkpoint = ModelCheckpoint(dirpath='some/path')
-trainer = Trainer(
-    callbacks=[checkpoint],
-    weights_save_path='my/path'
-)
-
-
-
-
-

weights_summary

-
-

Warning

-

weights_summary is deprecated in v1.5 and will be removed in v1.7. Please pass ModelSummary -directly to the Trainer’s callbacks argument instead. To disable the model summary, -pass enable_model_summary = False to the Trainer.

-
-
-

-
-

Prints a summary of the weights when training begins. -Options: ‘full’, ‘top’, None.

-
# default used by the Trainer (ie: print summary of top level modules)
-trainer = Trainer(weights_summary="top")
-
-# print full summary of all modules and submodules
-trainer = Trainer(weights_summary="full")
-
-# don't print a summary
-trainer = Trainer(weights_summary=None)
-
-
-
-
-

enable_model_summary

-

Whether to enable or disable the model summarization. Defaults to True.

-
# default used by the Trainer
-trainer = Trainer(enable_model_summary=True)
-
-# disable summarization
-trainer = Trainer(enable_model_summary=False)
-
-# enable custom summarization
-from pytorch_lightning.callbacks import ModelSummary
-
-trainer = Trainer(enable_model_summary=True, callbacks=[ModelSummary(max_depth=-1)])
-
-
-
-
-
-
-

Trainer class API

-
-

Methods

-
-

init

-
-
-Trainer.__init__(logger=True, checkpoint_callback=None, enable_checkpointing=True, callbacks=None, default_root_dir=None, gradient_clip_val=None, gradient_clip_algorithm=None, process_position=0, num_nodes=1, num_processes=None, devices=None, gpus=None, auto_select_gpus=False, tpu_cores=None, ipus=None, log_gpu_memory=None, progress_bar_refresh_rate=None, enable_progress_bar=True, overfit_batches=0.0, track_grad_norm=- 1, check_val_every_n_epoch=1, fast_dev_run=False, accumulate_grad_batches=None, max_epochs=None, min_epochs=None, max_steps=- 1, min_steps=None, max_time=None, limit_train_batches=None, limit_val_batches=None, limit_test_batches=None, limit_predict_batches=None, val_check_interval=None, flush_logs_every_n_steps=None, log_every_n_steps=50, accelerator=None, strategy=None, sync_batchnorm=False, precision=32, enable_model_summary=True, weights_summary='top', weights_save_path=None, num_sanity_val_steps=2, resume_from_checkpoint=None, profiler=None, benchmark=None, deterministic=False, reload_dataloaders_every_n_epochs=0, auto_lr_find=False, replace_sampler_ddp=True, detect_anomaly=False, auto_scale_batch_size=False, prepare_data_per_node=None, plugins=None, amp_backend='native', amp_level=None, move_metrics_to_cpu=False, multiple_trainloader_mode='max_size_cycle', stochastic_weight_avg=False, terminate_on_nan=None)[source]
-

Customize every aspect of training via flags.

-
-
Parameters
-
    -
  • accelerator (Union[str, Accelerator, None]) –

    Supports passing different accelerator types (“cpu”, “gpu”, “tpu”, “ipu”, “hpu”, “auto”) -as well as custom accelerator instances.

    -
    -

    Deprecated since version v1.5: Passing training strategies (e.g., ‘ddp’) to accelerator has been deprecated in v1.5.0 -and will be removed in v1.7.0. Please use the strategy argument instead.

    -
    -

  • -
  • accumulate_grad_batches (Union[int, Dict[int, int], None]) – Accumulates grads every k batches or as set up in the dict. -Default: None.

  • -
  • amp_backend (str) – The mixed precision backend to use (“native” or “apex”). -Default: 'native'.

  • -
  • amp_level (Optional[str]) – The optimization level to use (O1, O2, etc…). By default it will be set to “O2” -if amp_backend is set to “apex”.

  • -
  • auto_lr_find (Union[bool, str]) – If set to True, will make trainer.tune() run a learning rate finder, -trying to optimize initial learning for faster convergence. trainer.tune() method will -set the suggested learning rate in self.lr or self.learning_rate in the LightningModule. -To use a different key set a string instead of True with the key name. -Default: False.

  • -
  • auto_scale_batch_size (Union[str, bool]) – If set to True, will initially run a batch size -finder trying to find the largest batch size that fits into memory. -The result will be stored in self.batch_size in the LightningModule. -Additionally, can be set to either power that estimates the batch size through -a power search or binsearch that estimates the batch size through a binary search. -Default: False.

  • -
  • auto_select_gpus (bool) – If enabled and gpus or devices is an integer, pick available -gpus automatically. This is especially useful when -GPUs are configured to be in “exclusive mode”, such -that only one process at a time can access them. -Default: False.

  • -
  • benchmark (Optional[bool]) – Sets torch.backends.cudnn.benchmark. -Defaults to True if deterministic -is False. Overwrite to manually set a different value. Default: None.

  • -
  • callbacks (Union[List[Callback], Callback, None]) – Add a callback or list of callbacks. -Default: None.

  • -
  • checkpoint_callback (Optional[bool]) –

    If True, enable checkpointing. -Default: None.

    -
    -

    Deprecated since version v1.5: checkpoint_callback has been deprecated in v1.5 and will be removed in v1.7. -Please consider using enable_checkpointing instead.

    -
    -

  • -
  • enable_checkpointing (bool) – If True, enable checkpointing. -It will configure a default ModelCheckpoint callback if there is no user-defined ModelCheckpoint in -callbacks. -Default: True.

  • -
  • check_val_every_n_epoch (int) – Check val every n train epochs. -Default: 1.

  • -
  • default_root_dir (Optional[str]) – Default path for logs and weights when no logger/ckpt_callback passed. -Default: os.getcwd(). -Can be remote file paths such as s3://mybucket/path or ‘hdfs://path/’

  • -
  • detect_anomaly (bool) – Enable anomaly detection for the autograd engine. -Default: False.

  • -
  • deterministic (bool) – If True, sets whether PyTorch operations must use deterministic algorithms. -Default: False.

  • -
  • devices (Union[List[int], str, int, None]) – Will be mapped to either gpus, tpu_cores, num_processes or ipus, -based on the accelerator type.

  • -
  • fast_dev_run (Union[int, bool]) – Runs n if set to n (int) else 1 if set to True batch(es) -of train, val and test to find any bugs (ie: a sort of unit test). -Default: False.

  • -
  • flush_logs_every_n_steps (Optional[int]) –

    How often to flush logs to disk (defaults to every 100 steps).

    -
    -

    Deprecated since version v1.5: flush_logs_every_n_steps has been deprecated in v1.5 and will be removed in v1.7. -Please configure flushing directly in the logger instead.

    -
    -

  • -
  • gpus (Union[List[int], str, int, None]) – Number of GPUs to train on (int) or which GPUs to train on (list or str) applied per node -Default: None.

  • -
  • gradient_clip_val (Union[int, float, None]) – The value at which to clip gradients. Passing gradient_clip_val=None disables -gradient clipping. If using Automatic Mixed Precision (AMP), the gradients will be unscaled before. -Default: None.

  • -
  • gradient_clip_algorithm (Optional[str]) – The gradient clipping algorithm to use. Pass gradient_clip_algorithm="value" -to clip by value, and gradient_clip_algorithm="norm" to clip by norm. By default it will -be set to "norm".

  • -
  • limit_train_batches (Union[int, float, None]) – How much of training dataset to check (float = fraction, int = num_batches). -Default: 1.0.

  • -
  • limit_val_batches (Union[int, float, None]) – How much of validation dataset to check (float = fraction, int = num_batches). -Default: 1.0.

  • -
  • limit_test_batches (Union[int, float, None]) – How much of test dataset to check (float = fraction, int = num_batches). -Default: 1.0.

  • -
  • limit_predict_batches (Union[int, float, None]) – How much of prediction dataset to check (float = fraction, int = num_batches). -Default: 1.0.

  • -
  • logger (Union[LightningLoggerBase, Iterable[LightningLoggerBase], bool]) – Logger (or iterable collection of loggers) for experiment tracking. A True value uses -the default TensorBoardLogger. False will disable logging. If multiple loggers are -provided and the save_dir property of that logger is not set, local files (checkpoints, -profiler traces, etc.) are saved in default_root_dir rather than in the log_dir of any -of the individual loggers. -Default: True.

  • -
  • log_gpu_memory (Optional[str]) –

    None, ‘min_max’, ‘all’. Might slow performance.

    -
    -

    Deprecated since version v1.5: Deprecated in v1.5.0 and will be removed in v1.7.0 -Please use the DeviceStatsMonitor callback directly instead.

    -
    -

  • -
  • log_every_n_steps (int) – How often to log within steps. -Default: 50.

  • -
  • prepare_data_per_node (Optional[bool]) –

    If True, each LOCAL_RANK=0 will call prepare data. -Otherwise only NODE_RANK=0, LOCAL_RANK=0 will prepare data

    -
    -

    Deprecated since version v1.5: Deprecated in v1.5.0 and will be removed in v1.7.0 -Please set prepare_data_per_node in LightningDataModule and/or -LightningModule directly instead.

    -
    -

  • -
  • process_position (int) –

    Orders the progress bar when running multiple models on same machine.

    -
    -

    Deprecated since version v1.5: process_position has been deprecated in v1.5 and will be removed in v1.7. -Please pass TQDMProgressBar with process_position -directly to the Trainer’s callbacks argument instead.

    -
    -

  • -
  • progress_bar_refresh_rate (Optional[int]) –

    How often to refresh progress bar (in steps). Value 0 disables progress bar. -Ignored when a custom progress bar is passed to callbacks. Default: None, means -a suitable value will be chosen based on the environment (terminal, Google COLAB, etc.).

    -
    -

    Deprecated since version v1.5: progress_bar_refresh_rate has been deprecated in v1.5 and will be removed in v1.7. -Please pass TQDMProgressBar with refresh_rate -directly to the Trainer’s callbacks argument instead. To disable the progress bar, -pass enable_progress_bar = False to the Trainer.

    -
    -

  • -
  • enable_progress_bar (bool) – Whether to enable the progress bar by default. -Default: True.

  • -
  • profiler (Union[BaseProfiler, str, None]) – To profile individual steps during training and assist in identifying bottlenecks. -Default: None.

  • -
  • overfit_batches (Union[int, float]) – Overfit a fraction of training data (float) or a set number of batches (int). -Default: 0.0.

  • -
  • plugins (Union[Strategy, PrecisionPlugin, ClusterEnvironment, CheckpointIO, LayerSync, str, List[Union[Strategy, PrecisionPlugin, ClusterEnvironment, CheckpointIO, LayerSync, str]], None]) – Plugins allow modification of core behavior like ddp and amp, and enable custom lightning plugins. -Default: None.

  • -
  • precision (Union[int, str]) – Double precision (64), full precision (32), half precision (16) or bfloat16 precision (bf16). -Can be used on CPU, GPU, TPUs, HPUs or IPUs. -Default: 32.

  • -
  • max_epochs (Optional[int]) – Stop training once this number of epochs is reached. Disabled by default (None). -If both max_epochs and max_steps are not specified, defaults to max_epochs = 1000. -To enable infinite training, set max_epochs = -1.

  • -
  • min_epochs (Optional[int]) – Force training for at least this many epochs. Disabled by default (None).

  • -
  • max_steps (int) – Stop training after this number of steps. Disabled by default (-1). If max_steps = -1 -and max_epochs = None, will default to max_epochs = 1000. To enable infinite training, set -max_epochs to -1.

  • -
  • min_steps (Optional[int]) – Force training for at least this number of steps. Disabled by default (None).

  • -
  • max_time (Union[str, timedelta, Dict[str, int], None]) – Stop training after this amount of time has passed. Disabled by default (None). -The time duration can be specified in the format DD:HH:MM:SS (days, hours, minutes seconds), as a -datetime.timedelta, or a dictionary with keys that will be passed to -datetime.timedelta.

  • -
  • num_nodes (int) – Number of GPU nodes for distributed training. -Default: 1.

  • -
  • num_processes (Optional[int]) – Number of processes for distributed training with accelerator="cpu". -Default: 1.

  • -
  • num_sanity_val_steps (int) – Sanity check runs n validation batches before starting the training routine. -Set it to -1 to run all batches in all validation dataloaders. -Default: 2.

  • -
  • reload_dataloaders_every_n_epochs (int) – Set to a non-negative integer to reload dataloaders every n epochs. -Default: 0.

  • -
  • replace_sampler_ddp (bool) – Explicitly enables or disables sampler replacement. If not specified this -will be toggled automatically when DDP is used. By default it will add shuffle=True for -train sampler and shuffle=False for val/test sampler. If you want to customize it, -you can set replace_sampler_ddp=False and add your own distributed sampler.

  • -
  • resume_from_checkpoint (Union[str, Path, None]) –

    Path/URL of the checkpoint from which training is resumed. If there is -no checkpoint file at the path, an exception is raised. If resuming from mid-epoch checkpoint, -training will start from the beginning of the next epoch.

    -
    -

    Deprecated since version v1.5: resume_from_checkpoint is deprecated in v1.5 and will be removed in v2.0. -Please pass the path to Trainer.fit(..., ckpt_path=...) instead.

    -
    -

  • -
  • strategy (Union[str, Strategy, None]) – Supports different training strategies with aliases -as well as custom strategies. -Default: None.

  • -
  • sync_batchnorm (bool) – Synchronize batch norm layers between process groups/whole world. -Default: False.

  • -
  • terminate_on_nan (Optional[bool]) –

    If set to True, will terminate training (by raising a ValueError) at the -end of each training batch, if any of the parameters or the loss are NaN or +/-inf.

    -
    -

    Deprecated since version v1.5: Trainer argument terminate_on_nan was deprecated in v1.5 and will be removed in 1.7. -Please use detect_anomaly instead.

    -
    -

  • -
  • detect_anomaly – Enable anomaly detection for the autograd engine. -Default: False.

  • -
  • tpu_cores (Union[List[int], str, int, None]) – How many TPU cores to train on (1 or 8) / Single TPU to train on (1) -Default: None.

  • -
  • ipus (Optional[int]) – How many IPUs to train on. -Default: None.

  • -
  • track_grad_norm (Union[int, float, str]) – -1 no tracking. Otherwise tracks that p-norm. May be set to ‘inf’ infinity-norm. If using -Automatic Mixed Precision (AMP), the gradients will be unscaled before logging them. -Default: -1.

  • -
  • val_check_interval (Union[int, float, None]) – How often to check the validation set. Pass a float in the range [0.0, 1.0] to check -after a fraction of the training epoch. Pass an int to check after a fixed number of training -batches. -Default: 1.0.

  • -
  • enable_model_summary (bool) – Whether to enable model summarization by default. -Default: True.

  • -
  • weights_summary (Optional[str]) –

    Prints a summary of the weights when training begins.

    -
    -

    Deprecated since version v1.5: weights_summary has been deprecated in v1.5 and will be removed in v1.7. -To disable the summary, pass enable_model_summary = False to the Trainer. -To customize the summary, pass ModelSummary -directly to the Trainer’s callbacks argument.

    -
    -

  • -
  • weights_save_path (Optional[str]) –

    Where to save weights if specified. Will override default_root_dir -for checkpoints only. Use this if for whatever reason you need the checkpoints -stored in a different place than the logs written in default_root_dir. -Can be remote file paths such as s3://mybucket/path or ‘hdfs://path/’ -Defaults to default_root_dir.

    -
    -

    Deprecated since version v1.6: weights_save_path has been deprecated in v1.6 and will be removed in v1.8. Please pass -dirpath directly to the ModelCheckpoint -callback.

    -
    -

  • -
  • move_metrics_to_cpu (bool) – Whether to force internal logged metrics to be moved to cpu. -This can save some gpu memory, but can make training slower. Use with caution. -Default: False.

  • -
  • multiple_trainloader_mode (str) – How to loop over the datasets when there are multiple train loaders. -In ‘max_size_cycle’ mode, the trainer ends one epoch when the largest dataset is traversed, -and smaller datasets reload when running out of their data. In ‘min_size’ mode, all the datasets -reload when reaching the minimum length of datasets. -Default: "max_size_cycle".

  • -
  • stochastic_weight_avg (bool) –

    Whether to use Stochastic Weight Averaging (SWA). -Default: False.

    -
    -

    Deprecated since version v1.5: stochastic_weight_avg has been deprecated in v1.5 and will be removed in v1.7. -Please pass StochasticWeightAveraging -directly to the Trainer’s callbacks argument instead.

    -
    -

  • -
-
-
-
- -
-
-

fit

-
-
-Trainer.fit(model, train_dataloaders=None, val_dataloaders=None, datamodule=None, ckpt_path=None)[source]
-

Runs the full optimization routine.

-
-
Parameters
-
    -
  • model (LightningModule) – Model to fit.

  • -
  • train_dataloaders (Union[DataLoader, Sequence[DataLoader], Sequence[Sequence[DataLoader]], Sequence[Dict[str, DataLoader]], Dict[str, DataLoader], Dict[str, Dict[str, DataLoader]], Dict[str, Sequence[DataLoader]], LightningDataModule, None]) – A collection of torch.utils.data.DataLoader or a -LightningDataModule specifying training samples. -In the case of multiple dataloaders, please see this section.

  • -
  • val_dataloaders (Union[DataLoader, Sequence[DataLoader], None]) – A torch.utils.data.DataLoader or a sequence of them specifying validation samples.

  • -
  • ckpt_path (Optional[str]) – Path/URL of the checkpoint from which training is resumed. If there is -no checkpoint file at the path, an exception is raised. If resuming from mid-epoch checkpoint, -training will start from the beginning of the next epoch.

  • -
  • datamodule (Optional[LightningDataModule]) – An instance of LightningDataModule.

  • -
-
-
Return type
-

None

-
-
-
- -
-
-

validate

-
-
-Trainer.validate(model=None, dataloaders=None, ckpt_path=None, verbose=True, datamodule=None)[source]
-

Perform one evaluation epoch over the validation set.

-
-
Parameters
-
    -
  • model (Optional[LightningModule]) – The model to validate.

  • -
  • dataloaders (Union[DataLoader, Sequence[DataLoader], LightningDataModule, None]) – A torch.utils.data.DataLoader or a sequence of them, -or a LightningDataModule specifying validation samples.

  • -
  • ckpt_path (Optional[str]) – Either best or path to the checkpoint you wish to validate. -If None and the model instance was passed, use the current weights. -Otherwise, the best model checkpoint from the previous trainer.fit call will be loaded -if a checkpoint callback is configured.

  • -
  • verbose (bool) – If True, prints the validation results.

  • -
  • datamodule (Optional[LightningDataModule]) – An instance of LightningDataModule.

  • -
-
-
Return type
-

List[Dict[str, float]]

-
-
Returns
-

List of dictionaries with metrics logged during the validation phase, e.g., in model- or callback hooks -like validation_step(), -validation_epoch_end(), etc. -The length of the list corresponds to the number of validation dataloaders used.

-
-
-
- -
-
-

test

-
-
-Trainer.test(model=None, dataloaders=None, ckpt_path=None, verbose=True, datamodule=None)[source]
-

Perform one evaluation epoch over the test set. -It’s separated from fit to make sure you never run on your test set until you want to.

-
-
Parameters
-
    -
  • model (Optional[LightningModule]) – The model to test.

  • -
  • dataloaders (Union[DataLoader, Sequence[DataLoader], LightningDataModule, None]) – A torch.utils.data.DataLoader or a sequence of them, -or a LightningDataModule specifying test samples.

  • -
  • ckpt_path (Optional[str]) – Either best or path to the checkpoint you wish to test. -If None and the model instance was passed, use the current weights. -Otherwise, the best model checkpoint from the previous trainer.fit call will be loaded -if a checkpoint callback is configured.

  • -
  • verbose (bool) – If True, prints the test results.

  • -
  • datamodule (Optional[LightningDataModule]) – An instance of LightningDataModule.

  • -
-
-
Return type
-

List[Dict[str, float]]

-
-
Returns
-

List of dictionaries with metrics logged during the test phase, e.g., in model- or callback hooks -like test_step(), -test_epoch_end(), etc. -The length of the list corresponds to the number of test dataloaders used.

-
-
-
- -
-
-

predict

-
-
-Trainer.predict(model=None, dataloaders=None, datamodule=None, return_predictions=None, ckpt_path=None)[source]
-

Run inference on your data. -This will call the model forward function to compute predictions. Useful to perform distributed -and batched predictions. Logging is disabled in the predict hooks.

-
-
Parameters
-
    -
  • model (Optional[LightningModule]) – The model to predict with.

  • -
  • dataloaders (Union[DataLoader, Sequence[DataLoader], LightningDataModule, None]) – A torch.utils.data.DataLoader or a sequence of them, -or a LightningDataModule specifying prediction samples.

  • -
  • datamodule (Optional[LightningDataModule]) – The datamodule with a predict_dataloader method that returns one or more dataloaders.

  • -
  • return_predictions (Optional[bool]) – Whether to return predictions. -True by default except when an accelerator that spawns processes is used (not supported).

  • -
  • ckpt_path (Optional[str]) – Either best or path to the checkpoint you wish to predict. -If None and the model instance was passed, use the current weights. -Otherwise, the best model checkpoint from the previous trainer.fit call will be loaded -if a checkpoint callback is configured.

  • -
-
-
Return type
-

Union[List[Any], List[List[Any]], None]

-
-
Returns
-

Returns a list of dictionaries, one for each provided dataloader containing their respective predictions.

-
-
-
- -
-
-

tune

-
-
-Trainer.tune(model, train_dataloaders=None, val_dataloaders=None, datamodule=None, scale_batch_size_kwargs=None, lr_find_kwargs=None)[source]
-

Runs routines to tune hyperparameters before training.

-
-
Parameters
-
    -
  • model (LightningModule) – Model to tune.

  • -
  • train_dataloaders (Union[DataLoader, Sequence[DataLoader], Sequence[Sequence[DataLoader]], Sequence[Dict[str, DataLoader]], Dict[str, DataLoader], Dict[str, Dict[str, DataLoader]], Dict[str, Sequence[DataLoader]], LightningDataModule, None]) – A collection of torch.utils.data.DataLoader or a -LightningDataModule specifying training samples. -In the case of multiple dataloaders, please see this section.

  • -
  • val_dataloaders (Union[DataLoader, Sequence[DataLoader], None]) – A torch.utils.data.DataLoader or a sequence of them specifying validation samples.

  • -
  • datamodule (Optional[LightningDataModule]) – An instance of LightningDataModule.

  • -
  • scale_batch_size_kwargs (Optional[Dict[str, Any]]) – Arguments for scale_batch_size()

  • -
  • lr_find_kwargs (Optional[Dict[str, Any]]) – Arguments for lr_find()

  • -
-
-
Return type
-

Dict[str, Union[int, _LRFinder, None]]

-
-
-
- -
-
-
-

Properties

-
-

callback_metrics

-

The metrics available to callbacks. These are automatically set when you log via self.log

-
def training_step(self, batch, batch_idx):
-    self.log("a_val", 2)
-
-
-callback_metrics = trainer.callback_metrics
-assert callback_metrics["a_val"] == 2
-
-
-
-
-

current_epoch

-

The number of epochs run.

-
if trainer.current_epoch >= 10:
-    ...
-
-
-
-
-

global_step

-

The number of optimizer steps taken (does not reset each epoch). -This includes multiple optimizers and TBPTT steps (if enabled).

-
if trainer.global_step >= 100:
-    ...
-
-
-
-
-

logger

-

The current logger being used. Here’s an example using tensorboard

-
logger = trainer.logger
-tensorboard = logger.experiment
-
-
-
-
-

loggers

-

The list of loggers currently being used by the Trainer.

-
# List of Logger objects
-loggers = trainer.loggers
-for logger in loggers:
-    logger.log_metrics({"foo": 1.0})
-
-
-
-
-

logged_metrics

-

The metrics sent to the logger (visualizer).

-
def training_step(self, batch, batch_idx):
-    self.log("a_val", 2, logger=True)
-
-
-logged_metrics = trainer.logged_metrics
-assert logged_metrics["a_val"] == 2
-
-
-
-
-

log_dir

-

The directory for the current experiment. Use this to save images to, etc…

-
def training_step(self, batch, batch_idx):
-    img = ...
-    save_img(img, self.trainer.log_dir)
-
-
-
-
-

is_global_zero

-

Whether this process is the global zero in multi-node training

-
def training_step(self, batch, batch_idx):
-    if self.trainer.is_global_zero:
-        print("in node 0, accelerator 0")
-
-
-
-
-

progress_bar_metrics

-

The metrics sent to the progress bar.

-
def training_step(self, batch, batch_idx):
-    self.log("a_val", 2, prog_bar=True)
-
-
-progress_bar_metrics = trainer.progress_bar_metrics
-assert progress_bar_metrics["a_val"] == 2
-
-
-
-
-

estimated_stepping_batches

-

Check out estimated_stepping_batches().

-
-
-

state

-

The current state of the Trainer, including the current function that is running, the stage of -execution within that function, and the status of the Trainer.

-
# fn in ("fit", "validate", "test", "predict", "tune")
-trainer.state.fn
-# status in ("initializing", "running", "finished", "interrupted")
-trainer.state.status
-# stage in ("train", "sanity_check", "validate", "test", "predict", "tune")
-trainer.state.stage
-
-
-
-
-
-
- - -
- -
-
- - - - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/common_usecases.html b/docs/common_usecases.html deleted file mode 100644 index f7a91f3..0000000 --- a/docs/common_usecases.html +++ /dev/null @@ -1,915 +0,0 @@ - - - - - - - - - - - - - - Common Workflows — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- - - - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Common Workflows

-

Customize and extend Lightning for things like custom hardware or distributed strategies.

-

-
-
-

-

-

-

-

-

-

-

-

-

-

-

-

-

-

-

-

-

-

-

-

-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- -
-
-
- - -
-
-
-
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/data/datamodule.html b/docs/data/datamodule.html deleted file mode 100644 index 618ce5f..0000000 --- a/docs/data/datamodule.html +++ /dev/null @@ -1,1428 +0,0 @@ - - - - - - - - - - - - - - LightningDataModule — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • LightningDataModule
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

LightningDataModule

-

A datamodule is a shareable, reusable class that encapsulates all the steps needed to process data:

-
-

-
-

A datamodule encapsulates the five steps involved in data processing in PyTorch:

-
    -
  1. Download / tokenize / process.

  2. -
  3. Clean and (maybe) save to disk.

  4. -
  5. Load inside Dataset.

  6. -
  7. Apply transforms (rotate, tokenize, etc…).

  8. -
  9. Wrap inside a DataLoader.

  10. -
-
-

-
-

This class can then be shared and used anywhere:

-
from pl_bolts.datamodules import CIFAR10DataModule, ImagenetDataModule
-
-model = LitClassifier()
-trainer = Trainer()
-
-imagenet = ImagenetDataModule()
-trainer.fit(model, datamodule=imagenet)
-
-cifar10 = CIFAR10DataModule()
-trainer.fit(model, datamodule=cifar10)
-
-
-
-
-

Why do I need a DataModule?

-

In normal PyTorch code, the data cleaning/preparation is usually scattered across many files. This makes -sharing and reusing the exact splits and transforms across projects impossible.

-

Datamodules are for you if you ever asked the questions:

-
    -
  • what splits did you use?

  • -
  • what transforms did you use?

  • -
  • what normalization did you use?

  • -
  • how did you prepare/tokenize the data?

  • -
-
-
-
-

What is a DataModule?

-

A DataModule is simply a collection of a train_dataloader(s), val_dataloader(s), test_dataloader(s) and -predict_dataloader(s) along with the matching transforms and data processing/downloads steps required.

-

Here’s a simple PyTorch example:

-
# regular PyTorch
-test_data = MNIST(my_path, train=False, download=True)
-predict_data = MNIST(my_path, train=False, download=True)
-train_data = MNIST(my_path, train=True, download=True)
-train_data, val_data = random_split(train_data, [55000, 5000])
-
-train_loader = DataLoader(train_data, batch_size=32)
-val_loader = DataLoader(val_data, batch_size=32)
-test_loader = DataLoader(test_data, batch_size=32)
-predict_loader = DataLoader(predict_data, batch_size=32)
-
-
-

The equivalent DataModule just organizes the same exact code, but makes it reusable across projects.

-
class MNISTDataModule(pl.LightningDataModule):
-    def __init__(self, data_dir: str = "path/to/dir", batch_size: int = 32):
-        super().__init__()
-        self.data_dir = data_dir
-        self.batch_size = batch_size
-
-    def setup(self, stage: Optional[str] = None):
-        self.mnist_test = MNIST(self.data_dir, train=False)
-        self.mnist_predict = MNIST(self.data_dir, train=False)
-        mnist_full = MNIST(self.data_dir, train=True)
-        self.mnist_train, self.mnist_val = random_split(mnist_full, [55000, 5000])
-
-    def train_dataloader(self):
-        return DataLoader(self.mnist_train, batch_size=self.batch_size)
-
-    def val_dataloader(self):
-        return DataLoader(self.mnist_val, batch_size=self.batch_size)
-
-    def test_dataloader(self):
-        return DataLoader(self.mnist_test, batch_size=self.batch_size)
-
-    def predict_dataloader(self):
-        return DataLoader(self.mnist_predict, batch_size=self.batch_size)
-
-    def teardown(self, stage: Optional[str] = None):
-        # Used to clean-up when the run is finished
-        ...
-
-
-

But now, as the complexity of your processing grows (transforms, multiple-GPU training), you can -let Lightning handle those details for you while making this dataset reusable so you can share with -colleagues or use in different projects.

-
mnist = MNISTDataModule(my_path)
-model = LitClassifier()
-
-trainer = Trainer()
-trainer.fit(model, mnist)
-
-
-

Here’s a more realistic, complex DataModule that shows how much more reusable the datamodule is.

-
import pytorch_lightning as pl
-from torch.utils.data import random_split, DataLoader
-
-# Note - you must have torchvision installed for this example
-from torchvision.datasets import MNIST
-from torchvision import transforms
-
-
-class MNISTDataModule(pl.LightningDataModule):
-    def __init__(self, data_dir: str = "./"):
-        super().__init__()
-        self.data_dir = data_dir
-        self.transform = transforms.Compose([transforms.ToTensor(), transforms.Normalize((0.1307,), (0.3081,))])
-
-    def prepare_data(self):
-        # download
-        MNIST(self.data_dir, train=True, download=True)
-        MNIST(self.data_dir, train=False, download=True)
-
-    def setup(self, stage: Optional[str] = None):
-
-        # Assign train/val datasets for use in dataloaders
-        if stage == "fit" or stage is None:
-            mnist_full = MNIST(self.data_dir, train=True, transform=self.transform)
-            self.mnist_train, self.mnist_val = random_split(mnist_full, [55000, 5000])
-
-        # Assign test dataset for use in dataloader(s)
-        if stage == "test" or stage is None:
-            self.mnist_test = MNIST(self.data_dir, train=False, transform=self.transform)
-
-        if stage == "predict" or stage is None:
-            self.mnist_predict = MNIST(self.data_dir, train=False, transform=self.transform)
-
-    def train_dataloader(self):
-        return DataLoader(self.mnist_train, batch_size=32)
-
-    def val_dataloader(self):
-        return DataLoader(self.mnist_val, batch_size=32)
-
-    def test_dataloader(self):
-        return DataLoader(self.mnist_test, batch_size=32)
-
-    def predict_dataloader(self):
-        return DataLoader(self.mnist_predict, batch_size=32)
-
-
-
-
-
-

LightningDataModule API

-

To define a DataModule the following methods are used to create train/val/test/predict dataloaders:

- -
-

prepare_data

-

Downloading and saving data with multiple processes (distributed settings) will result in corrupted data. Lightning -ensures the prepare_data() is called only within a single process on CPU, -so you can safely add your downloading logic within. In case of multi-node training, the execution of this hook -depends upon prepare_data_per_node. setup() is called after -prepare_data and there is a barrier in between which ensures that all the processes proceed to setup once the data is prepared and available for use.

-
    -
  • download, i.e. download data only once on the disk from a single process

  • -
  • tokenize. Since it’s a one time process, it is not recommended to do it on all processes

  • -
  • etc…

  • -
-
class MNISTDataModule(pl.LightningDataModule):
-    def prepare_data(self):
-        # download
-        MNIST(os.getcwd(), train=True, download=True, transform=transforms.ToTensor())
-        MNIST(os.getcwd(), train=False, download=True, transform=transforms.ToTensor())
-
-
-
-

Warning

-

prepare_data is called from the main process. It is not recommended to assign state here (e.g. self.x = y) since it is called on a single process and if you assign -states here then they won’t be available for other processes.

-
-
-
-

setup

-

There are also data operations you might want to perform on every GPU. Use setup() to do things like:

-
    -
  • count number of classes

  • -
  • build vocabulary

  • -
  • perform train/val/test splits

  • -
  • create datasets

  • -
  • apply transforms (defined explicitly in your datamodule)

  • -
  • etc…

  • -
-
import pytorch_lightning as pl
-
-
-class MNISTDataModule(pl.LightningDataModule):
-    def setup(self, stage: Optional[str] = None):
-
-        # Assign Train/val split(s) for use in Dataloaders
-        if stage in (None, "fit"):
-            mnist_full = MNIST(self.data_dir, train=True, download=True, transform=self.transform)
-            self.mnist_train, self.mnist_val = random_split(mnist_full, [55000, 5000])
-
-        # Assign Test split(s) for use in Dataloaders
-        if stage in (None, "test"):
-            self.mnist_test = MNIST(self.data_dir, train=False, download=True, transform=self.transform)
-
-
-

For example, if you are working on an NLP task where you need to tokenize the text before using it, you can do something like the following:

-
class LitDataModule(LightningDataModule):
-    def prepare_data(self):
-        dataset = load_Dataset(...)
-        train_dataset = ...
-        val_dataset = ...
-        # tokenize
-        # save it to disk
-
-    def setup(self, stage):
-        # load it back here
-        dataset = load_dataset_from_disk(...)
-
-
-

This method expects a stage argument. -It is used to separate setup logic for trainer.{fit,validate,test,predict}. If setup is called with stage=None, -we assume all stages have been set-up.

-
-

Note

-

setup is called from every process across all the nodes. Setting state here is recommended.

-
-
-

Note

-

teardown can be used to clean up the state. It is also called from every process across all the nodes.

-
-
-
-

train_dataloader

-

Use the train_dataloader() method to generate the training dataloader(s). -Usually you just wrap the dataset you defined in setup. This is the dataloader that the Trainer -fit() method uses.

-
import pytorch_lightning as pl
-
-
-class MNISTDataModule(pl.LightningDataModule):
-    def train_dataloader(self):
-        return DataLoader(self.mnist_train, batch_size=64)
-
-
-
-
-

val_dataloader

-

Use the val_dataloader() method to generate the validation dataloader(s). -Usually you just wrap the dataset you defined in setup. This is the dataloader that the Trainer -fit() and validate() methods use.

-
import pytorch_lightning as pl
-
-
-class MNISTDataModule(pl.LightningDataModule):
-    def val_dataloader(self):
-        return DataLoader(self.mnist_val, batch_size=64)
-
-
-
-
-

test_dataloader

-

Use the test_dataloader() method to generate the test dataloader(s). -Usually you just wrap the dataset you defined in setup. This is the dataloader that the Trainer -test() method uses.

-
import pytorch_lightning as pl
-
-
-class MNISTDataModule(pl.LightningDataModule):
-    def test_dataloader(self):
-        return DataLoader(self.mnist_test, batch_size=64)
-
-
-
-
-

predict_dataloader

-

Use the predict_dataloader() method to generate the prediction dataloader(s). -Usually you just wrap the dataset you defined in setup. This is the dataloader that the Trainer -predict() method uses.

-
import pytorch_lightning as pl
-
-
-class MNISTDataModule(pl.LightningDataModule):
-    def predict_dataloader(self):
-        return DataLoader(self.mnist_predict, batch_size=64)
-
-
-
-
-

transfer_batch_to_device

-
-
-LightningDataModule.transfer_batch_to_device(batch, device, dataloader_idx)
-

Override this hook if your DataLoader returns tensors wrapped in a custom -data structure.

-

The data types listed below (and any arbitrary nesting of them) are supported out of the box:

-
    -
  • torch.Tensor or anything that implements .to(…)

  • -
  • list

  • -
  • dict

  • -
  • tuple

  • -
  • torchtext.data.batch.Batch

  • -
-

For anything else, you need to define how the data is moved to the target device (CPU, GPU, TPU, …).

-
-

Note

-

This hook should only transfer the data and not modify it, nor should it move the data to -any other device than the one passed in as argument (unless you know what you are doing). -To check the current state of execution of this hook you can use -self.trainer.training/testing/validating/predicting so that you can -add different logic as per your requirement.

-
-
-

Note

-

This hook only runs on single GPU training and DDP (no data-parallel). -Data-Parallel support will come in the near future.

-
-
-
Parameters
-
    -
  • batch (Any) – A batch of data that needs to be transferred to a new device.

  • -
  • device (device) – The target device as defined in PyTorch.

  • -
  • dataloader_idx (int) – The index of the dataloader to which the batch belongs.

  • -
-
-
Return type
-

Any

-
-
Returns
-

A reference to the data on the new device.

-
-
-

Example:

-
def transfer_batch_to_device(self, batch, device, dataloader_idx):
-    if isinstance(batch, CustomBatch):
-        # move all tensors in your custom data structure to the device
-        batch.samples = batch.samples.to(device)
-        batch.targets = batch.targets.to(device)
-    elif dataloader_idx == 0:
-        # skip device transfer for the first dataloader or anything you wish
-        pass
-    else:
-        batch = super().transfer_batch_to_device(batch, device, dataloader_idx)
-    return batch
-
-
-
-
Raises
-

MisconfigurationException – If using data-parallel, Trainer(strategy='dp').

-
-
-
-

See also

-
    -
  • move_data_to_device()

  • -
  • apply_to_collection()

  • -
-
-
- -
-
-

on_before_batch_transfer

-
-
-LightningDataModule.on_before_batch_transfer(batch, dataloader_idx)
-

Override to alter or apply batch augmentations to your batch before it is transferred to the device.

-
-

Note

-

To check the current state of execution of this hook you can use -self.trainer.training/testing/validating/predicting so that you can -add different logic as per your requirement.

-
-
-

Note

-

This hook only runs on single GPU training and DDP (no data-parallel). -Data-Parallel support will come in the near future.

-
-
-
Parameters
-
    -
  • batch (Any) – A batch of data that needs to be altered or augmented.

  • -
  • dataloader_idx (int) – The index of the dataloader to which the batch belongs.

  • -
-
-
Return type
-

Any

-
-
Returns
-

A batch of data

-
-
-

Example:

-
def on_before_batch_transfer(self, batch, dataloader_idx):
-    batch['x'] = transforms(batch['x'])
-    return batch
-
-
-
-
Raises
-

MisconfigurationException – If using data-parallel, Trainer(strategy='dp').

-
-
-
-

See also

-
    -
  • on_after_batch_transfer()

  • -
  • transfer_batch_to_device()

  • -
-
-
- -
-
-

on_after_batch_transfer

-
-
-LightningDataModule.on_after_batch_transfer(batch, dataloader_idx)
-

Override to alter or apply batch augmentations to your batch after it is transferred to the device.

-
-

Note

-

To check the current state of execution of this hook you can use -self.trainer.training/testing/validating/predicting so that you can -add different logic as per your requirement.

-
-
-

Note

-

This hook only runs on single GPU training and DDP (no data-parallel). -Data-Parallel support will come in the near future.

-
-
-
Parameters
-
    -
  • batch (Any) – A batch of data that needs to be altered or augmented.

  • -
  • dataloader_idx (int) – The index of the dataloader to which the batch belongs.

  • -
-
-
Return type
-

Any

-
-
Returns
-

A batch of data

-
-
-

Example:

-
def on_after_batch_transfer(self, batch, dataloader_idx):
-    batch['x'] = gpu_transforms(batch['x'])
-    return batch
-
-
-
-
Raises
-

MisconfigurationException – If using data-parallel, Trainer(strategy='dp').

-
-
-
-

See also

-
    -
  • on_before_batch_transfer()

  • -
  • transfer_batch_to_device()

  • -
-
-
- -
-
-

load_state_dict

-
-
-LightningDataModule.load_state_dict(state_dict)[source]
-

Called when loading a checkpoint, implement to reload datamodule state given datamodule state_dict.

-
-
Parameters
-

state_dict (Dict[str, Any]) – the datamodule state returned by state_dict.

-
-
Return type
-

None

-
-
-
- -
-
-

state_dict

-
-
-LightningDataModule.state_dict()[source]
-

Called when saving a checkpoint, implement to generate and save datamodule state.

-
-
Return type
-

Dict[str, Any]

-
-
Returns
-

A dictionary containing datamodule state.

-
-
-
- -
-
-

on_train_dataloader

-
-
-LightningDataModule.on_train_dataloader()
-

Called before requesting the train dataloader.

-
-

Deprecated since version v1.5: on_train_dataloader() is deprecated and will be removed in v1.7.0. -Please use train_dataloader() directly.

-
-
-
Return type
-

None

-
-
-
- -
-
-

on_val_dataloader

-
-
-LightningDataModule.on_val_dataloader()
-

Called before requesting the val dataloader.

-
-

Deprecated since version v1.5: on_val_dataloader() is deprecated and will be removed in v1.7.0. -Please use val_dataloader() directly.

-
-
-
Return type
-

None

-
-
-
- -
-
-

on_test_dataloader

-
-
-LightningDataModule.on_test_dataloader()
-

Called before requesting the test dataloader.

-
-

Deprecated since version v1.5: on_test_dataloader() is deprecated and will be removed in v1.7.0. -Please use test_dataloader() directly.

-
-
-
Return type
-

None

-
-
-
- -
-
-

on_predict_dataloader

-
-
-LightningDataModule.on_predict_dataloader()
-

Called before requesting the predict dataloader.

-
-

Deprecated since version v1.5: on_predict_dataloader() is deprecated and will be removed in v1.7.0. -Please use predict_dataloader() directly.

-
-
-
Return type
-

None

-
-
-
- -
-
-

teardown

-
-
-LightningDataModule.teardown(stage=None)
-

Called at the end of fit (train + validate), validate, test, or predict.

-
-
Parameters
-

stage (Optional[str]) – either 'fit', 'validate', 'test', or 'predict'

-
-
Return type
-

None

-
-
-
- -
-
-

prepare_data_per_node

-

If set to True will call prepare_data() on LOCAL_RANK=0 for every node. -If set to False will only call from NODE_RANK=0, LOCAL_RANK=0.

-
class LitDataModule(LightningDataModule):
-    def __init__(self):
-        super().__init__()
-        self.prepare_data_per_node = True
-
-
-
-
-
-
-

Using a DataModule

-

The recommended way to use a DataModule is simply:

-
dm = MNISTDataModule()
-model = Model()
-trainer.fit(model, datamodule=dm)
-trainer.test(datamodule=dm)
-trainer.validate(datamodule=dm)
-trainer.predict(datamodule=dm)
-
-
-

If you need information from the dataset to build your model, then run -prepare_data and -setup manually (Lightning ensures -the method runs on the correct devices).

-
dm = MNISTDataModule()
-dm.prepare_data()
-dm.setup(stage="fit")
-
-model = Model(num_classes=dm.num_classes, width=dm.width, vocab=dm.vocab)
-trainer.fit(model, dm)
-
-dm.setup(stage="test")
-trainer.test(datamodule=dm)
-
-
-
-
-
-

DataModules without Lightning

-

You can of course use DataModules in plain PyTorch code as well.

-
# download, etc...
-dm = MNISTDataModule()
-dm.prepare_data()
-
-# splits/transforms
-dm.setup(stage="fit")
-
-# use data
-for batch in dm.train_dataloader():
-    ...
-
-for batch in dm.val_dataloader():
-    ...
-
-dm.teardown(stage="fit")
-
-# lazy load test data
-dm.setup(stage="test")
-for batch in dm.test_dataloader():
-    ...
-
-dm.teardown(stage="test")
-
-
-

But overall, DataModules encourage reproducibility by allowing all details of a dataset to be specified in a unified -structure.

-
-
-
-

Hyperparameters in DataModules

-

Like LightningModules, DataModules support hyperparameters with the same API.

-
import pytorch_lightning as pl
-
-
-class CustomDataModule(pl.LightningDataModule):
-    def __init__(self, *args, **kwargs):
-        super().__init__()
-        self.save_hyperparameters()
-
-    def configure_optimizers(self):
-        # access the saved hyperparameters
-        opt = optim.Adam(self.parameters(), lr=self.hparams.lr)
-
-
-

Refer to save_hyperparameters in lightning module for more details.

-
-
-

Save DataModule state

-

When a checkpoint is created, it asks every DataModule for their state. If your DataModule defines the state_dict and load_state_dict methods, the checkpoint will automatically track and restore your DataModules.

-
class LitDataModule(pl.LightningDataModule):
-    def state_dict(self):
-        # track whatever you want here
-        state = {"current_train_batch_index": self.current_train_batch_index}
-        return state
-
-    def load_state_dict(self, state_dict):
-        # restore the state based on what you tracked in (def state_dict)
-        self.current_train_batch_index = state_dict["current_train_batch_index"]
-
-
-
-
-
- - -
- -
-
- - - - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/debug/debugging.html b/docs/debug/debugging.html deleted file mode 100644 index 9d4a891..0000000 --- a/docs/debug/debugging.html +++ /dev/null @@ -1,731 +0,0 @@ - - - - - - - - - - - - - - Debug your model — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- - - - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
- - -
-
- - - - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- -
-
-
- - -
-
-
-
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/debug/debugging_advanced.html b/docs/debug/debugging_advanced.html deleted file mode 100644 index 962a227..0000000 --- a/docs/debug/debugging_advanced.html +++ /dev/null @@ -1,721 +0,0 @@ - - - - - - - - - - - - - - Debug your model (advanced) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Debug your model (advanced)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Debug your model (advanced)

-

Audience: Users who want to debug distributed models.

-
-
-

Debug distributed models

-

To debug a distributed model, we recommend you debug it locally by running the distributed version on CPUs:

-
trainer = Trainer(accelerator="cpu", strategy="ddp", devices=2)
-
-
-

On the CPU, you can use pdb or breakpoint() -or use regular print statements.

-
class LitModel(LightningModule):
-    def training_step(self, batch, batch_idx):
-
-        debugging_message = ...
-        print(f"RANK - {self.trainer.global_rank}: {debugging_message}")
-
-        if self.trainer.global_rank == 0:
-            import pdb
-
-            pdb.set_trace()
-
-        # to prevent other processes from moving forward until all processes are in sync
-        self.trainer.strategy.barrier()
-
-
-

When everything works, switch back to GPU by changing only the accelerator.

-
trainer = Trainer(accelerator="gpu", strategy="ddp", devices=2)
-
-
-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/debug/debugging_basic.html b/docs/debug/debugging_basic.html deleted file mode 100644 index 3fad6ed..0000000 --- a/docs/debug/debugging_basic.html +++ /dev/null @@ -1,811 +0,0 @@ - - - - - - - - - - - - - - Debug your model (basic) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Debug your model (basic)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Debug your model (basic)

-

Audience: Users who want to learn the basics of debugging models.

-
-
-

How does Lightning help me debug?

-

The Lightning Trainer has a lot of arguments devoted to maximizing your debugging productivity.

-
-
-
-

Set a breakpoint

-

A breakpoint stops your code execution so you can inspect variables, etc… and allow your code to execute one line at a time.

-
def function_to_debug():
-    x = 2
-
-    # set breakpoint
-    import pdb
-
-    pdb.set_trace()
-    y = x ** 2
-
-
-

In this example, the code will stop before executing the y = x**2 line.

-
-
-
-

Run all your model code once quickly

-

If you’ve ever trained a model for days only to crash during validation or testing then this trainer argument is about to become your best friend.

-

The fast_dev_run argument in the trainer runs 1 batch of training, validation, test and prediction data through your trainer to see if there are any bugs:

-
Trainer(fast_dev_run=True)
-
-
-

To change how many batches to use, change the argument to an integer. Here we run 7 batches of each:

-
Trainer(fast_dev_run=7)
-
-
-
-

Note

-

This argument will disable tuner, checkpoint callbacks, early stopping callbacks, -loggers and logger callbacks like LearningRateMonitor and -DeviceStatsMonitor.

-
-
-
-
-

Shorten the epoch length

-

Sometimes it’s helpful to only use a fraction of your training, val, test, or predict data (or a set number of batches). -For example, you can use 10% of the training set and 1% of the validation set.

-

On larger datasets like Imagenet, this can help you debug or test a few things faster than waiting for a full epoch.

-
# use only 10% of training data and 1% of val data
-trainer = Trainer(limit_train_batches=0.1, limit_val_batches=0.01)
-
-# use 10 batches of train and 5 batches of val
-trainer = Trainer(limit_train_batches=10, limit_val_batches=5)
-
-
-
-
-
-

Run a Sanity Check

-

Lightning runs 2 steps of validation in the beginning of training. -This avoids crashing in the validation loop sometime deep into a lengthy training loop.

-

(See: num_sanity_val_steps -argument of Trainer)

-
trainer = Trainer(num_sanity_val_steps=2)
-
-
-
-
- -
- -
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/debug/debugging_intermediate.html b/docs/debug/debugging_intermediate.html deleted file mode 100644 index c3fcf7d..0000000 --- a/docs/debug/debugging_intermediate.html +++ /dev/null @@ -1,748 +0,0 @@ - - - - - - - - - - - - - - Debug your model (intermediate) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Debug your model (intermediate)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Debug your model (intermediate)

-

Audience: Users who want to debug their ML code

-
-
-

Why should I debug ML code?

-

Machine learning code requires debugging mathematical correctness, which is not something non-ML code has to deal with. Lightning implements a few best-practice techniques to give all users expert-level ML debugging abilities.

-
-
-
-

Overfit your model on a Subset of Data

-

A good debugging technique is to take a tiny portion of your data (say 2 samples per class), -and try to get your model to overfit. If it can’t, it’s a sign it won’t work with large datasets.

-

(See: overfit_batches -argument of Trainer)

-
# use only 1% of training data (and turn off validation)
-trainer = Trainer(overfit_batches=0.01)
-
-# similar, but with a fixed 10 batches
-trainer = Trainer(overfit_batches=10)
-
-
-

When using this argument, the validation loop will be disabled. We will also replace the sampler -in the training set to turn off shuffle for you.

-
-
-
-

Look-out for exploding gradients

-

One major problem that plagues models is exploding gradients. Tracking the gradient norm is one technique that can help you detect exploding gradients early.

-
# the 2-norm
-trainer = Trainer(track_grad_norm=2)
-
-
-

This will plot the 2-norm to your experiment manager. If you notice the norm is going up, there’s a good chance your gradients are exploding or will explode.

-

One technique to stop exploding gradients is to clip the gradient

-
# DEFAULT (ie: don't clip)
-trainer = Trainer(gradient_clip_val=0)
-
-# clip gradients' global norm to <=0.5 using gradient_clip_algorithm='norm' by default
-trainer = Trainer(gradient_clip_val=0.5)
-
-# clip gradients' maximum magnitude to <=0.5
-trainer = Trainer(gradient_clip_val=0.5, gradient_clip_algorithm="value")
-
-
-
-
-
-

Detect autograd anomalies

-

Lightning helps you detect anomalies in the PyTorch autograd engine via PyTorch’s built-in -Anomaly Detection Context-manager.

-

Enable it via the detect_anomaly trainer argument:

-
trainer = Trainer(detect_anomaly=True)
-
-
-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/deploy/production.html b/docs/deploy/production.html deleted file mode 100644 index f489dbc..0000000 --- a/docs/deploy/production.html +++ /dev/null @@ -1,764 +0,0 @@ - - - - - - - - - - - - - - Deploy models into production — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Deploy models into production
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
- - - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/deploy/production_advanced.html b/docs/deploy/production_advanced.html deleted file mode 100644 index 281673a..0000000 --- a/docs/deploy/production_advanced.html +++ /dev/null @@ -1,751 +0,0 @@ - - - - - - - - - - - - - - Deploy models into production (advanced) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Deploy models into production (advanced)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Deploy models into production (advanced)

-

Audience: Machine learning engineers optimizing models for enterprise-scale production environments.

-
-
-

Compile your model to ONNX

-

ONNX is a package developed by Microsoft to optimize inference. ONNX allows the model to be independent of PyTorch and run on any ONNX Runtime.

-

To export your model to ONNX format call the to_onnx() function on your LightningModule with the filepath and input_sample.

-
class SimpleModel(LightningModule):
-    def __init__(self):
-        super().__init__()
-        self.l1 = torch.nn.Linear(in_features=64, out_features=4)
-
-    def forward(self, x):
-        return torch.relu(self.l1(x.view(x.size(0), -1)))
-
-
-# create the model
-model = SimpleModel()
-filepath = "model.onnx"
-input_sample = torch.randn((1, 64))
-model.to_onnx(filepath, input_sample, export_params=True)
-
-
-

You can also skip passing the input sample if the example_input_array property is specified in your LightningModule.

-
class SimpleModel(LightningModule):
-    def __init__(self):
-        super().__init__()
-        self.l1 = torch.nn.Linear(in_features=64, out_features=4)
-        self.example_input_array = torch.randn(7, 64)
-
-    def forward(self, x):
-        return torch.relu(self.l1(x.view(x.size(0), -1)))
-
-
-# create the model
-model = SimpleModel()
-filepath = "model.onnx"
-model.to_onnx(filepath, export_params=True)
-
-
-

Once you have the exported model, you can run it on your ONNX runtime in the following way:

-
import onnxruntime
-
-ort_session = onnxruntime.InferenceSession(filepath)
-input_name = ort_session.get_inputs()[0].name
-ort_inputs = {input_name: np.random.randn(1, 64)}
-ort_outs = ort_session.run(None, ort_inputs)
-
-
-
-
- - -
- -
-
- - - - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/deploy/production_advanced_2.html b/docs/deploy/production_advanced_2.html deleted file mode 100644 index 6f05d73..0000000 --- a/docs/deploy/production_advanced_2.html +++ /dev/null @@ -1,746 +0,0 @@ - - - - - - - - - - - - - - Deploy models into production (advanced) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Deploy models into production (advanced)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Deploy models into production (advanced)

-

Audience: Machine learning engineers optimizing models for enterprise-scale production environments.

-
-
-

Compile your model to TorchScript

-

TorchScript allows you to serialize your models so that they can be loaded in non-Python environments. -The LightningModule has a handy method to_torchscript() that returns a scripted module which you -can save or directly use.

-
class SimpleModel(LightningModule):
-    def __init__(self):
-        super().__init__()
-        self.l1 = torch.nn.Linear(in_features=64, out_features=4)
-
-    def forward(self, x):
-        return torch.relu(self.l1(x.view(x.size(0), -1)))
-
-
-# create the model
-model = SimpleModel()
-script = model.to_torchscript()
-
-# save for use in production environment
-torch.jit.save(script, "model.pt")
-
-
-

It is recommended that you install the latest supported version of PyTorch to use this feature without limitations.

-

Once you have the exported model, you can run it in the PyTorch or C++ runtime:

-
inp = torch.rand(1, 64)
-scripted_module = torch.jit.load("model.pt")
-output = scripted_module(inp)
-
-
-

If you want to script a different method, you can decorate the method with torch.jit.export():

-
class LitMCdropoutModel(pl.LightningModule):
-    def __init__(self, model, mc_iteration):
-        super().__init__()
-        self.model = model
-        self.dropout = nn.Dropout()
-        self.mc_iteration = mc_iteration
-
-    @torch.jit.export
-    def predict_step(self, batch, batch_idx):
-        # enable Monte Carlo Dropout
-        self.dropout.train()
-
-        # take average of `self.mc_iteration` iterations
-        pred = [self.dropout(self.model(x)).unsqueeze(0) for _ in range(self.mc_iteration)]
-        pred = torch.vstack(pred).mean(dim=0)
-        return pred
-
-
-model = LitMCdropoutModel(...)
-script = model.to_torchscript(file_path="model.pt", method="script")
-
-
-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/deploy/production_basic.html b/docs/deploy/production_basic.html deleted file mode 100644 index 6129928..0000000 --- a/docs/deploy/production_basic.html +++ /dev/null @@ -1,767 +0,0 @@ - - - - - - - - - - - - - - Deploy models into production (basic) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Deploy models into production (basic)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Deploy models into production (basic)

-

Audience: All users.

-
-
-

Load a checkpoint and predict

-

The easiest way to use a model for predictions is to load the weights using load_from_checkpoint found in the LightningModule.

-
model = LitModel.load_from_checkpoint("best_model.ckpt")
-model.eval()
-x = torch.randn(1, 64)
-
-with torch.no_grad():
-    y_hat = model(x)
-
-
-
-
-
-

Predict step with your LightningModule

-

Loading a checkpoint and predicting still leaves you with a lot of boilerplate around the predict epoch. The predict step in the LightningModule removes this boilerplate.

-
class MyModel(LightningModule):
-    def predict_step(self, batch, batch_idx, dataloader_idx=0):
-        return self(batch)
-
-
-

And pass in any dataloader to the Lightning Trainer:

-
data_loader = DataLoader(...)
-model = MyModel()
-trainer = Trainer()
-predictions = trainer.predict(model, data_loader)
-
-
-
-
-
-

Enable complicated predict logic

-

When you need to add complicated pre-processing or post-processing logic to your data, use the predict step. For example, here we do Monte Carlo Dropout for predictions:

-
class LitMCdropoutModel(pl.LightningModule):
-    def __init__(self, model, mc_iteration):
-        super().__init__()
-        self.model = model
-        self.dropout = nn.Dropout()
-        self.mc_iteration = mc_iteration
-
-    def predict_step(self, batch, batch_idx):
-        # enable Monte Carlo Dropout
-        self.dropout.train()
-
-        # take average of `self.mc_iteration` iterations
-        pred = [self.dropout(self.model(x)).unsqueeze(0) for _ in range(self.mc_iteration)]
-        pred = torch.vstack(pred).mean(dim=0)
-        return pred
-
-
-
-
-
-

Enable distributed inference

-

By using the predict step in Lightning, you get distributed inference for free:

-
trainer = Trainer(devices=8, accelerator="gpu")
-predictions = trainer.predict(model, data_loader)
-
-
-
-
- - -
- -
-
- - - - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/deploy/production_intermediate.html b/docs/deploy/production_intermediate.html deleted file mode 100644 index 057969f..0000000 --- a/docs/deploy/production_intermediate.html +++ /dev/null @@ -1,791 +0,0 @@ - - - - - - - - - - - - - - Deploy models into production (intermediate) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Deploy models into production (intermediate)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Deploy models into production (intermediate)

-

Audience: Researchers and MLEs looking to use their models for predictions without Lightning dependencies.

-
-
-

Use PyTorch as normal

-

If you prefer to use PyTorch directly, feel free to use any Lightning checkpoint without Lightning.

-
import torch
-
-model = torch.load("path/to/lightning/checkpoint.ckpt")
-model.eval()
-
-
-

You can also pull the specific modules you want out of the checkpoint:

-
model = torch.load("path/to/lightning/checkpoint.ckpt")
-encoder = model["encoder"]
-encoder.eval()
-
-
-
-
-
-

Extract nn.Module from Lightning checkpoints

-

You can also load the saved checkpoint and use it as a regular torch.nn.Module. You can extract all your torch.nn.Module instances -and load their weights from the checkpoint saved by the LightningModule after training. For this, we recommend copying the exact implementation -from your LightningModule init and forward methods.

-
class Encoder(nn.Module):
-    ...
-
-
-class Decoder(nn.Module):
-    ...
-
-
-class AutoEncoderProd(nn.Module):
-    def __init__(self):
-        super().__init__()
-        self.encoder = Encoder()
-        self.decoder = Decoder()
-
-    def forward(self, x):
-        return self.encoder(x)
-
-
-class AutoEncoderSystem(LightningModule):
-    def __init__(self):
-        super().__init__()
-        self.auto_encoder = AutoEncoderProd()
-
-    def forward(self, x):
-        return self.auto_encoder.encoder(x)
-
-    def training_step(self, batch, batch_idx):
-        x, y = batch
-        y_hat = self.auto_encoder.encoder(x)
-        y_hat = self.auto_encoder.decoder(y_hat)
-        loss = ...
-        return loss
-
-
-# train it
-trainer = Trainer(devices=2, accelerator="gpu", strategy="ddp")
-model = AutoEncoderSystem()
-trainer.fit(model, train_dataloader, val_dataloader)
-trainer.save_checkpoint("best_model.ckpt")
-
-
-# create the PyTorch model and load the checkpoint weights
-model = AutoEncoderProd()
-checkpoint = torch.load("best_model.ckpt")
-hyper_parameters = checkpoint["hyper_parameters"]
-
-# if you want to restore any hyperparameters, you can pass them too
-model = AutoEncoderProd(**hyper_parameters)
-
-state_dict = checkpoint["state_dict"]
-
-# update keys by dropping `auto_encoder.`
-for key in list(model_weights):
-    model_weights[key.replace("auto_encoder.", "")] = model_weights.pop(key)
-
-model.load_state_dict(model_weights)
-model.eval()
-x = torch.randn(1, 64)
-
-with torch.no_grad():
-    y_hat = model(x)
-
-
-
-
- - -
- -
-
- - - - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/ecosystem/asr_nlp_tts.html b/docs/ecosystem/asr_nlp_tts.html deleted file mode 100644 index b9566d8..0000000 --- a/docs/ecosystem/asr_nlp_tts.html +++ /dev/null @@ -1,1452 +0,0 @@ - - - - - - - - - - - - - - Conversational AI — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Conversational AI
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Conversational AI

-

These are amazing ecosystems to help with Automatic Speech Recognition (ASR), Natural Language Processing (NLP), and Text-to-Speech (TTS).

-
-
-

NeMo

-

NVIDIA NeMo is a toolkit for building new State-of-the-Art -Conversational AI models. NeMo has separate collections for Automatic Speech Recognition (ASR), -Natural Language Processing (NLP), and Text-to-Speech (TTS) models. Each collection consists of -prebuilt modules that include everything needed to train on your data. -Every module can easily be customized, extended, and composed to create new Conversational AI -model architectures.

-

Conversational AI architectures are typically very large and require a lot of data and compute -for training. NeMo uses PyTorch Lightning for easy and performant multi-GPU/multi-node -mixed-precision training.

-
-

Note

-

Every NeMo model is a LightningModule that comes equipped with all supporting infrastructure for training and reproducibility.

-
-
-
-

NeMo Models

-

NeMo Models contain everything needed to train and reproduce state of the art Conversational AI -research and applications, including:

-
    -
  • neural network architectures

  • -
  • datasets/data loaders

  • -
  • data preprocessing/postprocessing

  • -
  • data augmentors

  • -
  • optimizers and schedulers

  • -
  • tokenizers

  • -
  • language models

  • -
-

NeMo uses Hydra for configuring both NeMo models and the PyTorch Lightning Trainer. -Depending on the domain and application, many different AI libraries will have to be configured -to build the application. Hydra makes it easy to bring all of these libraries together -so that each can be configured from .yaml or the Hydra CLI.

-
-

Note

-

Every NeMo model has an example configuration file and a corresponding script that contains all configurations needed for training.

-
-

The end result of using NeMo, PyTorch Lightning, and Hydra is that -NeMo models all have the same look and feel. This makes it easy to do Conversational AI research -across multiple domains. NeMo models are also fully compatible with the PyTorch ecosystem.

-
-

Installing NeMo

-

Before installing NeMo, please install Cython first.

-
pip install Cython
-
-
-

For ASR and TTS models, also install these Linux utilities.

-
apt-get update && apt-get install -y libsndfile1 ffmpeg
-
-
-

Then installing the latest NeMo release is a simple pip install.

-
pip install nemo_toolkit[all]==1.0.0b1
-
-
-

To install the main branch from GitHub:

-
python -m pip install git+https://github.com/NVIDIA/NeMo.git@main#egg=nemo_toolkit[all]
-
-
-

To install from a local clone of NeMo:

-
./reinstall.sh # from cloned NeMo's git root
-
-
-

For Docker users, the NeMo container is available on -NGC.

-
docker pull nvcr.io/nvidia/nemo:v1.0.0b1
-
-
-
docker run --runtime=nvidia -it --rm -v --shm-size=8g -p 8888:8888 -p 6006:6006 --ulimit memlock=-1 --ulimit stack=67108864 nvcr.io/nvidia/nemo:v1.0.0b1
-
-
-
-
-

Experiment Manager

-

NeMo’s Experiment Manager leverages PyTorch Lightning for model checkpointing, -TensorBoard Logging, and Weights and Biases logging. The Experiment Manager is included by default -in all NeMo example scripts.

-
exp_manager(trainer, cfg.get("exp_manager", None))
-
-
-

And is configurable via .yaml with Hydra.

-
exp_manager:
-    exp_dir: null
-    name: *name
-    create_tensorboard_logger: True
-    create_checkpoint_callback: True
-
-
-

Optionally launch Tensorboard to view training results in ./nemo_experiments (by default).

-
tensorboard --bind_all --logdir nemo_experiments
-
-
-
-
-
-
-

Automatic Speech Recognition (ASR)

-

Everything needed to train Convolutional ASR models is included with NeMo. -NeMo supports multiple Speech Recognition architectures, including Jasper and QuartzNet. -NeMo Speech Models -can be trained from scratch on custom datasets or -fine-tuned using pre-trained checkpoints trained on thousands of hours of audio -that can be restored for immediate use.

-

Some typical ASR tasks are included with NeMo:

- -

See this asr notebook -for a full tutorial on doing ASR with NeMo, PyTorch Lightning, and Hydra.

-
-

Specify ASR Model Configurations with YAML File

-

NeMo Models and the PyTorch Lightning Trainer can be fully configured from .yaml files using Hydra.

-

See this asr config -for the entire speech to text .yaml file.

-
# configure the PyTorch Lightning Trainer
-trainer:
-    gpus: 0 # number of gpus
-    max_epochs: 5
-    max_steps: null # computed at runtime if not set
-    num_nodes: 1
-    accelerator: ddp
-    ...
-# configure the ASR model
-model:
-    ...
-    encoder:
-        cls: nemo.collections.asr.modules.ConvASREncoder
-        params:
-            feat_in: *n_mels
-            activation: relu
-            conv_mask: true
-
-        jasper:
-            - filters: 128
-            repeat: 1
-            kernel: [11]
-            stride: [1]
-            dilation: [1]
-            dropout: *dropout
-            ...
-    # all other configuration, data, optimizer, preprocessor, etc
-    ...
-
-
-
-
-

Developing ASR Model From Scratch

-

speech_to_text.py

-
# hydra_runner calls hydra.main and is useful for multi-node experiments
-@hydra_runner(config_path="conf", config_name="config")
-def main(cfg):
-    trainer = Trainer(**cfg.trainer)
-    asr_model = EncDecCTCModel(cfg.model, trainer)
-    trainer.fit(asr_model)
-
-
-

Hydra makes every aspect of the NeMo model, -including the PyTorch Lightning Trainer, customizable from the command line.

-
python NeMo/examples/asr/speech_to_text.py --config-name=quartznet_15x5 \
-    trainer.accelerator=gpu \
-    trainer.devices=4 \
-    trainer.max_epochs=128 \
-    +trainer.precision=16 \
-    model.train_ds.manifest_filepath=<PATH_TO_DATA>/librispeech-train-all.json \
-    model.validation_ds.manifest_filepath=<PATH_TO_DATA>/librispeech-dev-other.json \
-    model.train_ds.batch_size=64 \
-    +model.validation_ds.num_workers=16 \
-    +model.train_ds.num_workers=16
-
-
-
-

Note

-

Training NeMo ASR models can take days/weeks so it is highly recommended to use multiple GPUs and multiple nodes with the PyTorch Lightning Trainer.

-
-
-
-

Using State-Of-The-Art Pre-trained ASR Model

-

Transcribe audio with QuartzNet model pretrained on ~3300 hours of audio.

-
quartznet = EncDecCTCModel.from_pretrained("QuartzNet15x5Base-En")
-
-files = ["path/to/my.wav"]  # file duration should be less than 25 seconds
-
-for fname, transcription in zip(files, quartznet.transcribe(paths2audio_files=files)):
-    print(f"Audio in {fname} was recognized as: {transcription}")
-
-
-

To see the available pretrained checkpoints:

-
EncDecCTCModel.list_available_models()
-
-
-
-
-

NeMo ASR Model Under the Hood

-

Any aspect of ASR training or model architecture design can easily be customized -with PyTorch Lightning since every NeMo model is a Lightning Module.

-
class EncDecCTCModel(ASRModel):
-    """Base class for encoder decoder CTC-based models."""
-
-    ...
-
-    def forward(self, input_signal, input_signal_length):
-        processed_signal, processed_signal_len = self.preprocessor(
-            input_signal=input_signal,
-            length=input_signal_length,
-        )
-        # Spec augment is not applied during evaluation/testing
-        if self.spec_augmentation is not None and self.training:
-            processed_signal = self.spec_augmentation(input_spec=processed_signal)
-        encoded, encoded_len = self.encoder(audio_signal=processed_signal, length=processed_signal_len)
-        log_probs = self.decoder(encoder_output=encoded)
-        greedy_predictions = log_probs.argmax(dim=-1, keepdim=False)
-        return log_probs, encoded_len, greedy_predictions
-
-    # PTL-specific methods
-    def training_step(self, batch, batch_nb):
-        audio_signal, audio_signal_len, transcript, transcript_len = batch
-        log_probs, encoded_len, predictions = self.forward(
-            input_signal=audio_signal, input_signal_length=audio_signal_len
-        )
-        loss_value = self.loss(
-            log_probs=log_probs, targets=transcript, input_lengths=encoded_len, target_lengths=transcript_len
-        )
-        wer_num, wer_denom = self._wer(predictions, transcript, transcript_len)
-        self.log_dict(
-            {
-                "train_loss": loss_value,
-                "training_batch_wer": wer_num / wer_denom,
-                "learning_rate": self._optimizer.param_groups[0]["lr"],
-            }
-        )
-        return loss_value
-
-
-
-
-

Neural Types in NeMo ASR

-

NeMo Models and Neural Modules come with Neural Type checking. -Neural type checking is extremely useful when combining many different neural -network architectures for a production-grade application.

-
@property
-def input_types(self) -> Optional[Dict[str, NeuralType]]:
-    if hasattr(self.preprocessor, "_sample_rate"):
-        audio_eltype = AudioSignal(freq=self.preprocessor._sample_rate)
-    else:
-        audio_eltype = AudioSignal()
-    return {
-        "input_signal": NeuralType(("B", "T"), audio_eltype),
-        "input_signal_length": NeuralType(tuple("B"), LengthsType()),
-    }
-
-
-@property
-def output_types(self) -> Optional[Dict[str, NeuralType]]:
-    return {
-        "outputs": NeuralType(("B", "T", "D"), LogprobsType()),
-        "encoded_lengths": NeuralType(tuple("B"), LengthsType()),
-        "greedy_predictions": NeuralType(("B", "T"), LabelsType()),
-    }
-
-
-
-
-
-
-

Natural Language Processing (NLP)

-

Everything needed to finetune BERT-like language models for NLP tasks is included with NeMo. -NeMo NLP Models -include HuggingFace Transformers -and NVIDIA Megatron-LM BERT and Bio-Megatron models. -NeMo can also be used for pretraining BERT-based language models from HuggingFace.

-

Any of the HuggingFace encoders or Megatron-LM encoders can easily be used for the NLP tasks -that are included with NeMo:

- -
-

Named Entity Recognition (NER)

-

NER (or more generally token classification) is the NLP task of detecting and classifying key information (entities) in text. -This task is very popular in Healthcare and Finance. In finance, for example, it can be important to identify -geographical, geopolitical, organizational, persons, events, and natural phenomenon entities. -See this NER notebook -for a full tutorial on doing NER with NeMo, PyTorch Lightning, and Hydra.

-
-
-

Specify NER Model Configurations with YAML File

-
-

Note

-

NeMo Models and the PyTorch Lightning Trainer can be fully configured from .yaml files using Hydra.

-
-

See this token classification config -for the entire NER (token classification) .yaml file.

-
# configure any argument of the PyTorch Lightning Trainer
-trainer:
-    gpus: 1 # the number of gpus, 0 for CPU
-    num_nodes: 1
-    max_epochs: 5
-    ...
-# configure any aspect of the token classification model here
-model:
-    dataset:
-        data_dir: ??? # /path/to/data
-        class_balancing: null # choose from [null, weighted_loss]. Weighted_loss enables the weighted class balancing of the loss, may be used for handling unbalanced classes
-        max_seq_length: 128
-        ...
-  tokenizer:
-    tokenizer_name: ${model.language_model.pretrained_model_name} # or sentencepiece
-    vocab_file: null # path to vocab file
-    ...
-# the language model can be from HuggingFace or Megatron-LM
-language_model:
-    pretrained_model_name: bert-base-uncased
-    lm_checkpoint: null
-    ...
-# the classifier for the downstream task
-  head:
-    num_fc_layers: 2
-    fc_dropout: 0.5
-    activation: 'relu'
-    ...
-# all other configuration: train/val/test/ data, optimizer, experiment manager, etc
-...
-
-
-
-
-

Developing NER Model From Scratch

-

token_classification.py

-
# hydra_runner calls hydra.main and is useful for multi-node experiments
-@hydra_runner(config_path="conf", config_name="token_classification_config")
-def main(cfg: DictConfig) -> None:
-    trainer = pl.Trainer(**cfg.trainer)
-    model = TokenClassificationModel(cfg.model, trainer=trainer)
-    trainer.fit(model)
-
-
-

After training, we can do inference with the saved NER model using PyTorch Lightning.

-

Inference from file:

-
gpu = 1 if cfg.trainer.gpus != 0 else 0
-trainer = pl.Trainer(accelerator="gpu", devices=gpu)
-model.set_trainer(trainer)
-model.evaluate_from_file(
-    text_file=os.path.join(cfg.model.dataset.data_dir, cfg.model.validation_ds.text_file),
-    labels_file=os.path.join(cfg.model.dataset.data_dir, cfg.model.validation_ds.labels_file),
-    output_dir=exp_dir,
-    add_confusion_matrix=True,
-    normalize_confusion_matrix=True,
-)
-
-
-

Or we can run inference on a few examples:

-
queries = ["we bought four shirts from the nvidia gear store in santa clara.", "Nvidia is a company in Santa Clara."]
-results = model.add_predictions(queries)
-
-for query, result in zip(queries, results):
-    logging.info(f"Query : {query}")
-    logging.info(f"Result: {result.strip()}\n")
-
-
-

Hydra makes every aspect of the NeMo model, including the PyTorch Lightning Trainer, customizable from the command line.

-
python token_classification.py \
-    model.language_model.pretrained_model_name=bert-base-cased \
-    model.head.num_fc_layers=2 \
-    model.dataset.data_dir=/path/to/my/data  \
-    trainer.max_epochs=5 \
-    trainer.accelerator=gpu \
-    trainer.devices=[0,1]
-
-
-
-
-
-

Tokenizers

-

Tokenization is the process of converting natural language text into integer arrays -which can be used for machine learning. -For NLP tasks, tokenization is an essential part of data preprocessing. -NeMo supports all BERT-like model tokenizers from -HuggingFace’s AutoTokenizer -and also supports Google’s SentencePieceTokenizer -which can be trained on custom data.

-

To see the list of supported tokenizers:

-
from nemo.collections import nlp as nemo_nlp
-
-nemo_nlp.modules.get_tokenizer_list()
-
-
-

See this tokenizer notebook -for a full tutorial on using tokenizers in NeMo.

-
-
-

Language Models

-

Language models are used to extract information from (tokenized) text. -Much of the state-of-the-art in natural language processing is achieved -by fine-tuning pretrained language models on the downstream task.

-

With NeMo, you can either pretrain -a BERT model on your data or use a pretrained language model from HuggingFace Transformers -or NVIDIA Megatron-LM.

-

To see the list of language models available in NeMo:

-
nemo_nlp.modules.get_pretrained_lm_models_list(include_external=True)
-
-
-

Easily switch between any language model in the above list by using .get_lm_model.

-
nemo_nlp.modules.get_lm_model(pretrained_model_name="distilbert-base-uncased")
-
-
-

See this language model notebook -for a full tutorial on using pretrained language models in NeMo.

-
-
-

Using a Pre-trained NER Model

-

NeMo has pre-trained NER models that can be used -to get started with Token Classification right away. -Models are automatically downloaded from NGC, -cached locally to disk, -and loaded into GPU memory using the .from_pretrained method.

-
# load pre-trained NER model
-pretrained_ner_model = TokenClassificationModel.from_pretrained(model_name="NERModel")
-
-# define the list of queries for inference
-queries = [
-    "we bought four shirts from the nvidia gear store in santa clara.",
-    "Nvidia is a company.",
-    "The Adventures of Tom Sawyer by Mark Twain is an 1876 novel about a young boy growing "
-    + "up along the Mississippi River.",
-]
-results = pretrained_ner_model.add_predictions(queries)
-
-for query, result in zip(queries, results):
-    print()
-    print(f"Query : {query}")
-    print(f"Result: {result.strip()}\n")
-
-
-
-
-

NeMo NER Model Under the Hood

-

Any aspect of NLP training or model architecture design can easily be customized with PyTorch Lightning -since every NeMo model is a Lightning Module.

-
class TokenClassificationModel(ModelPT):
-    """
-    Token Classification Model with BERT, applicable for tasks such as Named Entity Recognition
-    """
-
-    ...
-
-    def forward(self, input_ids, token_type_ids, attention_mask):
-        hidden_states = self.bert_model(
-            input_ids=input_ids, token_type_ids=token_type_ids, attention_mask=attention_mask
-        )
-        logits = self.classifier(hidden_states=hidden_states)
-        return logits
-
-    # PTL-specific methods
-    def training_step(self, batch, batch_idx):
-        """
-        Lightning calls this inside the training loop with the data from the training dataloader
-        passed in as `batch`.
-        """
-        input_ids, input_type_ids, input_mask, subtokens_mask, loss_mask, labels = batch
-        logits = self(input_ids=input_ids, token_type_ids=input_type_ids, attention_mask=input_mask)
-
-        loss = self.loss(logits=logits, labels=labels, loss_mask=loss_mask)
-        self.log_dict({"train_loss": loss, "lr": self._optimizer.param_groups[0]["lr"]})
-        return loss
-
-    ...
-
-
-
-
-

Neural Types in NeMo NLP

-

NeMo Models and Neural Modules come with Neural Type checking. -Neural type checking is extremely useful when combining many different neural network architectures -for a production-grade application.

-
@property
-def input_types(self) -> Optional[Dict[str, NeuralType]]:
-    return self.bert_model.input_types
-
-
-@property
-def output_types(self) -> Optional[Dict[str, NeuralType]]:
-    return self.classifier.output_types
-
-
-
-
-
-
-

Text-To-Speech (TTS)

-

Everything needed to train TTS models and generate audio is included with NeMo. -NeMo TTS Models -can be trained from scratch on your own data or pretrained models can be downloaded -automatically. NeMo currently supports a two step inference procedure. -First, a model is used to generate a mel spectrogram from text. -Second, a model is used to generate audio from a mel spectrogram.

-

Mel Spectrogram Generators:

- -

Audio Generators:

- -
-

Specify TTS Model Configurations with YAML File

-
-

Note

-

NeMo Models and PyTorch Lightning Trainer can be fully configured from .yaml files using Hydra.

-
-

tts/conf/glow_tts.yaml

-
# configure the PyTorch Lightning Trainer
-trainer:
-    gpus: -1 # number of gpus
-    max_epochs: 350
-    num_nodes: 1
-    accelerator: ddp
-    ...
-
-# configure the TTS model
-model:
-    ...
-    encoder:
-        cls: nemo.collections.tts.modules.glow_tts.TextEncoder
-            params:
-            n_vocab: 148
-            out_channels: *n_mels
-            hidden_channels: 192
-            filter_channels: 768
-            filter_channels_dp: 256
-            ...
-# all other configuration, data, optimizer, parser, preprocessor, etc
-...
-
-
-
-
-

Developing TTS Model From Scratch

-

tts/glow_tts.py

-
# hydra_runner calls hydra.main and is useful for multi-node experiments
-@hydra_runner(config_path="conf", config_name="glow_tts")
-def main(cfg):
-    trainer = pl.Trainer(**cfg.trainer)
-    model = GlowTTSModel(cfg=cfg.model, trainer=trainer)
-    trainer.fit(model)
-
-
-

Hydra makes every aspect of the NeMo model, including the PyTorch Lightning Trainer, customizable from the command line.

-
python NeMo/examples/tts/glow_tts.py \
-    trainer.accelerator=gpu \
-    trainer.devices=4 \
-    trainer.max_epochs=400 \
-    ...
-    train_dataset=/path/to/train/data \
-    validation_datasets=/path/to/val/data \
-    model.train_ds.batch_size = 64 \
-
-
-
-

Note

-

Training NeMo TTS models from scratch can take days or weeks so it is highly recommended to use multiple GPUs and multiple nodes with the PyTorch Lightning Trainer.

-
-
-
-

Using State-Of-The-Art Pre-trained TTS Model

-

Generate speech using models trained on LJSpeech (https://keithito.com/LJ-Speech-Dataset/), -around 24 hours of single-speaker data.

-

See this TTS notebook -for a full tutorial on generating speech with NeMo, PyTorch Lightning, and Hydra.

-
# load pretrained spectrogram model
-spec_gen = SpecModel.from_pretrained("GlowTTS-22050Hz").cuda()
-
-# load pretrained Generators
-vocoder = WaveGlowModel.from_pretrained("WaveGlow-22050Hz").cuda()
-
-
-def infer(spec_gen_model, vocder_model, str_input):
-    with torch.no_grad():
-        parsed = spec_gen.parse(text_to_generate)
-        spectrogram = spec_gen.generate_spectrogram(tokens=parsed)
-        audio = vocoder.convert_spectrogram_to_audio(spec=spectrogram)
-    if isinstance(spectrogram, torch.Tensor):
-        spectrogram = spectrogram.to("cpu").numpy()
-    if len(spectrogram.shape) == 3:
-        spectrogram = spectrogram[0]
-    if isinstance(audio, torch.Tensor):
-        audio = audio.to("cpu").numpy()
-    return spectrogram, audio
-
-
-text_to_generate = input("Input what you want the model to say: ")
-spec, audio = infer(spec_gen, vocoder, text_to_generate)
-
-
-

To see the available pretrained checkpoints:

-
# spec generator
-GlowTTSModel.list_available_models()
-
-# vocoder
-WaveGlowModel.list_available_models()
-
-
-
-
-

NeMo TTS Model Under the Hood

-

Any aspect of TTS training or model architecture design can easily -be customized with PyTorch Lightning since every NeMo model is a LightningModule.

-

glow_tts.py

-
class GlowTTSModel(SpectrogramGenerator):
-    """
-    GlowTTS model used to generate spectrograms from text
-    Consists of a text encoder and an invertible spectrogram decoder
-    """
-
-    ...
-    # NeMo models come with neural type checking
-    @typecheck(
-        input_types={
-            "x": NeuralType(("B", "T"), TokenIndex()),
-            "x_lengths": NeuralType(("B"), LengthsType()),
-            "y": NeuralType(("B", "D", "T"), MelSpectrogramType(), optional=True),
-            "y_lengths": NeuralType(("B"), LengthsType(), optional=True),
-            "gen": NeuralType(optional=True),
-            "noise_scale": NeuralType(optional=True),
-            "length_scale": NeuralType(optional=True),
-        }
-    )
-    def forward(self, *, x, x_lengths, y=None, y_lengths=None, gen=False, noise_scale=0.3, length_scale=1.0):
-        if gen:
-            return self.glow_tts.generate_spect(
-                text=x, text_lengths=x_lengths, noise_scale=noise_scale, length_scale=length_scale
-            )
-        else:
-            return self.glow_tts(text=x, text_lengths=x_lengths, spect=y, spect_lengths=y_lengths)
-
-    ...
-
-    def step(self, y, y_lengths, x, x_lengths):
-        z, y_m, y_logs, logdet, logw, logw_, y_lengths, attn = self(
-            x=x, x_lengths=x_lengths, y=y, y_lengths=y_lengths, gen=False
-        )
-
-        l_mle, l_length, logdet = self.loss(
-            z=z,
-            y_m=y_m,
-            y_logs=y_logs,
-            logdet=logdet,
-            logw=logw,
-            logw_=logw_,
-            x_lengths=x_lengths,
-            y_lengths=y_lengths,
-        )
-
-        loss = sum([l_mle, l_length])
-
-        return l_mle, l_length, logdet, loss, attn
-
-    # PTL-specific methods
-    def training_step(self, batch, batch_idx):
-        y, y_lengths, x, x_lengths = batch
-
-        y, y_lengths = self.preprocessor(input_signal=y, length=y_lengths)
-
-        l_mle, l_length, logdet, loss, _ = self.step(y, y_lengths, x, x_lengths)
-
-        self.log_dict({"l_mle": l_mle, "l_length": l_length, "logdet": logdet}, prog_bar=True)
-        return loss
-
-    ...
-
-
-
-
-

Neural Types in NeMo TTS

-

NeMo Models and Neural Modules come with Neural Type checking. -Neural type checking is extremely useful when combining many different neural network architectures -for a production-grade application.

-
@typecheck(
-    input_types={
-        "x": NeuralType(("B", "T"), TokenIndex()),
-        "x_lengths": NeuralType(("B"), LengthsType()),
-        "y": NeuralType(("B", "D", "T"), MelSpectrogramType(), optional=True),
-        "y_lengths": NeuralType(("B"), LengthsType(), optional=True),
-        "gen": NeuralType(optional=True),
-        "noise_scale": NeuralType(optional=True),
-        "length_scale": NeuralType(optional=True),
-    }
-)
-def forward(self, *, x, x_lengths, y=None, y_lengths=None, gen=False, noise_scale=0.3, length_scale=1.0):
-    ...
-
-
-
-
-
-
-

Learn More

- -
-

Note

-

NeMo tutorial notebooks can be run on Google Colab.

-
-

NVIDIA NeMo is actively being developed on GitHub. -Contributions are welcome!

-
-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/ecosystem/bolts.html b/docs/ecosystem/bolts.html deleted file mode 100644 index d57cea8..0000000 --- a/docs/ecosystem/bolts.html +++ /dev/null @@ -1,774 +0,0 @@ - - - - - - - - - - - - - - Lightning Bolts — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- - - - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Lightning Bolts

-

PyTorch Lightning Bolts is our official collection -of prebuilt models across many research domains.

-
pip install lightning-bolts
-
-
-

In bolts we have:

-
    -
  • A collection of pretrained state-of-the-art models.

  • -
  • A collection of models designed to bootstrap your research.

  • -
  • A collection of callbacks, transforms, full datasets.

  • -
  • All models work on CPUs, TPUs, GPUs and 16-bit precision.

  • -
-
-
-

Quality control

-

The Lightning community builds bolts and contributes them to Bolts. -The lightning team guarantees that contributions are:

-
    -
  • Rigorously Tested (CPUs, GPUs, TPUs).

  • -
  • Rigorously Documented.

  • -
  • Standardized via PyTorch Lightning.

  • -
  • Optimized for speed.

  • -
  • Checked for correctness.

  • -
-
-
-
-

Example 1: Pretrained, prebuilt models

-
from pl_bolts.models import VAE, GPT2, ImageGPT, PixelCNN
-from pl_bolts.models.self_supervised import AMDIM, CPCV2, SimCLR, MocoV2
-from pl_bolts.models import LinearRegression, LogisticRegression
-from pl_bolts.models.gans import GAN
-from pl_bolts.callbacks import PrintTableMetricsCallback
-from pl_bolts.datamodules import FashionMNISTDataModule, CIFAR10DataModule, ImagenetDataModule
-
-
-
-
-
-

Example 2: Extend for faster research

-

Bolts are contributed with benchmarks and continuous-integration tests. This means -you can trust the implementations and use them to bootstrap your research much faster.

-
from pl_bolts.models import ImageGPT
-from pl_bolts.self_supervised import SimCLR
-
-
-class VideoGPT(ImageGPT):
-    def training_step(self, batch, batch_idx):
-        x, y = batch
-        x = _shape_input(x)
-
-        logits = self.gpt(x)
-        simclr_features = self.simclr(x)
-
-        # -----------------
-        # do something new with GPT logits + simclr_features
-        # -----------------
-
-        loss = self.criterion(logits.view(-1, logits.size(-1)), x.view(-1).long())
-
-        self.log("loss", loss)
-        return loss
-
-
-
-
-
-

Example 3: Callbacks

-

We also have a collection of callbacks.

-
from pl_bolts.callbacks import PrintTableMetricsCallback
-import pytorch_lightning as pl
-
-trainer = pl.Trainer(callbacks=[PrintTableMetricsCallback()])
-
-# loss│train_loss│val_loss│epoch
-# ──────────────────────────────
-# 2.2541470527648926│2.2541470527648926│2.2158432006835938│0
-
-
-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/ecosystem/community_examples.html b/docs/ecosystem/community_examples.html deleted file mode 100644 index a118818..0000000 --- a/docs/ecosystem/community_examples.html +++ /dev/null @@ -1,721 +0,0 @@ - - - - - - - - - - - - - - Community Examples — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Community Examples
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
- - - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/ecosystem/ecosystem-ci.html b/docs/ecosystem/ecosystem-ci.html deleted file mode 100644 index c87cf75..0000000 --- a/docs/ecosystem/ecosystem-ci.html +++ /dev/null @@ -1,712 +0,0 @@ - - - - - - - - - - - - - - Ecosystem CI — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- - - - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Ecosystem CI

-

Ecosystem CI automates issue discovery for your projects against Lightning nightly and releases. -It is a lightweight repository that provides easy configuration of Continuous Integration running on CPUs and GPUs. -Any user who wants to keep their project aligned with current and future Lightning releases can use the Ecosystem CI to configure their integrations. -Read more: Stay Ahead of Breaking Changes with the New Lightning Ecosystem CI

-
-
-

Integrate a New Project

-

Follow the instructions below to add a new project to the PyTorch Lightning ecosystem.

-
    -
  1. Fork the ecosystem CI repository to be able to create a new Pull Request and work within a specific branch.

  2. -
  3. Create a new config file in configs/<Organization-name> folder and call it <project-name>.yaml.

  4. -
  5. Define runtime for CPU and link the config for GPU: -For CPU integrations, list OS and Python version combination to be running with GitHub actions. -For GPU integrations, you only add the path to the config (OS/Linux and Python version is fixed) to be running with Azure pipelines.

  6. -
  7. Add a Contact to the .github/CODEOWNERS list for your organization folder or just a single project.

  8. -
  9. Create a Draft PR with all mentioned requirements.

  10. -
  11. (Optional) Join our Slack channel #alerts-ecosystem-ci to be notified if your project is breaking.

  12. -
-

To learn more about Ecosystem CI, please refer to the Ecosystem CI repo. -Also, note that some particular implementation details described above may evolve over time.

-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- -
- -
-
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/ecosystem/flash.html b/docs/ecosystem/flash.html deleted file mode 100644 index 91e2e95..0000000 --- a/docs/ecosystem/flash.html +++ /dev/null @@ -1,757 +0,0 @@ - - - - - - - - - - - - - - Lightning Flash — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- - - - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Lightning Flash

-

Lightning Flash is a high-level deep learning framework for fast prototyping, baselining, fine-tuning, and solving deep learning problems. -Flash makes complex AI recipes for over 15 tasks across 7 data domains accessible to all. -It is built for beginners with a simple API that requires very little deep learning background, and for data scientists, Kagglers, applied ML practitioners, and deep learning researchers that -want a quick way to get a deep learning baseline with advanced features PyTorch Lightning offers.

-
pip install lightning-flash
-
-
-
-
-

Using Lightning Flash in 3 Steps!

-
-

1. Load your Data

-

All data loading in Flash is performed via a from_* classmethod of a DataModule. -Which DataModule to use and which from_* methods are available depends on the task you want to perform. -For example, for image segmentation where your data is stored in folders, you would use the SemanticSegmentationData’s from_folders method:

-
from flash.image import SemanticSegmentationData
-
-dm = SemanticSegmentationData.from_folders(
-    train_folder="data/CameraRGB",
-    train_target_folder="data/CameraSeg",
-    val_split=0.1,
-    image_size=(256, 256),
-    num_classes=21,
-)
-
-
-
-
-
-

2. Configure your Model

-

Our tasks come loaded with pre-trained backbones and (where applicable) heads. -You can view the available backbones to use with your task using available_backbones. -Once you’ve chosen, create the model:

-
from flash.image import SemanticSegmentation
-
-print(SemanticSegmentation.available_heads())
-# ['deeplabv3', 'deeplabv3plus', 'fpn', ..., 'unetplusplus']
-
-print(SemanticSegmentation.available_backbones("fpn"))
-# ['densenet121', ..., 'xception'] # + 113 models
-
-print(SemanticSegmentation.available_pretrained_weights("efficientnet-b0"))
-# ['imagenet', 'advprop']
-
-model = SemanticSegmentation(head="fpn", backbone="efficientnet-b0", pretrained="advprop", num_classes=dm.num_classes)
-
-
-
-
-
-

3. Finetune!

-
from flash import Trainer
-
-trainer = Trainer(max_epochs=3)
-trainer.finetune(model, datamodule=datamodule, strategy="freeze")
-trainer.save_checkpoint("semantic_segmentation_model.pt")
-
-
-

To learn more about Lightning Flash, please refer to the Lightning Flash documentation.

-
-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/ecosystem/metrics.html b/docs/ecosystem/metrics.html deleted file mode 100644 index 40f9b18..0000000 --- a/docs/ecosystem/metrics.html +++ /dev/null @@ -1,771 +0,0 @@ - - - - - - - - - - - - - - TorchMetrics — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- - - - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

TorchMetrics

-

TorchMetrics is a collection of machine learning metrics for distributed, -scalable PyTorch models and an easy-to-use API to create custom metrics. It has a collection of 60+ PyTorch metrics implementations and -is rigorously tested for all edge cases.

-
pip install torchmetrics
-
-
-

In TorchMetrics, we offer the following benefits:

-
    -
  • A standardized interface to increase reproducibility

  • -
  • Reduced Boilerplate

  • -
  • Distributed-training compatible

  • -
  • Rigorously tested

  • -
  • Automatic accumulation over batches

  • -
  • Automatic synchronization across multiple devices

  • -
-
-
-

Example 1: Functional Metrics

-

Below is a simple example for calculating the accuracy using the functional interface:

-
import torch
-import torchmetrics
-
-# simulate a classification problem
-preds = torch.randn(10, 5).softmax(dim=-1)
-target = torch.randint(5, (10,))
-
-acc = torchmetrics.functional.accuracy(preds, target)
-
-
-
-
-
-

Example 2: Module Metrics

-

The example below shows how to use the class-based interface:

-
import torch
-import torchmetrics
-
-# initialize metric
-metric = torchmetrics.Accuracy()
-
-n_batches = 10
-for i in range(n_batches):
-    # simulate a classification problem
-    preds = torch.randn(10, 5).softmax(dim=-1)
-    target = torch.randint(5, (10,))
-    # metric on current batch
-    acc = metric(preds, target)
-    print(f"Accuracy on batch {i}: {acc}")
-
-# metric on all batches using custom accumulation
-acc = metric.compute()
-print(f"Accuracy on all data: {acc}")
-
-# Resetting internal state so that the metric is ready for new data
-metric.reset()
-
-
-
-
-
-

Example 3: TorchMetrics with Lightning

-

The example below shows how to use a metric in your LightningModule:

-
class MyModel(LightningModule):
-    def __init__(self):
-        ...
-        self.accuracy = torchmetrics.Accuracy()
-
-    def training_step(self, batch, batch_idx):
-        x, y = batch
-        preds = self(x)
-        ...
-        # log step metric
-        self.accuracy(preds, y)
-        self.log("train_acc_step", self.accuracy, on_epoch=True)
-        ...
-
-
-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/ecosystem/transformers.html b/docs/ecosystem/transformers.html deleted file mode 100644 index 674eea4..0000000 --- a/docs/ecosystem/transformers.html +++ /dev/null @@ -1,725 +0,0 @@ - - - - - - - - - - - - - - Lightning Transformers — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Lightning Transformers
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Lightning Transformers

-

Lightning Transformers offers a flexible interface for training and fine-tuning SOTA Transformer models -using the PyTorch Lightning Trainer.

-
pip install lightning-transformers
-
-
-

In Lightning Transformers, we offer the following benefits:

-
    -
  • Powered by PyTorch Lightning - Accelerators, custom Callbacks, Loggers, and high performance scaling with minimal changes.

  • -
  • Backed by HuggingFace Transformers models and datasets, spanning multiple modalities and tasks within NLP/Audio and Vision.

  • -
  • Task Abstraction for Rapid Research & Experimentation - Build your own custom transformer tasks across all modalities with little friction.

  • -
  • Powerful config composition backed by Hydra - simply swap out models, optimizers, schedulers task, and many more configurations without touching the code.

  • -
  • Seamless Memory and Speed Optimizations - Out-of-the-box training optimizations such as DeepSpeed ZeRO or FairScale Sharded Training with no code changes.

  • -
-
-
-

Using Lightning-Transformers

-

Lightning Transformers has a collection of tasks for common NLP problems such as language_modeling, -translation and more. To use, simply:

-
    -
  1. Pick a task to train (passed to train.py as task=)

  2. -
  3. Pick a dataset (passed to train.py as dataset=)

  4. -
  5. Customize the backbone, optimizer, or any component within the config

  6. -
  7. Add any Lightning supported parameters and optimizations

  8. -
-
python train.py \
-    task=<TASK> \
-    dataset=<DATASET>
-    backbone.pretrained_model_name_or_path=<BACKBONE> # Optionally change the HF backbone
-    optimizer=<OPTIMIZER> # Optionally specify optimizer (Default AdamW)
-    trainer.<ANY_TRAINER_FLAGS> # Optionally specify Lightning trainer arguments
-
-
-

To learn more about Lightning Transformers, please refer to the Lightning Transformers documentation.

-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/expertise_levels.html b/docs/expertise_levels.html deleted file mode 100644 index 14258c2..0000000 --- a/docs/expertise_levels.html +++ /dev/null @@ -1,1006 +0,0 @@ - - - - - - - - - - - - - - Level up — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- - - - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Level up

-

Learn enough Lightning to match the level of expertise required by your research or job.

-

-
-
-

Basic skills

-

Learn the basics of model development with Lightning. Researchers and machine learning engineers should start here.

-
-
-
-

Intermediate skills

-

Learn to scale up your models and enable collaborative model development at academic or industry research labs.

-
-
-
-

Advanced skills

-

Configure all aspects of Lightning for advanced use cases.

-
-
-
-

Expert skills

-

Customize and extend Lightning for things like custom hardware or distributed strategies.

-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/extensions/accelerator.html b/docs/extensions/accelerator.html deleted file mode 100644 index 8592b6d..0000000 --- a/docs/extensions/accelerator.html +++ /dev/null @@ -1,819 +0,0 @@ - - - - - - - - - - - - - - Accelerator — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- - - - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Accelerator

-

The Accelerator connects a Lightning Trainer to arbitrary hardware (CPUs, GPUs, TPUs, IPUs, …). -Currently there are accelerators for:

- -

The Accelerator is part of the Strategy which manages communication across multiple devices (distributed communication). -Whenever the Trainer, the loops or any other component in Lightning needs to talk to hardware, it calls into the Strategy and the Strategy calls into the Accelerator.

-Illustration of the Strategy as a composition of the Accelerator and several plugins -

We expose Accelerators and Strategies mainly for expert users who want to extend Lightning to work with new -hardware and distributed training or clusters.

-
-
-

Create a Custom Accelerator

-

Here is how you create a new Accelerator. -Let’s pretend we want to integrate the fictional XPU accelerator and we have access to its hardware through a library -xpulib.

-
import xpulib
-
-
-class XPUAccelerator(Accelerator):
-    """Experimental support for XPU, optimized for large-scale machine learning."""
-
-    @staticmethod
-    def parse_devices(devices: Any) -> Any:
-        # Put parsing logic here how devices can be passed into the Trainer
-        # via the `devices` argument
-        return devices
-
-    @staticmethod
-    def get_parallel_devices(devices: Any) -> Any:
-        # Here, convert the device indices to actual device objects
-        return [torch.device("xpu", idx) for idx in devices]
-
-    @staticmethod
-    def auto_device_count() -> int:
-        # Return a value for auto-device selection when `Trainer(devices="auto")`
-        return xpulib.available_devices()
-
-    @staticmethod
-    def is_available() -> bool:
-        return xpulib.is_available()
-
-    def get_device_stats(self, device: Union[str, torch.device]) -> Dict[str, Any]:
-        # Return optional device statistics for loggers
-        return {}
-
-
-

Finally, add the XPUAccelerator to the Trainer:

-
from pytorch_lightning import Trainer
-
-accelerator = XPUAccelerator()
-trainer = Trainer(accelerator=accelerator, devices=2)
-
-
-

Learn more about Strategies and how they interact with the Accelerator.

-
-
-
-

Registering Accelerators

-

If you wish to switch to a custom accelerator from the CLI without code changes, you can implement the register_accelerators() class method to register your new accelerator under a shorthand name like so:

-
class XPUAccelerator(Accelerator):
-    ...
-
-    @classmethod
-    def register_accelerators(cls, accelerator_registry):
-        accelerator_registry.register(
-            "xpu",
-            cls,
-            description=f"XPU Accelerator - optimized for large-scale machine learning.",
-        )
-
-
-

Now, this is possible:

-
trainer = Trainer(accelerator="xpu")
-
-
-

Or if you are using the Lightning CLI, for example:

-
python train.py fit --trainer.accelerator=xpu --trainer.devices=2
-
-
-
-
-
-

Accelerator API

- ---- - - - - - - - - - - - - - - - - - - - - -

Accelerator

The Accelerator Base Class.

CPUAccelerator

Accelerator for CPU devices.

GPUAccelerator

Accelerator for GPU devices.

HPUAccelerator

Accelerator for HPU devices.

IPUAccelerator

Accelerator for IPUs.

TPUAccelerator

Accelerator for TPU devices.

-
-
- - -
- -
-
- - - - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/extensions/callbacks.html b/docs/extensions/callbacks.html deleted file mode 100644 index 43b5687..0000000 --- a/docs/extensions/callbacks.html +++ /dev/null @@ -1,1655 +0,0 @@ - - - - - - - - - - - - - - Callback — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- - - - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Callback

-
-

-
-

A callback is a self-contained program that can be reused across projects.

-

Lightning has a callback system to execute them when needed. Callbacks should capture NON-ESSENTIAL -logic that is NOT required for your lightning module to run.

-

Here’s the flow of how the callback hooks are executed:

-

An overall Lightning system should have:

-
    -
  1. Trainer for all engineering

  2. -
  3. LightningModule for all research code.

  4. -
  5. Callbacks for non-essential code.

  6. -
-
-

-
-

Example:

-
from pytorch_lightning.callbacks import Callback
-
-
-class MyPrintingCallback(Callback):
-    def on_train_start(self, trainer, pl_module):
-        print("Training is starting")
-
-    def on_train_end(self, trainer, pl_module):
-        print("Training is ending")
-
-
-trainer = Trainer(callbacks=[MyPrintingCallback()])
-
-
-

We successfully extended functionality without polluting our super clean -lightning module research code.

-
-
-

Examples

-

You can do pretty much anything with callbacks.

- -
-
-
-

Built-in Callbacks

-

Lightning has a few built-in callbacks.

-
-

Note

-

For a richer collection of callbacks, check out our -bolts library.

-
- ---- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -

BackboneFinetuning

Finetune a backbone model based on a user-defined learning rate schedule.

BaseFinetuning

This class implements the base logic for writing your own Finetuning Callback.

BasePredictionWriter

Base class to implement how the predictions should be stored.

Callback

Abstract base class used to build new callbacks.

DeviceStatsMonitor

Automatically monitors and logs device stats during training stage.

EarlyStopping

Monitor a metric and stop training when it stops improving.

GradientAccumulationScheduler

Change gradient accumulation factor according to scheduling.

LambdaCallback

Create a simple callback on the fly using lambda functions.

LearningRateMonitor

Automatically monitors and logs the learning rate for learning rate schedulers during training.

ModelCheckpoint

Save the model periodically by monitoring a quantity.

ModelPruning

Model pruning Callback, using PyTorch's prune utilities.

ModelSummary

Generates a summary of all layers in a LightningModule.

ProgressBarBase

The base class for progress bars in Lightning.

QuantizationAwareTraining

Quantization allows speeding up inference and decreasing memory requirements by performing computations and storing tensors at lower bitwidths (such as INT8 or FLOAT16) than floating point precision.

RichModelSummary

Generates a summary of all layers in a LightningModule with rich text formatting.

RichProgressBar

Create a progress bar with rich text formatting.

-

StochasticWeightAveraging

Implements the Stochastic Weight Averaging (SWA) Callback to average a model.

Timer

The Timer callback tracks the time spent in the training, validation, and test loops and interrupts the Trainer if the given time limit for the training loop is reached.

TQDMProgressBar

This is the default progress bar used by Lightning.

-
-
-
-

Save Callback state

-

Some callbacks require internal state in order to function properly. You can optionally -choose to persist your callback’s state as part of model checkpoint files using -state_dict() and load_state_dict(). -Note that the returned state must be able to be pickled.

-

When your callback is meant to be used only as a singleton callback then implementing the above two hooks is enough -to persist state effectively. However, if passing multiple instances of the callback to the Trainer is supported, then -the callback must define a state_key property in order for Lightning -to be able to distinguish the different states when loading the callback state. This concept is best illustrated by -the following example.

-
class Counter(Callback):
-    def __init__(self, what="epochs", verbose=True):
-        self.what = what
-        self.verbose = verbose
-        self.state = {"epochs": 0, "batches": 0}
-
-    @property
-    def state_key(self):
-        # note: we do not include `verbose` here on purpose
-        return self._generate_state_key(what=self.what)
-
-    def on_train_epoch_end(self, *args, **kwargs):
-        if self.what == "epochs":
-            self.state["epochs"] += 1
-
-    def on_train_batch_end(self, *args, **kwargs):
-        if self.what == "batches":
-            self.state["batches"] += 1
-
-    def load_state_dict(self, state_dict):
-        self.state.update(state_dict)
-
-    def state_dict(self):
-        return self.state.copy()
-
-
-# two callbacks of the same type are being used
-trainer = Trainer(callbacks=[Counter(what="epochs"), Counter(what="batches")])
-
-
-

A Lightning checkpoint from this Trainer with the two stateful callbacks will include the following information:

-
{
-    "state_dict": ...,
-    "callbacks": {
-        "Counter{'what': 'batches'}": {"batches": 32, "epochs": 0},
-        "Counter{'what': 'epochs'}": {"batches": 0, "epochs": 2},
-        ...
-    }
-}
-
-
-

The implementation of a state_key is essential here. If it were missing, -Lightning would not be able to disambiguate the state for these two callbacks, because state_key -by default only uses the class name as the key, e.g., here Counter.

-
-
-
-

Best Practices

-

The following are best practices when using/designing callbacks.

-
    -
  1. Callbacks should be isolated in their functionality.

  2. -
  3. Your callback should not rely on the behavior of other callbacks in order to work properly.

  4. -
  5. Do not manually call methods from the callback.

  6. -
  7. Directly calling methods (e.g. on_validation_end) is strongly discouraged.

  8. -
  9. Whenever possible, your callbacks should not depend on the order in which they are executed.

  10. -
-
-
-
-

Callback API

-

Here is the full API of methods available in the Callback base class.

-

The Callback class is the base for all the callbacks in Lightning, just like the LightningModule is the base for all models. -It defines a public interface that each callback implementation must follow; the key members are:

-
-

Properties

-
-

state_key

-
-
-Callback.state_key
-

Identifier for the state of the callback.

-

Used to store and retrieve a callback’s state from the checkpoint dictionary by -checkpoint["callbacks"][state_key]. Implementations of a callback need to provide a unique state key if 1) -the callback has state and 2) it is desired to maintain the state of multiple instances of that callback.

-
-
Return type
-

str

-
-
-
- -
-
-
-

Hooks

-
-

on_configure_sharded_model

-
-
-Callback.on_configure_sharded_model(trainer, pl_module)[source]
-
-

Deprecated since version v1.6: This callback hook was deprecated in v1.6 and will be removed in v1.8. Use setup() instead.

-
-

Called before configure sharded model.

-
-
Return type
-

None

-
-
-
- -
-
-

setup

-
-
-Callback.setup(trainer, pl_module, stage=None)[source]
-

Called when fit, validate, test, predict, or tune begins.

-
-
Return type
-

None

-
-
-
- -
-
-

teardown

-
-
-Callback.teardown(trainer, pl_module, stage=None)[source]
-

Called when fit, validate, test, predict, or tune ends.

-
-
Return type
-

None

-
-
-
- -
-
-

on_init_start

-
-
-Callback.on_init_start(trainer)[source]
-
-

Deprecated since version v1.6: This callback hook was deprecated in v1.6 and will be removed in v1.8.

-
-

Called when the trainer initialization begins, model has not yet been set.

-
-
Return type
-

None

-
-
-
- -
-
-

on_init_end

-
-
-Callback.on_init_end(trainer)[source]
-
-

Deprecated since version v1.6: This callback hook was deprecated in v1.6 and will be removed in v1.8.

-
-

Called when the trainer initialization ends, model has not yet been set.

-
-
Return type
-

None

-
-
-
- -
-
-

on_fit_start

-
-
-Callback.on_fit_start(trainer, pl_module)[source]
-

Called when fit begins.

-
-
Return type
-

None

-
-
-
- -
-
-

on_fit_end

-
-
-Callback.on_fit_end(trainer, pl_module)[source]
-

Called when fit ends.

-
-
Return type
-

None

-
-
-
- -
-
-

on_sanity_check_start

-
-
-Callback.on_sanity_check_start(trainer, pl_module)[source]
-

Called when the validation sanity check starts.

-
-
Return type
-

None

-
-
-
- -
-
-

on_sanity_check_end

-
-
-Callback.on_sanity_check_end(trainer, pl_module)[source]
-

Called when the validation sanity check ends.

-
-
Return type
-

None

-
-
-
- -
-
-

on_train_batch_start

-
-
-Callback.on_train_batch_start(trainer, pl_module, batch, batch_idx, unused=0)[source]
-

Called when the train batch begins.

-
-
Return type
-

None

-
-
-
- -
-
-

on_train_batch_end

-
-
-Callback.on_train_batch_end(trainer, pl_module, outputs, batch, batch_idx, unused=0)[source]
-

Called when the train batch ends.

-
-
Return type
-

None

-
-
-
- -
-
-

on_train_epoch_start

-
-
-Callback.on_train_epoch_start(trainer, pl_module)[source]
-

Called when the train epoch begins.

-
-
Return type
-

None

-
-
-
- -
-
-

on_train_epoch_end

-
-
-Callback.on_train_epoch_end(trainer, pl_module)[source]
-

Called when the train epoch ends.

-

To access all batch outputs at the end of the epoch, either:

-
    -
  1. Implement training_epoch_end in the LightningModule and access outputs via the module OR

  2. -
  3. Cache data across train batch hooks inside the callback implementation to post-process in this hook.

  4. -
-
-
Return type
-

None

-
-
-
- -
-
-

on_validation_epoch_start

-
-
-Callback.on_validation_epoch_start(trainer, pl_module)[source]
-

Called when the val epoch begins.

-
-
Return type
-

None

-
-
-
- -
-
-

on_validation_epoch_end

-
-
-Callback.on_validation_epoch_end(trainer, pl_module)[source]
-

Called when the val epoch ends.

-
-
Return type
-

None

-
-
-
- -
-
-

on_test_epoch_start

-
-
-Callback.on_test_epoch_start(trainer, pl_module)[source]
-

Called when the test epoch begins.

-
-
Return type
-

None

-
-
-
- -
-
-

on_test_epoch_end

-
-
-Callback.on_test_epoch_end(trainer, pl_module)[source]
-

Called when the test epoch ends.

-
-
Return type
-

None

-
-
-
- -
-
-

on_predict_epoch_start

-
-
-Callback.on_predict_epoch_start(trainer, pl_module)[source]
-

Called when the predict epoch begins.

-
-
Return type
-

None

-
-
-
- -
-
-

on_predict_epoch_end

-
-
-Callback.on_predict_epoch_end(trainer, pl_module, outputs)[source]
-

Called when the predict epoch ends.

-
-
Return type
-

None

-
-
-
- -
-
-Callback.on_epoch_end(trainer, pl_module)[source]
-
-

Deprecated since version v1.6: This callback hook was deprecated in v1.6 and will be removed in v1.8. Use -on_<train/validation/test>_epoch_end instead.

-
-

Called when either of train/val/test epoch ends.

-
-
Return type
-

None

-
-
-
- -
-
-

on_validation_batch_start

-
-
-Callback.on_validation_batch_start(trainer, pl_module, batch, batch_idx, dataloader_idx)[source]
-

Called when the validation batch begins.

-
-
Return type
-

None

-
-
-
- -
-
-

on_validation_batch_end

-
-
-Callback.on_validation_batch_end(trainer, pl_module, outputs, batch, batch_idx, dataloader_idx)[source]
-

Called when the validation batch ends.

-
-
Return type
-

None

-
-
-
- -
-
-

on_test_batch_start

-
-
-Callback.on_test_batch_start(trainer, pl_module, batch, batch_idx, dataloader_idx)[source]
-

Called when the test batch begins.

-
-
Return type
-

None

-
-
-
- -
-
-

on_test_batch_end

-
-
-Callback.on_test_batch_end(trainer, pl_module, outputs, batch, batch_idx, dataloader_idx)[source]
-

Called when the test batch ends.

-
-
Return type
-

None

-
-
-
- -
-
-

on_predict_batch_start

-
-
-Callback.on_predict_batch_start(trainer, pl_module, batch, batch_idx, dataloader_idx)[source]
-

Called when the predict batch begins.

-
-
Return type
-

None

-
-
-
- -
-
-

on_predict_batch_end

-
-
-Callback.on_predict_batch_end(trainer, pl_module, outputs, batch, batch_idx, dataloader_idx)[source]
-

Called when the predict batch ends.

-
-
Return type
-

None

-
-
-
- -
-
-

on_train_start

-
-
-Callback.on_train_start(trainer, pl_module)[source]
-

Called when training begins.

-
-
Return type
-

None

-
-
-
- -
-
-

on_train_end

-
-
-Callback.on_train_end(trainer, pl_module)[source]
-

Called when training ends.

-
-
Return type
-

None

-
-
-
- -
-
-

on_validation_start

-
-
-Callback.on_validation_start(trainer, pl_module)[source]
-

Called when the validation loop begins.

-
-
Return type
-

None

-
-
-
- -
-
-

on_validation_end

-
-
-Callback.on_validation_end(trainer, pl_module)[source]
-

Called when the validation loop ends.

-
-
Return type
-

None

-
-
-
- -
-
-

on_test_start

-
-
-Callback.on_test_start(trainer, pl_module)[source]
-

Called when the test begins.

-
-
Return type
-

None

-
-
-
- -
-
-

on_test_end

-
-
-Callback.on_test_end(trainer, pl_module)[source]
-

Called when the test ends.

-
-
Return type
-

None

-
-
-
- -
-
-

on_predict_start

-
-
-Callback.on_predict_start(trainer, pl_module)[source]
-

Called when prediction begins.

-
-
Return type
-

None

-
-
-
- -
-
-

on_predict_end

-
-
-Callback.on_predict_end(trainer, pl_module)[source]
-

Called when predict ends.

-
-
Return type
-

None

-
-
-
- -
-
-

on_keyboard_interrupt

-
-
-Callback.on_keyboard_interrupt(trainer, pl_module)[source]
-
-

Deprecated since version v1.5: This callback hook was deprecated in v1.5 in favor of on_exception and will be removed in v1.7.

-
-

Called when any trainer execution is interrupted by KeyboardInterrupt.

-
-
Return type
-

None

-
-
-
- -
-
-

on_exception

-
-
-Callback.on_exception(trainer, pl_module, exception)[source]
-

Called when any trainer execution is interrupted by an exception.

-
-
Return type
-

None

-
-
-
- -
-
-

state_dict

-
-
-Callback.state_dict()[source]
-

Called when saving a checkpoint, implement to generate callback’s state_dict.

-
-
Return type
-

Dict[str, Any]

-
-
Returns
-

A dictionary containing callback state.

-
-
-
- -
-
-

on_save_checkpoint

-
-
-Callback.on_save_checkpoint(trainer, pl_module, checkpoint)[source]
-

Called when saving a checkpoint to give you a chance to store anything else you might want to save.

-
-
Parameters
-
    -
  • trainer (Trainer) – the current Trainer instance.

  • -
  • pl_module (LightningModule) – the current LightningModule instance.

  • -
  • checkpoint (Dict[str, Any]) – the checkpoint dictionary that will be saved.

  • -
-
-
Return type
-

Optional[dict]

-
-
Returns
-

None or the callback state. Support for returning callback state will be removed in v1.8.

-
-
-
-

Deprecated since version v1.6: Returning a value from this method was deprecated in v1.6 and will be removed in v1.8. -Implement Callback.state_dict instead to return state. -In v1.8 Callback.on_save_checkpoint can only return None.

-
-
- -
-
-

load_state_dict

-
-
-Callback.load_state_dict(state_dict)[source]
-

Called when loading a checkpoint, implement to reload callback state given callback’s state_dict.

-
-
Parameters
-

state_dict (Dict[str, Any]) – the callback state returned by state_dict.

-
-
Return type
-

None

-
-
-
- -
-
-

on_load_checkpoint

-
-
-Callback.on_load_checkpoint(trainer, pl_module, callback_state)[source]
-

Called when loading a model checkpoint, use to reload state.

-
-
Parameters
-
    -
  • trainer (Trainer) – the current Trainer instance.

  • -
  • pl_module (LightningModule) – the current LightningModule instance.

  • -
  • callback_state (Dict[str, Any]) – the callback state returned by on_save_checkpoint.

  • -
-
-
-
-

Note

-

The on_load_checkpoint won’t be called with an undefined state. -If your on_load_checkpoint hook behavior doesn’t rely on a state, -you will still need to override on_save_checkpoint to return a dummy state.

-
-
-

Deprecated since version v1.6: This callback hook will change its signature and behavior in v1.8. -If you wish to load the state of the callback, use Callback.load_state_dict instead. -In v1.8 Callback.on_load_checkpoint(checkpoint) will receive the entire loaded -checkpoint dictionary instead of only the callback state from the checkpoint.

-
-
-
Return type
-

None

-
-
-
- -
-
-

on_before_backward

-
-
-Callback.on_before_backward(trainer, pl_module, loss)[source]
-

Called before loss.backward().

-
-
Return type
-

None

-
-
-
- -
-
-

on_after_backward

-
-
-Callback.on_after_backward(trainer, pl_module)[source]
-

Called after loss.backward() and before optimizers are stepped.

-
-
Return type
-

None

-
-
-
- -
-
-

on_before_optimizer_step

-
-
-Callback.on_before_optimizer_step(trainer, pl_module, optimizer, opt_idx)[source]
-

Called before optimizer.step().

-
-
Return type
-

None

-
-
-
- -
-
-

on_before_zero_grad

-
-
-Callback.on_before_zero_grad(trainer, pl_module, optimizer)[source]
-

Called before optimizer.zero_grad().

-
-
Return type
-

None

-
-
-
- -
-
-
-
- - -
- -
-
- - - - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/extensions/callbacks_state.html b/docs/extensions/callbacks_state.html deleted file mode 100644 index 81ff9c4..0000000 --- a/docs/extensions/callbacks_state.html +++ /dev/null @@ -1,741 +0,0 @@ - - - - - - - - - - - - - - Save Callback state — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Save Callback state
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Save Callback state

-

Some callbacks require internal state in order to function properly. You can optionally -choose to persist your callback’s state as part of model checkpoint files using -state_dict() and load_state_dict(). -Note that the returned state must be able to be pickled.

-

When your callback is meant to be used only as a singleton callback then implementing the above two hooks is enough -to persist state effectively. However, if passing multiple instances of the callback to the Trainer is supported, then -the callback must define a state_key property in order for Lightning -to be able to distinguish the different states when loading the callback state. This concept is best illustrated by -the following example.

-
class Counter(Callback):
-    def __init__(self, what="epochs", verbose=True):
-        self.what = what
-        self.verbose = verbose
-        self.state = {"epochs": 0, "batches": 0}
-
-    @property
-    def state_key(self):
-        # note: we do not include `verbose` here on purpose
-        return self._generate_state_key(what=self.what)
-
-    def on_train_epoch_end(self, *args, **kwargs):
-        if self.what == "epochs":
-            self.state["epochs"] += 1
-
-    def on_train_batch_end(self, *args, **kwargs):
-        if self.what == "batches":
-            self.state["batches"] += 1
-
-    def load_state_dict(self, state_dict):
-        self.state.update(state_dict)
-
-    def state_dict(self):
-        return self.state.copy()
-
-
-# two callbacks of the same type are being used
-trainer = Trainer(callbacks=[Counter(what="epochs"), Counter(what="batches")])
-
-
-

A Lightning checkpoint from this Trainer with the two stateful callbacks will include the following information:

-
{
-    "state_dict": ...,
-    "callbacks": {
-        "Counter{'what': 'batches'}": {"batches": 32, "epochs": 0},
-        "Counter{'what': 'epochs'}": {"batches": 0, "epochs": 2},
-        ...
-    }
-}
-
-
-

The implementation of a state_key is essential here. If it were missing, -Lightning would not be able to disambiguate the state for these two callbacks, because state_key -by default only uses the class name as the key, e.g., here Counter.

-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- -
-
- -
-
-
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/extensions/datamodules_state.html b/docs/extensions/datamodules_state.html deleted file mode 100644 index 73e7a3b..0000000 --- a/docs/extensions/datamodules_state.html +++ /dev/null @@ -1,700 +0,0 @@ - - - - - - - - - - - - - - Save DataModule state — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Save DataModule state
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Save DataModule state

-

When a checkpoint is created, it asks every DataModule for its state. If your DataModule defines the state_dict and load_state_dict methods, the checkpoint will automatically track and restore your DataModules.

-
class LitDataModule(pl.LightningDataModule):
-    def state_dict(self):
-        # track whatever you want here
-        state = {"current_train_batch_index": self.current_train_batch_index}
-        return state
-
-    def load_state_dict(self, state_dict):
-        # restore the state based on what you tracked in (def state_dict)
-        self.current_train_batch_index = state_dict["current_train_batch_index"]
-
-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- -
-
- -
-
-
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/extensions/generated/pytorch_lightning.loggers.CSVLogger.html b/docs/extensions/generated/pytorch_lightning.loggers.CSVLogger.html deleted file mode 100644 index 317a9d3..0000000 --- a/docs/extensions/generated/pytorch_lightning.loggers.CSVLogger.html +++ /dev/null @@ -1,862 +0,0 @@ - - - - - - - - - - - - - - CSVLogger — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- - - - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

CSVLogger

-
-
-class pytorch_lightning.loggers.CSVLogger(save_dir, name='lightning_logs', version=None, prefix='', flush_logs_every_n_steps=100)[source]
-

Bases: pytorch_lightning.loggers.base.LightningLoggerBase

-

Log to local file system in yaml and CSV format.

-

Logs are saved to os.path.join(save_dir, name, version).

-

Example

-
>>> from pytorch_lightning import Trainer
->>> from pytorch_lightning.loggers import CSVLogger
->>> logger = CSVLogger("logs", name="my_exp_name")
->>> trainer = Trainer(logger=logger)
-
-
-
-
Parameters
-
    -
  • save_dir (str) – Save directory

  • -
  • name (Optional[str]) – Experiment name. Defaults to 'lightning_logs'.

  • -
  • version (Union[int, str, None]) – Experiment version. If version is not specified the logger inspects the save -directory for existing versions, then automatically assigns the next available version.

  • -
  • prefix (str) – A string to put at the beginning of metric keys.

  • -
  • flush_logs_every_n_steps (int) – How often to flush logs to disk (defaults to every 100 steps).

  • -
-
-
-
-
-finalize(status)[source]
-

Do any processing that is necessary to finalize an experiment.

-
-
Parameters
-

status (str) – Status that the experiment finished with (e.g. success, failed, aborted)

-
-
Return type
-

None

-
-
-
- -
-
-log_hyperparams(params)[source]
-

Record hyperparameters.

-
-
Parameters
-
    -
  • params (Union[Dict[str, Any], Namespace]) – Namespace containing the hyperparameters

  • -
  • args – Optional positional arguments, depends on the specific logger being used

  • -
  • kwargs – Optional keyword arguments, depends on the specific logger being used

  • -
-
-
Return type
-

None

-
-
-
- -
-
-log_metrics(metrics, step=None)[source]
-

Records metrics. -This method logs metrics as soon as it receives them. If you want to aggregate -metrics for one specific step, use the -agg_and_log_metrics() method.

-
-
Parameters
-
    -
  • metrics (Dict[str, float]) – Dictionary with metric names as keys and measured quantities as values

  • -
  • step (Optional[int]) – Step number at which the metrics should be recorded

  • -
-
-
Return type
-

None

-
-
-
- -
-
-save()[source]
-

Save log data.

-
-
Return type
-

None

-
-
-
- -
-
-property experiment: pytorch_lightning.loggers.csv_logs.ExperimentWriter
-

Actual ExperimentWriter object. To use ExperimentWriter features in your -LightningModule do the following.

-

Example:

-
self.logger.experiment.some_experiment_writer_function()
-
-
-
-
Return type
-

ExperimentWriter

-
-
-
- -
-
-property log_dir: str
-

The log directory for this run.

-

By default, it is named 'version_${self.version}' but it can be overridden by passing a string value for the -constructor’s version parameter instead of None or an int.

-
-
Return type
-

str

-
-
-
- -
-
-property name: str
-

Gets the name of the experiment.

-
-
Return type
-

str

-
-
Returns
-

The name of the experiment.

-
-
-
- -
-
-property root_dir: str
-

Parent directory for all checkpoint subdirectories.

-

If the experiment name parameter is an empty string, no experiment subdirectory is used and the checkpoint will -be saved in “save_dir/version”

-
-
Return type
-

str

-
-
-
- -
-
-property save_dir: Optional[str]
-

The current directory where logs are saved.

-
-
Return type
-

Optional[str]

-
-
Returns
-

The path to current directory where logs are saved.

-
-
-
- -
-
-property version: int
-

Gets the version of the experiment.

-
-
Return type
-

int

-
-
Returns
-

The version of the experiment if it is specified, else the next version.

-
-
-
- -
- -
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- -
-
-
- - -
-
-
-
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/extensions/generated/pytorch_lightning.loggers.CometLogger.html b/docs/extensions/generated/pytorch_lightning.loggers.CometLogger.html deleted file mode 100644 index 3415fee..0000000 --- a/docs/extensions/generated/pytorch_lightning.loggers.CometLogger.html +++ /dev/null @@ -1,900 +0,0 @@ - - - - - - - - - - - - - - CometLogger — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- - - - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

CometLogger

-
-
-class pytorch_lightning.loggers.CometLogger(api_key=None, save_dir=None, project_name=None, rest_api_key=None, experiment_name=None, experiment_key=None, offline=False, prefix='', agg_key_funcs=None, agg_default_func=None, **kwargs)[source]
-

Bases: pytorch_lightning.loggers.base.LightningLoggerBase

-

Log using Comet.ml.

-

Install it with pip:

-
pip install comet-ml
-
-
-

Comet requires either an API Key (online mode) or a local directory path (offline mode).

-

ONLINE MODE

-
import os
-from pytorch_lightning import Trainer
-from pytorch_lightning.loggers import CometLogger
-
-# arguments made to CometLogger are passed on to the comet_ml.Experiment class
-comet_logger = CometLogger(
-    api_key=os.environ.get("COMET_API_KEY"),
-    workspace=os.environ.get("COMET_WORKSPACE"),  # Optional
-    save_dir=".",  # Optional
-    project_name="default_project",  # Optional
-    rest_api_key=os.environ.get("COMET_REST_API_KEY"),  # Optional
-    experiment_key=os.environ.get("COMET_EXPERIMENT_KEY"),  # Optional
-    experiment_name="lightning_logs",  # Optional
-)
-trainer = Trainer(logger=comet_logger)
-
-
-

OFFLINE MODE

-
from pytorch_lightning.loggers import CometLogger
-
-# arguments made to CometLogger are passed on to the comet_ml.Experiment class
-comet_logger = CometLogger(
-    save_dir=".",
-    workspace=os.environ.get("COMET_WORKSPACE"),  # Optional
-    project_name="default_project",  # Optional
-    rest_api_key=os.environ.get("COMET_REST_API_KEY"),  # Optional
-    experiment_name="lightning_logs",  # Optional
-)
-trainer = Trainer(logger=comet_logger)
-
-
-
-
Parameters
-
    -
  • api_key (Optional[str]) – Required in online mode. API key, found on Comet.ml. If not given, this -will be loaded from the environment variable COMET_API_KEY or ~/.comet.config -if either exists.

  • -
  • save_dir (Optional[str]) – Required in offline mode. The path for the directory to save local -comet logs. If given, this also sets the directory for saving checkpoints.

  • -
  • project_name (Optional[str]) – Optional. Send your experiment to a specific project. -Otherwise will be sent to Uncategorized Experiments. -If the project name does not already exist, Comet.ml will create a new project.

  • -
  • rest_api_key (Optional[str]) – Optional. Rest API key found in Comet.ml settings. -This is used to determine the version number.

  • -
  • experiment_name (Optional[str]) – Optional. String representing the name for this particular experiment on Comet.ml.

  • -
  • experiment_key (Optional[str]) – Optional. If set, restores from existing experiment.

  • -
  • offline (bool) – If api_key and save_dir are both given, this determines whether -the experiment will be in online or offline mode. This is useful if you use -save_dir to control the checkpoints directory and have a ~/.comet.config -file but still want to run offline experiments.

  • -
  • prefix (str) – A string to put at the beginning of metric keys.

  • -
  • **kwargs – Additional arguments like workspace, log_code, etc. used by -CometExperiment can be passed as keyword arguments in this logger.

  • -
-
-
Raises
-
    -
  • ModuleNotFoundError – If required Comet package is not installed on the device.

  • -
  • MisconfigurationException – If neither api_key nor save_dir are passed as arguments.

  • -
-
-
-
-
-finalize(status)[source]
-

After self.experiment.end() is called, that experiment won’t log any more data to Comet. -Therefore, if you need to log more data afterwards, you need to create an ExistingCometExperiment. -This is the case, for example, when testing your model after training, because -CometLogger.finalize() is called when training is finalized.

-

This happens automatically in the experiment() property, when -self._experiment is set to None, i.e. self.reset_experiment().

-
-
Return type
-

None

-
-
-
- -
-
-log_graph(model, input_array=None)[source]
-

Record model graph.

-
-
Parameters
-
    -
  • model (LightningModule) – lightning model

  • -
  • input_array – input passed to model.forward

  • -
-
-
Return type
-

None

-
-
-
- -
-
-log_hyperparams(params)[source]
-

Record hyperparameters.

-
-
Parameters
-
    -
  • params (Union[Dict[str, Any], Namespace]) – Namespace containing the hyperparameters

  • -
  • args – Optional positional arguments, depends on the specific logger being used

  • -
  • kwargs – Optional keyword arguments, depends on the specific logger being used

  • -
-
-
Return type
-

None

-
-
-
- -
-
-log_metrics(metrics, step=None)[source]
-

Records metrics. -This method logs metrics as soon as it receives them. If you want to aggregate -metrics for one specific step, use the -agg_and_log_metrics() method.

-
-
Parameters
-
    -
  • metrics (Dict[str, Union[Tensor, float]]) – Dictionary with metric names as keys and measured quantities as values

  • -
  • step (Optional[int]) – Step number at which the metrics should be recorded

  • -
-
-
Return type
-

None

-
-
-
- -
-
-property experiment: None
-

Actual Comet object. To use Comet features in your -LightningModule do the following.

-

Example:

-
self.logger.experiment.some_comet_function()
-
-
-
-
Return type
-

None

-
-
-
- -
-
-property name: str
-

Gets the project name.

-
-
Return type
-

str

-
-
Returns
-

The project name if it is specified, else “comet-default”.

-
-
-
- -
-
-property save_dir: Optional[str]
-

Gets the save directory.

-
-
Return type
-

Optional[str]

-
-
Returns
-

The path to the save directory.

-
-
-
- -
-
-property version: str
-

Gets the version.

-
-
Return type
-

str

-
-
Returns
-

The first of the following that is set, checked in this order:

-
    -
  1. experiment id.

  2. -
  3. experiment key.

  4. -
  5. ”COMET_EXPERIMENT_KEY” environment variable.

  6. -
  7. future experiment key.

  8. -
-

If none are present generates a new guid.

-

-
-
-
- -
- -
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- -
-
-
- - -
-
-
-
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/extensions/generated/pytorch_lightning.loggers.MLFlowLogger.html b/docs/extensions/generated/pytorch_lightning.loggers.MLFlowLogger.html deleted file mode 100644 index 38e87b5..0000000 --- a/docs/extensions/generated/pytorch_lightning.loggers.MLFlowLogger.html +++ /dev/null @@ -1,881 +0,0 @@ - - - - - - - - - - - - - - MLFlowLogger — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- - - - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

MLFlowLogger

-
-
-class pytorch_lightning.loggers.MLFlowLogger(experiment_name='lightning_logs', run_name=None, tracking_uri=None, tags=None, save_dir='./mlruns', prefix='', artifact_location=None, run_id=None)[source]
-

Bases: pytorch_lightning.loggers.base.LightningLoggerBase

-

Log using MLflow.

-

Install it with pip:

-
pip install mlflow
-
-
-
from pytorch_lightning import Trainer
-from pytorch_lightning.loggers import MLFlowLogger
-
-mlf_logger = MLFlowLogger(experiment_name="lightning_logs", tracking_uri="file:./ml-runs")
-trainer = Trainer(logger=mlf_logger)
-
-
-

Use the logger anywhere in your LightningModule as follows:

-
from pytorch_lightning import LightningModule
-
-
-class LitModel(LightningModule):
-    def training_step(self, batch, batch_idx):
-        # example
-        self.logger.experiment.whatever_ml_flow_supports(...)
-
-    def any_lightning_module_function_or_hook(self):
-        self.logger.experiment.whatever_ml_flow_supports(...)
-
-
-
-
Parameters
-
    -
  • experiment_name (str) – The name of the experiment.

  • -
  • run_name (Optional[str]) – Name of the new run. The run_name is internally stored as a mlflow.runName tag. -If the mlflow.runName tag has already been set in tags, the value is overridden by the run_name.

  • -
  • tracking_uri (Optional[str]) – Address of local or remote tracking server. -If not provided, defaults to MLFLOW_TRACKING_URI environment variable if set, otherwise it falls -back to file:<save_dir>.

  • -
  • tags (Optional[Dict[str, Any]]) – A dictionary of tags for the experiment.

  • -
  • save_dir (Optional[str]) – A path to a local directory where the MLflow runs get saved. -Defaults to ./mlruns if tracking_uri is not provided. -Has no effect if tracking_uri is provided.

  • -
  • prefix (str) – A string to put at the beginning of metric keys.

  • -
  • artifact_location (Optional[str]) – The location to store run artifacts. If not provided, the server picks an appropriate -default.

  • -
  • run_id (Optional[str]) – The run identifier of the experiment. If not provided, a new run is started.

  • -
-
-
Raises
-

ModuleNotFoundError – If required MLFlow package is not installed on the device.

-
-
-
-
-finalize(status='FINISHED')[source]
-

Do any processing that is necessary to finalize an experiment.

-
-
Parameters
-

status (str) – Status that the experiment finished with (e.g. success, failed, aborted)

-
-
Return type
-

None

-
-
-
- -
-
-log_hyperparams(params)[source]
-

Record hyperparameters.

-
-
Parameters
-
    -
  • params (Union[Dict[str, Any], Namespace]) – Namespace containing the hyperparameters

  • -
  • args – Optional positional arguments, depends on the specific logger being used

  • -
  • kwargs – Optional keyword arguments, depends on the specific logger being used

  • -
-
-
Return type
-

None

-
-
-
- -
-
-log_metrics(metrics, step=None)[source]
-

Records metrics. -This method logs metrics as soon as it receives them. If you want to aggregate -metrics for one specific step, use the -agg_and_log_metrics() method.

-
-
Parameters
-
    -
  • metrics (Dict[str, float]) – Dictionary with metric names as keys and measured quantities as values

  • -
  • step (Optional[int]) – Step number at which the metrics should be recorded

  • -
-
-
Return type
-

None

-
-
-
- -
-
-property experiment: None
-

Actual MLflow object. To use MLflow features in your -LightningModule do the following.

-

Example:

-
self.logger.experiment.some_mlflow_function()
-
-
-
-
Return type
-

None

-
-
-
- -
-
-property experiment_id: str
-

Create the experiment if it does not exist to get the experiment id.

-
-
Return type
-

str

-
-
Returns
-

The experiment id.

-
-
-
- -
-
-property name: str
-

Get the experiment id.

-
-
Return type
-

str

-
-
Returns
-

The experiment id.

-
-
-
- -
-
-property run_id: str
-

Create the experiment if it does not exist to get the run id.

-
-
Return type
-

str

-
-
Returns
-

The run id.

-
-
-
- -
-
-property save_dir: Optional[str]
-

The root file directory in which MLflow experiments are saved.

-
-
Return type
-

Optional[str]

-
-
Returns
-

Local path to the root experiment directory if the tracking uri is local. -Otherwise returns None.

-
-
-
- -
-
-property version: str
-

Get the run id.

-
-
Return type
-

str

-
-
Returns
-

The run id.

-
-
-
- -
- -
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- -
-
-
- - -
-
-
-
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/extensions/generated/pytorch_lightning.loggers.NeptuneLogger.html b/docs/extensions/generated/pytorch_lightning.loggers.NeptuneLogger.html deleted file mode 100644 index f8813e5..0000000 --- a/docs/extensions/generated/pytorch_lightning.loggers.NeptuneLogger.html +++ /dev/null @@ -1,989 +0,0 @@ - - - - - - - - - - - - - - NeptuneLogger — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- - - - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

NeptuneLogger

-
-
-class pytorch_lightning.loggers.NeptuneLogger(*, api_key=None, project=None, name=None, run=None, log_model_checkpoints=True, prefix='training', agg_key_funcs=None, agg_default_func=None, **neptune_run_kwargs)[source]
-

Bases: pytorch_lightning.loggers.base.LightningLoggerBase

-

Log using Neptune.

-

Install it with pip:

-
pip install neptune-client
-
-
-

or conda:

-
conda install -c conda-forge neptune-client
-
-
-

Quickstart

-

Pass NeptuneLogger instance to the Trainer to log metadata with Neptune:

-
from pytorch_lightning import Trainer
-from pytorch_lightning.loggers import NeptuneLogger
-
-neptune_logger = NeptuneLogger(
-    api_key="ANONYMOUS",  # replace with your own
-    project="common/pytorch-lightning-integration",  # format "<WORKSPACE/PROJECT>"
-    tags=["training", "resnet"],  # optional
-)
-trainer = Trainer(max_epochs=10, logger=neptune_logger)
-
-
-

How to use NeptuneLogger?

-

Use the logger anywhere in your LightningModule as follows:

-
from neptune.new.types import File
-from pytorch_lightning import LightningModule
-
-
-class LitModel(LightningModule):
-    def training_step(self, batch, batch_idx):
-        # log metrics
-        acc = ...
-        self.log("train/loss", loss)
-
-    def any_lightning_module_function_or_hook(self):
-        # log images
-        img = ...
-        self.logger.experiment["train/misclassified_images"].log(File.as_image(img))
-
-        # generic recipe
-        metadata = ...
-        self.logger.experiment["your/metadata/structure"].log(metadata)
-
-
-

Note that syntax: self.logger.experiment["your/metadata/structure"].log(metadata) is specific to Neptune -and it extends logger capabilities. Specifically, it allows you to log various types of metadata -like scores, files, images, interactive visuals, CSVs, etc. -Refer to the Neptune docs -for more detailed explanations. -You can also use regular logger methods log_metrics(), and log_hyperparams() with NeptuneLogger -as these are also supported.

-

Log after fitting or testing is finished

-

You can log objects after the fitting or testing methods are finished:

-
neptune_logger = NeptuneLogger(project="common/pytorch-lightning-integration")
-
-trainer = pl.Trainer(logger=neptune_logger)
-model = ...
-datamodule = ...
-trainer.fit(model, datamodule=datamodule)
-trainer.test(model, datamodule=datamodule)
-
-# Log objects after `fit` or `test` methods
-# model summary
-neptune_logger.log_model_summary(model=model, max_depth=-1)
-
-# generic recipe
-metadata = ...
-neptune_logger.experiment["your/metadata/structure"].log(metadata)
-
-
-

Log model checkpoints

-

If you have ModelCheckpoint configured, -Neptune logger automatically logs model checkpoints. -Model weights will be uploaded to the: “model/checkpoints” namespace in the Neptune Run. -You can disable this option:

-
neptune_logger = NeptuneLogger(project="common/pytorch-lightning-integration", log_model_checkpoints=False)
-
-
-

Pass additional parameters to the Neptune run

-

You can also pass neptune_run_kwargs to specify the run in greater detail, like tags or description:

-
from pytorch_lightning import Trainer
-from pytorch_lightning.loggers import NeptuneLogger
-
-neptune_logger = NeptuneLogger(
-    project="common/pytorch-lightning-integration",
-    name="lightning-run",
-    description="mlp quick run with pytorch-lightning",
-    tags=["mlp", "quick-run"],
-)
-trainer = Trainer(max_epochs=3, logger=neptune_logger)
-
-
-

Check run documentation -for more info about additional run parameters.

-

Details about Neptune run structure

-

Runs can be viewed as nested dictionary-like structures that you can define in your code. -Thanks to this you can easily organize your metadata in a way that is most convenient for you.

-

The hierarchical structure that you apply to your metadata will be reflected later in the UI.

-

You can organize any type of metadata this way - images, parameters, metrics, model checkpoints, CSV files, etc.

-
-

See also

- -
-
-
Parameters
-
    -
  • api_key (Optional[str]) – Optional. -Neptune API token, found on https://neptune.ai upon registration. -Read: how to find and set Neptune API token. -It is recommended to keep it in the NEPTUNE_API_TOKEN -environment variable and then you can drop api_key=None.

  • -
  • project (Optional[str]) – Optional. -Name of a project in a form of “my_workspace/my_project” for example “tom/mask-rcnn”. -If None, the value of NEPTUNE_PROJECT environment variable will be taken. -You need to create the project in https://neptune.ai first.

  • -
  • name (Optional[str]) – Optional. Editable name of the run. -Run name appears in the “all metadata/sys” section in Neptune UI.

  • -
  • run (None) – Optional. Default is None. The Neptune Run object. -If specified, this Run will be used for logging, instead of a new Run. -When a run object is passed you can’t specify other neptune properties.

  • -
  • log_model_checkpoints (Optional[bool]) – Optional. Default is True. Log model checkpoint to Neptune. -Works only if ModelCheckpoint is passed to the Trainer.

  • -
  • prefix (str) – Optional. Default is "training". Root namespace for all metadata logging.

  • -
  • **neptune_run_kwargs – Additional arguments like tags, description, capture_stdout, etc. -used when run is created.

  • -
-
-
Raises
-
    -
  • ModuleNotFoundError – If required Neptune package in version >=0.9 is not installed on the device.

  • -
  • TypeError – If configured project has not been migrated to new structure yet.

  • -
  • ValueError – If argument passed to the logger’s constructor is incorrect.

  • -
-
-
-
-
-after_save_checkpoint(checkpoint_callback)[source]
-

Automatically log checkpointed model. Called after model checkpoint callback saves a new checkpoint.

-
-
Parameters
-

checkpoint_callback – the model checkpoint callback instance

-
-
-
- -
-
-finalize(status)[source]
-

Do any processing that is necessary to finalize an experiment.

-
-
Parameters
-

status (str) – Status that the experiment finished with (e.g. success, failed, aborted)

-
-
Return type
-

None

-
-
-
- -
-
-log_hyperparams(params)[source]
-

Log hyper-parameters to the run.

-

Hyperparams will be logged under the “<prefix>/hyperparams” namespace.

-
-

Note

-

You can also log parameters by directly using the logger instance: -neptune_logger.experiment["model/hyper-parameters"] = params_dict.

-

In this way you can keep hierarchical structure of the parameters.

-
-
-
Parameters
-

params (Union[Dict[str, Any], Namespace]) – dict. -Python dictionary structure with parameters.

-
-
-

Example:

-
from pytorch_lightning.loggers import NeptuneLogger
-
-PARAMS = {
-    "batch_size": 64,
-    "lr": 0.07,
-    "decay_factor": 0.97
-}
-
-neptune_logger = NeptuneLogger(
-    api_key="ANONYMOUS",
-    project="common/pytorch-lightning-integration"
-)
-
-neptune_logger.log_hyperparams(PARAMS)
-
-
-
-
Return type
-

None

-
-
-
- -
-
-log_metrics(metrics, step=None)[source]
-

Log metrics (numeric values) in Neptune runs.

-
-
Parameters
-
    -
  • metrics (Dict[str, Union[Tensor, float]]) – Dictionary with metric names as keys and measured quantities as values.

  • -
  • step (Optional[int]) – Step number at which the metrics should be recorded, currently ignored.

  • -
-
-
Return type
-

None

-
-
-
- -
-
-property experiment: None
-

Actual Neptune run object. Allows you to use neptune logging features in your -LightningModule.

-

Example:

-
class LitModel(LightningModule):
-    def training_step(self, batch, batch_idx):
-        # log metrics
-        acc = ...
-        self.logger.experiment["train/acc"].log(acc)
-
-        # log images
-        img = ...
-        self.logger.experiment["train/misclassified_images"].log(File.as_image(img))
-
-
-

Note that syntax: self.logger.experiment["your/metadata/structure"].log(metadata) -is specific to Neptune and it extends logger capabilities. -Specifically, it allows you to log various types of metadata like scores, files, -images, interactive visuals, CSVs, etc. Refer to the -Neptune docs -for more detailed explanations. -You can also use regular logger methods log_metrics(), and log_hyperparams() -with NeptuneLogger as these are also supported.

-
-
Return type
-

None

-
-
-
- -
-
-property name: str
-

Return the experiment name or ‘offline-name’ when exp is run in offline mode.

-
-
Return type
-

str

-
-
-
- -
-
-property save_dir: Optional[str]
-

Gets the save directory of the experiment which in this case is None because Neptune does not save -locally.

-
-
Return type
-

Optional[str]

-
-
Returns
-

the root directory where experiment logs get saved

-
-
-
- -
-
-property version: str
-

Return the experiment version.

-

It’s Neptune Run’s short_id

-
-
Return type
-

str

-
-
-
- -
- -
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- -
-
-
- - -
-
-
-
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/extensions/generated/pytorch_lightning.loggers.TensorBoardLogger.html b/docs/extensions/generated/pytorch_lightning.loggers.TensorBoardLogger.html deleted file mode 100644 index 41d7374..0000000 --- a/docs/extensions/generated/pytorch_lightning.loggers.TensorBoardLogger.html +++ /dev/null @@ -1,908 +0,0 @@ - - - - - - - - - - - - - - TensorBoardLogger — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • TensorBoardLogger
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

TensorBoardLogger

-
-
-class pytorch_lightning.loggers.TensorBoardLogger(save_dir, name='lightning_logs', version=None, log_graph=False, default_hp_metric=True, prefix='', sub_dir=None, agg_key_funcs=None, agg_default_func=None, **kwargs)[source]
-

Bases: pytorch_lightning.loggers.base.LightningLoggerBase

-

Log to local file system in TensorBoard format.

-

Implemented using SummaryWriter. Logs are saved to -os.path.join(save_dir, name, version). This is the default logger in Lightning, it comes -preinstalled.

-

Example:

-
from pytorch_lightning import Trainer
-from pytorch_lightning.loggers import TensorBoardLogger
-
-logger = TensorBoardLogger("tb_logs", name="my_model")
-trainer = Trainer(logger=logger)
-
-
-
-
Parameters
-
    -
  • save_dir (str) – Save directory

  • -
  • name (Optional[str]) – Experiment name. Defaults to 'lightning_logs'. If it is the empty string then no per-experiment -subdirectory is used.

  • -
  • version (Union[int, str, None]) – Experiment version. If version is not specified the logger inspects the save -directory for existing versions, then automatically assigns the next available version. -If it is a string then it is used as the run-specific subdirectory name, -otherwise 'version_${version}' is used.

  • -
  • log_graph (bool) – Adds the computational graph to tensorboard. This requires that -the user has defined the self.example_input_array attribute in their -model.

  • -
  • default_hp_metric (bool) – Enables a placeholder metric with key hp_metric when log_hyperparams is -called without a metric (otherwise calls to log_hyperparams without a metric are ignored).

  • -
  • prefix (str) – A string to put at the beginning of metric keys.

  • -
  • sub_dir (Optional[str]) – Sub-directory to group TensorBoard logs. If a sub_dir argument is passed -then logs are saved in /save_dir/name/version/sub_dir/. Defaults to None in which case -logs are saved in /save_dir/name/version/.

  • -
  • **kwargs – Additional arguments used by SummaryWriter can be passed as keyword -arguments in this logger. To automatically flush to disk, max_queue sets the size -of the queue for pending logs before flushing. flush_secs determines how many seconds -elapse before flushing.

  • -
-
-
-
-
-finalize(status)[source]
-

Do any processing that is necessary to finalize an experiment.

-
-
Parameters
-

status (str) – Status that the experiment finished with (e.g. success, failed, aborted)

-
-
Return type
-

None

-
-
-
- -
-
-log_graph(model, input_array=None)[source]
-

Record model graph.

-
-
Parameters
-
    -
  • model (LightningModule) – lightning model

  • -
  • input_array – input passed to model.forward

  • -
-
-
-
- -
-
-log_hyperparams(params, metrics=None)[source]
-

Record hyperparameters. TensorBoard logs with and without saved hyperparameters are incompatible, the -hyperparameters are then not displayed in the TensorBoard. Please delete or move the previously saved logs -to display the new ones with hyperparameters.

-
-
Parameters
-
    -
  • params (Union[Dict[str, Any], Namespace]) – a dictionary-like container with the hyperparameters

  • -
  • metrics (Optional[Dict[str, Any]]) – Dictionary with metric names as keys and measured quantities as values

  • -
-
-
Return type
-

None

-
-
-
- -
-
-log_metrics(metrics, step=None)[source]
-

Records metrics. -This method logs metrics as soon as it receives them. If you want to aggregate -metrics for one specific step, use the -agg_and_log_metrics() method.

-
-
Parameters
-
    -
  • metrics (Dict[str, float]) – Dictionary with metric names as keys and measured quantities as values

  • -
  • step (Optional[int]) – Step number at which the metrics should be recorded

  • -
-
-
Return type
-

None

-
-
-
- -
-
-save()[source]
-

Save log data.

-
-
Return type
-

None

-
-
-
- -
-
-property experiment: torch.utils.tensorboard.writer.SummaryWriter
-

Actual tensorboard object. To use TensorBoard features in your -LightningModule do the following.

-

Example:

-
self.logger.experiment.some_tensorboard_function()
-
-
-
-
Return type
-

SummaryWriter

-
-
-
- -
-
-property log_dir: str
-

The directory for this run’s tensorboard checkpoint.

-

By default, it is named 'version_${self.version}' but it can be overridden by passing a string value for the -constructor’s version parameter instead of None or an int.

-
-
Return type
-

str

-
-
-
- -
-
-property name: str
-

Get the name of the experiment.

-
-
Return type
-

str

-
-
Returns
-

The name of the experiment.

-
-
-
- -
-
-property root_dir: str
-

Parent directory for all tensorboard checkpoint subdirectories.

-

If the experiment name parameter is an empty string, no experiment subdirectory is used and the checkpoint will -be saved in “save_dir/version”

-
-
Return type
-

str

-
-
-
- -
-
-property save_dir: Optional[str]
-

Gets the save directory where the TensorBoard experiments are saved.

-
-
Return type
-

Optional[str]

-
-
Returns
-

The local path to the save directory where the TensorBoard experiments are saved.

-
-
-
- -
-
-property sub_dir: Optional[str]
-

Gets the sub directory where the TensorBoard experiments are saved.

-
-
Return type
-

Optional[str]

-
-
Returns
-

The local path to the sub directory where the TensorBoard experiments are saved.

-
-
-
- -
-
-property version: int
-

Get the experiment version.

-
-
Return type
-

int

-
-
Returns
-

The experiment version if specified else the next version.

-
-
-
- -
- -
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- -
-
- -
-
-
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/extensions/generated/pytorch_lightning.loggers.WandbLogger.html b/docs/extensions/generated/pytorch_lightning.loggers.WandbLogger.html deleted file mode 100644 index 80acb66..0000000 --- a/docs/extensions/generated/pytorch_lightning.loggers.WandbLogger.html +++ /dev/null @@ -1,1022 +0,0 @@ - - - - - - - - - - - - - - WandbLogger — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- - - - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

WandbLogger

-
-
-class pytorch_lightning.loggers.WandbLogger(name=None, save_dir=None, offline=False, id=None, anonymous=None, version=None, project=None, log_model=False, experiment=None, prefix='', agg_key_funcs=None, agg_default_func=None, **kwargs)[source]
-

Bases: pytorch_lightning.loggers.base.LightningLoggerBase

-

Log using Weights and Biases.

-

Installation and set-up

-

Install with pip:

-
pip install wandb
-
-
-

Create a WandbLogger instance:

-
from pytorch_lightning.loggers import WandbLogger
-
-wandb_logger = WandbLogger(project="MNIST")
-
-
-

Pass the logger instance to the Trainer:

-
trainer = Trainer(logger=wandb_logger)
-
-
-

A new W&B run will be created when training starts if you have not created one manually before with wandb.init().

-

Log metrics

-

Log from LightningModule:

-
class LitModule(LightningModule):
-    def training_step(self, batch, batch_idx):
-        self.log("train/loss", loss)
-
-
-

Use the wandb module directly:

-
wandb.log({"train/loss": loss})
-
-
-

Log hyper-parameters

-

Save LightningModule parameters:

-
class LitModule(LightningModule):
-    def __init__(self, *args, **kwarg):
-        self.save_hyperparameters()
-
-
-

Add other config parameters:

-
# add one parameter
-wandb_logger.experiment.config["key"] = value
-
-# add multiple parameters
-wandb_logger.experiment.config.update({key1: val1, key2: val2})
-
-# use the wandb module directly
-wandb.config["key"] = value
-wandb.config.update()
-
-
-

Log gradients, parameters and model topology

-

Call the watch method for automatically tracking gradients:

-
# log gradients and model topology
-wandb_logger.watch(model)
-
-# log gradients, parameter histogram and model topology
-wandb_logger.watch(model, log="all")
-
-# change log frequency of gradients and parameters (100 steps by default)
-wandb_logger.watch(model, log_freq=500)
-
-# do not log graph (in case of errors)
-wandb_logger.watch(model, log_graph=False)
-
-
-

The watch method adds hooks to the model which can be removed at the end of training:

-
wandb_logger.unwatch(model)
-
-
-

Log model checkpoints

-

Log model checkpoints at the end of training:

-
wandb_logger = WandbLogger(log_model=True)
-
-
-

Log model checkpoints as they get created during training:

-
wandb_logger = WandbLogger(log_model="all")
-
-
-

Custom checkpointing can be set up through ModelCheckpoint:

-
# log model only if `val_accuracy` increases
-wandb_logger = WandbLogger(log_model="all")
-checkpoint_callback = ModelCheckpoint(monitor="val_accuracy", mode="max")
-trainer = Trainer(logger=wandb_logger, callbacks=[checkpoint_callback])
-
-
-

latest and best aliases are automatically set to easily retrieve a model checkpoint:

-
# reference can be retrieved in artifacts panel
-# "VERSION" can be a version (ex: "v2") or an alias ("latest" or "best")
-checkpoint_reference = "USER/PROJECT/MODEL-RUN_ID:VERSION"
-
-# download checkpoint locally (if not already cached)
-run = wandb.init(project="MNIST")
-artifact = run.use_artifact(checkpoint_reference, type="model")
-artifact_dir = artifact.download()
-
-# load checkpoint
-model = LitModule.load_from_checkpoint(Path(artifact_dir) / "model.ckpt")
-
-
-

Log media

-

Log text with:

-
# using columns and data
-columns = ["input", "label", "prediction"]
-data = [["cheese", "english", "english"], ["fromage", "french", "spanish"]]
-wandb_logger.log_text(key="samples", columns=columns, data=data)
-
-# using a pandas DataFrame
-wandb_logger.log_text(key="samples", dataframe=my_dataframe)
-
-
-

Log images with:

-
# using tensors, numpy arrays or PIL images
-wandb_logger.log_image(key="samples", images=[img1, img2])
-
-# adding captions
-wandb_logger.log_image(key="samples", images=[img1, img2], caption=["tree", "person"])
-
-# using file path
-wandb_logger.log_image(key="samples", images=["img_1.jpg", "img_2.jpg"])
-
-
-

More arguments can be passed for logging segmentation masks and bounding boxes. Refer to -Image Overlays documentation.

-

Log Tables

-

W&B Tables can be used to log, query and analyze tabular data.

-

They support any type of media (text, image, video, audio, molecule, html, etc) and are great for storing, -understanding and sharing any form of data, from datasets to model predictions.

-
columns = ["caption", "image", "sound"]
-data = [["cheese", wandb.Image(img_1), wandb.Audio(snd_1)], ["wine", wandb.Image(img_2), wandb.Audio(snd_2)]]
-wandb_logger.log_table(key="samples", columns=columns, data=data)
-
-
-
-

See also

- -
-
-
Parameters
-
    -
  • name (Optional[str]) – Display name for the run.

  • -
  • save_dir (Optional[str]) – Path where data is saved (wandb dir by default).

  • -
  • offline (Optional[bool]) – Run offline (data can be streamed later to wandb servers).

  • -
  • id (Optional[str]) – Sets the version, mainly used to resume a previous run.

  • -
  • version (Optional[str]) – Same as id.

  • -
  • anonymous (Optional[bool]) – Enables or explicitly disables anonymous logging.

  • -
  • project (Optional[str]) – The name of the project to which this run will belong.

  • -
  • log_model (Union[str, bool]) –

    Log checkpoints created by ModelCheckpoint -as W&B artifacts. latest and best aliases are automatically set.

    -
      -
    • if log_model == 'all', checkpoints are logged during training.

    • -
    • if log_model == True, checkpoints are logged at the end of training, except when -save_top_k == -1 -which also logs every checkpoint during training.

    • -
    • if log_model == False (default), no checkpoint is logged.

    • -
    -

  • -
  • prefix (Optional[str]) – A string to put at the beginning of metric keys.

  • -
  • experiment – WandB experiment object. Automatically set when creating a run.

  • -
  • **kwargs – Arguments passed to wandb.init() like entity, group, tags, etc.

  • -
-
-
Raises
-
    -
  • ModuleNotFoundError – If required WandB package is not installed on the device.

  • -
  • MisconfigurationException – If both log_model and offline are set to True.

  • -
-
-
-
-
-after_save_checkpoint(checkpoint_callback)[source]
-

Called after model checkpoint callback saves a new checkpoint.

-
-
Parameters
-

checkpoint_callback – the model checkpoint callback instance

-
-
-
- -
-
-finalize(status)[source]
-

Do any processing that is necessary to finalize an experiment.

-
-
Parameters
-

status (str) – Status that the experiment finished with (e.g. success, failed, aborted)

-
-
Return type
-

None

-
-
-
- -
-
-log_hyperparams(params)[source]
-

Record hyperparameters.

-
-
Parameters
-
    -
  • params (Union[Dict[str, Any], Namespace]) – Namespace containing the hyperparameters

  • -
  • args – Optional positional arguments, depends on the specific logger being used

  • -
  • kwargs – Optional keyword arguments, depends on the specific logger being used

  • -
-
-
Return type
-

None

-
-
-
- -
-
-log_image(key, images, step=None, **kwargs)[source]
-

Log images (tensors, numpy arrays, PIL Images or file paths).

-

Optional kwargs are lists passed to each image (ex: caption, masks, boxes).

-
-
Return type
-

None

-
-
-
- -
-
-log_metrics(metrics, step=None)[source]
-

Records metrics. -This method logs metrics as soon as it receives them. If you want to aggregate -metrics for one specific step, use the -agg_and_log_metrics() method.

-
-
Parameters
-
    -
  • metrics (Dict[str, float]) – Dictionary with metric names as keys and measured quantities as values

  • -
  • step (Optional[int]) – Step number at which the metrics should be recorded

  • -
-
-
Return type
-

None

-
-
-
- -
-
-log_table(key, columns=None, data=None, dataframe=None, step=None)[source]
-

Log a Table containing any object type (text, image, audio, video, molecule, html, etc).

-

Can be defined either with columns and data or with dataframe.

-
-
Return type
-

None

-
-
-
- -
-
-log_text(key, columns=None, data=None, dataframe=None, step=None)[source]
-

Log text as a Table.

-

Can be defined either with columns and data or with dataframe.

-
-
Return type
-

None

-
-
-
- -
-
-property experiment: None
-

Actual wandb object. To use wandb features in your -LightningModule do the following.

-

Example:

-
.. code-block:: python
-
-
-
-

self.logger.experiment.some_wandb_function()

-
-
-
Return type
-

None

-
-
-
- -
-
-property name: Optional[str]
-

Gets the name of the experiment.

-
-
Return type
-

Optional[str]

-
-
Returns
-

The name of the experiment if the experiment exists else the name given to the constructor.

-
-
-
- -
-
-property save_dir: Optional[str]
-

Gets the save directory.

-
-
Return type
-

Optional[str]

-
-
Returns
-

The path to the save directory.

-
-
-
- -
-
-property version: Optional[str]
-

Gets the id of the experiment.

-
-
Return type
-

Optional[str]

-
-
Returns
-

The id of the experiment if the experiment exists else the id given to the constructor.

-
-
-
- -
- -
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- -
-
-
- - -
-
-
-
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/extensions/logging.html b/docs/extensions/logging.html deleted file mode 100644 index 9477e51..0000000 --- a/docs/extensions/logging.html +++ /dev/null @@ -1,1058 +0,0 @@ - - - - - - - - - - - - - - Logging — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- - - - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Logging

-
-

Supported Loggers

-

The following are loggers we support:

- ---- - - - - - - - - - - - - - - - - - - - - -

CometLogger

Log using Comet.ml.

CSVLogger

Log to local file system in yaml and CSV format.

MLFlowLogger

Log using MLflow.

NeptuneLogger

Log using Neptune.

TensorBoardLogger

Log to local file system in TensorBoard format.

WandbLogger

Log using Weights and Biases.

-

The above loggers will normally plot an additional chart (global_step VS epoch). Depending on the loggers you use, there might be some additional charts too.

-

By default, Lightning uses TensorBoard logger under the hood, and stores the logs to a directory (by default in lightning_logs/).

-
from pytorch_lightning import Trainer
-
-# Automatically logs to a directory (by default ``lightning_logs/``)
-trainer = Trainer()
-
-
-

To see your logs:

-
tensorboard --logdir=lightning_logs/
-
-
-

To visualize tensorboard in a jupyter notebook environment, run the following command in a jupyter cell:

-
%reload_ext tensorboard
-%tensorboard --logdir=lightning_logs/
-
-
-

You can also pass a custom Logger to the Trainer.

-
from pytorch_lightning import loggers as pl_loggers
-
-tb_logger = pl_loggers.TensorBoardLogger(save_dir="logs/")
-trainer = Trainer(logger=tb_logger)
-
-
-

Choose from any of the others such as MLflow, Comet, Neptune, WandB, etc.

-
comet_logger = pl_loggers.CometLogger(save_dir="logs/")
-trainer = Trainer(logger=comet_logger)
-
-
-

To use multiple loggers, simply pass in a list or tuple of loggers.

-
tb_logger = pl_loggers.TensorBoardLogger(save_dir="logs/")
-comet_logger = pl_loggers.CometLogger(save_dir="logs/")
-trainer = Trainer(logger=[tb_logger, comet_logger])
-
-
-
-

Note

-

By default, Lightning logs every 50 steps. Use Trainer flags to Control Logging Frequency.

-
-
-

Note

-

By default, all loggers log to os.getcwd(). You can change the logging path using -Trainer(default_root_dir="/your/path/to/save/checkpoints") without instantiating a logger.

-
-
-
-
-

Logging from a LightningModule

-

Lightning offers automatic log functionalities for logging scalars, or manual logging for anything else.

-
-

Automatic Logging

-

Use the log() or log_dict() -methods to log from anywhere in a LightningModule and callbacks.

-
def training_step(self, batch, batch_idx):
-    self.log("my_metric", x)
-
-
-# or a dict to get multiple metrics on the same plot if the logger supports it
-def training_step(self, batch, batch_idx):
-    self.log("performance", {"acc": acc, "recall": recall})
-
-
-# or a dict to log all metrics at once with individual plots
-def training_step(self, batch, batch_idx):
-    self.log_dict({"acc": acc, "recall": recall})
-
-
-
-

Note

-

Everything explained below applies to both the log() and log_dict() methods.

-
-

Depending on where the log() method is called, Lightning auto-determines -the correct logging mode for you. Of course you can override the default behavior by manually setting the -log() parameters.

-
def training_step(self, batch, batch_idx):
-    self.log("my_loss", loss, on_step=True, on_epoch=True, prog_bar=True, logger=True)
-
-
-

The log() method has a few options:

-
    -
  • on_step: Logs the metric at the current step.

  • -
  • on_epoch: Automatically accumulates and logs at the end of the epoch.

  • -
  • prog_bar: Logs to the progress bar (Default: False).

  • -
  • logger: Logs to the logger like Tensorboard, or any other custom logger passed to the Trainer (Default: True).

  • -
  • reduce_fx: Reduction function over step values for end of epoch. Uses torch.mean() by default.

  • -
  • enable_graph: If True, will not auto detach the graph.

  • -
  • sync_dist: If True, reduces the metric across devices. Use with care as this may lead to a significant communication overhead.

  • -
  • sync_dist_group: The DDP group to sync across.

  • -
  • add_dataloader_idx: If True, appends the index of the current dataloader to the name (when using multiple dataloaders). If False, user needs to give unique names for each dataloader to not mix the values.

  • -
  • batch_size: Current batch size used for accumulating logs logged with on_epoch=True. This will be directly inferred from the loaded batch, but for some data structures you might need to explicitly provide it.

  • -
  • rank_zero_only: Whether the value will be logged only on rank 0. This will prevent synchronization which would produce a deadlock as not all processes would perform this log call.

  • -
- - ----- - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
Default behavior of logging in Callback or LightningModule

Hook

on_step

on_epoch

on_train_start, on_train_epoch_start, on_train_epoch_end, training_epoch_end

False

True

on_before_backward, on_after_backward, on_before_optimizer_step, on_before_zero_grad

True

False

on_train_batch_start, on_train_batch_end, training_step, training_step_end

True

False

on_validation_start, on_validation_epoch_start, on_validation_epoch_end, validation_epoch_end

False

True

on_validation_batch_start, on_validation_batch_end, validation_step, validation_step_end

False

True

-
-

Note

-

While logging tensor metrics with on_epoch=True inside step-level hooks and using mean-reduction (default) to accumulate the metrics across the current epoch, Lightning tries to extract the -batch size from the current batch. If multiple possible batch sizes are found, a warning is logged and if it fails to extract the batch size from the current batch, which is possible if -the batch is a custom structure/collection, then an error is raised. To avoid this, you can specify the batch_size inside the self.log(... batch_size=batch_size) call.

-
def training_step(self, batch, batch_idx):
-    # extracts the batch size from `batch`
-    self.log("train_loss", loss, on_epoch=True)
-
-
-def validation_step(self, batch, batch_idx):
-    # uses `batch_size=10`
-    self.log("val_loss", loss, batch_size=10)
-
-
-
-
-

Note

-
    -
  • The above config for validation applies for test hooks as well.

  • -
  • Setting on_epoch=True will cache all your logged values during the full training epoch and perform a -reduction in on_train_epoch_end. We recommend using TorchMetrics, when working with custom reduction.

  • -
  • Setting both on_step=True and on_epoch=True will create two keys per metric you log with -suffix _step and _epoch respectively. You can refer to these keys e.g. in the monitor -argument of ModelCheckpoint or in the graphs plotted to the logger of your choice.

  • -
-
-

If your work requires logging from an unsupported method, please open an issue with a clear description of why it is blocking you.

-
-
-

Manual Logging Non-Scalar Artifacts

-

If you want to log anything that is not a scalar, like histograms, text, images, etc., you may need to use the logger object directly.

-
def training_step(self):
-    ...
-    # the logger you used (in this case tensorboard)
-    tensorboard = self.logger.experiment
-    tensorboard.add_image()
-    tensorboard.add_histogram(...)
-    tensorboard.add_figure(...)
-
-
-
-
-
-
-

Make a Custom Logger

-

You can implement your own logger by writing a class that inherits from Logger. -Use the rank_zero_experiment() and rank_zero_only() decorators to make sure that only the first process in DDP training creates the experiment and logs the data respectively.

-
from pytorch_lightning.loggers.logger import Logger, rank_zero_experiment
-from pytorch_lightning.utilities.distributed import rank_zero_only
-
-
-class MyLogger(Logger):
-    @property
-    def name(self):
-        return "MyLogger"
-
-    @property
-    def version(self):
-        # Return the experiment version, int or str.
-        return "0.1"
-
-    @rank_zero_only
-    def log_hyperparams(self, params):
-        # params is an argparse.Namespace
-        # your code to record hyperparameters goes here
-        pass
-
-    @rank_zero_only
-    def log_metrics(self, metrics, step):
-        # metrics is a dictionary of metric names and values
-        # your code to record metrics goes here
-        pass
-
-    @rank_zero_only
-    def save(self):
-        # Optional. Any code necessary to save logger data goes here
-        pass
-
-    @rank_zero_only
-    def finalize(self, status):
-        # Optional. Any code that needs to be run after training
-        # finishes goes here
-        pass
-
-
-

If you write a logger that may be useful to others, please send -a pull request to add it to Lightning!

-
-
-
-

Control Logging Frequency

-
-

Logging frequency

-

It may slow down training to log on every single batch. By default, Lightning logs every 50 rows, or 50 training steps. -To change this behaviour, set the log_every_n_steps Trainer flag.

-
k = 10
-trainer = Trainer(log_every_n_steps=k)
-
-
-
-
-

Log Writing Frequency

-

Individual logger implementations determine their flushing frequency. For example, on the -CSVLogger you can set the flag flush_logs_every_n_steps.

-
-
-
-
-

Progress Bar

-

You can add any metric to the progress bar using log() -method, setting prog_bar=True.

-
def training_step(self, batch, batch_idx):
-    self.log("my_loss", loss, prog_bar=True)
-
-
-

You could learn more about progress bars supported by Lightning here.

-
-

Modifying the Progress Bar

-

The progress bar by default already includes the training loss and version number of the experiment -if you are using a logger. These defaults can be customized by overriding the -get_metrics() hook in your progress bar.

-
from pytorch_lightning.callbacks.progress import Tqdm
-
-
-class CustomProgressBar(Tqdm):
-    def get_metrics(self, *args, **kwargs):
-        # don't show the version number
-        items = super().get_metrics()
-        items.pop("v_num", None)
-        return items
-
-
-
-
-
-
-

Configure Console Logging

-

Lightning logs useful information about the training process and user warnings to the console. -You can retrieve the Lightning console logger and change it to your liking. For example, adjust the logging level -or redirect output for certain modules to log files:

-
import logging
-
-# configure logging at the root level of Lightning
-logging.getLogger("pytorch_lightning").setLevel(logging.ERROR)
-
-# configure logging on module level, redirect to file
-logger = logging.getLogger("pytorch_lightning.core")
-logger.addHandler(logging.FileHandler("core.log"))
-
-
-

Read more about custom Python logging here.

-
-
-
-

Logging Hyperparameters

-

When training a model, it is useful to know what hyperparams went into that model. -When Lightning creates a checkpoint, it stores a key "hyper_parameters" with the hyperparams.

-
lightning_checkpoint = torch.load(filepath, map_location=lambda storage, loc: storage)
-hyperparams = lightning_checkpoint["hyper_parameters"]
-
-
-

Some loggers also allow logging the hyperparams used in the experiment. For instance, -when using the TensorBoardLogger, all hyperparams will show -in the hparams tab.

-
-

Note

-

If you want to track a metric in the tensorboard hparams tab, log scalars to the key hp_metric. If tracking multiple metrics, initialize TensorBoardLogger with default_hp_metric=False and call log_hyperparams only once with your metric keys and initial values. Subsequent updates can simply be logged to the metric keys. Refer to the examples below for setting up proper hyperparams metrics tracking within the LightningModule.

-
# Using default_hp_metric
-def validation_step(self, batch, batch_idx):
-    self.log("hp_metric", some_scalar)
-
-
-# Using custom or multiple metrics (default_hp_metric=False)
-def on_train_start(self):
-    self.logger.log_hyperparams(self.hparams, {"hp/metric_1": 0, "hp/metric_2": 0})
-
-
-def validation_step(self, batch, batch_idx):
-    self.log("hp/metric_1", some_scalar_1)
-    self.log("hp/metric_2", some_scalar_2)
-
-
-

In the example, using "hp/" as a prefix allows for the metrics to be grouped under “hp” in the tensorboard scalar tab where you can collapse them.

-
-
-
-
-

Managing Remote Filesystems

-

Lightning supports saving logs to a variety of filesystems, including local filesystems and several cloud storage providers.

-

Check out the Remote Filesystems doc for more info.

-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright (c) 2018-2022, William Falcon et al. - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/extensions/loops.html b/docs/extensions/loops.html deleted file mode 100644 index 3a7d110..0000000 --- a/docs/extensions/loops.html +++ /dev/null @@ -1,1219 +0,0 @@ - - - - - - - - - - - - - - Loops — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- - - - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Loops

-

Loops let advanced users swap out the default gradient descent optimization loop at the core of Lightning with a different optimization paradigm.

-

The Lightning Trainer is built on top of the standard gradient descent optimization loop which works for 90%+ of machine learning use cases:

-
for i, batch in enumerate(dataloader):
-    x, y = batch
-    y_hat = model(x)
-    loss = loss_function(y_hat, y)
-    optimizer.zero_grad()
-    loss.backward()
-    optimizer.step()
-
-
-

However, some new research use cases such as meta-learning, active learning, recommendation systems, etc., require a different loop structure. -For example here is a simple loop that guides the weight updates with a loss from a special validation split:

-
for i, batch in enumerate(train_dataloader):
-    x, y = batch
-    y_hat = model(x)
-    loss = loss_function(y_hat, y)
-    optimizer.zero_grad()
-    loss.backward()
-
-    val_loss = 0
-    for i, val_batch in enumerate(val_dataloader):
-        x, y = val_batch
-        y_hat = model(x)
-        val_loss += loss_function(y_hat, y)
-
-    scale_gradients(model, 1 / val_loss)
-    optimizer.step()
-
-
-

With Lightning Loops, you can customize the Trainer for non-standard gradient descent optimizations and get the same loop as above:

-
trainer = Trainer()
-trainer.fit_loop.epoch_loop = MyGradientDescentLoop()
-
-
-

Think of this as swapping out the engine in a car!

-
-
-

Understanding the Default Trainer Loop

-

The Lightning Trainer automates the standard optimization loop which every PyTorch user is familiar with:

-
for i, batch in enumerate(dataloader):
-    x, y = batch
-    y_hat = model(x)
-    loss = loss_function(y_hat, y)
-    optimizer.zero_grad()
-    loss.backward()
-    optimizer.step()
-
-
-

The core research logic is simply shifted to the LightningModule:

-
for i, batch in enumerate(dataloader):
-    # x, y = batch                      moved to training_step
-    # y_hat = model(x)                  moved to training_step
-    # loss = loss_function(y_hat, y)    moved to training_step
-    loss = lightning_module.training_step(batch, i)
-
-    # Lightning handles automatically:
-    optimizer.zero_grad()
-    loss.backward()
-    optimizer.step()
-
-
-

Under the hood, the above loop is implemented using the Loop API like so:

-
class DefaultLoop(Loop):
-    def advance(self, batch, i):
-        loss = lightning_module.training_step(batch, i)
-        optimizer.zero_grad()
-        loss.backward()
-        optimizer.step()
-
-    def run(self, dataloader):
-        for i, batch in enumerate(dataloader):
-            self.advance(batch, i)
-
-
-

Defining a loop within a class interface instead of hard-coding a raw Python for/while loop has several benefits:

-
    -
  1. You can have full control over the data flow through loops.

  2. -
  3. You can add new loops and nest as many of them as you want.

  4. -
  5. If needed, the state of a loop can be saved and resumed.

  6. -
  7. New hooks can be injected at any point.

  8. -
-Animation showing how to convert a standard training loop to a Lightning loop -
-
-
-

Overriding the default Loops

-

The fastest way to get started with loops is to override the functionality of an existing loop. -Lightning's Trainer relies on the following main loops: FitLoop for fitting (training and validating), -EvaluationLoop for validating or testing, -and PredictionLoop for predicting.

-

For simple changes that don’t require a custom loop, you can modify each of these loops.

-

Each loop has a series of methods that can be modified. -For example with the FitLoop:

-
from pytorch_lightning.loops import FitLoop
-
-
-class MyLoop(FitLoop):
-    def advance(self):
-        """Advance from one iteration to the next."""
-
-    def on_advance_end(self):
-        """Do something at the end of an iteration."""
-
-    def on_run_end(self):
-        """Do something when the loop ends."""
-
-
-

A full list with all built-in loops and subloops can be found here.

-

To add your own modifications to a loop, simply subclass an existing loop class and override what you need. -Here is a simple example of how to add a new hook:

-
from pytorch_lightning.loops import FitLoop
-
-
-class CustomFitLoop(FitLoop):
-    def advance(self):
-        # ... whatever code before
-
-        # pass anything you want to the hook
-        self.trainer.call_hook("my_new_hook", *args, **kwargs)
-
-        # ... whatever code after
-
-
-

Now simply attach the correct loop in the trainer directly:

-
trainer = Trainer(...)
-trainer.fit_loop = CustomFitLoop()
-
-# fit() now uses the new FitLoop!
-trainer.fit(...)
-
-# the equivalent for validate()
-val_loop = CustomValLoop()
-trainer = Trainer()
-trainer.validate_loop = val_loop
-trainer.validate(...)
-
-
-

Now your code is FULLY flexible and you can still leverage ALL the best parts of Lightning!

-Animation showing how to replace a loop on the Trainer -
-
-
-

Creating a New Loop From Scratch

-

You can also go wild and implement a full loop from scratch by sub-classing the Loop base class. -You will need to override a minimum of two things:

-
from pytorch_lightning.loop import Loop
-
-
-class MyFancyLoop(Loop):
-    @property
-    def done(self):
-        """Provide a condition to stop the loop."""
-
-    def advance(self):
-        """
-        Access your dataloader/s in whatever way you want.
-        Do your fancy optimization things.
-        Call the LightningModule methods at your leisure.
-        """
-
-
-

Finally, attach it into the Trainer:

-
trainer = Trainer(...)
-trainer.fit_loop = MyFancyLoop()
-
-# fit() now uses your fancy loop!
-trainer.fit(...)
-
-
-

But beware: Loop customization gives you more power and full control over the Trainer and with great power comes great responsibility. -We recommend that you familiarize yourself with overriding the default loops first before you start building a new loop from the ground up.

-
-
-
-

Loop API

-

Here is the full API of methods available in the Loop base class.

-

The Loop class is the base of all loops in the same way as the LightningModule is the base of all models. -It defines a public interface that each loop implementation must follow; the key members are:

-
-

Properties

-
-

done

-
-
-Loop.done
-

Property indicating when the loop is finished.

-

Example:

-
@property
-def done(self):
-    return self.trainer.global_step >= self.trainer.max_steps
-
-
-
-
Return type
-

bool

-
-
-
- -
-
-

skip (optional)

-
-
-Loop.skip
-

Determine whether to return immediately from the call to run().

-

Example:

-
@property
-def skip(self):
-    return len(self.trainer.train_dataloader) == 0
-
-
-
-
Return type
-

bool

-
-
-
- -
-
-
-

Methods

-
-

reset (optional)

-
-
-abstract Loop.reset()[source]
-

Resets the internal state of the loop at the beginning of each call to run.

-

Example:

-
def reset(self):
-    # reset your internal state or add custom logic
-    # if you expect run() to be called multiple times
-    self.current_iteration = 0
-    self.outputs = []
-
-
-
-
Return type
-

None

-
-
-
- -
-
-

advance

-
-
-abstract Loop.advance(*args, **kwargs)[source]
-

Performs a single step.

-

Accepts all arguments passed to run.

-

Example:

-
def advance(self, iterator):
-    batch = next(iterator)
-    loss = self.trainer.lightning_module.training_step(batch, batch_idx)
-    ...
-
-
-
-
Return type
-

None

-
-
-
- -
-
-

run (optional)

-
-
-Loop.run(*args, **kwargs)[source]
-

The main entry point to the loop.

-

Repeatedly checks the done condition and calls advance -until done evaluates to True.

-

Override this if you wish to change the default behavior. The default implementation is:

-

Example:

-
def run(self, *args, **kwargs):
-    if self.skip:
-        return self.on_skip()
-
-    self.reset()
-    self.on_run_start(*args, **kwargs)
-
-    while not self.done:
-        self.advance(*args, **kwargs)
-
-    output = self.on_run_end()
-    return output
-
-
-
-
Return type
-

~T

-
-
Returns
-

The output of on_run_end (often outputs collected from each step of the loop)

-
-
-
- -
-
-
-
-
-

Subloops

-

When you want to customize nested loops within loops, use the replace() method:

-
# This takes care of properly instantiating the new Loop and setting all references
-trainer.fit_loop.replace(epoch_loop=MyEpochLoop)
-# Trainer runs the fit loop with your new epoch loop!
-trainer.fit(model)
-
-
-

Alternatively, for more fine-grained control, use the connect() method:

-
# Optional: stitch back the trainer arguments
-epoch_loop = MyEpochLoop(trainer.fit_loop.epoch_loop.min_steps, trainer.fit_loop.epoch_loop.max_steps)
-# Optional: connect children loops as they might have existing state
-epoch_loop.connect(trainer.fit_loop.epoch_loop.batch_loop, trainer.fit_loop.epoch_loop.val_loop)
-# Instantiate and connect the loop.
-trainer.fit_loop.connect(epoch_loop=epoch_loop)
-trainer.fit(model)
-
-
-

More about the built-in loops and how they are composed is explained in the next section.

-Animation showing how to connect a custom subloop -
-
-
-

Built-in Loops

-

The training loop in Lightning is called fit loop and is actually a combination of several loops. -Here is what the structure would look like in plain Python:

-
# FitLoop
-for epoch in range(max_epochs):
-
-    # TrainingEpochLoop
-    for batch_idx, batch in enumerate(train_dataloader):
-
-        # TrainingBatchLoop
-        for split_batch in tbptt_split(batch):
-
-            # OptimizerLoop
-            for optimizer_idx, opt in enumerate(optimizers):
-
-                loss = lightning_module.training_step(batch, batch_idx, optimizer_idx)
-                ...
-
-        # ValidationEpochLoop
-        for batch_idx, batch in enumerate(val_dataloader):
-            lightning_module.validation_step(batch, batch_idx, optimizer_idx)
-            ...
-
-
-

Each of these for-loops represents a class implementing the Loop interface.

- - ---- - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
Trainer entry points and associated loops

Built-in loop

Description

FitLoop

The FitLoop is the top-level loop where training starts. -It simply counts the epochs and iterates from one to the next by calling TrainingEpochLoop.run() in its advance() method.

TrainingEpochLoop

The TrainingEpochLoop is the one that iterates over the dataloader that the user returns in their train_dataloader() method. -Its main responsibilities are calling the *_epoch_start and *_epoch_end hooks, accumulating outputs if the user requests them in one of these hooks, and running validation at the requested interval. -The validation is carried out by yet another loop, ValidationEpochLoop.

-

In the run() method, the training epoch loop could in theory simply call the LightningModule.training_step already and perform the optimization. -However, Lightning has built-in support for automatic optimization with multiple optimizers and on top of that also supports TBPTT. -For this reason there are actually two more loops nested under TrainingEpochLoop.

-

TrainingBatchLoop

The responsibility of the TrainingBatchLoop is to split a batch given by the TrainingEpochLoop along the time-dimension and iterate over the list of splits. -It also keeps track of the hidden state hiddens returned by the training step. -By default, when truncated back-propagation through time (TBPTT) is turned off, this loop does not do anything except redirect the call to the OptimizerLoop. -Read more about TBPTT.

OptimizerLoop

The OptimizerLoop iterates over one or multiple optimizers and for each one it calls the training_step() method with the batch, the current batch index and the optimizer index if multiple optimizers are requested. -It is the leaf node in the tree of loops and performs the actual optimization (forward, zero grad, backward, optimizer step).

ManualOptimization

Substitutes the OptimizerLoop in case of manual optimization and implements the manual optimization step.

EvaluationLoop

The EvaluationLoop is the top-level loop where validation/testing starts. -It simply iterates over each evaluation dataloader from one to the next by calling EvaluationEpochLoop.run() in its advance() method.

PredictionLoop

The PredictionLoop is the top-level loop where prediction starts. -It simply iterates over each prediction dataloader from one to the next by calling PredictionEpochLoop.run() in its advance() method.

-
-
-
-

Available Loops in Lightning Flash

-

Active Learning is a machine learning practice in which the user interacts with the learner in order to provide new labels when required.

-

You can find a real use case in Lightning Flash.

-

Flash implements the ActiveLearningLoop that you can use together with the ActiveLearningDataModule to label new data on the fly. -To run the following demo, install Flash and BaaL first:

-
pip install lightning-flash baal
-
-
-
import torch
-
-import flash
-from flash.core.classification import Probabilities
-from flash.core.data.utils import download_data
-from flash.image import ImageClassificationData, ImageClassifier
-from flash.image.classification.integrations.baal import ActiveLearningDataModule, ActiveLearningLoop
-
-# 1. Create the DataModule
-download_data("https://pl-flash-data.s3.amazonaws.com/hymenoptera_data.zip", "./data")
-
-# Implement the research use-case where we mask labels from labelled dataset.
-datamodule = ActiveLearningDataModule(
-    ImageClassificationData.from_folders(train_folder="data/hymenoptera_data/train/", batch_size=2),
-    initial_num_labels=5,
-    val_split=0.1,
-)
-
-# 2. Build the task
-head = torch.nn.Sequential(
-    torch.nn.Dropout(p=0.1),
-    torch.nn.Linear(512, datamodule.num_classes),
-)
-model = ImageClassifier(backbone="resnet18", head=head, num_classes=datamodule.num_classes, output=Probabilities())
-
-
-# 3.1 Create the trainer
-trainer = flash.Trainer(max_epochs=3)
-
-# 3.2 Create the active learning loop and connect it to the trainer
-active_learning_loop = ActiveLearningLoop(label_epoch_frequency=1)
-active_learning_loop.connect(trainer.fit_loop)
-trainer.fit_loop = active_learning_loop
-
-# 3.3 Finetune
-trainer.finetune(model, datamodule=datamodule, strategy="freeze")
-
-# 4. Predict what's on a few images! ants or bees?
-predictions = model.predict("data/hymenoptera_data/val/bees/65038344_52a45d090d.jpg")
-print(predictions)
-
-# 5. Save the model!
-trainer.save_checkpoint("image_classification_model.pt")
-
-
-

Here is the Active Learning Loop example and the code for the active learning loop.

-
-
-
-

Advanced Examples

- - ---- - - - - - - - - - - - - - -
Ready-to-run loop examples and tutorials

Link to Example

Description

K-fold Cross Validation

KFold / Cross Validation is a machine learning practice in which the training dataset is being partitioned into num_folds complementary subsets. -One cross validation round will perform fitting where one fold is left out for validation and the other folds are used for training. -To reduce variability, once all rounds are performed using the different folds, the trained models are ensembled and their predictions are -averaged when estimating the model’s predictive performance on the test dataset.

Yielding Training Step

This loop enables you to write the training_step() hook -as a Python Generator for automatic optimization with multiple optimizers, i.e., you can yield loss -values from it instead of returning them. This can enable more elegant and expressive implementations, as -shown with a GAN in this example.

-
-
-
-

Advanced Features

-

Next: Advanced loop features

-
-
- - -
- -
-
- - - - - - -
- - - -
-

- © Copyright (c) 2018-2022, William Falcon et al. - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/extensions/loops_advanced.html b/docs/extensions/loops_advanced.html deleted file mode 100644 index 11d6830..0000000 --- a/docs/extensions/loops_advanced.html +++ /dev/null @@ -1,721 +0,0 @@ - - - - - - - - - - - - - - Loops (Advanced) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- - - - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Loops (Advanced)

-
-

Persisting the State of Loops

-
-

Note

-

This is an experimental feature and is not activated by default. -Set the environment variable PL_FAULT_TOLERANT_TRAINING = 1 to enable saving the progress of loops. -Read more about fault-tolerant training.

-
-

A powerful property of the class-based loop interface is that it can own an internal state. -Loop instances can save their state to the checkpoint through corresponding hooks and if implemented accordingly, resume the state of execution at the appropriate place. -This design is particularly interesting for fault-tolerant training which is an experimental feature released in Lightning v1.5.

-

The two hooks on_save_checkpoint() and on_load_checkpoint() function very similarly to how LightningModules and Callbacks save and load state.

-
def on_save_checkpoint(self):
-    state_dict["iteration"] = self.iteration
-    return state_dict
-
-
-def on_load_checkpoint(self, state_dict):
-    self.iteration = state_dict["iteration"]
-
-
-

When the Trainer is restarting from a checkpoint (e.g., through trainer.fit(ckpt_path=...)), the loop exposes a boolean attribute restarting. -Based on the value of this variable, the user can write the loop in such a way that it can restart from an arbitrary point given the state loaded from the checkpoint. -For example, the implementation of the reset() method could look like this given our previous example:

-
def reset(self):
-    if not self.restarting:
-        self.iteration = 0
-
-
-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright (c) 2018-2022, William Falcon et al. - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/extensions/plugins.html b/docs/extensions/plugins.html deleted file mode 100644 index 9da9dc2..0000000 --- a/docs/extensions/plugins.html +++ /dev/null @@ -1,834 +0,0 @@ - - - - - - - - - - - - - - Plugins — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- - - - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Plugins

-

Plugins allow custom integrations to the internals of the Trainer such as custom precision, checkpointing or -cluster environment implementation.

-

Under the hood, the Lightning Trainer is using plugins in the training routine, added automatically -depending on the provided Trainer arguments.

-

There are three types of Plugins in Lightning with different responsibilities:

-
    -
  • Precision Plugins

  • -
  • CheckpointIO Plugins

  • -
  • Cluster Environments

  • -
-

You can make the Trainer use one or multiple plugins by adding them to the plugins argument like so:

-
trainer = Trainer(plugins=[plugin1, plugin2, ...])
-
-
-

By default, the plugins get selected based on the rest of the Trainer settings such as the strategy.

-
-
-

Precision Plugins

-

We provide precision plugins for you to benefit from numerical representations with lower precision than -32-bit floating-point or higher precision, such as 64-bit floating-point.

-
# Training with 16-bit precision
-trainer = Trainer(precision=16)
-
-
-

The full list of built-in precision plugins is listed below.

- ---- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -

ApexMixedPrecisionPlugin

Mixed Precision Plugin based on Nvidia/Apex (https://github.com/NVIDIA/apex)

DeepSpeedPrecisionPlugin

Precision plugin for DeepSpeed integration.

DoublePrecisionPlugin

Plugin for training with double (torch.float64) precision.

FullyShardedNativeMixedPrecisionPlugin

Native AMP for Fully Sharded Training.

HPUPrecisionPlugin

Plugin that enables bfloat/half support on HPUs.

IPUPrecisionPlugin

Precision plugin for IPU integration.

MixedPrecisionPlugin

Base Class for mixed precision.

NativeMixedPrecisionPlugin

Plugin for Native Mixed Precision (AMP) training with torch.autocast.

PrecisionPlugin

Base class for all plugins handling the precision-specific parts of the training.

ShardedNativeMixedPrecisionPlugin

Native AMP for Sharded Training.

TPUBf16PrecisionPlugin

Plugin that enables bfloats on TPUs.

TPUPrecisionPlugin

Precision plugin for TPU integration.

-

More information regarding precision with Lightning can be found here

-
-
-
-

CheckpointIO Plugins

-

As part of our commitment to extensibility, we have abstracted Lightning’s checkpointing logic into the CheckpointIO plugin. -With this, you have the ability to customize the checkpointing logic to match the needs of your infrastructure.

-

Below is a list of built-in plugins for checkpointing.

- ---- - - - - - - - - - - - - - - -

CheckpointIO

Interface to save/load checkpoints as they are saved through the Strategy.

HPUCheckpointIO

CheckpointIO to save checkpoints for HPU training strategies.

TorchCheckpointIO

CheckpointIO that utilizes torch.save() and torch.load() to save and load checkpoints respectively, common for most use cases.

XLACheckpointIO

CheckpointIO that utilizes xm.save() to save checkpoints for TPU training strategies.

-

Learn more about custom checkpointing with Lightning here.

-
-
-
-

Cluster Environments

-

You can define the interface of your own cluster environment based on the requirements of your infrastructure.

- ---- - - - - - - - - - - - - - - - - - - - - -

ClusterEnvironment

Specification of a cluster environment.

KubeflowEnvironment

Environment for distributed training using the PyTorchJob operator from Kubeflow

LightningEnvironment

The default environment used by Lightning for a single node or free cluster (not managed).

LSFEnvironment

An environment for running on clusters managed by the LSF resource manager.

SLURMEnvironment

Cluster environment for training on a cluster managed by SLURM.

TorchElasticEnvironment

Environment for fault-tolerant and elastic training with torchelastic

-
-
- - -
- -
-
- - - - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/extensions/strategy.html b/docs/extensions/strategy.html deleted file mode 100644 index 599b65d..0000000 --- a/docs/extensions/strategy.html +++ /dev/null @@ -1,825 +0,0 @@ - - - - - - - - - - - - - - What is a Strategy? — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • What is a Strategy?
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

What is a Strategy?

-

Strategy controls the model distribution across training, evaluation, and prediction to be used by the Trainer. It can be controlled by passing a -strategy alias ("ddp", "ddp_spawn", "deepspeed" and so on) or a custom strategy instance to the strategy parameter of the Trainer.

-

The Strategy in PyTorch Lightning handles the following responsibilities:

-
    -
  • Launch and teardown of training processes (if applicable).

  • -
  • Setup communication between processes (NCCL, GLOO, MPI, and so on).

  • -
  • Provide a unified communication interface for reduction, broadcast, and so on.

  • -
  • Owns the LightningModule

  • -
  • Handles/owns optimizers and schedulers.

  • -
-

Strategy also manages the accelerator, precision, and checkpointing plugins.

-Illustration of the Strategy as a composition of the Accelerator and several plugins -

We expose Strategies mainly for expert users that want to extend Lightning for new hardware support or new distributed backends (e.g. a backend not yet supported by PyTorch itself).

-
-
-
-

Enable Different Strategies

-
# Training with the DistributedDataParallel strategy on 4 GPUs
-trainer = Trainer(strategy="ddp", accelerator="gpu", devices=4)
-
-# Training with the custom DistributedDataParallel strategy on 4 GPUs
-trainer = Trainer(strategy=DDPStrategy(...), accelerator="gpu", devices=4)
-
-# Training with the DDP Spawn strategy using auto accelerator selection
-trainer = Trainer(strategy="ddp_spawn", accelerator="auto", devices=4)
-
-# Training with the DeepSpeed strategy on available GPUs
-trainer = Trainer(strategy="deepspeed", accelerator="gpu", devices="auto")
-
-# Training with the DDP strategy using 3 CPU processes
-trainer = Trainer(strategy="ddp", accelerator="cpu", devices=3)
-
-# Training with the DDP Spawn strategy on 8 TPU cores
-trainer = Trainer(strategy="ddp_spawn", accelerator="tpu", devices=8)
-
-# Training with the default IPU strategy on 8 IPUs
-trainer = Trainer(accelerator="ipu", devices=8)
-
-
-
-
-
-

Create a Custom Strategy

-

Expert users may choose to extend an existing strategy by overriding its methods.

-
from pytorch_lightning.strategies import DDPStrategy
-
-
-class CustomDDPStrategy(DDPStrategy):
-    def configure_ddp(self):
-        self.model = MyCustomDistributedDataParallel(
-            self.model,
-            device_ids=...,
-        )
-
-
-

or by subclassing the base class Strategy to create new ones. These custom strategies -can then be passed into the Trainer directly via the strategy parameter.

-
# custom plugins
-trainer = Trainer(strategy=CustomDDPStrategy())
-
-# fully custom accelerator and plugins
-accelerator = MyAccelerator()
-precision_plugin = MyPrecisionPlugin()
-training_strategy = CustomDDPStrategy(accelerator=accelerator, precision_plugin=precision_plugin)
-trainer = Trainer(strategy=training_strategy)
-
-
-

The complete list of built-in strategies is listed below.

-
-
-
-

Available Training Strategies

- ---- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -

BaguaStrategy

Strategy for training using the Bagua library, with advanced distributed training algorithms and system optimizations.

DDP2Strategy

DDP2 behaves like DP in one node, but synchronization across nodes behaves like in DDP.

DDPFullyShardedStrategy

Plugin for Fully Sharded Data Parallel provided by FairScale.

DDPShardedStrategy

Optimizer and gradient sharded training provided by FairScale.

DDPSpawnShardedStrategy

Optimizer sharded training provided by FairScale.

DDPSpawnStrategy

Spawns processes using the torch.multiprocessing.spawn() method and joins processes after training finishes.

DDPStrategy

Strategy for multi-process single-device training on one or multiple nodes.

DataParallelStrategy

Implements data-parallel training in a single process, i.e., the model gets replicated to each device and each gets a split of the data.

DeepSpeedStrategy

Provides capabilities to run training using the DeepSpeed library, with training optimizations for large billion parameter models.

HorovodStrategy

Plugin for Horovod distributed training integration.

HPUParallelStrategy

Strategy for distributed training on multiple HPU devices.

IPUStrategy

Plugin for training on IPU devices.

ParallelStrategy

Plugin for training with multiple processes in parallel.

SingleDeviceStrategy

Strategy that handles communication on a single device.

SingleHPUStrategy

Strategy for training on single HPU device.

SingleTPUStrategy

Strategy for training on a single TPU device.

Strategy

Base class for all strategies that change the behaviour of the training, validation and test loops.

TPUSpawnStrategy

Strategy for training multiple TPU devices using the torch_xla.distributed.xla_multiprocessing.spawn() method.

-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/generate_docs_for_tags.sh b/docs/generate_docs_for_tags.sh new file mode 100644 index 0000000..a354421 --- /dev/null +++ b/docs/generate_docs_for_tags.sh @@ -0,0 +1,59 @@ +#!/bin/bash +# Usage: +# 1. Generate docs with one or more specified versions: +# $ export PACKAGE_NAME=app +# $ bash docs/generate_docs_for_tags.sh 1.9.3 1.9.2 1.9.1 1.9.0 +# OR +# $ PACKAGE_NAME=pytorch bash docs/generate_docs_for_tags.sh 1.8.6 1.8.5 1.8.4 1.8.3 1.8.2 1.8.1 1.8.0 +set -e + +PATH_ROOT=~/Desktop/builds +PATH_ENV=$PATH_ROOT/venv-docs-$PACKAGE_NAME +# export PACKAGE_NAME=app +export FREEZE_REQUIREMENTS=1 + +echo PATH_ROOT: $PATH_ROOT +echo PATH_ENV: $PATH_ENV +echo PYTHONPATH: $PYTHONPATH + +function build_docs { + python --version + pip --version + + pip install -q setuptools wheel python-multipart + pip install -e . -q -r requirements/$PACKAGE_NAME/docs.txt \ + -f ../pypi -f https://download.pytorch.org/whl/cpu/torch_stable.html + pip list + + cd docs/source-$PACKAGE_NAME + make html --jobs=$(nproc) + # make html SPHINXOPTS="-W --keep-going" --jobs=$(nproc) + cd ../.. + + mkdir -p $PATH_ROOT/docs-${PACKAGE_NAME} + mv docs/build/html $PATH_ROOT/docs-${PACKAGE_NAME}/$tag +} + +# iterate over all arguments assuming that each argument is version +for tag in "$@" +do + echo processing version: $tag + + # Don't install/update anything before activating venv + # to avoid breaking any existing environment. + python -m venv $PATH_ENV + source $PATH_ENV/bin/activate + + cd $PATH_ROOT + git clone --single-branch --branch $tag --depth 1 --recurse-submodules \ + https://github.com/Lightning-AI/lightning.git + cd lightning + + build_docs > "$PATH_ROOT/building-${PACKAGE_NAME}_${tag}.log" + + cd .. 
+ rm -rf lightning + + deactivate + rm -rf $PATH_ENV +done diff --git a/docs/genindex.html b/docs/genindex.html deleted file mode 100644 index 7e2a533..0000000 --- a/docs/genindex.html +++ /dev/null @@ -1,2117 +0,0 @@ - - - - - - - - - - - - - Index — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- - - - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- - -

Index

- -
- Symbols - | A - | B - | C - | D - | E - | F - | G - | H - | I - | K - | L - | M - | N - | O - | P - | Q - | R - | S - | T - | U - | V - | W - | Z - -
-

Symbols

- - - -
- -

A

- - - -
- -

B

- - - -
- -

C

- - - -
- -

D

- - - -
- -

E

- - - -
- -

F

- - - -
- -

G

- - - -
- -

H

- - - -
- -

I

- - - -
- -

K

- - -
- -

L

- - - -
- -

M

- - - -
- -

N

- - - -
- -

O

- - - -
- -

P

- - - -
- -

Q

- - - -
- -

R

- - - -
- -

S

- - - -
- -

T

- - - -
- -

U

- - - -
- -

V

- - - -
- -

W

- - - -
- -

Z

- - - -
- - - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- -
-
-
- -
-
-
-
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/guides/data.html b/docs/guides/data.html deleted file mode 100644 index 60657e8..0000000 --- a/docs/guides/data.html +++ /dev/null @@ -1,1088 +0,0 @@ - - - - - - - - - - - - - - Managing Data — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- - - - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Managing Data

-
-

Data Containers in Lightning

-

There are a few different data containers used in Lightning:

- - ---- - - - - - - - - - - - - - - - - - - - -
Data objects

Object

Definition

Dataset

The PyTorch Dataset represents a map from keys to data samples.

IterableDataset

The PyTorch IterableDataset represents a stream of data.

DataLoader

The PyTorch DataLoader represents a Python iterable over a Dataset.

LightningDataModule

A LightningDataModule is simply a collection of: training DataLoader(s), validation DataLoader(s), test DataLoader(s) and predict DataLoader(s), along with the matching transforms and data processing/downloads steps required.

-
-

Why Use LightningDataModule?

-

The LightningDataModule was designed as a way of decoupling data-related hooks from the LightningModule so you can develop dataset agnostic models. The LightningDataModule makes it easy to hot swap different Datasets with your model, so you can test it and benchmark it across domains. It also makes sharing and reusing the exact data splits and transforms across projects possible.

-

Read this for more details on LightningDataModule.

-
-
-
-
-

Multiple Datasets

-

There are a few ways to pass multiple Datasets to Lightning:

-
    -
  1. Create a DataLoader that iterates over multiple Datasets under the hood.

  2. -
  3. In the training loop, you can pass multiple DataLoaders as a dict or list/tuple, and Lightning will -automatically combine the batches from different DataLoaders.

  4. -
  5. In the validation, test, or prediction loop, you have the option to return multiple DataLoaders as list/tuple, which Lightning will call sequentially, -or to combine the DataLoaders using CombinedLoader, in which case Lightning will -automatically combine the batches from different DataLoaders.

  6. -
-
-

Using LightningDataModule

-

You can set more than one DataLoader in your LightningDataModule using its DataLoader hooks -and Lightning will use the correct one.

-
class DataModule(LightningDataModule):
-
-    ...
-
-    def train_dataloader(self):
-        return DataLoader(self.train_dataset)
-
-    def val_dataloader(self):
-        return [DataLoader(self.val_dataset_1), DataLoader(self.val_dataset_2)]
-
-    def test_dataloader(self):
-        return DataLoader(self.test_dataset)
-
-    def predict_dataloader(self):
-        return DataLoader(self.predict_dataset)
-
-
-
-
-

Using LightningModule Hooks

-
-

Concatenated Dataset

-

For training with multiple Datasets, you can create a DataLoader class -which wraps your multiple Datasets using ConcatDataset. This, of course, -also works for testing, validation, and prediction Datasets.

-
from torch.utils.data import ConcatDataset
-
-
-class LitModel(LightningModule):
-    def train_dataloader(self):
-        concat_dataset = ConcatDataset([datasets.ImageFolder(traindir_A), datasets.ImageFolder(traindir_B)])
-
-        loader = DataLoader(
-            concat_dataset, batch_size=args.batch_size, shuffle=True, num_workers=args.workers, pin_memory=True
-        )
-        return loader
-
-    def val_dataloader(self):
-        # SAME
-        ...
-
-    def test_dataloader(self):
-        # SAME
-        ...
-
-
-
-
-

Return Multiple DataLoaders

-

You can set multiple DataLoaders in your LightningModule, and Lightning will take care of batch combination.

-

For more details, refer to multiple_trainloader_mode

-
class LitModel(LightningModule):
-    def train_dataloader(self):
-
-        loader_a = DataLoader(range(6), batch_size=4)
-        loader_b = DataLoader(range(15), batch_size=5)
-
-        # pass loaders as a dict. This will create batches like this:
-        # {'a': batch from loader_a, 'b': batch from loader_b}
-        loaders = {"a": loader_a, "b": loader_b}
-
-        # OR:
-        # pass loaders as sequence. This will create batches like this:
-        # [batch from loader_a, batch from loader_b]
-        loaders = [loader_a, loader_b]
-
-        return loaders
-
-
-

Furthermore, Lightning also supports nested lists and dicts (or a combination).

-
class LitModel(LightningModule):
-    def train_dataloader(self):
-
-        loader_a = DataLoader(range(8), batch_size=4)
-        loader_b = DataLoader(range(16), batch_size=2)
-
-        return {"a": loader_a, "b": loader_b}
-
-    def training_step(self, batch, batch_idx):
-        # access a dictionary with a batch from each DataLoader
-        batch_a = batch["a"]
-        batch_b = batch["b"]
-
-
-
class LitModel(LightningModule):
-    def train_dataloader(self):
-
-        loader_a = DataLoader(range(8), batch_size=4)
-        loader_b = DataLoader(range(16), batch_size=4)
-        loader_c = DataLoader(range(32), batch_size=4)
-        loader_d = DataLoader(range(64), batch_size=4)
-
-        # pass loaders as a nested dict. This will create batches like this:
-        loaders = {"loaders_a_b": [loader_a, loader_b], "loaders_c_d": {"c": loader_c, "d": loader_d}}
-        return loaders
-
-    def training_step(self, batch, batch_idx):
-        # access the data
-        batch_a_b = batch["loaders_a_b"]
-        batch_c_d = batch["loaders_c_d"]
-
-        batch_a = batch_a_b[0]
-        batch_b = batch_a_b[1]
-
-        batch_c = batch_c_d["c"]
-        batch_d = batch_c_d["d"]
-
-
-

Alternatively, you can also pass in a CombinedLoader containing multiple DataLoaders.

-
from pytorch_lightning.trainer.supporters import CombinedLoader
-
-
-def train_dataloader(self):
-    loader_a = DataLoader()
-    loader_b = DataLoader()
-    loaders = {"a": loader_a, "b": loader_b}
-    combined_loader = CombinedLoader(loaders, mode="max_size_cycle")
-    return combined_loader
-
-
-def training_step(self, batch, batch_idx):
-    batch_a = batch["a"]
-    batch_b = batch["b"]
-
-
-
-
-
-

Multiple Validation/Test/Predict DataLoaders

-

For validation, test and predict DataLoaders, you can pass a single DataLoader or a list of them. This optional named -parameter can be used in conjunction with any of the above use cases. You can choose to pass -the batches sequentially or simultaneously, as is done for the training step. -The default mode for these DataLoaders is sequential. Note that when using a sequence of DataLoaders you need -to add an additional argument dataloader_idx in their corresponding step specific hook. The corresponding loop will process -the DataLoaders in sequential order; that is, the first DataLoader will be processed completely, then the second one, and so on.

-

Refer to the following for more details for the default sequential option:

-
    -
  • val_dataloader()

  • -
  • test_dataloader()

  • -
  • predict_dataloader()

  • -
-
def val_dataloader(self):
-    loader_1 = DataLoader()
-    loader_2 = DataLoader()
-    return [loader_1, loader_2]
-
-
-def validation_step(self, batch, batch_idx, dataloader_idx):
-    ...
-
-
-

Evaluation DataLoaders are iterated over sequentially. If you want to iterate over them in parallel, PyTorch Lightning provides a CombinedLoader object which supports collections of DataLoaders such as list, tuple, or dictionary. The DataLoaders can be accessed in the same way as the provided structure:

-
from pytorch_lightning.trainer.supporters import CombinedLoader
-
-
-def val_dataloader(self):
-    loader_a = DataLoader()
-    loader_b = DataLoader()
-    loaders = {"a": loader_a, "b": loader_b}
-    combined_loaders = CombinedLoader(loaders, mode="max_size_cycle")
-    return combined_loaders
-
-
-def validation_step(self, batch, batch_idx):
-    batch_a = batch["a"]
-    batch_b = batch["b"]
-
-
-
-
-

Evaluate with Additional DataLoaders

-

You can evaluate your models using additional DataLoaders even if the DataLoader specific hooks haven’t been defined within your -LightningModule. For example, this would be the case if your test data -set is not available at the time your model was declared. Simply pass the test set to the test() method:

-
# setup your DataLoader
-test = DataLoader(...)
-
-# test (pass in the loader)
-trainer.test(dataloaders=test)
-
-
-
-
-
-
-

Accessing DataLoaders within LightningModule

-

In the case that you require access to the DataLoader or Dataset objects, DataLoaders for each step can be accessed using the Trainer object:

-
from pytorch_lightning import LightningModule
-
-
-class Model(LightningModule):
-    def test_step(self, batch, batch_idx, dataloader_idx):
-        test_dl = self.trainer.test_dataloaders[dataloader_idx]
-        test_dataset = test_dl.dataset
-        test_sampler = test_dl.sampler
-        ...
-        # extract metadata, etc. from the dataset:
-        ...
-
-
-

If you are using a CombinedLoader object, which allows you to fetch batches from a collection of DataLoaders -simultaneously and supports collections of DataLoaders such as list, tuple, or dictionary, the DataLoaders can be accessed using the same collection structure:

-
from pytorch_lightning.trainer.supporters import CombinedLoader
-
-test_dl1 = ...
-test_dl2 = ...
-
-# If you provided a list of DataLoaders:
-
-combined_loader = CombinedLoader([test_dl1, test_dl2])
-list_of_loaders = combined_loader.loaders
-test_dl1 = list_of_loaders[0]
-
-
-# If you provided dictionary of DataLoaders:
-
-combined_loader = CombinedLoader({"dl1": test_dl1, "dl2": test_dl2})
-dictionary_of_loaders = combined_loader.loaders
-test_dl1 = dictionary_of_loaders["dl1"]
-
-
-
-
-
-

Sequential Data

-

Lightning has built in support for dealing with sequential data.

-
-

Packed Sequences as Inputs

-

When using PackedSequence, do two things:

-
    -
  1. Return either a padded tensor in dataset or a list of variable length tensors in the DataLoader’s collate_fn (example shows the list implementation).

  2. -
  3. Pack the sequence in forward or training and validation steps depending on use case.

  4. -
-
-

-
-
# For use in DataLoader
-def collate_fn(batch):
-    x = [item[0] for item in batch]
-    y = [item[1] for item in batch]
-    return x, y
-
-
-# In LightningModule
-def training_step(self, batch, batch_idx):
-    x = rnn.pack_sequence(batch[0], enforce_sorted=False)
-    y = rnn.pack_sequence(batch[1], enforce_sorted=False)
-
-
-
-
-

Truncated Backpropagation Through Time (TBPTT)

-

There are times when multiple backwards passes are needed for each batch. -For example, it may save memory to use Truncated Backpropagation Through Time when training RNNs.

-

Lightning can handle TBPTT automatically via this flag.

-
from pytorch_lightning import LightningModule
-
-
-class MyModel(LightningModule):
-    def __init__(self):
-        super().__init__()
-        # Important: This property activates truncated backpropagation through time
-        # Setting this value to 2 splits the batch into sequences of size 2
-        self.truncated_bptt_steps = 2
-
-    # Truncated back-propagation through time
-    def training_step(self, batch, batch_idx, hiddens):
-        # the training step must be updated to accept a ``hiddens`` argument
-        # hiddens are the hiddens from the previous truncated backprop step
-        out, hiddens = self.lstm(data, hiddens)
-        return {"loss": ..., "hiddens": hiddens}
-
-
-
-

Note

-

If you need to modify how the batch is split, -override tbptt_split_batch().

-
-
-
-

Iterable Datasets

-

Lightning supports using IterableDataset as well as map-style Datasets. IterableDatasets provide a more natural -option when using sequential data.

-
-

Note

-

When using an IterableDataset you must set the val_check_interval to 1.0 (the default) or an int -(specifying the number of training batches to run before each validation loop) when initializing the Trainer. This is -because the IterableDataset does not have a __len__ and Lightning requires this to calculate the validation -interval when val_check_interval is less than one. Similarly, you can set limit_{mode}_batches to a float or -an int. If it is set to 0.0 or 0, it will set num_{mode}_batches to 0, if it is an int, it will set num_{mode}_batches -to limit_{mode}_batches, if it is set to 1.0 it will run for the whole dataset, otherwise it will throw an exception. -Here mode can be train/val/test/predict.

-
-

When iterable datasets are used, Lightning will pre-fetch 1 batch (in addition to the current batch) so it can detect -when the training will stop and run validation if necessary.

-
# IterableDataset
-class CustomDataset(IterableDataset):
-    def __init__(self, data):
-        self.data_source = data
-
-    def __iter__(self):
-        return iter(self.data_source)
-
-
-# Setup DataLoader
-def train_dataloader(self):
-    seq_data = ["A", "long", "time", "ago", "in", "a", "galaxy", "far", "far", "away"]
-    iterable_dataset = CustomDataset(seq_data)
-
-    dataloader = DataLoader(dataset=iterable_dataset, batch_size=5)
-    return dataloader
-
-
-
# Set val_check_interval
-trainer = Trainer(val_check_interval=100)
-
-# Set limit_val_batches to 0.0 or 0
-trainer = Trainer(limit_val_batches=0.0)
-
-# Set limit_val_batches as an int
-trainer = Trainer(limit_val_batches=100)
-
-
-
-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/guides/speed.html b/docs/guides/speed.html deleted file mode 100644 index a48523c..0000000 --- a/docs/guides/speed.html +++ /dev/null @@ -1,1090 +0,0 @@ - - - - - - - - - - - - - - Speed Up Model Training — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Speed Up Model Training
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Speed Up Model Training

-

When you are limited in resources, it becomes hard to speed up model training and reduce the training time -without affecting the model’s performance. There are multiple ways you can speed up your model’s time to convergence.

-
-

Training on Accelerators

-

Use when: Whenever possible!

-

With Lightning, running on GPUs, TPUs, IPUs on multiple nodes is a simple switch of a flag.

-
-

GPU Training

-

Lightning supports a variety of plugins to speed up distributed GPU training. Most notably:

-
    -
  • DDPStrategy

  • -
  • DDPShardedStrategy

  • -
  • DeepSpeedStrategy

  • -
-
# run on 1 gpu
-trainer = Trainer(accelerator="gpu", devices=1)
-
-# train on 8 GPUs, using the DDP strategy
-trainer = Trainer(accelerator="gpu", devices=8, strategy="ddp")
-
-# train on multiple GPUs across nodes (uses 8 GPUs in total)
-trainer = Trainer(accelerator="gpu", devices=2, num_nodes=4)
-
-
-
-

GPU Training Speedup Tips

-

When training on single or multiple GPU machines, Lightning offers a host of advanced optimizations to improve throughput, memory efficiency, and model scaling. -Refer to Advanced GPU Optimized Training for more details.

-
-
Prefer DDP Over DP
-

DataParallelStrategy performs three GPU transfers for EVERY batch:

-
    -
  1. Copy the model to the device.

  2. -
  3. Copy the data to the device.

  4. -
  5. Copy the outputs of each device back to the main device.

  6. -
-Animation showing DP execution. -
-

-
-

Whereas DDPStrategy only performs two transfer operations, making DDP much faster than DP:

-
    -
  1. Moving data to the device.

  2. -
  3. Transfer and sync gradients.

  4. -
-Animation showing DDP execution. -
-

-
-

For more details on how to tune performance with DDP, please see the DDP Optimizations section.

-
-
-
DataLoaders
-

When building your DataLoader set num_workers>0 and pin_memory=True (only for GPUs).

-
-DataLoader(dataset, num_workers=8, pin_memory=True)
-
-
-
-
-
num_workers
-

The question of how many workers to specify in num_workers is tricky. Here’s a summary of some references, and our suggestions:

-
    -
  1. num_workers=0 means ONLY the main process will load batches (that can be a bottleneck).

  2. -
  3. num_workers=1 means ONLY one worker (just not the main process) will load data, but it will still be slow.

  4. -
  5. The performance of high num_workers depends on the batch size and your machine.

  6. -
  7. A general place to start is to set num_workers equal to the number of CPU cores on that machine. You can get the number of CPU cores in python using os.cpu_count(), but note that depending on your batch size, you may overflow RAM memory.

  8. -
-
-

Warning

-

Increasing num_workers will ALSO increase your CPU memory consumption.

-
-

The best thing to do is to increase the num_workers slowly and stop once there is no more improvement in your training speed.

-

For debugging purposes or for dataloaders that load very small datasets, it is desirable to set num_workers=0. However, this will always log a warning for every dataloader with num_workers <= min(2, os.cpu_count()). In such cases, you can specifically filter this warning by using:

-
import warnings
-
-warnings.filterwarnings("ignore", ".*Consider increasing the value of the `num_workers` argument*")
-
-# or to ignore all warnings that could be false positives
-from pytorch_lightning.utilities.warnings import PossibleUserWarning
-
-warnings.filterwarnings("ignore", category=PossibleUserWarning)
-
-
-
-
-
Spawn
-

When using strategy="ddp_spawn" or training on TPUs, the way multiple GPUs/TPU cores are used is by calling torch.multiprocessing -.spawn() under the hood. The problem is that PyTorch has issues with num_workers>0 when using .spawn(). For this reason, we recommend you -use strategy="ddp" so you can increase the num_workers, however since DDP doesn’t work in an interactive environment like IPython/Jupyter notebooks -your script has to be callable like so:

-
python my_program.py
-
-
-

However, using strategy="ddp_spawn" makes it possible to reduce memory usage with In-Memory Dataset and shared memory tensors. For more info, check out the -Sharing Datasets Across Process Boundaries section.

-
-
-
Persistent Workers
-

When using strategy="ddp_spawn" and num_workers>0, consider setting persistent_workers=True inside your DataLoader, since otherwise it can result in data-loading bottlenecks and slowdowns. -This is a limitation of Python .spawn() and PyTorch.

-
-
-
-
-

TPU Training

-

You can set the devices trainer argument to 1 (a single core), [7] (a specific core), or 8 (eight cores).

-
# train on 1 TPU core
-trainer = Trainer(accelerator="tpu", devices=1)
-
-# train on 7th TPU core
-trainer = Trainer(accelerator="tpu", devices=[7])
-
-# train on 8 TPU cores
-trainer = Trainer(accelerator="tpu", devices=8)
-
-
-

To train on more than eight cores (a POD), -submit this script using the xla_dist script.

-

Example:

-
python -m torch_xla.distributed.xla_dist
---tpu=$TPU_POD_NAME
---conda-env=torch-xla-nightly
---env=XLA_USE_BF16=1
--- python your_trainer_file.py
-
-
-

Read more in our Speed Up Model Training and Plugins guides.

-
-
-
-
-

Early Stopping

-

Usually, long training epochs can lead to either overfitting or no major improvements in your metrics due to limited convergence. -Here the EarlyStopping callback can help you stop the training entirely by monitoring a metric of your choice.

-

You can read more about it here.

-
-
-
-

Mixed Precision (16-bit) Training

-

Lower precision, such as the 16-bit floating-point, enables the training and deployment of large neural networks since they require less memory, enhance data transfer operations since they require -less memory bandwidth and run math operations much faster on GPUs that support Tensor Core.

-

Use when:

-
    -
  • You want to optimize for memory usage on a GPU.

  • -
  • You have a GPU that supports 16-bit precision (NVIDIA pascal architecture or newer).

  • -
  • Your optimization algorithm (training_step) is numerically stable.

  • -
  • You want to be the cool person in the lab :p

  • -
-
-

-
-

Mixed precision combines the use of both 32 and 16-bit floating points to reduce memory footprint during model training, resulting in improved performance, achieving up to +3X speedups on modern GPUs.

-

Lightning offers mixed precision training for GPUs and CPUs, as well as bfloat16 mixed precision training for TPUs.

-
# 16-bit precision
-trainer = Trainer(precision=16, accelerator="gpu", devices=4)
-
-
-

Read more about mixed-precision training.

-
-
-
-

Control Training Epochs

-

Use when: You run a hyperparameter search to find good initial parameters and want to save time, cost (money), or power (environment). -It can allow you to be more cost efficient and also run more experiments at the same time.

-

You can use Trainer flags to force training for a minimum number of epochs or limit it to a max number of epochs. Use the min_epochs and max_epochs Trainer flags to set the number of epochs to run. -Setting min_epochs=N makes sure that the training will run for at least N epochs. Setting max_epochs=N will ensure that training won’t happen after -N epochs.

-
# DEFAULT
-trainer = Trainer(min_epochs=1, max_epochs=1000)
-
-
-

If running iteration based training, i.e., infinite / iterable DataLoader, you can also control the number of steps with the min_steps and max_steps flags:

-
trainer = Trainer(max_steps=1000)
-
-trainer = Trainer(min_steps=100)
-
-
-

You can also interrupt training based on training time:

-
# Stop after 12 hours of training or when reaching 10 epochs (string)
-trainer = Trainer(max_time="00:12:00:00", max_epochs=10)
-
-# Stop after 1 day and 5 hours (dict)
-trainer = Trainer(max_time={"days": 1, "hours": 5})
-
-
-

Learn more in our Trainer flags guide.

-
-
-
-

Control Validation Frequency

-
-

Check Validation Every n Epochs

-

Use when: You have a small dataset and want to run fewer validation checks.

-

You can limit validation check to only run every n epochs using the check_val_every_n_epoch Trainer flag.

-
# default
-trainer = Trainer(check_val_every_n_epoch=1)
-
-# runs validation after every 7th Epoch
-trainer = Trainer(check_val_every_n_epoch=7)
-
-
-
-
-

Validation Within Training Epoch

-

Use when: You have a large training dataset and want to run mid-epoch validation checks.

-

For large datasets, it’s often desirable to check validation multiple times within a training epoch. -Pass in a float to check that often within one training epoch. Pass in an int K to check every K training batch. -Must use an int if using an IterableDataset.

-
# default
-trainer = Trainer(val_check_interval=1.0)
-
-# check every 1/4 th of an epoch
-trainer = Trainer(val_check_interval=0.25)
-
-# check every 100 train batches (ie: for IterableDatasets or fixed frequency)
-trainer = Trainer(val_check_interval=100)
-
-
-

Learn more in our Trainer flags guide.

-
-
-
-
-

Preload Data Into RAM

-

Use when: You need access to all samples in a dataset at once.

-

When your training or preprocessing requires many operations to be performed on entire dataset(s), it can -sometimes be beneficial to store all data in RAM given there is enough space. -However, loading all data at the beginning of the training script has the disadvantage that it can take a long -time, and hence, it slows down the development process. Another downside is that in multiprocessing (e.g., DDP) -the data would get copied in each process. -One can overcome these problems by copying the data into RAM in advance. -Most UNIX-based operating systems provide direct access to tmpfs through a mount point typically named /dev/shm.

-

Increase shared memory if necessary. Refer to the documentation of your OS on how to do this.

-
    -
  1. Copy training data to shared memory:

    -
    cp -r /path/to/data/on/disk /dev/shm/
    -
    -
    -
  2. -
  3. Refer to the new data root in your script or command-line arguments:

    -
    datamodule = MyDataModule(data_root="/dev/shm/my_data")
    -
    -
    -
  4. -
-
-
-
-

Model Toggling

-

Use when: Performing gradient accumulation with multiple optimizers in a -distributed setting.

-

Here is an explanation of what it does:

-
    -
  • Considering the current optimizer as A and all other optimizers as B.

  • -
  • Toggling, which means all parameters from B exclusive to A will have their requires_grad attribute set to False.

  • -
  • Restoring their original state when exiting the context manager.

  • -
-

When performing gradient accumulation, there is no need to perform grad synchronization during the accumulation phase. -Setting sync_grad to False will block this synchronization and improve your training speed.

-

LightningOptimizer provides a -toggle_model() function as a -contextlib.contextmanager() for advanced users.

-

Here is an example of an advanced use case:

-
# Scenario for a GAN with gradient accumulation every two batches and optimized for multiple GPUs.
-class SimpleGAN(LightningModule):
-    def __init__(self):
-        super().__init__()
-        self.automatic_optimization = False
-
-    def training_step(self, batch, batch_idx):
-        # Implementation follows the PyTorch tutorial:
-        # https://pytorch.org/tutorials/beginner/dcgan_faces_tutorial.html
-        g_opt, d_opt = self.optimizers()
-
-        X, _ = batch
-        X.requires_grad = True
-        batch_size = X.shape[0]
-
-        real_label = torch.ones((batch_size, 1), device=self.device)
-        fake_label = torch.zeros((batch_size, 1), device=self.device)
-
-        # Sync and clear gradients
-        # at the end of accumulation or
-        # at the end of an epoch.
-        is_last_batch_to_accumulate = (batch_idx + 1) % 2 == 0 or self.trainer.is_last_batch
-
-        g_X = self.sample_G(batch_size)
-
-        ##########################
-        # Optimize Discriminator #
-        ##########################
-        with d_opt.toggle_model(sync_grad=is_last_batch_to_accumulate):
-            d_x = self.D(X)
-            errD_real = self.criterion(d_x, real_label)
-
-            d_z = self.D(g_X.detach())
-            errD_fake = self.criterion(d_z, fake_label)
-
-            errD = errD_real + errD_fake
-
-            self.manual_backward(errD)
-            if is_last_batch_to_accumulate:
-                d_opt.step()
-                d_opt.zero_grad()
-
-        ######################
-        # Optimize Generator #
-        ######################
-        with g_opt.toggle_model(sync_grad=is_last_batch_to_accumulate):
-            d_z = self.D(g_X)
-            errG = self.criterion(d_z, real_label)
-
-            self.manual_backward(errG)
-            if is_last_batch_to_accumulate:
-                g_opt.step()
-                g_opt.zero_grad()
-
-        self.log_dict({"g_loss": errG, "d_loss": errD}, prog_bar=True)
-
-
-
-
-
-

Set Grads to None

-

In order to improve performance, you can override optimizer_zero_grad().

-

For a more detailed explanation of the pros / cons of this technique, -read the documentation for zero_grad() by the PyTorch team.

-
class Model(LightningModule):
-    def optimizer_zero_grad(self, epoch, batch_idx, optimizer, optimizer_idx):
-        optimizer.zero_grad(set_to_none=True)
-
-
-
-
-
-

Things to Avoid

-
-

.item(), .numpy(), .cpu()

-

Don’t call .item() anywhere in your code. Use .detach() instead to remove the connected graph calls. Lightning -takes a great deal of care to be optimized for this.

-
-
-

Clear Cache

-

Don’t call torch.cuda.empty_cache() unnecessarily! Every time you call this, ALL your GPUs have to wait to sync.

-
-
-

Transferring Tensors to Device

-

LightningModules know what device they are on! Construct tensors on the device directly to avoid CPU->Device transfer.

-
# bad
-t = torch.rand(2, 2).cuda()
-
-# good (self is LightningModule)
-t = torch.rand(2, 2, device=self.device)
-
-
-

For tensors that need to be model attributes, it is best practice to register them as buffers in the module’s -__init__ method:

-
# bad
-self.t = torch.rand(2, 2, device=self.device)
-
-# good
-self.register_buffer("t", torch.rand(2, 2))
-
-
-
-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/index.html b/docs/index.html deleted file mode 100644 index f3c9f7a..0000000 --- a/docs/index.html +++ /dev/null @@ -1,946 +0,0 @@ - - - - - - - - - - - - - - ⚡ PyTorch Lightning에 오신 것을 환영합니다! — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • ⚡ PyTorch Lightning에 오신 것을 환영합니다!
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

⚡ PyTorch Lightning에 오신 것을 환영합니다!

-

-
Animation showing how to convert a standard training loop to a Lightning loop
-

PyTorch Lightning(파이토치 라이트닝)은 대규모에서 성능을 포기하지 않으면서 최대한의 유연성을 필요로 하는 전문적인 AI 연구자들과 머신러닝 엔지니어들을 위한 딥러닝 프레임워크입니다. -Lightning(라이트닝)은 프로젝트가 생각으로부터 문서 / 제품화에 이르는 동안 함께 발전합니다.

-
-

-
-

Lightning 설치하기

-
-

Pip 사용자라면,

-
pip install pytorch-lightning
-
-
-
-

Conda 사용자라면,

-
conda install pytorch-lightning -c conda-forge
-
-
-
-

또는 advanced install guide 참조하세요.

-
-
-

처음이신가요?

-
-
-

이미 Lightning 사용자라면?

-
- - - - - -
-
-

색인 및 검색

- -
-
- - -
- -
-
- - - - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/levels/advanced.html b/docs/levels/advanced.html deleted file mode 100644 index 3842804..0000000 --- a/docs/levels/advanced.html +++ /dev/null @@ -1,796 +0,0 @@ - - - - - - - - - - - - - - Advanced skills — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/levels/advanced_level_15.html b/docs/levels/advanced_level_15.html deleted file mode 100644 index 10c6e31..0000000 --- a/docs/levels/advanced_level_15.html +++ /dev/null @@ -1,712 +0,0 @@ - - - - - - - - - - - - - - Level 15: Customize configs to run in production — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Level 15: Customize configs to run in production
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
- - -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/levels/advanced_level_16.html b/docs/levels/advanced_level_16.html deleted file mode 100644 index 18abbab..0000000 --- a/docs/levels/advanced_level_16.html +++ /dev/null @@ -1,712 +0,0 @@ - - - - - - - - - - - - - - Level 16: Customize the trainer — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Level 16: Customize the trainer
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
- - -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/levels/advanced_level_17.html b/docs/levels/advanced_level_17.html deleted file mode 100644 index b51ba7f..0000000 --- a/docs/levels/advanced_level_17.html +++ /dev/null @@ -1,722 +0,0 @@ - - - - - - - - - - - - - - Level 17: Own the training loop — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Level 17: Own the training loop
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Level 17: Own the training loop

-

Learn all the ways of owning your raw PyTorch loops with Lightning.

-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/levels/advanced_level_18.html b/docs/levels/advanced_level_18.html deleted file mode 100644 index 1653dac..0000000 --- a/docs/levels/advanced_level_18.html +++ /dev/null @@ -1,712 +0,0 @@ - - - - - - - - - - - - - - Level 18: Enable advanced checkpointing — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Level 18: Enable advanced checkpointing
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
- - -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/levels/advanced_level_19.html b/docs/levels/advanced_level_19.html deleted file mode 100644 index 616430b..0000000 --- a/docs/levels/advanced_level_19.html +++ /dev/null @@ -1,722 +0,0 @@ - - - - - - - - - - - - - - Level 19: Explore IPUs — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Level 19: Explore IPUs
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
- - -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- -
-
- -
-
-
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/levels/advanced_level_20.html b/docs/levels/advanced_level_20.html deleted file mode 100644 index 851524a..0000000 --- a/docs/levels/advanced_level_20.html +++ /dev/null @@ -1,712 +0,0 @@ - - - - - - - - - - - - - - Level 19: Explore HPUs — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Level 19: Explore HPUs
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
- - -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- -
-
- -
-
-
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/levels/advanced_level_21.html b/docs/levels/advanced_level_21.html deleted file mode 100644 index 7c04b94..0000000 --- a/docs/levels/advanced_level_21.html +++ /dev/null @@ -1,722 +0,0 @@ - - - - - - - - - - - - - - Level 21: Master TPUs — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Level 21: Master TPUs
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
- - -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- -
-
- -
-
-
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/levels/advanced_level_22.html b/docs/levels/advanced_level_22.html deleted file mode 100644 index 7d373d5..0000000 --- a/docs/levels/advanced_level_22.html +++ /dev/null @@ -1,712 +0,0 @@ - - - - - - - - - - - - - - Level 22: Reach 1 trillion parameters on GPUs — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Level 22: Reach 1 trillion parameters on GPUs
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
- - -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/levels/basic_level_2.html b/docs/levels/basic_level_2.html deleted file mode 100644 index dca840d..0000000 --- a/docs/levels/basic_level_2.html +++ /dev/null @@ -1,720 +0,0 @@ - - - - - - - - - - - - - - Level 2: Add a validation and test set — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Level 2: Add a validation and test set
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
- - -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/levels/basic_level_5.html b/docs/levels/basic_level_5.html deleted file mode 100644 index 98244bd..0000000 --- a/docs/levels/basic_level_5.html +++ /dev/null @@ -1,720 +0,0 @@ - - - - - - - - - - - - - - Level 5: Debug, visualize and find performance bottlenecks — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Level 5: Debug, visualize and find performance bottlenecks
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
- - -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/levels/core_level_3.html b/docs/levels/core_level_3.html deleted file mode 100644 index fb1870d..0000000 --- a/docs/levels/core_level_3.html +++ /dev/null @@ -1,710 +0,0 @@ - - - - - - - - - - - - - - Level 3: Visualize training progress — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Level 3: Visualize training progress
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
- - -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/levels/core_level_6.html b/docs/levels/core_level_6.html deleted file mode 100644 index 231c0cf..0000000 --- a/docs/levels/core_level_6.html +++ /dev/null @@ -1,720 +0,0 @@ - - - - - - - - - - - - - - Level 6: Predict with your model — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Level 6: Predict with your model
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
- - -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/levels/core_skills.html b/docs/levels/core_skills.html deleted file mode 100644 index 47ba28c..0000000 --- a/docs/levels/core_skills.html +++ /dev/null @@ -1,776 +0,0 @@ - - - - - - - - - - - - - - Basic skills — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- - - - -
-
- -
- Shortcuts -
-
- -
- - -
-
-
- - -
-
-
-
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/levels/expert.html b/docs/levels/expert.html deleted file mode 100644 index e040593..0000000 --- a/docs/levels/expert.html +++ /dev/null @@ -1,766 +0,0 @@ - - - - - - - - - - - - - - Expert skills — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- - - - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Expert skills

-

Customize and extend Lightning for things like custom hardware or distributed strategies.

-

-
-
- - -
- -
-
- - - - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- -
-
-
- - -
-
-
-
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/levels/expert_level_23.html b/docs/levels/expert_level_23.html deleted file mode 100644 index 539eb93..0000000 --- a/docs/levels/expert_level_23.html +++ /dev/null @@ -1,712 +0,0 @@ - - - - - - - - - - - - - - Level 23: Extend the Lightning CLI — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Level 23: Extend the Lightning CLI
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
- - -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/levels/expert_level_24.html b/docs/levels/expert_level_24.html deleted file mode 100644 index 0b70438..0000000 --- a/docs/levels/expert_level_24.html +++ /dev/null @@ -1,712 +0,0 @@ - - - - - - - - - - - - - - Level 24: Integrate a custom cluster — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Level 24: Integrate a custom cluster
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
- - -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/levels/expert_level_27.html b/docs/levels/expert_level_27.html deleted file mode 100644 index b2b3110..0000000 --- a/docs/levels/expert_level_27.html +++ /dev/null @@ -1,732 +0,0 @@ - - - - - - - - - - - - - - Level 27: Add a new accelerator or Strategy — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Level 27: Add a new accelerator or Strategy
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Level 27: Add a new accelerator or Strategy

-

Integrate a new accelerator or distributed strategy.

-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/levels/intermediate.html b/docs/levels/intermediate.html deleted file mode 100644 index d7949f9..0000000 --- a/docs/levels/intermediate.html +++ /dev/null @@ -1,796 +0,0 @@ - - - - - - - - - - - - - - Intermediate skills — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Intermediate skills
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
- - -
-
- -
-
-
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/levels/intermediate_level_10.html b/docs/levels/intermediate_level_10.html deleted file mode 100644 index 5f62d2e..0000000 --- a/docs/levels/intermediate_level_10.html +++ /dev/null @@ -1,722 +0,0 @@ - - - - - - - - - - - - - - Level 10: Understand your model — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Level 10: Understand your model
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Level 10: Understand your model

-

Find the best model using advanced visualizations for deeper insights.

-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/levels/intermediate_level_11.html b/docs/levels/intermediate_level_11.html deleted file mode 100644 index dec821e..0000000 --- a/docs/levels/intermediate_level_11.html +++ /dev/null @@ -1,712 +0,0 @@ - - - - - - - - - - - - - - Level 11: Explore SOTA scaling techniques — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Level 11: Explore SOTA scaling techniques
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
- - -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/levels/intermediate_level_12.html b/docs/levels/intermediate_level_12.html deleted file mode 100644 index aedeadd..0000000 --- a/docs/levels/intermediate_level_12.html +++ /dev/null @@ -1,722 +0,0 @@ - - - - - - - - - - - - - - Level 12: Deploy your models — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Level 12: Deploy your models
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Level 12: Deploy your models

-

In this level you’ll learn a few options for deploying models into production.

-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- -
- -
-
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/levels/intermediate_level_13.html b/docs/levels/intermediate_level_13.html deleted file mode 100644 index d124a7e..0000000 --- a/docs/levels/intermediate_level_13.html +++ /dev/null @@ -1,722 +0,0 @@ - - - - - - - - - - - - - - Level 13: Optimize training speed — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Level 13: Optimize training speed
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Level 13: Optimize training speed

-

In this level you’ll use advanced profilers and mixed precision techniques to train bigger models faster.

-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/levels/intermediate_level_14.html b/docs/levels/intermediate_level_14.html deleted file mode 100644 index 4fcbe45..0000000 --- a/docs/levels/intermediate_level_14.html +++ /dev/null @@ -1,722 +0,0 @@ - - - - - - - - - - - - - - Level 14: Run on on-prem clusters — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Level 14: Run on on-prem clusters
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
- - -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/levels/intermediate_level_7.html b/docs/levels/intermediate_level_7.html deleted file mode 100644 index 00c7344..0000000 --- a/docs/levels/intermediate_level_7.html +++ /dev/null @@ -1,732 +0,0 @@ - - - - - - - - - - - - - - Level 7: Interactive cloud development — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Level 7: Interactive cloud development
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Level 7: Interactive cloud development

-

Learn to develop models on cloud GPUs and TPUs.

-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/levels/intermediate_level_8.html b/docs/levels/intermediate_level_8.html deleted file mode 100644 index b4f7af8..0000000 --- a/docs/levels/intermediate_level_8.html +++ /dev/null @@ -1,732 +0,0 @@ - - - - - - - - - - - - - - Level 8: Run models on the cloud — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Level 8: Run models on the cloud
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Level 8: Run models on the cloud

-

Learn to run models on the cloud in the background asynchronously.

-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/levels/intermediate_level_9.html b/docs/levels/intermediate_level_9.html deleted file mode 100644 index cd7e491..0000000 --- a/docs/levels/intermediate_level_9.html +++ /dev/null @@ -1,722 +0,0 @@ - - - - - - - - - - - - - - Level 9: Modularize your projects — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Level 9: Modularize your projects
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Level 9: Modularize your projects

-

This module teaches you how to set up complex projects that can be controlled via the CLI.

-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/links.html b/docs/links.html deleted file mode 100644 index e5b6b99..0000000 --- a/docs/links.html +++ /dev/null @@ -1,684 +0,0 @@ - - - - - - - - - - - - - - <no title> — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- - - - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- - - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- -
-
-
-
    -
- -
-
-
-
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/model/build_model.html b/docs/model/build_model.html deleted file mode 100644 index bfff626..0000000 --- a/docs/model/build_model.html +++ /dev/null @@ -1,751 +0,0 @@ - - - - - - - - - - - - - - Build a Model — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- - - - -
-
- -
- Shortcuts -
-
- -
- - -
-
-
- - -
-
-
-
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/model/build_model_advanced.html b/docs/model/build_model_advanced.html deleted file mode 100644 index a308c90..0000000 --- a/docs/model/build_model_advanced.html +++ /dev/null @@ -1,983 +0,0 @@ - - - - - - - - - - - - - - Own your loop (advanced) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Own your loop (advanced)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Own your loop (advanced)

-
-

Customize training loop

-Injecting custom code in a training loop -

Inject custom code anywhere in the Training loop using any of the 20+ methods (Hooks) available in the LightningModule.

-
class LitModel(pl.LightningModule):
-    def backward(self, loss, optimizer, optimizer_idx):
-        loss.backward()
-
-
-
-
-
-

Manual Optimization

-

For advanced research topics like reinforcement learning, sparse coding, or GAN research, it may be desirable to -manually manage the optimization process.

-

This is only recommended for experts who need ultimate flexibility. -Lightning will handle only accelerator, precision and strategy logic. -The users are left with optimizer.zero_grad(), gradient accumulation, model toggling, etc.

-

To manually optimize, do the following:

-
    -
  • Set self.automatic_optimization=False in your LightningModule’s __init__.

  • -
  • Use the following functions and call them manually:

    -
      -
    • self.optimizers() to access your optimizers (one or multiple)

    • -
    • optimizer.zero_grad() to clear the gradients from the previous training step

    • -
    • self.manual_backward(loss) instead of loss.backward()

    • -
    • optimizer.step() to update your model parameters

    • -
    -
  • -
-

Here is a minimal example of manual optimization.

-
from pytorch_lightning import LightningModule
-
-
-class MyModel(LightningModule):
-    def __init__(self):
-        super().__init__()
-        # Important: This property activates manual optimization.
-        self.automatic_optimization = False
-
-    def training_step(self, batch, batch_idx):
-        opt = self.optimizers()
-        opt.zero_grad()
-        loss = self.compute_loss(batch)
-        self.manual_backward(loss)
-        opt.step()
-
-
-
-

Warning

-

Before 1.2, optimizer.step() was calling optimizer.zero_grad() internally. -From 1.2, it is left to the user’s expertise.

-
-
-

Tip

-

Be careful where you call optimizer.zero_grad(), or your model won’t converge. -It is good practice to call optimizer.zero_grad() before self.manual_backward(loss).

-
-
-

Access your Own Optimizer

-

The provided optimizer is a LightningOptimizer object wrapping your own optimizer -configured in your configure_optimizers(). You can access your own optimizer -with optimizer.optimizer. However, if you use your own optimizer to perform a step, Lightning won’t be able to -support accelerators, precision and profiling for you.

-
class Model(LightningModule):
-    def __init__(self):
-        super().__init__()
-        self.automatic_optimization = False
-        ...
-
-    def training_step(self, batch, batch_idx):
-        optimizer = self.optimizers()
-
-        # `optimizer` is a `LightningOptimizer` wrapping the optimizer.
-        # To access it, do the following.
-        # However, it won't work on TPU, AMP, etc...
-        optimizer = optimizer.optimizer
-        ...
-
-
-
-
-

Gradient Accumulation

-

You can accumulate gradients over batches similarly to accumulate_grad_batches argument in -Trainer for automatic optimization. To perform gradient accumulation with one optimizer -after every N steps, you can do as such.

-
def __init__(self):
-    super().__init__()
-    self.automatic_optimization = False
-
-
-def training_step(self, batch, batch_idx):
-    opt = self.optimizers()
-
-    loss = self.compute_loss(batch)
-    self.manual_backward(loss)
-
-    # accumulate gradients of N batches
-    if (batch_idx + 1) % N == 0:
-        opt.step()
-        opt.zero_grad()
-
-
-
-
-

Use Multiple Optimizers (like GANs)

-

Here is an example training a simple GAN with multiple optimizers using manual optimization.

-
import torch
-from torch import Tensor
-from pytorch_lightning import LightningModule
-
-
-class SimpleGAN(LightningModule):
-    def __init__(self):
-        super().__init__()
-        self.G = Generator()
-        self.D = Discriminator()
-
-        # Important: This property activates manual optimization.
-        self.automatic_optimization = False
-
-    def sample_z(self, n) -> Tensor:
-        sample = self._Z.sample((n,))
-        return sample
-
-    def sample_G(self, n) -> Tensor:
-        z = self.sample_z(n)
-        return self.G(z)
-
-    def training_step(self, batch, batch_idx):
-        # Implementation follows the PyTorch tutorial:
-        # https://pytorch.org/tutorials/beginner/dcgan_faces_tutorial.html
-        g_opt, d_opt = self.optimizers()
-
-        X, _ = batch
-        batch_size = X.shape[0]
-
-        real_label = torch.ones((batch_size, 1), device=self.device)
-        fake_label = torch.zeros((batch_size, 1), device=self.device)
-
-        g_X = self.sample_G(batch_size)
-
-        ##########################
-        # Optimize Discriminator #
-        ##########################
-        d_x = self.D(X)
-        errD_real = self.criterion(d_x, real_label)
-
-        d_z = self.D(g_X.detach())
-        errD_fake = self.criterion(d_z, fake_label)
-
-        errD = errD_real + errD_fake
-
-        d_opt.zero_grad()
-        self.manual_backward(errD)
-        d_opt.step()
-
-        ######################
-        # Optimize Generator #
-        ######################
-        d_z = self.D(g_X)
-        errG = self.criterion(d_z, real_label)
-
-        g_opt.zero_grad()
-        self.manual_backward(errG)
-        g_opt.step()
-
-        self.log_dict({"g_loss": errG, "d_loss": errD}, prog_bar=True)
-
-    def configure_optimizers(self):
-        g_opt = torch.optim.Adam(self.G.parameters(), lr=1e-5)
-        d_opt = torch.optim.Adam(self.D.parameters(), lr=1e-5)
-        return g_opt, d_opt
-
-
-
-
-

Learning Rate Scheduling

-

Every optimizer you use can be paired with any -Learning Rate Scheduler. Please see the -documentation of configure_optimizers() for all the available options

-

You can call lr_scheduler.step() at arbitrary intervals. -Use self.lr_schedulers() in your LightningModule to access any learning rate schedulers -defined in your configure_optimizers().

-
-

Warning

-
    -
  • Before v1.3, Lightning automatically called lr_scheduler.step() in both automatic and manual optimization. From -1.3, lr_scheduler.step() is now for the user to call at arbitrary intervals.

  • -
  • Note that the lr_scheduler_config keys, such as "frequency" and "interval", will be ignored even if they are provided in -your configure_optimizers() during manual optimization.

  • -
-
-

Here is an example calling lr_scheduler.step() every step.

-
# step every batch
-def __init__(self):
-    super().__init__()
-    self.automatic_optimization = False
-
-
-def training_step(self, batch, batch_idx):
-    # do forward, backward, and optimization
-    ...
-
-    # single scheduler
-    sch = self.lr_schedulers()
-    sch.step()
-
-    # multiple schedulers
-    sch1, sch2 = self.lr_schedulers()
-    sch1.step()
-    sch2.step()
-
-
-

If you want to call lr_scheduler.step() every N steps/epochs, do the following.

-
def __init__(self):
-    super().__init__()
-    self.automatic_optimization = False
-
-
-def training_step(self, batch, batch_idx):
-    # do forward, backward, and optimization
-    ...
-
-    sch = self.lr_schedulers()
-
-    # step every N batches
-    if (batch_idx + 1) % N == 0:
-        sch.step()
-
-    # step every N epochs
-    if self.trainer.is_last_batch and (self.trainer.current_epoch + 1) % N == 0:
-        sch.step()
-
-
-

If you want to call schedulers that require a metric value after each epoch, consider doing the following:

-
def __init__(self):
-    super().__init__()
-    self.automatic_optimization = False
-
-
-def training_epoch_end(self, outputs):
-    sch = self.lr_schedulers()
-
-    # If the selected scheduler is a ReduceLROnPlateau scheduler.
-    if isinstance(sch, torch.optim.lr_scheduler.ReduceLROnPlateau):
-        sch.step(self.trainer.callback_metrics["loss"])
-
-
-
-
-

Use Closure for LBFGS-like Optimizers

-

It is a good practice to provide the optimizer with a closure function that performs a forward, zero_grad and -backward of your model. It is optional for most optimizers, but makes your code compatible if you switch to an -optimizer which requires a closure, such as LBFGS.

-

See the PyTorch docs for more about the closure.

-

Here is an example using a closure function.

-
def __init__(self):
-    super().__init__()
-    self.automatic_optimization = False
-
-
-def configure_optimizers(self):
-    return torch.optim.LBFGS(...)
-
-
-def training_step(self, batch, batch_idx):
-    opt = self.optimizers()
-
-    def closure():
-        loss = self.compute_loss(batch)
-        opt.zero_grad()
-        self.manual_backward(loss)
-        return loss
-
-    opt.step(closure=closure)
-
-
-
-

Warning

-

The LBFGS optimizer is not supported for apex AMP, native AMP, IPUs, or DeepSpeed.

-
-
-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/model/build_model_expert.html b/docs/model/build_model_expert.html deleted file mode 100644 index 1a1cc9d..0000000 --- a/docs/model/build_model_expert.html +++ /dev/null @@ -1,1355 +0,0 @@ - - - - - - - - - - - - - - Raw PyTorch loop (expert) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Raw PyTorch loop (expert)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Raw PyTorch loop (expert)

-
-
-

LightningLite (Stepping Stone to Lightning)

-

LightningLite enables pure PyTorch users to scale their existing code -on any kind of device while retaining full control over their own loops and optimization logic.

-Animation showing how to convert your PyTorch code to LightningLite. -
-

-
-

LightningLite is the right tool for you if you match one of the two following descriptions:

-
    -
  • I want to quickly scale my existing code to multiple devices with minimal code changes.

  • -
  • I would like to convert my existing code to the Lightning API, but a full path to Lightning transition might be too complex. I am looking for a stepping stone to ensure reproducibility during the transition.

  • -
-
-

Warning

-

LightningLite is currently a beta feature. Its API is subject to change based on your feedback.

-
-
-
-

Learn by example

-
-

My Existing PyTorch Code

-

The run function contains the custom training loop used to train MyModel on MyDataset for num_epochs epochs.

-
import torch
-from torch import nn
-from torch.utils.data import DataLoader, Dataset
-
-
-class MyModel(nn.Module):
-    ...
-
-
-class MyDataset(Dataset):
-    ...
-
-
-def run(args):
-    device = "cuda" if torch.cuda.is_available() else "cpu"
-
-    model = MyModel(...).to(device)
-    optimizer = torch.optim.SGD(model.parameters(), ...)
-
-    dataloader = DataLoader(MyDataset(...), ...)
-
-    model.train()
-    for epoch in range(args.num_epochs):
-        for batch in dataloader:
-            batch = batch.to(device)
-            optimizer.zero_grad()
-            loss = model(batch)
-            loss.backward()
-            optimizer.step()
-
-
-run(args)
-
-
-
-
-
-

Convert to LightningLite

-

Here are five required steps to convert to LightningLite.

-
    -
  1. Subclass LightningLite and override its run() method.

  2. -
  3. Move the body of your existing run function into LightningLite run method.

  4. -
  5. Remove all .to(...), .cuda() etc calls since LightningLite will take care of it.

  6. -
  7. Apply setup() over each model and optimizers pair and setup_dataloaders() on all your dataloaders and replace loss.backward() by self.backward(loss).

  8. -
  9. Instantiate your LightningLite subclass and call its run() method.

  10. -
-
-

-
-
import torch
-from torch import nn
-from torch.utils.data import DataLoader, Dataset
-from pytorch_lightning.lite import LightningLite
-
-
-class MyModel(nn.Module):
-    ...
-
-
-class MyDataset(Dataset):
-    ...
-
-
-class Lite(LightningLite):
-    def run(self, args):
-
-        model = MyModel(...)
-        optimizer = torch.optim.SGD(model.parameters(), ...)
-        model, optimizer = self.setup(model, optimizer)  # Scale your model / optimizers
-
-        dataloader = DataLoader(MyDataset(...), ...)
-        dataloader = self.setup_dataloaders(dataloader)  # Scale your dataloaders
-
-        model.train()
-        for epoch in range(args.num_epochs):
-            for batch in dataloader:
-                optimizer.zero_grad()
-                loss = model(batch)
-                self.backward(loss)  # instead of loss.backward()
-                optimizer.step()
-
-
-Lite(...).run(args)
-
-
-

That’s all. You can now train on any kind of device and scale your training. Check out this full MNIST training example with LightningLite.

-

LightningLite takes care of device management, so you don’t have to. -You should remove any device-specific logic within your code.

-

Here is how to train on eight GPUs with torch.bfloat16 precision:

-
Lite(strategy="ddp", devices=8, accelerator="gpu", precision="bf16").run(10)
-
-
-

Here is how to use DeepSpeed Zero3 with eight GPUs and precision 16:

-
Lite(strategy="deepspeed", devices=8, accelerator="gpu", precision=16).run(10)
-
-
-

LightningLite can also figure it out automatically for you!

-
Lite(devices="auto", accelerator="auto", precision=16).run(10)
-
-
-

You can also easily use distributed collectives if required. -Here is an example while running on 256 GPUs (eight GPUs times 32 nodes).

-
class Lite(LightningLite):
-    def run(self):
-
-        # Transfer and concatenate tensors across processes
-        self.all_gather(...)
-
-        # Transfer an object from one process to all the others
-        self.broadcast(..., src=...)
-
-        # The total number of processes running across all devices and nodes.
-        self.world_size
-
-        # The global index of the current process across all devices and nodes.
-        self.global_rank
-
-        # The index of the current process among the processes running on the local node.
-        self.local_rank
-
-        # The index of the current node.
-        self.node_rank
-
-        # Whether this global rank is rank zero.
-        if self.is_global_zero:
-            # do something on rank 0
-            ...
-
-        # Wait for all processes to enter this call.
-        self.barrier()
-
-
-Lite(strategy="ddp", devices=8, num_nodes=32, accelerator="gpu").run()
-
-
-

If you require custom data or model device placement, you can deactivate -LightningLite automatic placement by doing -self.setup_dataloaders(..., move_to_device=False) for the data and -self.setup(..., move_to_device=False) for the model. -Furthermore, you can access the current device from self.device or -rely on to_device() -utility to move an object to the current device.

-
-

Note

-

We recommend instantiating the models within the run() method as large models would cause an out-of-memory error otherwise.

-
-
-

Tip

-

If you have hundreds or thousands of lines within your run() function -and you are feeling unsure about them, then that is the correct feeling. -In 2019, our LightningModule was getting larger -and we got the same feeling, so we started to organize our code for simplicity, interoperability and standardization. -This is definitely a good sign that you should consider refactoring your code and / or switching to -LightningModule ultimately.

-
-
-
-
-

Distributed Training Pitfalls

-

The LightningLite provides you with the tools to scale your training, -but there are several major challenges ahead of you now:

- ---- - - - - - - - - - - - - - - - - - - - - -

Processes divergence

This happens when processes execute a different section of the code due to different if/else conditions, race conditions on existing files and so on, resulting in hanging.

Cross processes reduction

Miscalculated metrics or gradients due to errors in their reduction.

Large sharded models

Instantiation, materialization and state management of large models.

Rank 0 only actions

Logging, profiling, and so on.

Checkpointing / Early stopping / Callbacks / Logging

Ability to customize your training behavior easily and make it stateful.

Fault-tolerant training

Ability to resume from a failure as if it never happened.

-

If you are facing one of those challenges, then you are already meeting the limit of LightningLite. -We recommend that you convert to Lightning, so you never have to worry about those.

-
-
-
-

Convert to Lightning

-

LightningLite is a stepping stone to transition fully to the Lightning API and benefit -from its hundreds of features.

-

You can see our LightningLite class as a -future LightningModule, and slowly refactor your code into its API. -Below, the training_step(), forward(), -configure_optimizers(), train_dataloader() methods -are implemented.

-
class Lite(LightningLite):
-
-    # 1. This would become the LightningModule `__init__` function.
-    def run(self, args):
-        self.args = args
-
-        self.model = MyModel(...)
-
-        self.fit()  # This would be automated by the Lightning Trainer.
-
-    # 2. This can be fully removed as Lightning creates its own fitting loop,
-    # and sets up the model, optimizer, dataloader, etc for you.
-    def fit(self):
-        # setup everything
-        optimizer = self.configure_optimizers()
-        self.model, optimizer = self.setup(self.model, optimizer)
-        dataloader = self.setup_dataloaders(self.train_dataloader())
-
-        # start fitting
-        self.model.train()
-        for epoch in range(num_epochs):
-            for batch_idx, batch in enumerate(dataloader):
-                optimizer.zero_grad()
-                loss = self.training_step(batch, batch_idx)
-                self.backward(loss)
-                optimizer.step()
-
-    # 3. This stays here as it belongs to the LightningModule.
-    def forward(self, x):
-        return self.model(x)
-
-    def training_step(self, batch, batch_idx):
-        return self.forward(batch)
-
-    def configure_optimizers(self):
-        return torch.optim.SGD(self.model.parameters(), ...)
-
-    # 4. [Optionally] This can stay here or be extracted to the LightningDataModule to enable higher composability.
-    def train_dataloader(self):
-        return DataLoader(MyDataset(...), ...)
-
-
-Lite(...).run(args)
-
-
-

Finally, change the run() into a -__init__() and drop the fit call from inside.

-
from pytorch_lightning import LightningDataModule, LightningModule, Trainer
-
-
-class LightningModel(LightningModule):
-    def __init__(self, args):
-        super().__init__()
-        self.model = MyModel(...)
-
-    def forward(self, x):
-        return self.model(x)
-
-    def training_step(self, batch, batch_idx):
-        loss = self(batch)
-        self.log("train_loss", loss)
-        return loss
-
-    def configure_optimizers(self):
-        return torch.optim.SGD(self.model.parameters(), lr=0.001)
-
-
-class BoringDataModule(LightningDataModule):
-    def train_dataloader(self):
-        return DataLoader(MyDataset(...), ...)
-
-
-trainer = Trainer(max_epochs=10)
-trainer.fit(LightningModel(), datamodule=BoringDataModule())
-
-
-

You have successfully converted to PyTorch Lightning, and can now benefit from its hundreds of features!

-
-
-
-
-

Lightning Lite Flags

-

Lite is specialized in accelerated distributed training and inference. It offers you convenient ways to configure -your device and communication strategy and to switch seamlessly from one to the other. The terminology and usage are -identical to Lightning, which means minimum effort for you to convert when you decide to do so.

-
-

accelerator

-

Choose one of "cpu", "gpu", "tpu", "auto" (IPU support is coming soon).

-
# CPU accelerator
-lite = Lite(accelerator="cpu")
-
-# Running with GPU Accelerator using 2 GPUs
-lite = Lite(devices=2, accelerator="gpu")
-
-# Running with TPU Accelerator using 8 tpu cores
-lite = Lite(devices=8, accelerator="tpu")
-
-# Running with GPU Accelerator using the DistributedDataParallel strategy
-lite = Lite(devices=4, accelerator="gpu", strategy="ddp")
-
-
-

The "auto" option recognizes the machine you are on and selects the available accelerator.

-
# If your machine has GPUs, it will use the GPU Accelerator
-lite = Lite(devices=2, accelerator="auto")
-
-
-
-
-

strategy

-

Choose a training strategy: "dp", "ddp", "ddp_spawn", "tpu_spawn", "deepspeed", "ddp_sharded", or "ddp_sharded_spawn".

-
# Running with the DistributedDataParallel strategy on 4 GPUs
-lite = Lite(strategy="ddp", accelerator="gpu", devices=4)
-
-# Running with the DDP Spawn strategy using 4 cpu processes
-lite = Lite(strategy="ddp_spawn", accelerator="cpu", devices=4)
-
-
-

Additionally, you can pass in your custom strategy by configuring additional parameters.

-
from pytorch_lightning.strategies import DeepSpeedStrategy
-
-lite = Lite(strategy=DeepSpeedStrategy(stage=2), accelerator="gpu", devices=2)
-
-
-

Support for Horovod and Fully Sharded training strategies is coming soon.

-
-
-

devices

-

Configure the devices to run on. Can be of type:

-
    -
  • int: the number of devices (e.g., GPUs) to train on

  • -
  • list of int: which device index (e.g., GPU ID) to train on (0-indexed)

  • -
  • str: a string representation of one of the above

  • -
-
# default used by Lite, i.e., use the CPU
-lite = Lite(devices=None)
-
-# equivalent
-lite = Lite(devices=0)
-
-# int: run on two GPUs
-lite = Lite(devices=2, accelerator="gpu")
-
-# list: run on GPUs 1, 4 (by bus ordering)
-lite = Lite(devices=[1, 4], accelerator="gpu")
-lite = Lite(devices="1, 4", accelerator="gpu")  # equivalent
-
-# -1: run on all GPUs
-lite = Lite(devices=-1, accelerator="gpu")
-lite = Lite(devices="-1", accelerator="gpu")  # equivalent
-
-
-
-
-

gpus

-
-

Warning

-

gpus=x has been deprecated in v1.7 and will be removed in v2.0. -Please use accelerator='gpu' and devices=x instead.

-
-

Shorthand for setting devices=X and accelerator="gpu".

-
# Run on two GPUs
-lite = Lite(accelerator="gpu", devices=2)
-
-# Equivalent
-lite = Lite(devices=2, accelerator="gpu")
-
-
-
-
-

tpu_cores

-
-

Warning

-

tpu_cores=x has been deprecated in v1.7 and will be removed in v2.0. -Please use accelerator='tpu' and devices=x instead.

-
-

Shorthand for devices=X and accelerator="tpu".

-
# Run on eight TPUs
-lite = Lite(accelerator="tpu", devices=8)
-
-# Equivalent
-lite = Lite(devices=8, accelerator="tpu")
-
-
-
-
-

num_nodes

-

Number of cluster nodes for distributed operation.

-
# Default used by Lite
-lite = Lite(num_nodes=1)
-
-# Run on 8 nodes
-lite = Lite(num_nodes=8)
-
-
-

Learn more about distributed multi-node training on clusters here.

-
-
-

precision

-

Lightning Lite supports double precision (64), full precision (32), or half precision (16) operation (including bfloat16). -Half precision, or mixed precision, is the combined use of 32 and 16-bit floating points to reduce the memory footprint during model training. -This can result in improved performance, achieving significant speedups on modern GPUs.

-
# Default used by the Lite
-lite = Lite(precision=32, devices=1)
-
-# 16-bit (mixed) precision
-lite = Lite(precision=16, devices=1)
-
-# 16-bit bfloat precision
-lite = Lite(precision="bf16", devices=1)
-
-# 64-bit (double) precision
-lite = Lite(precision=64, devices=1)
-
-
-
-
-

plugins

-

Plugins allow you to connect arbitrary backends, precision libraries, clusters, etc. -To define your own behavior, subclass the relevant class and pass it in. Here’s an example linking up your own -ClusterEnvironment.

-
from pytorch_lightning.plugins.environments import ClusterEnvironment
-
-
-class MyCluster(ClusterEnvironment):
-    @property
-    def main_address(self):
-        return your_main_address
-
-    @property
-    def main_port(self):
-        return your_main_port
-
-    def world_size(self):
-        return the_world_size
-
-
-lite = Lite(plugins=[MyCluster()], ...)
-
-
-
-
-
-
-

Lightning Lite Methods

-
-

run

-

The run method serves two purposes:

-
    -
  1. Override this method from the LightningLite class and put your -training (or inference) code inside.

  2. -
  3. Launch the training procedure by calling the run method. Lite will take care of setting up the distributed backend.

  4. -
-

You can optionally pass arguments to the run method. For example, the hyperparameters or a backbone for the model.

-
from pytorch_lightning.lite import LightningLite
-
-
-class Lite(LightningLite):
-
-    # Input arguments are optional; put whatever you need
-    def run(self, learning_rate, num_layers):
-        """Here goes your training loop"""
-
-
-lite = Lite(accelerator="gpu", devices=2)
-lite.run(learning_rate=0.01, num_layers=12)
-
-
-
-
-

setup

-

Set up a model and corresponding optimizer(s). If you need to set up multiple models, call setup() on each of them. -Moves the model and optimizer to the correct device automatically.

-
model = nn.Linear(32, 64)
-optimizer = torch.optim.SGD(model.parameters(), lr=0.001)
-
-# Set up model and optimizer for accelerated training
-model, optimizer = self.setup(model, optimizer)
-
-# If you don't want Lite to set the device
-model, optimizer = self.setup(model, optimizer, move_to_device=False)
-
-
-

The setup method also prepares the model for the selected precision choice so that operations during forward() get -cast automatically.

-
-
-

setup_dataloaders

-

Set up one or multiple dataloaders for accelerated operation. If you are running a distributed strategy (e.g., DDP), Lite -replaces the sampler automatically for you. In addition, the dataloader will be configured to move the returned -data tensors to the correct device automatically.

-
train_data = torch.utils.DataLoader(train_dataset, ...)
-test_data = torch.utils.DataLoader(test_dataset, ...)
-
-train_data, test_data = self.setup_dataloaders(train_data, test_data)
-
-# If you don't want Lite to move the data to the device
-train_data, test_data = self.setup_dataloaders(train_data, test_data, move_to_device=False)
-
-# If you don't want Lite to replace the sampler in the context of distributed training
-train_data, test_data = self.setup_dataloaders(train_data, test_data, replace_sampler=False)
-
-
-
-
-

backward

-

This replaces any occurrences of loss.backward() and makes your code accelerator and precision agnostic.

-
output = model(input)
-loss = loss_fn(output, target)
-
-# loss.backward()
-self.backward(loss)
-
-
-
-
-

to_device

-

Use to_device() to move models, tensors or collections of tensors to -the current device. By default setup() and -setup_dataloaders() already move the model and data to the correct -device, so calling this method is only necessary for manual operation when needed.

-
data = torch.load("dataset.pt")
-data = self.to_device(data)
-
-
-
-
-

seed_everything

-

Make your code reproducible by calling this method at the beginning of your run.

-
# Instead of `torch.manual_seed(...)`, call:
-self.seed_everything(1234)
-
-
-

This covers PyTorch, NumPy and Python random number generators. In addition, Lite takes care of properly initializing -the seed of dataloader worker processes (can be turned off by passing workers=False).

-
-
-

autocast

-

Let the precision backend autocast the block of code under this context manager. This is optional and already done by -Lite for the model’s forward method (once the model has been set up via setup()). -You need this only if you wish to autocast more operations outside the ones in the model’s forward:

-
model, optimizer = self.setup(model, optimizer)
-
-# Lite handles precision automatically for the model
-output = model(inputs)
-
-with self.autocast():  # optional
-    loss = loss_function(output, target)
-
-self.backward(loss)
-...
-
-
-
-
-

print

-

Print to the console via the built-in print function, but only on the main process. -This avoids excessive printing and logs when running on multiple devices/nodes.

-
# Print only on the main process
-self.print(f"{epoch}/{num_epochs}| Train Epoch Loss: {loss}")
-
-
-
-
-

save

-

Save contents to a checkpoint. Replaces all occurrences of torch.save(...) in your code. Lite will take care of -handling the saving part correctly, no matter if you are running a single device, multi-devices or multi-nodes.

-
# Instead of `torch.save(...)`, call:
-self.save(model.state_dict(), "path/to/checkpoint.ckpt")
-
-
-
-
-

load

-

Load checkpoint contents from a file. Replaces all occurrences of torch.load(...) in your code. Lite will take care of -handling the loading part correctly, no matter if you are running a single device, multi-device, or multi-node.

-
# Instead of `torch.load(...)`, call:
-self.load("path/to/checkpoint.ckpt")
-
-
-
-
-

barrier

-

Call this if you want all processes to wait and synchronize. Once all processes have entered this call, -execution continues. Useful for example when you want to download data on one process and make all others wait until -the data is written to disk.

-
# Download data only on one process
-if self.global_rank == 0:
-    download_data("http://...")
-
-# Wait until all processes meet up here
-self.barrier()
-
-# All processes are allowed to read the data now
-
-
-
-
-
- - -
- -
-
- - - - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/model/build_model_intermediate.html b/docs/model/build_model_intermediate.html deleted file mode 100644 index 5db5ebf..0000000 --- a/docs/model/build_model_intermediate.html +++ /dev/null @@ -1,724 +0,0 @@ - - - - - - - - - - - - - - Supercharge training (intermediate) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Supercharge training (intermediate)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Supercharge training (intermediate)

-
-

Enable training features

-

Enable advanced training features using Trainer arguments. These are SOTA techniques that are automatically integrated into your training loop without changes to your code.

-
# train 1TB+ parameter models with Deepspeed/fsdp
-trainer = Trainer(
-    devices=4,
-    accelerator="gpu",
-    strategy="deepspeed_stage_2",
-    precision=16
- )
-
-# 20+ helpful arguments for rapid idea iteration
-trainer = Trainer(
-    max_epochs=10,
-    min_epochs=5,
-    overfit_batches=1
- )
-
-# access the latest state of the art techniques
-trainer = Trainer(callbacks=[StochasticWeightAveraging(...)])
-
-
-
-
-
-

Extend the Trainer

-

If you have multiple lines of code with similar functionalities, you can use callbacks to easily group them together and toggle all of those lines on or off at the same time.

-
trainer = Trainer(callbacks=[AWSCheckpoints()])
-
-
-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/model/manual_optimization.html b/docs/model/manual_optimization.html deleted file mode 100644 index f34ef9a..0000000 --- a/docs/model/manual_optimization.html +++ /dev/null @@ -1,965 +0,0 @@ - - - - - - - - - - - - - - Manual Optimization — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Manual Optimization
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Manual Optimization

-

For advanced research topics like reinforcement learning, sparse coding, or GAN research, it may be desirable to -manually manage the optimization process.

-

This is only recommended for experts who need ultimate flexibility. -Lightning will handle only accelerator, precision and strategy logic. -The users are left with optimizer.zero_grad(), gradient accumulation, model toggling, etc.

-

To manually optimize, do the following:

-
    -
  • Set self.automatic_optimization=False in your LightningModule’s __init__.

  • -
  • Use the following functions and call them manually:

    -
      -
    • self.optimizers() to access your optimizers (one or multiple)

    • -
    • optimizer.zero_grad() to clear the gradients from the previous training step

    • -
    • self.manual_backward(loss) instead of loss.backward()

    • -
    • optimizer.step() to update your model parameters

    • -
    -
  • -
-

Here is a minimal example of manual optimization.

-
from pytorch_lightning import LightningModule
-
-
-class MyModel(LightningModule):
-    def __init__(self):
-        super().__init__()
-        # Important: This property activates manual optimization.
-        self.automatic_optimization = False
-
-    def training_step(self, batch, batch_idx):
-        opt = self.optimizers()
-        opt.zero_grad()
-        loss = self.compute_loss(batch)
-        self.manual_backward(loss)
-        opt.step()
-
-
-
-

Warning

-

Before 1.2, optimizer.step() was calling optimizer.zero_grad() internally. -From 1.2, it is left to the user’s expertise.

-
-
-

Tip

-

Be careful where you call optimizer.zero_grad(), or your model won’t converge. -It is good practice to call optimizer.zero_grad() before self.manual_backward(loss).

-
-
-

Access your Own Optimizer

-

The provided optimizer is a LightningOptimizer object wrapping your own optimizer -configured in your configure_optimizers(). You can access your own optimizer -with optimizer.optimizer. However, if you use your own optimizer to perform a step, Lightning won’t be able to -support accelerators, precision and profiling for you.

-
class Model(LightningModule):
-    def __init__(self):
-        super().__init__()
-        self.automatic_optimization = False
-        ...
-
-    def training_step(self, batch, batch_idx):
-        optimizer = self.optimizers()
-
-        # `optimizer` is a `LightningOptimizer` wrapping the optimizer.
-        # To access it, do the following.
-        # However, it won't work on TPU, AMP, etc...
-        optimizer = optimizer.optimizer
-        ...
-
-
-
-
-

Gradient Accumulation

-

You can accumulate gradients over batches similarly to the accumulate_grad_batches argument in -Trainer for automatic optimization. To perform gradient accumulation with one optimizer -after every N steps, you can do the following.

-
def __init__(self):
-    super().__init__()
-    self.automatic_optimization = False
-
-
-def training_step(self, batch, batch_idx):
-    opt = self.optimizers()
-
-    loss = self.compute_loss(batch)
-    self.manual_backward(loss)
-
-    # accumulate gradients of N batches
-    if (batch_idx + 1) % N == 0:
-        opt.step()
-        opt.zero_grad()
-
-
-
-
-

Use Multiple Optimizers (like GANs)

-

Here is an example training a simple GAN with multiple optimizers using manual optimization.

-
import torch
-from torch import Tensor
-from pytorch_lightning import LightningModule
-
-
-class SimpleGAN(LightningModule):
-    def __init__(self):
-        super().__init__()
-        self.G = Generator()
-        self.D = Discriminator()
-
-        # Important: This property activates manual optimization.
-        self.automatic_optimization = False
-
-    def sample_z(self, n) -> Tensor:
-        sample = self._Z.sample((n,))
-        return sample
-
-    def sample_G(self, n) -> Tensor:
-        z = self.sample_z(n)
-        return self.G(z)
-
-    def training_step(self, batch, batch_idx):
-        # Implementation follows the PyTorch tutorial:
-        # https://pytorch.org/tutorials/beginner/dcgan_faces_tutorial.html
-        g_opt, d_opt = self.optimizers()
-
-        X, _ = batch
-        batch_size = X.shape[0]
-
-        real_label = torch.ones((batch_size, 1), device=self.device)
-        fake_label = torch.zeros((batch_size, 1), device=self.device)
-
-        g_X = self.sample_G(batch_size)
-
-        ##########################
-        # Optimize Discriminator #
-        ##########################
-        d_x = self.D(X)
-        errD_real = self.criterion(d_x, real_label)
-
-        d_z = self.D(g_X.detach())
-        errD_fake = self.criterion(d_z, fake_label)
-
-        errD = errD_real + errD_fake
-
-        d_opt.zero_grad()
-        self.manual_backward(errD)
-        d_opt.step()
-
-        ######################
-        # Optimize Generator #
-        ######################
-        d_z = self.D(g_X)
-        errG = self.criterion(d_z, real_label)
-
-        g_opt.zero_grad()
-        self.manual_backward(errG)
-        g_opt.step()
-
-        self.log_dict({"g_loss": errG, "d_loss": errD}, prog_bar=True)
-
-    def configure_optimizers(self):
-        g_opt = torch.optim.Adam(self.G.parameters(), lr=1e-5)
-        d_opt = torch.optim.Adam(self.D.parameters(), lr=1e-5)
-        return g_opt, d_opt
-
-
-
-
-

Learning Rate Scheduling

-

Every optimizer you use can be paired with any -Learning Rate Scheduler. Please see the -documentation of configure_optimizers() for all the available options.

-

You can call lr_scheduler.step() at arbitrary intervals. -Use self.lr_schedulers() in your LightningModule to access any learning rate schedulers -defined in your configure_optimizers().

-
-

Warning

-
    -
  • Before v1.3, Lightning automatically called lr_scheduler.step() in both automatic and manual optimization. From -1.3, lr_scheduler.step() is now for the user to call at arbitrary intervals.

  • -
  • Note that the lr_scheduler_config keys, such as "frequency" and "interval", will be ignored even if they are provided in -your configure_optimizers() during manual optimization.

  • -
-
-

Here is an example calling lr_scheduler.step() every step.

-
# step every batch
-def __init__(self):
-    super().__init__()
-    self.automatic_optimization = False
-
-
-def training_step(self, batch, batch_idx):
-    # do forward, backward, and optimization
-    ...
-
-    # single scheduler
-    sch = self.lr_schedulers()
-    sch.step()
-
-    # multiple schedulers
-    sch1, sch2 = self.lr_schedulers()
-    sch1.step()
-    sch2.step()
-
-
-

If you want to call lr_scheduler.step() every N steps/epochs, do the following.

-
def __init__(self):
-    super().__init__()
-    self.automatic_optimization = False
-
-
-def training_step(self, batch, batch_idx):
-    # do forward, backward, and optimization
-    ...
-
-    sch = self.lr_schedulers()
-
-    # step every N batches
-    if (batch_idx + 1) % N == 0:
-        sch.step()
-
-    # step every N epochs
-    if self.trainer.is_last_batch and (self.trainer.current_epoch + 1) % N == 0:
-        sch.step()
-
-
-

If you want to call schedulers that require a metric value after each epoch, consider doing the following:

-
def __init__(self):
-    super().__init__()
-    self.automatic_optimization = False
-
-
-def training_epoch_end(self, outputs):
-    sch = self.lr_schedulers()
-
-    # If the selected scheduler is a ReduceLROnPlateau scheduler.
-    if isinstance(sch, torch.optim.lr_scheduler.ReduceLROnPlateau):
-        sch.step(self.trainer.callback_metrics["loss"])
-
-
-
-
-

Use Closure for LBFGS-like Optimizers

-

It is a good practice to provide the optimizer with a closure function that performs a forward, zero_grad and -backward of your model. It is optional for most optimizers, but makes your code compatible if you switch to an -optimizer which requires a closure, such as LBFGS.

-

See the PyTorch docs for more about the closure.

-

Here is an example using a closure function.

-
def __init__(self):
-    super().__init__()
-    self.automatic_optimization = False
-
-
-def configure_optimizers(self):
-    return torch.optim.LBFGS(...)
-
-
-def training_step(self, batch, batch_idx):
-    opt = self.optimizers()
-
-    def closure():
-        loss = self.compute_loss(batch)
-        opt.zero_grad()
-        self.manual_backward(loss)
-        return loss
-
-    opt.step(closure=closure)
-
-
-
-

Warning

-

The LBFGS optimizer is not supported for apex AMP, native AMP, IPUs, or DeepSpeed.

-
-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/model/own_your_loop.html b/docs/model/own_your_loop.html deleted file mode 100644 index 7e701c0..0000000 --- a/docs/model/own_your_loop.html +++ /dev/null @@ -1,731 +0,0 @@ - - - - - - - - - - - - - - Use a pure PyTorch training loop — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Use a pure PyTorch training loop
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
- - - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/model/train_model_basic.html b/docs/model/train_model_basic.html deleted file mode 100644 index e24fa03..0000000 --- a/docs/model/train_model_basic.html +++ /dev/null @@ -1,801 +0,0 @@ - - - - - - - - - - - - - - Train a model (basic) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Train a model (basic)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Train a model (basic)

-

Audience: Users who need to train a model without coding their own training loops.

-
-
-

Add imports

-

Add the relevant imports at the top of the file

-
import os
-import torch
-from torch import nn
-import torch.nn.functional as F
-from torchvision import transforms
-from torchvision.datasets import MNIST
-from torch.utils.data import DataLoader, random_split
-import pytorch_lightning as pl
-
-
-
-
-
-

Define the PyTorch nn.Modules

-
class Encoder(nn.Module):
-    def __init__(self):
-        self.l1 = nn.Sequential(nn.Linear(28 * 28, 64), nn.ReLU(), nn.Linear(64, 3))
-
-    def forward(self, x):
-        return self.l1(x)
-
-
-class Decoder(nn.Module):
-    def __init__(self):
-        self.l1 = nn.Sequential(nn.Linear(3, 64), nn.ReLU(), nn.Linear(64, 28 * 28))
-
-    def forward(self, x):
-        return self.l1(x)
-
-
-
-
-
-

Define a LightningModule

-

The LightningModule is the full recipe that defines how your nn.Modules interact.

-
    -
  • The training_step defines how the nn.Modules interact together.

  • -
  • In the configure_optimizers define the optimizer(s) for your models.

  • -
-
class LitAutoEncoder(pl.LightningModule):
-    def __init__(self, encoder, decoder):
-        super().__init__()
-        self.encoder = encoder
-        self.decoder = decoder
-
-    def training_step(self, batch, batch_idx):
-        # training_step defines the train loop.
-        x, y = batch
-        x = x.view(x.size(0), -1)
-        z = self.encoder(x)
-        x_hat = self.decoder(z)
-        loss = F.mse_loss(x_hat, x)
-        return loss
-
-    def configure_optimizers(self):
-        optimizer = torch.optim.Adam(self.parameters(), lr=1e-3)
-        return optimizer
-
-
-
-
-
-

Define the training dataset

-

Define a PyTorch DataLoader which contains your training dataset.

-
dataset = MNIST(os.getcwd(), download=True, transform=transforms.ToTensor())
-train_loader = DataLoader(dataset)
-
-
-
-
-
-

Train the model

-

To train the model use the Lightning Trainer which handles all the engineering and abstracts away all the complexity needed for scale.

-
# model
-autoencoder = LitAutoEncoder(Encoder(), Decoder())
-
-# train model
-trainer = pl.Trainer()
-trainer.fit(model=autoencoder, train_dataloaders=train_loader)
-
-
-
-
-
-

Eliminate the training loop

-

Under the hood, the Lightning Trainer runs the following training loop on your behalf

-
autoencoder = LitAutoEncoder(encoder, decoder)
-optimizer = autoencoder.configure_optimizers()
-
-for batch, batch_idx in enumerate(train_loader):
-    loss = autoencoder(batch, batch_idx)
-
-    loss.backward()
-    optimizer.step()
-    optimizer.zero_grad()
-
-
-

The power of Lightning comes when the training loop gets complicated as you add validation/test splits, schedulers, distributed training and all the latest SOTA techniques.

-

With Lightning, you can mix all these techniques together without needing to rewrite a new loop every time.

-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/objects.inv b/docs/objects.inv deleted file mode 100644 index 08ed8c9..0000000 Binary files a/docs/objects.inv and /dev/null differ diff --git a/docs/rtfd-build.sh b/docs/rtfd-build.sh new file mode 100644 index 0000000..edfc5b3 --- /dev/null +++ b/docs/rtfd-build.sh @@ -0,0 +1,12 @@ +# building for PRs and skip stable and latest states + +if ! [ $READTHEDOCS_VERSION == "latest" -o $READTHEDOCS_VERSION == "stable" ]; +then + cd ./docs/source-pytorch ; + export PL_FAST_DOCS_DEV=1 ; + make html --jobs $(nproc) ; + ls -lh ../build +else + echo "Void build... :-]" ; + mkdir -p ./docs/build/html +fi diff --git a/docs/search.html b/docs/search.html deleted file mode 100644 index 75efebc..0000000 --- a/docs/search.html +++ /dev/null @@ -1,696 +0,0 @@ - - - - - - - - - - - - - Search — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- - - - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- - - - -
- -
- -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- -
-
-
- -
-
-
-
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/searchindex.js b/docs/searchindex.js deleted file mode 100644 index ed1e556..0000000 --- a/docs/searchindex.js +++ /dev/null @@ -1 +0,0 @@ -Search.setIndex({docnames:["accelerators/accelerator_prepare","accelerators/gpu","accelerators/gpu_advanced","accelerators/gpu_basic","accelerators/gpu_expert","accelerators/gpu_faq","accelerators/gpu_intermediate","accelerators/hpu","accelerators/hpu_basic","accelerators/hpu_intermediate","accelerators/ipu","accelerators/ipu_advanced","accelerators/ipu_basic","accelerators/ipu_intermediate","accelerators/tpu","accelerators/tpu_advanced","accelerators/tpu_basic","accelerators/tpu_faq","accelerators/tpu_intermediate","advanced/model_parallel","advanced/pruning_quantization","advanced/strategy_registry","advanced/training_tricks","advanced/transfer_learning","benchmarking/benchmarks","cli/lightning_cli","cli/lightning_cli_advanced","cli/lightning_cli_advanced_2","cli/lightning_cli_advanced_3","cli/lightning_cli_expert","cli/lightning_cli_faq","cli/lightning_cli_intermediate","cli/lightning_cli_intermediate_2","clouds/cloud_training","clouds/cloud_training_intermediate","clouds/cluster","clouds/cluster_advanced","clouds/cluster_expert","clouds/cluster_intermediate_1","clouds/cluster_intermediate_2","clouds/fault_tolerant_training","clouds/fault_tolerant_training_basic","clouds/fault_tolerant_training_expert","clouds/fault_tolerant_training_faq","clouds/grid_costs","clouds/run_advanced","clouds/run_basic","clouds/run_expert","clouds/run_intermediate","clouds/session_basic","clouds/session_intermediate","common/checkpointing","common/checkpointing_advanced","common/checkpointing_basic","common/checkpointing_expert","common/checkpointing_intermediate","common/child_modules","common/console_logs","common/early_stopping","common/evaluation","common/evaluation_basic","common/evaluation_intermediate","common/gradient_accumulation","common/hyperparameters","common/lightning_mo
dule","common/optimization","common/precision","common/precision_basic","common/precision_expert","common/precision_intermediate","common/progress_bar","common/remote_fs","common/trainer","common_usecases","data/datamodule","debug/debugging","debug/debugging_advanced","debug/debugging_basic","debug/debugging_intermediate","deploy/production","deploy/production_advanced","deploy/production_advanced_2","deploy/production_basic","deploy/production_intermediate","ecosystem/asr_nlp_tts","ecosystem/bolts","ecosystem/community_examples","ecosystem/ecosystem-ci","ecosystem/flash","ecosystem/metrics","ecosystem/transformers","expertise_levels","extensions/accelerator","extensions/callbacks","extensions/callbacks_state","extensions/datamodules_state","extensions/generated/pytorch_lightning.loggers.CSVLogger","extensions/generated/pytorch_lightning.loggers.CometLogger","extensions/generated/pytorch_lightning.loggers.MLFlowLogger","extensions/generated/pytorch_lightning.loggers.NeptuneLogger","extensions/generated/pytorch_lightning.loggers.TensorBoardLogger","extensions/generated/pytorch_lightning.loggers.WandbLogger","extensions/logging","extensions/loops","extensions/loops_advanced","extensions/plugins","extensions/strategy","guides/data","guides/speed","index","levels/advanced","levels/advanced_level_15","levels/advanced_level_16","levels/advanced_level_17","levels/advanced_level_18","levels/advanced_level_19","levels/advanced_level_20","levels/advanced_level_21","levels/advanced_level_22","levels/basic_level_2","levels/basic_level_5","levels/core_level_3","levels/core_level_6","levels/core_skills","levels/expert","levels/expert_level_23","levels/expert_level_24","levels/expert_level_27","levels/intermediate","levels/intermediate_level_10","levels/intermediate_level_11","levels/intermediate_level_12","levels/intermediate_level_13","levels/intermediate_level_14","levels/intermediate_level_7","levels/intermediate_level_8","levels/intermediate_level_9","links","model/build_mode
l","model/build_model_advanced","model/build_model_expert","model/build_model_intermediate","model/manual_optimization","model/own_your_loop","model/train_model_basic","starter/converting","starter/installation","starter/introduction","starter/lightning_lite","starter/style_guide","tuning/profiler","tuning/profiler_advanced","tuning/profiler_basic","tuning/profiler_expert","tuning/profiler_intermediate","visualize/experiment_managers","visualize/loggers","visualize/logging_advanced","visualize/logging_basic","visualize/logging_expert","visualize/logging_intermediate","visualize/supported_exp_managers"],envversion:{"sphinx.domains.c":2,"sphinx.domains.changeset":1,"sphinx.domains.citation":1,"sphinx.domains.cpp":5,"sphinx.domains.index":1,"sphinx.domains.javascript":2,"sphinx.domains.math":2,"sphinx.domains.python":3,"sphinx.domains.rst":2,"sphinx.domains.std":2,"sphinx.ext.intersphinx":1,"sphinx.ext.todo":2,"sphinx.ext.viewcode":1,nbsphinx:4,sphinx:56},filenames:["accelerators/accelerator_prepare.rst","accelerators/gpu.rst","accelerators/gpu_advanced.rst","accelerators/gpu_basic.rst","accelerators/gpu_expert.rst","accelerators/gpu_faq.rst","accelerators/gpu_intermediate.rst","accelerators/hpu.rst","accelerators/hpu_basic.rst","accelerators/hpu_intermediate.rst","accelerators/ipu.rst","accelerators/ipu_advanced.rst","accelerators/ipu_basic.rst","accelerators/ipu_intermediate.rst","accelerators/tpu.rst","accelerators/tpu_advanced.rst","accelerators/tpu_basic.rst","accelerators/tpu_faq.rst","accelerators/tpu_intermediate.rst","advanced/model_parallel.rst","advanced/pruning_quantization.rst","advanced/strategy_registry.rst","advanced/training_tricks.rst","advanced/transfer_learning.rst","benchmarking/benchmarks.rst","cli/lightning_cli.rst","cli/lightning_cli_advanced.rst","cli/lightning_cli_advanced_2.rst","cli/lightning_cli_advanced_3.rst","cli/lightning_cli_expert.rst","cli/lightning_cli_faq.rst","cli/lightning_cli_intermediate.rst","cli/lightning_cli_intermediate_2.r
st","clouds/cloud_training.rst","clouds/cloud_training_intermediate.rst","clouds/cluster.rst","clouds/cluster_advanced.rst","clouds/cluster_expert.rst","clouds/cluster_intermediate_1.rst","clouds/cluster_intermediate_2.rst","clouds/fault_tolerant_training.rst","clouds/fault_tolerant_training_basic.rst","clouds/fault_tolerant_training_expert.rst","clouds/fault_tolerant_training_faq.rst","clouds/grid_costs.rst","clouds/run_advanced.rst","clouds/run_basic.rst","clouds/run_expert.rst","clouds/run_intermediate.rst","clouds/session_basic.rst","clouds/session_intermediate.rst","common/checkpointing.rst","common/checkpointing_advanced.rst","common/checkpointing_basic.rst","common/checkpointing_expert.rst","common/checkpointing_intermediate.rst","common/child_modules.rst","common/console_logs.rst","common/early_stopping.rst","common/evaluation.rst","common/evaluation_basic.rst","common/evaluation_intermediate.rst","common/gradient_accumulation.rst","common/hyperparameters.rst","common/lightning_module.rst","common/optimization.rst","common/precision.rst","common/precision_basic.rst","common/precision_expert.rst","common/precision_intermediate.rst","common/progress_bar.rst","common/remote_fs.rst","common/trainer.rst","common_usecases.rst","data/datamodule.rst","debug/debugging.rst","debug/debugging_advanced.rst","debug/debugging_basic.rst","debug/debugging_intermediate.rst","deploy/production.rst","deploy/production_advanced.rst","deploy/production_advanced_2.rst","deploy/production_basic.rst","deploy/production_intermediate.rst","ecosystem/asr_nlp_tts.rst","ecosystem/bolts.rst","ecosystem/community_examples.rst","ecosystem/ecosystem-ci.rst","ecosystem/flash.rst","ecosystem/metrics.rst","ecosystem/transformers.rst","expertise_levels.rst","extensions/accelerator.rst","extensions/callbacks.rst","extensions/callbacks_state.rst","extensions/datamodules_state.rst","extensions/generated/pytorch_lightning.loggers.CSVLogger.rst","extensions/generated/pytorch_lightning.loggers.CometLo
gger.rst","extensions/generated/pytorch_lightning.loggers.MLFlowLogger.rst","extensions/generated/pytorch_lightning.loggers.NeptuneLogger.rst","extensions/generated/pytorch_lightning.loggers.TensorBoardLogger.rst","extensions/generated/pytorch_lightning.loggers.WandbLogger.rst","extensions/logging.rst","extensions/loops.rst","extensions/loops_advanced.rst","extensions/plugins.rst","extensions/strategy.rst","guides/data.rst","guides/speed.rst","index.rst","levels/advanced.rst","levels/advanced_level_15.rst","levels/advanced_level_16.rst","levels/advanced_level_17.rst","levels/advanced_level_18.rst","levels/advanced_level_19.rst","levels/advanced_level_20.rst","levels/advanced_level_21.rst","levels/advanced_level_22.rst","levels/basic_level_2.rst","levels/basic_level_5.rst","levels/core_level_3.rst","levels/core_level_6.rst","levels/core_skills.rst","levels/expert.rst","levels/expert_level_23.rst","levels/expert_level_24.rst","levels/expert_level_27.rst","levels/intermediate.rst","levels/intermediate_level_10.rst","levels/intermediate_level_11.rst","levels/intermediate_level_12.rst","levels/intermediate_level_13.rst","levels/intermediate_level_14.rst","levels/intermediate_level_7.rst","levels/intermediate_level_8.rst","levels/intermediate_level_9.rst","links.rst","model/build_model.rst","model/build_model_advanced.rst","model/build_model_expert.rst","model/build_model_intermediate.rst","model/manual_optimization.rst","model/own_your_loop.rst","model/train_model_basic.rst","starter/converting.rst","starter/installation.rst","starter/introduction.rst","starter/lightning_lite.rst","starter/style_guide.rst","tuning/profiler.rst","tuning/profiler_advanced.rst","tuning/profiler_basic.rst","tuning/profiler_expert.rst","tuning/profiler_intermediate.rst","visualize/experiment_managers.rst","visualize/loggers.rst","visualize/logging_advanced.rst","visualize/logging_basic.rst","visualize/logging_expert.rst","visualize/logging_intermediate.rst","visualize/supported_exp_managers.r
st"],objects:{"pytorch_lightning.callbacks.BackboneFinetuning.params":[[93,0,1,"","backbone_initial_lr"],[93,0,1,"","backbone_initial_ratio_lr"],[93,0,1,"","initial_denom_lr"],[93,0,1,"","lambda_func"],[93,0,1,"","rounding"],[93,0,1,"","should_align"],[93,0,1,"","train_bn"],[93,0,1,"","unfreeze_backbone_at_epoch"],[93,0,1,"","verbose"]],"pytorch_lightning.callbacks.BasePredictionWriter.params":[[93,0,1,"","write_interval"]],"pytorch_lightning.callbacks.Callback.load_state_dict.params":[[93,0,1,"","state_dict"]],"pytorch_lightning.callbacks.Callback.on_load_checkpoint.params":[[93,0,1,"","callback_state"],[93,0,1,"","pl_module"],[93,0,1,"","trainer"]],"pytorch_lightning.callbacks.Callback.on_save_checkpoint.params":[[93,0,1,"","checkpoint"],[93,0,1,"","pl_module"],[93,0,1,"","trainer"]],"pytorch_lightning.callbacks.EarlyStopping.params":[[93,0,1,"","check_finite"],[93,0,1,"","check_on_train_epoch_end"],[93,0,1,"","divergence_threshold"],[93,0,1,"","min_delta"],[93,0,1,"","mode"],[93,0,1,"","monitor"],[93,0,1,"","patience"],[93,0,1,"","stopping_threshold"],[93,0,1,"","strict"],[93,0,1,"","verbose"]],"pytorch_lightning.callbacks.GradientAccumulationScheduler.params":[[93,0,1,"","scheduling"]],"pytorch_lightning.callbacks.LambdaCallback.params":[[93,0,1,"","**kwargs"]],"pytorch_lightning.callbacks.LearningRateMonitor.params":[[93,0,1,"","log_momentum"],[93,0,1,"","logging_interval"]],"pytorch_lightning.callbacks.ModelCheckpoint.params":[[93,0,1,"","auto_insert_metric_name"],[93,0,1,"","dirpath"],[93,0,1,"","every_n_epochs"],[93,0,1,"","every_n_train_steps"],[93,0,1,"","filename"],[93,0,1,"","mode"],[93,0,1,"","monitor"],[93,0,1,"","save_last"],[93,0,1,"","save_on_train_epoch_end"],[93,0,1,"","save_top_k"],[93,0,1,"","save_weights_only"],[93,0,1,"","train_time_interval"],[93,0,1,"","verbose"]],"pytorch_lightning.callbacks.ModelPruning.params":[[93,0,1,"","amount"],[93,0,1,"","apply_pruning"],[93,0,1,"","make_pruning_permanent"],[93,0,1,"","parameter_names"],[93,0,1,"","p
arameters_to_prune"],[93,0,1,"","prune_on_train_epoch_end"],[93,0,1,"","pruning_dim"],[93,0,1,"","pruning_fn"],[93,0,1,"","pruning_norm"],[93,0,1,"","resample_parameters"],[93,0,1,"","use_global_unstructured"],[93,0,1,"","use_lottery_ticket_hypothesis"],[93,0,1,"","verbose"]],"pytorch_lightning.callbacks.ModelSummary.params":[[93,0,1,"","max_depth"]],"pytorch_lightning.callbacks.QuantizationAwareTraining.params":[[93,0,1,"","collect_quantization"],[93,0,1,"","input_compatible"],[93,0,1,"","modules_to_fuse"],[93,0,1,"","observer_enabled_stages"],[93,0,1,"","observer_type"],[93,0,1,"","qconfig"],[93,0,1,"","quantize_on_fit_end"]],"pytorch_lightning.callbacks.RichModelSummary.params":[[93,0,1,"","max_depth"]],"pytorch_lightning.callbacks.RichProgressBar.params":[[93,0,1,"","console_kwargs"],[93,0,1,"","leave"],[93,0,1,"","refresh_rate"],[93,0,1,"","theme"]],"pytorch_lightning.callbacks.StochasticWeightAveraging.params":[[93,0,1,"","annealing_epochs"],[93,0,1,"","annealing_strategy"],[93,0,1,"","avg_fn"],[93,0,1,"","device"],[93,0,1,"","swa_epoch_start"],[93,0,1,"","swa_lrs"]],"pytorch_lightning.callbacks.TQDMProgressBar.params":[[93,0,1,"","process_position"],[93,0,1,"","refresh_rate"]],"pytorch_lightning.callbacks.Timer.params":[[93,0,1,"","duration"],[93,0,1,"","interval"],[93,0,1,"","verbose"]],"pytorch_lightning.core.datamodule.LightningDataModule.load_state_dict.params":[[74,0,1,"","state_dict"]],"pytorch_lightning.core.datamodule.LightningDataModule.on_after_batch_transfer.params":[[74,0,1,"","batch"],[74,0,1,"","dataloader_idx"]],"pytorch_lightning.core.datamodule.LightningDataModule.on_before_batch_transfer.params":[[74,0,1,"","batch"],[74,0,1,"","dataloader_idx"]],"pytorch_lightning.core.datamodule.LightningDataModule.teardown.params":[[74,0,1,"","stage"]],"pytorch_lightning.core.datamodule.LightningDataModule.transfer_batch_to_device.params":[[74,0,1,"","batch"],[74,0,1,"","dataloader_idx"],[74,0,1,"","device"]],"pytorch_lightning.core.lightning.LightningModu
le.add_to_queue.params":[[64,0,1,"","queue"]],"pytorch_lightning.core.lightning.LightningModule.all_gather.params":[[64,0,1,"","data"],[64,0,1,"","group"],[64,0,1,"","sync_grads"]],"pytorch_lightning.core.lightning.LightningModule.backward.params":[[64,0,1,"","loss"],[64,0,1,"","optimizer"],[64,0,1,"","optimizer_idx"]],"pytorch_lightning.core.lightning.LightningModule.configure_gradient_clipping.params":[[64,0,1,"","gradient_clip_algorithm"],[64,0,1,"","gradient_clip_val"],[64,0,1,"","optimizer"],[64,0,1,"","optimizer_idx"]],"pytorch_lightning.core.lightning.LightningModule.forward.params":[[64,0,1,"","**kwargs"],[64,0,1,"","*args"]],"pytorch_lightning.core.lightning.LightningModule.get_from_queue.params":[[64,0,1,"","queue"]],"pytorch_lightning.core.lightning.LightningModule.load_from_checkpoint.params":[[64,0,1,"","checkpoint_path"],[64,0,1,"","hparams_file"],[64,0,1,"","kwargs"],[64,0,1,"","map_location"],[64,0,1,"","strict"]],"pytorch_lightning.core.lightning.LightningModule.log.params":[[64,0,1,"","add_dataloader_idx"],[64,0,1,"","batch_size"],[64,0,1,"","enable_graph"],[64,0,1,"","logger"],[64,0,1,"","metric_attribute"],[64,0,1,"","name"],[64,0,1,"","on_epoch"],[64,0,1,"","on_step"],[64,0,1,"","prog_bar"],[64,0,1,"","rank_zero_only"],[64,0,1,"","reduce_fx"],[64,0,1,"","sync_dist"],[64,0,1,"","sync_dist_group"],[64,0,1,"","value"]],"pytorch_lightning.core.lightning.LightningModule.log_dict.params":[[64,0,1,"","add_dataloader_idx"],[64,0,1,"","batch_size"],[64,0,1,"","dictionary"],[64,0,1,"","enable_graph"],[64,0,1,"","logger"],[64,0,1,"","on_epoch"],[64,0,1,"","on_step"],[64,0,1,"","prog_bar"],[64,0,1,"","rank_zero_only"],[64,0,1,"","reduce_fx"],[64,0,1,"","sync_dist"],[64,0,1,"","sync_dist_group"]],"pytorch_lightning.core.lightning.LightningModule.manual_backward.params":[[64,0,1,"","**kwargs"],[64,0,1,"","*args"],[64,0,1,"","loss"]],"pytorch_lightning.core.lightning.LightningModule.on_after_batch_transfer.params":[[64,0,1,"","batch"],[64,0,1,"","dataloader_id
x"]],"pytorch_lightning.core.lightning.LightningModule.on_before_backward.params":[[64,0,1,"","loss"]],"pytorch_lightning.core.lightning.LightningModule.on_before_batch_transfer.params":[[64,0,1,"","batch"],[64,0,1,"","dataloader_idx"]],"pytorch_lightning.core.lightning.LightningModule.on_before_optimizer_step.params":[[64,0,1,"","optimizer"],[64,0,1,"","optimizer_idx"]],"pytorch_lightning.core.lightning.LightningModule.on_before_zero_grad.params":[[64,0,1,"","optimizer"]],"pytorch_lightning.core.lightning.LightningModule.on_hpc_load.params":[[64,0,1,"","checkpoint"]],"pytorch_lightning.core.lightning.LightningModule.on_hpc_save.params":[[64,0,1,"","checkpoint"]],"pytorch_lightning.core.lightning.LightningModule.on_load_checkpoint.params":[[64,0,1,"","checkpoint"]],"pytorch_lightning.core.lightning.LightningModule.on_predict_batch_end.params":[[64,0,1,"","batch"],[64,0,1,"","batch_idx"],[64,0,1,"","dataloader_idx"],[64,0,1,"","outputs"]],"pytorch_lightning.core.lightning.LightningModule.on_predict_batch_start.params":[[64,0,1,"","batch"],[64,0,1,"","batch_idx"],[64,0,1,"","dataloader_idx"]],"pytorch_lightning.core.lightning.LightningModule.on_save_checkpoint.params":[[64,0,1,"","checkpoint"]],"pytorch_lightning.core.lightning.LightningModule.on_test_batch_end.params":[[64,0,1,"","batch"],[64,0,1,"","batch_idx"],[64,0,1,"","dataloader_idx"],[64,0,1,"","outputs"]],"pytorch_lightning.core.lightning.LightningModule.on_test_batch_start.params":[[64,0,1,"","batch"],[64,0,1,"","batch_idx"],[64,0,1,"","dataloader_idx"]],"pytorch_lightning.core.lightning.LightningModule.on_train_batch_end.params":[[64,0,1,"","batch"],[64,0,1,"","batch_idx"],[64,0,1,"","outputs"],[64,0,1,"","unused"]],"pytorch_lightning.core.lightning.LightningModule.on_train_batch_start.params":[[64,0,1,"","batch"],[64,0,1,"","batch_idx"],[64,0,1,"","unused"]],"pytorch_lightning.core.lightning.LightningModule.on_validation_batch_end.params":[[64,0,1,"","batch"],[64,0,1,"","batch_idx"],[64,0,1,"","dataloader_
idx"],[64,0,1,"","outputs"]],"pytorch_lightning.core.lightning.LightningModule.on_validation_batch_start.params":[[64,0,1,"","batch"],[64,0,1,"","batch_idx"],[64,0,1,"","dataloader_idx"]],"pytorch_lightning.core.lightning.LightningModule.optimizer_step.params":[[64,0,1,"","batch_idx"],[64,0,1,"","epoch"],[64,0,1,"","on_tpu"],[64,0,1,"","optimizer"],[64,0,1,"","optimizer_closure"],[64,0,1,"","optimizer_idx"],[64,0,1,"","using_lbfgs"],[64,0,1,"","using_native_amp"]],"pytorch_lightning.core.lightning.LightningModule.optimizer_zero_grad.params":[[64,0,1,"","batch_idx"],[64,0,1,"","epoch"],[64,0,1,"","optimizer"],[64,0,1,"","optimizer_idx"]],"pytorch_lightning.core.lightning.LightningModule.optimizers.params":[[64,0,1,"","use_pl_optimizer"]],"pytorch_lightning.core.lightning.LightningModule.predict_step.params":[[64,0,1,"","batch"],[64,0,1,"","batch_idx"],[64,0,1,"","dataloader_idx"]],"pytorch_lightning.core.lightning.LightningModule.print.params":[[64,0,1,"","**kwargs"],[64,0,1,"","*args"]],"pytorch_lightning.core.lightning.LightningModule.save_hyperparameters.params":[[64,0,1,"","args"],[64,0,1,"","frame"],[64,0,1,"","ignore"],[64,0,1,"","logger"]],"pytorch_lightning.core.lightning.LightningModule.setup.params":[[64,0,1,"","stage"]],"pytorch_lightning.core.lightning.LightningModule.tbptt_split_batch.params":[[64,0,1,"","batch"],[64,0,1,"","split_size"]],"pytorch_lightning.core.lightning.LightningModule.teardown.params":[[64,0,1,"","stage"]],"pytorch_lightning.core.lightning.LightningModule.test_epoch_end.params":[[64,0,1,"","outputs"]],"pytorch_lightning.core.lightning.LightningModule.test_step.params":[[64,0,1,"","batch"],[64,0,1,"","batch_idx"],[64,0,1,"","dataloader_id"]],"pytorch_lightning.core.lightning.LightningModule.test_step_end.params":[[64,0,1,"","step_output"]],"pytorch_lightning.core.lightning.LightningModule.to_onnx.params":[[64,0,1,"","**kwargs"],[64,0,1,"","file_path"],[64,0,1,"","input_sample"]],"pytorch_lightning.core.lightning.LightningModule.to_torc
hscript.params":[[64,0,1,"","**kwargs"],[64,0,1,"","example_inputs"],[64,0,1,"","file_path"],[64,0,1,"","method"]],"pytorch_lightning.core.lightning.LightningModule.toggle_optimizer.params":[[64,0,1,"","optimizer"],[64,0,1,"","optimizer_idx"]],"pytorch_lightning.core.lightning.LightningModule.training_epoch_end.params":[[64,0,1,"","outputs"]],"pytorch_lightning.core.lightning.LightningModule.training_step.params":[[64,0,1,"","batch"],[64,0,1,"","batch_idx"],[64,0,1,"","hiddens"],[64,0,1,"","optimizer_idx"]],"pytorch_lightning.core.lightning.LightningModule.training_step_end.params":[[64,0,1,"","step_output"]],"pytorch_lightning.core.lightning.LightningModule.transfer_batch_to_device.params":[[64,0,1,"","batch"],[64,0,1,"","dataloader_idx"],[64,0,1,"","device"]],"pytorch_lightning.core.lightning.LightningModule.untoggle_optimizer.params":[[64,0,1,"","optimizer_idx"]],"pytorch_lightning.core.lightning.LightningModule.validation_epoch_end.params":[[64,0,1,"","outputs"]],"pytorch_lightning.core.lightning.LightningModule.validation_step.params":[[64,0,1,"","batch"],[64,0,1,"","batch_idx"],[64,0,1,"","dataloader_idx"]],"pytorch_lightning.core.lightning.LightningModule.validation_step_end.params":[[64,0,1,"","step_output"]],"pytorch_lightning.loggers":[[96,1,1,"","CSVLogger"],[97,1,1,"","CometLogger"],[98,1,1,"","MLFlowLogger"],[99,1,1,"","NeptuneLogger"],[100,1,1,"","TensorBoardLogger"],[101,1,1,"","WandbLogger"]],"pytorch_lightning.loggers.CSVLogger":[[96,2,1,"","experiment"],[96,3,1,"","finalize"],[96,2,1,"","log_dir"],[96,3,1,"","log_hyperparams"],[96,3,1,"","log_metrics"],[96,2,1,"","name"],[96,2,1,"","root_dir"],[96,3,1,"","save"],[96,2,1,"","save_dir"],[96,2,1,"","version"]],"pytorch_lightning.loggers.CSVLogger.finalize.params":[[96,0,1,"","status"]],"pytorch_lightning.loggers.CSVLogger.log_hyperparams.params":[[96,0,1,"","args"],[96,0,1,"","kwargs"],[96,0,1,"","params"]],"pytorch_lightning.loggers.CSVLogger.log_metrics.params":[[96,0,1,"","metrics"],[96,0,1,"","ste
p"]],"pytorch_lightning.loggers.CSVLogger.params":[[102,0,1,"","flush_logs_every_n_steps"],[102,0,1,"","name"],[102,0,1,"","prefix"],[102,0,1,"","save_dir"],[102,0,1,"","version"]],"pytorch_lightning.loggers.CometLogger":[[97,2,1,"","experiment"],[97,3,1,"","finalize"],[97,3,1,"","log_graph"],[97,3,1,"","log_hyperparams"],[97,3,1,"","log_metrics"],[97,2,1,"","name"],[97,2,1,"","save_dir"],[97,2,1,"","version"]],"pytorch_lightning.loggers.CometLogger.log_graph.params":[[97,0,1,"","input_array"],[97,0,1,"","model"]],"pytorch_lightning.loggers.CometLogger.log_hyperparams.params":[[97,0,1,"","args"],[97,0,1,"","kwargs"],[97,0,1,"","params"]],"pytorch_lightning.loggers.CometLogger.log_metrics.params":[[97,0,1,"","metrics"],[97,0,1,"","step"]],"pytorch_lightning.loggers.CometLogger.params":[[102,0,1,"","**kwargs"],[102,0,1,"","api_key"],[102,0,1,"","experiment_key"],[102,0,1,"","experiment_name"],[102,0,1,"","offline"],[102,0,1,"","prefix"],[102,0,1,"","project_name"],[102,0,1,"","rest_api_key"],[102,0,1,"","save_dir"]],"pytorch_lightning.loggers.MLFlowLogger":[[98,2,1,"","experiment"],[98,2,1,"","experiment_id"],[98,3,1,"","finalize"],[98,3,1,"","log_hyperparams"],[98,3,1,"","log_metrics"],[98,2,1,"","name"],[98,2,1,"","run_id"],[98,2,1,"","save_dir"],[98,2,1,"","version"]],"pytorch_lightning.loggers.MLFlowLogger.finalize.params":[[98,0,1,"","status"]],"pytorch_lightning.loggers.MLFlowLogger.log_hyperparams.params":[[98,0,1,"","args"],[98,0,1,"","kwargs"],[98,0,1,"","params"]],"pytorch_lightning.loggers.MLFlowLogger.log_metrics.params":[[98,0,1,"","metrics"],[98,0,1,"","step"]],"pytorch_lightning.loggers.MLFlowLogger.params":[[102,0,1,"","artifact_location"],[102,0,1,"","experiment_name"],[102,0,1,"","prefix"],[102,0,1,"","run_id"],[102,0,1,"","run_name"],[102,0,1,"","save_dir"],[102,0,1,"","tags"],[102,0,1,"","tracking_uri"]],"pytorch_lightning.loggers.NeptuneLogger":[[99,3,1,"","after_save_checkpoint"],[99,2,1,"","experiment"],[99,3,1,"","finalize"],[99,3,1,"","log_hyp
erparams"],[99,3,1,"","log_metrics"],[99,2,1,"","name"],[99,2,1,"","save_dir"],[99,2,1,"","version"]],"pytorch_lightning.loggers.NeptuneLogger.after_save_checkpoint.params":[[99,0,1,"","checkpoint_callback"]],"pytorch_lightning.loggers.NeptuneLogger.finalize.params":[[99,0,1,"","status"]],"pytorch_lightning.loggers.NeptuneLogger.log_hyperparams.params":[[99,0,1,"","params"]],"pytorch_lightning.loggers.NeptuneLogger.log_metrics.params":[[99,0,1,"","metrics"],[99,0,1,"","step"]],"pytorch_lightning.loggers.NeptuneLogger.params":[[102,0,1,"","**neptune_run_kwargs"],[102,0,1,"","api_key"],[102,0,1,"","log_model_checkpoints"],[102,0,1,"","name"],[102,0,1,"","prefix"],[102,0,1,"","project"],[102,0,1,"","run"]],"pytorch_lightning.loggers.TensorBoardLogger":[[100,2,1,"","experiment"],[100,3,1,"","finalize"],[100,2,1,"","log_dir"],[100,3,1,"","log_graph"],[100,3,1,"","log_hyperparams"],[100,3,1,"","log_metrics"],[100,2,1,"","name"],[100,2,1,"","root_dir"],[100,3,1,"","save"],[100,2,1,"","save_dir"],[100,2,1,"","sub_dir"],[100,2,1,"","version"]],"pytorch_lightning.loggers.TensorBoardLogger.finalize.params":[[100,0,1,"","status"]],"pytorch_lightning.loggers.TensorBoardLogger.log_graph.params":[[100,0,1,"","input_array"],[100,0,1,"","model"]],"pytorch_lightning.loggers.TensorBoardLogger.log_hyperparams.params":[[100,0,1,"","metrics"],[100,0,1,"","params"]],"pytorch_lightning.loggers.TensorBoardLogger.log_metrics.params":[[100,0,1,"","metrics"],[100,0,1,"","step"]],"pytorch_lightning.loggers.TensorBoardLogger.params":[[102,0,1,"","**kwargs"],[102,0,1,"","default_hp_metric"],[102,0,1,"","log_graph"],[102,0,1,"","name"],[102,0,1,"","prefix"],[102,0,1,"","save_dir"],[102,0,1,"","sub_dir"],[102,0,1,"","version"]],"pytorch_lightning.loggers.WandbLogger":[[101,3,1,"","after_save_checkpoint"],[101,2,1,"","experiment"],[101,3,1,"","finalize"],[101,3,1,"","log_hyperparams"],[101,3,1,"","log_image"],[101,3,1,"","log_metrics"],[101,3,1,"","log_table"],[101,3,1,"","log_text"],[101,2,1,"","na
me"],[101,2,1,"","save_dir"],[101,2,1,"","version"]],"pytorch_lightning.loggers.WandbLogger.after_save_checkpoint.params":[[101,0,1,"","checkpoint_callback"]],"pytorch_lightning.loggers.WandbLogger.finalize.params":[[101,0,1,"","status"]],"pytorch_lightning.loggers.WandbLogger.log_hyperparams.params":[[101,0,1,"","args"],[101,0,1,"","kwargs"],[101,0,1,"","params"]],"pytorch_lightning.loggers.WandbLogger.log_metrics.params":[[101,0,1,"","metrics"],[101,0,1,"","step"]],"pytorch_lightning.loggers.WandbLogger.params":[[102,0,1,"","**kwargs"],[102,0,1,"","anonymous"],[102,0,1,"","experiment"],[102,0,1,"","id"],[102,0,1,"","log_model"],[102,0,1,"","name"],[102,0,1,"","offline"],[102,0,1,"","prefix"],[102,0,1,"","project"],[102,0,1,"","save_dir"],[102,0,1,"","version"]],"pytorch_lightning.plugins.environments.SLURMEnvironment.params":[[105,0,1,"","auto_requeue"]],"pytorch_lightning.plugins.precision.HPUPrecisionPlugin.params":[[105,0,1,"","bf16_file_path"],[105,0,1,"","fp32_file_path"],[105,0,1,"","opt_level"],[105,0,1,"","precision"],[105,0,1,"","verbose"]],"pytorch_lightning.plugins.precision.NativeMixedPrecisionPlugin.params":[[105,0,1,"","device"],[105,0,1,"","precision"],[105,0,1,"","scaler"]],"pytorch_lightning.strategies.BaguaStrategy.params":[[106,0,1,"","algorithm"],[106,0,1,"","bagua_kwargs"],[106,0,1,"","flatten"]],"pytorch_lightning.strategies.DDPFullyShardedStrategy.params":[[106,0,1,"","bucket_cap_mb"],[106,0,1,"","compute_dtype"],[106,0,1,"","cpu_offload"],[106,0,1,"","flatten_parameters"],[106,0,1,"","fp32_reduce_scatter"],[106,0,1,"","min_num_params"],[106,0,1,"","move_grads_to_cpu"],[106,0,1,"","reshard_after_forward"],[106,0,1,"","state_dict_to_cpu"]],"pytorch_lightning.strategies.DeepSpeedStrategy.params":[[106,0,1,"","allgather_bucket_size"],[106,0,1,"","allgather_partitions"],[106,0,1,"","block_size"],[106,0,1,"","config"],[106,0,1,"","contiguous_gradients"],[106,0,1,"","contiguous_memory_optimization"],[106,0,1,"","cpu_checkpointing"],[106,0,1,"","hy
steresis"],[106,0,1,"","initial_scale_power"],[106,0,1,"","load_full_weights"],[106,0,1,"","logging_batch_size_per_gpu"],[106,0,1,"","logging_level"],[106,0,1,"","loss_scale"],[106,0,1,"","loss_scale_window"],[106,0,1,"","max_in_cpu"],[106,0,1,"","min_loss_scale"],[106,0,1,"","nvme_path"],[106,0,1,"","offload_optimizer"],[106,0,1,"","offload_optimizer_device"],[106,0,1,"","offload_parameters"],[106,0,1,"","offload_params_device"],[106,0,1,"","optimizer_buffer_count"],[106,0,1,"","overlap_comm"],[106,0,1,"","overlap_events"],[106,0,1,"","params_buffer_count"],[106,0,1,"","params_buffer_size"],[106,0,1,"","partition_activations"],[106,0,1,"","pin_memory"],[106,0,1,"","queue_depth"],[106,0,1,"","reduce_bucket_size"],[106,0,1,"","reduce_scatter"],[106,0,1,"","remote_device"],[106,0,1,"","single_submit"],[106,0,1,"","stage"],[106,0,1,"","sub_group_size"],[106,0,1,"","synchronize_checkpoint_boundary"],[106,0,1,"","thread_count"],[106,0,1,"","zero_allow_untested_optimizer"],[106,0,1,"","zero_optimization"]],"pytorch_lightning.strategies.IPUStrategy.params":[[106,0,1,"","autoreport"],[106,0,1,"","autoreport_dir"],[106,0,1,"","device_iterations"],[106,0,1,"","inference_opts"],[106,0,1,"","training_opts"]],"pytorch_lightning.trainer.Trainer.fit.params":[[72,0,1,"","ckpt_path"],[72,0,1,"","datamodule"],[72,0,1,"","model"],[72,0,1,"","train_dataloaders"],[72,0,1,"","val_dataloaders"]],"pytorch_lightning.trainer.Trainer.params":[[72,0,1,"","accelerator"],[72,0,1,"","accumulate_grad_batches"],[72,0,1,"","amp_backend"],[72,0,1,"","amp_level"],[72,0,1,"","auto_lr_find"],[72,0,1,"","auto_scale_batch_size"],[72,0,1,"","auto_select_gpus"],[72,0,1,"","benchmark"],[72,0,1,"","callbacks"],[72,0,1,"","check_val_every_n_epoch"],[72,0,1,"","checkpoint_callback"],[72,0,1,"","default_root_dir"],[72,0,1,"","detect_anomaly"],[72,0,1,"","deterministic"],[72,0,1,"","devices"],[72,0,1,"","enable_checkpointing"],[72,0,1,"","enable_model_summary"],[72,0,1,"","enable_progress_bar"],[72,0,1,"","fast_d
ev_run"],[72,0,1,"","flush_logs_every_n_steps"],[72,0,1,"","gpus"],[72,0,1,"","gradient_clip_algorithm"],[72,0,1,"","gradient_clip_val"],[72,0,1,"","ipus"],[72,0,1,"","limit_predict_batches"],[72,0,1,"","limit_test_batches"],[72,0,1,"","limit_train_batches"],[72,0,1,"","limit_val_batches"],[72,0,1,"","log_every_n_steps"],[72,0,1,"","log_gpu_memory"],[72,0,1,"","logger"],[72,0,1,"","max_epochs"],[72,0,1,"","max_steps"],[72,0,1,"","max_time"],[72,0,1,"","min_epochs"],[72,0,1,"","min_steps"],[72,0,1,"","move_metrics_to_cpu"],[72,0,1,"","multiple_trainloader_mode"],[72,0,1,"","num_nodes"],[72,0,1,"","num_processes"],[72,0,1,"","num_sanity_val_steps"],[72,0,1,"","overfit_batches"],[72,0,1,"","plugins"],[72,0,1,"","precision"],[72,0,1,"","prepare_data_per_node"],[72,0,1,"","process_position"],[72,0,1,"","profiler"],[72,0,1,"","progress_bar_refresh_rate"],[72,0,1,"","reload_dataloaders_every_n_epochs"],[72,0,1,"","replace_sampler_ddp"],[72,0,1,"","resume_from_checkpoint"],[72,0,1,"","stochastic_weight_avg"],[72,0,1,"","strategy"],[72,0,1,"","sync_batchnorm"],[72,0,1,"","terminate_on_nan"],[72,0,1,"","tpu_cores"],[72,0,1,"","track_grad_norm"],[72,0,1,"","val_check_interval"],[72,0,1,"","weights_save_path"],[72,0,1,"","weights_summary"]],"pytorch_lightning.trainer.Trainer.predict.params":[[72,0,1,"","ckpt_path"],[72,0,1,"","dataloaders"],[72,0,1,"","datamodule"],[72,0,1,"","model"],[72,0,1,"","return_predictions"]],"pytorch_lightning.trainer.Trainer.test.params":[[72,0,1,"","ckpt_path"],[72,0,1,"","dataloaders"],[72,0,1,"","datamodule"],[72,0,1,"","model"],[72,0,1,"","verbose"]],"pytorch_lightning.trainer.Trainer.tune.params":[[72,0,1,"","datamodule"],[72,0,1,"","lr_find_kwargs"],[72,0,1,"","model"],[72,0,1,"","scale_batch_size_kwargs"],[72,0,1,"","train_dataloaders"],[72,0,1,"","val_dataloaders"]],"pytorch_lightning.trainer.Trainer.validate.params":[[72,0,1,"","ckpt_path"],[72,0,1,"","dataloaders"],[72,0,1,"","datamodule"],[72,0,1,"","model"],[72,0,1,"","verbose"]]},objname
s:{"0":["py","parameter","Python parameter"],"1":["py","class","Python class"],"2":["py","property","Python property"],"3":["py","method","Python method"]},objtypes:{"0":"py:parameter","1":"py:class","2":"py:property","3":"py:method"},terms:{"0":[0,3,6,11,16,17,18,19,20,22,23,24,26,27,28,31,32,36,38,39,43,48,55,58,60,62,64,65,72,74,76,77,78,80,81,82,84,85,88,93,94,99,102,103,104,107,108,139,140,142,144,145,147,148,149,152,154,155,157,160,161],"00":[36,49,58,72,108,152],"000":152,"0001":[28,152],"00014637":152,"00024388":152,"00028":64,"000u":154,"001":[26,36,140,148],"0010246":152,"0017477":152,"001ms110":[16,17],"001ms228":[16,17],"001ms32":[16,17],"001ms339":[16,17],"001ms434":[16,17],"001ms61":[16,17],"001ms79":[16,17],"001u":[16,17,154],"0022506":152,"002ms921":[16,17],"008":152,"01":[20,27,28,31,32,48,64,72,77,78,140,148],"010":152,"011":152,"012":152,"012234":152,"015754":152,"01f":159,"02":[26,27,31,36,55,64],"020":152,"022":152,"02d":55,"03":[31,154],"03977392":48,"044m":154,"04835479":48,"05":[6,154],"05200016":48,"055m":154,"059u":154,"06":[24,152,154],"060u":154,"062u":[16,17],"063u":[16,17],"06m09s401ms746":[16,17],"07":99,"074":152,"08":49,"084":152,"0b1":84,"0x2b599e088ae8":0,"1":[1,2,5,6,9,11,15,18,20,22,23,25,31,32,33,36,39,41,42,43,48,55,56,58,60,61,62,64,65,69,72,73,77,78,80,81,82,83,84,91,93,94,99,101,102,103,104,107,108,109,110,111,123,127,129,130,135,136,138,139,140,141,142,144,146,148,152,153,154,155,157,158,160,161],"10":[5,11,15,16,17,20,23,26,27,31,36,39,43,48,49,53,55,58,63,64,69,70,72,77,78,89,91,99,102,108,128,140,141,145,147,148,152,154,157],"100":[6,19,23,26,27,31,72,96,101,107,108,147,159],"1000":[72,108],"100m":[6,19],"101":109,"105u":154,"10th":[33,41,135],"11":[19,49,84,91,128,154],"113":88,"12":[27,28,36,49,63,72,91,108,128,140,148,154],"1234":[140,148],"125":[16,17],"128":[19,22,53,63,64,84,145],"128x128":[16,17],"13":[91,128,152,154],"1307":74,"131":77,"132":77,"135u":154,"14":[64,91,128,154],"148":84,"15":[19,48,88,91,107,110,15
4],"1558":152,"15\ubd84":109,"15e":152,"16":[9,12,19,20,36,39,43,48,49,53,61,64,68,69,84,85,91,105,107,110,140,141,147,148,154],"167":152,"16\ube44\ud2b8":147,"17":[91,110],"1704":64,"173u":[16,17],"175u":154,"18":[16,17,86,91,110,152,154],"182":152,"183u":[16,17],"187":[16,17],"1875":152,"1876":[84,152],"19":[49,91,110],"192":84,"1e":[19,22,36,48,63,64,65,139,142,144,145,147,149],"1tb":[19,141,147],"2":[0,3,4,11,12,16,17,20,21,22,25,26,28,31,33,36,39,47,48,49,55,61,63,64,65,69,72,76,77,78,83,84,91,92,93,94,103,107,108,111,123,127,129,130,135,136,138,139,140,142,148,149,152,154,155,157,160,161],"20":[11,16,17,19,26,49,60,72,77,91,110,139,141,147,152,154],"200":[16,17],"2019":[140,148],"202":[16,17],"2022":47,"2048":[16,17,72],"205":[16,17],"206":[16,17,152],"209":[16,17],"20\uac1c":147,"21":[88,91,110,154],"2158432006835938":85,"21s102ms853":[16,17],"22":[91,110,154],"22050hz":84,"226e":152,"228u":154,"23":[91,124,154],"236u":[16,17],"24":[6,28,29,63,84,91,124],"25":[20,22,64,72,84,91,108,124],"2541470527648926":85,"256":[77,84,88,140,148],"26":[91,124],"260":152,"267":152,"27":[91,124,154,160],"273":[16,17],"28":[56,63,64,77,144,145,147,154,155,158,160,161],"283u":[16,17],"290":152,"29500":39,"2e8":19,"2f":55,"2vm":[16,17],"3":[0,3,4,6,11,16,17,21,22,23,25,33,36,48,52,55,58,61,64,65,71,72,84,91,99,103,106,123,127,129,135,136,138,139,140,142,144,146,148,149,154,155,157,158,160,161],"30":[19,31,48,64],"305u":[16,17],"3081":74,"3090":69,"32":[6,9,11,13,15,16,17,18,19,22,31,36,38,48,53,55,56,64,69,72,74,77,93,94,105,107,108,140,148,154,155,157,158,160,161],"33":154,"3300":84,"336u":154,"34":154,"344":152,"35":154,"350":84,"351u":154,"353u":154,"362u":154,"3752":152,"38":154,"383":152,"387u":154,"39":[16,17],"393u":154,"3d":86,"3e":19,"3x":[6,67,72,108],"4":[3,4,5,6,11,12,19,21,22,27,28,33,36,38,43,48,49,55,62,63,64,65,69,72,80,81,84,91,103,106,107,108,109,123,127,135,140,141,148,154],"40":58,"400":84,"403e":152,"40\uc885\ub958":147,"40b":19,"41":154,"42":[16,17,60,72,1
52,154],"425201":[16,17],"426e":152,"432u":154,"44":[152,154],"45":[19,154],"456u":154,"461u":154,"464u":154,"47":0,"481u":154,"484u":154,"4863767":152,"4869394":152,"492u":154,"4\uac1c\uc758":147,"5":[0,11,16,17,19,20,22,27,28,29,33,43,48,64,65,72,74,77,78,84,89,91,93,103,104,107,108,123,139,141,142,146,152,154],"50":[16,17,20,26,43,48,72,102,157],"500":[64,65,101,157],"5000":[19,74],"500m":19,"51011":[16,17,18],"512":[19,77,103],"516e":152,"517u":154,"52":49,"523u":154,"526u":154,"543":154,"549":154,"55000":74,"566u":154,"58":154,"5\ub2e8\uacc4\uc758":147,"5e8":19,"5th":[16,17,22,62,65],"5x":19,"6":[0,16,17,64,69,72,91,93,107,123,152,154],"60":[0,48,89,154],"60000":152,"6006":[84,147],"62":154,"6206e0":70,"63":19,"638u":154,"64":[20,36,48,49,63,64,72,74,80,81,82,83,84,99,105,107,140,144,147,148,154],"644e":152,"65038344_52a45d090d":103,"651":152,"657u":154,"669u":154,"67108864":84,"68":[152,154],"681m":154,"69":154,"694u":154,"6gb":19,"7":[5,22,36,48,62,64,65,72,74,77,80,88,91,93,108,128,140,146,148,152,154],"721":152,"734":152,"74":154,"743u":154,"75":20,"756u":154,"759":152,"76":152,"768":84,"77":154,"773u":[16,17],"778ms572":[16,17],"778u":[16,17],"782u":154,"783u":154,"786u":154,"7\ub2e8\uacc4\ub97c":[109,147],"7gb":19,"7th":108,"7x":19,"8":[4,5,6,8,11,12,13,15,16,17,18,19,21,22,29,36,38,43,48,60,62,64,65,72,82,91,93,106,107,108,128,140,148],"80":[16,17,33,48,135,152],"80m":19,"81":154,"839":152,"8470":[16,17],"85":48,"859u":154,"869":152,"877":152,"887":152,"8888":84,"893":152,"8g":84,"9":[16,17,19,36,48,91,99,128],"90":[16,17,36,48,103,154],"9001":151,"93":152,"95":[16,17,48],"961u":154,"967u":154,"97":99,"973u":[16,17],"99":[16,17,20,55,64],"998":19,"999":19,"9th":[22,62,65],"\uac00\ub2a5\ud55c":147,"\uac00\ub2a5\ud574\uc9d1\ub2c8\ub2e4":147,"\uac00\ub3c5\uc131":147,"\uac00\ub3c5\uc131\uacfc":149,"\uac00\ub3c5\uc131\uc744":147,"\uac00\uc774\ub4dc\uc758":149,"\uac00\uc911\uce58\ub97c":147,"\uac00\uc9dc":147,"\uac04\ub2e8\ud55c":147,"\uac15\ud654\ud559\uc2b5"
:147,"\uac16\ub294":147,"\uac16\ucd94\uace0":147,"\uac1c\uc120\ud558\ub294":149,"\uac1d\uccb4":147,"\uac80\uc99d":147,"\uac83\ub4e4\uc774":147,"\uac83\uc785\ub2c8\ub2e4":[147,149],"\uacbd\uc0ac\ub3c4":147,"\uacbd\uc6b0":147,"\uace0\uae09":147,"\uacfc":147,"\uad00\uc2ec\uc788\ub294":149,"\uad00\uc5ec\ud569\ub2c8\ub2e4":147,"\uad6c\uc131\ub418\ub3c4\ub85d":149,"\uad6c\ud604\ud569\ub2c8\ub2e4":147,"\uad8c\uc7a5\ud558\ub294\ub370":149,"\uadf8\ub300\ub85c":147,"\uadf8\ub8f9\uc73c\ub85c":147,"\uae30\ub2a5\uc744":147,"\uae30\ubc95\ub4e4":147,"\uae30\uc220\uc744":147,"\uae30\uc220\uc785\ub2c8\ub2e4":147,"\uae30\uc874":147,"\ub04c":147,"\ub098\ub204\uc5b4":147,"\ub098\uc740":147,"\ub0b4\ubcf4\ub0b4\uae30":147,"\ub0b4\uc5d0\uc11c":147,"\ub0b4\uc6a9\ub4e4":147,"\ub294":147,"\ub2e4\ub978":147,"\ub2e4\uc591\ud55c":147,"\ub2e4\uc911":147,"\ub2e8\uacc4\ub294":147,"\ub2e8\uacc4\ub85c":147,"\ub2e8\uacc4\ub97c":147,"\ub2e8\uacc4\uc5d0\uc11c":147,"\ub2e8\uc21c\ud788":147,"\ub300\uaddc\ubaa8\ub85c":147,"\ub300\uaddc\ubaa8\uc5d0\uc11c":109,"\ub354":147,"\ub370\uc774\ud130\ub97c":147,"\ub370\uc774\ud130\uc14b\uc744":147,"\ub3c4":147,"\ub3c4\uad6c":147,"\ub3c4\uc6c0\uc774":147,"\ub3c4\uc911":147,"\ub3d9\uc2dc\uc5d0":147,"\ub3d9\uc548":109,"\ub3d9\uc791\ud560":147,"\ub418\ub294":147,"\ub4a4\uc5d0\ub294":147,"\ub4f1":147,"\ub4f1\uc744":147,"\ub525\ub7ec\ub2dd":[109,147],"\ub530\ub77c":147,"\ub610\ub294":[109,147],"\ub77c\uc774\ud2b8":147,"\ub77c\uc774\ud2b8\ub2dd":[109,147,149],"\ub97c":147,"\ub9cc\uc5d0":109,"\ub9ce\uc740":147,"\ub9e4\uac1c\ubcc0\uc218\ub97c":147,"\uba38\uc2e0\ub7ec\ub2dd":[109,147],"\uba54\uc18c\ub4dc":147,"\uba54\ud0c0\ud559\uc2b5":147,"\uba85\ub839\uc904":147,"\ubaa8\ub378\uc744":147,"\ubaa8\ub4e0":147,"\ubaa9\ud45c":147,"\ubaa9\ud45c\ub294":149,"\ubb36\uc5b4\uc11c":147,"\ubb38\uc11c":109,"\ubb38\uc11c\uc5d0\uc11c\ub294":147,"\ubc0f":147,"\ubc18\ubcf5\ub418\ub294":147,"\ubc18\ubcf5\uc5d0":147,"\ubc18\ubcf5\uc744":147,"\ubc18\ubcf5\uc801\uc73c\ub85c":147,"\ubc1c\uacac\ud
558\uace0":149,"\ubc1c\uc804\ud569\ub2c8\ub2e4":109,"\ubc29\uc2dd\uc73c\ub85c":147,"\ubc30\uacbd\uc9c0\uc2dd":147,"\ubc30\uc6c1\ub2c8\ub2e4":109,"\ubc30\uc6cc\ubcf4\uae30":109,"\ubc30\uce58":147,"\ubc30\ud130\ub9ac\uac00":147,"\ubcc0\uacbd":147,"\ubcc0\uacbd\ud558\uc9c0":147,"\ubcf5\uc7a1\ub3c4\uc5d0":147,"\ubcf5\uc7a1\uc131\ub4e4\uc744":147,"\ubcf5\uc7a1\ud55c":147,"\ubd10\uc57c\ud560\uc9c0":149,"\ubd80\ubd84\ub3c4":147,"\ubd80\ubd84\uc744":149,"\ubd84\ub9ac\ud558\uc5ec":147,"\ubd88\ub7ec\uc624\uace0":147,"\ubd88\ub7ec\uc624\uae30":147,"\ubd88\ub7ec\uc635\ub2c8\ub2e4":147,"\ube0c\ub77c\uc6b0\uc800\uc5d0\uc11c":147,"\ube44\ud65c\uc131\ud654\ub97c":147,"\ube60\ub978":147,"\ubfd0\ub9cc":147,"\uc0ac\ub840\uc5d0":147,"\uc0ac\uc6a9":147,"\uc0ac\uc6a9\uc790\uac00":147,"\uc0ac\uc6a9\uc790\ub77c\uba74":147,"\uc0ac\uc6a9\ud558\ub294":147,"\uc0ac\uc6a9\ud558\uc5ec":147,"\uc0ac\uc6a9\ud560":147,"\uc0ac\uc6a9\ud569\ub2c8\ub2e4":147,"\uc0b4\ud3b4\ubcf4\uc138\uc694":147,"\uc0bd\uc785\ud560":147,"\uc0c1\uc0c1\ud574\ubcf4\uc138\uc694":149,"\uc0c1\uc6a9":147,"\uc0dd\uac01\uc73c\ub85c\ubd80\ud130":109,"\uc120\ud0dd\ud569\ub2c8\ub2e4":147,"\uc124\uc815\ud569\ub2c8\ub2e4":147,"\uc131\ub2a5\uc744":[109,147],"\uc190\uc27d\uac8c":147,"\uc218":147,"\uc21c\ud68c":147,"\uc228\uae30\uc9c0":147,"\uc2dc":147,"\uc2dc\uac01\ud654\ud558\ub294\ub370":147,"\uc2e4\ud589\ud558\uace0":147,"\uc2e4\ud589\ud560":147,"\uc2e4\ud5d8\uc744":147,"\uc544\ub2c8\ub77c":147,"\uc544\ub798":147,"\uc544\ub798\ub97c":147,"\uc544\uc774\ub514\uc5b4":147,"\uc544\uc774\ub514\uc5b4\ub97c":147,"\uc548\ub0b4\ud569\ub2c8\ub2e4":147,"\uc54a\uc73c\uba74\uc11c":[109,147],"\uc54c\uace0":149,"\uc5b4\ub514\ub97c":149,"\uc5b4\ub514\uc5d0\ub4e0":147,"\uc5b4\ub5a0\ud55c":147,"\uc5b8\uc81c\ub098":147,"\uc5c6\uc74c":147,"\uc5c6\uc774":147,"\uc5d0":147,"\uc5d0\uc11c":147,"\uc5d0\ud3ed":147,"\uc5d4\uc9c0\ub2c8\uc5b4\ub4e4\uc744":[109,147],"\uc5d4\uc9c0\ub2c8\uc5b4\ub9c1":147,"\uc5d4\uc9c0\ub2c8\uc5b4\ub9c1\uc801":147,"\uc5ec\ub7ec\uac1c\u
c758":147,"\uc5ec\ub7ec\uc904\uc758":147,"\uc5f0\uad6c":[147,149],"\uc5f0\uad6c\uc6a9":147,"\uc5f0\uad6c\uc790\ub4e4\uacfc":[109,147],"\uc5f4\uc5b4\ubcf4\uc138\uc694":147,"\uc608\uc2dc\ub4e4\uc744":147,"\uc608\uce21":147,"\uc608\uce21\uc6a9\uc73c\ub85c":147,"\uc608\uce21\uc744":147,"\uc624\ud1a0\uc778\ucf54\ub354":147,"\uc635\uc158":147,"\uc644\ub8cc":147,"\uc644\ub8cc\ud558\uc5ec":147,"\uc644\ubcbd\ud788":147,"\uc644\uc804\ud55c":147,"\uc644\uc804\ud788":147,"\uc694\uad6c\ud558\uba74\uc11c":147,"\uc6cc\ud06c\ud50c\ub85c\uc6b0\uc758":[109,147],"\uc6d0\uce59\uc740":147,"\uc6d0\ud558\ub294\ub9cc\ud07c\uc758":147,"\uc704\ud55c":[109,147],"\uc704\ud574":[147,149],"\uc720\uc0ac\ud558\uac8c":149,"\uc720\uc0ac\ud55c":147,"\uc720\uc5f0\uc131\uc744":[109,147],"\uc720\uc6a9\ud55c":147,"\uc720\ud615\uc758":147,"\uc740":[109,147],"\uc744":[147,149],"\uc758":[147,149],"\uc774":[147,149],"\uc774\uad00\ud558\uae30":147,"\uc774\ub294":147,"\uc774\ub7f0":147,"\uc774\ub974\ub294":109,"\uc774\ubbf8":147,"\uc774\ubbf8\uc9c0\ub85c":147,"\uc774\uc0c1\uc758":147,"\uc778\uc790":147,"\uc778\uc790\ub4e4\uc744":147,"\uc77c\ubc18\uc801\uc778":[109,147],"\uc77c\ubd80\ub97c":147,"\uc788\ub294":147,"\uc788\ub2e4\uace0":149,"\uc788\ub3c4\ub85d":147,"\uc788\uc2b5\ub2c8\ub2e4":[147,149],"\uc788\uc73c\uba70":147,"\uc790\ub3d9\uc73c\ub85c":147,"\uc790\ub3d9\ud654\ub41c":147,"\uc790\ub3d9\ud654\ud569\ub2c8\ub2e4":147,"\uc791\uc5c5\ub4e4\uc744":147,"\uc7ac\uad6c\uc131\ud568\uc73c\ub85c\uc368":147,"\uc7ac\uad6c\uc131\ud569\ub2c8\ub2e4":147,"\uc7ac\ud604\uc131":147,"\uc7ac\ud604\uc131\uc744":[147,149],"\uc800\uc7a5\uc18c\ub098":149,"\uc800\uc7a5\ud558\uae30":147,"\uc804\ubb38\uac00\ub4e4\uc774":147,"\uc804\ubb38\uc801\uc778":[109,147],"\uc815\ubc00\ub3c4":147,"\uc815\uc758":147,"\uc815\uc758\ud569\ub2c8\ub2e4":147,"\uc815\ud655\ud788":149,"\uc81c\uac70\ud558\uace0":147,"\uc81c\uacf5\ud558\ub294":147,"\uc81c\uacf5\ud569\ub2c8\ub2e4":147,"\uc81c\uc5b4\ud560":147,"\uc81c\uc5b4\ud569\ub2c8\ub2e4":147,"\uc81c\
ud488\ud654\uc5d0":109,"\uc8fc\uc694\ud55c":[109,147,149],"\uc911":147,"\uc9c0\uc6d0":147,"\uc9c1\uc811":147,"\ucc38\uace0\ud558\uc138\uc694":147,"\ucc38\uc870":147,"\ucc38\uc870\ud558\uc138\uc694":[109,147],"\ucc3e\uae30":149,"\uccb4\ud06c\ud3ec\uc778\ud2b8":147,"\ucd08\uae30\ud654\ud569\ub2c8\ub2e4":147,"\ucd5c\ub300\ud55c\uc758":[109,147],"\ucd5c\uc2e0":147,"\ucd5c\uc801\ud654":147,"\ucd5c\ucca8\ub2e8":147,"\ucd94\uac00\uc801\uc778":147,"\ucd94\uc0c1\ud654":147,"\ucf1c\uac70\ub098":147,"\ucf54\ub4dc":147,"\ucf54\ub4dc\uac00":[147,149],"\ucf54\ub4dc\ub4e4\uc744":147,"\ucf54\ub4dc\ub97c":147,"\ucf54\ub4dc\uc640":147,"\ucf5c\ubc31":147,"\ud14c\uc2a4\ud2b8":147,"\ud14c\uc2a4\ud2b8\ub97c":147,"\ud150\uc11c\ubcf4\ub4dc":147,"\ud1b5\ud569\ud560":147,"\ud2b9\uc815":147,"\ud30c\uc774\ud1a0\uce58":[109,147,149],"\ud3c9\uac00":147,"\ud3ec\uae30\ud558\uc9c0":109,"\ud3ec\ud568\ub418\uc5b4":147,"\ud3ec\ud568\ub41c":147,"\ud3ec\ud568\ud558\uac70\ub098":147,"\ud3ec\ud568\ud558\uc5ec":147,"\ud504\ub808\uc784\uc6cc\ud06c\uc785\ub2c8\ub2e4":[109,147],"\ud504\ub85c\uc81d\ud2b8\uac00":109,"\ud504\ub85c\uc81d\ud2b8\ub97c":147,"\ud504\ub85c\uc81d\ud2b8\uc5d0\uc11c":149,"\ud504\ub85c\uc81d\ud2b8\uc758":147,"\ud50c\ub798\uadf8":147,"\ud544\uc694\ub85c":[109,147],"\ud544\uc694\uc5c6\uc2b5\ub2c8\ub2e4":147,"\ud544\uc694\ud55c":147,"\ud558\ub098\ub97c":147,"\ud558\ub098\uc785\ub2c8\ub2e4":147,"\ud558\ub294":[109,147],"\ud558\uc5ec":147,"\ud559\uc2b5\ud55c":147,"\ud559\uc2b5\ud560":147,"\ud559\uc2b5\ud569\ub2c8\ub2e4":147,"\ud560":147,"\ud568\uaed8":[109,147],"\ud569\ub2c8\ub2e4":147,"\ud574\ub2f9\ud558\ub294":147,"\ud575\uc2ec":147,"\ud638\ucd9c":147,"\ud655\ubcf4\ud558\ub3c4\ub85d":147,"\ud655\uc7a5\uc131":147,"\ud655\uc7a5\uc5d0":147,"\ud658\uacbd\uc5d0":147,"\ud65c\uc131\ud654":147,"\ud6c8\ub828":147,"\ud78c\ud2b8":147,"abstract":[64,72,90,103,105,144,147],"boolean":104,"break":87,"byte":84,"case":[0,6,16,17,19,20,22,23,26,27,28,29,31,43,48,53,54,55,56,58,61,63,64,65,67,69,72,74,84,89,99
,101,102,103,107,108],"catch":72,"class":[0,4,5,6,8,11,15,19,20,21,22,23,30,31,32,37,43,52,53,54,55,56,58,60,61,63,64,65,68,69,70,74,76,77,78,80,81,82,83,84,85,89,92,93,94,95,96,97,98,99,100,101,102,103,104,106,107,108,109,139,140,142,144,145,147,148,149,153,155,157,158,159,160,161],"default":[3,4,6,8,9,11,13,18,19,22,30,31,36,52,55,58,62,63,64,65,67,69,70,71,72,78,84,90,93,94,96,97,98,99,100,101,104,105,106,107,108,140,145,147,148,149,151,154,158],"do":[0,3,6,8,11,12,15,18,19,22,28,36,38,47,53,54,56,58,60,62,63,64,65,69,70,72,82,84,85,93,94,96,97,98,99,100,101,103,107,108,109,139,140,142,148,149,157],"export":[16,17,18,19,27,36,64,80,81,147],"final":[22,39,62,63,65,92,96,97,98,99,100,101,102,103,140,148,157],"float":[20,27,31,36,61,64,65,66,67,69,72,96,97,98,99,100,101,105,107,108,130,140,148,149,157],"fsdp\ub97c":147,"function":[0,11,12,19,20,22,28,29,39,54,55,63,64,65,69,72,77,80,91,93,94,102,103,104,108,124,125,126,139,140,141,142,144,145,147,148,153,154,155,157,158,160,161],"gan\uc744":147,"gpu\uc5d0\uc11c":147,"import":[0,4,5,6,9,11,13,15,16,17,18,19,20,21,22,23,28,29,31,32,36,37,38,43,54,55,57,58,60,62,63,64,65,70,71,72,74,76,77,80,83,84,85,88,89,92,93,96,97,98,99,100,101,102,103,106,107,108,139,140,142,145,147,148,149,151,152,153,154,155,157,159,160,161],"int":[3,27,29,31,37,43,60,63,64,72,74,92,96,97,98,99,100,101,102,107,108,140,148,153],"lightning\uc5d0\ub294":147,"lightning\uc5d0\uc11c\ub294":147,"lightning\uc740":147,"lightning\uc758":[147,149],"lightningmodule\uc5d0\uc11c":147,"lightningmodule\uc744":147,"long":[23,30,41,85,107,108,152],"module\uc744":147,"module\uc774":147,"new":[0,1,4,6,11,16,17,18,21,49,64,66,68,70,72,74,84,85,89,91,92,97,98,99,100,101,106,108,124,144,156,159],"null":[26,84],"public":[33,93,103],"pytorch\ub97c":147,"pytorch\uc758":147,"return":[0,4,5,6,11,12,15,18,19,20,21,22,23,28,31,32,37,43,56,58,61,63,64,65,69,70,72,74,80,81,82,83,84,85,92,93,94,95,96,97,98,99,100,101,102,103,104,139,140,142,144,145,147,148,149,153,157,159],"sho
rt":[19,22,30],"super":[11,15,19,20,22,23,28,29,31,32,53,56,63,64,65,70,74,80,81,82,83,93,102,107,108,139,140,142,144,145,147,148,149,153,157,159,160],"switch":[16,17,20,64,65,69,76,84,92,108,139,140,142,148],"throw":[15,107],"torchscript\ub85c":147,"trainer\uc5d0":147,"trainer\uc758":147,"true":[0,3,4,18,19,20,21,22,23,26,27,28,31,36,37,54,55,60,61,64,65,70,72,74,77,78,80,84,89,93,94,99,100,101,102,103,107,108,139,142,144,147,149,154,157,158,159],"try":[5,16,17,19,22,28,29,36,37,38,39,48,64,69,72,78,149,151],"validation_step\uc774\ub098":147,"var":[27,63],"while":[8,16,17,18,20,22,30,43,61,64,65,69,72,74,102,103,140,148,151],A:[3,5,16,17,19,22,26,28,29,30,32,38,48,49,53,61,64,65,72,74,77,78,85,89,93,94,96,97,98,100,101,103,104,107,108,149],AND:[0,64],And:[16,17,23,56,64,82,84],As:[18,19,22,29,31,32,41,45,46,55,60,65,105],At:[16,17,64],BE:36,Be:[12,65,139,142],But:[19,53,64,74,103],By:[6,9,11,13,16,17,18,19,22,55,63,64,69,72,82,96,100,102,103,105,140,148,157,158],For:[2,3,4,6,8,9,11,15,16,17,19,20,22,26,27,28,29,30,31,39,43,45,46,49,53,55,56,57,62,64,65,67,69,70,72,74,77,82,83,84,87,88,93,97,99,102,103,104,107,108,139,140,142,145,148,149,157,158],IS:[0,63,64],If:[5,6,11,12,15,18,19,22,28,29,30,32,36,41,43,44,45,46,47,49,53,55,58,61,63,64,65,67,70,74,77,78,81,83,92,93,94,95,96,97,98,99,100,101,102,103,107,108,139,140,141,142,145,146,148,152,155,157,158,159,160,161],In:[5,6,9,11,16,17,19,22,23,24,27,28,29,36,43,45,46,48,55,56,58,61,63,64,65,69,72,74,77,84,85,89,90,93,99,102,103,107,108,112,130,131,132,133,140,144,145,148,149,152,158],Is:149,It:[0,4,6,8,16,17,19,21,22,26,28,29,36,37,53,55,58,61,63,64,65,67,69,70,71,72,74,81,87,88,89,93,99,102,103,106,107,108,139,140,142,146,148,149,151,154,157],Its:[103,140,148],NOT:[6,22,60,63,64,72,93,157],No:[16,17,67],Not:55,OR:[64,93,107],Of:102,On:[8,28,43,49,72,76,77],One:[16,17,28,65,78,86,103,108],Or:[22,62,65,84,92],THE:[0,63],TO:[0,63],That:[6,18,97,140,148],The:[0,3,4,5,6,8,9,12,13,16,17,18,19,20,21,22,26,27,28,29,30,31,36,
41,42,43,46,48,53,54,55,56,58,60,61,62,63,64,65,70,71,72,74,77,81,82,85,89,92,93,94,96,97,98,99,100,101,102,103,104,105,106,107,108,139,140,142,144,145,148,149,152,154,157,159],Then:[16,17,22,64,70,84,154,159],There:[3,6,16,17,19,43,61,64,74,105,107,108],These:[4,16,17,19,47,63,64,72,84,102,106,141,149],To:[0,3,5,6,8,9,12,13,15,16,17,18,19,20,22,26,27,28,29,31,36,38,41,42,43,45,46,49,52,53,55,58,60,61,63,64,65,70,72,74,76,77,80,87,88,90,93,96,97,98,100,101,102,103,108,139,140,142,144,145,148,149,151,152,153,154,155,157,158,159,160,161],WITH:6,Will:[64,72,103],With:[19,28,29,30,31,41,48,64,65,77,84,103,105,108,144,154,158],_:[23,43,56,63,64,65,81,82,84,108,139,142,149,159],__call__:152,__dict__:[16,17],__file__:36,__getitem__:[43,152],__init__:[0,11,15,19,20,22,23,28,29,31,43,53,56,63,64,65,72,74,77,80,81,82,83,89,93,94,101,107,108,139,140,142,144,145,147,148,149,153,157,159,160],__iter__:[43,107],__len__:[43,107],__main__:[0,31,36,63,72],__name__:[31,36,63,72],__next__:[43,152],_action_count:153,_action_first_occurr:153,_batch:107,_devic:[16,17],_epoch:[102,157],_epoch_end:[93,103],_epoch_start:103,_experi:97,_fakequeu:64,_for_each_instance_rewrit:[16,17],_generate_state_kei:[93,94],_init:28,_input_format:157,_launch:0,_loss:[56,64],_lrfinder:72,_lrschedul:[28,64],_model:72,_next_data:152,_optim:84,_pickl:0,_run_early_stopping_check:58,_sample_r:84,_shape_input:85,_shared_ev:[56,64],_shared_eval_step:64,_step:[6,102,157],_wer:84,_xla_get_devic:[16,17],_xlac:[16,17],_z:[65,139,142],a100:69,a_float32:69,a_val:72,ab:64,abc:64,abf:71,abil:[19,55,78,105,140,148],abl:[19,43,55,65,69,87,93,94,139,142],abort:[96,98,99,100,101],about:[1,4,6,14,16,17,18,19,21,22,24,25,29,30,36,40,57,59,64,65,71,72,77,84,87,88,90,92,99,102,103,104,105,108,118,139,140,142,148,149],abov:[3,16,17,19,22,28,29,31,36,48,52,61,64,65,69,84,87,93,94,102,103,107,140,148],academ:[23,33,38,47,91,128,149],acc:[64,89,99,102,158,160],acceler:[3,4,5,6,15,16,17,18,19,21,22,36,38,51,63,64,65,69,76,82,83,84,90,9
1,106,109,124,139,141,142,147],accelerator_registri:92,accept:[28,64,103,107],access:[0,3,5,13,18,19,22,33,37,41,43,44,46,47,49,53,63,64,72,74,88,91,92,93,103,108,128,134,140,141,145,148,155,160,161],accommod:19,accomplish:[69,71],accord:[5,48],accordingli:[19,28,29,104],account:[20,41,42,44,45,46,47,48,49,70],accumul:[19,55,62,64,72,89,102,103,108,157],accumulate_grad_batch:[22,62,64,65,139,142],accur:[5,67],accuraci:[19,20,48,64,69,89,157],achiev:[6,16,17,20,22,72,84,108,140,148],across:[0,4,6,8,11,12,19,20,28,32,36,38,39,43,49,50,55,62,64,65,67,72,74,84,85,88,89,90,92,93,102,106,107,108,136,140,146,147,148,149,152,157,158],act:11,action:[30,87,140,148,152,154],action_nam:153,actioncountprofil:153,activ:[12,20,36,64,65,70,84,103,104,107,139,142,146],active_learning_loop:103,activelearningdatamodul:103,activelearningloop:103,actual:[5,6,18,38,64,92,96,97,98,99,100,101,103],ad:[0,11,19,28,29,64,72,101,105,149],adam:[19,22,28,31,32,64,65,74,139,142,144,145,147],adamw:[19,28,32,90],add:[0,6,9,18,19,27,28,29,31,32,36,38,43,47,55,63,64,65,72,73,74,77,82,87,90,91,92,93,100,101,102,103,107,123,124,138,147,157,158,159],add_argparse_arg:[63,72],add_argu:[29,31,63,72],add_argument_group:63,add_arguments_to_pars:[28,29],add_class_argu:29,add_command:36,add_confusion_matrix:84,add_dataloader_idx:[64,102],add_figur:[102,155,160],add_help:36,add_histogram:[64,102,155,160],add_imag:[64,102,155,160,161],add_lightning_class_arg:29,add_lr_scheduler_arg:28,add_model_specific_arg:63,add_optimizer_arg:28,add_predict:84,add_slurm_cmd:36,add_stat:157,addhandl:[57,102],addit:[8,9,19,22,29,58,63,64,69,97,99,100,102,140,148],addition:[4,19,21,22,28,61,71,72,140,145,148],addmm:154,address:[6,12,16,17,29,38,64,98],adjust:[19,22,39,57,64,69,72,102],adl:[52,71,157],adlf:71,advanc:[1,6,7,9,10,14,31,51,64,65,66,72,73,75,88,108,109,111,112,113,116,117,118,121,128,129,131,132,141,142,143,147,150,152,155,156,160,161],advancedprofil:[72,152],advantag:[6,8,28,64,69],adventur:84,advis:26,advprop:88,aff
ect:[19,43,108],after:[0,6,15,16,17,18,19,22,26,27,29,62,63,64,65,72,74,83,84,93,97,99,101,102,103,108,139,142],after_:29,after_fit:29,after_save_checkpoint:[99,101],against:[24,87],agg_and_log_metr:[96,97,98,100,101],agg_default_func:[97,99,100,101],agg_key_func:[97,99,100,101],aggreg:[6,64,96,97,98,100,101,157],agnost:[23,61,64,107,140,148,149],ago:107,ahead:[87,140,148],ai:[8,16,17,33,41,42,44,45,46,47,49,72,86,88,99,109,147],aim:19,aio_bench_perf_sweep:19,al:64,alert:87,algorithm:[6,19,22,64,72,108],alia:[16,17,101],alias:[4,72,101,106],align:87,all:[0,3,5,6,11,13,16,17,18,19,20,22,25,26,27,28,29,30,31,32,38,41,42,43,46,48,52,53,55,61,63,64,65,67,69,70,71,72,74,76,78,82,83,84,85,87,88,89,90,91,93,96,99,100,101,102,103,108,109,110,111,113,136,139,140,141,142,144,145,146,148,149,152,155,157,160,161],all_gath:[0,140,148],all_pr:64,all_result:6,all_test_pr:64,all_test_step_out:64,allevi:19,allgather_bucket_s:19,alloc:[19,22],allow:[4,6,9,12,16,17,18,19,20,21,27,28,29,36,37,38,39,49,53,61,63,64,65,72,74,77,80,81,99,102,105,107,108,140,148],allreduc:[6,19],almost:19,alon:64,along:[8,53,64,65,74,84,103,107],alpha:[16,17],alreadi:[0,19,29,31,32,42,64,72,97,98,101,102,103,109,140,148,155,158,160,161],also:[0,4,6,9,11,13,18,19,20,21,22,23,27,28,29,31,36,45,46,52,53,55,61,63,64,67,68,69,70,71,72,74,78,80,83,84,85,87,97,99,101,102,103,106,107,108,140,146,148,149,159],alter:[64,74,129],altern:[28,64,65,103,107],although:[42,67,69,149],alwai:[28,29,64,67,72,108],am:[140,148],amaz:[19,84],amazon:71,amazonaw:[45,46,103],amdim:85,among:[6,15,20,140,148],amount:[19,20,22,32,38,72],amp:[64,65,69,72,139,142,147],amp_backend:69,amp_level:69,amper:69,an:[3,4,5,6,9,11,15,16,17,22,27,28,29,30,33,41,43,45,46,49,55,56,60,61,62,64,65,72,73,77,84,86,89,93,96,97,98,99,100,101,102,103,104,106,107,108,109,133,139,140,142,148,149,152,154,157,158,160],an_imag:158,analys:[10,115],analysi:[13,84],analyt:152,analyz:101,anchormod:11,ani:[0,1,3,4,6,7,10,11,12,14,15,16,17,19,20,21,22,27,28,29,31,40,4
1,45,46,47,55,58,61,64,65,71,72,74,77,80,82,83,84,87,90,92,93,96,97,98,99,100,101,102,103,107,115,134,139,140,142,146,148,149,153,155,157,159,160,161],annot:11,anomali:72,anonym:[99,101,155,160,161],anoth:[20,29,63,64,77,103,108,152],another_paramet:[53,160],answer:[84,86],ant:103,any_extra_hook:149,any_flag:64,any_lightning_module_function_or_hook:[98,99,155,160,161],any_trainer_arg:72,any_trainer_flag:90,anymor:58,anyon:[45,46,49,50],anyth:[31,32,36,38,64,69,72,74,93,102,103,149,158],anywai:64,anywher:[0,6,74,98,99,102,108,139,145],apart:61,apex:[6,53,65,139,142],api:[6,19,27,29,51,54,61,65,84,88,89,97,99,138,140,148,155,156,160,161],api_kei:[97,99,155,160,161],appear:[30,99],append:[6,64,71,72,102,157],appli:[6,15,16,17,18,19,20,22,30,64,65,71,72,74,84,88,99,102,140,148],applic:[4,6,16,17,84,88,106],apply_on:29,apply_to_collect:[64,74],approach:[48,52,56,64],appropri:[6,9,18,36,39,72,98,104],apt:84,ar:[0,3,4,5,6,8,12,13,15,16,17,19,20,21,22,23,24,28,29,30,38,39,41,42,44,45,46,47,48,49,53,55,56,58,61,63,64,65,67,71,74,76,77,78,84,85,88,92,93,94,96,97,98,99,100,101,102,103,105,107,108,139,140,141,142,145,146,148,149,151,157,158],arbitrari:[0,22,28,29,64,72,74,92,104,139,140,142,148],arbitrarili:64,architectur:[8,11,12,15,16,17,18,69,84,108,145],archiv:146,area:[69,109],aren:[16,17,65,72],arg1:[6,39,64],arg2:64,arg3:64,arg:[6,26,28,31,32,39,45,46,53,64,72,74,77,93,94,96,97,98,101,102,103,107,140,148,157,159,160],argmax:[64,84],argpars:[29,30,31,53,72,102],argument:[4,6,8,9,12,16,17,19,21,22,26,29,30,31,32,41,45,53,55,63,64,65,70,72,74,77,78,84,90,92,96,97,98,99,100,101,102,103,105,107,108,139,140,141,142,147,148,154,155,156,157,158,159,160,161],argumentpars:[27,31,36,72],arithmet:69,around:[19,22,82,84,104],arrai:[77,84,101],art:[2,7,15,66,85,116,132,138,141,147],artifact:[98,101,155,161],artifact_dir:101,artifact_loc:98,artifici:12,arxiv:64,as_imag:99,as_strid:154,asic:[16,17],ask:[1,14,25,30,40,74,95,149],aspect:[64,72,84,91,110],asr_model:84,asrmodel:84,assert:[7
2,157],assign:[4,6,16,17,21,64,74,96,100],assist:72,associ:[8,28,43,61,64,65],assum:[19,39,64,72,74,109],asteroid:86,async:6,asynchron:[6,135,154],atla:86,attach:[45,46,64,103],attempt:[55,72],attent:[72,86],attention_mask:[23,84],attn:[23,84],attribut:[0,22,29,43,63,64,65,72,77,100,104,108],audienc:[2,3,4,6,8,9,11,12,13,15,16,17,18,23,26,29,31,32,33,38,41,42,45,46,47,48,49,50,53,55,57,60,67,68,69,76,77,78,80,81,82,83,144,151,152,153,154,157,158,159,160],audio:[84,86,90,101,158],audio_eltyp:84,audio_sign:84,audio_signal_len:84,audiosign:84,augment:[63,64,72,74,84],augmentor:84,author:6,author_email:6,auto:[4,8,19,22,64,72,92,102,106,140,148,157],auto_device_count:[72,92],auto_encod:[56,64,83,149],auto_lr_find:22,auto_registri:28,auto_requeu:36,auto_resum:41,auto_scale_batch_s:22,auto_select_gpu:3,auto_wrap:19,autocast:69,autoencod:[23,53,56,64,144,147,149],autoencoderprod:83,autoencodersystem:[83,149],autograd:[72,154],autom:[36,64,65,72,87,103,140,148],automat:[0,3,6,18,19,22,27,28,29,30,36,41,42,47,48,53,61,63,64,69,70,72,74,89,95,96,97,99,100,101,103,105,107,139,140,141,142,145,148,152,158,160],automatic_optim:[65,108,139,142],automaticargsmodel:64,autoreport_dir:13,autoscal:22,autosummari:77,autotoken:84,autotun:6,avail:[3,6,16,17,19,28,29,31,32,43,61,63,64,65,71,72,74,84,88,93,96,100,107,139,140,142,148,158],available_backbon:88,available_devic:92,available_head:88,available_pretrained_weight:88,averag:[6,19,24,64,72,81,82,103,158],average_valu:158,avg:154,avoid:[0,22,28,29,55,59,60,64,73,77,91,102,109,119,123,138,140,147,148],aw:[19,41,44,46,49,52,71,157],awai:[84,107,144],awar:[0,20,64],awk:[16,17],awscheckpoint:[141,147],az:71,azur:[52,71,87,157],b0:88,b:[65,84,101,107,108],b_float32:69,baal:103,back:[16,17,63,64,74,76,90,98,103,107,108],backbon:[23,28,29,55,88,90,103,140,148,149],backend:[4,6,64,71,72,106,140,148],background:[16,17,33,36,37,38,39,49,88,91,128,135],backprop:[64,107],backpropag:64,backpropog:64,backward:[6,19,22,62,65,68,72,93,103,107,139,142
,144,147,154],bad:[5,28,29,58,64,108],baguarun:6,baguastrategi:6,balanc:[19,84],bandwidth:[12,108],bar:[64,72,73,91,109,110,112,156,158],bard:159,barrier:[74,76],base:[4,6,8,12,19,22,23,28,30,43,48,51,55,58,64,69,72,74,84,89,91,93,95,96,97,98,99,100,101,103,104,105,106,108,110,114,140,148],base_cl:32,baselin:88,basepredictionwrit:64,baseprofil:72,basepruningmethod:20,bash:36,basi:19,basic:[1,7,10,14,33,40,42,45,46,51,59,64,66,73,75,109,115,116,119,120,121,122,130,134,138,147,150,156],batch:[0,5,6,11,12,16,17,19,20,29,31,41,43,48,55,56,58,60,61,62,64,69,70,72,74,76,77,78,81,82,83,84,85,89,93,94,98,99,101,102,103,107,108,139,140,142,144,145,147,148,149,157,158],batch_a:107,batch_a_b:107,batch_b:107,batch_c:107,batch_c_d:107,batch_cifar:64,batch_d:107,batch_first:64,batch_idx:[0,6,43,55,56,58,60,64,65,69,72,76,81,82,83,84,85,89,93,98,99,101,102,103,107,108,139,140,142,144,145,147,148,149,157,158,159],batch_loop:103,batch_mnist:64,batch_nb:[31,84],batch_part:64,batch_progress:70,batch_siz:[5,9,16,17,18,22,29,43,48,64,65,72,74,84,99,102,103,107,108,139,142],batch_split:[6,64],batchnorm1d:77,batchnorm:[64,72],batteri:147,beauti:[70,112,159],becaus:[6,12,19,23,30,38,41,48,64,65,69,97,99,107,149],becom:[19,31,32,43,58,77,84,108,140,148,152],bee:103,been:[11,15,19,20,22,28,29,55,60,61,64,72,74,93,98,99,107,140,148],befor:[0,6,9,11,18,22,26,27,28,29,30,31,36,43,52,58,61,62,64,65,72,74,77,84,93,100,101,103,107,139,142],before_:29,before_fit:29,beforehand:28,begin:[6,32,64,72,77,93,96,97,98,100,101,103,108,140,148],beginblock:11,beginn:[38,65,88,108,139,142],behalf:[41,44,46,49,144],behav:[6,145,158],behavior:[27,30,36,51,52,64,72,73,93,103,112,129,140,148],behaviour:[0,58,64,102,157],behind:[19,36,149],being:[6,12,22,29,30,55,58,61,64,72,84,93,94,96,97,98,101,103,149],believ:[43,58],bellow:24,belong:[64,74,101,140,148],below:[3,4,6,9,11,19,22,29,36,39,54,55,64,72,74,87,89,102,105,106,140,148,154],benchmark:[19,43,61,64,84,85,107,109,149],benefici:[19,20,108],benefit:[19,22,28,
47,58,64,69,89,90,103,105,140,148],bert:[84,149],bert_model:84,bertmnlifinetun:23,bertmodel:23,best:[0,19,29,30,33,46,48,53,61,64,72,77,78,91,94,101,103,108,128,129,135,145,149],best_model:[64,82,83],best_model_path:55,beta:[19,20,140,148],better:[6,18,22,29,58,67,69,149,151],between:[4,8,12,16,17,19,20,22,24,32,38,39,55,64,72,74,84,106,149,159],bewar:103,beyond:58,bf16:[9,69,72,140,148],bf16_file_path:9,bfloat16:[18,67,72,108,140,148],bfloat:[140,148],bia:15,bias:[19,84,101],bidirectionalrnn:64,big:64,bigger:[19,91,118,128,132],bin:[6,36],binari:[22,71,72],bind_al:84,binsearch:[22,72],bio:84,bit:[9,19,53,61,64,85,105,140,148],bite:109,bitsandbyt:69,bitwidth:20,blackhc:22,bleed:[113,143,146,147],blob:64,block:[11,19,101,102,108,140,148,157],block_1:19,block_2:19,blog:[84,109],blogpost:69,bodi:[140,148],boi:84,boilerpl:[73,82,89,109,147],bolt:[86,93],bonu:32,bool:[37,61,64,72,92,97,99,100,101,103],bootstrap:85,boring_class:31,boringdatamodul:[31,32,140,148],boringmodel:[43,152],both:[19,22,28,29,33,43,60,64,65,72,84,97,101,102,108,139,142,149],bottleneck:[6,16,17,19,67,72,73,91,108,109,123,132,149],bottom:[16,17],bought:84,bound:[19,101],boundari:108,box:[32,64,69,74,90,101,146],branch:[12,84,87],breakdown:154,breakpoint:76,bridg:8,bring:[69,84],broadcast:[4,106,140,148],broadcast_tensor:154,brows:151,browser:151,bu:[72,140,148],bucket:[27,46,72],buffer:[0,19,108],bug:[72,77,146],bui:[41,44,46,49],build:[0,12,64,73,74,84,85,90,103,108,109,150,157],built:[0,4,8,12,19,47,63,64,65,72,78,88,105,106,107,140,148,152,154,159],builtin:152,bump:19,burden:29,button:151,byol:86,bytegrad:6,c10d:6,c:[27,31,72,81,99,107,109,146,147,154,155,160,161],c_float16:69,cach:[64,84,93,101,102],calc_all_result:64,calcul:[19,55,64,89,107],call:[6,12,15,16,17,19,22,28,31,43,53,58,60,61,62,63,64,65,72,74,77,80,84,87,92,93,97,99,100,101,102,103,107,108,139,140,142,148,152,153,157,158,160],call_hook:103,callabl:[20,64,108],callback:[0,20,22,43,52,53,54,55,61,62,63,64,65,70,77,90,99,101,104,108,1
09,112,140,141,147,148,152,159],callback_1_args_1:28,callback_1_args_2:28,callback_1_nam:28,callback_metr:[64,65,139,142],callback_n_args_1:28,callback_n_nam:28,callback_registri:28,callback_st:93,camerargb:88,cameraseg:88,can:[0,3,4,6,8,9,11,12,13,16,17,18,19,20,21,22,23,26,27,28,29,30,31,32,36,38,39,41,43,45,46,47,48,49,52,53,54,55,56,57,58,60,61,62,63,64,65,67,68,69,70,71,72,74,76,77,78,80,81,83,84,85,87,88,91,92,93,94,96,97,99,100,101,102,103,104,105,106,107,108,123,136,139,140,141,142,144,145,146,148,149,151,152,154,157,158,159],cannot:[0,6,16,17,19,22,43,55,58],capabl:[11,28,99,158],capac:152,capit:84,caption:[101,155,160,161],captur:[43,57,72,93,152],capture_stdout:99,car:[26,103,158],care:[28,64,65,102,103,107,108,139,140,142,148,157],carlo:[64,81,82],carri:[16,17,20,103],cast:[9,64,69,140,148],cat:6,categori:108,caus:[16,17,30,140,148],cc:[16,17],cd:[6,27,46],cell:[16,17,102],central:[6,43],certain:[6,19,27,29,57,58,64,67,72,102,157],cfg:84,challeng:[140,148],chanc:[64,69,78,93],chang:[0,4,16,17,18,19,20,21,22,28,29,30,31,32,38,52,53,54,55,56,57,58,64,65,72,73,76,77,87,90,92,93,101,102,103,140,141,148,158],channel:[87,158],chart:[24,102,157,158],cheap:41,cheaper:18,check:[5,8,15,16,17,19,28,29,58,64,70,72,74,84,85,93,99,102,103,140,145,146,148,149],check_finit:58,check_on_train_epoch_end:58,check_val_every_n_epoch:[58,64,108],checkout:[9,108,149],checkpoint:[0,4,6,21,36,61,63,64,71,72,73,74,77,84,91,93,94,95,96,97,99,100,101,102,104,105,106,109,110,122,127,129,140,145,147,148],checkpoint_callback:[55,99,101],checkpoint_io:[4,21,54],checkpoint_path:[55,61,64],checkpoint_refer:101,checkpoint_wrapp:19,checkpointio:[4,21,54,71,72],chees:101,child:[77,109],children:[23,103],chip:[8,9],choic:[16,17,22,45,46,58,63,65,102,108,140,148],choos:[4,6,18,22,32,48,64,84,93,94,102,106,107,140,148],chosen:[22,72,88],chunk:[6,18],ci:[24,27,146],cifar10:74,cifar10classifi:23,cifar10datamodul:[74,85],cifar5:[45,46,48],cifar:[23,43,63,64],cifar_load:64,circuit:[16,17],ckpt:[19,
52,53,55,61,64,71,72,82,83,101,140,147,148],ckpt_callback:72,ckpt_path:[19,26,27,31,52,53,61,71,72,104],cl:[84,92],clara:84,class_3:26,class_balanc:84,class_path:[28,29],classif:[29,48,84,86,89,93,103],classifi:[23,24,45,46,48,52,71,84],classificationtask:64,classmethod:[64,88,92],clean:[72,74,93,149],clear:[16,17,30,64,65,72,102,139,142,157],cli:[25,27,28,29,32,36,37,38,39,49,73,84,91,92,109,111,124,126,136],click:[16,17,151],client:[16,17,99,155,160,161],clip:[12,64,72,78],clip_grad_norm_:22,clip_grad_value_:22,clip_gradi:[64,65],clock:154,clone:[30,45,46,84],close:[4,64],closur:[32,64],cloud:[5,14,18,20,36,37,38,39,40,42,44,51,71,73,91,102,109,110,114,117,126,128,156],cluster:[3,8,33,40,41,72,73,91,92,109,124,128,140,148],cluster_email:63,clusterenviron:[37,72,140,148],cmd:36,cnn:[24,31],code:[0,1,5,7,9,10,12,14,16,17,18,19,26,28,29,30,31,32,38,45,46,49,55,64,65,72,73,74,90,91,92,93,99,101,102,103,108,109,110,112,115,117,134,139,141,142,144,149],codeown:87,coef_x:149,colab:[6,72,84,101,146,155,158,160,161],collabor:[47,91,128,149],collaps:102,collate_fn:107,colleagu:74,collect:[6,8,19,43,64,72,74,84,85,89,90,93,102,103,107,140,148,149,153],color:159,column:101,com:[6,16,17,22,29,45,46,63,64,84,103,146,159],combin:[19,28,36,48,69,70,72,84,87,103,107,108,140,148],combined_load:107,combinedload:107,come:[18,19,22,43,60,63,64,74,84,88,100,103,140,144,145,148,155,160,161],comet:[97,102],comet_api_kei:97,comet_experiment_kei:97,comet_logg:[97,102,155,160,161],comet_ml:97,comet_rest_api_kei:97,comet_workspac:97,cometexperi:97,cometlogg:[102,155,160,161],comma:3,command:[5,6,16,17,18,19,28,29,30,31,36,39,45,46,48,63,84,102,108,146,154,158],commandlin:[30,31,32,45,46,91,123,147],comment:[31,36],commit:[30,105],common:[15,22,24,26,29,43,48,54,60,71,90,99,155,160,161],commonli:[16,17],commun:[0,1,4,8,11,36,38,39,41,44,46,49,64,73,85,91,92,102,106,109,110,123,124,128,140,147,148,157],compact:[28,29],compani:[33,47,48,49,84,126,135],compar:[16,17,19,69],comparison:43,compat:[
19,20,53,61,65,84,89,139,142],compens:[6,19],compil:[12,16,17,64],compiletim:[16,17],complementari:103,complet:[4,19,20,23,28,29,53,61,64,65,69,106,107,152,159],complex:[19,25,26,29,30,31,32,42,43,53,59,64,74,86,88,113,125,136,140,143,144,148,157,160],complianc:47,compliant:5,complic:[45,46,47,144,145],compon:[19,52,70,86,90,92],compos:[25,51,64,74,84,91,103,110,111,114,140,148],composit:[77,90],compress:[6,19,20,79,131],comput:[0,3,6,12,16,17,19,20,22,35,38,43,48,64,65,67,69,72,84,89,100,109,133,147,149,157,158],computation_cli:[16,17],compute_amount:20,compute_loss:[65,139,142],con:108,concat_dataset:107,concatdataset:107,concaten:[140,148],concept:[19,29,84,93,94],concern:22,conda:[18,36,72,99,108,109,147,155,160,161],conda_env:63,condit:[58,64,103,129,140,148],condition:72,conduct:[69,113,143],conf:84,config1:27,config:[23,28,73,84,87,90,91,97,101,102,109,110,125],config_nam:84,config_path:84,configur:[3,6,8,16,17,18,19,22,26,27,28,31,32,36,37,38,39,47,55,57,61,64,69,70,72,73,86,87,90,91,93,99,109,110,139,140,142,148,155,157,160,161],configure_callback:72,configure_column:70,configure_ddp:[4,6,72,106],configure_gradient_clip:65,configure_optim:[6,19,22,28,31,32,65,74,139,140,142,144,145,147,148,149],configure_sharded_model:19,conjunct:[61,107],connect:[18,25,32,36,38,39,42,47,72,92,103,108,125,140,148],consid:[27,63,65,67,72,108,139,140,142,148],consider:[19,65,69],consist:[12,37,64,84],consol:[22,109,140,148],constant:[12,43],constraint:22,construct:[18,19,22,108],constructor:[6,96,99,100,101],consum:67,consumpt:[15,19,22,43,67,108],contact:[41,44,46,47,49,87],contain:[3,19,53,64,72,74,84,93,96,97,98,100,101,112,140,144,146,148],content:[63,64,140,148],context:[11,16,17,19,64,68,78,108,140,148],contextlib:108,contextmanag:108,contextu:86,contiguous_gradi:19,continu:[43,53,64,85,87,140,148],contrast:[28,29,36,67],contribut:[84,85],contributor:72,control:[4,11,19,22,25,26,30,31,32,55,64,69,72,73,97,103,106,111,113,129,136,140,143,147,148],conv_mask:84,convasrenco
d:84,conveni:[63,64,72,99,140,148],convent:12,converg:[5,8,22,65,72,91,108,128,130,139,142],convert:[27,64,84,92,109],convert_spectrogram_to_audio:84,convert_zero_checkpoint_to_fp32_state_dict:19,convnet:31,convolut:[16,17,84,86],cool:[6,108],copi:[6,15,19,26,38,83,93,94,108],copy_:154,copy_model_to_gpu:6,core:[4,7,8,12,14,15,18,57,64,67,69,72,84,102,103,106,108,116,134,140,148],corpor:[47,149],correct:[6,18,19,36,64,72,74,78,85,102,103,107,140,148,157],correctli:[19,55,140,148],correspond:[16,17,22,30,53,61,64,72,84,104,107,140,148],corrupt:[64,74],cosineann:64,cosineannealinglr:32,cost:[19,22,33,47,108,135,154],cotatron:86,could:[12,16,17,18,28,29,30,64,70,71,102,103,104,108],count:[43,58,74,103],counter:[16,17,93,94],coupl:[28,29,52,149],cours:[74,102,107],cover:[55,140,148],cp37:[16,17],cp37m:[16,17],cp:108,cpcv2:85,cprofil:152,cpu:[0,4,6,12,15,16,17,19,21,22,49,54,64,67,69,72,74,76,84,85,87,92,106,140,146,148,154],cpu_checkpoint:19,cpu_count:108,cpuacceler:72,crash:77,creat:[0,6,11,16,17,19,20,22,28,29,30,36,47,49,53,55,62,64,65,66,70,74,80,81,83,84,87,88,89,91,95,97,98,99,101,102,107,112,127,128,140,148,159],create_checkpoint_callback:84,create_tensorboard_logg:84,creates_processes_extern:37,creation:43,creativ:158,credenti:[47,48,49,72],credit:[41,44,46,49],criterion:[65,85,108,139,142],cross:[103,140,148],cross_entropi:[55,64,145],crucial:69,csv:[96,99],csv_log:96,csvlogger:102,ctc:84,ctrl:72,cuda:[3,19,36,64,69,72,84,108,140,148,154],cuda_awar:19,cudnn:72,cumtim:152,cumul:152,curl:45,current:[11,12,13,16,17,19,22,41,53,58,61,64,72,74,84,87,89,92,93,96,99,102,103,107,108,109,140,145,148,157,158],current_epoch:[65,139,142],current_iter:103,current_train_batch_index:[74,95],custom:[0,10,11,12,20,21,22,25,28,37,39,47,51,55,57,58,62,64,68,71,72,73,74,84,89,90,91,101,103,105,109,110,113,124,125,127,128,140,143,148,150,158],custom_checkpoint_io:[4,21,54],custom_column:70,custom_processing_step:153,custombatch:[64,74],customcallback:28,customcheckpointio:[4,21,54],
customdatamodul:74,customdataset:107,customddpstrategi:[4,72,106],customfitloop:103,customiz:[31,72,84],customprecisionplugin:68,customprogressbar:[102,157],customrichprogressbar:70,customvalloop:103,cut:67,cvpr:86,cycl:64,cython:84,d:[19,39,47,55,64,65,84,107,108,139,142,153,159],d_loss:[65,108,139,142],d_opt:[65,108,139,142],d_x:[65,108,139,142],d_z:[65,108,139,142],dai:[49,72,77,84,108],dangl:64,dash:30,dashboard:[158,160],data:[5,9,11,16,17,18,19,22,23,26,27,28,29,30,31,32,43,45,46,52,53,61,63,64,65,67,71,72,74,77,82,84,86,89,93,96,97,100,101,102,103,119,138,140,144,147,148,152,153,157,158],data_dir:[22,26,31,45,46,48,74,84],data_load:82,data_modul:64,data_path:63,data_queu:43,data_root:108,data_sourc:107,data_split:64,databas:64,datafram:101,dataload:[0,5,6,8,16,17,18,22,32,60,64,72,74,82,84,102,103,140,144,145,147,148,152,157],dataloader_i_output:64,dataloader_id:64,dataloader_idx:[64,74,82,93,107],dataloader_out:64,dataloader_output:64,dataloader_output_result:64,datamodul:[9,22,26,28,52,53,61,72,85,88,91,99,103,107,108,128,136,140,148,152],datamodule_class:32,datamodule_registri:32,dataparallel:6,dataparallelstrategi:108,dataset:[5,6,18,23,25,41,47,56,60,61,64,70,72,74,77,78,84,85,90,91,101,103,108,128,136,140,145,147,148,149],datastor:[45,46,48],datastore_nam:[45,46,48],datatyp:[16,17],datetim:72,dcgan_faces_tutori:[65,108,139,142],dd:72,ddp2:[5,64],ddp:[4,5,8,18,21,22,36,38,55,61,62,64,65,72,74,76,83,84,102,106,140,148,157],ddp_comm_hook:19,ddp_comm_stat:19,ddp_comm_wrapp:19,ddp_custom_checkpoint_io:[4,21],ddp_find_unused_parameters_fals:[4,21],ddp_shard:[5,19,140,148],ddp_sharded_spawn:[140,148],ddp_spawn:[4,5,6,22,64,72,106,108,140,148,149],ddp_train:6,ddpshardedstrategi:108,ddpspawnstrategi:[19,22],ddpstrategi:[4,6,19,21,72,106,108],de:19,deactiv:[140,148],deadlock:[0,55,64,102,157],deal:[47,67,78,107,108],debug:[4,19,21,36,72,108,109],debugging_messag:76,decay_factor:99,decentr:6,decid:[39,64,119,140,148,149],declar:[11,61,107],decod:[23,28,53,56,60,64
,83,84,144,147,149],decoder_lay:[27,28],decoder_weight:53,decor:[55,64,81,102],decoupl:[22,107,149],decreas:[20,22],deep:[3,6,8,16,17,19,22,67,69,77,86,88],deeper:[6,129],deeplabv3:88,deeplabv3plu:88,deepspe:[4,5,21,55,64,65,90,106,118,139,140,141,142,147,148],deepspeed_config:19,deepspeed_stage_1:19,deepspeed_stage_2:[19,141,147],deepspeed_stage_2_offload:[4,19,21],deepspeed_stage_3:19,deepspeed_stage_3_offload:[4,19,21],deepspeedcpuadam:19,deepspeedstrategi:[19,54,108,140,148],def:[0,4,5,6,11,15,18,19,20,21,22,23,28,29,31,32,36,37,43,52,53,54,55,56,58,60,61,63,64,65,69,70,72,74,76,77,80,81,82,83,84,85,89,92,93,94,95,98,99,101,102,103,104,106,107,108,139,140,142,144,145,147,148,149,153,155,157,158,159,160,161],default_backbon:[28,29],default_config_fil:27,default_hook:19,default_hp_metr:[100,102],default_project:97,default_root_dir:[52,53,71,102,158],defaultdict:153,defaultloop:103,defin:[4,6,11,18,19,21,28,29,38,39,56,61,63,64,65,72,74,84,87,93,94,95,99,100,101,103,105,107,139,140,142,147,148,149],definit:[0,12,37,48,107,140,148,149],degrad:19,degre:61,delet:[19,64,100],deliv:69,demo:[31,32,45,46,101,103,155,160,161],demomodel:[31,32],denomin:64,densenet121:88,depend:[22,29,31,36,38,43,45,46,48,49,72,74,79,83,84,88,93,96,97,98,101,102,105,107,108,122,149,157],deploi:[1,20,67,73,91,109,127,128,147],deploy:[20,47,79,108,131],deprec:[64,72,74,93,140,148],depth:[91,124,138,156],deriv:[29,65,72],descent:103,describ:[6,11,19,22,26,28,29,39,64,87],descript:[4,6,21,29,30,54,64,70,92,99,102,103,109,140,148,157,159],design:[3,11,16,17,28,29,33,38,49,63,84,85,93,104,107,149],desir:[28,29,31,32,36,65,93,108,139,142],destroi:[16,17],detach:[64,65,102,108,139,142,157],detach_:19,detail:[3,6,9,16,17,19,22,24,29,30,31,36,41,43,64,71,72,74,87,91,99,107,108,109,124],detect:[6,8,36,48,72,84,86,107,152],detect_anomali:[72,78],detectron2:19,determin:[22,29,54,60,64,97,100,102,103],determinc:19,determinist:19,dev:[84,108],develop:[1,2,4,8,16,17,28,29,30,33,41,53,80,91,107,108,123,127,1
28,149,158],devic:[0,4,6,8,9,11,12,13,15,16,17,18,19,20,21,22,36,38,39,54,55,61,62,63,65,69,74,76,82,83,84,89,92,97,98,99,101,102,106,139,141,142,147,157],device_count:[3,72],device_id:[4,72,106],device_iter:11,device_pars:[16,17],device_typ:69,deviceiter:11,devicestatsmonitor:[8,72,77,152],devot:77,diagnos:[16,17],dict:[4,6,21,28,43,61,64,72,74,84,92,93,96,97,98,99,100,101,102,107,108],dict_arg:63,dictconfig:84,dictionari:[22,28,29,61,62,64,65,72,74,93,96,97,98,99,100,101,102,107,160],dictionary_of_load:107,did:[6,74],didn:64,die:8,differ:[1,6,11,12,16,17,19,22,29,32,48,53,54,56,58,61,62,63,64,65,66,69,70,71,72,73,74,81,84,93,94,103,105,107,118,130,140,146,148,149,158],differenti:149,difficult:43,dig:[51,138,156],dilat:84,dim:[6,11,23,64,81,82,84,89],dimens:[31,64,103],dir:[74,101],direct:[18,108],directli:[4,11,19,22,28,32,41,44,46,49,54,63,64,72,74,81,83,93,99,101,102,103,106,108,155,157,160],directori:[13,19,53,72,96,97,98,99,100,101,102],dirnam:36,dirpath:[55,72,152,153],dirti:149,dis_opt:64,dis_sch:64,disabl:[19,28,58,64,70,72,77,78,99,101,159],disadvantag:108,disambigu:[93,94],disc_loss:64,discard:19,discourag:[6,93],discoveri:87,discret:146,discrimin:[64,65,108,139,142],discuss:[19,84],disk:[55,64,72,74,84,96,100,108,140,148,157],displai:[12,64,70,77,100,101,159],dist:[16,17,157],dist_reduce_fx:157,dist_sync_on_step:157,distilbert:84,distinguish:[93,94],distribut:[0,1,4,5,8,16,17,22,35,36,37,38,39,51,53,61,62,64,65,71,72,73,74,75,89,91,92,102,106,108,109,118,124,127,133,144],distributed_forward:6,distributeddataparallel:[4,6,19,72,106,140,148],distributedsampl:[0,61,64,72],div:[36,37,38,39,45,46,48,49],div_:154,dive:[14,117],diverg:[140,148],divergence_threshold:58,divid:64,dl1:[8,107],dl2:107,dl:8,dm:[9,61,64,74,88],doc:[8,19,64,65,69,70,72,99,102,139,142],docker0:36,docker:84,document:[6,11,12,15,19,27,29,30,60,64,65,72,85,88,90,99,101,108,139,142,149,155,160,161],doe:[6,16,17,18,19,22,28,36,43,58,64,65,72,97,98,99,103,107,108,149],doesn:[5,6,18,22,55,62,6
5,69,71,93,108,149],domain:[84,85,88,107,149],don:[0,3,16,17,18,22,28,31,36,37,48,53,54,64,65,72,78,102,103,108,140,146,148,157,158,159],done:[0,11,15,16,17,19,22,28,29,30,61,64,72,107,140,148,149],doubl:[19,22,67,72,140,148],doubledistilbert:86,down:[0,30,41,72,102,108,149,152,157],download:[13,16,17,18,22,45,46,60,64,74,84,101,107,140,144,147,148],download_data:[64,103,140,148],downsid:108,downstream:[0,84],downward:22,dozen:48,dp:[5,22,61,62,64,65,74,140,148],dp_out:64,draft:87,drastic:19,drive:[19,158],driver:6,drop:[20,64,83,99,140,148,149],drop_prob:64,dropdown:151,dropout:[53,64,81,82,84,103],dtype:69,due:[6,11,12,19,22,108,140,148,152,154],dummi:[45,93],dump:[0,5,13,22,53,64],duplic:[64,72],durat:[72,84,151,152],dure:[0,4,6,13,16,17,19,20,21,22,41,43,53,60,61,64,65,69,70,72,77,84,101,102,108,139,140,142,145,148],dynam:[13,55,64,69],e:[4,6,11,12,16,17,22,28,29,30,61,62,63,64,65,72,74,93,94,96,97,98,99,100,101,102,103,104,106,108,140,148],each:[0,6,8,16,17,18,19,22,25,26,28,30,31,36,38,39,43,48,53,61,62,63,64,65,72,77,84,93,101,102,103,107,108,109,125,139,140,142,148,149,153,154,157],earli:[72,77,109,119,140,148],earliest:72,early_stop:[58,64],early_stop_callback:58,early_stopping_callback:63,earlystop:[28,29,64,108],eas:[29,70],easi:[16,17,56,64,84,87,89,107,149],easier:149,easiest:82,easili:[9,28,36,37,38,39,41,84,86,99,101,140,141,148],ec2:8,ecosystem:84,edg:[20,89,113,143,146,147],edit:99,effect:[5,15,20,49,62,64,65,72,73,93,94,98,109],effici:[8,20,22,64,72,108,149,157],efficientnet:88,effort:[19,140,148],eg:[22,62,64,65,74,93],egg:84,eight:[108,140,148],either:[8,22,30,54,61,64,72,74,84,93,97,101,107,108,154,159],elaps:100,eleg:103,element:19,elif:[20,31,32,63,64,65,74],elimin:[20,73,109],els:[22,64,65,72,74,84,93,96,97,100,101,102,140,148],email:[29,42,47,63],emb:147,embed:[64,72,147,149],emit_nvtx:154,emot:86,emploi:[19,69],empti:[30,96,100,154],emptibl:41,empty_cach:108,empty_lik:154,empty_strid:154,en:84,enabl:[2,6,7,8,12,13,16,17,18,20,22,25,29,32,38
,40,41,43,47,51,53,58,63,64,66,67,69,70,71,72,73,78,81,84,86,91,100,101,103,104,108,110,111,113,116,119,121,123,127,128,129,130,132,138,140,143,145,148,154,156,158,159],enable_checkpoint:[53,63],enable_graph:[64,102],enable_model_summari:77,enable_progress_bar:70,encapsul:[43,54,74],encdecctcmodel:84,encod:[23,28,53,56,60,63,64,83,84,86,144,145,147,149],encoded_len:84,encoded_length:84,encoder_lay:[27,28,29,63],encoder_output:84,encoder_weight:53,encount:[22,72],encourag:[30,74],end:[0,6,22,31,36,43,53,55,58,64,70,72,74,84,86,93,97,101,102,103,108,154,157],endpoint:20,energi:20,enforc:64,enforce_sort:107,engin:[8,26,47,57,72,78,80,81,91,93,103,123,144],english:101,enhanc:108,enough:[29,91,93,94,108],ensembl:103,ensur:[0,11,12,15,19,39,43,55,64,69,72,74,108,140,148,152,157],enter:[30,140,148,151],enterpris:[27,38,47,79,80,81,131],entir:[19,22,53,58,84,93,108],entiti:101,entri:[20,28,29,64],enumer:[64,103,140,144,148],env:[6,18,27,36,72,108,146],env_pars:27,environ:[6,16,17,19,25,29,36,37,38,39,40,41,42,47,53,60,72,79,80,81,97,98,99,102,104,108,111,131,140,146,148,157,158],ep:19,epoch:[19,20,22,24,28,30,31,32,41,43,53,55,61,62,65,70,72,82,85,93,94,102,103,139,140,142,147,148,158],epoch_loop:103,epoch_metr:64,equal:[19,30,108],equip:84,equival:[3,8,48,63,64,72,74,103,140,148],errd:[65,108,139,142],errd_fak:[65,108,139,142],errd_real:[65,108,139,142],errg:[65,108,139,142],error:[0,6,12,16,17,19,22,29,38,57,64,101,102,140,148],error_handl:30,es:72,esoter:65,especi:[3,67,72,149],essenti:[12,22,43,69,84,93,94],estim:[20,22,72,103],estimated_stepping_batch:65,et:64,eta:47,etc:[6,16,17,20,22,43,53,55,61,63,64,65,68,72,74,77,84,97,99,101,102,103,107,139,140,142,147,148,149,152],ethernet:8,eval:[23,53,64,82,83,145,147],evalu:[4,16,17,19,22,30,31,61,64,69,72,84,103,106,147,149],evaluate_from_fil:84,evaluationepochloop:103,evaluationloop:103,even:[0,19,22,41,46,47,53,61,64,65,107,139,142],event:[41,72,84],eventu:149,ever:[6,74,77],everi:[6,19,22,27,30,53,55,58,62,63,64,65,70,72,
74,84,95,96,101,102,103,139,142,144,157,158],every_n_epoch:55,every_n_training_step:55,everyth:[6,41,43,53,72,76,84,102,109,140,148],everywher:47,evolv:87,ex:101,exact:[30,43,55,72,74,83,107,149],exactli:[6,41,64],exampl:[0,3,4,6,9,11,12,15,16,17,19,20,22,27,28,29,36,37,39,43,45,46,49,53,55,56,57,58,63,65,69,72,74,77,82,84,88,92,94,96,97,98,99,100,101,102,104,107,108,139,142,147,149,153,160],example_imag:64,example_input:64,example_input_arrai:[77,80,100],except:[6,16,17,19,30,38,72,93,101,103,107,145,155,160,161],excess:[140,148],exchang:6,exclus:[3,11,72,108],execut:[8,9,11,16,17,29,64,65,72,74,77,93,104,140,148],exist:[4,22,72,96,97,98,100,101,103,106,109],existingcometexperi:97,exit:[20,30,31,108],exp:99,exp_dir:84,exp_manag:84,expand:154,expect:[19,22,28,43,74,103],expens:43,experi:[6,12,29,30,36,37,38,39,45,46,61,64,72,73,78,96,97,98,99,100,101,102,108,109,121,129,161],experiment:[4,12,16,17,21,29,41,54,69,90,92,104],experiment_id:98,experiment_kei:97,experiment_nam:[97,98,155,160,161],experimentwrit:96,expert:[1,2,25,33,35,40,48,49,51,65,66,78,84,92,106,109,113,125,126,127,135,139,142,143,147,150,156],expertis:[65,91,109,139,142],explain:[19,29,102,103],explan:[22,64,99,108],explicit:[16,17,30,61,145,149],explicitli:[6,63,64,72,74,101,102,145,157],explod:22,explor:[73,91,110,114,117,124,128,132],exponentiallr:[28,64],export_param:[64,80],expos:[4,19,43,92,104,106],express:103,extend:[4,25,28,29,54,64,72,73,84,86,91,92,93,99,106,124,126,154],extens:[29,105],extra:[19,31,43,64],extra_parameters_her:22,extract:[56,64,84,102,107,140,148],extractor:[23,56,64],extrem:[19,58,64,84],ey:0,f:[20,55,56,60,64,76,84,89,92,140,144,145,148,153,159],face:[140,148],facebook:[4,72],facilit:12,factor:[53,65,158],factori:86,fail:[0,30,31,41,72,96,98,99,100,101,102],failur:[19,30,41,43,140,148],fairli:19,fairscal:90,fake_data:18,fake_imag:[155,160,161],fake_image_batch:147,fake_label:[65,108,139,142],fakedataset1:32,fakedataset2:32,fall:[69,98],fals:[4,9,15,21,28,31,36,53,58,60,6
4,65,70,72,74,77,84,97,99,100,101,102,107,108,139,140,142,148,157,159],familiar:103,fanci:103,fancier:64,fancyadam:32,faq:[1,14,25,40],far:107,fashionmnistdatamodul:85,fast:[16,17,22,43,79,88,131,149],fast_dev_run:[31,63,77],faster:[3,6,8,12,19,22,49,66,67,72,73,77,91,108,128,130,132,157],fasterrcnn:86,fastest:103,fault:[6,33,47,53,91,104,109,124,135,140,148],favor:93,fc:23,fc_dropout:84,feat_dim:32,feat_in:84,featur:[6,19,22,23,28,29,41,43,55,56,64,81,88,96,97,98,99,100,101,104,114,138,140,146,148],feature_extractor:23,feedback:[19,140,148],feel:[6,55,72,83,84,140,148],fetch:[43,72,107,152],few:[0,6,19,30,31,45,46,63,64,72,77,78,84,93,102,103,107,131],fewer:108,ffmpeg:84,fiction:92,field:22,fig:22,figur:[5,22,30,63,140,148,149,152],file:[0,16,17,22,25,28,30,31,32,38,45,46,48,52,55,57,63,64,71,72,74,87,93,94,96,97,98,99,100,101,102,140,144,148,149,152,155,157,160,161],file_path:[64,81],filehandl:[57,102],filenam:[55,152,153,154],filepath:[72,80,102],filesystem:[27,52,109,114],fill_:154,filter:[84,108],filter_channel:84,filter_channels_dp:84,filterwarn:108,final_block:19,final_metr:64,final_valu:64,financ:84,find:[0,3,6,19,22,33,46,48,53,55,72,73,77,91,93,99,103,108,109,128,129,132,135],find_packag:6,find_unused_paramet:[4,21],finder:72,fine:[15,45,46,55,84,88,90,93,103],finetun:[22,23,73,84,103,109],finish:[16,17,29,60,72,74,96,98,99,100,101,102,103,151],finit:69,firewal:[38,39],first:[3,6,8,16,17,19,27,28,29,38,39,40,41,42,45,46,48,63,64,65,70,72,74,84,97,99,102,103,107,149,153,155,157,159,160,161],fit:[6,9,11,13,16,17,18,19,20,22,23,26,27,28,29,30,31,32,36,41,52,53,54,55,56,58,60,63,64,71,74,77,83,84,92,93,99,103,104,140,144,145,147,148,152,153,157],fit_loop:[64,103],fitloop:103,five:[16,17,74,140,148],fix:[0,6,12,19,72,78,87,108,146],flag:[3,9,11,13,16,17,18,19,27,36,58,63,64,102,107,108,109,147,157],flash:[45,46,86,109],flatten:[23,69],flavor:86,flavour:19,flexibl:[65,69,90,103,139,142],float16:[20,69],float32:[69,72],flow:[19,38,39,93,103,149],flush:[72,96,100,
102,159],flush_logs_every_n_step:[96,102,157],flush_sec:100,fly:103,fn:[16,17,72],fname:84,focus:[4,20],fold:103,folder:[46,87,88],follow:[0,4,5,6,16,17,18,19,26,28,29,30,31,36,38,41,43,45,53,63,64,65,72,74,80,87,89,90,93,94,96,97,98,99,100,101,102,103,106,107,108,139,140,142,144,145,146,148,151,154,155,158,160,161],foo:[64,72],footprint:[22,69,72,108,140,148],forc:[6,41,72,108,154],forecast:86,forg:[99,109,146,147,155,160,161],forget:[0,36,159],fork:87,forkingpickl:0,form:[12,19,99,101],format:[3,9,16,17,19,26,29,31,43,64,69,70,72,80,96,99,100,155,159,160,161],former:64,forward:[0,6,11,15,19,20,22,23,31,43,56,62,65,68,69,72,76,80,81,83,84,97,100,103,107,139,140,142,144,145,147,148],found:[16,17,19,22,29,39,53,64,82,97,99,102,103,105],four:[70,84],fp16:19,fp16_compress_hook:19,fp16_compress_wrapp:19,fp32:[9,69],fp32_file_path:9,fp:0,fpn:88,fraction:[20,72,77],fragment:19,frame:64,framework:[6,8,30,63,69,88],free:[6,16,17,19,36,37,38,39,41,44,45,46,49,55,72,82,83,158],freed:19,freez:[23,88,103],french:101,freq:84,frequenc:[58,64,65,101,139,142],frequent:[1,14,25,40,103],friction:90,friend:77,from:[4,6,9,11,12,13,15,16,17,19,20,21,22,24,25,28,29,30,31,36,37,39,41,43,46,54,55,58,60,61,62,64,65,67,70,71,72,73,74,76,77,78,85,86,88,91,92,93,94,96,97,98,99,100,101,104,105,106,107,108,109,123,136,139,140,142,144,145,147,148,149,151,152,153,154,155,157,159,160,161],from_:88,from_argparse_arg:[63,72],from_fold:[88,103],from_pretrain:[23,84],fromag:101,fsdp:[4,19,118,141],fsspec:[52,71,109,157],fuel_capac:26,full:[5,6,11,16,17,18,19,26,27,30,31,53,61,64,72,77,84,85,93,102,103,105,140,144,148,149,152,153,155,158,160,161],full_out:6,fulli:[4,5,6,8,11,12,16,17,20,29,47,53,84,103,106,140,145,148],function_to_debug:77,further:[11,20,58,69],furthermor:[28,29,107,140,148],fusedadam:19,futur:[12,19,43,64,74,87,97,140,146,148],g:[4,16,17,22,28,29,61,64,65,72,74,93,94,96,98,99,100,101,102,104,106,108,139,140,142,148],g_loss:[65,108,139,142],g_opt:[65,108,139,142],g_x:[65,108,139,142],ga
in:[13,26,113,129,143],galaxi:107,game:3,gamma:28,gan:[32,63,64,85,103,108,149],ganmodel:61,gantask:64,gather:[6,19,64],gaudi:[9,91,110],gb:[45,46],gc:[52,71,157],gcloud:[16,17],gcp:19,gcsf:71,gear:84,gen:84,gen_discrimin:28,gen_imag:64,gen_loss:64,gen_opt:64,gen_optim:28,gen_sch:64,gener:[16,17,22,26,28,29,35,36,38,43,48,60,61,64,65,72,74,77,84,93,97,99,103,108,133,139,140,142,148,153,154,157,158],generate_spect:84,generate_spectrogram:84,generated_imag:[155,160,161],generator_network:63,geograph:84,geometr:[22,86],geopolit:84,get:[0,6,8,12,16,17,19,22,28,43,47,53,64,67,70,72,77,78,82,84,88,96,97,98,99,100,101,102,103,105,108,134,140,144,148,149],get_device_stat:92,get_input:80,get_lm_model:84,get_metr:[102,157],get_ordin:18,get_parallel_devic:92,get_pretrained_lm_models_list:84,get_tokenizer_list:84,get_train_batch:152,getcwd:[18,64,72,74,102,144,147],getlogg:[57,102],git:[46,84],github:[6,22,46,55,64,84,87,146,149,159],give:[16,17,29,30,48,53,55,64,78,93,102,103,157],given:[19,27,28,29,30,64,72,74,93,97,101,103,104,108],gke:146,global:[22,29,37,53,64,72,78,140,148],global_rank:[37,76,140,148,157],global_step:[55,65,102,103,158],global_zero:64,gloo:[4,6,106],glossari:12,glow:84,glow_tt:84,glowtt:84,glowttsmodel:84,glue:84,go:[16,17,28,48,49,58,78,103,149],goal:63,goe:[64,102,111,140,148],gone:158,good:[0,22,28,29,30,36,64,65,78,108,139,140,142,148,149],goodgan:63,googl:[6,52,71,72,84,101,146,155,157,160,161],googleapi:[16,17],got:[140,148],gpt2:85,gpt:[19,85],gpu:[0,12,15,16,17,18,21,33,36,38,39,49,63,64,67,69,73,74,76,82,83,84,85,87,91,92,106,109,110,128,134,141,146,147,152],gpu_0_batch:6,gpu_0_pr:64,gpu_0_predict:64,gpu_1_batch:6,gpu_1_pr:64,gpu_1_predict:64,gpu_2_batch:6,gpu_3_batch:6,gpu_model:6,gpu_n_pr:64,gpu_num:6,gpu_transform:[64,74],gpuacceler:72,grace:72,grad:[22,62,64,65,69,72,103,147],grade:84,gradient:[6,12,62,64,68,69,72,101,103,108,140,148,155,160,161],gradient_allreduc:6,gradient_as_bucket_view:19,gradient_clip_algorithm:[22,64,65,72,78],gradient_
clip_v:[22,64,65,78],gradientaccumulationschedul:[22,62,65],grain:[55,103],granular:[129,154],graph:[6,12,16,17,22,64,86,97,100,101,102,108,155,157,160],graphcor:[12,13],graphic:3,gre:36,great:[48,64,101,103,108],greater:[72,99],greedy_predict:84,green1:[70,159],green_yellow:[70,159],grep:[16,17],grey82:70,grid:[33,36,37,38,39,41,42,44,47,49,64,109],grid_search:36,griffin:84,ground:[19,24,103],group:[6,18,28,29,64,72,100,101,102,141,157],grow:[31,32,74,84],gs:71,guarante:[30,85],guess:149,guesswork:22,guid:[3,5,6,8,12,15,16,17,18,24,30,38,47,64,72,84,86,97,99,103,108,109,146,147,151],guidanc:22,h:[6,23,27,31,64,153],h_cl:23,ha:[0,6,8,11,12,15,16,17,19,20,22,23,26,28,29,30,38,43,45,46,48,49,53,55,60,61,63,64,69,72,77,78,81,84,89,90,93,98,99,100,102,103,107,108,140,148,149,152,158],habana:[8,9],habit:0,had:58,hadoop:71,half:[13,67,69,72,73,109,130,140,148],hand:149,handi:81,handl:[0,4,16,17,19,22,27,28,41,42,43,52,64,65,69,71,72,74,84,103,106,107,139,140,142,144,148,149,157],hang:[140,148],happen:[22,61,62,64,65,69,72,97,108,140,148,154],happi:55,hard:[11,103,108],harder:22,hardwar:[1,3,4,6,7,8,10,14,16,17,41,64,72,73,91,92,106,115,124,134,145],hasattr:84,hasn:[28,61],havana:[91,110],have:[0,5,6,8,9,12,13,15,19,22,23,24,26,28,29,30,31,32,39,41,42,43,47,48,52,55,61,63,64,65,72,74,80,81,84,85,92,93,97,99,101,103,105,107,108,109,140,141,145,146,148,149,159],haven:107,hccl:8,hdf:[71,72],head:[84,88,103,146],healthcar:84,heavili:12,height:158,hello:158,help:[0,3,13,19,22,27,28,29,30,31,47,55,61,63,64,65,78,84,91,108,128,130,141,149,151,152],helper:[39,147],henc:[18,108],here:[0,6,18,19,20,22,23,27,28,32,36,37,38,43,45,46,48,49,57,61,62,63,64,65,69,72,74,77,82,84,91,92,93,94,95,102,103,105,107,108,123,139,140,142,148,149,153,154,155,158,160,161],heterogen:8,hf:90,hh:72,hidden:[64,103,107],hidden_channel:84,hidden_s:[23,64],hidden_st:[64,84],hierarch:[64,99],high:[12,19,88,90,108,157],higher:[6,19,67,105,140,148,157],highest:19,highli:[12,19,55,67,84],hint:[28,29,30,145],his
togram:[20,101,102,155,160],hit:19,hmp:9,hoc:149,hold:[4,21,22,55,64],home:[16,17],hood:[6,18,19,20,64,65,69,102,103,105,107,108,109,144],hook:[6,15,58,61,65,72,74,94,101,102,103,104,139,145,147,149],horovod:[5,140,148],horovod_fusion_threshold:72,horovodrun:6,host:[11,16,17,18,19,22,27,108],host_list:6,host_node_addr:6,hostname1:6,hostname2:6,hot:[107,149],hour:[5,49,72,84,108],how:[1,3,18,19,22,25,28,29,30,31,33,35,36,38,40,45,46,48,49,54,60,61,63,64,71,72,74,89,91,92,93,96,99,100,103,104,107,108,109,114,120,121,123,125,126,128,134,135,136,140,144,147,148,149,152,156,158],howev:[0,6,15,19,22,29,41,43,44,46,49,58,63,64,65,67,69,72,93,94,103,108,139,142,149,154,158],hp:102,hp_metric:[100,102],hparam:[22,36,53,55,61,63,65,72,74,102],hparams_fil:[61,64],hpu:[72,73,91,92,109,110,147,152],hpu_exampl:9,hpuparallelstrategi:8,hpuprecisionplugin:9,html:[65,101,108,139,142],http:[6,16,17,22,45,46,64,65,84,99,103,108,139,140,142,146,147,148,151,159],huge:[5,64],huggingfac:[23,84,86,90],hundr:[140,148],hunt:149,hydra:[84,86,90],hydra_runn:84,hymenoptera_data:103,hyper:[36,99,101],hyper_paramet:[53,64,83,102],hyperoptargumentpars:36,hyperparam:[36,99,102],hyperparam_optim:36,hyperparamat:48,hyperparamet:[29,30,31,36,48,61,64,72,73,83,96,97,98,100,101,108,109,140,148,155,159,161],hyperparametersmixin:64,hypothesi:20,i:[11,12,20,22,30,48,54,62,63,64,65,89,97,103,108,140,147,148],id:[3,11,37,38,97,98,101,140,148],idea:[36,138,141,149],ideal:30,idempot:64,ident:[140,148],identifi:[4,16,17,21,30,72,84,93,98],idx:92,ie:[0,2,6,22,41,60,61,62,63,65,72,78,108,157],ignor:[19,63,64,65,72,99,100,108,139,142],illustr:[6,29,93,94],imag:[23,48,56,64,72,86,88,93,99,101,102,103,120,121,147,155,156,157,160,161],image_classification_model:103,image_s:88,imageclassifi:103,imageclassificationdata:103,imagefold:107,imagegpt:85,imagenet:[5,32,63,74,77,88],imagenetdatamodul:[74,85],imagenettransferlearn:23,imagin:[56,64,158],img1:101,img2:101,img:[72,99],img_1:101,img_2:101,immedi:[58,84,103,149],impa
ct:[0,19,72],implement:[16,17,19,20,22,28,29,30,43,60,64,65,70,74,78,83,85,87,89,92,93,94,100,102,103,104,105,107,108,139,140,142,148,149,157],imposs:[28,29,30,74],impract:22,improv:[11,19,20,22,29,58,63,64,67,69,72,108,140,148,149,151,157],in_dim:53,in_featur:[23,64,80,81],inbuilt:[15,65],includ:[4,6,8,16,17,19,20,21,28,29,30,52,54,64,65,71,72,77,84,93,94,102,140,147,148,152,157],include_extern:84,incompat:100,incorrect:99,increas:[6,11,13,19,20,22,43,62,65,69,72,89,101,108],independ:[15,22,27,29,55,62,65,80,147,149],index:[3,16,17,22,43,62,64,65,74,102,103,109,140,148,157],indic:[3,43,64,92,103,157],individu:[12,22,64,72,102],indivis:72,industri:[49,91,128],inf:72,infer:[4,11,20,30,31,43,61,72,79,80,84,102,109,131,140,148,149,157],inference_opt:11,inferencesess:80,infin:72,infinit:[58,70,72,108],info:[36,38,72,84,99,102,108,146],inform:[0,4,6,8,11,12,15,16,17,19,21,28,30,37,47,57,63,64,69,74,84,93,94,102,105,154,159],infrastructur:[84,105],inherit:[56,64,102],init:[6,9,23,28,29,30,55,56,58,61,63,64,83,101,155,157,159,160,161],init_arg:[28,29],init_dist_connect:6,init_process_group:157,init_validation_tqdm:[70,159],initi:[6,9,16,17,22,28,29,53,58,60,64,65,72,89,93,102,107,108,140,145,148,157],initial_num_label:103,initialis:[4,21],initialize_distribut:64,inject:[55,63,91,103,110,139],inlin:26,inner:64,inp:81,inpaint:86,input:[3,16,17,19,20,29,61,64,72,80,84,93,97,100,101,140,148],input_arrai:[97,100,160],input_compat:20,input_id:[23,84],input_length:84,input_mask:84,input_nam:80,input_s:64,input_sampl:[64,80],input_sign:84,input_signal_length:84,input_spec:84,input_typ:84,input_type_id:84,insert:[16,17,18,64],insid:[22,28,53,55,64,72,74,84,93,102,108,140,145,148,157,158],insight:[129,151],inspect:[22,64,77,96,100],inspir:22,instabl:[69,72],instal:[6,16,17,18,19,27,30,31,38,64,70,71,72,74,81,85,88,89,90,97,98,99,101,103,109,147,155,159,160,161],install_requir:6,instanc:[6,8,18,28,29,61,64,72,93,94,99,101,102,104,145],instanti:[19,29,30,63,102,103,140,148],instantiat
e_class:28,instantli:64,instead:[6,9,19,22,30,36,52,53,55,58,63,64,65,72,93,96,99,100,103,108,139,140,142,148,149,157,158],instruct:[8,12,16,17,87,149,151],int8:20,integ:[3,64,72,77,84],integr:[4,8,13,16,17,19,35,52,55,68,85,91,92,99,103,105,124,127,141,155,156,157,160,161],intellig:[12,91,110,115,116],intend:[19,28,29],intent:84,interact:[33,45,46,49,63,91,92,99,103,108,128,144,149],interconnect:19,interest:[23,48,64,65,104,158],interfac:[4,8,15,16,17,19,30,31,36,37,63,89,90,93,103,104,105,106],intermedi:[1,7,10,14,19,25,33,35,36,37,51,59,66,75,77,79,109,115,116,117,118,121,122,129,132,133,135,136,138,150,156],intern:[8,9,16,17,19,22,43,52,53,61,62,65,69,70,71,72,89,93,94,98,103,104,105,139,142,149,157],interoper:[140,148],interpol:[29,93],interpret:3,interrupt:[41,53,72,93,108],interv:[6,55,64,103,107,139,142],intro:84,introduc:[19,32,69],introduct:[69,149],introductori:109,intuit:69,invalid:69,invert:84,invok:[22,64],involv:[64,74],io:[4,21,64,72,84],ip:[6,16,17],ipu:[4,64,65,67,72,73,91,92,106,108,109,110,116,139,140,142,146,148,152],ipu_id:11,ipustrategi:[11,13],ipython:108,irregular:86,is_avail:[92,140,148],is_complex:154,is_global_zero:[0,140,148],is_last_batch:[65,108,139,142],is_last_batch_to_accumul:108,isfil:64,isinst:[64,65,74,84,139,142],isn:145,isol:93,issu:[0,5,6,12,16,17,19,30,38,55,64,87,102,108,157],item:[16,17,64,102,107,157,158],iter:[6,11,19,20,22,55,64,72,81,82,103,104,108,141,147,149],iterable_dataset:107,iterabledataset:[43,72,107,108],its:[4,6,8,22,26,28,29,30,43,45,46,53,58,64,72,92,93,103,106,107,140,148,149,153,155,157,159,160,161],itself:[4,38,41,43,64,65,106],jasper:84,jit:[64,81],job:[6,36,47,91],job_id:6,job_nam:36,join:[73,84,87,91,96,100,109,110,123,124,128,147],jpg:[101,103],json:[19,31,84],jsonargpars:[28,29,31],jupyt:[6,16,17,102,108,158],just:[22,28,30,45,46,53,55,64,74,87,93,108],k:[3,6,16,17,22,55,62,64,65,72,77,102,103,108,157],kaggl:[6,146,158],kaggler:88,kaushikbokka:[16,17],keep:[19,22,29,43,64,69,72,78,87,99,103,149],keep
dim:84,kei:[16,17,22,29,53,62,63,64,65,72,83,84,93,94,96,97,98,99,100,101,102,103,107,139,142,152,155,160,161],keithito:84,kept:[64,157],kernel:[16,17,84],key1:101,key2:101,keyboard:72,keyboardinterrupt:[72,93],keyword:[64,96,97,98,100,101],kfold:103,kill:[16,17],kind:[28,31,32,140,148],kind_devic:[16,17],know:[0,19,29,48,58,63,64,74,102,108,149,158],knowledg:109,known:[28,29,67],known_implement:71,kwarg:[53,63,64,74,77,93,94,96,97,98,100,101,102,103,157,159,160],kxn:[22,62,65],l1:[31,64,80,81,144],l1_unstructur:20,l:36,l_length:84,l_mle:84,lab:[33,72,91,108,128],label:[84,101,103],label_epoch_frequ:103,labels_fil:84,labels_hat:64,labelstyp:84,lambda:[0,16,17,53,102],lambdalr:64,landscap:22,languag:[20,86],language_model:[84,90],laptop:72,larg:[3,5,6,8,12,16,17,19,20,22,62,64,65,67,78,84,92,108,140,148],larger:[1,11,12,19,22,48,67,69,77,127,140,148],largest:[22,72],last:[11,16,17,26,53,55,64,72],last_batch_iter:19,latent:93,later:[0,19,55,63,64,69,99,101],latest:[18,36,64,72,81,84,101,141,144],latter:64,launch:[4,5,6,37,84,106,140,148,158],launcher:6,layer1:11,layer2:11,layer3:11,layer4:11,layer:[1,11,15,19,20,23,29,36,48,63,69,72],layer_0:20,layer_0a:20,layer_1:[0,15,20,63,145,149],layer_1_dim:63,layer_1a:20,layer_2:[15,145,149],layer_3:[15,149],layer_:20,layer_dim:63,layer_end:20,layersync:72,lazi:74,lazy_inst:[28,29],lazyproperti:[16,17],lbfg:64,lead:[0,12,16,17,18,19,55,64,67,102,108,151,157],leaf:103,learn:[1,3,6,7,8,10,12,14,16,17,18,19,24,25,26,28,29,30,32,33,35,36,37,38,39,40,43,45,46,48,49,51,53,59,63,64,67,69,71,72,73,75,77,78,79,80,81,86,87,88,89,90,91,92,102,103,105,108,109,110,112,113,115,116,117,118,119,120,121,122,123,125,126,128,129,131,132,133,134,135,136,138,143,147,149,150,152,156,158],learner:103,learning_r:[22,26,27,31,36,48,53,63,64,65,72,84,140,148,160],learning_rate_1:31,learning_rate_2:31,learningratelogg:72,learningratemonitor:[28,64,77],least:[3,6,11,30,38,58,72,108],leav:[12,64,70,82,149],left:[28,30,65,103,139,142,151],legaci:145,leisur:
103,len:[16,17,43,60,64,84,103,153],length:[15,43,61,64,72,84,107],length_scal:84,lengthi:77,lengthstyp:84,less:[8,11,19,43,67,72,84,107,108],let:[5,6,22,23,26,45,46,48,53,61,62,63,64,65,74,92,103,140,148],level:[6,19,22,28,57,58,63,69,72,73,78,88,102,103,110,123,124,128,147],leverag:[19,84,103],lib:[0,16,17],librari:[8,15,16,17,18,19,32,38,69,70,71,72,84,86,92,93,140,148,159],librispeech:84,libsndfile1:84,libtpu:[16,17],lifecycl:13,light:[42,48,91,110,113],lightn:[0,2,3,4,6,8,9,13,15,16,17,18,19,20,21,23,24,25,27,28,29,32,33,36,37,38,39,41,42,43,44,47,49,52,53,54,55,56,57,61,64,65,66,68,69,70,71,72,73,78,79,82,84,86,87,91,92,93,94,97,99,100,102,104,105,106,108,110,111,113,122,123,124,126,127,138,139,142,143,144,149,155,157,158,159,160,161],lightning_checkpoint:102,lightning_log:[19,72,96,97,98,100,102,147,155,158,160,161],lightning_model:19,lightning_modul:[56,64,103],lightning_script:41,lightningargumentpars:29,lightningcli:[27,28,31,32],lightningdatamodul:[22,25,28,31,61,72,109,136,140,145,148,149],lightninglit:109,lightningloggerbas:[28,72,96,97,98,99,100,101,159],lightningmodel:[140,148],lightningmodul:[0,4,5,6,11,15,16,17,19,20,22,25,28,29,31,36,38,43,52,55,56,58,60,61,65,69,72,74,76,80,81,83,84,89,93,96,97,98,99,100,101,103,104,106,108,109,113,122,136,138,139,140,142,143,145,148,152,153,155,156,158,160,161],lightningoptim:[64,65,108,139,142],lightningtemplatemodel:36,lightweight:87,like:[0,6,16,17,19,22,27,28,29,30,31,32,36,39,43,48,52,53,54,55,57,61,63,64,69,70,71,72,73,74,77,84,91,92,93,97,99,100,101,102,103,104,105,107,108,113,124,128,140,143,148,149,152,154,157,158,159],lim:84,limit:[0,5,6,16,17,19,20,55,64,67,72,81,108,140,148,158],limit_:107,limit_predict_batch:72,limit_train:72,limit_train_batch:[77,147],limit_val_batch:[77,107],line:[0,6,15,16,17,19,28,29,30,31,36,63,64,77,84,108,140,141,148],linear:[11,15,19,20,23,31,63,64,77,80,81,103,140,144,145,147,148,149],linear_lay:19,linearli:22,linearlr:32,linearregress:85,lineno:152,link:[6,16,17,28,29,46,72
,87,103,140,148],link_argu:29,link_to:28,linux:[84,87],linux_x86_64:[16,17],list:[3,4,6,9,16,17,22,23,28,43,55,61,64,72,74,83,84,87,101,102,103,105,106,107,140,148,152,155,160,161],list_available_model:84,list_of_load:107,listcomp:152,litadam:32,litautoencod:[55,56,60,64,144,147],litcallback:52,litclassifi:[9,64,74],litdatamodul:[22,74,95],lite:147,liter:64,litlogg:159,litlrschedul:32,litmcdropoutmodel:[64,81,82],litmnist:[63,64],litmodel:[0,5,22,43,52,53,55,58,61,63,64,69,76,77,82,98,99,107,139,145,149,155,157,158,160,161],litmodul:101,litprogressbar:[70,159],littl:[88,90],live:149,lj:84,ljspeech:84,ll:[19,28,39,42,45,46,48,53,112,130,131,132,133,152],lm:84,lm_checkpoint:84,lo:36,load:[12,19,22,36,43,51,52,53,54,55,60,61,63,64,71,72,73,74,81,83,84,93,94,97,101,102,104,108,109,122,145,157],load_checkpoint:[4,21,54],load_data:64,load_dataset:74,load_dataset_from_disk:74,load_from_checkpoint:[23,53,55,61,82,101,147],load_modul:36,load_nvprof:154,load_state_dict:[83,94,95],loader:[18,61,64,72,84,107],loader_1:107,loader_2:107,loader_a:[43,64,107],loader_b:[43,64,107],loader_c:107,loader_d:107,loader_n:64,loaders_a_b:107,loaders_c_d:107,loc:[53,102],local:[0,8,16,17,19,22,30,37,46,52,71,72,76,84,96,97,98,99,100,101,102,140,148,157],local_devic:[16,17],local_nvm:19,local_rank:[6,37,72,74,140,148],localhost:[6,16,17,18,147,151],localservic:[16,17,18],localsgd:19,locat:[22,98],lock:6,log:[12,22,43,52,55,56,58,60,61,63,71,72,84,85,89,93,96,97,98,99,100,101,108,109,129,140,145,147,148,154,155,156,158,159,160,161],log_cod:97,log_dict:[65,84,102,108,139,142,158],log_dir:[96,100],log_every_n_step:[102,157],log_freq:101,log_gpu_memori:72,log_graph:[97,100,101,160],log_hyperparam:[96,97,98,99,100,101,102,159],log_imag:[64,101,155,160,161],log_metr:[64,72,96,97,98,99,100,101,102,159],log_model:[101,155,160,161],log_model_checkpoint:99,log_model_summari:99,log_path:36,log_prob:84,log_tabl:101,log_text:101,logdet:84,logdir:[84,102,147,151,158],logger1:[155,160,161],logger2:[155,160,
161],logger:[26,28,31,57,63,71,77,90,92,96,97,98,99,100,101,109,147,155,159,160,161],logger_registri:28,logging_interv:28,logic:[12,22,28,43,54,61,64,65,72,74,92,93,103,105,139,140,142,148,149],login:[6,45,46],logisticregress:85,logit:[0,23,84,85],logprobstyp:84,logw:84,logw_:84,longer:[22,43,64,151],look:[2,3,6,8,9,11,12,13,15,16,17,18,19,22,23,26,29,30,31,32,42,45,46,48,49,50,55,57,67,68,69,71,72,83,84,103,104,140,148,149],lookup:0,loop:[19,24,43,53,58,59,72,73,77,78,84,91,92,93,107,109,110,120,141,145,148,150],loss:[0,6,11,12,13,20,22,31,55,56,58,62,64,65,69,72,83,84,85,93,99,101,102,103,107,139,140,142,144,145,147,148,158],loss_fn:[140,148],loss_funct:[103,140,148],loss_fx:63,loss_mask:84,loss_valu:84,lost:[30,69],lot:[16,17,19,63,77,82,84,149],lotteri:20,low:[6,16,17,19,41,157],low_precision_decentr:6,lower:[16,17,19,20,55,67,69,105,108],lowest:22,lr:[6,19,28,31,36,53,64,65,72,74,84,99,139,140,142,144,147,148,149],lr_find:[22,72],lr_find_kwarg:72,lr_finder:22,lr_scale:[64,65],lr_schedul:[28,32,65,139,142,145],lr_scheduler_config:[64,65,139,142],lr_scheduler_registri:32,lr_scheduler_step:65,lrschedul:32,lsof:[16,17],lstm:[64,107],m60:49,m:[6,16,17,18,39,48,72,84,108,153],machin:[3,5,12,18,19,20,22,26,33,36,37,38,39,41,44,45,46,50,55,64,72,75,78,80,81,84,89,91,92,103,108,123,134,135,140,148],made:[19,43,64,97],magnitud:[19,22,78],mai:[0,4,6,16,17,19,22,36,41,63,64,65,69,72,84,87,102,106,107,108,139,142,157],mailto:[41,42,44,46,47,49],main:[6,16,17,22,26,27,30,31,32,36,39,48,55,63,64,70,72,74,84,103,108,140,148,149],main_address:[37,72,140,148],main_port:[37,72,140,148],mainli:[4,37,92,101,106],maintain:[6,19,69,72,93,146],major:[5,33,52,65,78,108,140,146,148,149,157],make:[3,5,9,12,16,17,19,20,22,28,29,30,32,36,40,42,43,53,55,60,61,62,63,64,65,72,74,84,88,91,105,107,108,113,124,139,140,142,143,145,148,149,151,156,159],make_grid:64,manag:[4,11,19,31,35,37,54,64,65,68,73,78,92,106,108,109,121,129,133,139,140,142,148,149,156,158],mani:[3,6,12,15,16,17,19,22,28,29,30
,32,33,36,38,41,45,46,48,49,50,55,63,64,65,69,72,74,77,84,85,90,100,103,108,135,149,154,155,157,160],manifest_filepath:84,manual:[0,6,28,36,64,69,72,74,93,101,103,113,140,143,147,148],manual_backward:[65,108,139,142],manual_se:[60,140,148],manuallyargsmodel:64,manualoptim:103,map:[43,64,72,107],map_loc:[53,61,64,102],mappingproxi:[16,17],mark:84,mask:[86,99,101,103],massiv:[2,10,11,14,19,117],master:[64,91,110,146],master_addr:[6,38,39],master_address:37,master_port:[6,36,37,38,39],match:[15,19,31,32,64,74,91,105,107,108,140,148],materi:[140,148],math:8,mathemat:[3,78],matrix:[8,16,17],matrix_approximation_rank:19,matter:[6,28,64,140,148],max:[55,58,64,72,101,108,153,158],max_depth:[72,77,99],max_epoch:[15,16,17,26,27,64,84,88,99,103,108,140,141,147,148,153],max_len:153,max_lr:65,max_passeng:26,max_queu:100,max_seq_length:84,max_siz:6,max_size_cycl:[72,107],max_spe:26,max_step:[27,52,64,71,84,103,108],max_tim:108,max_trial:22,maxim:77,maximum:[12,22,72,78,149],mayb:74,mc_iter:[64,81,82],md:64,mean:[0,3,6,11,16,17,19,22,28,29,30,38,64,69,72,81,82,85,102,108,140,146,148,152,154,157,158],meant:[29,93,94],measur:[43,96,97,98,99,100,101,154],mechan:[5,28,65],media:101,medic:86,meet:[140,148],megatron:84,mel:84,melspectrogramtyp:84,mem:36,memlock:84,memori:[8,9,15,16,17,20,22,62,64,65,66,67,69,72,73,84,90,107,108,109,130,140,148,152,157],mention:[18,30,64,87],merg:[20,64],messag:[15,28,29,30,31],met:58,meta:[4,103,109,113,143,147],metadata:[16,17,99,107,155,160,161],method:[0,4,6,15,22,29,32,38,43,53,54,56,58,60,61,63,65,70,74,81,83,84,88,92,93,95,96,97,98,99,100,101,102,104,106,107,108,113,139,143,145,152,153,157,158,159],metric:[0,6,13,16,17,43,55,56,58,61,65,70,72,96,97,98,99,100,101,102,108,109,120,121,129,139,140,142,148,156,159],metric_1:102,metric_2:102,metric_attribut:64,metric_n:[64,158],metric_to_track:[64,65],metric_v:64,micro:[11,47],microsoft:[4,71,80],mid:[72,108],middl:[22,41],might:[6,16,17,19,29,30,36,63,64,72,74,93,102,103,140,148,149,157],migrat:[99,113
,143],millisecond:151,mimic:[20,72],min:[55,58,64,65,108,158],min_:72,min_delta:58,min_epoch:[27,108,141,147],min_max:72,min_siz:[6,72],min_step:[27,103,108],mind:[12,69],mingpt:19,mini:22,minibatch:5,minim:[9,19,20,28,65,90,139,140,142,148],minimum:[19,22,69,72,103,108,140,148,157],minut:[48,64,72],misbehavior:6,miscalcul:[140,148],misclassified_imag:99,misconfigurationexcept:[16,17,64,74,97,101],miss:[8,16,17,93,94],mississippi:84,mistak:30,mit:72,mix:[7,10,22,25,31,64,66,72,84,91,102,115,116,128,132,136,140,144,147,148,157],mk1:146,mkldnn:69,ml:[49,88,97,98],mle:83,mlf_logger:[98,155,160,161],mlflow:[98,102],mlflow_tracking_uri:98,mlflowlogg:[155,160,161],mlp:[93,99],mlrun:98,mm:[69,72],mnist:[9,12,18,22,24,32,55,60,63,64,74,86,101,140,144,147,148,152,155,160,161],mnist_ful:74,mnist_load:64,mnist_predict:74,mnist_test:74,mnist_train:74,mnist_val:74,mnistdatamodul:[9,22,74],mobil:20,moco:86,mocov2:85,modal:90,mode:[0,3,5,6,18,22,38,55,58,64,65,72,97,99,101,102,107],model1:[32,61],model2:[32,61],model:[1,2,3,4,5,6,8,9,10,12,13,14,15,16,17,18,20,22,23,25,26,27,29,33,35,36,37,38,39,41,42,43,47,48,52,53,54,55,56,58,63,64,65,66,67,69,70,71,72,73,74,86,89,90,91,93,94,97,99,100,101,102,103,106,107,109,110,111,115,116,117,118,119,120,123,127,128,130,132,133,134,136,139,140,141,142,145,147,148,153,155,156,158,161],model_averaging_period:19,model_backbon:48,model_backward:152,model_config:27,model_copy_gpu_0:6,model_copy_gpu_1:6,model_copy_gpu_2:6,model_copy_gpu_3:6,model_di:64,model_gen:64,model_nam:[63,84],model_registri:32,model_trac:64,model_weight:83,modelcheckpoint:[51,54,55,64,72,99,101,102],modelprun:20,modelpt:84,modelsummari:[72,77],modern:[72,108,140,148],modif:[30,72,103],modifi:[5,6,9,19,54,58,64,72,74,91,93,103,107,110,112],modul:[0,6,15,22,28,29,32,36,56,57,61,72,74,77,81,84,93,101,102,108,109,136,140,145,147,148,149],modular:[26,31,91,128,145,149],modulenotfounderror:[97,98,99,101],modules_to_fus:20,molecul:101,moment:[16,17,22,28,29],monai:86,monei:[3,8,12,
40,108],monitor:[29,32,55,58,64,65,72,101,102,108,129,158],monolingu:20,mont:[64,81,82],month:[41,63],more:[0,3,6,8,9,11,12,15,16,17,18,19,20,22,24,27,28,29,30,31,32,43,47,48,53,57,59,64,65,67,69,71,72,74,87,88,90,92,97,99,101,102,103,104,105,107,108,129,139,140,142,145,146,147,148,153,154,158,160],most:[6,12,16,17,19,24,30,53,54,64,65,69,71,72,99,108,139,142,152,158],mount:[19,108],move:[0,12,15,16,17,18,64,72,74,76,100,103,108,140,148],move_data_to_devic:[64,74],move_metrics_to_cpu:72,move_to_devic:[140,148],mp:6,mpi:[4,106],mpirun:6,mse_loss:[60,144,147,154],mseloss:[56,64],much:[6,19,22,64,69,72,74,84,85,93,108,152],multi:[1,7,10,14,36,38,39,47,64,72,74,84,115,116,134,140,147,148],multipl:[0,6,19,20,22,27,29,30,32,36,38,46,48,64,70,72,73,74,84,89,90,92,93,94,99,101,102,103,105,108,109,118,134,140,141,146,148,157,158],multiple_trainloader_mod:[72,107],multipli:[16,17,19],multiprocess:[0,22,108],must:[8,11,12,19,26,28,29,31,32,36,41,42,44,46,49,58,64,69,72,74,93,94,103,107,108],mutabl:[28,29],mutual:11,my:[48,55,72,84,147,159],my_bucket:[52,71,157],my_checkpoint:[53,61,72],my_cli_default:27,my_cool_pickable_object:[52,64],my_custom_act:153,my_data:108,my_datafram:101,my_dataload:20,my_early_stop:29,my_env:[63,146],my_exp_nam:96,my_fil:6,my_fit_default:27,my_loss:102,my_lr_arg:72,my_metr:[55,102],my_model:[16,17,18,100],my_new_hook:103,my_path:74,my_program:108,my_project:99,my_reduced_metr:0,my_saved_deepspeed_checkpoint:19,my_valu:22,my_workspac:99,myacceler:[4,106],myaccuraci:157,mybucket:72,myclassmodel:29,myclust:[72,140,148],myclusterenviron:37,mycod:28,mycustomdistributeddataparallel:[4,72,106],mydatamodul:[27,28,29,61,108],mydatamodulebaseclass:28,mydataset:[140,148],mydecod:28,myearlystop:58,myencod:28,myepochloop:103,myfancyloop:103,mygener:63,mygradientdescentloop:103,mylightningcli:[28,29],mylightningmodul:[11,13,16,17,18,53,55,61,64,72,160],mylogg:102,myloop:103,mymainmodel:[28,29],mymodel:[6,19,22,27,28,29,30,54,64,65,82,89,107,139,140,142,148,153],my
modelbaseclass:28,mymodelclass:22,mymodul:[155,160,161],myownacc:72,myprecisionplugin:[4,106],myprintingcallback:93,n:[6,22,55,62,64,65,72,84,139,142,147,153,157],n_batch:[64,89],n_critic:64,n_mel:84,n_optim:64,n_vocab:84,name:[6,28,29,45,46,61,63,64,72,77,80,87,92,93,94,96,97,98,99,100,101,102,107,108,154,157,159],name_for_squeu:36,named_paramet:64,namedtemporaryfil:64,namespac:[53,63,64,96,97,98,99,100,101,102],nan:[58,72],nativ:[20,36,49,64,65,72,139,142],natur:107,navig:[45,46],nb_trial:36,ncall:152,nccl:[4,6,36,38,106,157],nccl_debug:[36,38],nccl_min_nchannel:19,nccl_nsocks_perthread:19,nccl_socket_ifnam:36,nccl_socket_nthread:19,nce:[6,64],nce_loss:64,nearli:22,necessari:[0,19,64,96,98,99,100,101,102,107,108,140,148],need:[0,3,5,6,16,17,18,19,20,22,27,28,29,30,32,36,38,39,43,45,46,48,52,53,55,58,61,62,63,64,65,71,72,82,84,92,93,97,99,102,103,105,107,108,139,140,142,144,145,147,148,149,157],neg:[6,72],neighbor:22,neither:97,nemo_experi:84,nemo_nlp:84,nemo_toolkit:84,neptun:[99,102],neptune_api_token:99,neptune_logg:[99,155,160,161],neptune_project:99,neptune_run_kwarg:99,neptunelogg:[155,160,161],ner:86,nermodel:84,nest:[6,19,64,74,99,103,107],nested_kei:28,net:[0,6,36,64,77,86],network:[16,17,19,22,36,38,39,63,64,69,84,93,108],neural:[16,17,22,63,86,108],neuraltextur:86,neuraltyp:84,never:[61,64,70,72,140,148],nevertheless:[29,30],new_batch_s:22,new_lr:22,new_model:55,new_path:64,new_x:64,newer:108,newli:146,next:[6,11,16,17,20,43,64,72,96,100,103,152,157],ngc:84,nightli:[18,72,87,108,146],nlp:[16,17,74,90,109,147],nn:[11,15,19,20,22,28,29,31,56,63,64,80,81,82,103,140,145,147,148,149],nnode:[6,39],no_grad:[23,64,82,83,84,145],node1:6,node2:6,node:[3,5,6,8,16,17,22,36,37,38,39,47,64,72,74,84,103,108,140,148],node_rank:[6,37,38,39,64,72,74,140,148],noise_scal:84,non:[16,17,22,23,28,29,30,72,78,81,93,103],none:[4,18,19,21,22,30,54,61,64,69,72,74,80,84,93,96,97,98,99,100,101,102,103,140,148,153,157,159],nor:[64,74,97],norm:[19,22,72,78],normal:[16,17,19,22,28,29,5
5,60,64,74,102,159],normalize_confusion_matrix:84,notabl:108,notat:28,note:[0,6,11,16,17,19,22,28,29,55,58,62,64,65,69,72,74,87,93,94,99,107,108,139,142,146],notebook:[6,16,17,84,102,108,158],notic:[19,43,64,78],notifi:87,notification_email:[29,63],novel:84,now:[0,6,27,31,32,42,45,46,48,55,56,63,64,65,74,92,103,139,140,142,146,148,149,151,152],np:[6,80],npredict:147,nproc:6,nproc_per_nod:[6,39],nprofil:153,ntask:36,nuanc:42,num_:107,num_batch:72,num_class:[23,29,64,74,88,103],num_epoch:[26,140,148],num_fc_lay:84,num_featur:145,num_filt:23,num_fold:103,num_gpu:[6,64],num_lay:[63,64,140,148],num_nod:[5,6,36,38,63,84,108],num_process:6,num_replica:18,num_sanity_val_step:77,num_target_class:23,num_trial:48,num_work:[6,84,107,149],number:[0,3,6,8,11,12,16,17,18,19,22,28,29,36,39,43,48,58,60,61,64,65,70,72,74,77,84,96,97,98,99,100,101,102,107,108,140,148,149,151,157,158],numel:157,numer:[69,99,105,108],numpi:[64,72,84,101,140,147,148],nvcc:19,nvcr:84,nvidia:[3,6,19,72,84,108,146],nvme_path:19,nvprof:154,nvvp:154,nyu:72,o1:[9,72],o2:[69,72],o:[20,45,154],obj:0,object:[16,17,19,26,29,31,36,54,55,61,64,65,72,86,92,96,97,98,99,100,101,102,139,140,142,148],observ:[19,29,43,58],observer_typ:20,obtain:[19,22],occupi:[3,72],occur:[55,64],occurr:[140,148,153],odd:65,off:[19,36,72,77,78,103,140,141,148,154],offer:[2,8,19,22,36,37,38,39,41,65,69,88,89,90,102,108,140,148,157],offici:[6,16,17,33,85],offlin:[97,99,101],offload:[4,21],offload_optim:19,offload_optimizer_devic:19,offload_paramet:19,offload_params_devic:19,offset:19,often:[16,17,19,22,32,48,63,64,72,96,103,108,149],old:[16,17,22],omegaconf:[27,64],on_:93,on_advance_end:103,on_after_backward:[102,152,157],on_before_backward:[102,157],on_before_optimizer_step:[102,157],on_before_zero_grad:[102,157],on_epoch:[0,64,89,102],on_epoch_end:93,on_fit_end:152,on_fit_start:152,on_init_start:64,on_load_checkpoint:[52,54,104],on_post_move_to_devic:15,on_run_end:103,on_run_start:103,on_save_checkpoint:[52,54,104],on_skip:103,on_step:[0,
64,102],on_tpu:[64,65],on_train_batch_end:[94,102,152,157,159],on_train_batch_start:[58,72,102,152,157],on_train_end:[58,72,152],on_train_epoch_end:[94,102,152,157],on_train_epoch_start:[102,152,157],on_train_start:[72,102,152,157],on_training_end:152,on_validation_batch_end:[102,157],on_validation_batch_start:[102,157],on_validation_end:58,on_validation_epoch_end:[102,157],on_validation_epoch_start:[102,157],on_validation_start:[102,157],onc:[13,15,16,17,19,27,28,29,33,39,45,46,47,48,49,50,53,58,60,61,64,72,74,80,81,88,102,103,108,135,140,148,151,152,153,158],one:[3,6,11,12,16,17,19,28,30,31,32,48,55,61,63,64,65,70,72,74,77,78,96,97,98,100,101,103,105,107,108,139,140,142,148,155,160],onebitadam:19,onecyclelr:65,ones:[4,26,30,64,65,93,100,103,106,108,139,140,142,148],ones_lik:154,onli:[0,3,6,12,16,17,18,19,20,22,24,27,29,30,31,32,45,46,48,55,56,58,60,61,63,64,65,69,70,72,74,76,77,78,87,93,94,99,101,102,108,139,140,142,145,146,148,149,157,158],onlin:97,onnx:[64,79,91,128,131,147],onnxruntim:80,onprem:[33,41,42,44,46,47,49,133],onto:[11,19,22,72],oom:[22,64],op:[9,16,17,19,154],open:[13,22,43,55,102,151,157],opensourc:158,oper:[6,9,12,16,17,19,52,65,68,69,71,72,74,75,108,132,140,148,150,157],ops_bf16_mnist:9,ops_fp32_mnist:9,opt1:65,opt2:65,opt:[64,65,74,103,139,142],opt_a:64,opt_b:64,opt_idx:93,opt_level:9,opt_list:36,optim:[0,1,4,8,11,12,14,20,25,30,31,43,45,46,47,53,55,58,61,62,63,68,72,74,79,80,81,84,85,90,91,92,93,103,106,108,113,115,116,117,128,129,131,136,140,143,144,147,148,149,156,157],optimize_parallel_cluster_gpu:36,optimizer1:[28,64],optimizer1_init:28,optimizer2:[28,64],optimizer2_init:28,optimizer_closur:[64,65],optimizer_idx:[64,65,103,108,139,147],optimizer_on:64,optimizer_registri:[28,32],optimizer_step:[65,152],optimizer_two:64,optimizer_zero_grad:108,optimizerloop:103,optimum:19,option:[0,1,4,6,7,9,10,14,18,19,21,22,28,29,30,31,36,61,63,64,65,72,74,84,87,90,92,93,94,96,97,98,99,100,101,102,107,115,131,134,139,140,142,148,149,155,160,161],option_1:26
,option_2:26,or_a_fold:6,order:[22,28,29,43,64,65,72,93,94,97,103,107,108,140,148,152],ordinari:19,org:[64,65,108,139,142],organ:[22,64,72,74,87,99,109,140,148],organiz:84,origin:[20,58,108],orphan:4,ort:19,ort_input:80,ort_out:80,ort_sess:80,os:[18,36,37,64,72,74,84,87,96,97,100,102,108,144,147],other:[3,5,11,12,16,17,19,20,22,28,29,32,36,55,63,64,69,72,74,76,84,86,92,93,99,101,102,103,108,140,148,149,155,157],other_stuff:64,otherwis:[32,45,46,52,61,64,72,97,98,100,107,140,148],our:[9,19,23,36,41,44,46,47,49,61,73,84,85,87,88,91,93,104,105,108,109,110,123,124,128,140,147,148,158,159],out:[5,6,8,15,16,17,19,20,22,24,30,31,32,36,37,38,39,53,63,64,69,72,74,77,83,90,93,102,103,107,140,145,146,148,149,152],out_channel:84,out_dim:[26,27,31,53],out_featur:[64,80,81],outer:64,output:[0,6,20,23,26,36,57,64,65,81,84,93,102,103,108,139,140,142,148,152,154,159,160],output_attent:23,output_dir:84,output_path:19,output_result:64,output_typ:84,outsid:[16,17,72,140,148],over:[6,8,18,19,22,28,30,31,43,55,61,64,65,70,72,86,87,88,89,91,102,103,107,111,123,129,139,140,142,147,148,157,158],overal:[6,19,74,93,149],overcom:[12,108],overfit:[59,60,61,72,73,108,109,119,138],overfit_batch:[78,141,147],overflow:108,overhead:[0,19,22,43,62,64,65,102,157],overidden:9,overlai:101,overlap:19,overlap_comm:19,overrid:[4,6,9,11,19,22,29,30,58,64,65,70,72,74,93,102,106,107,108,140,148,153,157,159],overridden:[6,28,29,61,64,96,98,100],overwrit:[53,72],own:[4,9,11,19,20,22,26,28,33,35,36,41,44,46,48,49,64,68,70,72,73,84,90,91,99,102,103,104,105,106,110,124,126,135,140,144,146,148,150,155,156,158,160,161],p100:146,p1:64,p2:64,p3:64,p:[22,62,65,72,84,103,108],pack_sequ:107,packag:[6,9,12,16,17,30,38,39,69,70,80,86,97,98,99,101,109,155,160,161],packedsequ:107,pad:107,page:[49,109,146,151],pai:[6,41,44,46,49],pair:[19,63,64,65,84,139,140,142,148],panda:101,panel:101,paper:[22,60,61,64,72],paradigm:103,parallel:[12,19,48,55,64,72,74,107,109],param:[9,19,36,64,65,77,84,91,96,97,98,99,100,101,102,110,118,149
,159],param_group:[64,65,84],param_requires_grad_st:64,paramet:[0,1,2,4,6,8,9,15,20,21,22,26,28,29,30,31,58,61,63,64,65,72,73,74,90,91,93,96,97,98,99,100,101,102,106,107,108,109,110,123,139,140,141,142,144,145,147,148],parameter_valid:64,params_dict:99,parent:[96,100],parent_pars:[36,63],pariti:19,pars:[3,19,26,28,29,30,37,84,92],parse_arg:[31,36,63,72],parse_devic:92,parse_known_arg:63,parse_tpu_cor:[16,17],parser:[28,29,31,36,63,72,84],parser_kwarg:[27,30],part:[6,29,30,45,46,58,60,61,64,72,84,92,93,94,103,105,140,148,153],parti:[38,69,121,156,160],partial:86,particular:[16,17,28,30,64,67,87,97],particularli:[20,104],partit:[19,103],pascal:108,pass:[4,6,9,11,19,20,21,22,26,27,28,29,36,43,53,54,58,60,61,62,63,64,65,68,70,71,72,74,80,82,83,84,90,92,93,94,96,97,99,100,101,102,103,106,107,108,140,148,149,155,157,159,160,161],passthroughprofil:153,passwordless:6,past:19,patch:146,path:[4,19,21,23,27,28,29,30,31,36,52,53,54,55,61,63,64,71,72,74,83,84,87,96,97,98,100,101,102,108,140,148,158],path_to_data:84,paths2audio_fil:84,patienc:[28,29,58],pattern:64,pdb:[76,77],peak:19,pend:100,peopl:30,per:[3,6,19,24,27,32,36,39,49,55,64,72,74,78,100,102,154,158],per_experiment_nb_gpu:36,per_experiment_nb_nod:36,percal:152,percent:159,percentil:[16,17],perf:154,perf_log:152,perform:[0,6,8,10,13,15,18,19,20,22,30,31,33,48,53,58,61,64,65,68,69,72,74,84,88,90,91,102,103,108,115,128,132,135,139,140,142,145,148,151,157,160],performan:46,permut:36,persist:[93,94],persistent_work:108,person:[84,101,108],pg:[64,65],phase:[61,64,72,108],phenomenon:84,pick:[22,48,63,72,90,98],pickl:[0,93,94],picklabl:6,pickleabl:64,picklingerror:0,piec:[0,6,43,84,150],pil:101,pin_memori:[107,108],pip:[6,16,17,19,27,31,45,46,70,71,84,85,88,89,90,97,98,99,101,103,109,147,155,159,160,161],pipe:19,pipelin:[11,87],pixelcnn:85,pl:[6,9,11,12,13,16,17,18,19,22,45,46,52,53,55,60,61,64,74,81,82,84,85,95,99,103,139,144,145,147,149,158],pl_bolt:[74,85],pl_cli:32,pl_deepspeed_config_path:19,pl_exampl:9,pl_fault_tolerant
_train:[42,104],pl_logger:[102,155,160],pl_modul:[58,72,93,159],place:[11,28,29,30,64,65,72,104,108,149],placehold:100,placement:[140,148],plagu:78,plai:[22,63],plain:[53,74,103],plane:26,platform:[45,46],pleas:[5,6,9,12,19,29,30,41,43,44,46,47,49,64,65,72,74,84,87,88,90,100,102,108,139,140,142,148,157],plot:[22,78,102,158,160],plu:19,plug:4,plugin1:105,plugin2:105,plugin:[4,9,11,21,36,37,64,71,106,108,109],pod:[12,16,17,72,108],point:[19,20,22,53,58,63,64,66,67,69,72,104,105,108,130,140,148,158],pointer:64,pollut:[63,93],pool:19,pop:[16,17,83,102,157],popart:12,popen_spawn_posix:0,poplar:12,poptorch:11,popular:[26,84],port1:6,port:[6,36,38,151],portal:12,portion:[6,60,64,78],pose:86,posit:[28,30,64,72,96,97,98,101,108],posix:30,possibl:[0,3,6,16,17,27,28,29,30,48,63,64,69,92,93,102,107,108,149],possibleuserwarn:108,post:[19,22,68,82,93],post_localsgd:19,post_localsgd_hook:19,postlocalsgdst:19,postprocess:84,potenti:[30,55],power:[12,14,22,36,49,72,90,103,104,108,117,144,158],powersgd:19,powersgd_hook:19,powersgdst:19,pr:87,practic:[22,28,29,30,53,56,60,61,64,65,72,78,103,108,139,142,149],practicion:49,practition:88,pre:[18,22,26,31,32,40,41,42,65,68,82,88,107],prebuilt:84,preced:72,precis:[4,7,10,16,17,19,20,22,53,65,73,84,85,91,106,109,115,116,127,128,130,132,139,141,142,147],precision_plugin:[4,106],precisionplugin:[68,72],pred:[64,81,82,89,145,149,157],predict:[4,19,20,22,23,30,31,53,74,77,79,83,84,91,93,101,103,106,109,123,147,149],predict_data:74,predict_dataload:[72,107],predict_dataset:107,predict_load:74,predict_step:[12,81,82,145,154],predict_step_end:64,predictionepochloop:103,predictionloop:103,predicts_step:64,preemptibl:41,prefer:[47,83],prefix:[30,56,64,96,97,98,99,100,101,102],preinstal:100,prem:[42,47,73,91,109,128],prepar:[1,7,10,14,64,72,74,115,134,140,148,152],prepare_data:[22,72,152],prepare_data_per_nod:72,prepend:[52,157],preprocess:[43,84,108],preprocessor:84,present:[29,64,97],preserv:[30,64],press:72,pretend:[53,92],pretrain:[64,73,84,88,91
,123],pretrained_ckpt_path:64,pretrained_model:64,pretrained_model_nam:84,pretrained_model_name_or_path:90,pretrained_ner_model:84,pretti:93,prevent:[0,22,64,76,102,157],previou:[28,30,43,48,61,64,65,72,101,104,107,139,142],previous:[18,29,100],price:[8,33,41,135],primari:[43,64],primarili:19,primit:[6,12,152],principl:149,print:[16,17,22,28,30,31,32,53,61,70,71,72,76,84,88,89,93,103,147,154,159],print_config:[26,28,30,31],printcallback:72,printtablemetricscallback:85,prioriti:64,privat:[33,38,47,49,126,135],pro:[72,108],probabl:[48,64,103],problem:[12,28,29,30,72,78,88,89,90,108],problemat:30,proce:74,procedur:[22,64,84,140,148],process:[0,3,4,6,8,11,12,16,17,19,28,29,30,36,37,39,43,53,55,57,61,64,65,72,74,76,82,86,91,93,96,98,99,100,101,102,106,107,108,110,115,116,139,140,142,148,157,158],process_group:19,process_group_backend:6,process_obj:0,processed_sign:84,processed_signal_len:84,processing_spe:70,processor:8,produc:[6,19,22,26,64,102,157],product:[25,26,48,49,60,72,73,77,84,91,109,110,131,147],prof:154,profession:26,profil:[64,65,91,109,117,124,128,132,139,140,142,148,150],prog_bar:[64,65,72,84,102,108,139,142,158],program:[16,17,26,63,72,93],programm:8,progress:[12,43,45,46,47,64,72,73,91,104,109,110,112,119,149,156,158],progress_bar:[70,159],progress_bar_finish:70,progress_bar_puls:70,progress_bar_refresh_r:72,progressbarbas:[70,159],prohibit:48,project:[6,16,17,25,26,31,32,56,63,64,74,91,93,97,99,101,107,113,125,128,143,145,149,155,160,161],project_id:[16,17],project_nam:97,prone:29,proof:41,propag:[29,64,103,107],proper:[28,64,102],properli:[43,64,93,94,103,140,148],properti:[37,55,65,80,84,94,96,97,98,99,100,101,102,104,107,139,140,142,148,159],protocol:[0,52,71,157],prototyp:[88,149],prototype_arrai:160,provid:[4,6,8,9,11,12,13,15,19,22,28,29,30,37,39,41,44,46,49,52,63,64,65,68,69,71,72,87,93,98,102,103,105,106,107,108,129,139,140,142,148,154,157,158],prune:[79,109,131],pseudo:[64,72],pseudocod:[6,64,72],pt:[19,24,64,81,88,103,140,148],ptl:84,publish:[6
0,72,146],pull:[53,63,83,84,87,102],punctuat:84,pure:[13,73,79,109,122,140,148],purpos:[36,38,61,72,93,94,108,140,148],push:[2,72,113,143],put:[3,64,72,92,96,97,98,100,101,140,147,148],py3:146,py:[0,6,16,17,18,19,22,26,27,28,29,30,31,32,36,38,39,41,42,45,46,48,63,72,84,90,92,108,152],pyarrow:71,python3:[0,16,17,36],python:[0,5,6,9,16,17,18,19,26,27,28,29,30,31,32,38,39,42,45,46,48,57,63,64,70,81,84,87,90,92,99,101,102,103,107,108,109,140,146,148,152,154],pythonfaulthandl:36,pytorch:[0,4,6,8,9,15,16,17,18,19,20,22,28,31,32,33,38,39,52,53,64,65,71,72,73,74,78,79,80,81,84,85,87,88,89,90,91,99,103,106,107,108,110,113,122,132,139,142,146,149,150,155,157,160,161],pytorch_checkpoint:61,pytorch_lightn:[4,6,9,11,13,15,16,17,18,19,20,21,22,28,29,31,32,36,37,54,55,57,58,62,64,65,70,71,72,74,77,85,92,93,96,97,98,99,100,101,102,103,106,107,108,139,140,142,144,145,147,148,151,152,153,154,155,157,159,160,161],pytorchlightn:[41,42,44,46,47,49,146],pytorchprofil:154,pytorh:78,q3:47,q_adam:6,qadam:6,qadamoptim:6,qat:20,qcb:20,qmodel:20,qualiti:20,quant:20,quantiti:[55,58,96,97,98,99,100,101],quantiz:[79,109,131],quantizationawaretrain:20,quartznet15x5bas:84,quartznet:84,quartznet_15x5:84,queri:[84,101],question:[1,14,25,40,74,84,86,108,149],queue:[64,100],quick:[88,99],quickli:[64,72,84,140,148],quickstart:99,quirk:64,r:[16,17,36,108,159],race:[140,148],rack:12,rais:[16,17,30,64,72,74,97,98,99,101,102],ram:19,ran:[19,48],rand:[64,69,81,108],randint:89,randn:[43,64,80,82,83,89,145],random:[6,43,53,72,80,140,148],random_search:48,random_split:[60,74,144],random_train:32,random_unstructur:20,randomdataset:43,randomiterabledataset:43,randomsampl:43,randomstructur:20,rang:[3,20,43,64,69,72,81,82,89,103,107,140,148,149],rank:[0,18,37,39,55,64,76,102,140,148,154,157],rank_zero_experi:102,rank_zero_onli:[0,55,64,102],rapid:[90,141],rate:[6,16,17,25,28,32,36,43,53,63,64,70,72,136,149],rather:[19,22,54,62,65,69,72],raw:[91,103,109,110,113,143,147],rcnn:99,rdma:8,rdzv_backend:6,rdzv_endpoint:6,
rdzv_id:6,re:[3,12,19,48,63,67,72,152,153,158],reach:[22,58,69,72,91,108,110],read:[6,19,20,22,26,30,32,36,41,42,52,57,71,72,84,87,99,102,103,104,107,108,140,148,157],readabl:[30,63],readi:[45,46,89],real:[60,61,64,103],real_label:[65,108,139,142],realist:[29,43,74],realli:[5,6,19],realpath:36,reason:[5,6,16,17,18,19,29,43,52,72,103,108,149],recal:[48,102,160],recap:63,receiv:[93,96,97,98,100,101],recent:[16,17,26,72,146],recip:[86,88,99,144],recogn:[19,69,72,84,140,148],recognit:[20,86],recommend:[6,19,20,22,30,38,45,46,48,49,55,61,64,65,67,69,72,74,76,81,83,84,99,102,103,108,139,140,142,148,149,154,157],reconstruct:[64,86],record:[19,96,97,98,99,100,101,102,154],record_funct:154,recov:[41,58],recurr:[64,86],recurs:19,red:22,redirect:[57,102,103],reduc:[0,15,20,22,64,69,72,89,102,103,108,140,148,149,152,157],reduce_bucket_s:19,reduce_fx:[64,102,158],reducelronplateau:[32,64,65,139,142],reduct:[0,4,19,43,64,102,106,140,148,157],redund:22,ref:[39,146],refactor:[64,140,148,149],refer:[0,9,16,17,19,22,27,29,47,60,64,74,87,88,90,99,101,102,103,107,108,109,153],refin:69,reflect:99,refresh:[72,151],refresh_r:[70,72],regard:[64,105],regardless:[6,64,72],regist:[0,4,21,25,28,108,127,136,145],register_acceler:92,register_buff:[108,145],register_class:32,registr:[4,21,99],registri:[25,28,32,71,109,125],regressionmodel:20,regular:[24,55,74,76,83,99,145,154],reinforc:[64,65,139,142,147],reinstal:84,relat:[29,107,149],releas:[30,69,84,87,104,146],relev:[6,53,72,140,144,148,149],reli:[6,12,19,22,30,61,64,65,69,93,103,140,148],reload:[63,64,72,74,93],reload_dataloaders_every_n_epoch:64,reload_ext:[102,158],relu:[11,19,20,31,64,80,81,84,144,145,147],remain:[0,5,19,22,62,65,69],rememb:[56,63,64],remot:[27,52,72,98,109,114,157],remote_devic:19,remov:[19,64,72,74,79,82,91,93,101,108,123,140,148,152,155,160,161],remove_checkpoint:54,repeat:[72,84],repeatedli:58,replac:[6,64,72,78,83,99,103,140,148,155,160,161],replace_sampl:[140,148],replace_sampler_ddp:0,replic:[11,16,17,61,64],replic
a:[6,22],replication_devic:[16,17],repo:87,report:[13,16,17,19,30,152,154],report_dir:13,repositori:[30,45,46,87],repres:[22,62,64,65,97,103,107,154],represent:[23,56,64,86,105,140,148],reproduc:[24,28,29,52,63,74,84,89,109,140,148],req:[26,31,32],request:[6,16,17,43,55,58,64,72,74,87,102,103],requeu:36,requir:[5,6,11,12,15,16,17,18,19,20,28,29,30,32,38,43,55,64,65,67,69,72,74,78,84,87,88,91,93,94,97,98,99,100,101,102,103,105,107,108,139,140,142,148,149],requires_grad:108,requisit:[40,41,42],research:[4,16,17,26,33,45,46,49,56,61,65,67,68,72,83,84,86,88,90,91,93,103,109,113,123,128,139,142,143,147],reset:[64,72,89,104],reset_experi:97,resnet18:[48,103,149],resnet50:[19,23,43,48,64],resnet:[23,99],resolv:[12,19],resourc:[16,17,36,67,72,108],respect:[19,29,54,61,65,72,102,145],respons:[4,64,103,105,106],rest:[58,64,69,97,105,149],rest_api_kei:97,restart:[41,42,43,104],restor:[6,19,22,41,43,53,55,64,74,83,84,95,97,108],restrict:152,result:[0,6,12,16,17,19,22,55,61,64,69,72,74,84,93,108,140,148,157],resum:[71,72,101,103,104,140,148],retain:[140,148],retriev:[57,64,93,101,102],return_predict:72,reus:[74,93,107,136,149],reusabl:[74,91,112,128,149],rewrit:144,rich:[70,159],rich_progress:[70,159],richer:93,richmodelsummari:70,richprogressbarthem:[70,159],right:[16,17,18,22,30,37,43,61,62,64,65,72,84,140,148],rigor:[85,89,146],river:84,rl:[64,109,113,143,147],rm:84,rnn:[24,107,149],roberta:19,robust:55,roce:8,root:[6,30,57,60,64,84,98,99,102,108],root_dir:[36,52,96,100,157],rotat:74,roughli:[6,19],round:103,routin:[26,27,30,31,72,105,145],row:[72,102,157],rule:[38,39,60],run:[0,1,3,5,6,7,10,11,14,18,19,22,28,29,30,31,33,41,44,48,55,58,60,61,62,63,64,65,67,69,70,71,72,73,74,76,80,81,84,86,87,91,93,96,97,98,99,100,101,102,107,108,109,110,115,117,123,126,128,134,144,145,146,151,154,155,158,159,160,161],run_fast:31,run_id:[98,101],run_nam:98,run_training_batch:152,run_training_epoch:152,runnam:98,running_mean:145,runtim:[6,11,16,17,19,32,64,80,81,84,87],runtime_vers:[16,17],runt
imeerror:[16,17],rust:6,rwmap:[16,17],s3:[27,45,46,52,71,72,103,157],s3f:71,s:[0,3,5,6,8,16,17,18,19,20,23,26,27,28,29,36,43,45,46,48,49,53,54,55,60,61,62,63,64,65,71,72,74,77,78,84,88,92,93,94,96,97,99,100,103,105,107,108,139,140,142,144,148,149,152,153,155,158,160,161],sacrific:19,safe:[64,74],sai:[5,22,26,48,62,65,78,84],sale:47,same:[0,6,19,26,28,29,30,38,43,48,55,56,61,64,72,74,84,93,94,101,102,103,107,108,140,141,148,155,161],sampl:[6,22,29,43,55,61,64,65,72,74,78,80,101,107,108,139,142,149,158],sample_g:[65,108,139,142],sample_img:64,sample_z:[65,139,142],sampler:[18,43,64,72,78,107,140,148],sampler_it:43,saniti:[64,70,72,93],sanity_check:72,santa:84,satisfi:61,satur:11,save:[3,6,8,9,12,16,17,19,20,22,26,30,33,36,40,51,54,63,64,66,69,71,72,73,81,83,84,96,97,98,99,100,101,102,103,104,107,108,109,119,130,135,149,154,157],save_checkpoint:[4,21,54,55,64,83,88,103],save_dir:[71,72,96,97,98,99,100,101,102,157],save_full_weight:19,save_hyperparamet:[22,53,74,101,160],save_img:72,save_last:[54,55],save_on_train_epoch_end:55,save_path:19,save_top_k:[55,101],save_weights_onli:55,sawyer:84,sbatch:36,scalabl:[89,91,128,130,145,147,149],scale:[0,2,4,6,7,8,9,13,14,19,22,42,45,46,47,53,64,66,68,69,72,73,79,80,81,90,91,92,108,110,115,116,117,118,128,131,132,140,144,148],scale_batch_s:[22,72],scale_batch_size_kwarg:72,scale_gradi:103,scaler:[22,69],scatter:[6,69,74],scenario:[24,43,108],scene:[19,86],sch1:[65,139,142],sch2:[65,139,142],sch:[65,139,142],schedul:[4,6,19,22,25,28,36,43,53,62,64,84,90,106,136,144,149],scheduler1:64,scheduler2:64,scientif:67,scientist:88,scope:[30,154],score:99,scratch:41,screenshot:158,script:[6,16,17,19,30,39,41,42,45,46,48,64,81,84,91,108,109,123],scripted_modul:81,scriptmodul:64,sdk:12,seamless:[12,90],seamlessli:[63,140,148],search:[22,36,72,101,108,109,155,160,161],second:[16,17,36,39,64,72,84,100,107,152],section:[16,17,18,19,24,26,28,29,63,64,72,99,103,108,140,148],see:[0,3,6,11,12,13,15,18,19,22,24,30,31,36,38,48,53,60,61,64,65,69,72,77,7
8,84,102,108,109,139,140,142,147,148,149,152,154],seed:[43,60,72,140,148],seed_everyth:[26,28,29,31,72],seem:0,seen:[19,55,65,72],segment:[86,88,101],select:[3,4,6,16,17,20,22,43,61,65,72,92,105,106,139,140,142,148,155,160],select_fn:[16,17],self:[0,4,5,6,11,12,15,18,19,20,21,22,23,28,29,31,32,37,43,52,53,54,55,56,58,60,61,63,64,65,69,70,72,74,76,77,80,81,82,83,84,85,86,89,92,93,94,95,96,97,98,99,100,101,102,103,104,106,107,108,112,139,140,142,144,145,147,148,153,154,155,156,158,159,160,161],self_supervis:85,semantic_segmentation_model:88,semanticsegment:88,semanticsegmentationdata:88,send:[16,17,22,29,64,97,102,157],send_email:29,sensibl:149,sensit:67,sent:[12,72,97,157],sentencepiec:84,sentencepiecetoken:84,sentiment:84,separ:[3,18,19,23,30,43,61,64,72,74,84,86,149],seq2seq:[64,149],seq_data:107,sequenc:[6,61,64,72],sequenti:[16,17,19,23,26,64,65,72,77,103,144,147],seri:[86,103],serial:[5,81],serializ:63,serv:[8,20,61,140,148],server:[8,98,101,151],servic:[6,151],session:49,set:[3,6,7,8,9,10,11,12,13,16,17,18,20,22,24,28,29,30,31,36,37,38,39,47,58,60,61,62,64,65,66,67,69,72,74,78,84,91,93,97,98,99,100,101,102,103,104,105,107,116,123,130,132,139,140,142,147,148,149,157,158],set_default:[28,29],set_descript:[70,159],set_grad_en:[64,72],set_repl:[16,17],set_to_non:[64,108],set_trac:[76,77],set_train:84,setlevel:[57,102],setup:[4,6,16,17,19,22,39,61,106,107,136,145,152],setuptool:6,sever:[28,43,52,64,65,71,102,103,140,148,157],sgd:[5,6,32,64,65,140,148],sh:[36,84],shall:20,shape:[16,17,64,65,84,108,139,142,157],shard:[55,64,90,93,140,148],share:[18,19,27,43,63,64,74,101,107,108,149],shareabl:74,sharpest:22,shell:[5,20,28,30],shift:103,shirt:84,shm:[84,108],short_id:99,shortcut:32,shorthand:[28,92,140,148],shot:86,should:[6,11,15,19,22,28,29,30,43,52,55,56,62,63,64,65,70,72,74,84,91,93,96,97,98,99,100,101,123,140,145,148,149,157],should_check_v:64,show:[9,19,22,27,28,29,31,38,64,70,72,74,89,102,107,114,154,157,158,160],shown:[19,20,29,54,64,65,72,103,157],shuffl:[18,41
,64,72,78,107],shut:[41,72],shutdown:72,siames:86,side:8,sigma:0,sign:[30,78,140,148],signal:[19,36],signatur:[31,93],signific:[0,16,17,19,20,32,64,69,102,140,148,157],significantli:[18,19],sigusr1:36,simclr:85,simclr_featur:85,simd:8,similar:[6,28,64,69,78,141],similarli:[22,28,65,104,107,139,142],simpl:[19,22,24,28,30,45,46,65,72,74,84,88,89,103,108,139,142,152,153],simple_mnist:9,simplegan:[65,108,139,142],simplemodel:[64,80,81],simpleprofil:[72,153,154],simpler:[19,30],simplest:[31,42],simpli:[8,16,17,19,20,47,49,53,64,74,90,102,103,107,158],simplic:[64,140,148],simplif:28,simplifi:[28,63],simul:[72,89],simultan:107,sinc:[6,12,22,28,29,30,61,62,64,65,67,69,72,74,84,93,108,140,145,148],singl:[1,3,6,7,8,9,10,12,14,16,17,22,28,43,48,61,64,65,67,69,72,73,74,84,87,102,103,107,108,109,115,116,134,139,140,142,148,157,158],singleargmodel:64,singledevicestrategi:54,singleton:[93,94],situat:6,size:[5,6,12,16,17,19,20,31,37,43,48,60,61,62,64,65,72,77,80,81,84,85,100,102,107,108,118,131,144,145,147,154,157],skill:109,skip:[18,19,58,64,65,69,74,80],skip_default:31,skip_nul:31,slack:87,slice:[16,17,72],slope:22,slot:84,slow:[0,6,19,72,102,108,149,152,157],slowdown:[16,17,55,108],slower:[16,17,19,24,72,157],slowest:152,slowli:[108,140,148],slurm:[35,64,91,109,128,133],slurmclust:36,slurmenviron:36,small:[16,17,19,22,60,62,65,108,109],smaller:[19,20,72,157],smooth:[22,64],smoother:22,snd_1:101,snd_2:101,snippet:[9,28,65],so:[4,6,8,16,17,19,21,22,23,27,28,29,31,43,47,48,53,55,62,63,64,65,67,69,72,74,77,84,91,92,103,105,106,107,108,123,140,146,148,149,154],soc:47,softmax:[6,11,64,89],softwar:[0,8,41],solut:[19,28,29,33,36,49],solv:88,some:[0,12,16,17,18,19,20,28,29,30,36,38,45,46,47,53,54,58,61,63,64,69,72,84,87,93,94,102,103,108,153,157,159],some_comet_funct:97,some_experiment_writer_funct:96,some_fil:6,some_imag:[56,64],some_images_from_cifar10:23,some_mlflow_funct:98,some_nam:63,some_object:0,some_other_st:64,some_result:64,some_scalar:102,some_scalar_1:102,some_scalar_2:102,s
ome_st:64,some_tensorboard_funct:100,some_text:158,some_valu:158,some_wandb_funct:101,someon:149,someotherloss:63,someth:[0,6,22,29,64,72,74,78,85,103,140,148,149],something_cool_i_want_to_sav:[52,64],sometim:[0,16,17,19,29,63,64,67,77,108],somewher:0,soon:[19,22,58,96,97,98,100,101,140,148],sort:[46,72],sota:[90,91,128,141,144],sound:101,sourc:[19,29,30,36,46,61,64,72,74,86,93,96,97,98,99,100,101,103],space:[19,30,55,93,108],span:90,spanish:101,spars:[64,65,139,142],spawn:[4,16,17,21,22,39,64,72,106,140,148],speaker:84,spec:[26,84],spec_augment:84,spec_gen:84,spec_gen_model:84,special:[3,16,17,19,28,29,48,103,140,148],specif:[6,12,19,20,28,36,38,58,61,63,64,69,70,72,83,84,87,96,97,98,99,100,101,107,108,140,148,149,153,155,157,160,161],specifi:[3,6,11,16,17,20,28,38,39,55,61,63,64,72,74,80,90,96,97,99,100,102,107,108],specmodel:84,spect:84,spect_length:84,spectrogram:84,spectrogramgener:84,speech:[20,86],speech_to_text:84,speed:[3,6,11,19,20,67,72,85,90,91,128,129,156],speedup:[19,69,72,140,148],spend:8,spent:[16,17],split:[6,11,22,62,63,64,65,74,103,107,119,138,144,149,158],split_batch:[6,64,103],split_batches_for_dp:64,split_siz:64,split_x:64,squad:86,squeez:64,squeezewav:84,sram:8,src:[6,140,148],srun:36,ss:72,ssh:[6,16,17,18],ssh_port1:6,ssh_port2:6,stabil:[69,91,128,130],stabl:[6,29,30,67,108],stack:[8,22,30,62,64,65,84],stacktrac:0,stage:[4,21,22,61,64,72,74,93,140,148,153],stai:[87,140,148],standalon:19,standard:[19,26,30,63,72,85,89,103,140,148,152],stanford:72,stare:6,start:[6,8,11,12,16,17,19,22,26,28,29,36,39,47,63,72,84,91,93,98,101,103,108,123,140,148,153,154],start_localsgd_it:19,start_powersgd_it:19,starter:109,startup:[16,17],stat:[19,72,152,154],state:[2,6,7,15,16,17,19,22,43,52,55,64,66,85,89,103,108,116,119,132,138,140,141,147,148,157],state_dict:[53,83,94,95,104,140,148],state_kei:94,statement:76,static_graph:19,staticmethod:[63,72,92],statist:[92,158],statu:[45,46,72,96,97,98,99,100,101,102],stdlib:72,stdout:[70,159],step:[0,6,11,12,16,17,19,22,
32,53,55,56,62,64,68,69,72,73,74,77,84,89,93,96,97,98,99,100,101,102,103,107,108,109,139,142,144,147,151,159],step_output:[6,64],step_siz:145,steplr:[65,145],steps_per_tri:22,stick:19,still:[16,17,18,19,26,28,61,64,67,69,72,82,93,97,103,108,145],stitch:103,stochast:72,stochastic_weight_avg:72,stochasticweightaverag:[22,72,141,147],stone:109,stop:[64,72,77,78,103,107,109,119,140,148,149,153],stopping_threshold:58,storag:[16,17,52,53,54,71,102,157],storage_opt:54,store:[0,19,20,22,29,43,62,63,64,65,71,72,84,88,93,98,101,102,108],str:[3,4,21,22,31,37,61,63,64,72,74,84,92,93,96,97,98,99,100,101,102,140,148,159],str_input:84,strategi:[1,5,8,9,11,13,16,17,22,36,38,51,54,55,61,64,65,73,74,76,83,88,91,92,103,105,108,109,118,124,139,141,142,147,149],strategyregistri:[4,21],stream:[72,101,107,152],strftime:153,strict:64,strictli:64,stride:[84,154],string:[3,4,20,21,28,29,64,72,96,97,98,100,101,108,140,148,149],strip:84,strive:30,strong:[16,17],strongli:[6,69,93],structur:[22,28,29,36,64,74,86,99,102,103,107,149,155,157,160,161],style:[6,30,107,109],sub:[43,100,103],sub_batch:64,sub_dir:100,subclass:[4,20,23,29,58,68,72,103,106,140,148,153,159],subclass_mode_data:28,subclass_mode_model:28,subclassess:28,subcommand:[27,28,29,31],subdirectori:[96,100],subgroup:19,subject:[4,19,20,21,54,140,148],submit:[18,36,47,72,108],submodul:72,subprocess:[6,72],subsequ:[11,20,28,69,102],subset:[6,16,17,48,103],substanti:[8,19],substitut:103,subtokens_mask:84,success:[19,46,96,98,99,100,101],successfulli:[93,140,148],suffix:[64,102],suggest:[19,22,55,72,108],suitabl:72,sum:[20,31,64,84,157],sum_out:154,summar:72,summari:[19,70,72,99,108,153,158],summarywrit:100,supercharg:138,supermicro:8,supervis:[64,86,93],support:[4,6,8,12,13,15,16,17,18,19,20,22,27,28,29,32,33,43,47,48,54,63,64,65,69,70,71,72,74,81,84,90,92,93,94,99,101,103,106,107,108,139,140,142,146,148,155,158,160],sure:[3,5,19,22,36,40,42,53,55,60,61,62,63,64,65,72,102,108,145,149,151],swa:[22,72,109],swa_lr:22,swap:[90,103,107,149],s
weep:[33,45,46,47,109,135],sy:[99,159],synapseai:8,sync:[0,6,19,22,62,64,65,76,102,108,157],sync_dist:[0,64,102],sync_dist_group:[64,102],sync_grad:[64,108],sync_interval_m:6,synchron:[6,64,72,89,102,108,140,148,154,157],syntax:[6,99],system:[6,8,12,16,17,27,52,64,71,72,93,96,100,103,108,157],t:[0,3,5,6,15,16,17,18,22,28,31,36,37,43,48,53,54,55,61,62,64,65,69,71,72,74,78,84,93,97,99,102,103,107,108,139,140,142,145,146,148,149,153,154,157,158,159],t_max:64,tab:102,tabl:[3,70,77,101,157],tabular:[86,101],tacotron:84,tag:[64,98,99,101],tailor:8,take:[19,28,29,49,64,69,78,81,82,84,103,107,108,140,148,152],taken:[19,20,64,72,99],talk:[36,92],tanhlrschedul:65,tar:46,target:[30,64,69,74,84,89,140,148,157],target_length:84,task:[0,16,17,29,36,64,69,74,84,88,90,103],tb_log:100,tb_logger:102,tbptt:[64,72,103],tbptt_split:103,tbptt_split_batch:107,tbptt_step:64,teach:136,team:[4,19,22,41,44,46,47,49,55,85,108,149],teardown:[4,106,152,153],teaser:30,technic:19,techniqu:[1,2,4,6,10,14,15,19,20,65,66,68,73,78,91,108,109,117,127,128,129,132,138,141,144,152],tell:[31,64],temp_arg:63,tempfil:64,temporari:36,tempt:[28,29],tend:[56,64,149],tensor:[6,8,16,17,20,22,43,56,64,65,67,69,72,74,77,84,97,99,101,102,107,139,140,142,145,147,148,155,157,158,160,161],tensorboard:[45,46,64,72,84,93,100,102,147,157,158],tensorboard_logg:[64,155,160,161],tensorboardlogg:[71,72,102,155,157,160,161],tensorflow:[16,17],term:[19,48],termin:[16,17,30,70,72],terminate_on_nan:[26,72],terminolog:[12,140,148],test:[6,18,19,27,30,31,43,56,70,73,74,77,84,85,89,91,93,97,99,102,103,109,123,138,144,146,147,149,158],test_acc:64,test_batch:[64,72],test_data:[64,74,140,148],test_dataload:[61,72,107],test_dataset:[107,140,148],test_dl1:107,test_dl2:107,test_dl:107,test_epoch_end:[0,61,72,149,157],test_load:74,test_loss:[0,60,64,145],test_out:64,test_sampl:107,test_set:60,test_step:[0,6,12,56,60,61,72,107,145,147,149,154,157,158],test_step_end:[6,149,157],test_step_out:64,test_step_output:64,test_train_imagenet:18,test
_tub:61,text:[64,70,74,86,101,102,120,121,156],text_fil:84,text_length:84,text_to_gener:84,textcolumn:70,textencod:84,textual:159,tf:64,th:108,than:[6,18,19,20,22,28,29,54,58,64,69,72,74,77,84,105,107,108,129,151,153],thank:99,the_other_valu:53,the_valu:53,the_world_s:[72,140,148],thei:[0,3,12,19,29,30,61,63,65,72,74,92,93,101,103,108,139,142,149],them:[3,4,9,12,19,21,26,28,32,38,43,61,63,64,65,66,72,74,83,85,93,96,97,98,100,101,102,103,107,108,127,139,140,141,142,145,148],theme:[70,159],themselv:11,theori:103,therebi:28,therefor:[6,28,30,58,64,145],thereof:64,thi:[0,3,5,6,8,9,11,12,13,15,16,17,18,19,20,22,24,26,27,28,29,30,31,32,36,38,39,42,43,45,46,48,52,53,54,55,56,58,60,61,63,64,65,67,69,70,71,72,74,77,78,81,82,83,84,85,92,93,94,96,97,98,99,100,101,102,103,104,105,107,108,111,112,114,130,131,132,133,136,139,140,142,146,148,149,151,152,154,157,158,159],thing:[0,16,17,19,29,56,64,65,73,74,77,91,103,107,124],think:[65,103,158],third:[38,69,121,156,160],those:[6,16,17,28,63,64,69,74,140,141,148],though:29,thousand:[84,140,148],three:[16,17,63,105,108],threshold:58,through:[6,16,17,28,29,40,43,54,64,66,72,77,92,101,103,104,108,127,149,151,158],throughout:[53,158],throughput:[6,11,19,22,69,108],thu:[22,29,64],thumb:60,ti:15,tib:[16,17],ticket:20,tie:64,tile:12,till:[11,12,22,62,65],time:[3,6,11,16,17,20,22,30,41,43,48,49,55,61,63,64,65,70,72,74,77,86,87,103,108,140,141,144,148,149,151,153,154,155,158,160,161],time_dim:64,timedelta:72,timer:72,timeseri:[157,158],timm:65,tini:[23,43,78],tinycifar5:46,tip:72,tmpdir:[52,71],tmpf:108,tmpfile:64,to_onnx:80,to_tensor:152,to_torchscript:[20,81],todai:[15,36,37,38,39],todo:[54,157,158,160],togeth:[20,22,72,84,103,141,144],toggl:[27,64,65,72,139,141,142],toggle_model:108,token:[64,74,99],token_classif:84,token_classification_config:84,token_type_id:[23,84],tokenclassificationmodel:84,tokenindex:84,tokenizer_nam:84,toler:[6,33,47,53,91,104,109,124,135,140,148],tolranc:42,tom:[84,99],toma:22,ton:31,too:[16,17,22,31,48,83,102,140,
148,152],tool:[8,13,26,28,29,30,31,77,140,148,151],toolkit:[84,86],top:[6,55,72,103,144,151,152,154],topic:[30,64,65,139,142],topolog:[101,155,161],torch:[0,3,11,15,18,19,20,22,23,28,29,31,32,35,39,43,53,54,56,60,61,63,64,65,69,72,74,77,80,81,82,83,84,89,92,100,102,103,107,108,109,133,139,140,142,144,145,147,148,154,155,157,158,160,161],torch_api:6,torch_xla:[16,17,18,72,108],torchcheckpointio:54,torchelast:[1,72],torchio:86,torchmetr:[0,64,102,157],torchpoint3d:69,torchscript:[20,64,79,91,128,131],torchtext:[64,74],torchvis:[23,60,64,74,144],total:[6,11,19,43,64,70,72,108,140,148,152,153,154,157],total_fit_batch:72,total_step:65,total_train_batch:[72,159],total_train_sampl:72,total_val_batch:72,total_val_sampl:72,totalsampl:[16,17],totensor:[18,22,64,74,144],tottim:152,touch:[31,90],tpc:8,tpu:[0,4,6,21,54,64,65,67,69,72,73,74,85,86,91,92,106,109,110,128,134,139,140,142,146,147,148,150,152],tpu_ip_address:[16,17],tpu_nam:[16,17],tpu_pod_nam:[18,72,108],tpu_spawn:[140,148],tpu_spawn_debug:[4,16,17,21],tpu_work:[16,17],tpuspawn:[16,17],tpuv2:146,tpuvm:[16,17,18],tqdm:[70,102,157],tqdmprogressbar:72,trace:[12,30,64,72,151],trace_nam:154,traceback:[16,17],track:[0,19,30,43,61,72,73,74,95,98,101,102,103,120,121,155,161],track_grad_norm:78,tracking_uri:[98,155,160,161],trade:19,tradeoff:19,tradition:61,traffic:[38,39],train:[20,21,24,26,27,30,35,37,39,54,56,57,58,62,63,65,66,67,69,70,71,73,74,77,78,81,82,83,88,89,90,91,92,93,97,99,101,102,103,104,105,107,109,110,115,116,117,119,120,123,127,128,130,133,134,135,138,142,147,149,150],train_acc_step:[89,157],train_batch:64,train_batch_idx:159,train_batch_s:72,train_d:84,train_data:[64,74,140,148],train_dataload:[5,18,22,32,43,56,72,83,103,107,140,144,147,148],train_dataset:[22,74,84,107,140,148],train_fold:[88,103],train_load:[22,64,72,74,144,147],train_loss:[64,84,85,102,140,147,148],train_on_devic:64,train_out:64,train_set:60,train_set_s:60,train_step:65,train_target_fold:88,train_time_interv:55,trainabl:19,traindir_a:107,tr
aindir_b:107,trainer:[0,3,4,5,6,8,9,11,12,13,15,16,17,18,19,20,21,22,23,26,27,29,31,32,36,37,38,41,52,53,54,55,56,58,60,61,62,65,67,68,69,70,71,74,76,77,78,82,83,84,85,88,90,91,92,93,94,96,97,98,99,100,101,102,104,105,106,107,108,109,110,138,139,140,142,144,145,148,149,151,152,153,154,155,157,158,159,160,161],trainer_2:26,trainer_config:27,trainer_main:63,trainers_per_nod:6,training_batch:72,training_batch_w:84,training_epoch_end:[65,93,102,139,142,149,157],training_opt:11,training_script_setup:39,training_step:[6,12,31,43,55,56,60,65,68,69,72,76,83,84,85,89,98,99,101,102,103,107,108,139,140,142,144,145,147,148,154,155,157,158,160],training_step_end:[6,102,149,152,157],training_step_output:64,training_strategi:[4,106],trainingbatchloop:103,trainingepochloop:103,trainingtypeplugin:54,trajectori:64,transcrib:84,transcript:[84,86],transcript_len:84,transfer:[16,17,19,64,74,86,109,140,148],transfer_batch_to_devic:6,transform:[0,18,19,22,23,31,32,43,48,64,74,84,85,86,107,109,144,149,152],transit:[140,148],translat:90,transpos:154,travers:72,treat:[19,64],tree:[101,103],tri:[6,22,30,48,72,102],trial:48,trick:93,tricki:108,trigger:22,trillion:[1,2,73,91,109,110],trivial:[36,37,38,39],troubleshoot:[15,64],truncat:[64,103],truncated_bptt_step:107,trust:85,tsmodel:20,tunabl:36,tune:[6,10,22,30,31,84,88,90,93,108,115,132,149],tuner:[22,72,77],tupl:[64,74,84,102,107],ture:69,turn:[36,58,72,77,78,103,140,148],tutori:[6,48,64,65,84,108,139,142],twain:84,tweak:[19,67],twice:29,two:[6,11,15,22,26,28,30,43,45,46,48,60,64,65,70,72,84,93,94,102,103,104,107,108,140,146,148,154,157],txt:[9,38],type:[3,16,17,18,19,27,31,36,49,61,63,64,69,70,72,74,77,93,94,96,97,98,99,100,101,103,105,140,148,149,157],type_a:64,typecheck:84,typeerror:[16,17,99],typic:[19,22,72,84,108],u:31,ui:[36,37,38,39,99],ulimit:84,ultim:[65,139,140,142,148],unavail:[16,17],unbalanc:84,uncas:84,uncategor:97,uncommit:30,undefin:93,under:[6,16,17,18,19,20,61,63,64,65,69,92,99,102,103,105,107,108,109,140,144,148],underfit
:[91,123,147],understand:[6,29,31,54,91,101,123,124,128,149,154,158],unetplusplu:88,uneven:[61,64],unexpect:[30,55],unfinish:[16,17],unifi:[4,74,106],uniform:48,uninterrupt:72,union:[4,21,61,64,72,92,96,97,98,99,100,101],uniqu:[64,72,93,102,157],unit:[3,12,16,17,64,72,91,110,115,116],univers:[33,47,48,49,126,135],unix:108,unless:[19,64,69,72,74],unlik:[19,53],unnecessarili:108,unscal:[22,64,72],unseen:[60,61],unseri:5,unset:28,unsqueez:[64,81,82],unstabl:67,unsupport:[16,17,102,157],unsur:[140,148],unsustain:31,until:[22,29,61,62,65,72,76,103,140,145,148,157],untoggl:64,unus:[19,64,93],unusu:19,unwatch:101,unzip:45,up:[3,8,11,16,17,18,19,20,22,31,33,36,37,38,39,43,47,49,62,64,65,70,72,74,78,84,101,102,103,128,135,140,148,160],updat:[0,6,19,22,43,55,62,64,65,70,72,83,84,93,94,101,102,103,107,139,142,157],upgrad:18,upload:99,upon:[74,99],upto:108,uri:98,url:[6,52,64,72,151],us:[3,4,6,8,9,11,12,13,14,16,17,18,20,28,29,30,31,32,33,36,38,42,44,45,46,47,48,49,52,53,54,55,56,57,58,60,61,62,63,64,67,69,70,71,73,76,77,78,79,81,82,85,86,87,89,91,92,93,94,96,97,98,99,100,101,102,103,105,106,108,109,111,112,113,117,119,121,122,123,127,128,129,132,136,140,141,144,146,148,149,151,152,153,154,157,158],usabl:[18,53],usag:[19,27,31,108,140,148],use_artifact:101,use_pl_optim:64,use_spot:41,use_tpu:18,usecas:[91,110],user:[2,3,4,6,8,9,11,12,13,15,16,17,18,19,22,23,26,28,29,30,31,32,33,36,38,41,42,47,48,53,55,57,60,61,64,65,67,69,72,76,77,78,82,84,87,92,99,100,101,102,103,104,106,108,139,140,142,144,148,149,151,152,153,154,157,158,159,160],using_lbfg:[64,65],using_native_amp:[64,65],usr:[6,16,17,18],usual:[0,6,18,19,31,32,38,48,61,64,74,108],util:[8,12,13,15,16,17,18,19,20,22,28,31,32,43,54,60,61,63,64,72,74,84,100,102,103,107,108,140,144,147,148],v100:[16,17],v1:[64,65,72,74,84,93,104,139,140,142,148],v2:[8,72,101,140,148],v3:[16,17,72],v:[16,17,64,84],v_num:[102,157],vae:[85,86],val1:101,val2:101,val:[31,56,58,61,64,72,74,77,84,93,103,107],val_acc:64,val_accuraci:[58,101],val_batch:[
64,72,103],val_batch_idx:64,val_batch_s:72,val_check_batch:72,val_check_interv:[58,70,107,108],val_checks_per_epoch:72,val_data:[64,74],val_dataload:[56,72,83,103,107,152],val_dataset:74,val_dataset_1:107,val_dataset_2:107,val_load:74,val_loop:[64,103],val_loss:[29,55,58,60,64,72,85,102,103,145],val_out:64,val_set:60,val_split:[88,103],val_step_output:64,valid:[6,19,30,31,41,55,56,58,70,74,77,78,91,93,102,103,109,123,138,144,147,149,158,159],valid_set:60,valid_set_s:60,validate_at_some_point:64,validate_loop:103,validation_d:84,validation_dataset:84,validation_epoch_end:[61,72,102,149,157],validation_loss:[0,55,158],validation_step:[0,6,12,55,56,58,60,61,72,102,103,107,145,149,154,157,158],validation_step_end:[6,102,149,157],validation_step_output:64,validationepochloop:103,valu:[12,16,17,19,20,22,28,29,30,36,53,55,58,62,63,64,65,72,78,92,93,96,97,98,99,100,101,102,103,104,107,108,139,142,149,157,158],valueerror:[72,99],valuer:[16,17],vari:[19,60,157],variabl:[6,16,17,19,29,37,38,39,42,64,77,97,98,99,103,104,107],variant:19,variat:[22,93],varieti:[71,102,108],variou:[2,19,22,49,58,99],ve:[19,40,72,77,88],verbos:[9,58,61,72,93,94],veri:[0,6,19,28,29,55,56,63,64,84,88,104,108],verifi:15,version:[6,16,17,18,19,28,29,30,36,48,53,61,63,64,72,74,76,81,87,93,96,97,98,99,100,101,102,146,157,159],version_0:[19,147,159],version_:[96,100],vgg16:64,via:[0,4,5,6,11,13,19,22,25,29,31,32,36,37,38,39,41,44,45,46,47,49,55,69,72,73,78,84,85,88,92,93,106,107,111,136,140,148],video:[16,17,19,84,101,109],videogpt:85,view:[31,60,64,80,81,84,85,88,99,144,145,147],virtual:[22,43,158],visibl:[5,6,57,70],vision:[90,109,147],visit:84,visual:[19,72,73,91,99,102,123,128,129],vliw:8,vm:[16,17],vocab:[74,84],vocab_fil:84,vocabulari:74,vocder_model:84,vocod:84,voic:84,volta:69,volum:[16,17,19,67],vram:19,vs:[22,102],vstack:[64,81,82],w:[16,17,19,23,101],wa:[16,17,30,41,43,53,61,63,64,65,72,84,93,107,139,140,142,145,148,149],wai:[4,6,12,16,17,19,22,28,30,31,42,43,49,61,63,64,74,80,81,82,88,91,99,10
3,104,107,108,110,113,140,148,149,158,159],wait:[72,77,108,140,148],wall:154,wandb:[101,102,155,160,161],wandb_logg:[101,155,160,161],wandblogg:[155,160,161],want:[4,5,6,19,27,28,29,31,33,36,41,44,46,47,49,53,55,56,58,60,61,63,64,65,67,70,72,74,76,77,78,81,83,84,87,88,92,93,95,96,97,98,100,101,102,103,106,107,108,139,140,142,145,146,148,151,152,153,154,157,158,159,160],warm:[64,65],warmup_max_lr:19,warmup_min_lr:19,warmup_num_step:19,warmup_step:6,warmuplr:19,warn:[15,57,64,102,108],wasserstein:64,watch:[16,17,84,101,155,160,161],wav:84,waveglow:84,waveglowmodel:84,we:[0,4,6,11,12,16,17,18,19,22,23,24,26,27,28,31,32,38,43,45,46,47,48,53,55,56,58,60,61,62,63,64,65,69,72,74,76,77,78,82,83,84,85,89,90,92,93,94,102,103,105,106,108,140,146,148,149,152,157,158],web:[36,37,38,39],websit:[13,84],week:[41,84],weigh:19,weight:[13,19,20,53,55,61,64,69,72,82,83,84,99,101,103,122],weight_decai:19,weighted_loss:84,weightsharingmodul:15,welcom:[46,84],well:[4,19,28,61,63,71,72,74,102,106,107,108,149,157],went:102,wer_denom:84,wer_num:84,were:[4,16,17,19,21,28,29,63,64,93,94,149],wether:[140,148],what:[0,6,23,28,29,32,54,63,64,65,72,84,93,94,95,99,102,103,108,149],whatev:[61,64,72,74,95,103,140,148],whatever_ml_flow_support:98,wheel:[16,17],when:[0,3,6,11,12,16,17,20,22,26,28,30,36,38,41,43,48,52,53,58,60,61,62,63,64,65,67,69,70,72,74,76,77,78,82,84,92,93,94,95,97,99,100,101,102,103,104,107,108,119,140,144,148,149,154,157,158],whenev:[77,92,93,108,149],where:[6,12,13,15,16,17,19,22,27,28,36,41,43,53,58,62,63,64,65,72,74,88,96,98,99,100,101,102,103,139,142,149,158],wherea:[64,108],whether:[64,72,97,102,103,157],which:[0,3,6,8,11,12,13,15,16,17,19,20,22,26,27,28,29,30,31,36,37,38,39,41,42,43,44,45,46,47,49,52,61,62,63,64,65,69,70,72,74,78,81,84,88,92,93,96,97,98,99,100,101,102,103,104,107,108,139,140,142,144,148,149,154,157,158],whilst:[11,19],whl:[16,17],who:[29,30,31,32,33,38,41,47,60,65,76,77,78,87,92,139,142,144,151,152,153,154,157,158,159,160],whole:[64,72,107,158],whose:[29,64]
,why:[6,43,97,102,157],width:[74,158],wild:103,william:64,williamfalcon:46,window:158,wine:101,wish:[61,64,70,72,74,92,93,103,140,148],within:[0,6,8,11,19,41,43,58,61,63,64,69,70,72,74,87,90,102,103,140,145,148,149],without:[0,6,19,20,28,30,31,32,45,46,48,64,65,72,81,83,90,92,93,100,102,108,122,141,144,149,158],won:[6,15,43,55,64,65,72,74,78,93,97,108,139,142],word:[11,84],work:[4,6,12,15,16,17,18,19,22,25,32,40,42,43,47,53,55,61,63,64,65,71,72,74,76,78,85,87,92,93,99,102,103,107,108,139,142,145,147,149,158],worker:[0,6,16,17,19,43,72,107,140,148,149],workflow:[45,46,48,49,59],workload:[8,12,16,17,27,33,43],workspac:[97,99,155,160,161],world:[19,23,37,60,61,64,72,158],world_siz:[6,37,38,64,72,140,148,157],worri:[19,140,148,149],wors:58,worst:43,worth:6,would:[6,16,17,18,19,22,23,28,29,30,48,61,64,72,88,93,94,102,103,107,108,140,145,148,157],wrap:[19,20,31,43,64,65,74,107,139,142],wrapper:[6,19],write:[28,29,30,52,64,71,72,103,104,157,159],writer:100,written:[6,19,22,72,140,148],wrong:6,x12:8,x:[0,6,11,15,19,20,23,26,31,53,55,56,60,64,65,72,74,77,80,81,82,83,84,85,89,102,103,107,108,139,140,142,144,145,146,147,148,149,153,157],x_hat:[0,56,60,64,144,147],x_length:84,xarg:[16,17],xception:88,xla:[14,16,17,18,64,72,108,117,151],xla_client:[16,17],xla_devic:[16,17],xla_dist:[16,17,18,72,108],xla_model:[16,17,18],xla_replication_devic:[16,17],xla_use_bf16:[72,108],xlacheckpointio:54,xlaprofil:151,xlm:19,xm:[16,17,18,54],xmp:[16,17],xpu:92,xpuacceler:92,xpulib:92,xrt:[16,17,18],xrt_tpu_config:[16,17,18],xrt_world_siz:18,xu:[16,17],y:[0,6,26,55,60,64,74,77,83,84,85,89,103,107,144,145,147,153,157],y_0:6,y_1:6,y_2:6,y_3:6,y_hat:[6,53,55,64,82,83,103,145],y_length:84,y_log:84,y_m:84,yaml:[25,29,31,61,63,64,73,87,91,96,110,111],ye:67,yet:[4,22,55,64,69,93,99,103,106,146],yield:[22,43,103],you:[0,3,4,5,6,8,9,11,12,13,16,17,18,19,20,21,22,23,26,27,28,31,32,36,37,38,39,40,41,42,43,44,45,46,47,48,49,52,53,55,57,58,61,62,63,64,65,67,68,69,70,71,74,76,77,78,80,81,82,83,84,85,86,87,88
,91,92,93,94,95,96,97,98,99,100,101,102,103,105,107,108,109,112,114,123,130,131,132,133,136,139,140,141,142,144,146,148,149,151,152,154,155,157,158,159,160,161],young:84,your:[0,1,4,5,7,10,11,12,13,14,16,17,18,19,20,21,22,23,27,28,29,30,31,32,33,35,38,39,41,43,44,45,46,48,53,54,55,57,58,61,63,64,66,67,68,69,70,72,73,74,83,84,85,86,87,89,90,91,92,93,94,95,96,97,98,99,100,101,102,103,105,107,108,109,110,113,115,119,120,123,124,126,128,130,134,135,140,141,144,146,147,148,149,155,156,157,158,160,161],your_class_path:28,your_comet_api_kei:[155,160,161],your_lightning_training_script:6,your_main_address:[72,140,148],your_main_port:[72,140,148],your_trainer_fil:[72,108],yourmodel:5,yourse:6,yourself:[18,28,37,64,103,149],z:[0,60,64,65,84,139,142,144,145,147,149],zero3:[140,148],zero:[4,21,22,30,62,64,65,72,90,103,108,139,140,142,145,148],zero_allow_untested_optim:19,zero_grad:[19,64,65,72,93,103,108,139,140,142,144,147,148],zero_optim:19,zip:[45,46,84,103,146],zone:[16,17]},titles:["Hardware agnostic training (preparation)","Accelerator: GPU training","GPU training (Advanced)","GPU training (Basic)","GPU training (Expert)","GPU training (FAQ)","GPU training (Intermediate)","Accelerator: HPU training","Accelerator: HPU training","Accelerator: HPU training","Accelerator: IPU training","Accelerator: IPU training","Accelerator: IPU training","Accelerator: IPU training","Accelerator: TPU training","TPU training (Advanced)","TPU training (Basic)","TPU training (Basic)","TPU training (Intermediate)","Train 1 trillion+ parameter models","Pruning and Quantization","Strategy Registry","Effective Training Techniques","Transfer Learning","Benchmark with vanilla PyTorch","Eliminate config boilerplate","Eliminate config boilerplate (Advanced)","Eliminate config boilerplate (Advanced)","Instantiation only mode","Eliminate config boilerplate (Advanced)","Eliminate config boilerplate (expert)","Eliminate config boilerplate (Intermediate)","Eliminate config boilerplate 
(intermediate)","Train on the cloud","Train on the cloud (intermediate)","Run on an on-prem cluster","Run on an on-prem cluster (advanced)","Run on an on-prem cluster (expert)","Run on an on-prem cluster (intermediate)","Run on an on-prem cluster (intermediate)","Fault-tolerant Training","Fault-tolerant Training (basic)","Fault-tolerant Training (expert)","Fault-tolerant Training (FAQ)","Cost","Train on the cloud (advanced)","Train on the cloud (intermediate)","Train on the cloud (expert)","Train on the cloud (intermediate)","Train on the cloud (basic)","Train on the cloud (basic)","Checkpointing","Checkpointing (advanced)","Checkpointing (basic)","Checkpointing (expert)","Checkpointing (intermediate)","<no title>","Console logging","Early Stopping","Add validation and test datasets","Validate and test a model (basic)","Validate and test a model (intermediate)","<no title>","Configure hyperparameters from the CLI","LightningModule","Optimization","N-Bit Precision","N-Bit Precision (Basic)","N-Bit Precision (Expert)","N-Bit Precision (Intermediate)","Customize the progress bar","Remote Filesystems","Trainer","Common Workflows","LightningDataModule","Debug your model","Debug your model (advanced)","Debug your model (basic)","Debug your model (intermediate)","Deploy models into production","Deploy models into production (advanced)","Deploy models into production (advanced)","Deploy models into production (basic)","Deploy models into production (intermediate)","Conversational AI","Lightning Bolts","Community Examples","Ecosystem CI","Lightning Flash","TorchMetrics","Lightning Transformers","Level up","Accelerator","Callback","Save Callback state","Save DataModule state","CSVLogger","CometLogger","MLFlowLogger","NeptuneLogger","TensorBoardLogger","WandbLogger","Logging","Loops","Loops (Advanced)","Plugins","What is a Strategy?","Managing Data","Speed Up Model Training","\u26a1 PyTorch Lightning\uc5d0 \uc624\uc2e0 \uac83\uc744 \ud658\uc601\ud569\ub2c8\ub2e4!","Advanced 
skills","Level 15: Customize configs to run in production","Level 16: Customize the trainer","Level 17: Own the training loop","Level 18: Enable advanced checkpointing","Level 19: Explore IPUs","Level 19: Explore HPUs","Level 21: Master TPUs","Level 22: Reach 1 trillion parameters on GPUs","Level 2: Add a validation and test set","Level 5: Debug, visualize and find performance bottlenecks","Level 3: Visualize training progress","Level 6: Predict with your model","Basic skills","Expert skills","Level 23: Extend the Lightning CLI","Level 24: Integrate a custom cluster","Level 27: Add a new accelerator or Strategy","Intermediate skills","Level 10: Understand your model","Level 11: Explore SOTA scaling techniques","Level 12: Deploy your models","Level 13: Optimize training speed","Level 14: Run on on-prem clusters","Level 7: Interactive cloud development","Level 8: Run models on the cloud","Level 9: Modularize your projects","<no title>","Build a Model","Own your loop (advanced)","Raw PyTorch loop (expert)","Supercharge training (intermediate)","Manual Optimization","Use a pure PyTorch training loop","Train a model (basic)","How to Organize PyTorch Into Lightning","Installation","Lightning 15\ubd84 \ub9cc\uc5d0 \ubc30\uc6cc\ubcf4\uae30","LightningLite (Stepping Stone to Lightning)","\uc2a4\ud0c0\uc77c \uac00\uc774\ub4dc","Find bottlenecks in your code","Find bottlenecks in your code (advanced)","Find bottlenecks in your code (basic)","Find bottlenecks in your code (expert)","Find bottlenecks in your code (intermediate)","Manage Experiments","Track and Visualize Experiments","Track and Visualize Experiments (advanced)","Track and Visualize Experiments (basic)","Track and Visualize Experiments (expert)","Track and Visualize Experiments 
(intermediate)","Comet.ml"],titleterms:{"0":[45,46,151],"1":[3,8,12,16,17,19,45,46,49,85,88,89,118,145,147,151],"10":[19,129],"11":130,"12":131,"13":132,"14":133,"15":111,"15\ubd84":147,"16":[6,13,18,67,72,108,112],"17":113,"18":114,"19":[115,116],"2":[6,19,45,46,85,88,89,119,145,147,151],"21":117,"22":118,"23":125,"24":126,"27":127,"3":[19,45,46,85,88,89,121,145,147,151],"32":67,"4":[45,46,145,147,151],"5":[120,145,147],"6":[122,145,147],"64":67,"7":[134,145,147],"8":[69,135,145],"9":136,"\uac00\uc774\ub4dc":149,"\uac80\uc0c9":109,"\uac83\uc744":109,"\uadf9\ub300\ud654\ud558\uae30":147,"\ub2e4\uc74c":147,"\ub2e8\uacc4":147,"\ub370\uc774\ud130\uc14b":147,"\ub9cc\uc5d0":147,"\ubaa8\ub378":147,"\ubc0f":109,"\ubc18\ubcf5":147,"\ubc30\uc6cc\ubcf4\uae30":147,"\ube60\ub974\uac8c":147,"\uc0ac\uc6a9\uc790":147,"\uc0ac\uc6a9\uc790\ub77c\uba74":109,"\uc0ac\uc6a9\ud558\uae30":147,"\uc0c9\uc778":109,"\uc124\uce58\ud558\uae30":[109,147],"\uc2a4\ud0c0\uc77c":149,"\uc2dc\uac01\ud654\ud558\uae30":147,"\uc5c4\uccad":147,"\uc624\uc2e0":109,"\uc720\uc5f0\uc131":147,"\uc774\ubbf8":109,"\uc790\uccb4\uc758":147,"\uc815\uc758\ud558\uae30":147,"\ucc98\uc74c\uc774\uc2e0\uac00\uc694":109,"\ud559\uc2b5":147,"\ud559\uc2b5\ud558\uae30":147,"\ud655\uc7a5\ud558\uae30":147,"\ud658\uc601\ud569\ub2c8\ub2e4":109,"class":[28,29,72],"default":[27,28,29,102,103,157],"do":[5,32,43,49,74,152,158],"function":[89,152],"import":144,"lightning\uc5d0":109,"new":[87,103,127],"return":107,"static":19,If:72,In:157,Into:[108,145],Of:84,The:84,To:84,acceler:[1,7,8,9,10,11,12,13,14,67,72,92,108,127,140,148,152],access:[8,12,16,17,65,107,139,142],accumul:[22,65,139,142,158],accumulate_grad_batch:72,across:22,action:153,activ:19,add:[59,60,119,127,144],add_dataloader_idx:157,add_to_queu:64,addit:[61,107],adjust:5,advanc:[2,11,15,19,22,25,26,27,29,36,45,52,76,79,80,81,91,103,104,110,114,139,151,157],after:61,agnost:0,ai:[84,155,160,161],all:77,all_gath:64,amp_backend:72,amp_level:72,an:[8,12,19,35,36,37,38,39,58,159],a
nalys:13,ani:[23,32,145],anomali:78,anywher:[42,52],apex:[69,72],api:[64,72,74,92,93,103,109],ar:[43,72],arbitrari:65,arg:63,argpars:63,argument:[27,28],argumentpars:63,art:84,artifact:[102,160],asr:84,associ:103,audio:160,auto:36,auto_lr_find:72,auto_scale_batch_s:72,auto_select_gpu:72,autocast:[140,148],autograd:78,automat:[8,65,84,102,157],automatic_optim:64,avail:[4,103,106],averag:22,avoid:108,aw:8,backend:18,background:[45,46],backpropag:107,backward:[64,140,148],bagua:6,bar:[70,102,157,159],barrier:[140,148],basic:[3,16,17,25,41,49,50,53,60,67,72,77,79,82,91,123,144,152,158],batch:[22,65],batch_siz:157,behavior:[42,55,102,157],benchmark:[24,72],bert:23,best:[63,93],bfloat16:69,bias:[155,160,161],billion:19,bit:[6,13,18,66,67,68,69,72,108],boilerpl:[25,26,27,29,30,31,32],bolt:85,both:157,bottleneck:[120,150,151,152,153,154],boundari:22,breakpoint:77,bring:65,browser:158,bucket:19,build:[36,138,153,159],built:[22,54,93,103],cach:108,call:[0,145],callback:[28,29,58,72,85,93,94,102,157],callback_metr:72,captur:151,caveat:6,chang:[157,159],chart:160,check:[77,108],check_val_every_n_epoch:72,checkpoint:[19,51,52,53,54,55,82,83,114],checkpoint_callback:72,checkpointio:105,child:64,choos:[3,19,45,46],ci:87,clear:108,cli:[26,30,31,63,125],clip:[22,65],clone:49,closur:[65,139,142],cloud:[16,17,27,33,34,41,45,46,47,48,49,50,52,134,135,151,157],cluster:[19,35,36,37,38,39,42,47,105,126,133],code:[77,78,140,145,148,150,151,152,153,154],colab:[5,16,17],collat:19,comet:[155,160,161],cometlogg:97,command:27,commandlin:158,common:[73,109],commun:[6,19,86],comparison:24,compil:[80,81],complic:82,compos:26,comput:[23,145],concaten:107,conda:146,condit:55,config:[19,25,26,27,29,30,31,32,111],configur:[29,63,65,84,88,102,145,158],configure_callback:64,configure_gradient_clip:64,configure_optim:64,configure_sharded_model:64,connect:[29,31],consol:[57,102],contain:[107,149],content:53,control:[85,102,108],convers:84,convert:[140,148],core:[16,17,109],cost:[41,44,46,48,49],coverag:14
6,cpu:108,creat:[4,45,46,92,103,106],csvlogger:96,cuda:[0,145],current_epoch:[64,72],custom:[4,9,19,27,29,54,65,70,92,102,106,111,112,126,139,153,157,159],data:[6,60,78,88,107,108,145,149],dataload:[43,61,107,108,149],datamodul:[32,74,95,149],dataparallel:64,dataset:[22,28,32,43,45,46,59,107,144],ddp2:6,ddp:[6,19,108],debug:[38,75,76,77,78,120],deepspe:19,default_root_dir:72,defin:[60,144],delet:0,deploi:[79,80,81,82,83,131],design:36,detect:78,determinist:72,develop:[84,134],devic:[3,5,64,72,108,140,145,148],differ:[4,106],dimens:77,directli:27,directori:158,disabl:53,distribut:[6,18,19,55,76,82,140,148,154,157],distributedsampl:18,doe:77,don:151,done:103,dp:[6,108],earli:[58,108],earlystop:58,ecosystem:[86,87],effect:22,effici:19,elast:6,elimin:[25,26,27,29,30,31,32,144],enabl:[4,9,19,27,31,36,42,57,82,106,114,141,157],enable_checkpoint:72,enable_graph:157,enable_model_summari:72,enable_progress_bar:72,entiti:84,entri:103,environ:[27,105],epoch:[58,64,77,108,157],error:5,estimated_stepping_batch:72,evalu:107,everi:[108,152],exampl:[23,64,85,86,89,93,103,109,140,148],example_input_arrai:64,exclud:63,exist:[140,148],exp:[155,160,161],experi:[84,155,156,157,158,159,160],expert:[4,30,37,42,47,54,68,91,124,140,153,159],explod:78,explor:[115,116,130],extend:[85,125,141],extract:83,fairscal:19,fals:19,faq:[5,16,17,43],fast_dev_run:72,faster:85,fault:[40,41,42,43],featur:[103,141],file:[19,26,27,29,84],filesystem:[71,102,157],find:[60,120,150,151,152,153,154],find_unused_paramet:19,finder:22,fine:19,finetun:88,fit:[61,72],flag:[72,140,148],flash:[88,103],flush:157,flush_logs_every_n_step:72,forc:29,forward:[64,149],fp16:69,free:47,freez:64,frequenc:[102,108,157],from:[26,27,32,52,53,63,83,84,102,103,146],fulli:19,gan:[65,139,142],gaudi:8,gcp:[16,17],get:[5,36,37,38,39,109],get_from_queu:64,global_rank:64,global_step:[64,72],glossari:109,good:145,googl:[16,17],gpu:[1,2,3,4,5,6,19,22,72,108,118,140,148],grad:108,gradient:[19,22,65,78,139,142],gradient_clip_v:72,graph:[13,19
],grid:[45,46,48],group:27,hand:109,happen:43,hardwar:0,hassl:47,help:[36,37,38,39,77],hood:[72,84],hook:[19,64,93,107],horovod:6,how:[5,8,12,16,17,43,77,145],hparam:64,hpu:[7,8,9,116],hyperparamet:[53,63,74,102,160],i:[5,19,32,43,49,74,78,152,158],ightningmodul:157,imag:158,imagenet:23,impact:43,implement:6,infer:[64,82],infin:19,init:[0,53,72,149],initi:19,input:[77,107],instal:[45,46,84,146,151],instanti:28,instantli:19,integr:[37,87,126,159],interact:134,interest:[72,153],intermedi:[6,18,31,32,34,38,39,46,48,55,61,69,78,83,91,128,141,154,160],interpol:27,interv:65,io:54,ipu:[10,11,12,13,115],is_global_zero:72,item:108,iter:[43,107],job:38,jupyt:[5,49],kaggl:[16,17],keep:145,know:145,known:[8,12],languag:84,layer:77,lbfg:[65,139,142],learn:[5,22,23,65,84,139,140,142,148],length:77,level:[64,91,109,111,112,113,114,115,116,117,118,119,120,121,122,125,126,127,129,130,131,132,133,134,135,136],lightn:[22,31,45,46,63,74,77,83,85,88,89,90,103,107,109,125,140,145,146,147,148],lightningcli:[29,30],lightningdatamodul:[74,107],lightninglit:[140,148],lightningmodul:[23,32,53,63,64,77,82,102,107,144,147,149,157],like:[65,139,142],limit:[8,12],limit_test_batch:72,limit_train_batch:72,limit_val_batch:72,list:48,lite:[140,148],load:[82,88,140,148],load_from_checkpoint:[63,64],load_state_dict:[74,93],local_rank:64,log:[0,57,64,102,151,157],log_dict:64,log_dir:72,log_every_n_step:72,logged_metr:72,logger:[64,72,102,157],logic:[82,145],look:78,loop:[60,64,103,104,113,139,140,143,144,147,152],lr:[22,32,145],lr_schedul:64,m:5,machin:[6,49],make:[0,102],manag:[36,45,46,84,102,107,155,159,160,161],manual:[55,65,102,139,142],manual_backward:64,master:117,max_epoch:72,max_step:72,max_tim:72,maximum:19,me:77,measur:152,memori:19,method:[64,72,103,140,148,149],metric:[64,89,157,158,160],min_epoch:72,min_step:72,minut:49,mix:[9,13,32,69,108],ml:[78,155,160,161],mlflow:[155,160,161],mlflowlogg:98,mode:28,model:[0,11,19,28,31,32,45,46,49,60,61,75,76,77,78,79,80,81,82,83,84,85,88,108,122,129,1
31,135,138,144,149,151,154,157,160],modifi:[52,55,102,157],modul:[19,23,53,63,64,83,89,144],modular:[52,136],monei:41,monitor:[45,46],more:84,move:145,multi:[6,19],multipl:[3,5,8,12,16,17,28,43,61,63,65,107,139,142,155,160,161],my:[43,140,148],n:[66,67,68,69,108],name:84,nativ:69,natur:84,nccl:19,need:[49,74,152,158],nemo:84,neptun:[155,160,161],neptunelogg:99,ner:84,neural:84,next:[45,46,48,49],nlp:[23,84],nn:[23,53,83,144],node:19,non:102,none:108,normal:83,notebook:[5,49],num_nod:[72,140,148],num_process:72,num_sanity_val_step:72,num_work:108,numpi:108,nvidia:69,nvme:19,object:107,offload:19,on_after_backward:[64,93],on_after_batch_transf:[64,74],on_before_backward:[64,93],on_before_batch_transf:[64,74],on_before_optimizer_step:[64,93],on_before_zero_grad:[64,93],on_configure_sharded_model:93,on_epoch:157,on_except:93,on_fit_end:[64,93],on_fit_start:[64,93],on_hpc_load:64,on_hpc_sav:64,on_init_end:93,on_init_start:93,on_keyboard_interrupt:93,on_load_checkpoint:[64,93],on_post_move_to_devic:64,on_predict_batch_end:[64,93],on_predict_batch_start:[64,93],on_predict_dataload:[64,74],on_predict_end:[64,93],on_predict_epoch_end:[64,93],on_predict_epoch_start:[64,93],on_predict_start:[64,93],on_sanity_check_end:93,on_sanity_check_start:93,on_save_checkpoint:[64,93],on_step:157,on_test_batch_end:[64,93],on_test_batch_start:[64,93],on_test_dataload:[64,74],on_test_end:[64,93],on_test_epoch_end:[64,93],on_test_epoch_start:[64,93],on_test_model_ev:64,on_test_model_train:64,on_test_start:[64,93],on_train_batch_end:[64,93],on_train_batch_start:[64,93],on_train_dataload:[64,74],on_train_end:[64,93],on_train_epoch_end:[64,93],on_train_epoch_start:[64,93],on_train_start:[64,93],on_val_dataload:[64,74],on_validation_batch_end:[64,93],on_validation_batch_start:[64,93],on_validation_end:[64,93],on_validation_epoch_end:[64,93],on_validation_epoch_start:[64,93],on_validation_model_ev:64,on_validation_model_train:64,on_validation_start:[64,93],onc:77,onli:28,onnx:80,open:49,oper:[64,1
54],optim:[6,16,17,19,22,28,32,64,65,69,132,139,142,145],optimizer:65,optimizer_step:64,optimizer_zero_grad:64,option:[11,27,103,145],order:149,organ:145,other:[53,160],out:78,output:77,over:108,overfit:78,overfit_batch:72,overrid:103,own:[6,37,42,47,65,113,139,142,145,153,159],pack:107,packag:32,parallel:[6,11],paramet:[19,53,118],part:43,perform:[16,17,43,120],persist:[104,108],pickl:5,pickleabl:0,pip:146,pitfal:[140,148],plugin:[54,68,72,105,140,148],pod:18,point:103,popvis:13,practic:[63,93],pre:[19,61,84],prebuilt:85,precis:[6,9,13,18,64,66,67,68,69,72,105,108,140,148],predict:[64,72,82,107,122,145],predict_dataload:[64,74],predict_step:64,prefer:108,preload:108,prem:[35,36,37,38,39,133],prepar:0,prepare_data:[64,74],prepare_data_per_nod:[64,74],pretrain:[23,85],print:[26,64,77,140,148],process:[22,84],process_posit:72,product:[64,79,80,81,82,83,111],profil:[72,151,152,153,154],prog_bar:157,progress:[70,102,121,157,159],progress_bar_metr:72,project:[87,136],properti:[64,72,93,103],prune:20,pure:143,python:72,pytorch:[23,24,69,83,86,109,140,143,144,145,147,148,154],qualiti:85,quantiz:20,quickli:77,ram:108,random:48,rang:48,rank_zero_onli:157,rate:[5,22,65,139,142],raw:140,reach:[19,118],readi:103,recognit:84,reduc:19,reduce_fx:157,regist:[32,92],register_buff:0,registr:28,registri:[4,21],relat:5,reload_dataloaders_every_n_epoch:72,remot:[71,102],remov:[0,145],replace_sampler_ddp:72,reproduc:[30,72],requir:151,research:[64,85],reset:103,resubmit:36,resum:[52,53],resume_from_checkpoint:72,richprogressbar:[70,159],run:[8,12,16,17,26,27,35,36,37,38,39,45,46,47,49,77,103,111,133,135,140,148],s:[22,145],same:160,sampl:48,sampler:0,saniti:77,save:[41,52,53,55,74,93,94,95,140,148,158],save_hyperparamet:[63,64],scalar:102,scale:130,schedul:[32,65,139,142,145],scratch:[84,103],script:[36,38,72],search:48,seed_everyth:[140,148],select:8,self:[149,157],sequenc:107,sequenti:107,set:[19,27,77,108,119],setup:[38,64,74,93,140,148,151],setup_dataload:[140,148],shard:19,share:[15
,22],shortcut:48,shorten:77,should:[5,78],shouldn:19,shuffl:43,singl:[19,26],size:22,skill:[91,110,123,124,128],skip:103,slrum:36,slurm:36,sota:130,sourc:146,spawn:[6,108],specif:[16,17],specifi:84,speech:84,speed:[48,49,108,132,157],speedup:108,split:60,stage:19,start:[48,49,109,151],starter:64,state:[53,72,74,84,93,94,95,104],state_dict:[74,93],state_kei:93,step:[45,46,48,49,65,82,88,140,148,157],stochast:22,stone:[140,148],stop:[58,108,151],strategi:[4,6,19,21,48,72,106,127,140,148],string:48,subclass:28,subcommand:30,subloop:103,submit:38,submodul:28,subset:78,summari:77,supercharg:141,support:[67,102],sweep:48,sync_batchnorm:72,sync_dist:157,sync_dist_group:157,synchron:0,syntax:48,system:149,t:[19,151],tbptt:107,tbptt_split_batch:64,teardown:[64,74,93],techniqu:[22,130],tensor:[0,108],tensorboard:[151,155,160,161],tensorboardlogg:100,test:[0,59,60,61,64,72,107,119,145],test_dataload:[64,74],test_epoch_end:64,test_step:64,test_step_end:64,text:[84,158],thing:108,through:107,time:[19,24,36,107,152],tip:[19,108],to_devic:[140,148],to_onnx:64,to_torchscript:64,toggl:108,toggle_optim:64,token:84,toler:[40,41,42,43],topolog:160,torch:6,torchdistribut:39,torchmetr:89,torchscript:81,total:65,tpu:[14,15,16,17,18,108,117,151],tpu_cor:[72,140,148],tqdmprogressbar:[70,159],track:[156,157,158,159,160],track_grad_norm:72,train:[0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17,18,19,22,31,33,34,36,38,40,41,42,43,45,46,47,48,49,50,52,53,55,60,61,64,72,84,106,108,113,121,132,139,140,141,143,144,145,148,152,157],train_dataload:[64,74],trainer:[28,63,64,72,103,112,141,147],training_epoch_end:64,training_step:[64,149],training_step_end:64,transfer:[23,108],transfer_batch_to_devic:[64,74],transform:90,trillion:[19,118],troubleshoot:30,truncat:107,truncated_bptt_step:64,tt:84,tune:[19,72],tutori:103,two:29,ty:15,type:[28,29,84],type_a:0,under:[72,84],understand:[103,129,157],unfreez:64,untoggle_optim:64,up:[91,108,109,157],us:[0,5,19,22,23,25,26,27,41,43,65,72,74,83,84,88,90,107,139,142
,143,145,155,159,160,161],usag:152,val_check_interv:72,val_dataload:[64,74],valid:[0,59,60,61,64,72,107,108,119,145],validation_epoch_end:64,validation_step:64,validation_step_end:64,vanilla:24,variabl:27,via:27,view:[19,151,158],vision:23,visual:[120,121,154,156,157,158,159,160],vm:18,vs:[19,48,49,149],wall:36,wandblogg:101,want:32,weight:[15,22,77,155,160,161],weights_save_path:72,weights_summari:72,what:[3,4,5,8,12,16,17,26,30,31,41,43,45,46,48,53,55,69,74,106],when:[5,19,55],where:55,which:55,why:[32,49,74,78,107,152,158],within:[107,108,152],without:74,worker:108,workflow:[73,109],write:[26,102],xla:15,yaml:[26,27,84],you:[72,145],your:[6,36,37,42,47,49,52,65,75,76,77,78,80,81,82,88,122,129,131,136,139,142,145,150,151,152,153,154,159],zero:19}}) \ No newline at end of file diff --git a/docs/source-app/Makefile b/docs/source-app/Makefile new file mode 100644 index 0000000..268e095 --- /dev/null +++ b/docs/source-app/Makefile @@ -0,0 +1,19 @@ +# Minimal makefile for Sphinx documentation +# + +# You can set these variables from the command line. +SPHINXOPTS = -T -W +SPHINXBUILD = sphinx-build +SOURCEDIR = . +BUILDDIR = ../build + +# Put it first so that "make" without argument is like "make help". +help: + @$(SPHINXBUILD) -M help "$(SOURCEDIR)" "$(BUILDDIR)" $(SPHINXOPTS) $(O) + +.PHONY: help Makefile + +# Catch-all target: route all unknown targets to Sphinx using the new +# "make mode" option. $(O) is meant as a shortcut for $(SPHINXOPTS). 
+%: Makefile + @$(SPHINXBUILD) -M $@ "$(SOURCEDIR)" "$(BUILDDIR)" $(SPHINXOPTS) $(O) diff --git a/source/_static/copybutton.js b/docs/source-app/_static/copybutton.js similarity index 100% rename from source/_static/copybutton.js rename to docs/source-app/_static/copybutton.js diff --git a/docs/source-app/_static/images/icon.svg b/docs/source-app/_static/images/icon.svg new file mode 100644 index 0000000..e88fc19 --- /dev/null +++ b/docs/source-app/_static/images/icon.svg @@ -0,0 +1,9 @@ + + + + + + + + + diff --git a/docs/source-app/_static/images/logo-large.svg b/docs/source-app/_static/images/logo-large.svg new file mode 100644 index 0000000..39531f9 --- /dev/null +++ b/docs/source-app/_static/images/logo-large.svg @@ -0,0 +1,9 @@ + + + + + + + + + diff --git a/docs/source-app/_static/images/logo-small.svg b/docs/source-app/_static/images/logo-small.svg new file mode 100644 index 0000000..1f523a5 --- /dev/null +++ b/docs/source-app/_static/images/logo-small.svg @@ -0,0 +1,9 @@ + + + + + + + + + diff --git a/docs/source-app/_static/images/logo.png b/docs/source-app/_static/images/logo.png new file mode 100644 index 0000000..392c965 Binary files /dev/null and b/docs/source-app/_static/images/logo.png differ diff --git a/docs/source-app/_static/images/logo.svg b/docs/source-app/_static/images/logo.svg new file mode 100644 index 0000000..60efaa2 --- /dev/null +++ b/docs/source-app/_static/images/logo.svg @@ -0,0 +1,12 @@ + + + + + + + + + + + + diff --git a/docs/_static/main.css b/docs/source-app/_static/main.css similarity index 100% rename from docs/_static/main.css rename to docs/source-app/_static/main.css diff --git a/docs/source-app/_templates/classtemplate.rst b/docs/source-app/_templates/classtemplate.rst new file mode 100644 index 0000000..5b7f465 --- /dev/null +++ b/docs/source-app/_templates/classtemplate.rst @@ -0,0 +1,9 @@ +.. role:: hidden + :class: hidden-section +.. currentmodule:: {{ module }} + + +{{ name | underline }} + +.. 
autoclass:: {{ name }} + :members: diff --git a/docs/source-app/_templates/classtemplate_no_index.rst b/docs/source-app/_templates/classtemplate_no_index.rst new file mode 100644 index 0000000..858c37b --- /dev/null +++ b/docs/source-app/_templates/classtemplate_no_index.rst @@ -0,0 +1,12 @@ +:orphan: + +.. role:: hidden + :class: hidden-section +.. currentmodule:: {{ module }} + + +{{ name | underline }} + +.. autoclass:: {{ name }} + :members: + :noindex: diff --git a/docs/source-app/_templates/layout.html b/docs/source-app/_templates/layout.html new file mode 100644 index 0000000..dfb2c26 --- /dev/null +++ b/docs/source-app/_templates/layout.html @@ -0,0 +1,10 @@ +{% extends "!layout.html" %} + + +{% block footer %} +{{ super() }} + + +{% endblock %} diff --git a/docs/source-app/_templates/theme_variables.jinja b/docs/source-app/_templates/theme_variables.jinja new file mode 100644 index 0000000..914f8dc --- /dev/null +++ b/docs/source-app/_templates/theme_variables.jinja @@ -0,0 +1,18 @@ +{%- set external_urls = { + 'github': 'https://github.com/Lightning-AI/lightning', + 'github_issues': 'https://github.com/Lightning-AI/lightning/issues', + 'contributing': 'https://github.com/Lightning-AI/lightning/blob/master/.github/CONTRIBUTING.md', + 'governance': 'https://github.com/Lightning-AI/lightning/blob/master/docs/source-pytorch/governance.rst', + 'docs': 'https://lightning.rtfd.io/en/latest', + 'twitter': 'https://twitter.com/PyTorchLightnin', + 'discuss': 'https://discord.gg/VptPCZkGNa', + 'tutorials': 'https://pt-lightning.readthedocs.io/en/latest/#tutorials', + 'previous_pytorch_versions': 'https://pt-lightning.rtfd.io/en/latest/', + 'home': 'https://lightning.ai/', + 'get_started': 'https://pt-lightning.readthedocs.io/en/latest/introduction_guide.html', + 'features': 'https://pt-lightning.rtfd.io/en/latest/', + 'blog': 'https://www.pytorchlightning.ai/blog', + 'resources': 'https://pt-lightning.readthedocs.io/en/latest/#community-examples', + 'support': 
'https://pt-lightning.rtfd.io/en/latest/', +} +-%} diff --git a/docs/source-app/api_reference/components.rst b/docs/source-app/api_reference/components.rst new file mode 100644 index 0000000..69d53b7 --- /dev/null +++ b/docs/source-app/api_reference/components.rst @@ -0,0 +1,35 @@ +######################## +lightning.app.components +######################## + +.. contents:: + :depth: 1 + :local: + :backlinks: top + +.. currentmodule:: lightning.app.components + + +Built-in Components +___________________ + +.. autosummary:: + :toctree: generated/ + :nosignatures: + :template: classtemplate.rst + + ~database.client.DatabaseClient + ~database.server.Database + ~python.popen.PopenPythonScript + ~python.tracer.TracerPythonScript + ~training.LightningTrainerScript + ~serve.gradio_server.ServeGradio + ~serve.serve.ModelInferenceAPI + ~serve.python_server.PythonServer + ~serve.streamlit.ServeStreamlit + ~multi_node.base.MultiNode + ~multi_node.fabric.FabricMultiNode + ~multi_node.pytorch_spawn.PyTorchSpawnMultiNode + ~multi_node.trainer.LightningTrainerMultiNode + ~serve.auto_scaler.AutoScaler + ~serve.auto_scaler.ColdStartProxy diff --git a/docs/source-app/api_reference/core.rst b/docs/source-app/api_reference/core.rst new file mode 100644 index 0000000..324f3c4 --- /dev/null +++ b/docs/source-app/api_reference/core.rst @@ -0,0 +1,26 @@ +:orphan: + +################## +lightning.app.core +################## + +.. contents:: + :depth: 1 + :local: + :backlinks: top + +.. currentmodule:: lightning.app.core + +Core APIs +___________________ + +.. autosummary:: + :toctree: api/ + :nosignatures: + :template: classtemplate.rst + + LightningApp + LightningFlow + LightningWork + +Learn more about :ref:`Lightning Core `. 
diff --git a/docs/source-app/api_reference/frontend.rst b/docs/source-app/api_reference/frontend.rst new file mode 100644 index 0000000..514b2cf --- /dev/null +++ b/docs/source-app/api_reference/frontend.rst @@ -0,0 +1,25 @@ +###################### +lightning.app.frontend +###################### + +.. contents:: + :depth: 1 + :local: + :backlinks: top + +.. currentmodule:: lightning.app.frontend + +Lightning FrontEnds +___________________ + +.. autosummary:: + :toctree: generated/ + :nosignatures: + :template: classtemplate.rst + + ~frontend.Frontend + ~web.StaticWebFrontend + ~stream_lit.StreamlitFrontend + ~panel.PanelFrontend + +Learn more about :ref:`Frontend's `. diff --git a/docs/source-app/api_reference/runners.rst b/docs/source-app/api_reference/runners.rst new file mode 100644 index 0000000..f7e550b --- /dev/null +++ b/docs/source-app/api_reference/runners.rst @@ -0,0 +1,21 @@ +##################### +lightning.app.runners +##################### + +.. contents:: + :depth: 1 + :local: + :backlinks: top + +.. currentmodule:: lightning.app.runners + +Lightning Core +______________ + +.. autosummary:: + :toctree: generated/ + :nosignatures: + :template: classtemplate.rst + + ~cloud.CloudRuntime + ~multiprocess.MultiProcessRuntime diff --git a/docs/source-app/api_reference/storage.rst b/docs/source-app/api_reference/storage.rst new file mode 100644 index 0000000..3173914 --- /dev/null +++ b/docs/source-app/api_reference/storage.rst @@ -0,0 +1,71 @@ +##################### +lightning.app.storage +##################### + +Lightning Core +______________ + +.. contents:: + :depth: 1 + :local: + :backlinks: top + +.. currentmodule:: lightning.app.storage + +.. autosummary:: + :toctree: generated/ + :nosignatures: + :template: classtemplate.rst + + ~path.Path + ~drive.Drive + ~payload.Payload + ~mount.Mount + +---- + +************************ +Learn more about Storage +************************ + +.. raw:: html + +
+
+ +.. displayitem:: + :header: Learn about the differences between Drive and Path. + :description: Learn about their differences. + :col_css: col-md-4 + :button_link: ../glossary/storage/differences.html + :height: 180 + :tag: Basic + +.. displayitem:: + :header: The Drive Object. + :description: Put, List and Get Files From a Shared Drive Disk. + :col_css: col-md-4 + :button_link: ../glossary/storage/drive.html + :height: 180 + :tag: Basic + +.. displayitem:: + :header: The Path Object. + :description: Transfer Files From One Component to Another by Reference. + :col_css: col-md-4 + :button_link: ../glossary/storage/path.html + :height: 180 + :tag: Intermediate + +.. displayitem:: + :header: The Mount Object. + :description: Mount an AWS S3 Bucket When Running on the Cloud. + :col_css: col-md-4 + :button_link: ../workflows/mount_aws_s3_bucket.html + :height: 180 + :tag: Intermediate + +.. raw:: html + +
+
diff --git a/docs/source-app/basics.rst b/docs/source-app/basics.rst new file mode 100644 index 0000000..8a64df8 --- /dev/null +++ b/docs/source-app/basics.rst @@ -0,0 +1,259 @@ +:orphan: + +.. _basics: + +###### +Basics +###### + +In this guide, we'll cover the basic terminology associated with the Lightning framework. + +---- + +************** +Lightning App +************** + +The :class:`~lightning.app.core.app.LightningApp` runs a tree of one or more components that interact to create end-to-end applications. There are two kinds of components: :class:`~lightning.app.core.flow.LightningFlow` and :class:`~lightning.app.core.work.LightningWork`. This modular design enables you to reuse components created by other users. + +---- + +Lightning Work +^^^^^^^^^^^^^^ + +The :class:`~lightning.app.core.work.LightningWork` component is a building block optimized for long-running jobs or integrating third-party services. LightningWork can be used for training large models, downloading a dataset, or any long-lasting operation. + +---- + +Lightning Flow +^^^^^^^^^^^^^^ + +The :class:`~lightning.app.core.flow.LightningFlow` component coordinates long-running :class:`~lightning.app.core.work.LightningWork` tasks and runs its child :class:`~lightning.app.core.flow.LightningFlow` components. + +---- + +Lightning App Tree +^^^^^^^^^^^^^^^^^^ + +Components can be nested to form component trees, where LightningFlows are the branches and LightningWorks are the leaves. + +Here's a basic application with four flows and two works: + +.. literalinclude:: code_samples/quickstart/app_comp.py + +And here's its associated tree structure: + +.. figure:: https://pl-public-data.s3.amazonaws.com/assets_lightning/tree.gif + :alt: Basic App Components + :width: 100 % + +A Lightning App runs all flows in a single process. Its flows coordinate the execution of the works, each of which runs in its own independent process.
+ +---- + +Lightning Distributed Event Loop +^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + +Drawing inspiration from modern web frameworks like `React.js <https://reactjs.org/>`_, the Lightning app runs all flows in an **event loop** (forever), which is triggered every 0.1 seconds after collecting any works' state change. + +.. figure:: https://pl-public-data.s3.amazonaws.com/assets_lightning/lightning_loop.gif + +When running an app in the cloud, the :class:`~lightning.app.core.work.LightningWork` components run on different machines. Lightning communicates any :class:`~lightning.app.core.work.LightningWork` state changes to the **event loop** which re-executes the flow with the newly-collected works' state. + +---- + +Lightning App State +^^^^^^^^^^^^^^^^^^^ + +By design, each component is stateful and its state is composed of all its attributes. The **Lightning App State** is the collection of the states of all its components. + +With this mechanism, any component can **react** to any other component's **state changes**, simply by relying on its attributes within the flow. + +For example, here we define two flow components, **RootFlow** and **ChildFlow**, where the child flow prints and increments a counter indefinitely, and this is reflected in the **RootFlow** state. + +You can easily check the state of your entire app: + +.. literalinclude:: code_samples/quickstart/app_01.py + +Here's the entire tree structure associated with your app: + +.. figure:: https://pl-public-data.s3.amazonaws.com/assets_lightning/parent_child.png + :alt: Parent Child Components + :width: 100 % + +And here's the output you get when running the above application using **Lightning CLI**: + +.. code-block:: console + + $ lightning run app docs/source/code_samples/quickstart/app_01.py + INFO: Your app has started.
View it in your browser: http://127.0.0.1:7501/view + State: {'works': {'w_1': {'vars': {'counter': 1}}, 'w_2': {'vars': {'counter': 0}}}} + + State: {'works': {'w_1': {'vars': {'counter': 3}}, 'w_2': {'vars': {'counter': 1}}}} + + State: {'works': {'w_1': {'vars': {'counter': 4}}, 'w_2': {'vars': {'counter': 1}}}} + + State: {'works': {'w_1': {'vars': {'counter': 5}}, 'w_2': {'vars': {'counter': 2}}}} + + State: {'works': {'w_1': {'vars': {'counter': 6}}, 'w_2': {'vars': {'counter': 2}}}} + + State: {'works': {'w_1': {'vars': {'counter': 7}}, 'w_2': {'vars': {'counter': 3}}}} + ... + +This app will count forever because the **lightning event loop** indefinitely calls the root flow run method. + +---- + +******************************* +Controlling the Execution Flow +******************************* + + +LightningWork: To Cache or Not to Cache Calls +^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + +With Lightning, you can control how to run your components. + +By default, the :class:`~lightning.app.core.flow.LightningFlow` is executed infinitely by the **Lightning Infinite Loop** and the :class:`~lightning.app.core.work.LightningWork` does not run in **parallel**, +meaning the **Lightning Infinite Loop** (a.k.a the flow) waits until that long-running work is completed to continue. + +Similar to `React.js Components and Props `_, the :class:`~lightning.app.core.work.LightningWork` +component accepts arbitrary inputs (the "props") to its **run** method and by default runs **once** for each unique input provided. + +Here's an example of this behavior: + +.. literalinclude:: code_samples/basics/0.py + :language: python + :emphasize-lines: 10, 19 + +And you should see the following by running the code above: + +.. code-block:: console + + $ python example.py + INFO: Your app has started. View it in your browser: http://127.0.0.1:7501/view + # After you have clicked `run` on the UI. 
+ I received the following props: args: () kwargs: {'value': 1} + I received the following props: args: () kwargs: {'value': 10} + +As you can see, the intermediate calls with the same input didn't execute because they were already cached. + +To disable this behavior, set ``cache_calls=False`` to make the LightningWork run on every call, even when the input is unchanged. + +.. literalinclude:: code_samples/basics/1.py + :diff: code_samples/basics/0.py + +.. code-block:: console + + $ python example.py + INFO: Your app has started. View it in your browser: http://127.0.0.1:7501/view + # After you have clicked `run` on the UI. + I received the following props: args: () kwargs: {'value': 1} + I received the following props: args: () kwargs: {'value': 1} + I received the following props: args: () kwargs: {'value': 1} + I received the following props: args: () kwargs: {'value': 1} + I received the following props: args: () kwargs: {'value': 1} + I received the following props: args: () kwargs: {'value': 10} + + +.. note:: Passing a sequence of different props to the work run method queues their execution. We recommend avoiding this behavior as it can be hard to debug. Instead, wait for the previous run to execute. + +---- + +LightningWork: Parallel vs Non Parallel +^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + +The LightningWork component is made for long-running jobs. + +As an example, let's create a long-running **LightningWork** component that will take 1 hour to do its "work". + +.. literalinclude:: code_samples/quickstart/app_02.py + :language: python + :emphasize-lines: 15 + +Here's the output you get when running the above application using **Lightning CLI**: + +.. code-block:: console + + $ lightning run app docs/source/code_samples/quickstart/app_02.py + INFO: Your app has started. View it in your browser: http://127.0.0.1:7501/view + # After you have clicked `run` on the UI. + 0.0 0.0 + ... + 0.0003 0.0003 + ... + 1.0 1.0 + ... + 1 hour later! + 1.0 1.0 + 1 hour later! + 1.0 1.0 + 1 hour later! + ...
+ +The child work runs only once, hence why the progress counter stops increasing once the work is completed. + +This is useful for monitoring the progress of a long-running operation, like training a big model. + +.. note :: + The Lightning Infinite Loop runs multiple cycles per second. + It is good practice to keep the loop running fast, so that your application stays responsive, + especially when it contains user-interface components. + +---- + +**************** +Multiple works +**************** + +In practical use cases, you might want to execute multiple long-running works in parallel. + +To enable this behavior, set ``parallel=True`` in the ``__init__`` method of +your :class:`~lightning.app.core.work.LightningWork`. + +Here's an example of the interaction between parallel and non-parallel behaviors: + +.. figure:: https://pl-public-data.s3.amazonaws.com/assets_lightning/blocking_non_blocking.gif + :alt: mnist GPU bar + :width: 100 % + +Below, we reuse the **HourLongWork** work defined in the previous example, but modify the **RootFlow** +to run two **HourLongWork** works in a parallel way. + +.. literalinclude:: code_samples/quickstart/app/app_0.py + :emphasize-lines: 21 + +Above, both ``child_work_1`` and ``child_work_2`` are long-running works that are executed +asynchronously in parallel. + +When running the above app, we see the following logs: + +.. code-block:: console + + $ lightning run app docs/source/code_samples/quickstart/app/app_0.py + INFO: Your app has started. View it in your browser: http://127.0.0.1:7501/view + # After you have clicked `run` on the UI. + 0.0, 0.0 + ... + 0.0003, 0.0003 + ... + 1.0, 1.0 + ... + 1 hour later `child_work_1` started! + 1 hour later `child_work_2` started! + 0.0, 0.0 + ... + 0.0003, 0.0003 + ... + 1.0, 1.0 + 1 hour later `child_work_1` started! + 1 hour later `child_work_2` started! + ... + +---- + +*********** +Next Steps +*********** + +To keep learning about Lightning, build a :ref:`ui_and_frontends`. 
diff --git a/docs/source-app/cloud/customize_a_lightning_cluster.rst b/docs/source-app/cloud/customize_a_lightning_cluster.rst new file mode 100644 index 0000000..6a2f12a --- /dev/null +++ b/docs/source-app/cloud/customize_a_lightning_cluster.rst @@ -0,0 +1,13 @@ +********************************* +Take full control of your cluster +********************************* +If you are an experienced user, we can enable you to fully own your cluster +configuration using terraform directly. Please email support@lightning.ai for more information. + +---- + +************************************** +Get help building an optimized cluster +************************************** +For enterprise and academic use-cases, we offer tailored cluster set up in case you don't +have experts in-house. Email support@lightning.ai. diff --git a/docs/source-app/code_samples/basics/0.py b/docs/source-app/code_samples/basics/0.py new file mode 100644 index 0000000..75959d9 --- /dev/null +++ b/docs/source-app/code_samples/basics/0.py @@ -0,0 +1,19 @@ +import lightning as L + + +class ExampleWork(L.LightningWork): + def run(self, *args, **kwargs): + print(f"I received the following props: args: {args} kwargs: {kwargs}") + + +work = ExampleWork() +work.run(value=1) + +# Providing the same value. This won't run as already cached. +work.run(value=1) +work.run(value=1) +work.run(value=1) +work.run(value=1) + +# Changing the provided value. This isn't cached and will run again. 
+work.run(value=10) diff --git a/docs/source-app/code_samples/basics/1.py b/docs/source-app/code_samples/basics/1.py new file mode 100644 index 0000000..3a249c8 --- /dev/null +++ b/docs/source-app/code_samples/basics/1.py @@ -0,0 +1,22 @@ +import lightning as L + + +class ExampleWork(L.LightningWork): + def __init__(self): + super().__init__(cache_calls=False) + + def run(self, *args, **kwargs): + print(f"I received the following props: args: {args} kwargs: {kwargs}") + + +work = ExampleWork() +work.run(value=1) + +# Providing the same value. With cache_calls=False, this runs again on every call. +work.run(value=1) +work.run(value=1) +work.run(value=1) +work.run(value=1) + +# Changing the provided value. This isn't cached and will run again. +work.run(value=10) diff --git a/docs/source-app/code_samples/convert_pl_to_app/app.py b/docs/source-app/code_samples/convert_pl_to_app/app.py new file mode 100644 index 0000000..e83a428 --- /dev/null +++ b/docs/source-app/code_samples/convert_pl_to_app/app.py @@ -0,0 +1,17 @@ +import lightning as L +from lightning.app.components import TracerPythonScript + + +class RootFlow(L.LightningFlow): + def __init__(self): + super().__init__() + self.runner = TracerPythonScript( + "train.py", + cloud_compute=L.CloudCompute("gpu"), + ) + + def run(self): + self.runner.run() + + +app = L.LightningApp(RootFlow()) diff --git a/docs/source-app/code_samples/convert_pl_to_app/requirements.txt b/docs/source-app/code_samples/convert_pl_to_app/requirements.txt new file mode 100644 index 0000000..e8fb43e --- /dev/null +++ b/docs/source-app/code_samples/convert_pl_to_app/requirements.txt @@ -0,0 +1,3 @@ +torch +torchvision +pytorch_lightning diff --git a/docs/source-app/code_samples/convert_pl_to_app/train.py b/docs/source-app/code_samples/convert_pl_to_app/train.py new file mode 100644 index 0000000..6dd3042 --- /dev/null +++ b/docs/source-app/code_samples/convert_pl_to_app/train.py @@ -0,0 +1,46 @@ +import os + +import torch +import torch.nn.functional as F +from
torch import nn +from torch.utils.data import DataLoader, random_split +from torchvision import transforms as T +from torchvision.datasets import MNIST + +import pytorch_lightning as pl + + +class LitAutoEncoder(pl.LightningModule): + def __init__(self): + super().__init__() + self.encoder = nn.Sequential(nn.Linear(28 * 28, 128), nn.ReLU(), nn.Linear(128, 3)) + self.decoder = nn.Sequential(nn.Linear(3, 128), nn.ReLU(), nn.Linear(128, 28 * 28)) + + def forward(self, x): + # in lightning, + # forward defines the prediction/inference actions + embedding = self.encoder(x) + return embedding + + def training_step(self, batch, batch_idx): + # training_step defines the train loop. + # It is independent of forward + x, y = batch + x = x.view(x.size(0), -1) + z = self.encoder(x) + x_hat = self.decoder(z) + loss = F.mse_loss(x_hat, x) + self.log("train_loss", loss) + return loss + + def configure_optimizers(self): + optimizer = torch.optim.Adam(self.parameters(), lr=1e-3) + return optimizer + + +dataset = MNIST(os.getcwd(), download=True, transform=T.ToTensor()) +train, val = random_split(dataset, [55000, 5000]) + +autoencoder = LitAutoEncoder() +trainer = pl.Trainer(accelerator="auto") +trainer.fit(autoencoder, DataLoader(train), DataLoader(val)) diff --git a/docs/.nojekyll b/docs/source-app/code_samples/quickstart/__init__.py similarity index 100% rename from docs/.nojekyll rename to docs/source-app/code_samples/quickstart/__init__.py diff --git a/docs/source-app/code_samples/quickstart/app/__init__.py b/docs/source-app/code_samples/quickstart/app/__init__.py new file mode 100644 index 0000000..e69de29 diff --git a/docs/source-app/code_samples/quickstart/app/app_0.py b/docs/source-app/code_samples/quickstart/app/app_0.py new file mode 100644 index 0000000..82b687b --- /dev/null +++ b/docs/source-app/code_samples/quickstart/app/app_0.py @@ -0,0 +1,21 @@ +import lightning as L +from docs.quickstart.app_02 import HourLongWork + + +class RootFlow(L.LightningFlow): + def 
__init__(self, child_work_1: L.LightningWork, child_work_2: L.LightningWork): + super().__init__() + self.child_work_1 = child_work_1 + self.child_work_2 = child_work_2 + + def run(self): + print(round(self.child_work_1.progress, 4), round(self.child_work_2.progress, 4)) + self.child_work_1.run() + self.child_work_2.run() + if self.child_work_1.progress == 1.0: + print("1 hour later `child_work_1` started!") + if self.child_work_2.progress == 1.0: + print("1 hour later `child_work_2` started!") + + +app = L.LightningApp(RootFlow(HourLongWork(parallel=True), HourLongWork(parallel=True))) diff --git a/docs/source-app/code_samples/quickstart/app/app_1.py b/docs/source-app/code_samples/quickstart/app/app_1.py new file mode 100644 index 0000000..29d8db2 --- /dev/null +++ b/docs/source-app/code_samples/quickstart/app/app_1.py @@ -0,0 +1,92 @@ +import flash +from flash.core.data.utils import download_data +from flash.image import ImageClassificationData, ImageClassifier + +import lightning as L +from pytorch_lightning.callbacks import ModelCheckpoint + + +# Step 1: Create a training LightningWork component that gets a backbone as input +# and saves the best model and its score +class ImageClassifierTrainWork(L.LightningWork): + def __init__(self, max_epochs: int, backbone: str, cloud_compute: L.CloudCompute): + # parallel is set to True to run asynchronously + super().__init__(parallel=True, cloud_compute=cloud_compute) + # Number of epochs to run + self.max_epochs = max_epochs + # The model backbone to train on + self.backbone = backbone + self.best_model_path = None + self.best_model_score = None + + def run(self, train_folder): + # Create a datamodule from the given dataset + datamodule = ImageClassificationData.from_folders( + train_folder=train_folder, + batch_size=1, + val_split=0.5, + ) + # Create an image classfier task with the given backbone + model = ImageClassifier(datamodule.num_classes, backbone=self.backbone) + # Start a Lightning trainer, with 1 training 
batch and 4 validation batches + trainer = flash.Trainer( + max_epochs=self.max_epochs, + limit_train_batches=1, + limit_val_batches=4, + callbacks=[ModelCheckpoint(monitor="val_cross_entropy")], + ) + # Train the model + trainer.fit(model, datamodule=datamodule) + # Save the model path + self.best_model_path = trainer.checkpoint_callback.best_model_path + # Save the model score + self.best_model_score = trainer.checkpoint_callback.best_model_score.item() + + +# Step 2: Create a serving LightningWork component that gets a model input and serves it +class ImageClassifierServeWork(L.LightningWork): + def run(self, best_model_path: str): + # Load the model from the model path + model = ImageClassifier.load_from_checkpoint(best_model_path) + model.serve(output="labels") + + +# Step 3: Create a root LightningFlow component that gets number of epochs and a path to +# a dataset as inputs, initialize 2 training components and serves the best model +class RootFlow(L.LightningFlow): + def __init__(self, max_epochs: int, data_dir: str): + super().__init__() + self.data_dir = data_dir + # Init an image classifier with resnet18 backbone + self.train_work_1 = ImageClassifierTrainWork( + max_epochs, + "resnet18", + ) + # Init an image classifier with resnet26 backbone + self.train_work_2 = ImageClassifierTrainWork( + max_epochs, + "resnet26", + ) + # Init the serving component + self.server_work = ImageClassifierServeWork() + + def run(self): + # running both `train_work_1` and `train_work_2` in parallel and asynchronously. + self.train_work_1.run(self.data_dir) + self.train_work_2.run(self.data_dir) + + # run serve_work only when both `best_model_score` are available. + if self.train_work_1.best_model_score and self.train_work_2.best_model_score: + # serve only the best model between `train_work_1` and `train_work_2`. 
+ self.server_work.run( + self.train_work_1.best_model_path + if self.train_work_1.best_model_score < self.train_work_2.best_model_score + else self.train_work_2.best_model_path + ) + + +# Step 4: download a dataset to your local directory under `/data` +download_data("https://pl-flash-data.s3.amazonaws.com/hymenoptera_data.zip", "./data") + +# Initialize your Lightning app with 5 epochs +app = L.LightningApp(RootFlow(5, "./data/hymenoptera_data")) diff --git a/docs/source-app/code_samples/quickstart/app_01.py b/docs/source-app/code_samples/quickstart/app_01.py new file mode 100644 index 0000000..0a435c6 --- /dev/null +++ b/docs/source-app/code_samples/quickstart/app_01.py @@ -0,0 +1,27 @@ +import lightning as L +from lightning.app.utilities.app_helpers import pretty_state + + +class Work(L.LightningWork): + def __init__(self): + super().__init__(cache_calls=False) + # Attributes are registered automatically in the state. + self.counter = 0 + + def run(self): + # Incrementing an attribute gets reflected in the `Flow` state. + self.counter += 1 + + +class Flow(L.LightningFlow): + def __init__(self): + super().__init__() + self.w = Work() + + def run(self): + if self.w.has_started: + print(f"State: {pretty_state(self.state)} \n") + self.w.run() + + +app = L.LightningApp(Flow()) diff --git a/docs/source-app/code_samples/quickstart/app_02.py b/docs/source-app/code_samples/quickstart/app_02.py new file mode 100644 index 0000000..e756019 --- /dev/null +++ b/docs/source-app/code_samples/quickstart/app_02.py @@ -0,0 +1,32 @@ +from time import sleep + +import lightning as L + + +# This work takes an hour to run +class HourLongWork(L.LightningWork): + def __init__(self, parallel: bool = False): + super().__init__(parallel=parallel) + self.progress = 0.0 + + def run(self): + self.progress = 0.0 + for _ in range(3600): + self.progress += 1.0 / 3600 # Reporting my progress to the Flow. 
+ sleep(1) + + +class RootFlow(L.LightningFlow): + def __init__(self, child_work: L.LightningWork): + super().__init__() + self.child_work = child_work + + def run(self): + # prints the progress from the child work + print(round(self.child_work.progress, 4)) + self.child_work.run() + if self.child_work.counter == 1.0: + print("1 hour later!") + + +app = L.LightningApp(RootFlow(HourLongWork())) diff --git a/docs/source-app/code_samples/quickstart/app_03.py b/docs/source-app/code_samples/quickstart/app_03.py new file mode 100644 index 0000000..ee2047a --- /dev/null +++ b/docs/source-app/code_samples/quickstart/app_03.py @@ -0,0 +1,31 @@ +from time import sleep + +import lightning as L + + +class HourLongWork(L.LightningWork): + def __init__(self): + super().__init__(cache_calls=False) + self.progress = 0.0 + + def run(self): + self.progress = 0.0 + for _ in range(3600): + self.progress += 1.0 / 3600 + sleep(1) + + +class RootFlow(L.LightningFlow): + def __init__(self, child_work: L.LightningWork): + super().__init__() + self.child_work = child_work + + def run(self): + # prints the progress from the child work + print(round(self.child_work.progress, 4)) + self.child_work.run() + if self.child_work.counter == 1.0: + print("1 hour later!") + + +app = L.LightningApp(RootFlow(HourLongWork())) diff --git a/docs/source-app/code_samples/quickstart/app_comp.py b/docs/source-app/code_samples/quickstart/app_comp.py new file mode 100644 index 0000000..d09c89b --- /dev/null +++ b/docs/source-app/code_samples/quickstart/app_comp.py @@ -0,0 +1,26 @@ +import lightning as L +from lightning.app.testing import EmptyFlow, EmptyWork + + +class FlowB(L.LightningFlow): + def __init__(self): + super().__init__() + self.flow_d = EmptyFlow() + self.work_b = EmptyWork() + + def run(self): + ... + + +class FlowA(L.LightningFlow): + def __init__(self): + super().__init__() + self.flow_b = FlowB() + self.flow_c = EmptyFlow() + self.work_a = EmptyWork() + + def run(self): + ... 
+ + +app = L.LightningApp(FlowA()) diff --git a/docs/source-app/code_samples/quickstart/hello_world/app.py b/docs/source-app/code_samples/quickstart/hello_world/app.py new file mode 100644 index 0000000..94ac255 --- /dev/null +++ b/docs/source-app/code_samples/quickstart/hello_world/app.py @@ -0,0 +1,15 @@ +import lightning as L + + +# Step 1: Subclass LightningFlow component to define the app flow. +class HelloWorld(L.LightningFlow): + # Step 2: Add the app logic to the LightningFlow run method to + # ``print("Hello World!")`. + # The LightningApp executes the run method of the main LightningFlow + # within an infinite loop. + def run(self): + print("Hello World!") + + +# Step 3: Initialize a LightningApp with the LightningFlow you defined (in step 1) +app = L.LightningApp(HelloWorld()) diff --git a/docs/source-app/code_samples/quickstart/hello_world/app_ui.py b/docs/source-app/code_samples/quickstart/hello_world/app_ui.py new file mode 100644 index 0000000..67fa6aa --- /dev/null +++ b/docs/source-app/code_samples/quickstart/hello_world/app_ui.py @@ -0,0 +1,57 @@ +import os + +import lightning as L +from lightning.app.frontend import StaticWebFrontend, StreamlitFrontend +from lightning.app.utilities.state import AppState + + +# Step 1: Define your LightningFlow component with the app UI +class UIStreamLit(L.LightningFlow): + def __init__(self): + super().__init__() + self.should_print = False + + # Step 2: Override `configure_layout` to define the layout of the UI + # In this example, we are using `StreamlitFrontend` + def configure_layout(self): + return StreamlitFrontend(render_fn=render_fn) + + +# Step 3: Implement the StreamLit render method +def render_fn(state: AppState): + import streamlit as st + from streamlit_autorefresh import st_autorefresh + + st_autorefresh(interval=2000, limit=None, key="refresh") + + state.should_print = st.select_slider( + "Should the Application print 'Hello World !' 
to the terminal:", + [False, True], + ) + + +# Step 4: Implement a Static Web Frontend. This could be react, vue, etc. +class UIStatic(L.LightningFlow): + # Step 5: + def configure_layout(self): + return StaticWebFrontend(os.path.join(os.path.dirname(__file__), "ui")) + + +# Step 6: Implement the root flow. +class HelloWorld(L.LightningFlow): + def __init__(self): + super().__init__() + self.static_ui = UIStatic() + self.streamlit_ui = UIStreamLit() + + def run(self): + print("Hello World!" if self.streamlit_ui.should_print else "") + + def configure_layout(self): + return [ + {"name": "StreamLit", "content": self.streamlit_ui}, + {"name": "Static", "content": self.static_ui}, + ] + + +app = L.LightningApp(HelloWorld()) diff --git a/docs/source-app/code_samples/quickstart/hello_world/ui/index.html b/docs/source-app/code_samples/quickstart/hello_world/ui/index.html new file mode 100644 index 0000000..fe38c43 --- /dev/null +++ b/docs/source-app/code_samples/quickstart/hello_world/ui/index.html @@ -0,0 +1 @@ +
Hello from component UIStatic
diff --git a/docs/source-app/conf.py b/docs/source-app/conf.py new file mode 100644 index 0000000..3541b27 --- /dev/null +++ b/docs/source-app/conf.py @@ -0,0 +1,398 @@ +# Configuration file for the Sphinx documentation builder. +# +# This file does only contain a selection of the most common options. For a +# full list see the documentation: +# http://www.sphinx-doc.org/en/master/config + +# -- Path setup -------------------------------------------------------------- + +# If extensions (or modules to document with autodoc) are in another directory, +# add these directories to sys.path here. If the directory is relative to the +# documentation root, use os.path.abspath to make it absolute, like shown here. + +import glob +import inspect +import os +import shutil +import sys + +import pt_lightning_sphinx_theme +from lightning_utilities.docs import fetch_external_assets + +import lightning + +_PATH_HERE = os.path.abspath(os.path.dirname(__file__)) +_PATH_ROOT = os.path.realpath(os.path.join(_PATH_HERE, "..", "..")) +sys.path.insert(0, os.path.abspath(_PATH_ROOT)) + +SPHINX_MOCK_REQUIREMENTS = int(os.environ.get("SPHINX_MOCK_REQUIREMENTS", True)) + +# -- Project information ----------------------------------------------------- + +# this name shall match the project name in Github as it is used for linking to code +project = "lightning" +copyright = lightning.__copyright__ +author = lightning.__author__ + +# The short X.Y version +version = lightning.__version__ +# The full version, including alpha/beta/rc tags +release = lightning.__version__ + +# Options for the linkcode extension +# ---------------------------------- +github_user = "Lightning-AI" +github_repo = project + +# -- Project documents ------------------------------------------------------- + + +fetch_external_assets( + docs_folder=_PATH_HERE, assets_folder="_static/fetched-s3-assets", retrieve_pattern=r"https?://[-a-zA-Z0-9_]+\.s3\.[-a-zA-Z0-9()_\\+.\\/=]+" +) + +# -- General configuration 
--------------------------------------------------- + +# If your documentation needs a minimal Sphinx version, state it here. + +needs_sphinx = "4.5" + +# Add any Sphinx extension module names here, as strings. They can be +# extensions coming with Sphinx (named 'sphinx.ext.*') or your custom +# ones. +extensions = [ + "sphinx.ext.autodoc", + "sphinx.ext.doctest", + "sphinx.ext.intersphinx", + "sphinx_toolbox.collapse", + "sphinx.ext.todo", + "sphinx.ext.coverage", + "sphinx.ext.linkcode", + "sphinx.ext.autosummary", + "sphinx.ext.napoleon", + "sphinx.ext.imgmath", + # 'sphinxcontrib.mockautodoc', # raises error: directive 'automodule' is already registered ... + # 'sphinxcontrib.fulltoc', # breaks pytorch-theme with unexpected kw argument 'titles_only' + "sphinxcontrib.video", + "myst_parser", + "sphinx.ext.autosectionlabel", + "nbsphinx", + "sphinx_autodoc_typehints", + "sphinx_copybutton", + "sphinx_paramlinks", + "sphinx_togglebutton", + "sphinx.ext.githubpages", + # "lai_sphinx_theme.extensions.lightning", + "pt_lightning_sphinx_theme.extensions.lightning", +] + +# Add any paths that contain templates here, relative to this directory. +templates_path = ["_templates"] + +# myst-parser, forcing to parse all html pages with mathjax +# https://github.com/executablebooks/MyST-Parser/issues/394 +myst_update_mathjax = False +# https://myst-parser.readthedocs.io/en/latest/syntax/optional.html?highlight=anchor#auto-generated-header-anchors +myst_heading_anchors = 3 + +# https://berkeley-stat159-f17.github.io/stat159-f17/lectures/14-sphinx..html#conf.py-(cont.) +# https://stackoverflow.com/questions/38526888/embed-ipython-notebook-in-sphinx-document +# I execute the notebooks manually in advance. If notebooks test the code, +# they should be run at build time. +nbsphinx_execute = "never" +nbsphinx_allow_errors = True +nbsphinx_requirejs_path = "" + +# The suffix(es) of source filenames. 
+# You can specify multiple suffix as a list of string: +# +# source_suffix = ['.rst', '.md'] +# source_suffix = ['.rst', '.md', '.ipynb'] +source_suffix = { + ".rst": "restructuredtext", + ".txt": "markdown", + ".md": "markdown", + ".ipynb": "nbsphinx", +} + +# The master toctree document. +master_doc = "index" + +# The language for content autogenerated by Sphinx. Refer to documentation +# for a list of supported languages. +# +# This is also used if you do content translation via gettext catalogs. +# Usually you set "language" from the command line for these cases. +language = 'en' + +# List of patterns, relative to source-app directory, that match files and +# directories to ignore when looking for source-app files. +# This pattern also affects html_static_path and html_extra_path. +exclude_patterns = [ + "PULL_REQUEST_TEMPLATE.md", + "**/README.md/*", + "readme.md", + "_templates", + "code_samples/convert_pl_to_app/requirements.txt", + "**/_static/*" +] + +# The name of the Pygments (syntax highlighting) style to use. +pygments_style = None + +# -- Options for HTML output ------------------------------------------------- + +# The theme to use for HTML and HTML Help pages. See the documentation for +# a list of builtin themes. +# +# html_theme = "lai_sphinx_theme" +html_theme = "pt_lightning_sphinx_theme" +html_theme_path = [os.environ.get('LIT_SPHINX_PATH', pt_lightning_sphinx_theme.get_html_theme_path())] + +# Theme options are theme-specific and customize the look and feel of a theme +# further. For a list of options available for each theme, see the +# documentation. + +html_theme_options = { + "pytorch_project": lightning.__homepage__, + "analytics_id": "G-D3Q2ESCTZR", + "canonical_url": lightning.__homepage__, + "collapse_navigation": False, + "display_version": True, + "logo_only": False, +} + +html_favicon = "_static/images/icon.svg" + +# Add any paths that contain custom static files (such as style sheets) here, +# relative to this directory. 
They are copied after the builtin static files, +# so a file named "default.css" will overwrite the builtin "default.css". +html_static_path = ["_templates", "_static"] + +# Custom sidebar templates, must be a dictionary that maps document names +# to template names. +# +# The default sidebars (for documents that don't match any pattern) are +# defined by theme itself. Builtin themes are using these templates by +# default: ``['localtoc.html', 'relations.html', 'sourcelink.html', +# 'searchbox.html']``. +# +# html_sidebars = {} + +# -- Options for HTMLHelp output --------------------------------------------- + +# Output file base name for HTML help builder. +htmlhelp_basename = project + "-doc" + +# -- Options for LaTeX output ------------------------------------------------ + +latex_elements = { + # The paper size ('letterpaper' or 'a4paper'). + # 'papersize': 'letterpaper', + # The font size ('10pt', '11pt' or '12pt'). + # 'pointsize': '10pt', + # Additional stuff for the LaTeX preamble. + # 'preamble': '', + # Latex figure (float) alignment + "figure_align": "htbp", +} + +# Grouping the document tree into LaTeX files. List of tuples +# (source-app start file, target name, title, +# author, documentclass [howto, manual, or own class]). +latex_documents = [ + (master_doc, project + ".tex", project + " Documentation", author, "manual"), +] + +# -- Options for manual page output ------------------------------------------ + +# One entry per manual page. List of tuples +# (source-app start file, name, description, authors, manual section). +man_pages = [(master_doc, project, project + " Documentation", [author], 1)] + +# -- Options for Texinfo output ---------------------------------------------- + +# Grouping the document tree into Texinfo files. 
List of tuples +# (source-app start file, target name, title, author, +# dir menu entry, description, category) +texinfo_documents = [ + ( + master_doc, + project, + project + " Documentation", + author, + project, + lightning.__docs__, + "Miscellaneous", + ), +] + +# -- Options for Epub output ------------------------------------------------- + +# Bibliographic Dublin Core info. +epub_title = project + +# The unique identifier of the text. This can be a ISBN number +# or the project homepage. +# +# epub_identifier = '' + +# A unique identification for the text. +# +# epub_uid = '' + +# A list of files that should not be packed into the epub file. +epub_exclude_files = ["search.html"] + +# -- Extension configuration ------------------------------------------------- + +# -- Options for intersphinx extension --------------------------------------- + +# Example configuration for intersphinx: refer to the Python standard library. +intersphinx_mapping = { + "python": ("https://docs.python.org/3", None), + "torch": ("https://pytorch.org/docs/stable/", None), + # "numpy": ("https://docs.scipy.org/doc/numpy/", None), +} + +# -- Options for todo extension ---------------------------------------------- + +# If true, `todo` and `todoList` produce output, else they produce nothing. 
+todo_include_todos = True + + +def setup(app): + # this is for hiding doctest decoration, + # see: http://z4r.github.io/python/2011/12/02/hides-the-prompts-and-output/ + app.add_js_file("copybutton.js") + app.add_css_file("main.css") + + +# copy all notebooks to local folder +path_nbs = os.path.join(_PATH_HERE, "notebooks") +if not os.path.isdir(path_nbs): + os.mkdir(path_nbs) +for path_ipynb in glob.glob(os.path.join(_PATH_ROOT, "notebooks", "*.ipynb")): + path_ipynb2 = os.path.join(path_nbs, os.path.basename(path_ipynb)) + shutil.copy(path_ipynb, path_ipynb2) + +# copy all examples to local folder +path_examples = os.path.join(_PATH_HERE, "..", "examples") +if not os.path.isdir(path_examples): + os.mkdir(path_examples) +for path_app_example in glob.glob(os.path.join(_PATH_ROOT, "examples", "app_*")): + path_app_example2 = os.path.join(path_examples, os.path.basename(path_app_example)) + if not os.path.isdir(path_app_example2): + shutil.copytree(path_app_example, path_app_example2, dirs_exist_ok=True) + + +# Ignoring Third-party packages +# https://stackoverflow.com/questions/15889621/sphinx-how-to-exclude-imports-in-automodule +def _package_list_from_file(file): + list_pkgs = [] + with open(file) as fp: + lines = fp.readlines() + for ln in lines: + found = [ln.index(ch) for ch in list(",=<>#") if ch in ln] + pkg = ln[: min(found)] if found else ln + if pkg.rstrip(): + list_pkgs.append(pkg.rstrip()) + return list_pkgs + + +# define mapping from PyPI names to python imports +PACKAGE_MAPPING = { + "PyYAML": "yaml", +} +MOCK_PACKAGES = [] +if SPHINX_MOCK_REQUIREMENTS: + # mock also base packages when we are on RTD since we don't install them there + MOCK_PACKAGES += _package_list_from_file(os.path.join(_PATH_ROOT, "requirements.txt")) +MOCK_PACKAGES = [PACKAGE_MAPPING.get(pkg, pkg) for pkg in MOCK_PACKAGES] + +autodoc_mock_imports = MOCK_PACKAGES + + +# Resolve function +# This function is used to populate the (source-app) links in the API +def 
linkcode_resolve(domain, info): + def find_source(): + # try to find the file and line number, based on code from numpy: + # https://github.com/numpy/numpy/blob/master/doc/source/conf.py#L286 + obj = sys.modules[info["module"]] + for part in info["fullname"].split("."): + obj = getattr(obj, part) + fname = inspect.getsourcefile(obj) + # https://github.com/rtfd/readthedocs.org/issues/5735 + if any(s in fname for s in ("readthedocs", "rtfd", "checkouts")): + # /home/docs/checkouts/readthedocs.org/user_builds/pytorch_lightning/checkouts/ + # devel/pytorch_lightning/utilities/cls_experiment.py#L26-L176 + path_top = os.path.abspath(os.path.join("..", "..", "..")) + fname = os.path.relpath(fname, start=path_top) + else: + # Local build, imitate master + fname = "master/" + os.path.relpath(fname, start=os.path.abspath("..")) + source, lineno = inspect.getsourcelines(obj) + return fname, lineno, lineno + len(source) - 1 + + if domain != "py" or not info["module"]: + return None + try: + filename = "%s#L%d-L%d" % find_source() + except Exception: + filename = info["module"].replace(".", "/") + ".py" + # import subprocess + # tag = subprocess.Popen(['git', 'rev-parse', 'HEAD'], stdout=subprocess.PIPE, + # universal_newlines=True).communicate()[0][:-1] + branch = filename.split("/")[0] + # do mapping from latest tags to master + branch = {"latest": "master", "stable": "master"}.get(branch, branch) + filename = "/".join([branch] + filename.split("/")[1:]) + return f"https://github.com/{github_user}/{github_repo}/blob/{filename}" + + +autosummary_generate = True + +autodoc_member_order = "groupwise" +autoclass_content = "both" +# the options are fixed and will be soon in release, +# see https://github.com/sphinx-doc/sphinx/issues/5459 +autodoc_default_options = { + "members": None, + "methods": None, + # 'attributes': None, + "special-members": "__call__", + "exclude-members": "_abc_impl", + "show-inheritance": True, + "private-members": True, + "noindex": True, +} + +# Sphinx 
will add “permalinks” for each heading and description environment as paragraph signs that +# become visible when the mouse hovers over them. +# This value determines the text for the permalink; it defaults to "¶". Set it to None or the empty +# string to disable permalinks. +# https://www.sphinx-doc.org/en/master/usage/configuration.html#confval-html_permalinks +# html_add_permalinks = "¶" +# True to prefix each section label with the name of the document it is in, followed by a colon. +# For example, index:Introduction for a section called Introduction that appears in document index.rst. +# Useful for avoiding ambiguity when the same section heading appears in different documents. +# http://www.sphinx-doc.org/en/master/usage/extensions/autosectionlabel.html +autosectionlabel_prefix_document = True + +# only run doctests marked with a ".. doctest::" directive +doctest_test_doctest_blocks = "" +doctest_global_setup = """ +import importlib +import os +import lightning as L + +from lightning.fabric.loggers.tensorboard import _TENSORBOARD_AVAILABLE, _TENSORBOARDX_AVAILABLE +""" +coverage_skip_undoc_in_source = True + +# skip false positive linkcheck errors from anchors +linkcheck_anchors = False + +# ignore all links in any CHANGELOG file +linkcheck_exclude_documents = [r"^(.*\/)*CHANGELOG.*$"] diff --git a/docs/source-app/contribute_app.rst b/docs/source-app/contribute_app.rst new file mode 100644 index 0000000..2f690e8 --- /dev/null +++ b/docs/source-app/contribute_app.rst @@ -0,0 +1,7 @@ +:orphan: + +################# +Contribute an app +################# + +Show off your work! Contribute an example to be highlighted in our documentation and App gallery. 
diff --git a/docs/source-app/core_api/lightning_app/app.py b/docs/source-app/core_api/lightning_app/app.py new file mode 100644 index 0000000..0a435c6 --- /dev/null +++ b/docs/source-app/core_api/lightning_app/app.py @@ -0,0 +1,27 @@ +import lightning as L +from lightning.app.utilities.app_helpers import pretty_state + + +class Work(L.LightningWork): + def __init__(self): + super().__init__(cache_calls=False) + # Attributes are registered automatically in the state. + self.counter = 0 + + def run(self): + # Incrementing an attribute gets reflected in the `Flow` state. + self.counter += 1 + + +class Flow(L.LightningFlow): + def __init__(self): + super().__init__() + self.w = Work() + + def run(self): + if self.w.has_started: + print(f"State: {pretty_state(self.state)} \n") + self.w.run() + + +app = L.LightningApp(Flow()) diff --git a/docs/source-app/core_api/lightning_app/communication.rst b/docs/source-app/core_api/lightning_app/communication.rst new file mode 100644 index 0000000..9a823b0 --- /dev/null +++ b/docs/source-app/core_api/lightning_app/communication.rst @@ -0,0 +1,15 @@ +:orphan: + +########################################## +Communication between Lightning Components +########################################## + +**Audience:** Users that want to create interactive applications. + +**Level:** Intermediate + +**Prerequisite**: Read the `Communication in Lightning Apps article <../../access_app_state.html>`_. + +---- + +.. 
include:: ../../core_api/lightning_app/communication_content.rst diff --git a/docs/source-app/core_api/lightning_app/communication_content.rst b/docs/source-app/core_api/lightning_app/communication_content.rst new file mode 100644 index 0000000..ea39749 --- /dev/null +++ b/docs/source-app/core_api/lightning_app/communication_content.rst @@ -0,0 +1,160 @@ + +******************************** +Communication Between Components +******************************** + +When creating interactive Lightning Apps (App) with multiple components, you may need your components to share information with each other and rely on that information to control their execution, share progress in the UI, trigger a sequence of operations, etc. + +To accomplish that, Lightning components can communicate using the App State. The App State is composed of all attributes defined within each component's **__init__** method, e.g., anything attached to the component with **self.x = y**. + +All attributes of all **LightningWork (Work)** components are accessible in the **LightningFlow (Flow)** components in real-time. + +By design, the Flows communicate to all **Works** within the application. However, Works can't communicate with each other directly, they must use Flows as a proxy to communicate. + +Once a Work is running, any updates to the Work's state are automatically communicated to the Flow, as a delta (using `DeepDiff <https://github.com/seperman/deepdiff>`_). The state communication isn't bi-directional, communication is only done from Work to Flow. + +Internally, the App is alternately collecting deltas sent from all the registered Works and/or UI, and running the root Flow run method of the App. + +---- + +************************************************* +Communication from LightningWork to LightningFlow +************************************************* + +LightningFlow (Flow) can access their children's LightningWork (Work) state. 
+ +When a running Work attribute gets updated inside its method (separate process locally or remote machine), the app re-executes Flow's run method once it receives the state update from the Work. + +Here's an example to better understand communication from Work to Flow. + +The ``WorkCounter`` increments a counter until 10 million and the ``Flow`` prints the work counter. + +As the Work is running in its own process, its state changes are sent to the Flow which contains the latest value of the counter. + +.. code-block:: python + + import lightning as L + + + class WorkCounter(L.LightningWork): + def __init__(self): + super().__init__(parallel=True) + self.counter = 0 + + def run(self): + for _ in range(int(10e6)): + self.counter += 1 + + + class Flow(L.LightningFlow): + def __init__(self): + super().__init__() + self.w = WorkCounter() + + def run(self): + self.w.run() + print(self.w.counter) + + + app = L.LightningApp(Flow()) + + +A delta sent from the Work to the Flow looks like this: + +.. code-block:: python + + {"values_changed": {"root['works']['w']['vars']['counter']": {"new_value": 425}}} + +Here is the associated illustration: + +.. figure:: https://pl-public-data.s3.amazonaws.com/assets_lightning/deltas.gif + :alt: Mechanism showing how deltas are sent. + :width: 100 % + +Here's another example that is slightly different. Here we define a Flow and Work, where the Work increments a counter indefinitely and the Flow prints its state, which contains the Work's state. + +You can easily check the state of your entire app as follows: + +.. literalinclude:: ../../core_api/lightning_app/app.py + +Run the app with: + +.. code-block:: bash + + lightning run app docs/source-app/core_api/lightning_app/app.py + +And here's the output you get when running the App using the **Lightning CLI**: + +.. code-block:: console + + INFO: Your app has started. 
View it in your browser: http://127.0.0.1:7501/view + State: {'works': {'w': {'vars': {'counter': 1}}}} + State: {'works': {'w': {'vars': {'counter': 2}}}} + State: {'works': {'w': {'vars': {'counter': 3}}}} + State: {'works': {'w': {'vars': {'counter': 3}}}} + State: {'works': {'w': {'vars': {'counter': 4}}}} + ... + +---- + +************************************************* +Communication from LightningFlow to LightningWork +************************************************* + +Communication from the LightningFlow (Flow) to the LightningWork (Work) while running **isn't supported yet**. If your application requires this feature, please open an issue on Github. + +Here's an example of what would happen if you try to have the Flow communicate with the Work: + +.. code-block:: python + + import lightning as L + from time import sleep + + + class WorkCounter(L.LightningWork): + def __init__(self): + super().__init__(parallel=True) + self.counter = 0 + + def run(self): + while True: + sleep(1) + print(f"Work {self.counter}") + + + class Flow(L.LightningFlow): + def __init__(self): + super().__init__() + self.w = WorkCounter() + + def run(self): + self.w.run() + sleep(1) + print(f"Flow {self.w.counter}") + self.w.counter += 1 + + + app = L.LightningApp(Flow()) + +As you can see, there is a divergence between the values within the Work and the Flow. + +.. 
code-block:: console + + Flow 0 + Flow 1 + Flow 2 + Flow 3 + Work 0 + Flow 4 + Work 0 + Flow 5 + Work 0 + Flow 6 + Work 0 + Flow 7 + Work 0 + Flow 8 + Work 0 + Flow 9 + Work 0 + Flow 10 diff --git a/docs/source-app/core_api/lightning_app/compute_content.rst b/docs/source-app/core_api/lightning_app/compute_content.rst new file mode 100644 index 0000000..8bb2e70 --- /dev/null +++ b/docs/source-app/core_api/lightning_app/compute_content.rst @@ -0,0 +1,40 @@ +:orphan: + +*************************** +Customize my Flow resources +*************************** + +In the cloud, you can simply configure which machine to run on by passing +a :class:`~lightning.app.utilities.packaging.cloud_compute.CloudCompute` to the ``flow_cloud_compute`` argument of your ``LightningApp``: + +.. code-block:: python + + import lightning as L + + # Run on a small, shared CPU machine. This is the default for every LightningFlow. + app = L.LightningApp(L.Flow(), flow_cloud_compute=L.CloudCompute()) + + +Here is the full list of supported machine names: + +.. list-table:: Hardware by Accelerator Type + :widths: 25 25 25 + :header-rows: 1 + + * - Name + - # of CPUs + - Memory + * - flow-lite + - 0.3 + - 4 GB + +The up-to-date prices for these instances can be found `here `_. + +---- + +************ +CloudCompute +************ + +.. autoclass:: lightning.app.utilities.packaging.cloud_compute.CloudCompute + :noindex: diff --git a/docs/source-app/core_api/lightning_app/dynamic_work.rst b/docs/source-app/core_api/lightning_app/dynamic_work.rst new file mode 100644 index 0000000..bf202aa --- /dev/null +++ b/docs/source-app/core_api/lightning_app/dynamic_work.rst @@ -0,0 +1,15 @@ +:orphan: + +.. _dynamic_work: + +##################### +Dynamic LightningWork +##################### + +**Audience:** Users who want to create applications that adapt to user demands. + +**Level:** Advanced + +---- + +.. 
include:: dynamic_work_content.rst diff --git a/docs/source-app/core_api/lightning_app/dynamic_work_content.rst b/docs/source-app/core_api/lightning_app/dynamic_work_content.rst new file mode 100644 index 0000000..309e607 --- /dev/null +++ b/docs/source-app/core_api/lightning_app/dynamic_work_content.rst @@ -0,0 +1,202 @@ +*************************************** +What Dynamic LightningWork does for you +*************************************** + +Dynamic LightningWork (Work) changes the resources your application uses while the application is running (aka at runtime). + +For example, imagine you want to create a research notebook app for your team. You want every member to be able to create multiple `JupyterLab `_ sessions on their hardware of choice. + +To allow every notebook to choose hardware, it needs to be set up in its own :class:`~lightning.app.core.work.LightningWork`, but you can't know the number of notebooks users will need in advance. In this case you'll need to add ``LightningWorks`` dynamically at run time. + +---- + +***************** +Use Dynamic Works +***************** + +Dynamic Works should be used anytime you want to change the resources your application is using while it is running (aka at runtime). + +You're usually going to use the ``start`` and ``stop`` methods together. + +---- + +Add a Dynamic Work +^^^^^^^^^^^^^^^^^^ + +There are a couple of ways you can add a dynamic Work: + +- Option 1: Attach your components in the **run** method using the Python functions **hasattr**, **setattr**, and **getattr**. +- Option 2: Use the Lightning built-in classes :class:`~lightning.app.structures.Dict` or :class:`~lightning.app.structures.List`. + +.. note:: Using the Lightning built-in classes is usually easier to read. + +---- + +**OPTION 1:** Attach your components in the run method of a flow using the Python functions **hasattr**, **setattr**, and **getattr**: + +.. 
code-block:: python + + class RootFlow(lapp.LightningFlow): + + def run(self): + + if not hasattr(self, "work"): + # The `Work` component is created and attached here. + setattr(self, "work", Work()) + # Run the `Work` component. + getattr(self, "work").run() + +**OPTION 2:** Use the built-in Lightning classes :class:`~lightning.app.structures.Dict` or :class:`~lightning.app.structures.List` + +.. code-block:: python + + from lightning.app.structures import Dict + + class RootFlow(lapp.LightningFlow): + + def __init__(self): + super().__init__() + self.dict = Dict() + + def run(self): + if "work" not in self.dict: + # The `Work` component is attached here. + self.dict["work"] = Work() + self.dict["work"].run() + +---- + +Stop a Work +^^^^^^^^^^^ +Stop a work when you are concerned about cost. + +To stop a work, use the work ``stop`` method: + +.. code-block:: python + + class RootFlow(L.LightningFlow): + + def __init__(self): + super().__init__() + self.work = Work() + + def run(self): + self.work.stop() + +---- + +********************* +Dynamic Work Examples +********************* + +.. + The entire application can be found `here `_. + +---- + +Dynamic Work with Jupyter Notebooks +^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + +In this example, we are dynamically creating ``JupyterLabWork`` every time a user clicks the **Create Jupyter Notebook** button. + +In order to do that, we are iterating over the list of ``jupyter_config_requests`` infinitely. + +.. 
code-block:: python + + import lightning as L + + + class JupyterLabManager(L.LightningFlow): + + """This flow manages the users' notebooks running within works.""" + + def __init__(self): + super().__init__() + self.jupyter_works = L.structures.Dict() + self.jupyter_config_requests = [] + + def run(self): + for idx, jupyter_config in enumerate(self.jupyter_config_requests): + + # The Jupyter Config has this form: + # {"use_gpu": False/True, "token": None, "username": ..., "stop": False} + + # Step 1: Check if JupyterWork already exists for this username + username = jupyter_config["username"] + if username not in self.jupyter_works: + jupyter_config["ready"] = False + + # Set the hardware selected by the user: GPU or CPU. + cloud_compute = L.CloudCompute("gpu" if jupyter_config["use_gpu"] else "cpu-small") + + # Step 2: Create new JupyterWork dynamically ! + self.jupyter_works[username] = JupyterLabWork(cloud_compute=cloud_compute) + + # Step 3: Run the JupyterWork + self.jupyter_works[username].run() + + # Step 4: Store the notebook token in the associated config. + # We are using this to know when the notebook is ready + # and display the stop button on the UI. + if self.jupyter_works[username].token: + jupyter_config["token"] = self.jupyter_works[username].token + + # Step 5: Stop the work if the user requested it. + if jupyter_config['stop']: + self.jupyter_works[username].stop() + self.jupyter_config_requests.pop(idx) + + def configure_layout(self): + return L.app.frontend.StreamlitFrontend(render_fn=render_fn) + +---- + +Dynamic Works with Streamlit UI +^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + +Continuing from the Jupyter Notebook example, in the UI, we receive the **state** of the Jupyter Manager and the state can be modified directly from the UI. + +.. 
code-block:: python + + import streamlit as st + + + def render_fn(state): + + # Step 1: Enable users to select their notebooks and create them + column_1, column_2, column_3 = st.columns(3) + with column_1: + create_jupyter = st.button("Create Jupyter Notebook") + with column_2: + username = st.text_input('Enter your username', "tchaton") + assert username + with column_3: + use_gpu = st.checkbox('Use GPU') + + # Step 2: If a user clicked the button, add an element to the list of configs + # Note: state.jupyter_config_requests = ... will send the state update to the component. + if create_jupyter: + new_config = [{"use_gpu": use_gpu, "token": None, "username": username, "stop": False}] + state.jupyter_config_requests = state.jupyter_config_requests + new_config + + # Step 3: List of running notebooks. + for idx, config in enumerate(state.jupyter_config_requests): + column_1, column_2, column_3 = st.columns(3) + with column_1: + if not idx: + st.write(f"Idx") + st.write(f"{idx}") + with column_2: + if not idx: + st.write(f"Use GPU") + st.write(config['use_gpu']) + with column_3: + if not idx: + st.write(f"Stop") + if config["token"]: + should_stop = st.button("Stop this notebook") + + # Step 4: Change stop if the user clicked the button + if should_stop: + config["stop"] = should_stop + state.jupyter_config_requests = state.jupyter_config_requests diff --git a/docs/source-app/core_api/lightning_app/index.rst b/docs/source-app/core_api/lightning_app/index.rst new file mode 100644 index 0000000..bf0430f --- /dev/null +++ b/docs/source-app/core_api/lightning_app/index.rst @@ -0,0 +1,94 @@ +############# +Lightning App +############# +**Audience:** Users who want to know how an app works under the hood 🤯. + +**Lightning App:** We call workflows composed of multiple LightningWorks a **Lightning App**. + +---- + +******************* +Peek under the hood +******************* + + +.. raw:: html + +
+
+ +.. displayitem:: + :header: App Components Tree (Basic) + :description: Learn more about component composition and nesting. + :col_css: col-md-4 + :button_link: ../../glossary/app_tree.html + :height: 180 + :tag: Basic + +.. displayitem:: + :header: The event loop (Basic) + :description: Learn more about the event loop. + :col_css: col-md-4 + :button_link: ../../glossary/event_loop.html + :height: 180 + :tag: Basic + +.. displayitem:: + :header: Communication between Flow and Works + :description: Learn more about how components communicate. + :col_css: col-md-4 + :button_link: communication.html + :height: 180 + :tag: Intermediate + +.. displayitem:: + :header: Customize Flow compute resources + :description: Learn more about Flow customizations. + :col_css: col-md-4 + :button_link: compute_content.html + :height: 180 + :tag: Intermediate + +.. displayitem:: + :header: Dynamically create, execute and stop Work + :description: Learn more about components creation. + :col_css: col-md-4 + :button_link: dynamic_work.html + :height: 180 + :tag: Intermediate + +.. displayitem:: + :header: Sharing My Components (Intermediate) + :description: Learn more about component composition and nesting. + :col_css: col-md-4 + :button_link: ../../glossary/sharing_components.html + :height: 180 + :tag: Intermediate + +.. raw:: html + +
+
+ +---- + +***************** +Lightning App API +***************** + +.. raw:: html + +
+
+ +.. displayitem:: + :header: LightningApp API + :description: Look into the Lightning API reference. + :col_css: col-md-4 + :button_link: lightning_app.html + :height: 180 + +.. raw:: html + +
+
diff --git a/docs/source-app/core_api/lightning_app/lightning_app.rst b/docs/source-app/core_api/lightning_app/lightning_app.rst new file mode 100644 index 0000000..af95926 --- /dev/null +++ b/docs/source-app/core_api/lightning_app/lightning_app.rst @@ -0,0 +1,12 @@ +:orphan: + +.. _lightning_app: + +############ +LightningApp +############ + + +.. autoclass:: lightning.app.core.app.LightningApp + :exclude-members: _run, connect, get_component_by_name, maybe_apply_changes, set_state + :noindex: diff --git a/docs/source-app/core_api/lightning_flow.rst b/docs/source-app/core_api/lightning_flow.rst new file mode 100644 index 0000000..642112a --- /dev/null +++ b/docs/source-app/core_api/lightning_flow.rst @@ -0,0 +1,8 @@ +.. _lightning_flow: + +############# +LightningFlow +############# + +.. autoclass:: lightning.app.core.flow.LightningFlow + :exclude-members: _attach_backend, _exit, _is_state_attribute, set_state diff --git a/docs/source-app/core_api/lightning_work/compute.rst b/docs/source-app/core_api/lightning_work/compute.rst new file mode 100644 index 0000000..89313c4 --- /dev/null +++ b/docs/source-app/core_api/lightning_work/compute.rst @@ -0,0 +1,15 @@ +:orphan: + +.. _cloud_compute: + +############################ +Customize your Cloud Compute +############################ + +**Audience:** Users who want to select the hardware to run in the cloud. + +**Level:** Intermediate + +---- + +.. 
include:: compute_content.rst diff --git a/docs/source-app/core_api/lightning_work/compute_content.rst b/docs/source-app/core_api/lightning_work/compute_content.rst new file mode 100644 index 0000000..1ca6442 --- /dev/null +++ b/docs/source-app/core_api/lightning_work/compute_content.rst @@ -0,0 +1,94 @@ + +*************************** +Customize my Work resources +*************************** + +In the cloud, you can simply configure which machine to run on by passing +a :class:`~lightning.app.utilities.packaging.cloud_compute.CloudCompute` to your work ``__init__`` method: + +.. code-block:: python + + import lightning as L + + # Run on a free, shared CPU machine. This is the default for every LightningWork. + MyCustomWork(cloud_compute=L.CloudCompute()) + + # Run on a dedicated, medium-size CPU machine (see specs below) + MyCustomWork(cloud_compute=L.CloudCompute("cpu-medium")) + + # Run on a cheap GPU machine with a single GPU (see specs below) + MyCustomWork(cloud_compute=L.CloudCompute("gpu")) + + # Run on a fast multi-GPU machine (see specs below) + MyCustomWork(cloud_compute=L.CloudCompute("gpu-fast-multi")) + +.. warning:: + Custom base images are not supported with the default CPU cloud compute. For example: + + .. code-block:: py + + class MyWork(LightningWork): + def __init__(self): + super().__init__(cloud_build_config=BuildConfig(image="my-custom-image")) # no cloud compute, for example default work + + +Here is the full list of supported machine names: + +.. list-table:: Hardware by Accelerator Type + :widths: 25 25 25 25 + :header-rows: 1 + + * - Name + - # of CPUs + - GPUs + - Memory + * - default + - 1 + - 0 + - 4 GB + * - cpu-small + - 2 + - 0 + - 8 GB + * - cpu-medium + - 8 + - 0 + - 32 GB + * - gpu + - 4 + - 1 (T4, 16 GB) + - 16 GB + * - gpu-fast + - 8 + - 1 (V100, 16 GB) + - 61 GB + * - gpu-fast-multi + - 32 + - 4 (V100, 16 GB) + - 244 GB + +The up-to-date prices for these instances can be found `here `_. 
+ +---- + +********************** +Stop my work when idle +********************** + +By providing **idle_timeout=X Seconds**, the work is automatically stopped **X seconds** after doing nothing. + +.. code-block:: python + + import lightning as L + + # Run on a single GPU and turn down immediately when idle. + MyCustomWork(cloud_compute=L.CloudCompute("gpu", idle_timeout=0)) + +---- + +************ +CloudCompute +************ + +.. autoclass:: lightning.app.utilities.packaging.cloud_compute.CloudCompute + :noindex: diff --git a/docs/source-app/core_api/lightning_work/handling_app_exception.rst b/docs/source-app/core_api/lightning_work/handling_app_exception.rst new file mode 100644 index 0000000..20c9b61 --- /dev/null +++ b/docs/source-app/core_api/lightning_work/handling_app_exception.rst @@ -0,0 +1,13 @@ +:orphan: + +############################### +Handle Lightning App exceptions +############################### + +**Audience:** Users who want to make Lightning Apps more robust to potential issues. + +**Level:** Advanced + +---- + +.. include:: handling_app_exception_content.rst diff --git a/docs/source-app/core_api/lightning_work/handling_app_exception_content.rst b/docs/source-app/core_api/lightning_work/handling_app_exception_content.rst new file mode 100644 index 0000000..4840cf5 --- /dev/null +++ b/docs/source-app/core_api/lightning_work/handling_app_exception_content.rst @@ -0,0 +1,74 @@ + +*************************************************** +What handling Lightning App exceptions does for you +*************************************************** + +Imagine you are creating a Lightning App (App) where your team can launch model training by providing their own GitHub repo any time they want. + +As the App admin, you don't want the App to go down if their code has a bug and breaks. + +Instead, you would like the LightningWork (Work) to capture the exception and present the issue to users. 
+ +---- + +**************************** +Configure exception handling +**************************** + +The LightningWork (Work) accepts an argument **raise_exception** which is **True** by default. This aligns with Python default behaviors. + +However, for the use case stated in the previous section, we want to capture the Work exceptions. This is done by providing ``raise_exception=False`` to the work ``__init__`` method. + +.. code-block:: python + + import lightning as L + + MyCustomWork(raise_exception=False) # <== HERE: The exception is captured. + + # Default behavior + MyCustomWork(raise_exception=True) # <== HERE: The exception is raised within the flow and terminates the app + + +And you can customize this behavior by overriding the ``on_exception`` hook of the Work. + +.. code-block:: python + + import lightning as L + + class MyCustomWork(L.LightningWork): + + def on_exception(self, exception: Exception): + # do something when an exception is triggered. + +---- + +************************** +Exception handling example +************************** + +This is the pseudo-code for the application described above. + +.. code-block:: python + + import lightning as L + + class RootFlow(L.LightningFlow): + def __init__(self): + super().__init__() + self.user_jobs = L.structures.Dict() + self.requested_jobs = [] + + def run(self): + for request in self.requested_jobs: + job_id = request["id"] + if job_id not in self.user_jobs: + # Note: The `GithubRepoLauncher` doesn't exist yet. + self.user_jobs[job_id] = GithubRepoLauncher( + **request, + raise_exception=False, # <== HERE: The exception is captured. + ) + self.user_jobs[job_id].run() + + if self.user_jobs[job_id].status.stage == "failed" and "printed" not in request: + print(self.user_jobs[job_id].status) # <== HERE: Print the user exception. 
+ request["printed"] = True diff --git a/docs/source-app/core_api/lightning_work/index.rst b/docs/source-app/core_api/lightning_work/index.rst new file mode 100644 index 0000000..0b660f2 --- /dev/null +++ b/docs/source-app/core_api/lightning_work/index.rst @@ -0,0 +1,112 @@ +############## +Lightning Work +############## + +**Audience:** Users who want to know how Lightning Work works under the hood 🤯. + +---- + +******************* +Peek under the hood +******************* + + +.. raw:: html + +
+
+ +.. displayitem:: + :header: To Cache or Not to Cache Calls + :description: Learn more about work execution and internal caching. + :col_css: col-md-4 + :button_link: ../../workflows/run_work_once.html + :height: 180 + :tag: Basic + +.. displayitem:: + :header: Parallel Work + :description: Learn more about work parallelization. + :col_css: col-md-4 + :button_link: ../../workflows/run_work_in_parallel.html + :height: 180 + :tag: Basic + +.. displayitem:: + :header: Sharing files between works + :description: Learn more about data transfer works. + :col_css: col-md-4 + :button_link: ../../glossary/storage/storage.html + :height: 180 + :tag: Intermediate + +.. displayitem:: + :header: Sharing Python Objects between works + :description: Learn more about sharing objects. + :col_css: col-md-4 + :button_link: payload.html + :height: 180 + :tag: Intermediate + +.. displayitem:: + :header: Checking Work Status + :description: Learn more about work status. + :col_css: col-md-4 + :button_link: status.html + :height: 180 + :tag: Advanced + +.. displayitem:: + :header: Handling App Exceptions + :description: Learn more about exception capturing. + :col_css: col-md-4 + :button_link: handling_app_exception.html + :height: 180 + :tag: Advanced + +.. raw:: html + +
+
+ +.. raw:: html + +
+
+ +.. displayitem:: + :header: Customize your Cloud Compute + :description: Learn more about changing hardware and requirements. + :col_css: col-md-4 + :button_link: compute.html + :height: 180 + :tag: Cloud + +.. raw:: html + +
+
+ + +---- + +****************** +Lightning Work API +****************** + +.. raw:: html + +
+
+ +.. displayitem:: + :header: LightningWork API + :description: Look into the Lightning API reference. + :col_css: col-md-4 + :button_link: lightning_work.html + :height: 180 + +.. raw:: html + +
+
diff --git a/docs/source-app/core_api/lightning_work/lightning_work.rst b/docs/source-app/core_api/lightning_work/lightning_work.rst new file mode 100644 index 0000000..54c7328 --- /dev/null +++ b/docs/source-app/core_api/lightning_work/lightning_work.rst @@ -0,0 +1,11 @@ +:orphan: + +.. _lightning_work: + +############# +LightningWork +############# + +.. autoclass:: lightning.app.core.work.LightningWork + :exclude-members: _aggregate_status_timeout, _is_state_attribute, set_state + :noindex: diff --git a/docs/source-app/core_api/lightning_work/payload.rst b/docs/source-app/core_api/lightning_work/payload.rst new file mode 100644 index 0000000..b23bf7c --- /dev/null +++ b/docs/source-app/core_api/lightning_work/payload.rst @@ -0,0 +1,15 @@ +:orphan: + +###################################### +Sharing Objects between LightningWorks +###################################### + +**Audience:** Users who want to know how to transfer Python objects between their LightningWorks. + +**Level:** Advanced + +**Prerequisite**: Reach Level 16+, know about the `pandas DataFrames `_ and read the `Access app state guide <../../access_app_state.html>`_. + +---- + +.. include:: payload_content.rst diff --git a/docs/source-app/core_api/lightning_work/payload_content.rst b/docs/source-app/core_api/lightning_work/payload_content.rst new file mode 100644 index 0000000..780f398 --- /dev/null +++ b/docs/source-app/core_api/lightning_work/payload_content.rst @@ -0,0 +1,75 @@ + +************************************** +What transferring objects does for you +************************************** + +Imagine your application is processing some data using `pandas DataFrame `_ and you want to pass that data to another LightningWork (Work). This is what the **Payload API** is meant for. 
+ +---- + +************************* +Use the Lightning Payload +************************* + +The Payload enables non JSON-serializable attribute objects to be part of your Work's state and to be communicated to other Works. + +Here is an example: + +.. code-block:: python + + import lightning as L + import pandas as pd + + + class SourceWork(L.LightningWork): + def __init__(self): + super().__init__() + self.df = None + + def run(self): + # do some processing + + df = pd.DataFrame(data={"col1": [1, 2], "col2": [3, 4]}) + + # The object you care about needs to be wrapped into a Payload object. + self.df = L.storage.Payload(df) + + # You can access the original object from the payload using its value property. + print("src", self.df.value) + # src col1 col2 + # 0 1 3 + # 1 2 4 + +Once the Payload object is attached to your Work's state, it can be passed to another work using the LightningFlow (Flow) as follows: + +.. code-block:: python + + import lightning as L + import pandas as pd + + + class DestinationWork(L.LightningWork): + def run(self, df: L.storage.Payload): + # You can access the original object from the payload using its value property. + print("dst", df.value) + # dst col1 col2 + # 0 1 3 + # 1 2 4 + + + class Flow(L.LightningFlow): + def __init__(self): + super().__init__() + self.src = SourceWork() + self.dst = DestinationWork() + + def run(self): + self.src.run() + # The pandas DataFrame created by the ``SourceWork`` + # is passed to the ``DestinationWork``. + # Internally, Lightning pickles and unpickles the Python object, + # so you receive a copy of the original object. 
+ self.dst.run(df=self.src.df) + + + app = L.LightningApp(Flow()) diff --git a/docs/source-app/core_api/lightning_work/status.rst b/docs/source-app/core_api/lightning_work/status.rst new file mode 100644 index 0000000..af3a27a --- /dev/null +++ b/docs/source-app/core_api/lightning_work/status.rst @@ -0,0 +1,13 @@ +:orphan: + +#################### +LightningWork Status +#################### + +**Audience:** Users who want to understand ``LightningWork`` under the hood. + +**Level:** Advanced + +---- + +.. include:: status_content.rst diff --git a/docs/source-app/core_api/lightning_work/status_content.rst b/docs/source-app/core_api/lightning_work/status_content.rst new file mode 100644 index 0000000..bb1f2f0 --- /dev/null +++ b/docs/source-app/core_api/lightning_work/status_content.rst @@ -0,0 +1,197 @@ + +************************************* +Everything about LightningWork Status +************************************* + +Statuses indicate transition points in the life of a LightningWork (Work) and contain metadata. + +The different stages are: + +.. code-block:: python + + class WorkStageStatus: + NOT_STARTED = "not_started" + STOPPED = "stopped" + PENDING = "pending" + RUNNING = "running" + SUCCEEDED = "succeeded" + FAILED = "failed" + +And a single status is as follows: + +.. code-block:: python + + @dataclass + class WorkStatus: + stage: WorkStageStatus + timestamp: float + reason: Optional[str] = None + message: Optional[str] = None + count: int = 1 + + +On creation, the Work's status flags all evaluate to ``False`` (in particular ``has_started``) and when calling ``work.run`` in your Lightning Flow (Flow), +the Work transitions from ``is_pending`` to ``is_running`` and then to ``has_succeeded`` if everything went well or ``has_failed`` otherwise. + +.. 
code-block:: python + + from time import sleep + import lightning as L + + + class Work(L.LightningWork): + def run(self, value: int): + sleep(1) + if value == 0: + return + raise Exception(f"The provided value was {value}") + + + class Flow(L.LightningFlow): + def __init__(self): + super().__init__() + self.work = Work(raise_exception=False) + self.counter = 0 + + def run(self): + if not self.work.has_started: + print("NOT STARTED") + + elif self.work.is_pending: + print("PENDING") + + elif self.work.is_running: + print("RUNNING") + + elif self.work.has_succeeded: + print("SUCCESS") + + elif self.work.has_failed: + print("FAILED") + + elif self.work.has_stopped: + print("STOPPED") + self.stop() + + print(self.work.status) + self.work.run(self.counter) + self.counter += 1 + + + app = L.LightningApp(Flow()) + +Run this app as follows: + +.. code-block:: bash + + lightning run app test.py > app_log.txt + +And here is the expected output inside ``app_log.txt`` and as expected, +we are observing the following transition ``has_started``, ``is_pending``, ``is_running``, ``has_succeeded``, ``is_running`` and ``has_failed`` + +.. code-block:: console + + NOT STARTED + WorkStatus(stage='not_started', timestamp=1653498225.18468, reason=None, message=None, count=1) + PENDING + WorkStatus(stage='pending', timestamp=1653498225.217413, reason=None, message=None, count=1) + PENDING + WorkStatus(stage='pending', timestamp=1653498225.217413, reason=None, message=None, count=1) + PENDING + ... + PENDING + WorkStatus(stage='pending', timestamp=1653498225.217413, reason=None, message=None, count=1) + PENDING + WorkStatus(stage='pending', timestamp=1653498225.217413, reason=None, message=None, count=1) + RUNNING + WorkStatus(stage='running', timestamp=1653498228.825194, reason=None, message=None, count=1) + ... 
+ SUCCESS + WorkStatus(stage='succeeded', timestamp=1653498229.831793, reason=None, message=None, count=1) + SUCCESS + WorkStatus(stage='succeeded', timestamp=1653498229.831793, reason=None, message=None, count=1) + SUCCESS + WorkStatus(stage='succeeded', timestamp=1653498229.831793, reason=None, message=None, count=1) + RUNNING + WorkStatus(stage='running', timestamp=1653498229.846451, reason=None, message=None, count=1) + RUNNING + ... + WorkStatus(stage='running', timestamp=1653498229.846451, reason=None, message=None, count=1) + RUNNING + WorkStatus(stage='running', timestamp=1653498229.846451, reason=None, message=None, count=1) + FAILED + WorkStatus(stage='failed', timestamp=1653498230.852565, reason='user_exception', message='The provided value was 1', count=1) + FAILED + WorkStatus(stage='failed', timestamp=1653498230.852565, reason='user_exception', message='The provided value was 1', count=1) + FAILED + WorkStatus(stage='failed', timestamp=1653498230.852565, reason='user_exception', message='The provided value was 1', count=1) + FAILED + WorkStatus(stage='failed', timestamp=1653498230.852565, reason='user_exception', message='The provided value was 1', count=1) + ... + +To access the full history of the Work's statuses, use its ``statuses`` attribute: + +.. code-block:: python + + from time import sleep + import lightning as L + + + class Work(L.LightningWork): + def run(self, value: int): + sleep(1) + if value == 0: + return + raise Exception(f"The provided value was {value}") + + + class Flow(L.LightningFlow): + def __init__(self): + super().__init__() + self.work = Work(raise_exception=False) + self.counter = 0 + + def run(self): + print(self.work.statuses) + self.work.run(self.counter) + self.counter += 1 + + + app = L.LightningApp(Flow()) + + +Run this app as follows: + +.. code-block:: bash + + lightning run app test.py > app_log.txt + +And here is the expected output inside ``app_log.txt``: + + +.. 
code-block:: console + + # First execution with value = 0 + + [] + [WorkStatus(stage='pending', timestamp=1653498622.252016, reason=None, message=None, count=1)] + ... + [WorkStatus(stage='pending', timestamp=1653498622.252016, reason=None, message=None, count=1)] + [WorkStatus(stage='pending', timestamp=1653498622.252016, reason=None, message=None, count=1)] + [WorkStatus(stage='pending', timestamp=1653498622.252016, reason=None, message=None, count=1), WorkStatus(stage='running', timestamp=1653498626.185683, reason=None, message=None, count=1)] + [WorkStatus(stage='pending', timestamp=1653498622.252016, reason=None, message=None, count=1), WorkStatus(stage='running', timestamp=1653498626.185683, reason=None, message=None, count=1)] + ... + [WorkStatus(stage='pending', timestamp=1653498622.252016, reason=None, message=None, count=1), WorkStatus(stage='running', timestamp=1653498626.185683, reason=None, message=None, count=1)] + [WorkStatus(stage='pending', timestamp=1653498622.252016, reason=None, message=None, count=1), WorkStatus(stage='running', timestamp=1653498626.185683, reason=None, message=None, count=1)] + [WorkStatus(stage='pending', timestamp=1653498622.252016, reason=None, message=None, count=1), WorkStatus(stage='running', timestamp=1653498626.185683, reason=None, message=None, count=1), WorkStatus(stage='succeeded', timestamp=1653498627.191053, reason=None, message=None, count=1)] + [WorkStatus(stage='pending', timestamp=1653498622.252016, reason=None, message=None, count=1), WorkStatus(stage='running', timestamp=1653498626.185683, reason=None, message=None, count=1), WorkStatus(stage='succeeded', timestamp=1653498627.191053, reason=None, message=None, count=1)] + [WorkStatus(stage='pending', timestamp=1653498622.252016, reason=None, message=None, count=1), WorkStatus(stage='running', timestamp=1653498626.185683, reason=None, message=None, count=1), WorkStatus(stage='succeeded', timestamp=1653498627.191053, reason=None, message=None, count=1)] + + # 
Second execution with value = 1 + + [WorkStatus(stage='pending', timestamp=1653498627.204636, reason=None, message=None, count=1), WorkStatus(stage='running', timestamp=1653498627.205509, reason=None, message=None, count=1)] + [WorkStatus(stage='pending', timestamp=1653498627.204636, reason=None, message=None, count=1), WorkStatus(stage='running', timestamp=1653498627.205509, reason=None, message=None, count=1)] + ... + [WorkStatus(stage='pending', timestamp=1653498627.204636, reason=None, message=None, count=1), WorkStatus(stage='running', timestamp=1653498627.205509, reason=None, message=None, count=1)] + [WorkStatus(stage='pending', timestamp=1653498627.204636, reason=None, message=None, count=1), WorkStatus(stage='running', timestamp=1653498627.205509, reason=None, message=None, count=1), WorkStatus(stage='running', timestamp=1653498627.205509, reason=None, message=None, count=1), WorkStatus(stage='failed', timestamp=1653498628.210164, reason='user_exception', message='The provided value was 1', count=1)] + [WorkStatus(stage='pending', timestamp=1653498627.204636, reason=None, message=None, count=1), WorkStatus(stage='running', timestamp=1653498627.205509, reason=None, message=None, count=1), WorkStatus(stage='running', timestamp=1653498627.205509, reason=None, message=None, count=1), WorkStatus(stage='failed', timestamp=1653498628.210164, reason='user_exception', message='The provided value was 1', count=1)] diff --git a/docs/source-app/core_api/overview.rst b/docs/source-app/core_api/overview.rst new file mode 100644 index 0000000..594433a --- /dev/null +++ b/docs/source-app/core_api/overview.rst @@ -0,0 +1,40 @@ +:orphan: + +.. _core_api: + +############################### +Learn more about Lightning Core +############################### + +.. raw:: html + +
+
+ +.. displayitem:: + :header: Level-up with Lightning Apps + :description: From Basics to Advanced Skills + :col_css: col-md-6 + :button_link: ../levels/basic/index.html + :height: 180 + +.. displayitem:: + :header: Understand Lightning App + :description: Detailed description + :col_css: col-md-6 + :button_link: lightning_app/index.html + :height: 180 + +.. displayitem:: + :header: Understand Lightning Flow + :description: Detailed description + :col_css: col-md-6 + :button_link: lightning_flow.html + :height: 180 + +.. displayitem:: + :header: Understand Lightning Work + :description: Detailed description + :col_css: col-md-6 + :button_link: lightning_work/index.html + :height: 180 diff --git a/docs/source-app/examples/dag/dag.rst b/docs/source-app/examples/dag/dag.rst new file mode 100644 index 0000000..0df028e --- /dev/null +++ b/docs/source-app/examples/dag/dag.rst @@ -0,0 +1,81 @@ +:orphan: + +###################################### +Develop a Directed Acyclic Graph (DAG) +###################################### + +.. _dag_example: + +**Audience:** Users coming from MLOps to Lightning Apps, looking for more flexibility. + +A typical ML training workflow can be implemented with a simple DAG. + +Below is a pseudo-code using the lightning framework that uses a LightningFlow to orchestrate the serial workflow: process data, train a model, and serve the model. + +.. code-block:: python + + import lightning as L + + class DAGFlow(L.LightningFlow): + + def __init__(self): + super().__init__() + self.processor = DataProcessorWork(...) + self.train_work = TrainingWork(...) + self.serve_work = ServeWork(...) + + def run(self): + self.processor.run(...) + self.train_work.run(...) + self.serve_work.run(...) + +Below is a pseudo-code to run several works in parallel using a built-in :class:`~lightning.app.structures.Dict`. + +.. code-block:: python + + import lightning as L + + class DAGFlow(L.LightningFlow): + + def __init__(self): + super().__init__() + ... 
+ self.train_works = L.structures.Dict(**{ + "1": TrainingWork(..., parallel=True), + "2": TrainingWork(..., parallel=True), + "3": TrainingWork(..., parallel=True), + ... + }) + ... + + def run(self): + self.processor.run(...) + + # The flow runs through them all, so we need to guard self.serve_work.run + for work in self.train_works.values(): + work.run(...) + + # Wait for all to have finished without errors. + if not all(w.has_succeeded for w in self.train_works.values()): + return + + self.serve_work.run(...) + +---- + +********** +Next Steps +********** + +.. raw:: html + +
+
+ +.. displayitem:: + :header: Scheduled DAG with pandas and sklearn from scratch. + :description: DAG example in pure Lightning. + :col_css: col-md-4 + :button_link: dag_from_scratch.html + :height: 180 + :tag: intermediate diff --git a/docs/source-app/examples/dag/dag_from_scratch.rst b/docs/source-app/examples/dag/dag_from_scratch.rst new file mode 100644 index 0000000..ac843ab --- /dev/null +++ b/docs/source-app/examples/dag/dag_from_scratch.rst @@ -0,0 +1,53 @@ +:orphan: + +################################################### +Scheduled DAG with pandas and sklearn from scratch. +################################################### + +**Audience:** Users coming from MLOps to Lightning Apps, looking for more flexibility. + +**Level:** Intermediate. + +In this example, you will learn how to create a simple DAG which: + +* Downloads and processes some data +* Trains several models and reports their associated metrics + +and learn how to schedule this entire process. + +Find the complete example `here `_. + +---- + +************************** +Step 1: Implement your DAG +************************** + +Here is an illustration of the DAG to implement: + +.. figure:: https://pl-public-data.s3.amazonaws.com/assets_lightning/simple_dag.png + :alt: Simple DAG + :width: 100 % + +First, let's define the components we need: + +* DataCollector is responsible for downloading the data +* Processing is responsible for executing a ``processing.py`` script. +* A collection of model works to train all models in parallel. + +.. literalinclude:: ../../../../examples/app/dag/app.py + :lines: 53-75 + +And its run method executes the steps described above. + +.. literalinclude:: ../../../../examples/app/dag/app.py + :lines: 77-100 + +---- + +***************************** +Step 2: Define the scheduling +***************************** + +.. 
literalinclude:: ../../../../examples/app/dag/app.py + :lines: 103-131 diff --git a/docs/source-app/examples/data_explore_app.rst b/docs/source-app/examples/data_explore_app.rst new file mode 100644 index 0000000..cd7011a --- /dev/null +++ b/docs/source-app/examples/data_explore_app.rst @@ -0,0 +1,5 @@ +:orphan: + +########################## +Build a Data Exploring App +########################## diff --git a/docs/source-app/examples/etl_app.rst b/docs/source-app/examples/etl_app.rst new file mode 100644 index 0000000..5b494e9 --- /dev/null +++ b/docs/source-app/examples/etl_app.rst @@ -0,0 +1,5 @@ +:orphan: + +############### +Build a ETL App +############### diff --git a/docs/source-app/examples/file_server/app.py b/docs/source-app/examples/file_server/app.py new file mode 100644 index 0000000..3afba48 --- /dev/null +++ b/docs/source-app/examples/file_server/app.py @@ -0,0 +1,241 @@ +import json +import os +import tarfile +import uuid +import zipfile +from pathlib import Path + +import lightning as L +from lightning.app.storage import Drive + + +class FileServer(L.LightningWork): + def __init__( + self, + drive: Drive, + base_dir: str = "file_server", + chunk_size=10240, + **kwargs + ): + """This component uploads, downloads files to your application. + + Arguments: + drive: The drive can share data inside your application. + base_dir: The local directory where the data will be stored. + chunk_size: The quantity of bytes to download/upload at once. + """ + super().__init__( + cloud_build_config=L.BuildConfig(["flask, flask-cors"]), + parallel=True, + **kwargs, + ) + # 1: Attach the arguments to the state. + self.drive = drive + self.base_dir = base_dir + self.chunk_size = chunk_size + + # 2: Create a folder to store the data. + os.makedirs(self.base_dir, exist_ok=True) + + # 3: Keep a reference to the uploaded filenames. 
+ self.uploaded_files = dict() + + def get_filepath(self, path: str) -> str: + """Returns file path stored on the file server.""" + return os.path.join(self.base_dir, path) + + def get_random_filename(self) -> str: + """Returns a random hash for the file name.""" + return uuid.uuid4().hex + + def upload_file(self, file): + """Upload a file while tracking its progress.""" + # 1: Track metadata about the file + filename = file.filename + uploaded_file = self.get_random_filename() + meta_file = uploaded_file + ".meta" + self.uploaded_files[filename] = { + "progress": (0, None), "done": False + } + + # 2: Create a stream and write bytes of + # the file to the disk under `uploaded_file` path. + with open(self.get_filepath(uploaded_file), "wb") as out_file: + content = file.read(self.chunk_size) + while content: + # 2.1 Write the file bytes + size = out_file.write(content) + + # 2.2 Update the progress metadata + self.uploaded_files[filename]["progress"] = ( + self.uploaded_files[filename]["progress"][0] + size, + None, + ) + # 4: Read next chunk of data + content = file.read(self.chunk_size) + + # 3: Update metadata that the file has been uploaded. + full_size = self.uploaded_files[filename]["progress"][0] + self.drive.put(self.get_filepath(uploaded_file)) + self.uploaded_files[filename] = { + "progress": (full_size, full_size), + "done": True, + "uploaded_file": uploaded_file, + } + + # 4: Write down the metadata about the file to the disk + meta = { + "original_path": filename, + "display_name": os.path.splitext(filename)[0], + "size": full_size, + "drive_path": uploaded_file, + } + with open(self.get_filepath(meta_file), "w") as f: + json.dump(meta, f) + + # 5: Put the file to the drive. + # It means other components can access get or list them. + self.drive.put(self.get_filepath(meta_file)) + return meta + + def list_files(self, file_path: str): + # 1: Get the local file path of the file server. 
+ file_path = self.get_filepath(file_path) + + # 2: If the file exists in the drive, transfer it locally. + if not os.path.exists(file_path): + self.drive.get(file_path) + + if os.path.isdir(file_path): + result = set() + for _, _, f in os.walk(file_path): + for file in f: + if not file.endswith(".meta"): + for filename, meta in self.uploaded_files.items(): + if meta["uploaded_file"] == file: + result.add(filename) + return {"asset_names": [v for v in result]} + + # 3: If the filepath is a tar or zip file, list their contents + if zipfile.is_zipfile(file_path): + with zipfile.ZipFile(file_path, "r") as zf: + result = zf.namelist() + elif tarfile.is_tarfile(file_path): + with tarfile.TarFile(file_path, "r") as tf: + result = tf.getnames() + else: + raise ValueError("Cannot open archive file!") + + # 4: Returns the matching files. + return {"asset_names": result} + + def run(self): + # 1: Imports flask requirements. + from flask import Flask, request + from flask_cors import CORS + + # 2: Create a flask app + flask_app = Flask(__name__) + CORS(flask_app) + + # 3: Define the upload file endpoint + @flask_app.post("/upload_file/") + def upload_file(): + """Upload a file directly as form data.""" + f = request.files["file"] + return self.upload_file(f) + + @flask_app.get("/") + def list_files(): + return self.list_files(str(Path(self.base_dir).resolve())) + + # 5: Start the flask app while providing the `host` and `port`. 
+ flask_app.run(host=self.host, port=self.port, load_dotenv=False) + + def alive(self): + """Hack: Returns whether the server is alive.""" + return self.url != "" + + +import requests + +from lightning import LightningWork + + +class TestFileServer(LightningWork): + def __init__(self, drive: Drive): + super().__init__(cache_calls=True) + self.drive = drive + + def run(self, file_server_url: str, first=True): + if first: + with open("test.txt", "w") as f: + f.write("Some text.") + + response = requests.post( + file_server_url + "/upload_file/", + files={'file': open("test.txt", 'rb')} + ) + assert response.status_code == 200 + else: + response = requests.get(file_server_url) + assert response.status_code == 200 + assert response.json() == {"asset_names": ["test.txt"]} + + +from lightning import LightningApp, LightningFlow + + +class Flow(LightningFlow): + def __init__(self): + super().__init__() + # 1: Create a drive to share data between works + self.drive = Drive("lit://file_server") + # 2: Create the filer server + self.file_server = FileServer(self.drive) + # 3: Create the file ser + self.test_file_server = TestFileServer(self.drive) + + def run(self): + # 1: Start the file server. + self.file_server.run() + + # 2: Trigger the test file server work when ready. + if self.file_server.alive(): + # 3 Execute the test file server work. + self.test_file_server.run(self.file_server.url) + self.test_file_server.run(self.file_server.url, first=False) + + # 4 When both execution are successful, exit the app. + if self.test_file_server.num_successes == 2: + self.stop() + + def configure_layout(self): + # Expose the file_server component + # in the UI using its `/` endpoint. 
+ return {"name": "File Server", "content": self.file_server} + + +from lightning.app.runners import MultiProcessRuntime + + +def test_file_server(): + app = LightningApp(Flow()) + MultiProcessRuntime(app).dispatch() + + +from lightning.app.testing import run_app_in_cloud + + +def test_file_server_in_cloud(): + # You need to provide the directory containing the app file. + app_dir = "docs/source-app/examples/file_server" + with run_app_in_cloud(app_dir) as (admin_page, view_page, get_logs_fn, name): + """# 1. `admin_page` and `view_page` are playwright Page Objects. + + # Check out https://playwright.dev/python/ doc to learn more. + # You can click the UI and trigger actions. + + # 2. By calling logs = get_logs_fn(), + # you get all the logs currently on the admin page. + """ diff --git a/docs/source-app/examples/file_server/file_server.rst b/docs/source-app/examples/file_server/file_server.rst new file mode 100644 index 0000000..f9f800a --- /dev/null +++ b/docs/source-app/examples/file_server/file_server.rst @@ -0,0 +1,13 @@ +:orphan: + +.. _fileserver_example: + +##################### +Develop a File Server +##################### + +**Prerequisite**: Reach :ref:`level 16+ ` and read the :ref:`Drive article `. + +---- + +.. include:: file_server_content.rst diff --git a/docs/source-app/examples/file_server/file_server_content.rst b/docs/source-app/examples/file_server/file_server_content.rst new file mode 100644 index 0000000..e9e9017 --- /dev/null +++ b/docs/source-app/examples/file_server/file_server_content.rst @@ -0,0 +1,85 @@ + + +********* +Our Goal +********* + +Create a simple Lightning App (App) that allows users to upload files and list the uploaded files. + +---- + +************* +Completed App +************* + +Here is a recording of the final App built in this example, tested with pytest. + +.. 
video:: https://pl-public-data.s3.amazonaws.com/assets_lightning/file_server.mp4 + :poster: https://pl-public-data.s3.amazonaws.com/assets_lightning/file_server.png + :width: 600 + :class: background-video + :autoplay: + :loop: + :muted: + +---- + +********** +App Design +********** + +In order to create this App, we need to develop two components and an App: + +* A **File Server Component** that gives you the ability to download or list files shared with your App. This is particularly useful when you want to trigger an ML job but your users need to provide their own data or if the user wants to download the trained checkpoints. + +* A **Test File Server** Component to interact with the file server. + +* An App putting everything together and the App's associated pytest tests. + +---- + +******** +Tutorial +******** + +.. raw:: html + +
+
+ +.. displayitem:: + :header: Step 1: Implement the File Server general structure + :description: Put together the shape of the Component + :col_css: col-md-4 + :button_link: file_server_step_1.html + :height: 180 + :tag: Basic + +.. displayitem:: + :header: Step 2: Implement the File Server upload and list files methods + :description: Add the core functionalities to the Component + :col_css: col-md-4 + :button_link: file_server_step_2.html + :height: 180 + :tag: Basic + +.. displayitem:: + :header: Step 3: Implement a File Server Testing Component + :description: Create a Component to test the file server + :col_css: col-md-4 + :button_link: file_server_step_3.html + :height: 180 + :tag: Intermediate + +.. displayitem:: + :header: Step 4: Implement tests for the File Server component with pytest + :description: Create an App to validate the upload and list files endpoints + :col_css: col-md-4 + :button_link: file_server_step_4.html + :height: 180 + :tag: Intermediate + +.. raw:: html + +
+
diff --git a/docs/source-app/examples/file_server/file_server_step_1.rst b/docs/source-app/examples/file_server/file_server_step_1.rst new file mode 100644 index 0000000..8703a1d --- /dev/null +++ b/docs/source-app/examples/file_server/file_server_step_1.rst @@ -0,0 +1,49 @@ +:orphan: + +################################################## +Step 1: Implement the FileServer general structure +################################################## + +Let’s dive in on how to develop the component with the following code: + +.. literalinclude:: ./app.py + :lines: 1-41, 132-158 + :emphasize-lines: 16, 51- + +******** +Tutorial +******** + +.. raw:: html + +
+
+ +.. displayitem:: + :header: Step 2: Implement the File Server upload and list files methods + :description: Add the core functionalities to the Component + :col_css: col-md-4 + :button_link: file_server_step_2.html + :height: 180 + :tag: Basic + +.. displayitem:: + :header: Step 3: Implement a File Server Testing Component + :description: Create a Component to test the file server + :col_css: col-md-4 + :button_link: file_server_step_3.html + :height: 180 + :tag: Intermediate + +.. displayitem:: + :header: Step 4: Implement tests for the File Server component with pytest + :description: Create an App to validate the upload and list files endpoints + :col_css: col-md-4 + :button_link: file_server_step_4.html + :height: 180 + :tag: Intermediate + +.. raw:: html + +
+
diff --git a/docs/source-app/examples/file_server/file_server_step_2.rst b/docs/source-app/examples/file_server/file_server_step_2.rst new file mode 100644 index 0000000..8647160 --- /dev/null +++ b/docs/source-app/examples/file_server/file_server_step_2.rst @@ -0,0 +1,75 @@ +:orphan: + +################################################################ +Step 2: Implement the File Server upload and list_files methods +################################################################ + +Let's dive in on how to implement these methods. + +*************************** +Implement the upload method +*************************** + +In this method, we are creating a stream between the uploaded file and the uploaded file stored on the file server disk. + +Once the file is uploaded, we are putting the file into the :class:`~lightning.app.storage.drive.Drive`, so it becomes persistent and accessible to all Components. + +.. literalinclude:: ./app.py + :lines: 12, 51-99 + :emphasize-lines: 49 + +******************************* +Implement the list_files method +******************************* + +First, in this method, we get the file in the file server filesystem, if available in the Drive. Once done, we list the files under the provided paths and return the results. + +.. literalinclude:: ./app.py + :lines: 12, 100-130 + :emphasize-lines: 9 + + +******************* +Implement utilities +******************* + +.. literalinclude:: ./app.py + :lines: 12, 43-49 + +******** +Tutorial +******** + +.. raw:: html + +
+
+ +.. displayitem:: + :header: Step 1: Implement the File Server general structure + :description: Put together the shape of the Component + :col_css: col-md-4 + :button_link: file_server_step_1.html + :height: 180 + :tag: Basic + +.. displayitem:: + :header: Step 3: Implement a File Server Testing Component + :description: Create a Component to test the file server + :col_css: col-md-4 + :button_link: file_server_step_3.html + :height: 180 + :tag: Intermediate + +.. displayitem:: + :header: Step 4: Implement tests for the File Server component with pytest + :description: Create an App to validate the upload and list files endpoints + :col_css: col-md-4 + :button_link: file_server_step_4.html + :height: 180 + :tag: Intermediate + +.. raw:: html + +
+
diff --git a/docs/source-app/examples/file_server/file_server_step_3.rst b/docs/source-app/examples/file_server/file_server_step_3.rst new file mode 100644 index 0000000..4703ef0 --- /dev/null +++ b/docs/source-app/examples/file_server/file_server_step_3.rst @@ -0,0 +1,54 @@ +:orphan: + +################################################# +Step 3: Implement a File Server Testing Component +################################################# + +Let's dive in on how to implement a testing component for a server. + +This component needs to test two things: + +* The **/upload_file/** endpoint by creating a file and sending its content to it. + +* The **/** endpoint listing files, by validating that the previously uploaded file is present in the response. + +.. literalinclude:: ./app.py + :lines: 165-182 + +******** +Tutorial +******** + +.. raw:: html + +
+
+ +.. displayitem:: + :header: Step 1: Implement the File Server general structure + :description: Put together the shape of the Component + :col_css: col-md-4 + :button_link: file_server_step_1.html + :height: 180 + :tag: Basic + +.. displayitem:: + :header: Step 2: Implement the File Server upload and list files methods + :description: Add the core functionalities to the Component + :col_css: col-md-4 + :button_link: file_server_step_2.html + :height: 180 + :tag: Basic + +.. displayitem:: + :header: Step 4: Implement tests for the File Server component with pytest + :description: Create an App to validate the upload and list files endpoints + :col_css: col-md-4 + :button_link: file_server_step_4.html + :height: 180 + :tag: Intermediate + +.. raw:: html + +
+
diff --git a/docs/source-app/examples/file_server/file_server_step_4.rst b/docs/source-app/examples/file_server/file_server_step_4.rst new file mode 100644 index 0000000..04517df --- /dev/null +++ b/docs/source-app/examples/file_server/file_server_step_4.rst @@ -0,0 +1,127 @@ +:orphan: + +################################################################# +Step 4: Implement tests for the File Server component with pytest +################################################################# + +Let's create a simple App with our **File Server** and **File Server Test** components. + +Once the File Server is up and running, we'll execute the **test_file_server** LightningWork and when both calls are successful, we exit the App using ``self.stop()``. + +.. literalinclude:: ./app.py + :lines: 187-218 + + +Simply create a ``test.py`` file with the following code and run ``pytest test.py``: + +.. literalinclude:: ./app.py + :lines: 221-226 + +To test the App in the cloud, create a ``cloud_test.py`` file with the following code and run ``pytest cloud_test.py``. +Under the hood, we are using the end-to-end testing `playwright `_ library, so you can interact with the UI. + +.. literalinclude:: ./app.py + :lines: 229- + +---- + +******************** +Test the application +******************** + +Clone the Lightning repo and run the following command: + +.. code-block:: bash + + pytest docs/source-app/examples/file_server/app.py --capture=no -v + +---- + +******** +Tutorial +******** + +.. raw:: html + +
+
+ +.. displayitem:: + :header: Step 1: Implement the File Server general structure + :description: Put together the shape of the Component + :col_css: col-md-4 + :button_link: file_server_step_1.html + :height: 180 + :tag: Basic + +.. displayitem:: + :header: Step 2: Implement the File Server upload and list files methods + :description: Add the core functionalities to the Component + :col_css: col-md-4 + :button_link: file_server_step_2.html + :height: 180 + :tag: Basic + +.. displayitem:: + :header: Step 3: Implement a File Server Testing Component + :description: Create a Component to test the file server + :col_css: col-md-4 + :button_link: file_server_step_3.html + :height: 180 + :tag: Intermediate + +.. raw:: html + +
+
+ +---- + +****************** +Find more examples +****************** + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: Develop a DAG + :description: Create a dag pipeline + :col_css: col-md-4 + :button_link: ../dag/dag.html + :height: 150 + :tag: Intermediate + +.. displayitem:: + :header: Develop a Github Repo Script Runner + :description: Run any script on github in the cloud + :col_css: col-md-4 + :button_link: ../github_repo_runner/github_repo_runner.html + :height: 150 + :tag: Intermediate + + +.. displayitem:: + :header: Develop a HPO Sweeper + :description: Train multiple models with different parameters + :col_css: col-md-4 + :button_link: ../hpo/hpo.html + :height: 150 + :tag: Intermediate + +.. displayitem:: + :header: Develop a Model Server + :description: Serve multiple models with different parameters + :col_css: col-md-4 + :button_link: ../model_server_app/model_server_app.html + :height: 150 + :tag: Intermediate + +.. raw:: html + +
+
diff --git a/docs/source-app/examples/github_repo_runner/app.py b/docs/source-app/examples/github_repo_runner/app.py new file mode 100644 index 0000000..486055f --- /dev/null +++ b/docs/source-app/examples/github_repo_runner/app.py @@ -0,0 +1,308 @@ +import io +import os +import subprocess +import sys +from copy import deepcopy +from functools import partial +from subprocess import Popen +from typing import Dict, List, Optional + +from lightning import BuildConfig, CloudCompute, LightningApp, LightningFlow +from lightning.app import structures +from lightning.app.components import TracerPythonScript +from lightning.app.frontend import StreamlitFrontend +from lightning.app.storage import Path +from lightning.app.utilities.state import AppState + + +class GithubRepoRunner(TracerPythonScript): + def __init__( + self, + id: str, + github_repo: str, + script_path: str, + script_args: List[str], + requirements: List[str], + cloud_compute: Optional[CloudCompute] = None, + **kwargs, + ): + """The GithubRepoRunner Component clones a repo, runs a specific script with provided arguments and collect + logs. + + Arguments: + id: Identified of the component. + github_repo: The Github Repo URL to clone. + script_path: The path to the script to execute. + script_args: The arguments to be provided to the script. + requirements: The python requirements tp run the script. + cloud_compute: The object to select the cloud instance. + """ + super().__init__( + script_path=script_path, + script_args=script_args, + cloud_compute=cloud_compute, + cloud_build_config=BuildConfig(requirements=requirements), + **kwargs, + ) + self.id = id + self.github_repo = github_repo + self.logs = [] + + def run(self, *args, **kwargs): + # 1. Hack: Patch stdout so we can capture the logs. + string_io = io.StringIO() + sys.stdout = string_io + + # 2: Use git command line to clone the repo. 
+ repo_name = self.github_repo.split("/")[-1].replace(".git", "") + cwd = os.path.dirname(__file__) + subprocess.Popen( + f"git clone {self.github_repo}", cwd=cwd, shell=True).wait() + + # 3: Execute the parent run method of the TracerPythonScript class. + os.chdir(os.path.join(cwd, repo_name)) + super().run(*args, **kwargs) + + # 4: Get all the collected logs and add them to the state. + # This isn't optimal as heavy, but works for this demo purpose. + self.logs = string_io.getvalue() + string_io.close() + + def configure_layout(self): + return {"name": self.id, "content": self} + + +class PyTorchLightningGithubRepoRunner(GithubRepoRunner): + def __init__(self, *args, **kwargs): + super().__init__(*args, **kwargs) + self.best_model_path = None + self.best_model_score = None + + def configure_tracer(self): + from pytorch_lightning import Trainer + from pytorch_lightning.callbacks import Callback + + tracer = super().configure_tracer() + + class TensorboardServerLauncher(Callback): + def __init__(self, work): + # The provided `work` is the + # current ``PyTorchLightningScript`` work. + self.w = work + + def on_train_start(self, trainer, *_): + # Add `host` and `port` for tensorboard to work in the cloud. + cmd = f"tensorboard --logdir='{trainer.logger.log_dir}'" + server_args = f"--host {self.w.host} --port {self.w.port}" + Popen(cmd + " " + server_args, shell=True) + + def trainer_pre_fn(self, *args, work=None, **kwargs): + # Intercept Trainer __init__ call + # and inject a ``TensorboardServerLauncher`` component. + kwargs["callbacks"].append(TensorboardServerLauncher(work)) + return {}, args, kwargs + + # 5. Patch the `__init__` method of the Trainer + # to inject our callback with a reference to the work. + tracer.add_traced( + Trainer, "__init__", pre_fn=partial(trainer_pre_fn, work=self)) + return tracer + + def on_after_run(self, end_script_globals): + import torch + + # 1. 
Once the script has finished to execute, + # we can collect its globals and access any objects. + trainer = end_script_globals["cli"].trainer + checkpoint_callback = trainer.checkpoint_callback + lightning_module = trainer.lightning_module + + # 2. From the checkpoint_callback, + # we are accessing the best model weights + checkpoint = torch.load(checkpoint_callback.best_model_path) + + # 3. Load the best weights and torchscript the model. + lightning_module.load_state_dict(checkpoint["state_dict"]) + lightning_module.to_torchscript(f"{self.name}.pt") + + # 4. Use lightning.app.storage.Pathto create a reference to the + # torch scripted model. In the cloud with multiple machines, + # by simply passing this reference to another work, + # it triggers automatically a file transfer. + self.best_model_path = Path(f"{self.name}.pt") + + # 5. Keep track of the metrics. + self.best_model_score = float(checkpoint_callback.best_model_score) + + +class KerasGithubRepoRunner(GithubRepoRunner): + """Left to the users to implement.""" + + +class TensorflowGithubRepoRunner(GithubRepoRunner): + """Left to the users to implement.""" + + +GITHUB_REPO_RUNNERS = { + "PyTorch Lightning": PyTorchLightningGithubRepoRunner, + "Keras": KerasGithubRepoRunner, + "Tensorflow": TensorflowGithubRepoRunner, +} + + +class Flow(LightningFlow): + def __init__(self): + super().__init__() + # 1: Keep track of the requests within the state + self.requests = [] + # 2: Create a dictionary of components. + self.ws = structures.Dict() + + def run(self): + # Iterate continuously over all requests + for request_id, request in enumerate(self.requests): + self._handle_request(request_id, deepcopy(request)) + + def _handle_request(self, request_id: int, request: Dict): + # 1: Create a name and find selected framework + name = f"w_{request_id}" + ml_framework = request["train"].pop("ml_framework") + + # 2: If the component hasn't been created yet, create it. 
+ if name not in self.ws: + work_cls = GITHUB_REPO_RUNNERS[ml_framework] + work = work_cls(id=request["id"], **request["train"]) + self.ws[name] = work + + # 3: Run the component + self.ws[name].run() + + # 4: Once the component has finished, + # add metadata to the original request for the UI. + if self.ws[name].best_model_path: + request = self.requests[request_id] + request["best_model_score"] = self.ws[name].best_model_score + request["best_model_path"] = self.ws[name].best_model_path + + def configure_layout(self): + # Create a StreamLit UI for the user to run his Github Repo. + return StreamlitFrontend(render_fn=render_fn) + + +def page_1__create_new_run(state): + import streamlit as st + + st.markdown("# Create a new Run 🎈") + + # 1: Collect arguments from the users + id = st.text_input("Name your run", value="my_first_run") + github_repo = st.text_input( + "Enter a Github Repo URL", value="https://github.com/Lightning-AI/lightning-quick-start.git" + ) + + default_script_args = ( + "--trainer.max_epochs=5" + " --trainer.limit_train_batches=4" + " --trainer.limit_val_batches=4" + " --trainer.callbacks=ModelCheckpoint" + " --trainer.callbacks.monitor=val_acc" + ) + default_requirements = "torchvision, pytorch_lightning, jsonargparse[signatures]" + + script_path = st.text_input("Enter your script to run", value="train_script.py") + script_args = st.text_input("Enter your base script arguments", value=default_script_args) + requirements = st.text_input("Enter your requirements", value=default_requirements) + ml_framework = st.radio( + "Select your ML Training Frameworks", options=["PyTorch Lightning", "Keras", "Tensorflow"] + ) + + if ml_framework not in ("PyTorch Lightning"): + st.write(f"{ml_framework} isn't supported yet.") + return + + clicked = st.button("Submit") + + # 2: If clicked, create a new request. 
+ if clicked: + new_request = { + "id": id, + "train": { + "github_repo": github_repo, + "script_path": script_path, + "script_args": script_args.split(" "), + "requirements": requirements.split(" "), + "ml_framework": ml_framework, + }, + } + # 3: IMPORTANT: Add a new request to the state in-place. + # The flow receives the UI request and dynamically create + # and run the associated work from the request information. + state.requests = state.requests + [new_request] + + +def page_2__view_run_lists(state): + import streamlit as st + + st.markdown("# Run Lists 🎈") + # 1: Iterate through all the requests in the state. + for i, r in enumerate(state.requests): + i = str(i) + # 2: Display information such as request, logs, work state, model score. + work = state._state["structures"]["ws"]["works"][f"w_{i}"] + with st.expander(f"Expand to view Run {i}", expanded=False): + if st.checkbox("Expand to view your configuration", key=i): + st.json(r) + if st.checkbox("Expand to view logs", key=i): + st.code(body=work["vars"]["logs"]) + if st.checkbox("Expand to view your work state", key=i): + work["vars"].pop("logs") + st.json(work) + best_model_score = r.get("best_model_score", None) + if best_model_score: + if st.checkbox("Expand to view your run performance", key=i): + st.json({"best_model_score": best_model_score, "best_model_path": r.get("best_model_path")}) + + +def page_3__view_app_state(state): + import streamlit as st + + st.markdown("# App State 🎈") + st.write(state._state) + + +def render_fn(state: AppState): + import streamlit as st + + page_names_to_funcs = { + "Create a new Run": partial(page_1__create_new_run, state=state), + "View your Runs": partial(page_2__view_run_lists, state=state), + "View the App state": partial(page_3__view_app_state, state=state), + } + selected_page = st.sidebar.selectbox( + "Select a page", page_names_to_funcs.keys()) + page_names_to_funcs[selected_page]() + + +class RootFlow(LightningFlow): + def __init__(self): + 
super().__init__() + # Create the flow + self.flow = Flow() + + def run(self): + # Run the flow + self.flow.run() + + def configure_layout(self): + # 1: Add the main StreamLit UI + selection_tab = [{ + "name": "Run your Github Repo", + "content": self.flow, + }] + # 2: Add a new tab whenever a new work is dynamically created + run_tabs = [e.configure_layout() for e in self.flow.ws.values()] + # 3: Returns the list of tabs. + return selection_tab + run_tabs + + +app = LightningApp(RootFlow()) diff --git a/docs/source-app/examples/github_repo_runner/github_repo_runner.rst b/docs/source-app/examples/github_repo_runner/github_repo_runner.rst new file mode 100644 index 0000000..7e239b2 --- /dev/null +++ b/docs/source-app/examples/github_repo_runner/github_repo_runner.rst @@ -0,0 +1,15 @@ +:orphan: + +.. _github_repo_script_runner_example: + +################################### +Develop a Github Repo Script Runner +################################### + +**Audience:** Users that want to develop interactive applications which runs Github Repo in the cloud at any scale for multiple users. + +**Prerequisite**: Reach :ref:`level 16+ ` and read the docstring of of :class:`~lightning.app.components.python.tracer.TracerPythonScript` component. + +---- + +.. include:: github_repo_runner_content.rst diff --git a/docs/source-app/examples/github_repo_runner/github_repo_runner_content.rst b/docs/source-app/examples/github_repo_runner/github_repo_runner_content.rst new file mode 100644 index 0000000..2a0a3aa --- /dev/null +++ b/docs/source-app/examples/github_repo_runner/github_repo_runner_content.rst @@ -0,0 +1,97 @@ + +******** +Our Goal +******** + +Create a simple Lightning App (App) where users can enter information in a UI to run a given PyTorch Lightning Script from a given Github Repo with some optional extra Python requirements and arguments. 
+ +Users should be able to monitor their training progress in real-time, view the logs, and get the best monitored metric and associated checkpoint for their models. + +---- + +Completed App +^^^^^^^^^^^^^ + +Here is a recording of the final application built in this example. The example is around 200 lines in total and should give you a great foundation to build your own Lightning App. + +.. video:: https://pl-public-data.s3.amazonaws.com/assets_lightning/github_app.mp4 + :poster: https://pl-public-data.s3.amazonaws.com/assets_lightning/github_app.png + :width: 600 + :class: background-video + :autoplay: + :loop: + :muted: + +---- + +********** +App Design +********** + +In order to develop the App, we need to build several components: + +* A GithubRepoRunner Component that clones a repo, runs a specific script with provided arguments, and collects logs. + +* A PyTorch Lightning GithubRepoRunner Component that augments the GithubRepoRunner component to track the PyTorch Lightning Trainer. + +* A UI for users to provide the information needed to dynamically trigger a new execution. + +* A Flow to dynamically create GithubRepoRunner once a user submits information from the UI. + +---- + +******** +Tutorial +******** + +.. raw:: html + +
+
+ +.. displayitem:: + :header: Step 1: Implement the GithubRepoRunner Component + :description: Clone and execute script from a GitHub Repo. + :col_css: col-md-4 + :button_link: github_repo_runner_step_1.html + :height: 180 + :tag: Intermediate + +.. displayitem:: + :header: Step 2: Implement the PyTorch Lightning GithubRepoRunner Component + :description: Automate PyTorch Lightning execution + :col_css: col-md-4 + :button_link: github_repo_runner_step_2.html + :height: 180 + :tag: Advanced + +.. displayitem:: + :header: Step 3: Implement the Flow to manage user requests + :description: Dynamically create GithubRepoRunner + :col_css: col-md-4 + :button_link: github_repo_runner_step_3.html + :height: 180 + :tag: Intermediate + + +.. displayitem:: + :header: Step 4: Implement the UI with StreamLit + :description: Several pages application + :col_css: col-md-4 + :button_link: github_repo_runner_step_4.html + :height: 180 + :tag: Intermediate + + +.. displayitem:: + :header: Step 5: Put it all together + :description: + :col_css: col-md-4 + :button_link: github_repo_runner_step_5.html + :height: 180 + :tag: Intermediate + +.. raw:: html + +
+
diff --git a/docs/source-app/examples/github_repo_runner/github_repo_runner_step_1.rst b/docs/source-app/examples/github_repo_runner/github_repo_runner_step_1.rst new file mode 100644 index 0000000..e85ecc9 --- /dev/null +++ b/docs/source-app/examples/github_repo_runner/github_repo_runner_step_1.rst @@ -0,0 +1,62 @@ +:orphan: + +************************************************ +Step 1: Implement the GithubRepoRunner Component +************************************************ + +The GithubRepoRunner Component clones a repo, runs a specific script with provided arguments, and collects logs. + +Let's dive into how to develop the component with the following code: + +.. literalinclude:: ./app.py + :lines: -72 + +---- + +******** +Tutorial +******** + +.. raw:: html + +
+
+ +.. displayitem:: + :header: Step 2: Implement the PyTorch Lightning GithubRepoRunner Component + :description: Automate PyTorch Lightning execution + :col_css: col-md-4 + :button_link: github_repo_runner_step_2.html + :height: 180 + :tag: Advanced + +.. displayitem:: + :header: Step 3: Implement the Flow to manage user requests + :description: Dynamically create GithubRepoRunner + :col_css: col-md-4 + :button_link: github_repo_runner_step_3.html + :height: 180 + :tag: Intermediate + + +.. displayitem:: + :header: Step 4: Implement the UI with StreamLit + :description: Several pages application + :col_css: col-md-4 + :button_link: github_repo_runner_step_4.html + :height: 180 + :tag: Intermediate + + +.. displayitem:: + :header: Step 5: Put it all together + :description: + :col_css: col-md-4 + :button_link: github_repo_runner_step_5.html + :height: 180 + :tag: Intermediate + +.. raw:: html + +
+
diff --git a/docs/source-app/examples/github_repo_runner/github_repo_runner_step_2.rst b/docs/source-app/examples/github_repo_runner/github_repo_runner_step_2.rst new file mode 100644 index 0000000..deae884 --- /dev/null +++ b/docs/source-app/examples/github_repo_runner/github_repo_runner_step_2.rst @@ -0,0 +1,68 @@ +:orphan: + +****************************************************************** +Step 2: Implement the PyTorch Lightning GithubRepoRunner Component +****************************************************************** + +The PyTorch Lightning GithubRepoRunner Component subclasses the GithubRepoRunner but tailors the execution experience to PyTorch Lightning. + +As a matter of fact, this component adds two primary tailored features for PyTorch Lightning users: + +* It dynamically injects a custom callback ``TensorboardServerLauncher`` in the PyTorch Lightning Trainer to start a tensorboard server so it can be exposed in the Lightning App UI. + +* Once the script has run, the ``on_after_run`` hook of the :class:`~lightning.app.components.python.tracer.TracerPythonScript` is invoked with the script globals, meaning we can collect anything we need. In particular, we are reloading the best model, torch scripting it, and storing its path in the state alongside the best metric score. + +Let's dive into how to develop the component with the following code: + +.. literalinclude:: ./app.py + :lines: 75-136 + +---- + +******** +Tutorial +******** + +.. raw:: html + +
+
+ +.. displayitem:: + :header: Step 1: Implement the GithubRepoRunner Component + :description: Clone and execute script from a GitHub Repo. + :col_css: col-md-4 + :button_link: github_repo_runner_step_1.html + :height: 180 + :tag: Intermediate + +.. displayitem:: + :header: Step 3: Implement the Flow to manage user requests + :description: Dynamically create GithubRepoRunner + :col_css: col-md-4 + :button_link: github_repo_runner_step_3.html + :height: 180 + :tag: Intermediate + + +.. displayitem:: + :header: Step 4: Implement the UI with StreamLit + :description: Several pages application + :col_css: col-md-4 + :button_link: github_repo_runner_step_4.html + :height: 180 + :tag: Intermediate + + +.. displayitem:: + :header: Step 5: Put it all together + :description: + :col_css: col-md-4 + :button_link: github_repo_runner_step_5.html + :height: 180 + :tag: Intermediate + +.. raw:: html + +
+
diff --git a/docs/source-app/examples/github_repo_runner/github_repo_runner_step_3.rst b/docs/source-app/examples/github_repo_runner/github_repo_runner_step_3.rst new file mode 100644 index 0000000..44cf7dd --- /dev/null +++ b/docs/source-app/examples/github_repo_runner/github_repo_runner_step_3.rst @@ -0,0 +1,62 @@ +:orphan: + +************************************************** +Step 3: Implement the Flow to manage user requests +************************************************** + +In step 1 and 2, we have implemented the ``GithubRepoRunner`` and ``PyTorchLightningGithubRepoRunner`` components. + +Now, we are going to develop a component to dynamically handle user requests. +Let's dive in on how to develop the component with the following code: + +.. literalinclude:: ./app.py + :lines: 142-190 + +---- + +******** +Tutorial +******** + +.. raw:: html + +
+
+ +.. displayitem:: + :header: Step 1: Implement the GithubRepoRunner Component + :description: Clone and execute script from a GitHub Repo. + :col_css: col-md-4 + :button_link: github_repo_runner_step_1.html + :height: 180 + :tag: Intermediate + +.. displayitem:: + :header: Step 2: Implement the PyTorch Lightning GithubRepoRunner Component + :description: Automate PyTorch Lightning execution + :col_css: col-md-4 + :button_link: github_repo_runner_step_2.html + :height: 180 + :tag: Advanced + +.. displayitem:: + :header: Step 4: Implement the UI with StreamLit + :description: Several pages application + :col_css: col-md-4 + :button_link: github_repo_runner_step_4.html + :height: 180 + :tag: Intermediate + + +.. displayitem:: + :header: Step 5: Put it all together + :description: + :col_css: col-md-4 + :button_link: github_repo_runner_step_5.html + :height: 180 + :tag: Intermediate + +.. raw:: html + +
+
diff --git a/docs/source-app/examples/github_repo_runner/github_repo_runner_step_4.rst b/docs/source-app/examples/github_repo_runner/github_repo_runner_step_4.rst new file mode 100644 index 0000000..16893aa --- /dev/null +++ b/docs/source-app/examples/github_repo_runner/github_repo_runner_step_4.rst @@ -0,0 +1,86 @@ +:orphan: + +*************************************** +Step 4: Implement the UI with StreamLit +*************************************** + +In step 3, we implemented a Flow which dynamically creates a Work when a new request is added to the requests list. + +From the UI, we create 3 pages with `StreamLit `_: + +* **Page 1**: Create a form to add a new request to the Flow state **requests**. + +* **Page 2**: Iterate through all the requests and display the associated information. + +* **Page 3**: Display the entire App State. + + +Render All Pages +^^^^^^^^^^^^^^^^ + +.. literalinclude:: ./app.py + :lines: 274-284 + +**Page 1** + +.. literalinclude:: ./app.py + :lines: 193-241 + :emphasize-lines: 43 + +**Page 2** + +.. literalinclude:: ./app.py + :lines: 244-264 + +**Page 3** + +.. literalinclude:: ./app.py + :lines: 267-271 + +---- + +******** +Tutorial +******** + +.. raw:: html + +
+
+ +.. displayitem:: + :header: 1. Implement the GithubRepoRunner Component + :description: Clone and execute script from a GitHub Repo. + :col_css: col-md-4 + :button_link: github_repo_runner_step_1.html + :height: 180 + :tag: Intermediate + +.. displayitem:: + :header: 2. Implement the PyTorch Lightning GithubRepoRunner Component + :description: Automate PyTorch Lightning execution + :col_css: col-md-4 + :button_link: github_repo_runner_step_2.html + :height: 180 + :tag: Advanced + +.. displayitem:: + :header: 3. Implement the Flow to manage user requests + :description: Dynamically create GithubRepoRunner + :col_css: col-md-4 + :button_link: github_repo_runner_step_3.html + :height: 180 + :tag: Intermediate + +.. displayitem:: + :header: Step 5: Put it all together + :description: + :col_css: col-md-4 + :button_link: github_repo_runner_step_5.html + :height: 180 + :tag: Intermediate + +.. raw:: html + +
+
diff --git a/docs/source-app/examples/github_repo_runner/github_repo_runner_step_5.rst b/docs/source-app/examples/github_repo_runner/github_repo_runner_step_5.rst new file mode 100644 index 0000000..9b5b469 --- /dev/null +++ b/docs/source-app/examples/github_repo_runner/github_repo_runner_step_5.rst @@ -0,0 +1,75 @@ +:orphan: + +*************************** +Step 5: Put it all together +*************************** + +Let's put all the components together in a root flow with the following code: + +.. literalinclude:: ./app.py + :lines: 287- + +Run the application +^^^^^^^^^^^^^^^^^^^ + +Clone the Lightning repo and run the following command: + +.. code-block:: bash + + lightning run app docs/source-app/examples/github_repo_runner/app.py + +Add ``--cloud`` to run this application in the cloud. + +.. code-block:: bash + + lightning run app docs/source-app/examples/github_repo_runner/app.py --cloud + +---- + +********************** +More hands-on examples +********************** + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: Develop a DAG + :description: Create a dag pipeline + :col_css: col-md-4 + :button_link: ../dag/dag.html + :height: 150 + :tag: Intermediate + +.. displayitem:: + :header: Develop a File Server + :description: Train multiple models with different parameters + :col_css: col-md-4 + :button_link: ../file_server/file_server.html + :height: 150 + :tag: Intermediate + +.. displayitem:: + :header: Develop a HPO Sweeper + :description: Train multiple models with different parameters + :col_css: col-md-4 + :button_link: ../hpo/hpo.html + :height: 150 + :tag: Intermediate + +.. displayitem:: + :header: Develop a Model Server + :description: Serve multiple models with different parameters + :col_css: col-md-4 + :button_link: ../model_server/model_server.html + :height: 150 + :tag: Intermediate + +.. raw:: html + +
+
diff --git a/docs/source-app/examples/hands_on_example.rst b/docs/source-app/examples/hands_on_example.rst new file mode 100644 index 0000000..57fa1e5 --- /dev/null +++ b/docs/source-app/examples/hands_on_example.rst @@ -0,0 +1,50 @@ +:orphan: + +################# +Hands-on Examples +################# + +.. raw:: html + +
+
+ +.. displayitem:: + :header: Build a DAG + :description: Learn how to orchestrate workflows + :col_css: col-md-6 + :button_link: dag/dag.html + :height: 180 + +.. displayitem:: + :header: Build a File Server + :description: Learn how to upload and download files + :col_css: col-md-6 + :button_link: file_server/file_server.html + :height: 180 + +.. displayitem:: + :header: Build a Github Repo Script Runner + :description: Learn how to configure dynamic execution from the UI + :col_css: col-md-6 + :button_link: github_repo_runner/github_repo_runner.html + :height: 180 + +.. displayitem:: + :header: Build a HPO Sweeper + :description: Learn how to scale your training + :col_css: col-md-6 + :button_link: hpo/hpo.html + :height: 180 + +.. displayitem:: + :header: Build a Model Server + :description: Learn how to serve your models + :col_css: col-md-6 + :button_link: model_server_app/model_server_app.html + :height: 180 + +.. raw:: html + +
+
diff --git a/docs/source-app/examples/index.rst b/docs/source-app/examples/index.rst new file mode 100644 index 0000000..bb7e645 --- /dev/null +++ b/docs/source-app/examples/index.rst @@ -0,0 +1,36 @@ +######## +Examples +######## + +.. raw:: html + +
+
+ +.. displayitem:: + :header: Develop a DAG workflow + :description: Develop sequential, non-reactive workflows + :col_css: col-md-4 + :button_link: dag/dag.html + :height: 150 + +.. displayitem:: + :header: Develop a File Server + :description: Develop a file server + :col_css: col-md-4 + :button_link: file_server/file_server.html + :height: 150 + +.. displayitem:: + :header: Develop a Github Repo Script Runner + :description: Build an app to run a Github repo + :col_css: col-md-4 + :button_link: github_repo_runner/github_repo_runner.html + :height: 150 + +.. displayitem:: + :header: Deploy a model + :description: Learn how to deploy a model + :col_css: col-md-4 + :button_link: model_server_app/model_server_app.html + :height: 150 diff --git a/docs/source-app/examples/model_server_app/app.py b/docs/source-app/examples/model_server_app/app.py new file mode 100644 index 0000000..9985014 --- /dev/null +++ b/docs/source-app/examples/model_server_app/app.py @@ -0,0 +1,34 @@ +from locust_component import Locust +from model_server import MLServer +from train import TrainModel + +from lightning import LightningApp, LightningFlow + + +class TrainAndServe(LightningFlow): + def __init__(self): + super().__init__() + self.train_model = TrainModel() + self.model_server = MLServer( + name="mnist-svm", + implementation="mlserver_sklearn.SKLearnModel", + workers=8, + ) + self.performance_tester = Locust(num_users=100) + + def run(self): + self.train_model.run() + self.model_server.run(self.train_model.best_model_path) + if self.model_server.alive(): + # The performance tester needs the model server to be up + # and running to be started, so the URL is added in the UI. 
+ self.performance_tester.run(self.model_server.url) + + def configure_layout(self): + return [ + {"name": "Server", "content": self.model_server.url + "/docs"}, + {"name": "Server Testing", "content": self.performance_tester}, + ] + + +app = LightningApp(TrainAndServe()) diff --git a/docs/source-app/examples/model_server_app/load_testing.rst b/docs/source-app/examples/model_server_app/load_testing.rst new file mode 100644 index 0000000..97345de --- /dev/null +++ b/docs/source-app/examples/model_server_app/load_testing.rst @@ -0,0 +1,57 @@ +:orphan: + +*********************************** +3. Build the Load Testing Component +*********************************** + +Now, we are going to create a component to test the performance of your model server. + +We are going to use a Python performance testing tool called `Locust `_. + +.. literalinclude:: ./locust_component.py + + +Finally, once the component is done, we need to create a ``locustfile.py`` file which defines the format of the request to send to your model server. + +The endpoint to hit has the following format: ``/v2/models/{MODEL_NAME}/versions/{VERSION}/infer``. + +.. literalinclude:: ./locustfile.py + + +---- + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: 1. Build a Train Component + :description: Train a model and store its checkpoints with SKlearn + :col_css: col-md-4 + :button_link: train.html + :height: 150 + :tag: Intermediate + +.. displayitem:: + :header: 2. Build a Model Server Component + :description: Use MLServer to serve your models + :col_css: col-md-4 + :button_link: model_server.html + :height: 150 + :tag: Intermediate + +.. displayitem:: + :header: 4. Putting everything together. + :description: Ensemble the components together and run the app + :col_css: col-md-4 + :button_link: putting_everything_together.html + :height: 150 + :tag: basic + +.. raw:: html + +
+
diff --git a/docs/source-app/examples/model_server_app/locust_component.py b/docs/source-app/examples/model_server_app/locust_component.py new file mode 100644 index 0000000..4351506 --- /dev/null +++ b/docs/source-app/examples/model_server_app/locust_component.py @@ -0,0 +1,42 @@ +import os +import subprocess + +from lightning import BuildConfig, LightningWork + + +class Locust(LightningWork): + def __init__(self, num_users: int = 100): + """This component checks the performance of a server. The server url is passed to its run method. + + Arguments: + num_users: Number of users emulated by Locust + """ + # Note: Using the default port 8089 of Locust. + super().__init__( + port=8089, + parallel=True, + cloud_build_config=BuildConfig(requirements=["locust"]), + ) + self.num_users = num_users + + def run(self, load_tested_url: str): + # 1: Create the locust command line. + cmd = " ".join( + [ + "locust", + "--master-host", + str(self.host), + "--master-port", + str(self.port), + "--host", + str(load_tested_url), + "-u", + str(self.num_users), + ] + ) + # 2: Create another process with locust + process = subprocess.Popen(cmd, cwd=os.path.dirname(__file__), shell=True) + + # 3: Wait for the process to finish. As locust is a server, + # this waits infinitely or if killed. 
+ process.wait() diff --git a/docs/source-app/examples/model_server_app/locustfile.py b/docs/source-app/examples/model_server_app/locustfile.py new file mode 100644 index 0000000..198d6de --- /dev/null +++ b/docs/source-app/examples/model_server_app/locustfile.py @@ -0,0 +1,41 @@ +from locust import FastHttpUser, task +from sklearn import datasets +from sklearn.model_selection import train_test_split + + +class HelloWorldUser(FastHttpUser): + def __init__(self, *args, **kwargs): + super().__init__(*args, **kwargs) + self._prepare_inference_request() + + @task + def predict(self): + self.client.post( + "/v2/models/mnist-svm/versions/v0.0.1/infer", + json=self.inference_request, + ) + + def _prepare_inference_request(self): + # The digits dataset + digits = datasets.load_digits() + + # To apply a classifier on this data, + # we need to flatten the image, to + # turn the data in a (samples, feature) matrix: + n_samples = len(digits.images) + data = digits.images.reshape((n_samples, -1)) + + # Split data into train and test subsets + _, X_test, _, _ = train_test_split(data, digits.target, test_size=0.5, shuffle=False) + + x_0 = X_test[0:1] + self.inference_request = { + "inputs": [ + { + "name": "predict", + "shape": x_0.shape, + "datatype": "FP32", + "data": x_0.tolist(), + } + ] + } diff --git a/docs/source-app/examples/model_server_app/model_server.py b/docs/source-app/examples/model_server_app/model_server.py new file mode 100644 index 0000000..8562c63 --- /dev/null +++ b/docs/source-app/examples/model_server_app/model_server.py @@ -0,0 +1,88 @@ +import json +import subprocess + +from lightning import BuildConfig, LightningWork +from lightning.app.storage import Path + +# ML_SERVER_URL = https://github.com/SeldonIO/MLServer + + +class MLServer(LightningWork): + """This components uses SeldonIO MLServer library. + + The model endpoint: /v2/models/{MODEL_NAME}/versions/{VERSION}/infer. + + Arguments: + name: The name of the model for the endpoint. 
+ implementation: The model loader class. + Example: "mlserver_sklearn.SKLearnModel". + Learn more here: $ML_SERVER_URL/tree/master/runtimes + workers: Number of server worker. + """ + + def __init__( + self, + name: str, + implementation: str, + workers: int = 1, + **kwargs, + ): + super().__init__( + parallel=True, + cloud_build_config=BuildConfig( + requirements=["mlserver", "mlserver-sklearn"], + ), + **kwargs, + ) + # 1: Collect the config's. + self.settings = { + "debug": True, + "parallel_workers": workers, + } + self.model_settings = { + "name": name, + "implementation": implementation, + } + # 2: Keep track of latest version + self.version = 1 + + def run(self, model_path: Path): + """The model is downloaded when the run method is invoked. + + Arguments: + model_path: The path to the trained model. + """ + # 1: Use the host and port at runtime so it works in the cloud. + # $ML_SERVER_URL/blob/master/mlserver/settings.py#L50 + if self.version == 1: + # TODO: Reload the next version model of the model. + + self.settings.update({"host": self.host, "http_port": self.port}) + + with open("settings.json", "w") as f: + json.dump(self.settings, f) + + # 2. Store the model-settings + # $ML_SERVER_URL/blob/master/mlserver/settings.py#L120 + self.model_settings["parameters"] = { + "version": f"v0.0.{self.version}", + "uri": str(model_path.absolute()), + } + with open("model-settings.json", "w") as f: + json.dump(self.model_settings, f) + + # 3. Launch the Model Server + subprocess.Popen("mlserver start .", shell=True) + + # 4. Increment the version for the next time run is called. + self.version += 1 + + else: + # TODO: Load the next model and unload the previous one. + pass + + def alive(self): + # Current hack, when the url is available, + # the server is up and running. + # This would be cleaned out and automated. 
+ return self.url != "" diff --git a/docs/source-app/examples/model_server_app/model_server.rst b/docs/source-app/examples/model_server_app/model_server.rst new file mode 100644 index 0000000..283dc97 --- /dev/null +++ b/docs/source-app/examples/model_server_app/model_server.rst @@ -0,0 +1,48 @@ +:orphan: + +************************************* +2. Develop the Model Server Component +************************************* + +In the code below, we use `MLServer `_ which aims to provide an easy way to start serving your machine learning models through a REST and gRPC interface, +fully compliant with KFServing's V2 Dataplane spec. + +.. literalinclude:: ./model_server.py + +---- + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: 1. Develop a Train Component + :description: Train a model and store its checkpoints with SKlearn + :col_css: col-md-4 + :button_link: train.html + :height: 150 + :tag: Intermediate + +.. displayitem:: + :header: 3. Develop a Load Testing Component + :description: Use Locust to test your model servers + :col_css: col-md-4 + :button_link: load_testing.html + :height: 150 + :tag: Intermediate + +.. displayitem:: + :header: 4. Putting everything together. + :description: Ensemble the Components together and run the App + :col_css: col-md-4 + :button_link: putting_everything_together.html + :height: 150 + :tag: basic + +.. raw:: html + +
+
diff --git a/docs/source-app/examples/model_server_app/model_server_app.rst b/docs/source-app/examples/model_server_app/model_server_app.rst new file mode 100644 index 0000000..933c89d --- /dev/null +++ b/docs/source-app/examples/model_server_app/model_server_app.rst @@ -0,0 +1,15 @@ +:orphan: + +.. _model_server_example: + +###################### +Develop a Model Server +###################### + +**Audience:** Users who want to serve their trained models. + +**Prerequisite**: Reach :ref:`level 16+ `. + +---- + +.. include:: model_server_app_content.rst diff --git a/docs/source-app/examples/model_server_app/model_server_app_content.rst b/docs/source-app/examples/model_server_app/model_server_app_content.rst new file mode 100644 index 0000000..0a9280c --- /dev/null +++ b/docs/source-app/examples/model_server_app/model_server_app_content.rst @@ -0,0 +1,84 @@ + +********* +Objective +********* + +Create a simple application that trains and serves a `Sklearn `_ machine learning model with `MLServer from SeldonIO `_ + +---- + +***************** +Final Application +***************** + +Here is a gif of the final application built in this example. + +.. figure:: https://pl-public-data.s3.amazonaws.com/assets_lightning/ml_server_2.gif + +---- + +************* +System Design +************* + +In order to create such application, we need to build several components: + +* A Model Train Component that trains a model and provides its trained weights + +* A Model Server Component that serves as an API endpoint for the model generated by the **Model Train Component**. + +* A Load Testing Component that tests the model server works as expected. This could be used to CI/CD the performance of newly generated models (left to the users). + +.. figure:: https://pl-public-data.s3.amazonaws.com/assets_lightning/model_server_app_2.png + +Let's dive into the tutorial. + +---- + +******** +Tutorial +******** + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: 1. Build a Train Component + :description: Train a model and store its checkpoints with SKlearn + :col_css: col-md-4 + :button_link: train.html + :height: 150 + :tag: Intermediate + +.. displayitem:: + :header: 2. Build a Model Server Component + :description: Use MLServer to serve your models + :col_css: col-md-4 + :button_link: model_server.html + :height: 150 + :tag: Intermediate + +.. displayitem:: + :header: 3. Build a Load Testing Component + :description: Use Locust to test your model servers + :col_css: col-md-4 + :button_link: load_testing.html + :height: 150 + :tag: Intermediate + +.. displayitem:: + :header: 4. Putting everything together. + :description: Ensemble the components together and run the app + :col_css: col-md-4 + :button_link: putting_everything_together.html + :height: 150 + :tag: basic + +.. raw:: html + +
+
diff --git a/docs/source-app/examples/model_server_app/putting_everything_together.rst b/docs/source-app/examples/model_server_app/putting_everything_together.rst new file mode 100644 index 0000000..48162a9 --- /dev/null +++ b/docs/source-app/examples/model_server_app/putting_everything_together.rst @@ -0,0 +1,80 @@ +:orphan: + +****************************** +4. Putting everything together +****************************** + +In the code below, we put together the **TrainModel**, the **MLServer** and the **Locust** components in an ``app.py`` file. + +.. literalinclude:: ./app.py + + +*********** +Run the App +*********** + +To run the app, simply open a terminal and execute this command: + +.. code-block:: bash + + lightning run app docs/source-app/examples/model_server_app/app.py + +Here is a gif of the UI. + +.. figure:: https://pl-public-data.s3.amazonaws.com/assets_lightning/ml_server_2.gif + +.. raw:: html + +
+ +Congrats, you have finished the **Build a Model Server** example! + +---- + +****************** +Find more examples +****************** + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: Develop a DAG + :description: Develop a DAG pipeline + :col_css: col-md-4 + :button_link: ../dag/dag.html + :height: 150 + :tag: Intermediate + +.. displayitem:: + :header: Develop a File Server + :description: Train multiple models with different parameters + :col_css: col-md-4 + :button_link: ../file_server/file_server.html + :height: 150 + :tag: Intermediate + +.. displayitem:: + :header: Develop a Github Repo Script Runner + :description: Run code from the internet in the cloud + :col_css: col-md-4 + :button_link: ../github_repo_runner/github_repo_runner.html + :height: 150 + :tag: Intermediate + +.. displayitem:: + :header: Develop a HPO Sweeper + :description: Train multiple models with different parameters + :col_css: col-md-4 + :button_link: ../hpo/hpo.html + :height: 150 + :tag: Intermediate + +.. raw:: html + +
+
diff --git a/docs/source-app/examples/model_server_app/train.py b/docs/source-app/examples/model_server_app/train.py new file mode 100644 index 0000000..698e0d8 --- /dev/null +++ b/docs/source-app/examples/model_server_app/train.py @@ -0,0 +1,41 @@ +import joblib +from sklearn import datasets, svm +from sklearn.model_selection import train_test_split + +from lightning import LightningWork +from lightning.app.storage import Path + + +class TrainModel(LightningWork): + """This component trains a Sklearn SVC model on digits dataset.""" + + def __init__(self): + super().__init__() + # 1: Add element to the state. + self.best_model_path = None + + def run(self): + # 2: Load the Digits + digits = datasets.load_digits() + + # 3: To apply a classifier on this data, + # we need to flatten the image, to + # turn the data into a (samples, feature) matrix: + n_samples = len(digits.images) + data = digits.images.reshape((n_samples, -1)) + + # 4: Create a classifier: a support vector classifier + classifier = svm.SVC(gamma=0.001) + + # 5: Split data into train and test subsets + X_train, _, y_train, _ = train_test_split(data, digits.target, test_size=0.5, shuffle=False) + + # 6: We learn the digits on the first half of the digits + classifier.fit(X_train, y_train) + + # 7: Save the Sklearn model with `joblib`. + model_file_name = "mnist-svm.joblib" + joblib.dump(classifier, model_file_name) + + # 8: Keep a reference to the generated model. + self.best_model_path = Path("mnist-svm.joblib") diff --git a/docs/source-app/examples/model_server_app/train.rst b/docs/source-app/examples/model_server_app/train.rst new file mode 100644 index 0000000..fdb6f6a --- /dev/null +++ b/docs/source-app/examples/model_server_app/train.rst @@ -0,0 +1,49 @@ +:orphan: + +**************************** +1. Build the Train Component +**************************** + +In the code below, we create a work which trains a simple `SVC `_ model on the digits dataset (classification). 
+ +Once the model is trained, it is saved and a reference :class:`~lightning.app.storage.path.Path` to it is stored in the ``best_model_path`` state attribute. + +.. literalinclude:: ./train.py + +---- + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: 2. Build a Model Server Component + :description: Use MLServer to serve your models + :col_css: col-md-4 + :button_link: model_server.html + :height: 150 + :tag: Intermediate + +.. displayitem:: + :header: 3. Build a Load Testing Component + :description: Use Locust to test your model servers + :col_css: col-md-4 + :button_link: load_testing.html + :height: 150 + :tag: Intermediate + +.. displayitem:: + :header: 4. Putting everything together. + :description: Assemble the components and run the app + :col_css: col-md-4 + :button_link: putting_everything_together.html + :height: 150 + :tag: basic + +.. raw:: html + +
+
diff --git a/docs/source-app/examples/research_demo_app.rst b/docs/source-app/examples/research_demo_app.rst new file mode 100644 index 0000000..90276f9 --- /dev/null +++ b/docs/source-app/examples/research_demo_app.rst @@ -0,0 +1,5 @@ +:orphan: + +######################### +Build a Research Demo App +######################### diff --git a/docs/source-app/get_started/add_an_interactive_demo.rst b/docs/source-app/get_started/add_an_interactive_demo.rst new file mode 100644 index 0000000..0ad0e6b --- /dev/null +++ b/docs/source-app/get_started/add_an_interactive_demo.rst @@ -0,0 +1,15 @@ +:orphan: + +####################### +Add an Interactive Demo +####################### + +.. _add_an_interactive_Demo: + +**Required background:** Basic Python familiarity and complete the install guide. + +**Goal:** We'll walk you through the 4 key steps to run a Lightning App that trains and demos a model. + +---- + +.. include:: go_beyond_training_content.rst diff --git a/docs/source-app/get_started/build_model.rst b/docs/source-app/get_started/build_model.rst new file mode 100644 index 0000000..300b220 --- /dev/null +++ b/docs/source-app/get_started/build_model.rst @@ -0,0 +1,73 @@ +:orphan: + +.. _build_model: + +####################### +Build and Train a Model +####################### + +**Required background:** Basic Python familiarity and complete the guide. + +**Goal:** We'll walk you through the creation of a model using PyTorch Lightning. + +---- + +********************************* +A simple PyTorch Lightning script +********************************* + +Let's assume you already have a folder with those two files. + +.. code-block:: bash + + pl_project/ + train.py # your own script to train your models + requirements.txt # your python requirements. + +If you don't, simply create a ``pl_project`` folder with those two files and add the following `PyTorch Lightning `_ code in the ``train.py`` file. This code trains a simple ``AutoEncoder`` on `MNIST Dataset `_. + +.. 
literalinclude:: ../code_samples/convert_pl_to_app/train.py + +Add the following to the ``requirements.txt`` file. + +.. literalinclude:: ../code_samples/convert_pl_to_app/requirements.txt + +Simply run the following commands in your terminal to install the requirements and train the model. + +.. code-block:: bash + + pip install -r requirements.txt + python train.py + +Get through `PyTorch Lightning Introduction `_ to learn more. + +---- + +********** +Next Steps +********** + +.. raw:: html + +
+
+
+ +.. displayitem:: + :header: Evolve a Model into an ML System + :description: Develop an App to train a model in the cloud + :col_css: col-md-6 + :button_link: training_with_apps.html + :height: 180 + +.. displayitem:: + :header: Start from a Template ML System + :description: Learn about Apps, from a template. + :col_css: col-md-6 + :button_link: go_beyond_training.html + :height: 180 + +.. raw:: html + +
+
diff --git a/docs/source-app/get_started/go_beyond_training.rst b/docs/source-app/get_started/go_beyond_training.rst new file mode 100644 index 0000000..f45e7f9 --- /dev/null +++ b/docs/source-app/get_started/go_beyond_training.rst @@ -0,0 +1,14 @@ +:orphan: + +################################ +Start from an ML system template +################################ + +.. _go_beyond_training: + +**Required background:** Basic Python familiarity and complete the install guide. + +**Goal:** We'll walk you through the 4 key steps to run a Lightning App that trains and demos a model. + + +.. include:: go_beyond_training_content.rst diff --git a/docs/source-app/get_started/go_beyond_training_content.rst b/docs/source-app/get_started/go_beyond_training_content.rst new file mode 100644 index 0000000..769513a --- /dev/null +++ b/docs/source-app/get_started/go_beyond_training_content.rst @@ -0,0 +1,405 @@ +************************************************ +The *Train & Demo PyTorch Lightning* Application +************************************************ + +Find the *Train & Demo PyTorch Lightning* application in the `Lightning.ai App Gallery `_. + +Here is a recording of this App running locally and in the cloud with the same behavior. + +.. video:: https://pl-public-data.s3.amazonaws.com/assets_lightning/lightning_app_experience_cut.mp4 + :poster: https://pl-public-data.s3.amazonaws.com/assets_lightning/lightning_app_experience_cut.png + :width: 600 + :class: background-video + :autoplay: + :loop: + :muted: + +In the steps below, we are going to show you how to build this application. + +Here are `the entire App's code `_ and `its commented components. `_ + +---- + +************************* +Step 1: Install Lightning +************************* + +If you are using a virtual env, don't forget to activate it before running commands. +You must do so in every new shell. + +.. tip:: We highly recommend using virtual environments. + +.. 
code:: bash + + pip install lightning + +---- + +**************************************** +Step 2: Install the *Train and Demo* App +**************************************** +The first Lightning App we'll explore is an App to train and demo a machine learning model. + +.. + [|qs_code|], [|qs_live_app|]. + + .. |qs_live_app| raw:: html + + live app + + .. |qs_code| raw:: html + + code + + +Install this App by typing: + +.. code-block:: bash + + lightning install app lightning/quick-start + +Verify the App was successfully installed: + +.. code-block:: bash + + cd lightning-quick-start + +---- + +*************************** +Step 3: Run the App locally +*************************** + +Run the app locally with the ``run`` command 🤯 + +.. code:: bash + + lightning run app app.py + +---- + +******************************** +Step 4: Run the App in the cloud +******************************** + +Add the ``--cloud`` argument to run on the `Lightning.AI cloud `_. 🤯🤯🤯 + +.. code:: bash + + lightning run app app.py --cloud + +.. + Your app should look like this one (|qs_live_app|) + +---- + +******************* +Understand the code +******************* +The App that we just launched trained a PyTorch Lightning model (although any framework works), then added an interactive demo. + +This is the App's code: + +.. code:: python + + # lightning-quick-start/app.py + import os.path as ops + import lightning as L + from quick_start.components import PyTorchLightningScript, ImageServeGradio + + class TrainDeploy(L.LightningFlow): + def __init__(self): + super().__init__() + self.train_work = PyTorchLightningScript( + script_path=ops.join(ops.dirname(__file__), "./train_script.py"), + script_args=["--trainer.max_epochs=5"], + ) + + self.serve_work = ImageServeGradio(L.CloudCompute()) + + def run(self): + # 1. Run the python script that trains the model + self.train_work.run() + + # 2. 
when a checkpoint is available, deploy + if self.train_work.best_model_path: + self.serve_work.run(self.train_work.best_model_path) + + def configure_layout(self): + tab_1 = {"name": "Model training", "content": self.train_work} + tab_2 = {"name": "Interactive demo", "content": self.serve_work} + return [tab_1, tab_2] + + app = L.LightningApp(TrainDeploy()) + +Let's break down the code section by section to understand what it is doing. + +---- + +1: Define root component +^^^^^^^^^^^^^^^^^^^^^^^^ + +A Lightning App provides a cohesive product experience for a set of unrelated components. + +The top-level component (Root) must subclass ``L.LightningFlow`` + + +.. code:: python + :emphasize-lines: 6 + + # lightning-quick-start/app.py + import os.path as ops + import lightning as L + from quick_start.components import PyTorchLightningScript, ImageServeGradio + + class TrainDeploy(L.LightningFlow): + def __init__(self): + super().__init__() + self.train_work = PyTorchLightningScript( + script_path=ops.join(ops.dirname(__file__), "./train_script.py"), + script_args=["--trainer.max_epochs=5"], + ) + + self.serve_work = ImageServeGradio(L.CloudCompute("cpu-small")) + + def run(self): + # 1. Run the python script that trains the model + self.train_work.run() + + # 2. when a checkpoint is available, deploy + if self.train_work.best_model_path: + self.serve_work.run(self.train_work.best_model_path) + + def configure_layout(self): + tab_1 = {"name": "Model training", "content": self.train_work} + tab_2 = {"name": "Interactive demo", "content": self.serve_work} + return [tab_1, tab_2] + + app = L.LightningApp(TrainDeploy()) + +---- + +2: Define components +^^^^^^^^^^^^^^^^^^^^ +In the __init__ method, we define the components that make up the App. In this case, we have 2 components, +a component to execute any PyTorch Lightning script (model training) and a second component to +start a Gradio server for demo purposes. + +.. 
code:: python + :emphasize-lines: 9, 14 + + # lightning-quick-start/app.py + import os.path as ops + import lightning as L + from quick_start.components import PyTorchLightningScript, ImageServeGradio + + class TrainDeploy(L.LightningFlow): + def __init__(self): + super().__init__() + self.train_work = PyTorchLightningScript( + script_path=ops.join(ops.dirname(__file__), "./train_script.py"), + script_args=["--trainer.max_epochs=5"], + ) + + self.serve_work = ImageServeGradio(L.CloudCompute("cpu-small")) + + def run(self): + # 1. Run the python script that trains the model + self.train_work.run() + + # 2. when a checkpoint is available, deploy + if self.train_work.best_model_path: + self.serve_work.run(self.train_work.best_model_path) + + def configure_layout(self): + tab_1 = {"name": "Model training", "content": self.train_work} + tab_2 = {"name": "Interactive demo", "content": self.serve_work} + return [tab_1, tab_2] + + app = L.LightningApp(TrainDeploy()) + +---- + +3: Define how components Flow +^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +Every component has a ``run`` method. The run method defines the 🌊 Flow 🌊 of how components interact together. + +In this case, we train a model (until completion). When it's done AND there exists a checkpoint, we launch a +demo server: + +.. code:: python + :emphasize-lines: 18, 21, 22 + + # lightning-quick-start/app.py + import os.path as ops + import lightning as L + from quick_start.components import PyTorchLightningScript, ImageServeGradio + + class TrainDeploy(L.LightningFlow): + def __init__(self): + super().__init__() + self.train_work = PyTorchLightningScript( + script_path=ops.join(ops.dirname(__file__), "./train_script.py"), + script_args=["--trainer.max_epochs=5"], + ) + + self.serve_work = ImageServeGradio(L.CloudCompute("cpu-small")) + + def run(self): + # 1. Run the python script that trains the model + self.train_work.run() + + # 2. 
when a checkpoint is available, deploy + if self.train_work.best_model_path: + self.serve_work.run(self.train_work.best_model_path) + + def configure_layout(self): + tab_1 = {"name": "Model training", "content": self.train_work} + tab_2 = {"name": "Interactive demo", "content": self.serve_work} + return [tab_1, tab_2] + + app = L.LightningApp(TrainDeploy()) + +.. note:: If you've used other ML systems you'll be pleasantly surprised to not find decorators or YAML files. + +---- + +4: Connect web user interfaces +^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +All our favorite tools normally have their own web user interfaces (UI). + +Implement the ``configure_layout`` method to connect them together: + +.. code:: python + :emphasize-lines: 24-27 + + # lightning-quick-start/app.py + import os.path as ops + import lightning as L + from quick_start.components import PyTorchLightningScript, ImageServeGradio + + class TrainDeploy(L.LightningFlow): + def __init__(self): + super().__init__() + self.train_work = PyTorchLightningScript( + script_path=ops.join(ops.dirname(__file__), "./train_script.py"), + script_args=["--trainer.max_epochs=5"], + ) + + self.serve_work = ImageServeGradio(L.CloudCompute("cpu-small")) + + def run(self): + # 1. Run the python script that trains the model + self.train_work.run() + + # 2. when a checkpoint is available, deploy + if self.train_work.best_model_path: + self.serve_work.run(self.train_work.best_model_path) + + def configure_layout(self): + tab_1 = {"name": "Model training", "content": self.train_work} + tab_2 = {"name": "Interactive demo", "content": self.serve_work} + return [tab_1, tab_2] + + app = L.LightningApp(TrainDeploy()) + +---- + +5: Init the ``app`` object +^^^^^^^^^^^^^^^^^^^^^^^^^^ +Initialize an ``app`` object with the ``TrainDeploy`` component (this won't run the App yet): + +.. 
code:: python + :emphasize-lines: 29 + + # lightning-quick-start/app.py + import os.path as ops + import lightning as L + from quick_start.components import PyTorchLightningScript, ImageServeGradio + + class TrainDeploy(L.LightningFlow): + def __init__(self): + super().__init__() + self.train_work = PyTorchLightningScript( + script_path=ops.join(ops.dirname(__file__), "./train_script.py"), + script_args=["--trainer.max_epochs=5"], + ) + + self.serve_work = ImageServeGradio(L.CloudCompute("cpu-small")) + + def run(self): + # 1. Run the python script that trains the model + self.train_work.run() + + # 2. when a checkpoint is available, deploy + if self.train_work.best_model_path: + self.serve_work.run(self.train_work.best_model_path) + + def configure_layout(self): + tab_1 = {"name": "Model training", "content": self.train_work} + tab_2 = {"name": "Interactive demo", "content": self.serve_work} + return [tab_1, tab_2] + + app = L.LightningApp(TrainDeploy()) + +---- + +****************************** +What components are supported? +****************************** +Any component can work with Lightning AI! + +.. figure:: https://pl-public-data.s3.amazonaws.com/assets_lightning/Lightning.gif + :alt: What is Lightning gif. + :width: 100 % + +---- + +********** +Next Steps +********** + +.. raw:: html + +
+
+ +.. displayitem:: + :header: Add components to your App + :description: Expand your App by adding components. + :col_css: col-md-4 + :button_link: ../workflows/extend_app.html + :height: 180 + +.. displayitem:: + :header: Build a component + :description: Learn to build your own component. + :col_css: col-md-4 + :button_link: ../workflows/build_lightning_component/index.html + :height: 180 + +.. displayitem:: + :header: Explore more Apps + :description: Explore more apps for inspiration. + :col_css: col-md-4 + :button_link: https://lightning.ai/apps + :height: 180 + +.. displayitem:: + :header: Under the hood + :description: Explore how it works under the hood. + :col_css: col-md-4 + :button_link: ../core_api/lightning_app/index.html + :height: 180 + +.. displayitem:: + :header: Run on your private cloud + :description: Run Lightning Apps on your private VPC or on-prem. + :button_link: ../workflows/run_on_private_cloud.html + :col_css: col-md-4 + :height: 180 + +.. raw:: html + +
+
diff --git a/docs/source-app/get_started/jumpstart_from_app_gallery.rst b/docs/source-app/get_started/jumpstart_from_app_gallery.rst new file mode 100644 index 0000000..5a21833 --- /dev/null +++ b/docs/source-app/get_started/jumpstart_from_app_gallery.rst @@ -0,0 +1,123 @@ +:orphan: + +##################################### +Start from Ready-to-Run Template Apps +##################################### + +.. _jumpstart_from_app_gallery: + +Anyone can build Apps for their own use cases and promote them on the `App Gallery `_. + +In return, you can benefit from the work of others and get started faster by re-using a ready-to-run App close to your own use case. + + +************* +User Workflow +************* + +#. Visit the `App Gallery `_ and look for an App close to your own use case. + + .. raw:: html + +
+ +#. If **Launch** is available, it means the App is live and ready to be used! Take it for a spin. + + .. figure:: https://pl-public-data.s3.amazonaws.com/assets_lightning/launch_button.png + :alt: Launch Button on lightning.ai + :width: 100 % + +#. By clicking **Clone & Run**, a copy of the App is added to your account and an instance starts running. + + + .. video:: https://pl-public-data.s3.amazonaws.com/assets_lightning/clone_and_run.mp4 + :poster: https://pl-public-data.s3.amazonaws.com/assets_lightning/clone_and_run.png + :width: 600 + :class: background-video + :autoplay: + :loop: + :muted: + +#. If you found an App that matches what you need, move to **step 5**! Otherwise, go back to **step 1**. + + .. raw:: html + +
+ +#. Copy the installation command (optionally from the clipboard on the right). + + .. figure:: https://pl-public-data.s3.amazonaws.com/assets_lightning/install_command.png + :alt: Install command on lightning.ai + :width: 100 % + +#. Copy the command to your local terminal. + + .. code-block:: bash + + lightning install app lightning/hackernews-app + +#. Go through the installation steps. + + .. video:: https://pl-public-data.s3.amazonaws.com/assets_lightning/install_an_app.mp4 + :poster: https://pl-public-data.s3.amazonaws.com/assets_lightning/install_an_app.png + :width: 600 + :class: background-video + :autoplay: + :loop: + :muted: + +#. Run the App locally. + + .. code-block:: bash + + cd LAI-Hackernews-App + lightning run app app.py + + .. video:: https://pl-public-data.s3.amazonaws.com/assets_lightning/hackernews.mp4 + :poster: https://pl-public-data.s3.amazonaws.com/assets_lightning/hackernews.png + :width: 600 + :class: background-video + :autoplay: + :loop: + :muted: + +#. Open the code with your favorite IDE, modify it, and run it back in the cloud. + + .. video:: https://pl-public-data.s3.amazonaws.com/assets_lightning/hackernews_modified.mp4 + :poster: https://pl-public-data.s3.amazonaws.com/assets_lightning/hackernews_modified.png + :width: 600 + :class: background-video + :autoplay: + :loop: + :muted: + +---- + +********** +Next Steps +********** + +.. raw:: html + +
+
+ +.. displayitem:: + :header: Add Component made by others to your App + :description: Add more functionality to your projects + :col_css: col-md-6 + :button_link: jumpstart_from_component_gallery.html + :height: 180 + +.. displayitem:: + :header: Level-up your skills with Lightning Apps + :description: From Basic to Advanced Skills + :col_css: col-md-6 + :button_link: ../levels/basic/index.html + :height: 180 + +.. raw:: html + +
+
+
diff --git a/docs/source-app/get_started/jumpstart_from_component_gallery.rst b/docs/source-app/get_started/jumpstart_from_component_gallery.rst new file mode 100644 index 0000000..95f7d57 --- /dev/null +++ b/docs/source-app/get_started/jumpstart_from_component_gallery.rst @@ -0,0 +1,151 @@ +:orphan: + +######################################## +Add Component made by others to your App +######################################## + +.. _jumpstart_from_component_gallery: + +Anyone can build components for their own use case and promote them on the `Component Gallery `_. + +In return, you can benefit from the work of others and add new functionalities to your Apps with minimal effort. + + +************* +User Workflow +************* + +#. Visit the `Component Gallery `_ and look for a Component close to something you want to do. + + .. raw:: html + +
+ +#. Check out the code for inspiration or simply install the component from PyPI and use it. + +---- + +************* +Success Story +************* + +The default `Train and Demo Application `_ trains a PyTorch Lightning +model and then starts a demo with `Gradio `_. + +.. code-block:: python + + import os.path as ops + import lightning as L + from quick_start.components import PyTorchLightningScript, ImageServeGradio + + + class TrainDeploy(L.LightningFlow): + def __init__(self): + super().__init__() + self.train_work = PyTorchLightningScript( + script_path=ops.join(ops.dirname(__file__), "./train_script.py"), + script_args=["--trainer.max_epochs=5"], + ) + + self.serve_work = ImageServeGradio(L.CloudCompute("cpu")) + + def run(self): + # 1. Run the python script that trains the model + self.train_work.run() + + # 2. when a checkpoint is available, deploy + if self.train_work.best_model_path: + self.serve_work.run(self.train_work.best_model_path) + + def configure_layout(self): + tab_1 = {"name": "Model training", "content": self.train_work} + tab_2 = {"name": "Interactive demo", "content": self.serve_work} + return [tab_1, tab_2] + + + app = L.LightningApp(TrainDeploy()) + +However, someone who wants to use this App (maybe you) found `Lightning HPO `_ +from browsing the `Component Gallery `_ and decided to give it a spin after checking the associated +`Github Repository `_. + +Once ``lightning_hpo`` was installed, they improved the default App by easily adding HPO support to their project. + +Here is the resulting App. It is almost the same code, but it's way more powerful now! + +This is the power of the `lightning.ai `_ ecosystem 🔥⚡🔥 + +.. 
code-block:: python + + import os.path as ops + import lightning as L + from quick_start.components import PyTorchLightningScript, ImageServeGradio + import optuna + from optuna.distributions import LogUniformDistribution + from lightning_hpo import Optimizer, BaseObjective + + + class HPOPyTorchLightningScript(PyTorchLightningScript, BaseObjective): + @staticmethod + def distributions(): + return {"model.lr": LogUniformDistribution(0.0001, 0.1)} + + + class TrainDeploy(L.LightningFlow): + def __init__(self): + super().__init__() + self.train_work = Optimizer( + script_path=ops.join(ops.dirname(__file__), "./train_script.py"), + script_args=["--trainer.max_epochs=5"], + objective_cls=HPOPyTorchLightningScript, + n_trials=4, + ) + + self.serve_work = ImageServeGradio(L.CloudCompute("cpu")) + + def run(self): + # 1. Run the python script that trains the model + self.train_work.run() + + # 2. when a checkpoint is available, deploy + if self.train_work.best_model_path: + self.serve_work.run(self.train_work.best_model_path) + + def configure_layout(self): + tab_1 = {"name": "Model training", "content": self.train_work.hi_plot} + tab_2 = {"name": "Interactive demo", "content": self.serve_work} + return [tab_1, tab_2] + + + app = L.LightningApp(TrainDeploy()) + +---- + +********** +Next Steps +********** + +.. raw:: html + +
+
+ +.. displayitem:: + :header: Start from Ready-to-Run Template Apps + :description: Jump-start your projects development + :col_css: col-md-6 + :button_link: jumpstart_from_app_gallery.html + :height: 180 + +.. displayitem:: + :header: Level-up your skills with Lightning Apps + :description: From Basic to Advanced Skills + :col_css: col-md-6 + :button_link: ../levels/basic/index.html + :height: 180 + +.. raw:: html + +
+
+
diff --git a/docs/source-app/get_started/training_with_apps.rst b/docs/source-app/get_started/training_with_apps.rst new file mode 100644 index 0000000..b7bf450 --- /dev/null +++ b/docs/source-app/get_started/training_with_apps.rst @@ -0,0 +1,125 @@ +:orphan: + +################################ +Evolve a model into an ML system +################################ + +.. _convert_pl_to_app: + +**Required background:** Basic Python familiarity and complete the :ref:`build_model` guide. + +**Goal:** We'll walk you through the two key steps to build your first Lightning App from your existing PyTorch Lightning scripts. + + +******************* +Training and beyond +******************* + +With `PyTorch Lightning `__, we abstracted distributed training and hardware, by organizing PyTorch code. +With `Lightning Apps `__, we unified the local and cloud experience while abstracting infrastructure. + +By using `PyTorch Lightning `__ and `Lightning Apps `__ +together, a completely new world of possibilities emerges. + +.. figure:: https://pl-public-data.s3.amazonaws.com/assets_lightning/pl_to_app_4.png + :alt: From PyTorch Lightning to Lightning App + :width: 100 % + +---- + +****************************************** +1. Write an App to run the train.py script +****************************************** + +This article continues where the :ref:`build_model` guide finished. + +Create an additional file ``app.py`` in the ``pl_project`` folder as follows: + +.. code-block:: bash + + pl_project/ + app.py + train.py + requirements.txt + +Inside the ``app.py`` file, add the following code. + +.. literalinclude:: ../code_samples/convert_pl_to_app/app.py + +This App runs the PyTorch Lightning script contained in the ``train.py`` file using the powerful :class:`~lightning.app.components.python.tracer.TracerPythonScript` component. This is really worth checking out! + +---- + +************************************************ +2. 
Run the train.py file locally or in the cloud +************************************************ + +First, go to the ``pl_project`` folder from the local terminal and install the requirements. + +.. code-block:: bash + + cd pl_project + pip install -r requirements.txt + +To run your app, copy the following command to your local terminal: + +.. code-block:: bash + + lightning run app app.py + +Simply add ``--cloud`` to run this application in the cloud with a GPU machine 🤯 + +.. code-block:: bash + + lightning run app app.py --cloud + + +Congratulations! Now, you know how to run a `PyTorch Lightning `_ script with Lightning Apps. + +Lightning Apps can make your ML system way more powerful; keep reading to learn how. + +---- + +********** +Next Steps +********** + +.. raw:: html + +
+
+ +.. displayitem:: + :header: Level-up with Lightning Apps + :description: From Basics to Advanced Skills + :col_css: col-md-4 + :button_link: ../levels/basic/index.html + :height: 180 + +.. displayitem:: + :header: Add an Interactive Demo + :description: Add a Gradio Demo once the training is finished + :col_css: col-md-4 + :button_link: add_an_interactive_demo.html + :height: 180 + +.. displayitem:: + :header: Add Model Serving + :description: Serving and load testing with MLServer and Locust + :col_css: col-md-4 + :button_link: ../examples/model_server_app/model_server_app.html + :height: 180 + +.. displayitem:: + :header: Add DAG Orchestration + :description: Organize your processing, training and metrics collection + :col_css: col-md-4 + :button_link: ../examples/dag/dag.html + :height: 180 + +.. displayitem:: + :header: Add Team Collaboration + :description: Create an app to run any PyTorch Lightning Script from Github + :col_css: col-md-4 + :button_link: ../examples/github_repo_runner/github_repo_runner.html + :height: 180 diff --git a/docs/source-app/get_started/what_app_can_do.rst b/docs/source-app/get_started/what_app_can_do.rst new file mode 100644 index 0000000..dc940c3 --- /dev/null +++ b/docs/source-app/get_started/what_app_can_do.rst @@ -0,0 +1,187 @@ +:orphan: + +############################################ +Discover what Lightning Apps can do in 5 min +############################################ + +.. _what_app_can_do: + +Lightning Apps can be many things, and while a picture is worth a thousand words, videos showing you examples should be worth even more. + + +***************************** +Flashy - Auto ML App (Public) +***************************** + +Train a model on any image or text dataset without writing any code. Flashy uses `React.js `_ for its frontend. + +Find `Flashy `_ on the App Gallery and the `Flashy codebase. `_ on GitHub. + +.. 
video:: https://pl-public-data.s3.amazonaws.com/assets_lightning/flashy.mp4 + :poster: https://pl-public-data.s3.amazonaws.com/assets_lightning/flashy.png + :width: 600 + :class: background-video + :autoplay: + :loop: + :muted: + +.. ---- + +.. *************************************** +.. NVIDIA Omniverse Sampling App (Private) +.. *************************************** + +.. Use `Nvidia Sampling Omniverse `_ to generate synthetic samples from 3D meshes and train an object detector on that data. + +.. .. video:: https://pl-public-data.s3.amazonaws.com/assets_lightning/Omniverse-Sampling.mp4 + :poster: https://pl-public-data.s3.amazonaws.com/assets_lightning/Omniverse-Sampling.png + :width: 600 + :class: background-video + :autoplay: + :loop: + :muted: + +---- + +********************* +Research App (Public) +********************* + +Share your paper ``bundled`` with the arxiv link, poster, live jupyter notebook, interactive demo to try the model, and more! + +Find the `Research App `_ on the App Gallery and the `Research App codebase. `_ on GitHub. + +.. video:: https://pl-public-data.s3.amazonaws.com/assets_lightning/research_app.mp4 + :poster: https://pl-public-data.s3.amazonaws.com/assets_lightning/research_app.png + :width: 600 + :class: background-video + :autoplay: + :loop: + :muted: + +---- + +************************************************ +ScratchPad - Notebook Manager for Team (Public) +************************************************ + +Run multiple Jupyter Notebooks on cloud CPUs or machines with multiple GPUs. + +Find the `ScratchPad App `_ on the App Gallery and the `ScratchPad App codebase `_ on GitHub. + +.. note:: ScratchPad is `tested end-to-end `_ on every Lightning App commit with `pytest `_. + +.. 
video:: https://pl-public-data.s3.amazonaws.com/assets_lightning/notebook_apps.mp4 + :poster: https://pl-public-data.s3.amazonaws.com/assets_lightning/notebook_apps.png + :width: 600 + :class: background-video + :autoplay: + :loop: + :muted: + +---- + +*********************** +InVideo Search (Public) +*********************** + +This App lets you find anything you're looking for inside a video. The engine is powered by `Open AI CLIP `_. + +Find the `InVideo Search App `_ on the App Gallery and the `InVideo Search App codebase. `_ in GitHub. + +.. video:: https://pl-public-data.s3.amazonaws.com/assets_lightning/video_search_2.mp4 + :poster: https://pl-public-data.s3.amazonaws.com/assets_lightning/video_search_2.png + :width: 600 + :class: background-video + :autoplay: + :loop: + :muted: + +---- + +****************************** +AI-powered HackerNews (Public) +****************************** + +Save yourself time, and get Hacker News story recommendations, chosen for you specifically. This Lightning App was designed to illustrate a full end-to-end MLOPs workflow aimed at enterprise recommendation systems. + +Find the `AI-powered HackerNews App `_ on the App Gallery and the `AI-powered HackerNews App codebase. `_ on GitHub. + +.. video:: https://pl-public-data.s3.amazonaws.com/assets_lightning/hackernews_app.mp4 + :poster: https://pl-public-data.s3.amazonaws.com/assets_lightning/hackernews_app.png + :width: 600 + :class: background-video + :autoplay: + :loop: + :muted: + +---- + +********************************************************************* +Lightning Apps can turn ML into scalable systems in days — not months +********************************************************************* + +Use the Lightning framework to develop any ML system: train and deploy a model, create an ETL pipeline, +or spin up a research demo — using the intuitive principles we pioneered with PyTorch Lightning. + +.. 
figure:: https://pl-public-data.s3.amazonaws.com/assets_lightning/apps_logos_2.png + :alt: Apps with Logos + :width: 100 % + +Anyone who knows Python can build a Lightning App, even without machine learning experience. + +Lightning Apps are: + +- cloud agnostic +- fault-tolerant, distributed, cost optimized +- production ready +- local and cloud debuggable +- highly reactive & interactive +- connect multiple UIs together +- built for team collaboration +- framework agnostic, use your own stack +- and much more + +.. video:: https://pl-public-data.s3.amazonaws.com/assets_lightning/lightning_app_experience_cut.mp4 + :poster: https://pl-public-data.s3.amazonaws.com/assets_lightning/lightning_app_experience_cut.png + :width: 600 + :class: background-video + :autoplay: + :loop: + :muted: + +********** +Next Steps +********** + +.. raw:: html + +
+
+
+ +.. displayitem:: + :header: Build & Train a Model + :description: Discover PyTorch Lightning and train your first Model. + :col_css: col-md-4 + :button_link: build_model.html + :height: 180 + +.. displayitem:: + :header: Evolve a Model into an ML System + :description: Develop an App to train a model in the cloud + :col_css: col-md-4 + :button_link: training_with_apps.html + :height: 180 + +.. displayitem:: + :header: Start from an ML system template + :description: Learn about Apps, from a template. + :col_css: col-md-4 + :button_link: go_beyond_training.html + :height: 180 + +.. raw:: html + +
+
diff --git a/docs/source-app/glossary/app_tree.rst b/docs/source-app/glossary/app_tree.rst new file mode 100644 index 0000000..c60d5d8 --- /dev/null +++ b/docs/source-app/glossary/app_tree.rst @@ -0,0 +1,113 @@ +:orphan: + +.. _app_component_tree: + +################### +App Component Tree +################### + +**Audience:** Users who want to know how components can be composed with each other. + +**Level:** Basic + +---- + +************************************** +What is an Application Component Tree? +************************************** + +Components can be nested to form component trees where the LightningFlows are its branches and LightningWorks are its leaves. + +This design enables users to organize and maintain their code with more ease, but more importantly, this helps create an ecosystem with re-usable components. + +Here's a basic application with four flows and two works (associated tree structure): + +.. figure:: https://pl-public-data.s3.amazonaws.com/assets_lightning/tree.gif + :alt: Basic App Components + :width: 100 % + + +.. literalinclude:: ../code_samples/quickstart/app_comp.py + +A Lightning app runs all flows in a single process. Its flows coordinate the execution of the works each running in their own independent processes. + +---- + +*********************************************** +How do I define my application component tree? +*********************************************** + +In order to define your application component tree, you need to create a tree of components and attach them to your root flow. + +You can attach your components in the **__init__** method of a flow. + +.. code-block:: python + + import lightning as L + + + class RootFlow(L.LightningFlow): + def __init__(self): + super().__init__() + # The `Work` component is attached here. + self.work = Work() + + # The `NestedFlow` component is attached here. + self.nested_flow = NestedFlow() + +Once done, simply add the root flow to a Lightning app as follows: + +.. 
code-block:: python + + app = L.LightningApp(RootFlow()) + +---- + +****************************************** +Is my application component tree static? +****************************************** + +No, Lightning supports dynamic flows and works. + +You can simply attach your components in the **run** method of a flow using the Python functions **hasattr**, **setattr**, and **getattr**. + +.. code-block:: python + + class RootFlow(L.LightningFlow): + def run(self): + + if not hasattr(self, "work"): + # The `Work` component is attached here. + setattr(self, "work", Work()) + # Run the `Work` component. + getattr(self, "work").run() + + if not hasattr(self, "nested_flow"): + # The `NestedFlow` component is attached here. + setattr(self, "nested_flow", NestedFlow()) + # Run the `NestedFlow` component. + getattr(self, "nested_flow").run() + + +But it is usually more readable to use Lightning built-in :class:`~lightning.app.structures.Dict` or :class:`~lightning.app.structures.List` as follows: + +.. code-block:: python + + from lightning.app.structures import Dict + + + class RootFlow(L.LightningFlow): + def __init__(self): + super().__init__() + self.dict = Dict() + + def run(self): + if "work" not in self.dict: + # The `Work` component is attached here. + self.dict["work"] = Work() + self.dict["work"].run() + + if "nested_flow" not in self.dict: + # The `NestedFlow` component is attached here. + self.dict["nested_flow"] = NestedFlow() + self.dict["nested_flow"].run() diff --git a/docs/source-app/glossary/aws_arn.rst b/docs/source-app/glossary/aws_arn.rst new file mode 100644 index 0000000..fc136b5 --- /dev/null +++ b/docs/source-app/glossary/aws_arn.rst @@ -0,0 +1,83 @@ +:orphan: + +.. _aws_arn: + +####### +AWS ARN +####### + +**Audience:** Users who want to run on their AWS account + +**Level:** Intermediate + +---- + +******************* +What is an AWS ARN? 
+******************* +An AWS Amazon Resource Name (ARN) is a unique identifier of an Amazon resource (dataset, bucket, machine, cluster) with +customized access controls. + +---- + +************* +Create an ARN +************* +To create an ARN, first install the AWS CLI: + +.. code:: bash + + # Linux + curl "https://awscli.amazonaws.com/awscli-exe-linux-x86_64.zip" -o "awscliv2.zip" + unzip awscliv2.zip + sudo ./aws/install + + # MAC + curl "https://awscli.amazonaws.com/AWSCLIV2.pkg" -o "AWSCLIV2.pkg" + sudo installer -pkg AWSCLIV2.pkg -target / + + # WINDOWS + msiexec.exe /i https://awscli.amazonaws.com/AWSCLIV2.msi + +Or `follow the AWS guide `_. + +Then enter the following commands: + +.. code:: bash + + # TODO + +---- + +*********************** +Run on your AWS account +*********************** +To run on your own AWS account, set up a Lightning cluster (here we name it pikachu): + +.. code:: bash + + lightning create cluster pikachu --provider aws --role-arn arn:aws:iam::1234567890:role/lai-byoc --external-id dummy --region us-west-2 + +Run your code on the pikachu cluster by passing it into CloudCompute: + +.. code:: python + + # app.py + import lightning as L + + class LitWorker(L.LightningWork): + def run(self): + message = """ + ANY python code can run here such as: + - train a model + - launch a deployment server + - label data + - run a react app, dash app, streamlit app, etc... + - start a jupyter notebook + - subprocess.Popen('echo run any shell script, python scripts or non python files') + """ + print(message) + + # uses 1 cloud GPU (or your own hardware) + compute = L.CloudCompute('gpu', clusters=['pikachu']) + app = L.LightningApp(LitWorker(cloud_compute=compute)) diff --git a/docs/source-app/glossary/build_config/build_config.rst b/docs/source-app/glossary/build_config/build_config.rst new file mode 100644 index 0000000..43ba0b0 --- /dev/null +++ b/docs/source-app/glossary/build_config/build_config.rst @@ -0,0 +1,43 @@ +:orphan: + +.. 
_build_config: + +################### +Build Configuration +################### + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: Basic + :description: Learn how to manage Python dependencies for an individual LightningWork + :col_css: col-md-6 + :button_link: build_config_basic.html + :height: 150 + :tag: basic + +.. displayitem:: + :header: Intermediate + :description: Learn how to run custom build commands for a LightningWork + :col_css: col-md-6 + :button_link: build_config_intermediate.html + :height: 150 + :tag: intermediate + +.. displayitem:: + :header: Advanced + :description: Learn how to use a custom Docker image for a LightningWork + :col_css: col-md-6 + :button_link: build_config_advanced.html + :height: 150 + :tag: advanced + +.. raw:: html + +
+
diff --git a/docs/source-app/glossary/build_config/build_config_advanced.rst b/docs/source-app/glossary/build_config/build_config_advanced.rst new file mode 100644 index 0000000..bc6f5a2 --- /dev/null +++ b/docs/source-app/glossary/build_config/build_config_advanced.rst @@ -0,0 +1,63 @@ +:orphan: + +############################## +Build Configuration (Advanced) +############################## + +**Audience:** Users who want full control over the docker image that is being installed in the cloud. + +**Level:** Advanced + +Advanced users who need full control over the environment a LightningWork runs in can specify a custom docker image that will be deployed in the cloud. + + +---- + +****************** +Use a docker image +****************** + +Create a :class:`~lightning.app.utilities.packaging.build_config.BuildConfig` and provide a **publicly accessible** link to where the image is hosted: + +.. code-block:: python + + from lightning.app import LightningWork, BuildConfig + + + class MyWork(LightningWork): + def __init__(self): + super().__init__() + + # Using a publicly hosted docker image: + self.cloud_build_config = BuildConfig( + # This is one of the base images Lightning uses by default + image="ghcr.io/gridai/base-images:v1.8-gpu" + ) + + # Can also be combined with extra requirements + self.cloud_build_config = BuildConfig(image="...", requirements=["torchmetrics"]) + + +.. warning:: + Many public hosters like DockerHub apply rate limits for public images. We recommend to pull images from your own registry. + For example, you can set up a + `docker registry on GitHub `_. + + +.. note:: + - The build config only applies when running in the cloud and gets ignored otherwise. A local build config is currently not supported. + - Images from private registries are currently not supported. + +.. note:: + Custom docker images must have python installed. We'll use `virtualenv` from this system python to create a virtual environment. 
+ We'll also configure the `virtualenv` to use the packages installed under the system's Python so your packages are not lost. + +---- + + +********************* +Provide a docker file +********************* + +.. note:: + Not yet supported. Coming soon. diff --git a/docs/source-app/glossary/build_config/build_config_basic.rst b/docs/source-app/glossary/build_config/build_config_basic.rst new file mode 100644 index 0000000..633c173 --- /dev/null +++ b/docs/source-app/glossary/build_config/build_config_basic.rst @@ -0,0 +1,68 @@ +:orphan: + +########################### +Build Configuration (Basic) +########################### + +**Audience:** Users who need to install Python packages for an individual LightningWork. + +**Level:** Basic + +---- + +*********************************** +List dependencies in separate files +*********************************** + +If you are building an app with multiple LightningWorks that have different or even conflicting requirements, split your dependencies into individual files +for more granular control. + +.. code-block:: bash + + ├── app.py + ├── requirements.txt # Global requirements for the entire app + └── works + ├── serve + │ ├── requirements.txt # Requirements specific to the 'serve' work + │ └── serve.py # Source file for the LightningWork + └── train + ├── requirements.txt # Requirements specific to the 'train' work + └── train.py # Source file for the LightningWork + +The requirements.txt file must be located in the same directory as the source file of the LightningWork. +When the LightningWork starts up, it will pick up the requirements file if present and install all listed packages. + +.. note:: + This only applies when running in the cloud. The requirements.txt files get ignored when running locally. 
+ +---- + +*********************************** +Define the requirements in the code +*********************************** + +Instead of listing the requirements in a file, you can also pass them to the LightningWork at runtime using the +:class:`~lightning.app.utilities.packaging.build_config.BuildConfig`: + +.. code-block:: python + :emphasize-lines: 7 + + from lightning.app import LightningWork, BuildConfig + + + class MyWork(LightningWork): + def __init__(self): + super().__init__() + self.cloud_build_config = BuildConfig(requirements=["torch>=1.8", "torchmetrics"]) + +.. note:: + The build config only applies when running in the cloud and gets ignored otherwise. A local build config is currently not supported. + +.. warning:: + Custom base images are not supported with the default CPU cloud compute. For example: + + .. code-block:: py + + class MyWork(LightningWork): + def __init__(self): + super().__init__(cloud_build_config=BuildConfig(image="my-custom-image")) # no cloud compute, for example default work diff --git a/docs/source-app/glossary/build_config/build_config_intermediate.rst b/docs/source-app/glossary/build_config/build_config_intermediate.rst new file mode 100644 index 0000000..de301c6 --- /dev/null +++ b/docs/source-app/glossary/build_config/build_config_intermediate.rst @@ -0,0 +1,56 @@ +:orphan: + +################################## +Build Configuration (Intermediate) +################################## + +**Audience:** Users who need to execute commands to configure the machine before a LightningWork runs on it. + +**Level:** Intermediate + +When a LightningWork machine starts up in the cloud, it uses a lightweight operating system with essential packages pre-installed. +If you need to install additional system packages or run other configuration steps before your code executes on that machine, it is possible to do so by creating a custom +:class:`~lightning.app.utilities.packaging.build_config.BuildConfig`: + +1. 
Subclass :class:`~lightning.app.utilities.packaging.build_config.BuildConfig`: + + .. code-block:: python + + from lightning.app import BuildConfig + + + @dataclass + class CustomBuildConfig(BuildConfig): + def build_commands(self): + return ["sudo apt-get install libsparsehash-dev"] + + +2. Set the build config on the LightningWork: + + .. code-block:: python + + from lightning.app import LightningWork + + + class MyWork(LightningWork): + def __init__(self): + super().__init__() + + # Use the custom build config + self.cloud_build_config = CustomBuildConfig() + + # Can also be combined with extra requirements + self.cloud_build_config = CustomBuildConfig(requirements=["torchmetrics"]) + +.. note:: + - When you need to execute commands or install tools that require more privileges than the current user has, you can use ``sudo`` without needing to provide a password, e.g., when installing system packages. + - The build config only applies when running in the cloud and gets ignored otherwise. A local build config is currently not supported. + +.. warning:: + Custom base images are not supported with the default CPU cloud compute. For example: + + .. code-block:: py + + class MyWork(LightningWork): + def __init__(self): + super().__init__(cloud_build_config=BuildConfig(image="my-custom-image")) # no cloud compute, for example default work diff --git a/docs/source-app/glossary/command_lines/command_lines.rst b/docs/source-app/glossary/command_lines/command_lines.rst new file mode 100644 index 0000000..1ad4cdf --- /dev/null +++ b/docs/source-app/glossary/command_lines/command_lines.rst @@ -0,0 +1,76 @@ +:orphan: + +############################ +Command-line Interface (CLI) +############################ + +**Audience:** Users looking to create a command line interface (CLI) for their application. + +---- + +************** +What is a CLI? +************** + +A Command-line Interface (CLI) is a user interface (UI) in a terminal to interact with a specific program. + +.. 
note:: + + The Lightning guideline to build CLI is `lightning ...` or ` ...`. + +As an example, Lightning provides a CLI to interact with your Lightning Apps and the `lightning.ai `_ platform as follows: + +.. code-block:: bash + + main + ├── create - Creates Lightning AI self-managed resources (clusters, etc…) + │ └── cluster - Creates a Lightning AI BYOC compute cluster with your cloud provider credentials. + ├── delete - Deletes Lightning AI self-managed resources (clusters, etc…) + │ └── cluster - Deletes a Lightning AI BYOC compute cluster and all associated cloud provider resources. + ├── fork - Forks an App. + ├── init - Initializes a Lightning App and/or Component. + │ ├── app + │ ├── component + │ ├── pl-app - Creates an App from your PyTorch Lightning source files. + │ └── react-ui - Creates a React UI to give a Lightning Component a React.js web UI + ├── install - Installs a Lightning App and/or Component. + │ ├── app + │ └── component + ├── list - Lists Lightning AI self-managed resources (clusters, etc…) + │ ├── apps - Lists your Lightning AI Apps. + │ └── clusters - Lists your Lightning AI BYOC compute clusters. + ├── login - Logs in to your lightning.ai account. + ├── logout - Logs out of your lightning.ai account. + ├── run - Runs a Lightning App locally or on the cloud. + │ └── app - Runs an App from a file. + ├── show - Shows given resource. + │ ├── cluster - Groups cluster commands inside show. + │ │ └── logs - Shows cluster logs. + │ └── logs - Shows cloud application logs. By default prints logs for all currently available Components. + ├── stop - Stops your App. + └── tree - Shows the command tree of your CLI. + +Learn more about `Command-line interfaces here `_. + +---- + +********** +Learn more +********** + +.. raw:: html + +
+
+ +.. displayitem:: + :header: Develop a Command Line Interface + :description: Learn how to develop a CLI for your App. + :col_css: col-md-6 + :button_link: ../../workflows/build_command_line_interface/index_content.html + :height: 150 + +.. raw:: html + +
+
diff --git a/docs/source-app/glossary/dag.rst b/docs/source-app/glossary/dag.rst new file mode 100644 index 0000000..ef85d33 --- /dev/null +++ b/docs/source-app/glossary/dag.rst @@ -0,0 +1,46 @@ +###################### +Directed Acyclic Graph +###################### +**Audience:** Users coming from MLOps to Lightning Apps, looking for more flexibility. + +---- + +***************************** +Is Lightning a DAG framework? +***************************** +No. + +A Lightning App enables developers to express complex, interactive applications that are impossible to create with DAGs. + +---- + +********************************* +Can I Build a DAG with Lightning? +********************************* +Yes! + +DAGs are one of the easiest Lightning Apps to build. For example, here's a `full app that defines a DAG <../examples/dag/dag.html>`_. + +---- + +******** +Examples +******** + +.. raw:: html + +
+
+ +.. displayitem:: + :header: Build a DAG + :description: Learn how to create a DAG with Lightning + :col_css: col-md-4 + :button_link: ../examples/dag/dag.html + :height: 180 + :tag: Intermediate + +.. raw:: html + +
+
diff --git a/docs/source-app/glossary/debug_app.rst b/docs/source-app/glossary/debug_app.rst new file mode 100644 index 0000000..2d5c0d1 --- /dev/null +++ b/docs/source-app/glossary/debug_app.rst @@ -0,0 +1,3 @@ +:orphan: + +.. include:: ../workflows/debug_locally.rst diff --git a/docs/source-app/glossary/distributed_fe.rst b/docs/source-app/glossary/distributed_fe.rst new file mode 100644 index 0000000..36d64b0 --- /dev/null +++ b/docs/source-app/glossary/distributed_fe.rst @@ -0,0 +1,5 @@ +:orphan: + +##################### +Distributed Front-End +##################### diff --git a/docs/source-app/glossary/distributed_hardware.rst b/docs/source-app/glossary/distributed_hardware.rst new file mode 100644 index 0000000..0a64f5f --- /dev/null +++ b/docs/source-app/glossary/distributed_hardware.rst @@ -0,0 +1,5 @@ +:orphan: + +#################### +Distributed Hardware +#################### diff --git a/docs/source-app/glossary/environment_variables.rst b/docs/source-app/glossary/environment_variables.rst new file mode 100644 index 0000000..10c3e9a --- /dev/null +++ b/docs/source-app/glossary/environment_variables.rst @@ -0,0 +1,27 @@ +.. _environment_variables: + +********************* +Environment Variables +********************* + +If your App is using configuration values you don't want to commit with your App source code, you can use environment variables. + +Lightning allows you to set environment variables when running the App from the CLI with the `lightning run app` command. You can use environment variables to pass any values to the App, and avoid hard-coding those values in the source code. + +Set one or multiple variables using the **--env** option: + +.. code:: bash + + lightning run app app.py --cloud --env FOO=BAR --env BAZ=FAZ + +Environment variables are available in all Flows and Works, and can be accessed as follows: + +.. code:: python + + import os + + print(os.environ["FOO"]) # BAR + print(os.environ["BAZ"]) # FAZ + +.. 
note:: + Environment variables are not encrypted. For sensitive values, we recommend using :ref:`Encrypted Secrets `. diff --git a/docs/source-app/glossary/event_loop.rst b/docs/source-app/glossary/event_loop.rst new file mode 100644 index 0000000..30d1bd3 --- /dev/null +++ b/docs/source-app/glossary/event_loop.rst @@ -0,0 +1,11 @@ +########## +Event loop +########## + +Drawing inspiration from modern web frameworks like `React.js `_, the Lightning App runs all flows in an **event loop** (forever), which is triggered several times a second after collecting any works' state change. + +.. figure:: https://pl-public-data.s3.amazonaws.com/assets_lightning/lightning_loop.gif + +When running a Lightning App in the cloud, the ``LightningWork`` run on different machines. LightningWork communicates any state changes to the **event loop** which re-executes the flow with the newly-collected works' state. + +.. _app_event_loop: diff --git a/docs/source-app/glossary/fault_tolerance.rst b/docs/source-app/glossary/fault_tolerance.rst new file mode 100644 index 0000000..b0ee6df --- /dev/null +++ b/docs/source-app/glossary/fault_tolerance.rst @@ -0,0 +1,7 @@ +:orphan: + +############### +Fault tolerance +############### + +.. note:: documentation under construction diff --git a/docs/source-app/glossary/index.rst b/docs/source-app/glossary/index.rst new file mode 100644 index 0000000..0f92d4b --- /dev/null +++ b/docs/source-app/glossary/index.rst @@ -0,0 +1,163 @@ +.. toctree:: + :maxdepth: 1 + :hidden: + + ios_and_android + app_tree + aws_arn + build_config/build_config + command_lines/command_lines + dag + event_loop + environment_variables + secrets + front ends <../workflows/add_web_ui/glossary_front_end> + Lightning app <../core_api/lightning_app/index> + sharing_components + scheduling + storage/storage + restful_api/restful_api + add web ui <../workflows/add_web_ui/glossary_ui> + use_local_lightning + +######## +Glossary +######## + +.. raw:: html + +
+
+ +.. displayitem:: + :header: Android Lightning App + :description: Use Lightning with android apps. + :col_css: col-md-12 + :button_link: ios_and_android.html + :height: 100 + +.. displayitem:: + :header: App Components Tree + :description: Learn how components can be nested to form component trees where the LightningFlows are its branches and LightningWorks are its leaves. + :col_css: col-md-12 + :button_link: app_tree.html + :height: 100 + +.. displayitem:: + :header: AWS ARN + :description: Create an AWS ARN + :col_css: col-md-12 + :button_link: aws_arn.html + :height: 100 + +.. displayitem:: + :header: Build Configuration + :description: Prepare your requirements, add custom build commands or use docker image + :col_css: col-md-12 + :button_link: build_config/build_config.html + :height: 100 + +.. displayitem:: + :header: Command Line Interface (CLI) + :description: Learn about the Lightning CLI + :col_css: col-md-12 + :button_link: command_lines/command_lines.html + :height: 100 + +.. displayitem:: + :header: DAG + :description: Learn about directed acyclic graph, their properties and usage + :col_css: col-md-12 + :button_link: dag.html + :height: 100 + +.. displayitem:: + :header: Event Loop + :description: Learn how the Infinite Event Loop enables high distributed reactivity by triggering after collecting state changes. + :col_css: col-md-12 + :button_link: event_loop.html + :height: 100 + +.. displayitem:: + :header: Environment Variables + :description: Add secrets such as API keys or access tokens + :col_css: col-md-12 + :button_link: environment_variables.html + :height: 100 + +.. displayitem:: + :header: Encrypted Secrets + :description: Learn how to add passwords to your Lightning apps + :col_css: col-md-12 + :button_link: secrets.html + :height: 100 + +.. 
displayitem:: + :header: Frontend + :description: Customize your App View with any framework you want + :col_css: col-md-12 + :button_link: ../workflows/add_web_ui/glossary_front_end.html + :height: 100 + +.. displayitem:: + :header: iOS Lightning App + :description: Use Lightning with iOS apps. + :col_css: col-md-12 + :button_link: ios_and_android.html + :height: 100 + +.. displayitem:: + :header: Lightning App + :description: A Lightning app is a collection of connected components that form a workflow + :col_css: col-md-12 + :button_link: ../core_api/lightning_app/index.html + :height: 100 + +.. displayitem:: + :header: Mounts + :description: Mount Cloud Data + :col_css: col-md-6 + :button_link: mount.html + :height: 180 + +.. displayitem:: + :header: Sharing Components + :description: Let's create an ecosystem altogether + :col_css: col-md-12 + :button_link: sharing_components.html + :height: 100 + +.. displayitem:: + :header: Scheduling + :description: Orchestrate execution at specific times + :col_css: col-md-12 + :button_link: scheduling.html + :height: 100 + +.. displayitem:: + :header: Storage + :description: Easily share files even across multiple machines + :col_css: col-md-12 + :button_link: storage/storage.html + :height: 100 + +.. displayitem:: + :header: REST API + :description: Learn how to set up a RESTful API endpoint + :col_css: col-md-12 + :button_link: restful_api/restful_api.html + :height: 100 + +.. displayitem:: + :header: UI + :description: Combine multiple frameworks to create your own UI + :col_css: col-md-12 + :button_link: ../workflows/add_web_ui/glossary_ui.html + :height: 100 + +.. 
displayitem:: + :header: Using a development branch of Lightning on the Cloud + :description: Learn how to contribute to the Lightning framework in the cloud + :col_css: col-md-12 + :button_link: use_local_lightning.html + :height: 100 diff --git a/docs/source-app/glossary/ios_and_android.rst b/docs/source-app/glossary/ios_and_android.rst new file mode 100644 index 0000000..90aeecb --- /dev/null +++ b/docs/source-app/glossary/ios_and_android.rst @@ -0,0 +1,26 @@ + +############################################### +Apple and Android mobile devices with Lightning +############################################### + +Audience: Users who want to develop Lightning Apps for Apple or Android mobile devices. + +---- + +*********************************************************** +Develop a Lightning App for Apple or Android mobile devices +*********************************************************** + +There are a couple of ways you can go about building Lightning Apps that work on Apple or Android mobile devices. + +Option 1 +^^^^^^^^ + +You can develop a Lightning App that interacts with an iOS or Android app. +The ML and backend services live on the Lightning App, but the iOS or Android code (obj-c/swift or android) lives on the mobile devices. + +Option 2 +^^^^^^^^ + +You can build a mobile-first React Lightning App that works on both Apple and Android mobile devices. +The `InVideo app `_ is a good example of a Lightning App that does just that. diff --git a/docs/source-app/glossary/lightning_app_overview/index.rst b/docs/source-app/glossary/lightning_app_overview/index.rst new file mode 100644 index 0000000..09de273 --- /dev/null +++ b/docs/source-app/glossary/lightning_app_overview/index.rst @@ -0,0 +1,11 @@ +:orphan: + +########################### +Lightning Apps Key concepts +########################### + +**Audience:** Users who want to know how the 🤯 magic works under the hood. + +---- + +.. 
note:: This page is under construction diff --git a/docs/source-app/glossary/mount.rst b/docs/source-app/glossary/mount.rst new file mode 100644 index 0000000..a62d72b --- /dev/null +++ b/docs/source-app/glossary/mount.rst @@ -0,0 +1 @@ +.. include:: ../workflows/mount_cloud_object_store.rst diff --git a/docs/source-app/glossary/restful_api/restful_api.rst b/docs/source-app/glossary/restful_api/restful_api.rst new file mode 100644 index 0000000..a1128f2 --- /dev/null +++ b/docs/source-app/glossary/restful_api/restful_api.rst @@ -0,0 +1,53 @@ +:orphan: + +########### +RESTful API +########### + +**Audience:** Users looking to create an API in their App to allow users to activate functionalities from external sources. + +---- + +********************** +What is a RESTful API? +********************** + +A RESTful API is a set of external URL routes exposed by a server that enables clients to trigger some functionalities, such as getting or putting some data, uploading files, etc.. + +This provides great flexibility for users as they can easily discover functionalities made available by the App Builders. + +The Lightning App framework supports the four primary HTTP methods: `GET`, `POST`, `PUT`, `DELETE`. + +These methods are guidelines to organize your RESTful Services and help users understand your functionalities. + +* **`GET`:** Reads data from the server. +* **`POST`:** Creates new resources. +* **`PUT`:** Updates/replaces existing resources. +* **`DELETE`:** Deletes resources. + +Learn more about `HTTP Methods for RESTful Services here `_. + +The Lightning App framework uses the popular `FastAPI `_ and `Pydantic `_ frameworks under the hood. This means you can use all their features while building your App. + +---- + +********** +Learn more +********** + +.. raw:: html + +
+
+ +.. displayitem:: + :header: Develop a RESTful API + :description: Learn how to develop an API for your App. + :col_css: col-md-6 + :button_link: ../../workflows/build_rest_api/index_content.html + :height: 150 + +.. raw:: html + +
+
diff --git a/docs/source-app/glossary/scheduling.rst b/docs/source-app/glossary/scheduling.rst new file mode 100644 index 0000000..0e04dc3 --- /dev/null +++ b/docs/source-app/glossary/scheduling.rst @@ -0,0 +1,185 @@ +:orphan: + +########## +Scheduling +########## + +The Lightning Scheduling system makes it easy to schedule your components' execution with any arbitrary conditions. + + +---- + +************************ +Schedule your components +************************ + +The LightningFlow has a ``schedule`` method which can be used to schedule your components. + +.. code-block:: python + + from lightning.app import LightningWork, LightningFlow + from lightning.app.storage import Path + + + class MyFlow(LightningFlow): + + def run(self): + if self.schedule("hourly"): + # run some code once every hour. + + if self.schedule("daily"): + # run some code once a day. + + if self.schedule("daily") and anything_else: + # run some code once a day if anything_else is also True. + + if self.schedule("2 4 * * mon,fri"): + # defined with cron syntax, run some code at 04:02 on every Monday and Friday. + +Learn more about the cron syntax `here `_ + +---- + +************** +Best Practices +************** + +In the example above, the line ``self.schedule("hourly")`` will return ``True`` for a **single** flow execution every hour. Mathematically, this is known as a dirac. + +1. Instantiate your component under the schedule method and run outside as follows: + +.. code-block:: python + + from lightning.app import LightningFlow + from lightning.app.structures import List + + class ScheduledDAG(LightningFlow): + def __init__(self): + super().__init__() + self.list = List() + + def run(self): + if self.schedule("hourly"): + # dynamically instantiate + # don't forget to always attach + # your components to the flow !!! + self.list.append(MyDAGFlow(...)) + + # run all dags, but the completed ones + # are cached and don't re-execute. + for dag in self.list: + dag.run() + + +2. 
Run a single work under the schedule with different arguments to have it re-run. + +.. code-block:: python + + from lightning.app import LightningFlow + from time import time + + class ScheduledDAG(LightningFlow): + def __init__(self): + super().__init__() + self.data_processor = DataProcessorWork(...) + + def run(self): + ... + if self.schedule("hourly"): + self.data_processor.run(trigger_time=time()) + + +3. Capture the event in the state and execute your sequential works outside. + +.. code-block:: python + + from lightning.app import LightningFlow + from time import time + + class ScheduledDAG(LightningFlow): + def __init__(self): + super().__init__() + self.should_execute = False + self.data_processor = DataProcessorWork(...) + self.training_work = KerasTrainingWork(...) + + def run(self): + ... + if self.schedule("hourly"): + self.should_execute = True + + # Runs in 10 min + if self.should_execute: + # Runs in 5 min + self.data_processor.run(trigger_time=time()) + if self.data_processor.has_succeeded: + # Runs in 5 min + self.training_work.run(self.data_processor.data) + if self.training_work.has_succeeded: + self.should_execute = False + +---- + +*********** +Limitations +*********** + +As stated above, the schedule acts as a dirac and is **True** for a single flow execution. +Therefore, sequential works execution under the schedule won't work as they don't complete within a single flow execution. + +Here is an example of something which **WON'T** work: + +.. code-block:: python + + from lightning.app import LightningFlow + from time import time + + class ScheduledDAG(LightningFlow): + def __init__(self): + super().__init__() + self.data_processor = DataProcessorWork(...) + self.training_work = KerasTrainingWork(...) + + def run(self): + ... 
+ if self.schedule("hourly"): + # This finishes 5 min later + self.data_processor.run(trigger_time=time()) + if self.data_processor.has_succeeded: + # This will never be reached as the + # data processor will keep processing forever... + self.training_work.run(self.data_processor.data) + +---- + +************************** +Frequently Asked Questions +************************** + +- **Q: Can I use multiple nested schedulers?** No, as they might cancel themselves out, but you can capture the event of one to trigger the next one. + +- **Q: Can I use any arbitrary logic to schedule?** Yes, this design enables absolute flexibility, but you need to be careful to avoid bad practices. + +---- + +******** +Examples +******** + +.. raw:: html + +
+
+ +.. displayitem:: + :header: Build a DAG + :description: Learn how to schedule a DAG execution + :col_css: col-md-4 + :button_link: ../examples/dag/dag.html + :height: 180 + :tag: Intermediate + +.. raw:: html + +
+
diff --git a/docs/source-app/glossary/secrets.rst b/docs/source-app/glossary/secrets.rst new file mode 100644 index 0000000..09a69ec --- /dev/null +++ b/docs/source-app/glossary/secrets.rst @@ -0,0 +1,74 @@ +.. _secrets: + +################# +Encrypted Secrets +################# + +Encrypted Secrets allow you to pass private data to your apps, like API keys, access tokens, database passwords, or other credentials, in a secure way without exposing them in your code. +Secrets provide you with a secure way to store this data in a way that is accessible to Apps so that they can authenticate third-party services/solutions. + +.. tip:: + For non-sensitive configuration values, we recommend using :ref:`plain-text Environment Variables `. + +************ +Add a secret +************ + +Add the secret to your profile on lightning.ai. +Log in to your lightning.ai account > **Profile** > **Secrets** tab > click the **+New** button. +Provide a name and value to your secret, for example, the name could be "github_api_token". + +.. note:: + Secret names must start with a letter and can only contain letters, numbers, dashes, and periods. The Secret names must comply with `RFC1123 naming conventions `_. The Secret value has no restrictions. + +.. video:: https://pl-public-data.s3.amazonaws.com/assets_lightning//encrypted_secrets_login.mp4 + :poster: https://pl-public-data.s3.amazonaws.com/assets_lightning//encrypted_secrets_login.png + :width: 600 + :class: background-video + :autoplay: + :loop: + :muted: + +************ +Use a secret +************ + +1. Add an environment variable to your app to read the secret. For example, add an "api_token" environment variable: + +.. code:: python + + import os + + component.connect(api_token=os.environ["api_token"]) + +2. Pass the secret to your app run with the following command: + +.. code:: bash + + lightning run app app.py --cloud --secret <environment-variable>=<secret-name> + +In this example, the command would be: + +.. 
code:: bash + + lightning run app app.py --cloud --secret api_token=github_api_token + + +The ``--secret`` option can be used for multiple Secrets, and alongside the ``--env`` option. + +Here's an example: + +.. code:: bash + + lightning run app app.py --cloud --env FOO=bar --secret MY_APP_SECRET=my-secret --secret ANOTHER_SECRET=another-secret + + +---- + +****************** +How does this work +****************** + +When a Lightning App (App) **runs in the cloud**, a Secret can be exposed to the App using environment variables. +The value of the Secret is encrypted in the Lightning.ai database, and is only decrypted and accessible to +LightningFlow (Flow) or LightningWork (Work) processes in the cloud (when you use the ``--cloud`` option running your App). diff --git a/docs/source-app/glossary/sharing_components.rst b/docs/source-app/glossary/sharing_components.rst new file mode 100644 index 0000000..f9cc48c --- /dev/null +++ b/docs/source-app/glossary/sharing_components.rst @@ -0,0 +1,50 @@ +##################### +Sharing my components +##################### + +**Audience:** Users who want to know how to share component. + +**Level:** Basic + +---- + +******************************************** +Why should I consider sharing my components? +******************************************** + +Lightning is community driven and its core objective is to make AI accessible to everyone. + +By creating components and sharing them with everyone else, the barrier to entry will go down. + +---- + +************************************ +How should I organize my components? +************************************ + +By design, Lightning components are nested to form component trees where the ``LightningFlows`` are its branches and ``LightningWorks`` are its leaves. + +This design has two primary advantages: + +* This helps users organize and maintain their code with more ease. +* This also helps create an ecosystem with **reusable** components. 
+ + +Now, imagine you have implemented a **KerasScriptRunner** component for training any `Keras `_ model with `Tensorboard UI `_ integrated. + +Here are the best-practice steps before sharing the component: + +* **Testing**: Ensure your component is well tested by following the :ref:`../testing` guide. +* **Documented**: Ensure your component has a docstring and comes with some usage explanations. + +.. Note:: As a Lightning user, it helps to implement your components thinking someone else is going to use them. + +---- + +***************************************** +How should I proceed to share components? +***************************************** + +Once your component is ready, create a *PyPI* package with your own library and then it can be reused by anyone else. + +Here is a `Component Template `_ from `William Falcon `_ to guide your component. diff --git a/docs/source-app/glossary/storage/differences.rst b/docs/source-app/glossary/storage/differences.rst new file mode 100644 index 0000000..ed45edd --- /dev/null +++ b/docs/source-app/glossary/storage/differences.rst @@ -0,0 +1,78 @@ +:orphan: + +################################## +Differences between Drive and Path +################################## + +**Audience:** Users who want to share files between components. + + +The Lightning Storage system makes it easy to share files between LightningWork so you can run your app both locally and in the cloud without changing the code. + + +Lightning storage provides two solutions :class:`~lightning.app.storage.drive.Drive` and :class:`~lightning.app.storage.path.Path` to deal with files locally and in the cloud alike. + + +---- + +***************** +What is a Drive ? +***************** + +The Drive object provides a central place for your components to share data. + +The drive acts as an isolated folder and any component can access it by knowing its name. + +Your components can put, list, get, delete files from and to the Drive (except LightningFlow's). 
+ +---- + +**************** +What is a Path ? +**************** + +The Path object is a reference to a specific file or directory from a LightningWork and can be used to transfer those files to another LightningWork (one way, from source to destination). + +A good mental representation of the Path Object usage is the `relay race `_. +To make a transfer, the LightningWork Receiver asks (e.g., when the path object is passed by the flow to the Receiver) +for a copy of the files (baton) owned by their LightningWork Producer (e.g., the work that created the files). + +---- + +********************************* +When should I use Drive vs Path ? +********************************* + +The Drive should be used when you want to easily share data between components, but the Path enables you to create cleaner, shareable +components where you want to expose some files to be transferred (like an HPO component sharing the best model weights) for anyone else to use. + +The Drive is more intuitive and easier to get on-boarded with, but in more advanced use cases, you might appreciate the Path Object +which makes uni-directional file transfers simpler. + +---- + +.. raw:: html + +
+
+ +.. displayitem:: + :header: The Drive Object. + :description: Put, List and Get Files From a Shared Drive Disk. + :col_css: col-md-4 + :button_link: drive.html + :height: 180 + :tag: Basic + +.. displayitem:: + :header: The Path Object. + :description: Transfer Files From One Component to Another by Reference. + :col_css: col-md-4 + :button_link: path.html + :height: 180 + :tag: Intermediate + +.. raw:: html + +
+
diff --git a/docs/source-app/glossary/storage/drive.rst b/docs/source-app/glossary/storage/drive.rst new file mode 100644 index 0000000..dffdb97 --- /dev/null +++ b/docs/source-app/glossary/storage/drive.rst @@ -0,0 +1,13 @@ +:orphan: + +.. _drive_storage: + +############# +Drive Storage +############# + +**Audience:** Users who want to put, list, and get files from a shared disk space. + +---- + +.. include:: ../../glossary/storage/drive_content_old.rst diff --git a/docs/source-app/glossary/storage/drive_content.rst b/docs/source-app/glossary/storage/drive_content.rst new file mode 100644 index 0000000..8ab7015 --- /dev/null +++ b/docs/source-app/glossary/storage/drive_content.rst @@ -0,0 +1,223 @@ +:orphan: + +************************** +What are Lightning Drives? +************************** + +Lightning Drives are shared app storage that allow you to share files between `LightningWork (Work) <../../core_api/lightning_work/index.html>`_ components, so that you distributed components can share files when running on the cloud. Using drives, you can run your Lightning App both locally and in the cloud without changing the code. + +The Drive object provides a central place for your components to share data. + +The Drive acts as an isolated folder and any component can access it by knowing its name. + +We currently support two types of Drives: Lightning-managed (``lit://``) and S3 (``s3://``). + ++-----------------------------------+-------------------------------------------------------------------------------------------------------------------------------+ +| Lightning-managed (``lit://``) | Allows read-write operations and are accessible through the Drive API from a Work. | +| | | +| | They allow your components to put, list, get, and delete files from and to the Drive (except LightningFlows). 
| ++-----------------------------------+-------------------------------------------------------------------------------------------------------------------------------+ +| S3 (``s3://``) | S3 is AWS S3 storage mounted at a filesystem mount point. S3 is read-only (for now) and its primary purpose is | +| | to give you a permanent location to access your training data. | +| | | +| | They allow your components to list and get files located on the Drive. | ++-----------------------------------+-------------------------------------------------------------------------------------------------------------------------------+ + +---- + +********************** +What Drives do for you +********************** + +Think of every instance of the Drive object acting like a Google Drive or like Dropbox. + +By sharing the Drive between components through the LightningFlow, +several components can have a shared place to read (S3 Drives) or read and write (Lightning-managed Drives) files from. + +S3 Drive Limitations +^^^^^^^^^^^^^^^^^^^^ + +These limitations only apply to S3 Drives: + +* There is no top level “shareable” S3 drive object. Each S3 Drive is owned by a particular Work. However, it’s possible to create a Drive with the same location across multiple Works. + +* S3 buckets cannot be mounted as Drives once a Work has been instantiated. The `Drive` object must be initialized passed to a Work at creation time. + +* Whenever a Drive is mounted to a Work, an indexing process will be done again for the provided S3 bucket. This may lead to performance issues with particularly large S3 buckets. For context, 1M files with 2-3 levels of nesting takes less than 1 second to index. + +---- + +************** +Create a Drive +************** + +In order to create a Drive, you simply need to pass its name with the prefix ``lit://`` or ``s3://``. + +.. note:: We do not support mounting single objects for S3 buckets, so there must be a trailing `/` in the s3:// URL. 
For example: ``s3://foo/bar/``. + +.. code-block:: python + + from lightning.app.storage import Drive + + # The identifier of this Drive is ``drive_1`` + # Note: You need to add Lightning protocol ``lit://`` as a prefix. + + drive_1 = Drive("lit://drive_1") + + # The identifier of this Drive is ``drive_2`` + drive_2 = Drive("s3://drive_2/") + +Any component can create a drive object for ``lit://`` Drives. + +.. code-block:: python + + from lightning.app import LightningFlow, LightningWork + from lightning.app.storage import Drive + + + class Flow(LightningFlow): + def __init__(self): + super().__init__() + self.drive_1 = Drive("lit://drive_1") + + def run(self): + ... + + + class Work(LightningWork): + def __init__(self): + super().__init__() + self.drive_1 = Drive("lit://drive_1") + + def run(self): + ... + +---- + +***************************** +Supported actions with Drives +***************************** + +A Lightning-managed Drive supports put, list, get, and delete actions. + +An S3 Drive supports list and get actions (for now). + +.. code-block:: python + + from lightning.app.storage import Drive + + drive = Drive("lit://drive") + + drive.list(".") # Returns [] as empty + + # Created file. + with open("a.txt", "w") as f: + f.write("Hello World !") + + drive.put("a.txt") + + drive.list(".") # Returns ["a.txt"] as the file copied in the Drive during the put action. + + drive.get("a.txt") # Get the file into the current worker + + drive.delete("a.txt") + + drive.list(".") # Returns [] as empty + +---- + +********************************** +Component interactions with Drives +********************************** + +Here is an illustrated code example on how to create drives within Works. + +.. figure:: https://pl-public-data.s3.amazonaws.com/assets_lightning/drive_2.png + +.. 
code-block:: python + + from lightning.app import LightningFlow, LightningWork, LightningApp + from lightning.app.storage import Drive + + + class Work_A(LightningWork): + def __init__(self): + super().__init__() + # The identifier of the Drive is ``drive_1`` + # Note: You need to add Lightning protocol ``lit://`` as a prefix. + self.drive_1 = Drive("lit://drive_1") + + def run(self): + # 1. Create a file. + with open("a.txt", "w") as f: + f.write("Hello World !") + + # 2. Put the file into the drive. + self.drive_1.put("a.txt") + + + class Work_B(LightningWork): + def __init__(self): + super().__init__() + + # Note: Work B has access 2 drives. + + # The identifier of this Drive is ``drive_1`` + self.drive_1 = Drive("lit://drive_1") + # The identifier of this Drive is ``drive_2`` + self.drive_2 = Drive("lit://drive_2") + + def run(self): + # 1. Create a file. + with open("b.txt", "w") as f: + f.write("Hello World !") + + # 2. Put the file into both drives. + self.drive_1.put("b.txt") + self.drive_2.put("b.txt") + + + class Work_C(LightningWork): + def __init__(self): + super().__init__() + self.drive_2 = Drive("lit://drive_2") + + def run(self): + # 1. Create a file. + with open("c.txt", "w") as f: + f.write("Hello World !") + + # 2. Put the file into the drive. + self.drive_2.put("c.txt") + +---- + +************************* +Transfer files with Drive +************************* + +In the example below, the Drive is created by the Flow and passed to its Works. + +The ``Work_1`` put a file **a.txt** in the **Drive("lit://this_drive_id")** and the ``Work_2`` can list and get the **a.txt** file from it. + +.. literalinclude:: ../../../../examples/app/drive/app.py + +---- + +.. raw:: html + +
+
+ +.. displayitem:: + :header: Learn about the Path Object. + :description: Transfer Files From One Component to Another by Reference. + :col_css: col-md-4 + :button_link: path.html + :height: 180 + :tag: Intermediate + +.. raw:: html + +
+
diff --git a/docs/source-app/glossary/storage/drive_content_old.rst b/docs/source-app/glossary/storage/drive_content_old.rst new file mode 100644 index 0000000..3c37f88 --- /dev/null +++ b/docs/source-app/glossary/storage/drive_content_old.rst @@ -0,0 +1,199 @@ +:orphan: + + +************ +About Drives +************ + +Lightning Drive storage makes it easy to share files between LightningWorks so you can run your Lightning App both locally and in the cloud without changing the code. + +The Drive object provides a central place for your components to share data. + +The Drive acts as an isolate folder and any component can access it by knowing its name. + +Your components can put, list, get, and delete files from and to the Drive (except LightningFlows). + +---- + +*********************** +What Drive does for you +*********************** + +Think of every instance of the Drive object acting like a Google Drive or like Dropbox. + +By sharing the Drive between components through the LightningFlow, +several components can have a shared place to read and write files from. + +---- + +************** +Create a Drive +************** + +In order to create a Drive, you simply need to pass its name with the prefix ``lit://`` as follows: + +.. code-block:: python + + from lightning.app.storage import Drive + + # The identifier of this Drive is ``drive_1`` + # Note: You need to add Lightning protocol ``lit://`` as a prefix. + + drive_1 = Drive("lit://drive_1") + + # The identifier of this Drive is ``drive_2`` + drive_2 = Drive("lit://drive_2") + +Any components can create a drive object. + +.. code-block:: python + + from lightning.app import LightningFlow, LightningWork + from lightning.app.storage import Drive + + + class Flow(LightningFlow): + def __init__(self): + super().__init__() + self.drive_1 = Drive("lit://drive_1") + + def run(self): + ... 
+ + + class Work(LightningWork): + def __init__(self): + super().__init__() + self.drive_1 = Drive("lit://drive_1") + + def run(self): + ... + +---- + +***************************** +Supported actions with Drives +***************************** + +A Drive supports put, list, get, and delete actions. + +.. code-block:: python + + from lightning.app.storage import Drive + + drive = Drive("lit://drive") + + drive.list(".") # Returns [] as empty + + # Created file. + with open("a.txt", "w") as f: + f.write("Hello World !") + + drive.put("a.txt") + + drive.list(".") # Returns ["a.txt"] as the file copied in the Drive during the put action. + + drive.get("a.txt") # Get the file into the current worker + + drive.delete("a.txt") + + drive.list(".") # Returns [] as empty + +---- + +********************************** +Component interactions with Drives +********************************** + +Here is an illustrated code example on how to create drives within works. + +.. figure:: https://pl-public-data.s3.amazonaws.com/assets_lightning/drive_2.png + +.. code-block:: python + + from lightning.app import LightningFlow, LightningWork, LightningApp + from lightning.app.storage import Drive + + + class Work_A(LightningWork): + def __init__(self): + super().__init__() + # The identifier of the Drive is ``drive_1`` + # Note: You need to add Lightning protocol ``lit://`` as a prefix. + self.drive_1 = Drive("lit://drive_1") + + def run(self): + # 1. Create a file. + with open("a.txt", "w") as f: + f.write("Hello World !") + + # 2. Put the file into the drive. + self.drive_1.put("a.txt") + + + class Work_B(LightningWork): + def __init__(self): + super().__init__() + + # Note: Work B has access 2 drives. + + # The identifier of this Drive is ``drive_1`` + self.drive_1 = Drive("lit://drive_1") + # The identifier of this Drive is ``drive_2`` + self.drive_2 = Drive("lit://drive_2") + + def run(self): + # 1. Create a file. + with open("b.txt", "w") as f: + f.write("Hello World !") + + # 2. 
Put the file into both drives. + self.drive_1.put("b.txt") + self.drive_2.put("b.txt") + + + class Work_C(LightningWork): + def __init__(self): + super().__init__() + self.drive_2 = Drive("lit://drive_2") + + def run(self): + # 1. Create a file. + with open("c.txt", "w") as f: + f.write("Hello World !") + + # 2. Put the file into the drive. + self.drive_2.put("c.txt") + +---- + +***************************** +Transfer files with Drive +***************************** + +In the example below, the Drive is created by the flow and passed to its LightningWork's. + +The ``Work_1`` put a file **a.txt** in the **Drive("lit://this_drive_id")** and the ``Work_2`` can list and get the **a.txt** file from it. + +.. literalinclude:: ../../../../examples/app/drive/app.py + + +---- + +.. raw:: html + +
+
+ +.. displayitem:: + :header: Learn about the Path Object. + :description: Transfer Files From One Component to Another by Reference. + :col_css: col-md-4 + :button_link: path.html + :height: 180 + :tag: Intermediate + +.. raw:: html + +
+
diff --git a/docs/source-app/glossary/storage/path.rst b/docs/source-app/glossary/storage/path.rst new file mode 100644 index 0000000..3f4cba6 --- /dev/null +++ b/docs/source-app/glossary/storage/path.rst @@ -0,0 +1,326 @@ +:orphan: + +############ +Path Storage +############ + +**Audience:** Users who want to share files between components. + + +The Lightning Storage system makes it easy to share files between LightningWork so you can run your app both locally and in the cloud without changing the code. + +---- + +*********************** +What is a Path Object ? +*********************** + +The Path object is a reference to a specific file or directory from a LightningWork and can be used to transfer those files to another LightningWork (one way, from source to destination). + +A good mental representation of the Path Object usage is the `relay race `_. +To make a transfer, the receiver asks (e.g., when the path object is passed by the flow to the receiver) +for a copy of the files (baton) owned by their producer (e.g., the LightningWork which created the files). + +.. figure:: https://pl-public-data.s3.amazonaws.com/assets_lightning/path2.png + +******************************************* +How does the Path Object work internally ? +******************************************* + +To understand the Path Object internals, let's first answer this question: How do you locate a specific file or folder within a distributed system made of multiple machines ? + +You need to know on which machine the file or folder is located (e.g., the LightningWork name uniquely identifies its own machine in the cloud) and +then you need the local path of the file or folder on that machine. + +In simple words, the Lightning Path augments the :class:`pathlib.Path` object by tracking on which machine the file or folder is located. + +---- + +************************** +When to use Path storage ? 
+************************** + +In the cloud, every :class:`~lightning.app.core.work.LightningWork` runs on a separate machine with its own filesystem. +This means files in one Work cannot be directly accessed in another like you would be able to when running the app locally. +But with Lightning Storage, this is easy: Simply declare which files need to be shared and Lightning will take care of the rest. + +.. video:: https://pl-public-data.s3.amazonaws.com/assets_lightning/path.mp4 + :width: 600 + :autoplay: + :loop: + :muted: + + +---- + + +*********************************** +Tell Lightning where your files are +*********************************** + +Convert every filesystem path you want to share with other LightningWorks by adding ``lit://`` in front of it. + +.. code-block:: python + + from lightning.app import LightningWork + from lightning.app.storage import Path + + + class SourceWork(LightningWork): + def __init__(self): + super().__init__() + self.checkpoint_dir = None + + def run(self): + # Normally you would do: + # self.checkpoint_dir = "outputs/checkpoints" + # os.makedirs("outputs/checkpoints") + # ... + + # In Lightning, do: + self.checkpoint_dir = "lit://outputs/checkpoints" + os.makedirs(self.checkpoint_dir) + ... + + +Under the hood, we convert this string to a :class:`~lightning.app.storage.path.Path` object, which is a drop-in replacement for :class:`pathlib.Path`, meaning it will work with :mod:`os`, :mod:`os.path` and :mod:`pathlib` filesystem operations out of the box! + + +---- + + +**************************** +Access files in another Work +**************************** + +Accessing files from another LightningWork is as easy as handing the path over by reference. +For example, share a directory by passing it as an input to the run method of the destination work: + +.. 
code-block:: python + :emphasize-lines: 12 + + from lightning.app import LightningFlow + + + class Flow(LightningFlow): + def __init__(self): + super().__init__() + self.source = SourceWork() + self.destination = DestinationWork() + + def run(self): + self.source.run() + # Pass the Path reference from one work to another + self.destination.run(self.source.checkpoint_dir) + + +When the destination Work starts, Lightning will automatically transfer the files to its filesystem (if they exist on the other end): + +.. code-block:: python + + class DestinationWork(LightningWork): + def run(self, checkpoint_dir): + # The directory is now accessible inside this Work + files = os.listdir(checkpoint_dir) + ... + + +The automatic transfer only happens if the referenced files already exist in the originating LightningWork and it will overwrite any files that already exist locally. +In all other cases, you can trigger the transfer manually. + + +---- + + +****************** +Get files manually +****************** + +If you need to access files at a specific time or transfer them multiple times, use ``.get()`` method: + +.. code-block:: python + + def run(self, checkpoint_dir): + ... + # Make the directory available + checkpoint_dir.get() + + # If the path already exists locally, you can force overwriting it + checkpoint_dir.get(overwrite=True) + + files = os.listdir(checkpoint_dir) + ... + + +Multiple calls to the ``.get()`` method will always result in file transfers, regardless of whether the files have changed or not. +If the path does not exist remotely, it will raise a ``FileNotFoundError``. +If you need to handle this case, the Path also offers a method to check if files exist remotely. + +---- + + +******************************** +Check if a file or folder exists +******************************** + +You can check if a path exists locally or remotely in the source Work using the ``.exists_local()`` and ``.exists_remote()`` methods: + +.. 
code-block:: python + + def run(self, checkpoint_dir): + if checkpoint_dir.exists_remote(): + # Get the file only if it exists in the source Work + checkpoint_dir.get() + + # OR + + if checkpoint_dir.exists_local(): + # Do something with the file if it exists locally + files = os.listdir(checkpoint_dir) + + +---- + + +************* +Persist files +************* + +If a LightningWork finishes or stops due to an interruption (e.g., due to insufficient credits), the filesystem and all files in it get deleted (unless running locally). +Lightning makes sure all Paths that are part of the state get stored and made accessible to the other Works that still need these files. + +.. code-block:: python + + from lightning.app.storage import Path + + + class Work(LightningWork): + def __init__(self): + super().__init__() + # The files in this path will be saved as an artifact when the Work finishes + self.checkpoint_dir = "lit://outputs/checkpoints" + + # The files in this path WON'T be saved because it is not declared as a Lightning Path + self.log_dir = "outputs/logs" + + +---- + + +********************************* +Example: Share a model checkpoint +********************************* + +A common workflow in ML is to use a checkpoint created by another component. +First, define a component that saves a checkpoint: + +.. 
code:: python + :emphasize-lines: 14-18 + + from lightning.app import LightningFlow, LightningWork + from lightning.app.storage import Path + import torch + import os + + + class ModelTraining(LightningWork): + def __init__(self, *args, **kwargs): + super().__init__(*args, **kwargs) + self.checkpoint_dir = "lit://outputs/checkpoints" + + def run(self): + # create a directory + os.makedirs(self.checkpoint_dir, exist_ok=True) + # make fake checkpoints + checkpoint_1 = torch.tensor([0, 1, 2, 3, 4]) + checkpoint_2 = torch.tensor([0, 1, 2, 3, 4]) + torch.save(checkpoint_1, os.path.join(self.checkpoint_dir, "checkpoint_1.ckpt")) + torch.save(checkpoint_2, os.path.join(self.checkpoint_dir, "checkpoint_2.ckpt")) + + +Next, define a component that needs the checkpoints: + +.. code:: python + :emphasize-lines: 4, 7 + + class ModelDeploy(LightningWork): + def __init__(self, *args, **kwargs): + super().__init__() + + def run(self, checkpoint_dir): + ckpts = os.listdir(checkpoint_dir) + checkpoint_1 = torch.load(os.path.join(checkpoint_dir, ckpts[0])) + checkpoint_2 = torch.load(os.path.join(checkpoint_dir, ckpts[1])) + +Link both components via a parent component: + +.. code:: python + :emphasize-lines: 7 + + class Flow(LightningFlow): + def __init__(self): + super().__init__() + self.train = ModelTraining() + + # pass the checkpoint path + self.deploy = ModelDeploy() + + def run(self): + self.train.run() + self.deploy.run(checkpoint_dir=self.train.checkpoint_dir) + + + app = L.LightningApp(Flow()) + + +---- + +************************** +Frequently Asked Questions +************************** + +- **Q: Can files in a LightningWork be accessed inside the LightningFlow too?** + + No, LightningFlow is intentionally designed not to perform filesystem operations and computations and is intended to exclusively orchestrate Flow and Work. 
+ +- **Q: Is it possible to reference any file using the Lightning lit:// path notation?** + + Yes, but only files for which the app has write permissions can be copied from Work to Work (apps don't run with root privileges). + +- **Q: Can I access the Lightning Storage in my UI (StreamLit, Web, ...)?** + + This is currently not supported but will be in the future. + +- **Q: Should I define my lit:// path in the __init__ or the run method?** + + You can declare a Lightning path anywhere you'd like. However, the ``.get()`` and ``.exists_*()`` methods only work inside of the run method of a LightningWork. + +- **Q: How often does Lightning synchronize the files between my Works?** + + Lightning does not synchronize the files between works. It only transfers the files once when the Work ``run`` method starts. + But you can call ``Path.get()`` as many times as you wish to transfer the latest file into the current Work. + +- **Q: Does Lightning provide me direct access to the shared cloud folder?** + + No, and this is on purpose. This restriction forces developers to build modular components that can be shared and integrated + into apps easily. This would be much harder to achieve if file paths in these components referenced a global shared storage. + +---- + +.. raw:: html + +
+
+ +.. displayitem:: + :header: Learn about the Drive Object. + :description: Put, List and Get Files From a Shared Drive Disk. + :col_css: col-md-4 + :button_link: drive.html + :height: 180 + :tag: Basic + +.. raw:: html + +
+
diff --git a/docs/source-app/glossary/storage/storage.rst b/docs/source-app/glossary/storage/storage.rst new file mode 100644 index 0000000..af115a8 --- /dev/null +++ b/docs/source-app/glossary/storage/storage.rst @@ -0,0 +1,77 @@ +.. _storage: + +####### +Storage +####### + +**Audience:** Users who want to share files between components. + + +The Lightning Storage system makes it easy to share files between LightningWork so you can run your app both locally and in the cloud without changing the code. + + +Lightning storage provides two solutions :class:`~lightning.app.storage.drive.Drive` and :class:`~lightning.app.storage.path.Path` to deal with files locally and in the cloud likewise. + + +---- + +.. raw:: html + +
+
+ +.. displayitem:: + :header: Learn about the differences between Drive vs Path. + :description: Learn about their differences. + :col_css: col-md-4 + :button_link: differences.html + :height: 180 + :tag: Basic + +.. displayitem:: + :header: The Drive Object. + :description: Put, List and Get Files From a Shared Drive Disk. + :col_css: col-md-4 + :button_link: drive.html + :height: 180 + :tag: Basic + +.. displayitem:: + :header: The Path Object. + :description: Transfer Files From One Component to Another by Reference. + :col_css: col-md-4 + :button_link: path.html + :height: 180 + :tag: Intermediate + +.. raw:: html + +
+
+ + +---- + +******** +Examples +******** + + + +.. raw:: html + +
+
+ +.. displayitem:: + :header: Build a File Server + :description: Learn how to use Drive to upload / download files to your app. + :col_css: col-md-4 + :button_link: ../../examples/file_server/file_server.html + :height: 180 + :tag: Intermediate + +.. raw:: html + +
+
diff --git a/docs/source-app/glossary/use_local_lightning.rst b/docs/source-app/glossary/use_local_lightning.rst new file mode 100644 index 0000000..0987dd3 --- /dev/null +++ b/docs/source-app/glossary/use_local_lightning.rst @@ -0,0 +1,15 @@ +################################################################ +How to run an app on the cloud with a local version of lightning +################################################################ + +The lightning cloud uses the latest release by default. However, you might want to run your app with some local changes you've made to the lightning framework. To use your local version of lightning on the cloud, set the following environment variable: + +```bash +git clone https://github.com/Lightning-AI/lightning.git +cd lightning +pip install -e . +export PACKAGE_LIGHTNING=1 # <- this is the magic to use your version (not mainstream PyPI)! +lightning run app app.py --cloud +``` + +By setting `PACKAGE_LIGHTNING=1`, lightning packages the lightning source code in your local directory in addition to your app source code and uploads them to the cloud. diff --git a/docs/source-app/index.rst b/docs/source-app/index.rst new file mode 100644 index 0000000..8cebcd3 --- /dev/null +++ b/docs/source-app/index.rst @@ -0,0 +1,156 @@ +.. lightning documentation master file, created by + sphinx-quickstart on Sat Sep 19 16:37:02 2020. + You can adapt this file completely to your liking, but it should at least + contain the root `toctree` directive. + +####################### +Welcome to ⚡ Lightning +####################### +Build models, ML components and full stack AI apps ⚡ *Lightning fast*. + +**Featured examples of what you can do with Lightning:** + +| + +.. 
raw:: html + +
+
+ +.. app_card:: + :title: Develop and Train + :description: Train a model (32 GPUs) + :width: 280 + :image: https://lightning-ai-docs.s3.amazonaws.com/develop_n_train_v1.jpg + :target: levels/basic/real_lightning_component_implementations.html#ex-pytorch-lightning-trainer + :preview: levels/basic/real_lightning_component_implementations.html#ex-pytorch-lightning-trainer + :tags: Training + +.. app_card:: + :title: Serve and deploy + :description: Production diffusion server (<2s latency) + :width: 280 + :app_id: HvUwbEG90E + :image: https://lightning-ai-docs.s3.amazonaws.com/serve_n_deploy_v1.jpg + :deploy: https://lightning.ai + :target: https://01gbx4m78rbkpczdf5cpz2hpbh.litng-ai-03.litng.ai/root.api_component/ + :tags: Serving + +.. app_card:: + :title: Scale and build a product + :description: Production-ready generative AI app + :width: 280 + :app_id: HvUwbEG90E + :image: https://lightning-ai-docs.s3.amazonaws.com/scale_n_build_v1.jpg + :target: https://lightning.ai/muse + :tags: AI App + +.. raw:: html + +
+
+ +---- + +******************************** +Build self-contained components +******************************** +Use Lightning, the hyper-minimalistic framework, to build machine learning components that can plug into existing ML workflows. +A Lightning component organizes arbitrary code to run on the cloud, manage its own infrastructure, cloud costs, networking, and more. +Focus on component logic and not engineering. + +Use components on their own, or compose them into full-stack AI apps with our next-generation Lightning orchestrator. + +.. raw:: html + +
+ +
+ +| + +| + +**Run an example component on the cloud**: + +.. include:: ./levels/basic/hero_components.rst + +| + +Components run the same on the cloud and locally on your choice of hardware. + +.. lit_tabs:: + :code_files: landing_app_run.bash + :highlights: 5 + :height: 150px + :code_only: True + +Explore pre-built community components in `our gallery `_. + +| + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: Get started + :description: Learn to build Lightning components step-by-step. + :col_css: col-md-12 + :button_link: levels/basic/index.html + :height: 160 + :tag: 10 minutes + +.. raw:: html + +
+
+ +.. raw:: html + +
+ +.. toctree:: + :maxdepth: 1 + :caption: Home + + self + Install + +.. toctree:: + :maxdepth: 1 + :caption: Get started in steps + + Basic + Intermediate + Advanced + +.. toctree:: + :maxdepth: 1 + :caption: Core API Reference + + LightningApp + LightningFlow + LightningWork + +.. toctree:: + :maxdepth: 1 + :caption: Addons API Reference + + api_reference/components + api_reference/frontend + api_reference/runners + api_reference/storage + +.. toctree:: + :maxdepth: 1 + :caption: More + + Start from component templates + Start from app templates + Examples + Glossary + How-to diff --git a/docs/source-app/install/install_beginner.rst b/docs/source-app/install/install_beginner.rst new file mode 100644 index 0000000..f690ef7 --- /dev/null +++ b/docs/source-app/install/install_beginner.rst @@ -0,0 +1,117 @@ +:orphan: + +.. _install_beginner: + +############################# +What is a virtual environment +############################# +A virtual environment keeps the packages you install isolated from the rest of your system. +This allows you to work on multiple projects that have different and potentially conflicting requirements, and it +keeps your system Python installation clean. + +.. raw:: html + + + +---- + +We will describe two choices here, pick one: + + +1. :ref:`Python virtualenv `. +2. :ref:`Conda virtual environment `. + +---- + +.. _python-virtualenv: + +******************** +1. Python Virtualenv +******************** + +First, make sure that you have Python 3.8+ installed on your system. + +.. code-block:: bash + + python3 --version + +If you can't run the command above or it returns a version older than 3.8, +`install the latest version of Python `_. +After installing it, make sure you can run the above command without errors. + +---- + +Creating a Virtual Environment +^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + +When starting with a new Python project, you typically want to create a new Python virtual environment. 
+Navigate to the location of your project and run the following command: + +.. code-block:: bash + + python3 -m venv lightning + +The name of the environment here is *lightning* but you can choose any other name you like. +By running the above command, Python will create a new folder *lightning* in the current working directory. + +---- + +Activating the Virtual Environment +^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + +Before you can install packages into the environment, you need to activate it: + +.. code-block:: bash + + source lightning/bin/activate + +You need to do this step every time you want to work on your project / open the terminal. +With your virtual environment activated, you are now ready to +:doc:`install Lightning ` and get started with Apps! + +---- + +.. _conda: + +******** +2. Conda +******** + +To get started, you first need to download and install the `Miniconda package manager `_. +To check that the installation was successful, open a new terminal and run: + +.. code:: bash + + conda + +It should return a list of commands. + +---- + +Creating a Conda Environment +^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + +When starting with a new Python project, you typically want to create a new Conda virtual environment. +Navigate to the location of your project and run the following command: + +.. code-block:: bash + + conda create --yes --name lightning python=3.8 + +The name of the environment here is *lightning* but you can choose any other name you like. +Note how we can also specify the Python version here. + +---- + +Activating the Conda Environment +^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + +Before you can install packages into the environment, you need to activate it: + +.. code-block:: bash + + conda activate lightning + +You need to do this step every time you want to work on your project / open the terminal. +With your virtual environment activated, you are now ready to +:doc:`install Lightning ` and get started with Apps! 
diff --git a/docs/source-app/install/installation.rst b/docs/source-app/install/installation.rst new file mode 100644 index 0000000..294e268 --- /dev/null +++ b/docs/source-app/install/installation.rst @@ -0,0 +1,29 @@ + +.. _install: + + +############ +Installation +############ + +**Prerequisites**: Use Python 3.8.x or later (3.8.x, 3.9.x, 3.10.x). We also recommend you install in a virtual environment (learn how). + +.. lit_tabs:: + :descriptions: Pip; Macs, Apple Silicon (M1/M2/M3); Windows + :code_files: pip.bash; mac.bash; windows.bash + :tab_rows: 4 + :height: 180px + +---- + +************ +Troubleshoot +************ +If you encounter issues during installation join our community discord and share the output of the following command: + +.. code:: bash + + pip list | grep lightning + +.. join_slack:: + :align: left diff --git a/docs/source-app/install/mac.bash b/docs/source-app/install/mac.bash new file mode 100644 index 0000000..22825bb --- /dev/null +++ b/docs/source-app/install/mac.bash @@ -0,0 +1,5 @@ +# needed for M1/M2/M3 +export GRPC_PYTHON_BUILD_SYSTEM_OPENSSL=1 +export GRPC_PYTHON_BUILD_SYSTEM_ZLIB=1 + +pip install lightning diff --git a/docs/source-app/install/pip.bash b/docs/source-app/install/pip.bash new file mode 100644 index 0000000..f6d38b7 --- /dev/null +++ b/docs/source-app/install/pip.bash @@ -0,0 +1 @@ +pip install lightning diff --git a/docs/source-app/install/windows.bash b/docs/source-app/install/windows.bash new file mode 100644 index 0000000..150b04e --- /dev/null +++ b/docs/source-app/install/windows.bash @@ -0,0 +1,4 @@ +# install pip +# install git +# setup an alias for Python: python=python3 +# Add the root folder of Lightning to the Environment Variables to PATH diff --git a/docs/source-app/intro.rst b/docs/source-app/intro.rst new file mode 100644 index 0000000..c975ee7 --- /dev/null +++ b/docs/source-app/intro.rst @@ -0,0 +1,88 @@ +:orphan: + +.. _what: + +################### +What is Lightning? 
+################### + +Lightning is a free, modular, distributed, and open-source framework for building +AI applications where the components you want to use interact together. + +Lightning apps can be built for **any AI use case**, ranging from AI research to +production-ready pipelines (and everything in between!). + +By abstracting the engineering boilerplate, Lightning allows researchers, data scientists, and software engineers to +build highly-scalable, production-ready AI apps using the tools and technologies of their choice, +regardless of their level of engineering expertise. + +.. figure:: https://pl-public-data.s3.amazonaws.com/assets_lightning/Lightning.gif + :alt: What is Lightning gif. + :width: 100 % + +---- + +.. _why: + +*************** +Why Lightning? +*************** + + +Easy to learn +^^^^^^^^^^^^^ + +Lightning was built for creating AI apps, not for dev-ops. It offers an intuitive, pythonic +and highly composable interface that allows you to focus on solving the problems that are important to you. + +---- + +Quick to deliver +^^^^^^^^^^^^^^^^ + +Lightning speeds the development process by offering testable templates you can build from, +accelerating the process of moving from idea to prototype and finally to market. + +---- + +Easy to scale +^^^^^^^^^^^^^ + +Lightning provides a mirrored experience locally and in the cloud. The `lightning.ai `_. +cloud platform abstracts the infrastructure, so you can run your apps at any scale. + +---- + +Easy to collaborate +^^^^^^^^^^^^^^^^^^^ + +Lightning was built for collaboration. +By following the best MLOps practices provided through our documentation and example use cases, +you can deploy state-of-the-art ML applications that are ready to be used by teams of all sizes. + +---- + +***************************** +What's Novel With Lightning? 
+***************************** + + +Cloud Infra Made Simple and Pythonic +^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + +Lightning is for building reactive, scalable, cost effective, easy-to-maintain and reliable ML products in the cloud without worrying about infrastructure. Lightning provides several engineering novelties to enable this: + +#. **Reactivity**: Lightning allows you to run stateful components distributed across different machines, so you can design async, dynamic and reactive workflows in python, without having to define DAGs. + +#. **Scalable & Cost-Effective**: Lightning provides a granular and simple way to run components preemptively or on-demand and on any desired resource such as CPU or GPU. It also enables you to easily transfer artifacts from one machine to another. + +#. **Reliability**: + + #. **Checkpointing**: Lightning apps can be paused and resumed from generated state and artifact-based checkpoints. + #. **Resilience**: Lightning has a strong fault-tolerance foundation. Your application can be written and tested to be resilient for cloud hazards at the component level. + #. **Testing Tools**: Lightning provides you with tools and best practices you can use to develop and test your application. All of our built-in templates have unit integration and end-to-end tests. + +#. **Easy to maintain**: + + #. **Easy Debugging**: Lightning apps can be debugged locally and in the cloud with **breakpoints** in any components. + #. **Non-Invasive**: Lightning is the glue that connects all parts of your workflow, but this is done in a non-invasive way by formalizing API contracts between components. In other words, your application can run someone else's code with little assumption. 
diff --git a/docs/source-app/landing_app.py b/docs/source-app/landing_app.py new file mode 100644 index 0000000..d4f4ed8 --- /dev/null +++ b/docs/source-app/landing_app.py @@ -0,0 +1,12 @@ +# app.py +import lightning as L + + +class YourComponent(L.LightningWork): + def run(self): + print('RUN ANY PYTHON CODE HERE') + + +# run on a cloud machine ("cpu", "gpu", ...) +component = YourComponent(cloud_compute=L.CloudCompute("cpu")) +app = L.LightningApp(component) diff --git a/docs/source-app/landing_app_run.bash b/docs/source-app/landing_app_run.bash new file mode 100644 index 0000000..fd30621 --- /dev/null +++ b/docs/source-app/landing_app_run.bash @@ -0,0 +1,5 @@ +# install lightning +pip install lightning + +# run the app on the --cloud (--setup installs deps automatically) +lightning run app app.py --setup --cloud diff --git a/docs/source-app/levels/advanced/index.rst b/docs/source-app/levels/advanced/index.rst new file mode 100644 index 0000000..4ba7d09 --- /dev/null +++ b/docs/source-app/levels/advanced/index.rst @@ -0,0 +1,94 @@ +.. _advanced_level: + +.. toctree:: + :maxdepth: 1 + :hidden: + + start_dynamic_components + level_16 + level_17 + level_18 + level_19 + level_20 + +############### +Advanced skills +############### +Learn to build nested components with advanced functionality. + + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: Level 9: Start dynamic components + :description: Learn to start works dynamically + :button_link: start_dynamic_components.html + :col_css: col-md-6 + :height: 150 + :tag: intermediate + +.. displayitem:: + :header: Level 10: Check component status + :description: Learn to use work status to coordinate complex apps. + :button_link: level_16.html + :col_css: col-md-6 + :height: 150 + :tag: advanced + +.. displayitem:: + :header: Level: Nest flows + :description: Learn to nest flows into other flows. + :button_link: level_14.html + :col_css: col-md-6 + :height: 150 + :tag: intermediate + +.. displayitem:: + :header: Level: Develop reactive apps. + :description: Learn to develop reactive Lightning Apps. Lightning shines with reactive workflows. + :button_link: level_14.html + :col_css: col-md-6 + :height: 150 + :tag: intermediate + +.. displayitem:: + :header: Level: Enable CLI commands for your app + :description: Speak to your app from a CLI over the network + :button_link: level_17.html + :col_css: col-md-6 + :height: 150 + :tag: advanced + +.. displayitem:: + :header: Level 11: Connect two components over the network + :description: Connect two LightningWorks over the network. + :button_link: level_14.html + :col_css: col-md-6 + :height: 150 + :tag: intermediate + +.. displayitem:: + :header: Level 13: Rerun components + :description: Learn to reuse components by passing different variables. + :button_link: level_17.html + :col_css: col-md-6 + :height: 150 + :tag: advanced + +.. displayitem:: + :header: Level 14: Handle Lightning App exceptions + :description: Learn to handle Lightning App exceptions. + :button_link: level_19.html + :col_css: col-md-6 + :height: 150 + :tag: advanced + +.. raw:: html + +
+
diff --git a/docs/source-app/levels/advanced/level_16.rst b/docs/source-app/levels/advanced/level_16.rst new file mode 100644 index 0000000..58c1e1f --- /dev/null +++ b/docs/source-app/levels/advanced/level_16.rst @@ -0,0 +1,10 @@ +########################### +Level 16: Check Work status +########################### +**Audience:** Users who want to stop/start Lightning Work based on a status. + +**Prereqs:** Level 16+ + +---- + +.. include:: ../../core_api/lightning_work/status_content.rst diff --git a/docs/source-app/levels/advanced/level_17.rst b/docs/source-app/levels/advanced/level_17.rst new file mode 100644 index 0000000..7f0f505 --- /dev/null +++ b/docs/source-app/levels/advanced/level_17.rst @@ -0,0 +1,10 @@ +########################## +Level 17: Rerun components +########################## +**Audience:** Users who want Work.run() to activate multiple times in an app. + +**Prereqs:** Level 16+ and read the `Event Loop guide <../glossary/event_loop.html>`_. + +---- + +.. include:: ../../workflows/run_work_once_content.rst diff --git a/docs/source-app/levels/advanced/level_18.rst b/docs/source-app/levels/advanced/level_18.rst new file mode 100644 index 0000000..c934d2f --- /dev/null +++ b/docs/source-app/levels/advanced/level_18.rst @@ -0,0 +1,10 @@ +############################################## +Level 18: Share objects between LightningWorks +############################################## +**Audience:** Users moving DataFrames or outputs, between Lightning Works (usually data engineers). + +**Prereqs:** Level 16+ and know about the Pandas library and read the `Access app state guide <../../access_app_state.html>`_. + +---- + +.. 
include:: ../../core_api/lightning_work/payload_content.rst diff --git a/docs/source-app/levels/advanced/level_19.rst b/docs/source-app/levels/advanced/level_19.rst new file mode 100644 index 0000000..99a859e --- /dev/null +++ b/docs/source-app/levels/advanced/level_19.rst @@ -0,0 +1,11 @@ +######################################### +Level 19: Handle Lightning App exceptions +######################################### + +**Audience:** Users who want to make Lightning Apps more robust to potential issues. + +**Prereqs:** Level 16+ + +---- + +.. include:: ../../core_api/lightning_work/handling_app_exception_content.rst diff --git a/docs/source-app/levels/advanced/level_20.rst b/docs/source-app/levels/advanced/level_20.rst new file mode 100644 index 0000000..1d045e8 --- /dev/null +++ b/docs/source-app/levels/advanced/level_20.rst @@ -0,0 +1,11 @@ +####################################### +Level 20: Enable dynamic LightningWorks +####################################### + +**Audience:** Users who want to create/run/stop multiple LightningWorks not defined at app instantiation. + +**Prereqs:** Level 16+ + +---- + +.. include:: ../../core_api/lightning_app/dynamic_work_content.rst diff --git a/docs/source-app/levels/advanced/start_dynamic_components.rst b/docs/source-app/levels/advanced/start_dynamic_components.rst new file mode 100644 index 0000000..39bc153 --- /dev/null +++ b/docs/source-app/levels/advanced/start_dynamic_components.rst @@ -0,0 +1,38 @@ +############################### +Level: Start dynamic components +############################### +**Audience:** Users who want to run a Lightning Component in parallel (asynchronously). + +**Prereqs:** You must have finished the `Basic levels <../basic/>`_. + +---- + +.. 
include:: ../../workflows/run_work_in_parallel_content.rst + +---- + +********************************************** +Next steps: Share variables between components +********************************************** +Now that you know how to run components in parallel, we'll learn to share variables +across components to simplify complex workflows. + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: Level 6: Share variables between components + :description: Learn to connect components + :col_css: col-md-12 + :button_link: share_variables_between_lightning_components.html + :height: 150 + :tag: 10 minutes + +.. raw:: html + +
+
diff --git a/docs/source-app/levels/basic/build_a_dag.rst b/docs/source-app/levels/basic/build_a_dag.rst new file mode 100644 index 0000000..dec9d40 --- /dev/null +++ b/docs/source-app/levels/basic/build_a_dag.rst @@ -0,0 +1,21 @@ +:orphan: + +########################### +Example: Deploy a model API +########################### +**Audience:** TODO: + +**Prereqs:** You have an app already running locally. + +---- + +**************************** +What is the Lightning Cloud? +**************************** +The Lightning Cloud is the platform that we've created to interface with the cloud providers. Today +the Lightning Cloud supports AWS. + +.. note:: Support for GCP and Azure is coming soon! + +To use the Lightning Cloud, you buy credits that are used to pay the cloud providers. If you want to run +on your own AWS credentials, please contact us (support@lightning.ai) so we can get your clusters set up for you. diff --git a/docs/source-app/levels/basic/build_a_lightning_component.rst b/docs/source-app/levels/basic/build_a_lightning_component.rst new file mode 100644 index 0000000..5ff60ed --- /dev/null +++ b/docs/source-app/levels/basic/build_a_lightning_component.rst @@ -0,0 +1,161 @@ +############################################## +Level 1: Package code in a lightning component +############################################## + +**Prereqs:** You know *basic* Python. + +**Goal:** In this guide you'll learn to develop `a Lightning component `_. + + +********************************* +Why you need Lightning components +********************************* +A Lightning component is a self-contained, modular machine-learning component +that you can plug into your existing ML workflows. A Lightning component organizes arbitrary code so it can run on the cloud, manages +its own infrastructure, cloud costs, networking and more. Connect components using your current workflow management tools or +our `next-generation reactive orchestrator <../intermediate/index.html>`_. 
+ +Components run on the cloud or your laptop without code changes 🤯🤯. + +.. raw:: html + +
+ +
+ +| + +Organizing your code into Lightning components offers these benefits: + +.. collapse:: Build systems not scripts + + | + + The Lightning structure forces best practices so you don't have to be an expert production engineer. + Although it feels like you're writing a script, you are actually building a production-ready system. + +.. collapse:: Cost control + + | + + The component run-time has been optimized for cost management to support the largest machine-learning workloads. + Lower your cloud bill with machines that shut down or spin up faster. + +.. collapse:: For beginners: Code like an expert + + | + + Lightning embeds the best practices of building production-ready full stack AI apps into your + coding experience. You can write code like you normally do, and the Lightning structure + ensures your code is implicitly production ready... even if you're just doing research. + +.. collapse:: For experts: Scale with full control + + | + + If you know what you are doing, Lightning gives you full control to manage your own + scaling logic, fault-tolerance and even pre-provisioning, all from Python. We even give you + full flexibility to use tools like `terraform <../../cloud/customize_a_lightning_cluster.html>`_ to optimize cloud clusters for your Lightning apps. + +.. collapse:: Integrate into your current workflow tools + + | + + Lightning components are self-contained pieces of functionality. Add them to your current workflow + tools to quickly fill in gaps in your ML workflow such as monitoring drift, training LLMs and more. + You can (optionally) use the Lightning App to integrate components into a cohesive workflow. + +.. collapse:: Packaged code + + | + + Lightning apps bundle components into an app that runs in any environment. The same code will run on your laptop, + or any cloud or private clusters. You don't have to think about the cluster or know anything about the cloud. + +.. 
collapse:: Rapid iteration + + | + + Iterate through ideas in hours not months because you don't have to learn a million other concepts that the components + handle for you such as kubernetes, cost management, auto-scaling and more. + +.. collapse:: Modularity + + | + + Components are modular and inter-operable by design. Leverage our vibrant community of components so you don't + have to build each piece of the system yourself. + +---- + +***************** +Install Lightning +***************** +First, install Lightning. + +.. lit_tabs:: + :descriptions: Pip; Macs, Apple Silicon (M1/M2/M3); Windows + :code_files: /install/pip.bash; /install/mac.bash; /install/windows.bash + :tab_rows: 4 + :height: 180px + +---- + +************************** +Build your first component +************************** +A Lightning component organizes arbitrary code so it can run on the cloud, manages its own infrastructure, cloud costs, networking and more + +**Run one of these components!** + +.. include:: ./hero_components.rst + +| + +Components run the same on the cloud and locally on your choice of hardware. + +.. include:: /levels/basic/hero_run_setup.rst + +---- + +************ +Key features +************ +You now know enough to build a self-contained component that runs any Python code on the cloud that can be connected to form a +powerful Lightning app. Here are a few key features available to super-charge your work: + +.. 
lit_tabs:: + :titles: 15+ accelerators; Auto-stop idle machines; Auto-timeout submitted work; Use spot machines (~70% discount); Work with massive datasets; Mount cloud storage; Use a custom container + :code_files: ./key_features/accelerators.py; ./key_features/idle_machine.py; ./key_features/auto_timeout.py; ./key_features/spot.py; ./key_features/massive_dataset.py; ./key_features/mount_data.py; ./key_features/custom_container.py; + :highlights: 11;11;11;11;11;2,7,10, 11; 11 + :enable_run: true + :tab_rows: 3 + :height: 430px + +---- + +******************************************** +Next: Explore real component implementations +******************************************** +In this section we introduced components. Let's explore +real component implementations in-depth. + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: Level 2: Explore real component implementations + :description: Go deep into real component implementations. + :col_css: col-md-12 + :button_link: real_lightning_component_implementations.html + :height: 150 + :tag: beginner + +.. raw:: html + +
+
diff --git a/docs/source-app/levels/basic/create_a_model_demo.rst b/docs/source-app/levels/basic/create_a_model_demo.rst new file mode 100644 index 0000000..da6f28c --- /dev/null +++ b/docs/source-app/levels/basic/create_a_model_demo.rst @@ -0,0 +1,21 @@ +:orphan: + +############################ +Example: Create a model demo +############################ +**Audience:** TODO: + +**Prereqs:** You have an app already running locally. + +---- + +**************************** +What is the Lightning Cloud? +**************************** +The Lightning Cloud is the platform that we've created to interface with the cloud providers. Today +the Lightning Cloud supports AWS. + +.. note:: Support for GCP and Azure is coming soon! + +To use the Lightning Cloud, you buy credits that are used to pay the cloud providers. If you want to run +on your own AWS credentials, please contact us (support@lightning.ai) so we can get your clusters set up for you. diff --git a/docs/source-app/levels/basic/deploy_ai_model_api.rst b/docs/source-app/levels/basic/deploy_ai_model_api.rst new file mode 100644 index 0000000..dec9d40 --- /dev/null +++ b/docs/source-app/levels/basic/deploy_ai_model_api.rst @@ -0,0 +1,21 @@ +:orphan: + +########################### +Example: Deploy a model API +########################### +**Audience:** TODO: + +**Prereqs:** You have an app already running locally. + +---- + +**************************** +What is the Lightning Cloud? +**************************** +The Lightning Cloud is the platform that we've created to interface with the cloud providers. Today +the Lightning Cloud supports AWS. + +.. note:: Support for GCP and Azure is coming soon! + +To use the Lightning Cloud, you buy credits that are used to pay the cloud providers. If you want to run +on your own AWS credentials, please contact us (support@lightning.ai) so we can get your clusters set up for you. 
diff --git a/docs/source-app/levels/basic/hello_components/code_run_cloud.bash b/docs/source-app/levels/basic/hello_components/code_run_cloud.bash new file mode 100644 index 0000000..6594fe0 --- /dev/null +++ b/docs/source-app/levels/basic/hello_components/code_run_cloud.bash @@ -0,0 +1 @@ +lightning run app app.py --cloud diff --git a/docs/source-app/levels/basic/hello_components/code_run_cloud_setup.bash b/docs/source-app/levels/basic/hello_components/code_run_cloud_setup.bash new file mode 100644 index 0000000..ed69b30 --- /dev/null +++ b/docs/source-app/levels/basic/hello_components/code_run_cloud_setup.bash @@ -0,0 +1 @@ +lightning run app app.py --setup --cloud diff --git a/docs/source-app/levels/basic/hello_components/code_run_cloud_yours.bash b/docs/source-app/levels/basic/hello_components/code_run_cloud_yours.bash new file mode 100644 index 0000000..ff74f6c --- /dev/null +++ b/docs/source-app/levels/basic/hello_components/code_run_cloud_yours.bash @@ -0,0 +1,5 @@ +# first create a cluster (creation could take ~30 minutes) +lightning create cluster pikachu --provider aws --role-arn arn:aws:iam::1234567890:role/lai-byoc + +# run on that cluster +lightning run app app.py --cloud pikachu diff --git a/docs/source-app/levels/basic/hello_components/code_run_cloud_yours_setup.bash b/docs/source-app/levels/basic/hello_components/code_run_cloud_yours_setup.bash new file mode 100644 index 0000000..f2ff22d --- /dev/null +++ b/docs/source-app/levels/basic/hello_components/code_run_cloud_yours_setup.bash @@ -0,0 +1,5 @@ +# first create a cluster (creation could take ~30 minutes) +lightning create cluster pikachu --provider aws --role-arn arn:aws:iam::1234567890:role/lai-byoc + +# run on that cluster +lightning run app app.py --setup --cloud pikachu diff --git a/docs/source-app/levels/basic/hello_components/code_run_local.bash b/docs/source-app/levels/basic/hello_components/code_run_local.bash new file mode 100644 index 0000000..8a00b45 --- /dev/null +++ 
b/docs/source-app/levels/basic/hello_components/code_run_local.bash @@ -0,0 +1 @@ +lightning run app app.py diff --git a/docs/source-app/levels/basic/hello_components/code_run_local_setup.bash b/docs/source-app/levels/basic/hello_components/code_run_local_setup.bash new file mode 100644 index 0000000..11cc8a4 --- /dev/null +++ b/docs/source-app/levels/basic/hello_components/code_run_local_setup.bash @@ -0,0 +1 @@ +lightning run app app.py --setup diff --git a/docs/source-app/levels/basic/hello_components/deploy_model.py b/docs/source-app/levels/basic/hello_components/deploy_model.py new file mode 100644 index 0000000..9847db3 --- /dev/null +++ b/docs/source-app/levels/basic/hello_components/deploy_model.py @@ -0,0 +1,31 @@ +# !pip install torchvision +import lightning as L +from lightning.app.components.serve import PythonServer, Image, Number +import base64, io, torchvision, torch +from PIL import Image as PILImage + + +class PyTorchServer(PythonServer): + def setup(self): + self._model = torchvision.models.resnet18(pretrained=True) + self._device = torch.device("cuda:0" if torch.cuda.is_available() else "cpu") + self._model.to(self._device) + + def predict(self, request): + image = base64.b64decode(request.image.encode("utf-8")) + image = PILImage.open(io.BytesIO(image)) + transforms = torchvision.transforms.Compose([ + torchvision.transforms.Resize(224), + torchvision.transforms.ToTensor(), + torchvision.transforms.Normalize([0.485, 0.456, 0.406], [0.229, 0.224, 0.225]) + ]) + image = transforms(image) + image = image.to(self._device) + prediction = self._model(image.unsqueeze(0)) + return {"prediction": prediction.argmax().item()} + + +component = PyTorchServer( + input_type=Image, output_type=Number, cloud_compute=L.CloudCompute('gpu') +) +app = L.LightningApp(component) diff --git a/docs/source-app/levels/basic/hello_components/hello_world.py b/docs/source-app/levels/basic/hello_components/hello_world.py new file mode 100644 index 0000000..92b1063 --- 
/dev/null +++ b/docs/source-app/levels/basic/hello_components/hello_world.py @@ -0,0 +1,12 @@ +# app.py +import lightning as L + + +class YourComponent(L.LightningWork): + def run(self): + print('RUN ANY PYTHON CODE HERE') + + + +component = YourComponent() +app = L.LightningApp(component) diff --git a/docs/source-app/levels/basic/hello_components/hello_world_gpu.py b/docs/source-app/levels/basic/hello_components/hello_world_gpu.py new file mode 100644 index 0000000..aa316f9 --- /dev/null +++ b/docs/source-app/levels/basic/hello_components/hello_world_gpu.py @@ -0,0 +1,12 @@ +# app.py +import lightning as L + + +class YourComponent(L.LightningWork): + def run(self): + print('RUN ANY PYTHON CODE HERE') + +# run on a cloud machine ("cpu", "gpu", ...) +compute = L.CloudCompute("gpu") +component = YourComponent(cloud_compute=compute) +app = L.LightningApp(component) diff --git a/docs/source-app/levels/basic/hello_components/multi_node.py b/docs/source-app/levels/basic/hello_components/multi_node.py new file mode 100644 index 0000000..ad1bbb4 --- /dev/null +++ b/docs/source-app/levels/basic/hello_components/multi_node.py @@ -0,0 +1,29 @@ +# !pip install torch +import lightning as L +from lightning.app.components import MultiNode + + +class MultiNodeComponent(L.LightningWork): + def run( + self, + main_address: str, + main_port: int, + node_rank: int, + world_size: int, + ): + print(f"ADD YOUR DISTRIBUTED CODE: {main_address=} {main_port=} {node_rank=} {world_size=}") + print("supports ANY ML library") + + + + + + + + + + +# gpu-multi-fast has 4 GPUs x 8 nodes = 32 GPUs +component = MultiNodeComponent(cloud_compute=L.CloudCompute("gpu-multi-fast")) +component = MultiNode(component, nodes=8) +app = L.LightningApp(component) diff --git a/docs/source-app/levels/basic/hello_components/pl_multinode.py b/docs/source-app/levels/basic/hello_components/pl_multinode.py new file mode 100644 index 0000000..9df12ec --- /dev/null +++ 
b/docs/source-app/levels/basic/hello_components/pl_multinode.py @@ -0,0 +1,19 @@ +# app.py +import lightning as L +from lightning.app.components import LightningTrainerMultiNode +from lightning.pytorch.demos.boring_classes import BoringModel + + +class LightningTrainerDistributed(L.LightningWork): + def run(self): + model = BoringModel() + trainer = L.Trainer(max_epochs=10, strategy="ddp") + trainer.fit(model) + +# 16 GPUs: (4 nodes of 4 x v100) +component = LightningTrainerMultiNode( + LightningTrainerDistributed, + num_nodes=4, + cloud_compute=L.CloudCompute("gpu-fast-multi"), # 4 x v100 +) +app = L.LightningApp(component) diff --git a/docs/source-app/levels/basic/hello_components/pt_multinode.py b/docs/source-app/levels/basic/hello_components/pt_multinode.py new file mode 100644 index 0000000..8b39c74 --- /dev/null +++ b/docs/source-app/levels/basic/hello_components/pt_multinode.py @@ -0,0 +1,60 @@ +# app.py +# ! pip install torch +import lightning as L +from lightning.app.components import MultiNode +import torch +from torch.nn.parallel.distributed import DistributedDataParallel + + +def distributed_train(local_rank: int, main_address: str, main_port: int, num_nodes: int, node_rank: int, nprocs: int): + # 1. SET UP DISTRIBUTED ENVIRONMENT + global_rank = local_rank + node_rank * nprocs + world_size = num_nodes * nprocs + + if torch.distributed.is_available() and not torch.distributed.is_initialized(): + torch.distributed.init_process_group( + "nccl" if torch.cuda.is_available() else "gloo", + rank=global_rank, + world_size=world_size, + init_method=f"tcp://{main_address}:{main_port}", + ) + + # 2. PREPARE DISTRIBUTED MODEL + model = torch.nn.Linear(32, 2) + device = torch.device(f"cuda:{local_rank}") if torch.cuda.is_available() else torch.device("cpu") + model = DistributedDataParallel(model, device_ids=[local_rank] if torch.cuda.is_available() else None).to(device) + + # 3.
SETUP LOSS AND OPTIMIZER + criterion = torch.nn.MSELoss() + optimizer = torch.optim.SGD(model.parameters(), lr=0.01) + + # 4. TRAIN THE MODEL FOR 50 STEPS + for step in range(50): + model.zero_grad() + x = torch.randn(64, 32).to(device) + output = model(x) + loss = criterion(output, torch.ones_like(output)) + print(f"global_rank: {global_rank} step: {step} loss: {loss}") + loss.backward() + optimizer.step() + + # 5. VERIFY ALL COPIES OF THE MODEL HAVE THE SAME WEIGHTS AT END OF TRAINING + weight = model.module.weight.clone() + torch.distributed.all_reduce(weight) + assert torch.equal(model.module.weight, weight / world_size) + + print("Multi Node Distributed Training Done!") + +class PyTorchDistributed(L.LightningWork): + def run(self, main_address: str, main_port: int, num_nodes: int, node_rank: int): + nprocs = torch.cuda.device_count() if torch.cuda.is_available() else 1 + torch.multiprocessing.spawn( + distributed_train, + args=(main_address, main_port, num_nodes, node_rank, nprocs), + nprocs=nprocs + ) + +# 32 GPUs: (8 nodes x 4 V100) +compute = L.CloudCompute("gpu-fast-multi") # 4xV100 +component = MultiNode(PyTorchDistributed, num_nodes=8, cloud_compute=compute) +app = L.LightningApp(component) diff --git a/docs/source-app/levels/basic/hello_components/run_ptl_script.py b/docs/source-app/levels/basic/hello_components/run_ptl_script.py new file mode 100644 index 0000000..f1d3497 --- /dev/null +++ b/docs/source-app/levels/basic/hello_components/run_ptl_script.py @@ -0,0 +1,13 @@ +# app.py +# !curl https://raw.githubusercontent.com/Lightning-AI/lightning/master/examples/app/multi_node/pl_boring_script.py -o pl_boring_script.py +import lightning as L +from lightning.app.components.training import LightningTrainerScript + +# run script that trains PyTorch with the Lightning Trainer +model_script = 'pl_boring_script.py' +component = LightningTrainerScript( + model_script, + num_nodes=1, + cloud_compute=L.CloudCompute("gpu") +) +app = L.LightningApp(component) diff
--git a/docs/source-app/levels/basic/hello_components/streamlit_demo.py b/docs/source-app/levels/basic/hello_components/streamlit_demo.py new file mode 100644 index 0000000..d5fb3b0 --- /dev/null +++ b/docs/source-app/levels/basic/hello_components/streamlit_demo.py @@ -0,0 +1,30 @@ +# app.py +# !pip install streamlit omegaconf scipy +# !pip install torch +import lightning as L +import torch +from io import BytesIO +from functools import partial +from scipy.io.wavfile import write +import streamlit as st + + +class StreamlitApp(L.app.components.ServeStreamlit): + def build_model(self): + sample_rate = 48000 + model, _ = torch.hub.load('snakers4/silero-models', model='silero_tts',speaker="v3_en") + return partial(model.apply_tts, sample_rate=sample_rate, speaker="en_0"), sample_rate + + def render(self): + st.title("Text To Speech") + text = st.text_input("Text:", "Lightning Apps are the best!") + + if text: + model, sample_rate = self.model + audio_numpy = model(text).numpy() + audio = BytesIO() + write(audio, sample_rate, audio_numpy) + audio.seek(0) + st.audio(audio) + +app = L.LightningApp(StreamlitApp()) diff --git a/docs/source-app/levels/basic/hello_components/terraform_example.bash b/docs/source-app/levels/basic/hello_components/terraform_example.bash new file mode 100644 index 0000000..af88ef2 --- /dev/null +++ b/docs/source-app/levels/basic/hello_components/terraform_example.bash @@ -0,0 +1,4 @@ +# TODO: show how to use terraform to create a cluster called pikachu + +# run on that cluster +lightning run app app.py --cloud pikachu diff --git a/docs/source-app/levels/basic/hello_components/train_ptl.py b/docs/source-app/levels/basic/hello_components/train_ptl.py new file mode 100644 index 0000000..75c65ba --- /dev/null +++ b/docs/source-app/levels/basic/hello_components/train_ptl.py @@ -0,0 +1,15 @@ +# A hello world component +# app.py +import lightning as L + + +class YourComponent(L.LightningWork): + def run(self): + print('RUN ANY PYTHON CODE HERE') + + + +#
run on a cloud machine +compute = L.CloudCompute("cpu") +worker = YourComponent(cloud_compute=compute) +app = L.LightningApp(worker) diff --git a/docs/source-app/levels/basic/hello_components/train_pytorch.py b/docs/source-app/levels/basic/hello_components/train_pytorch.py new file mode 100644 index 0000000..7bfc3b5 --- /dev/null +++ b/docs/source-app/levels/basic/hello_components/train_pytorch.py @@ -0,0 +1,28 @@ +# app.py +# ! pip install torch +import lightning as L +import torch + +class PyTorchComponent(L.LightningWork): + def run(self): + device = torch.device("cuda:0" if torch.cuda.is_available() else "cpu") + model = torch.nn.Sequential(torch.nn.Linear(1, 1), + torch.nn.ReLU(), + torch.nn.Linear(1, 1)) + model.to(device) + criterion = torch.nn.MSELoss() + optimizer = torch.optim.SGD(model.parameters(), lr=0.1) + + for step in range(10000): + model.zero_grad() + x = torch.tensor([0.8]).to(device) + target = torch.tensor([1.0]).to(device) + output = model(x) + loss = criterion(output, target) + print(f'step: {step}. 
loss {loss}') + loss.backward() + optimizer.step() + +compute = L.CloudCompute('gpu') +componet = PyTorchComponent(cloud_compute=compute) +app = L.LightningApp(componet) diff --git a/docs/source-app/levels/basic/hello_components/xgboost.py b/docs/source-app/levels/basic/hello_components/xgboost.py new file mode 100644 index 0000000..fae593a --- /dev/null +++ b/docs/source-app/levels/basic/hello_components/xgboost.py @@ -0,0 +1,21 @@ +# app.py +# !pip install scikit-learn xgboost +import lightning as L +from sklearn import datasets +from sklearn.model_selection import train_test_split +from xgboost import XGBClassifier + +class XGBoostComponent(L.LightningWork): + def run(self): + iris = datasets.load_iris() + X, y = iris.data, iris.target + + X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2) + + bst = XGBClassifier(verbosity=3) + bst.fit(X_train, y_train) + preds = bst.predict(X_test) + print(f'preds: {preds}') + + +app = L.LightningApp(XGBoostComponent()) diff --git a/docs/source-app/levels/basic/hello_components/xgboost_gpu.py b/docs/source-app/levels/basic/hello_components/xgboost_gpu.py new file mode 100644 index 0000000..2b52716 --- /dev/null +++ b/docs/source-app/levels/basic/hello_components/xgboost_gpu.py @@ -0,0 +1,22 @@ +# app.py +# !pip install scikit-learn xgboost +# !conda install py-xgboost-gpu +import lightning as L +from sklearn import datasets +from sklearn.model_selection import train_test_split +from xgboost import XGBClassifier + +class XGBoostComponent(L.LightningWork): + def run(self): + iris = datasets.load_iris() + X, y = iris.data, iris.target + + X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2) + + bst = XGBClassifier(tree_method='gpu_hist', gpu_id=0, verbosity=3) + bst.fit(X_train, y_train) + preds = bst.predict(X_test) + print(f'preds: {preds}') + +compute = L.CloudCompute('gpu') +app = L.LightningApp(XGBoostComponent(cloud_compute=compute)) diff --git
a/docs/source-app/levels/basic/hero_components.rst b/docs/source-app/levels/basic/hero_components.rst new file mode 100644 index 0000000..da1d9d0 --- /dev/null +++ b/docs/source-app/levels/basic/hero_components.rst @@ -0,0 +1,8 @@ +.. lit_tabs:: + :titles: Hello world; Hello GPU world; PyTorch & ⚡⚡⚡ Trainer (1+ cloud GPUs); Train PyTorch (cloud GPU); Train PyTorch (32 cloud GPUs); Deploy a model on cloud GPUs; Run a model script; XGBoost; Streamlit demo + :code_files: /levels/basic/hello_components/hello_world.py; /levels/basic/hello_components/hello_world_gpu.py; /levels/basic/hello_components/pl_multinode.py; /levels/basic/hello_components/train_pytorch.py; /levels/basic/hello_components/pt_multinode.py; /levels/basic/hello_components/deploy_model.py; /levels/basic/hello_components/run_ptl_script.py; /levels/basic/hello_components/xgboost.py; /levels/basic/hello_components/streamlit_demo.py + :highlights: 7; 10, 11; 9-11, 16, 17; 4, 8, 12, 18-19, 26; 5, 10, 22, 27, 31, 41, 57-59; 3, 11-12, 25, 29; 7, 10; 15, 21; 9, 15, 24 + :works: 
[{"name":"root.work","spec":{"buildSpec":{"commands":[],"pythonDependencies":{"packageManager":"PACKAGE_MANAGER_PIP","packages":""}},"drives":[],"userRequestedComputeConfig":{"count":1,"diskSize":0,"name":"default","preemptible":false,"shmSize":0},"networkConfig":[{"name":"dzodf","port":61304}]}}];[{"name":"root.work","spec":{"buildSpec":{"commands":[],"pythonDependencies":{"packageManager":"PACKAGE_MANAGER_PIP","packages":""}},"drives":[],"networkConfig":[{"name":"qnlgd","port":61516}],"userRequestedComputeConfig":{"count":1,"diskSize":0,"name":"gpu","preemptible":false,"shmSize":0}}}];[{"name":"root.ws.0","spec":{"buildSpec":{"commands":[],"pythonDependencies":{"packageManager":"PACKAGE_MANAGER_PIP","packages":""}},"drives":[],"networkConfig":[{"name":"ajfrc","port":61553}],"userRequestedComputeConfig":{"count":1,"diskSize":0,"name":"gpu-fast-multi","preemptible":false,"shmSize":0}}},{"name":"root.ws.1","spec":{"buildSpec":{"commands":[],"pythonDependencies":{"packageManager":"PACKAGE_MANAGER_PIP","packages":""}},"drives":[],"networkConfig":[{"name":"ttyqc","port":61554}],"userRequestedComputeConfig":{"count":1,"diskSize":0,"name":"gpu-fast-multi","preemptible":false,"shmSize":0}}},{"name":"root.ws.2","spec":{"buildSpec":{"commands":[],"pythonDependencies":{"packageManager":"PACKAGE_MANAGER_PIP","packages":""}},"drives":[],"networkConfig":[{"name":"svyej","port":61555}],"userRequestedComputeConfig":{"count":1,"diskSize":0,"name":"gpu-fast-multi","preemptible":false,"shmSize":0}}},{"name":"root.ws.3","spec":{"buildSpec":{"commands":[],"pythonDependencies":{"packageManager":"PACKAGE_MANAGER_PIP","packages":""}},"drives":[],"networkConfig":[{"name":"parme","port":61556}],"userRequestedComputeConfig":{"count":1,"diskSize":0,"name":"gpu-fast-multi","preemptible":false,"shmSize":0}}}];[{"name":"root.work","spec":{"buildSpec":{"commands":[],"pythonDependencies":{"packageManager":"PACKAGE_MANAGER_PIP","packages":""}},"drives":[],"networkConfig":[{"name":"cutdu","port":615
84}],"userRequestedComputeConfig":{"count":1,"diskSize":0,"name":"gpu","preemptible":false,"shmSize":0}}}];[{"name":"root.ws.0","spec":{"buildSpec":{"commands":[],"pythonDependencies":{"packageManager":"PACKAGE_MANAGER_PIP","packages":""}},"drives":[],"networkConfig":[{"name":"whhby","port":61613}],"userRequestedComputeConfig":{"count":1,"diskSize":0,"name":"gpu-fast-multi","preemptible":false,"shmSize":0}}},{"name":"root.ws.1","spec":{"buildSpec":{"commands":[],"pythonDependencies":{"packageManager":"PACKAGE_MANAGER_PIP","packages":""}},"drives":[],"networkConfig":[{"name":"yhjtf","port":61614}],"userRequestedComputeConfig":{"count":1,"diskSize":0,"name":"gpu-fast-multi","preemptible":false,"shmSize":0}}},{"name":"root.ws.2","spec":{"buildSpec":{"commands":[],"pythonDependencies":{"packageManager":"PACKAGE_MANAGER_PIP","packages":""}},"drives":[],"networkConfig":[{"name":"rqwkt","port":61615}],"userRequestedComputeConfig":{"count":1,"diskSize":0,"name":"gpu-fast-multi","preemptible":false,"shmSize":0}}},{"name":"root.ws.3","spec":{"buildSpec":{"commands":[],"pythonDependencies":{"packageManager":"PACKAGE_MANAGER_PIP","packages":""}},"drives":[],"networkConfig":[{"name":"pjdsj","port":61616}],"userRequestedComputeConfig":{"count":1,"diskSize":0,"name":"gpu-fast-multi","preemptible":false,"shmSize":0}}},{"name":"root.ws.4","spec":{"buildSpec":{"commands":[],"pythonDependencies":{"packageManager":"PACKAGE_MANAGER_PIP","packages":""}},"drives":[],"networkConfig":[{"name":"efdor","port":61617}],"userRequestedComputeConfig":{"count":1,"diskSize":0,"name":"gpu-fast-multi","preemptible":false,"shmSize":0}}},{"name":"root.ws.5","spec":{"buildSpec":{"commands":[],"pythonDependencies":{"packageManager":"PACKAGE_MANAGER_PIP","packages":""}},"drives":[],"networkConfig":[{"name":"pxmso","port":61618}],"userRequestedComputeConfig":{"count":1,"diskSize":0,"name":"gpu-fast-multi","preemptible":false,"shmSize":0}}},{"name":"root.ws.6","spec":{"buildSpec":{"commands":[],"pythonDepend
encies":{"packageManager":"PACKAGE_MANAGER_PIP","packages":""}},"drives":[],"networkConfig":[{"name":"feevy","port":61619}],"userRequestedComputeConfig":{"count":1,"diskSize":0,"name":"gpu-fast-multi","preemptible":false,"shmSize":0}}},{"name":"root.ws.7","spec":{"buildSpec":{"commands":[],"pythonDependencies":{"packageManager":"PACKAGE_MANAGER_PIP","packages":""}},"drives":[],"networkConfig":[{"name":"tbmse","port":61620}],"userRequestedComputeConfig":{"count":1,"diskSize":0,"name":"gpu-fast-multi","preemptible":false,"shmSize":0}}}];[{"name":"root.work","spec":{"buildSpec":{"commands":[],"pythonDependencies":{"packageManager":"PACKAGE_MANAGER_PIP","packages":""}},"drives":[],"networkConfig":[{"name":"umqqg","port":7777}],"userRequestedComputeConfig":{"count":1,"diskSize":0,"name":"gpu","preemptible":false,"shmSize":0}}}];[];[{"name":"root.work","spec":{"buildSpec":{"commands":[],"pythonDependencies":{"packageManager":"PACKAGE_MANAGER_PIP","packages":""}},"drives":[],"networkConfig":[{"name":"tggba","port":61729}],"userRequestedComputeConfig":{"count":1,"diskSize":0,"name":"default","preemptible":false,"shmSize":0}}}];[{"name":"root.work","spec":{"buildSpec":{"commands":[],"pythonDependencies":{"packageManager":"PACKAGE_MANAGER_PIP","packages":""}},"drives":[],"networkConfig":[{"name":"hpyaz","port":61763}],"userRequestedComputeConfig":{"count":1,"diskSize":0,"name":"default","preemptible":false,"shmSize":0}}}] + :enable_run: true + :tab_rows: 3 + :height: 620px diff --git a/docs/source-app/levels/basic/hero_run.rst b/docs/source-app/levels/basic/hero_run.rst new file mode 100644 index 0000000..4fdabf1 --- /dev/null +++ b/docs/source-app/levels/basic/hero_run.rst @@ -0,0 +1,6 @@ +.. 
lit_tabs:: + :titles: Lightning Cloud (fully-managed); Your AWS account; Your own hardware + :code_files: /levels/basic/hello_components/code_run_cloud.bash; /levels/basic/hello_components/code_run_cloud_yours.bash; /levels/basic/hello_components/code_run_local.bash + :tab_rows: 4 + :highlights: ; 5; 0 + :height: 195px diff --git a/docs/source-app/levels/basic/hero_run_setup.rst b/docs/source-app/levels/basic/hero_run_setup.rst new file mode 100644 index 0000000..2200f17 --- /dev/null +++ b/docs/source-app/levels/basic/hero_run_setup.rst @@ -0,0 +1,6 @@ +.. lit_tabs:: + :titles: Lightning Cloud (fully-managed); Your AWS account; Your own hardware + :code_files: /levels/basic/hello_components/code_run_cloud_setup.bash; /levels/basic/hello_components/code_run_cloud_yours_setup.bash; /levels/basic/hello_components/code_run_local_setup.bash + :tab_rows: 4 + :highlights: ; 5; 0 + :height: 195px diff --git a/docs/source-app/levels/basic/index.rst b/docs/source-app/levels/basic/index.rst new file mode 100644 index 0000000..2912b69 --- /dev/null +++ b/docs/source-app/levels/basic/index.rst @@ -0,0 +1,54 @@ +.. _level_basic: + +.. toctree:: + :maxdepth: 1 + :hidden: + + build_a_lightning_component + real_lightning_component_implementations + save_money_on_cloud_costs + +############ +Basic skills +############ +Learn to package your code into Lightning components which can plug into your existing ML workflows. + +A Lightning component organizes arbitrary code so it can run on the cloud, manages +its own infrastructure, cloud costs, networking and more. + + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: Level 1: Package code in a Lightning component + :description: Learn to package your code into Lightning components which can plug into your existing ML workflows. + :button_link: build_a_lightning_component.html + :col_css: col-md-6 + :height: 170 + :tag: 10 minutes + +.. displayitem:: + :header: Level 2: Explore real component implementations + :description: Go deep into real component implementations. + :button_link: real_lightning_component_implementations.html + :col_css: col-md-6 + :height: 170 + :tag: 10 minutes + +.. displayitem:: + :header: Level 3: Save money on cloud costs + :description: Explore key Lightning features that save you cloud costs and improve performance. + :button_link: save_money_on_cloud_costs.html + :col_css: col-md-6 + :height: 150 + :tag: 10 minutes + +.. raw:: html + +
+
diff --git a/docs/source-app/levels/basic/key_features/accelerators.py b/docs/source-app/levels/basic/key_features/accelerators.py new file mode 100644 index 0000000..abfb4be --- /dev/null +++ b/docs/source-app/levels/basic/key_features/accelerators.py @@ -0,0 +1,21 @@ +# app.py +import lightning as L + + +class YourComponent(L.LightningWork): + def run(self): + print('RUN ANY PYTHON CODE HERE') + + +# custom accelerators +compute = L.CloudCompute('gpu') +component = YourComponent(cloud_compute=compute) +app = L.LightningApp(component) + +# OTHER ACCELERATORS: +# compute = L.CloudCompute('default') # 1 CPU +# compute = L.CloudCompute('cpu-medium') # 8 CPUs +# compute = L.CloudCompute('gpu') # 1 T4 GPU +# compute = L.CloudCompute('gpu-fast-multi') # 4 V100 GPU +# compute = L.CloudCompute('p4d.24xlarge') # AWS instance name (8 A100 GPU) +# compute = ... diff --git a/docs/source-app/levels/basic/key_features/auto_timeout.py b/docs/source-app/levels/basic/key_features/auto_timeout.py new file mode 100644 index 0000000..8d5e927 --- /dev/null +++ b/docs/source-app/levels/basic/key_features/auto_timeout.py @@ -0,0 +1,13 @@ +# app.py +import lightning as L + + +class YourComponent(L.LightningWork): + def run(self): + print('RUN ANY PYTHON CODE HERE') + + +# if the machine hasn't started after 60 seconds, cancel the work +compute = L.CloudCompute('gpu', wait_timeout=60) +component = YourComponent(cloud_compute=compute) +app = L.LightningApp(component) diff --git a/docs/source-app/levels/basic/key_features/custom_container.py b/docs/source-app/levels/basic/key_features/custom_container.py new file mode 100644 index 0000000..c1a5e61 --- /dev/null +++ b/docs/source-app/levels/basic/key_features/custom_container.py @@ -0,0 +1,13 @@ +# app.py +import lightning as L + + +class YourComponent(L.LightningWork): + def run(self): + print('RUN ANY PYTHON CODE HERE') + + +# custom image (from any provider) +config= L.BuildConfig(image="gcr.io/google-samples/hello-app:1.0") +component = 
YourComponent(cloud_build_config=config) +app = L.LightningApp(component) diff --git a/docs/source-app/levels/basic/key_features/idle_machine.py b/docs/source-app/levels/basic/key_features/idle_machine.py new file mode 100644 index 0000000..dc01572 --- /dev/null +++ b/docs/source-app/levels/basic/key_features/idle_machine.py @@ -0,0 +1,13 @@ +# app.py +import lightning as L + + +class YourComponent(L.LightningWork): + def run(self): + print('RUN ANY PYTHON CODE HERE') + + +# stop the machine when idle for 10 seconds +compute = L.CloudCompute('gpu', idle_timeout=10) +component = YourComponent(cloud_compute=compute) +app = L.LightningApp(component) diff --git a/docs/source-app/levels/basic/key_features/massive_dataset.py b/docs/source-app/levels/basic/key_features/massive_dataset.py new file mode 100644 index 0000000..e8673e3 --- /dev/null +++ b/docs/source-app/levels/basic/key_features/massive_dataset.py @@ -0,0 +1,13 @@ +# app.py +import lightning as L + + +class YourComponent(L.LightningWork): + def run(self): + print('RUN ANY PYTHON CODE HERE') + + +# use 100 GB of space on that machine (max size: 64 TB) +compute = L.CloudCompute('gpu', disk_size=100) +component = YourComponent(cloud_compute=compute) +app = L.LightningApp(component) diff --git a/docs/source-app/levels/basic/key_features/mount_data.py b/docs/source-app/levels/basic/key_features/mount_data.py new file mode 100644 index 0000000..1141983 --- /dev/null +++ b/docs/source-app/levels/basic/key_features/mount_data.py @@ -0,0 +1,13 @@ +import lightning as L +import os + + +class YourComponent(L.LightningWork): + def run(self): + os.listdir('/foo') + +# mount the files on the s3 bucket under this path +mount = L.Mount(source="s3://lightning-example-public/", mount_path="/foo") +compute = L.CloudCompute(mounts=mount) +component = YourComponent(cloud_compute=compute) +app = L.LightningApp(component) diff --git a/docs/source-app/levels/basic/key_features/spot.py 
b/docs/source-app/levels/basic/key_features/spot.py new file mode 100644 index 0000000..d3b0ac0 --- /dev/null +++ b/docs/source-app/levels/basic/key_features/spot.py @@ -0,0 +1,13 @@ +# app.py +import lightning as L + + +class YourComponent(L.LightningWork): + def run(self): + print('RUN ANY PYTHON CODE HERE') + +# spot machines can be turned off without notice, use for non-critical, resumable work +# request a spot machine, after 60 seconds of waiting switch to full-price +compute = L.CloudCompute('gpu', wait_timeout=60, spot=True) +component = YourComponent(cloud_compute=compute) +app = L.LightningApp(component) diff --git a/docs/source-app/levels/basic/real_lightning_component_implementations.rst b/docs/source-app/levels/basic/real_lightning_component_implementations.rst new file mode 100644 index 0000000..5e2fbc3 --- /dev/null +++ b/docs/source-app/levels/basic/real_lightning_component_implementations.rst @@ -0,0 +1,87 @@ +############################################### +Level 2: Explore real component implementations +############################################### +**Audience:** Users who want to deeply understand what is possible with Lightning components. + +**Prereqs:** You must have finished `level 1 <../basic/build_a_lightning_component.html>`_. + +---- + +*********************** +Real component examples +*********************** +Use this guide to understand what is happening in each type of component. +These are a few prototypical components. Since each component organizes +Python, you can build virtually infinite components for any use-case +you can think of. + +---- + +******************************* +Ex: PyTorch + Lightning Trainer +******************************* +This example shows how to train PyTorch with the Lightning trainer on your machine +or cloud GPUs without code changes. + +.. 
lit_tabs:: + :descriptions: Import Lightning; We're using a demo LightningModule; Move your training code here (usually your main.py); Pass your component to the multi-node executor (it works on CPU or single GPUs also); Select the number of machines (nodes). Here we choose 4.; Choose from 15+ machine types. This one has 4 v100 GPUs.; Initialize the App object that executes the component logic. + :code_files: /levels/basic/hello_components/pl_multinode.py; /levels/basic/hello_components/pl_multinode.py; /levels/basic/hello_components/pl_multinode.py; /levels/basic/hello_components/pl_multinode.py; /levels/basic/hello_components/pl_multinode.py; /levels/basic/hello_components/pl_multinode.py; /levels/basic/hello_components/pl_multinode.py; + :highlights: 2; 4; 9-11; 14-17; 16; 17; 19 + :enable_run: true + :tab_rows: 5 + :height: 420px + +| + +Run the component on the cloud: + +.. include:: /levels/basic/hero_run.rst + +---- + +********************************* +Ex: Deploy a PyTorch API endpoint +********************************* +This example shows how to deploy PyTorch and create an API endpoint. + +.. lit_tabs:: + :descriptions: Shortcut to list dependencies without a requirements.txt file.; Import one of our serving components (high-performance ones are available on the enterprise tiers); Define the setup function to load your favorite pretrained models and do any kind of pre-processing.; Define the predict function which is called when the endpoint is hit.; Initialize the server and define the type of cloud machine to use. + :code_files: /levels/basic/hello_components/deploy_model.py; /levels/basic/hello_components/deploy_model.py; /levels/basic/hello_components/deploy_model.py; /levels/basic/hello_components/deploy_model.py; /levels/basic/hello_components/deploy_model.py; + :highlights: 1; 3; 10-12; 15-25; 28-30 + :enable_run: true + :tab_rows: 4 + :height: 620px + +| + +Run the component on the cloud: + +..
include:: /levels/basic/hero_run.rst + +---- + +************************* +Next: Save on cloud costs +************************* +Let's review key lightning features to help you run components more efficiently on the cloud +so you can save on cloud costs. + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: Level 3: Save money on cloud costs + :description: Explore key Lightning features that save you cloud costs and improve performance. + :button_link: save_money_on_cloud_costs.html + :col_css: col-md-12 + :height: 150 + :tag: 10 minutes + +.. raw:: html + +
+
diff --git a/docs/source-app/levels/basic/run_jupyter_notebook_on_the_cloud.rst b/docs/source-app/levels/basic/run_jupyter_notebook_on_the_cloud.rst new file mode 100644 index 0000000..b39dfa1 --- /dev/null +++ b/docs/source-app/levels/basic/run_jupyter_notebook_on_the_cloud.rst @@ -0,0 +1,21 @@ +:orphan: + +############################################# +Example: Develop a Jupyter Notebook component +############################################# +**Audience:** TODO: + +**Prereqs:** You have an app already running locally. + +---- + +**************************** +What is the Lightning Cloud? +**************************** +The Lightning Cloud is the platform that we've created to interface with the cloud providers. Today +the Lightning Cloud supports AWS. + +.. note:: Support for GCP and Azure is coming soon! + +To use the Lightning Cloud, you buy credits that are used to pay the cloud providers. If you want to run +on your own AWS credentials, please contact us (support@lightning.ai) so we can get your clusters set up for you. diff --git a/docs/source-app/levels/basic/run_on_aws_account.rst b/docs/source-app/levels/basic/run_on_aws_account.rst new file mode 100644 index 0000000..ecf1542 --- /dev/null +++ b/docs/source-app/levels/basic/run_on_aws_account.rst @@ -0,0 +1,21 @@ +:orphan: + +To run on your own AWS account, first `create an AWS ARN <../../glossary/aws_arn.rst>`_. + +Next, set up a Lightning cluster (here we name it pikachu): + +.. code:: bash + + # TODO: need to remove --external-id dummy --region us-west-2 + lightning create cluster pikachu --provider aws --role-arn arn:aws:iam::1234567890:role/lai-byoc + +Run your code on the pikachu cluster by passing it into CloudCompute: + +.. code:: python + + compute = L.CloudCompute('gpu', clusters=['pikachu']) + app = L.LightningApp(LitWorker(cloud_compute=compute)) + +.. warning:: + + This feature is available only under early-access. Request access by emailing support@lightning.ai. 
diff --git a/docs/source-app/levels/basic/save_money_on_cloud_costs.rst b/docs/source-app/levels/basic/save_money_on_cloud_costs.rst new file mode 100644 index 0000000..5e75295 --- /dev/null +++ b/docs/source-app/levels/basic/save_money_on_cloud_costs.rst @@ -0,0 +1,56 @@ +################################## +Level 3: Save money on cloud costs +################################## +**Audience:** Users who want to use the AWS cloud efficiently. + +**Prereqs:** You must have finished `level 1 <../basic/build_a_lightning_component.html>`_. + +---- + +*********************************** +Save money with these optimizations +*********************************** +A Lightning component gives you fine-grained control over the cloud lifecycle of that component. + +Here are a few features that will enable you to save a lot on your cloud costs: + +.. lit_tabs:: + :titles: 15+ accelerators; Auto-stop idle machines; Auto-timeout submitted work; Use spot machines (~70% discount); Work with massive datasets; Mount cloud storage; Use a custom container + :code_files: ./key_features/accelerators.py; ./key_features/idle_machine.py; ./key_features/auto_timeout.py; ./key_features/spot.py; ./key_features/massive_dataset.py; ./key_features/mount_data.py; ./key_features/custom_container.py; + :highlights: 11;11;11;11;11;1,7, 10, 11; 11 + :enable_run: true + :tab_rows: 3 + :height: 430px + +---- + +.. include:: ../../cloud/customize_a_lightning_cluster.rst + + +---- + +****************************** +Next: Coordinate 2+ components +****************************** +Now that you know how to organize arbitrary code inside a Lightning component, +learn to coordinate 2 or more components into workflows which we call Lightning apps. + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: Intermediate skills + :description: Learn to coordinate 2+ components into workflows which we call Lightning apps. + :button_link: ../intermediate/index.html + :col_css: col-md-12 + :height: 170 + :tag: 15 minutes + +.. raw:: html + +
+
diff --git a/docs/source-app/levels/basic/scripts/toy_app_1_component.py b/docs/source-app/levels/basic/scripts/toy_app_1_component.py new file mode 100644 index 0000000..122f38c --- /dev/null +++ b/docs/source-app/levels/basic/scripts/toy_app_1_component.py @@ -0,0 +1,17 @@ +# app.py +import lightning as L + +class Component(L.LightningWork): + def run(self, x): + print(x) + + +class WorkflowOrchestrator(L.LightningFlow): + def __init__(self) -> None: + super().__init__() + self.component = Component() + + def run(self): + self.component.run('i love Lightning') + +app = L.LightningApp(WorkflowOrchestrator()) diff --git a/docs/source-app/levels/basic/scripts/toy_app_1_component_pdb.py b/docs/source-app/levels/basic/scripts/toy_app_1_component_pdb.py new file mode 100644 index 0000000..93fef4f --- /dev/null +++ b/docs/source-app/levels/basic/scripts/toy_app_1_component_pdb.py @@ -0,0 +1,17 @@ +# app.py +import lightning as L + +class Component(L.LightningWork): + def run(self, x): + print(x) + L.pdb.set_trace() + +class WorkflowOrchestrator(L.LightningFlow): + def __init__(self) -> None: + super().__init__() + self.component = Component() + + def run(self): + self.component.run('i love Lightning') + +app = L.LightningApp(WorkflowOrchestrator()) diff --git a/docs/source-app/levels/basic/train_pytorch_on_the_cloud.rst b/docs/source-app/levels/basic/train_pytorch_on_the_cloud.rst new file mode 100644 index 0000000..c3ef841 --- /dev/null +++ b/docs/source-app/levels/basic/train_pytorch_on_the_cloud.rst @@ -0,0 +1,21 @@ +:orphan: + +################################### +Example: Train PyTorch on the cloud +################################### +**Audience:** TODO: + +**Prereqs:** You have an app already running locally. + +---- + +**************************** +What is the Lightning Cloud? +**************************** +The Lightning Cloud is the platform that we've created to interface with the cloud providers. Today +the Lightning Cloud supports AWS. + +.. 
note:: Support for GCP and Azure is coming soon! + +To use the Lightning Cloud, you buy credits that are used to pay the cloud providers. If you want to run +on your own AWS credentials, please contact us (support@lightning.ai) so we can get your clusters set up for you. diff --git a/docs/source-app/levels/expert/index.rst b/docs/source-app/levels/expert/index.rst new file mode 100644 index 0000000..28cd56d --- /dev/null +++ b/docs/source-app/levels/expert/index.rst @@ -0,0 +1,90 @@ +:orphan: + +.. _expert_level: + +.. toctree:: + :maxdepth: 1 + :hidden: + +############# +Expert skills +############# + + +.. raw:: html + +
+
+ +.. displayitem:: + :header: Level : Use custom containers + :description: Learn to use a custom cloud container. + :button_link: build_a_machine_learning_workflow.html + :col_css: col-md-6 + :height: 150 + :tag: basic + +.. displayitem:: + :header: Level : Customize your cluster creation + :description: Learn to use a custom cloud container. + :button_link: build_a_machine_learning_workflow.html + :col_css: col-md-6 + :height: 150 + :tag: basic + + +.. raw:: html + +
+
+ +---- + +********************* +Intermediate Examples +********************* +As you work through the intermediate levels, try these examples: + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: Example: Develop a Github Repo Script Runner + :description: Develop a workflow to execute Github Repos + :button_link: ../../examples/github_repo_runner/github_repo_runner.html + :col_css: col-md-6 + :height: 150 + :tag: basic + +.. displayitem:: + :header: Example: Develop a file server + :description: Create a simple Lightning App (App) that allows users to upload files and list the uploaded files. + :button_link: ../../examples/file_server/file_server.html + :col_css: col-md-6 + :height: 150 + :tag: basic + +.. displayitem:: + :header: Example: Develop a Jupyter Notebook component + :description: Develop a LightningWork that runs a notebook on the cloud. + :button_link: run_jupyter_notebook_on_the_cloud.html + :col_css: col-md-6 + :height: 150 + :tag: basic + +.. displayitem:: + :header: Example: Create a model demo + :description: Demo POCs and MVPs which can be shared with a public web user interface. + :button_link: create_a_model_demo.html + :col_css: col-md-6 + :height: 150 + :tag: basic + +.. raw:: html + +
+
diff --git a/docs/source-app/levels/intermediate/connect_lightning_components.rst b/docs/source-app/levels/intermediate/connect_lightning_components.rst new file mode 100644 index 0000000..14c2e9d --- /dev/null +++ b/docs/source-app/levels/intermediate/connect_lightning_components.rst @@ -0,0 +1,116 @@ +#################################################### +Level 4: Connect components into a full stack AI app +#################################################### + +**Audience:** Users who want to build apps with multiple components. + +**Prereqs:** You know how to `build a component <../basic/build_a_lightning_component.html>`_. + +---- + +**************************** +What is a full stack AI app? +**************************** +In the ML world, workflows coordinate multiple pieces of code working together. In Lightning, +when we coordinate 2 or more `Lightning components <../basic/build_a_lightning_component.html>`_ working together, +we instead call it a Lightning App. The difference will become more obvious when we introduce reactive +workflows in the advanced section. + +For the time being, we'll go over how to coordinate 2 components together in a traditional workflow setting +and explain how it works. + +.. note:: If you've used workflow tools for Python, this page describes conventional DAGs. + In `level 6 <./run_lightning_work_in_parallel.html>`_, we introduce reactive workflows that generalize beyond DAGs + so you can build complex systems without much effort. + +---- + +*********** +The toy app +*********** + +In this app, we define two components that run across 2 separate machines. One to train a model on a GPU machine and one to analyze the model +on a separate CPU machine. We save money by stopping the GPU machine when the work is done. + +.. 
lit_tabs:: + :titles: Import Lightning; Define Component 1; Define Component 2; Orchestrator; Connect component 1; Connect component 2; Implement run; Train; Analyze; Define app placeholder + :descriptions: First, import Lightning; This component trains a model on a GPU machine; This component analyzes a model on a CPU machine; Define the LightningFlow that orchestrates components; Component 1 will run on a CPU machine; Component 2 will run on an accelerated GPU machine; Describe the workflow in the run method; Training runs first and completes; Analyze runs after training completes; This allows the app to be runnable + :code_files: ./level_2_scripts/hello_app.py; ./level_2_scripts/hello_app.py; ./level_2_scripts/hello_app.py; ./level_2_scripts/hello_app.py; ./level_2_scripts/hello_app.py; ./level_2_scripts/hello_app.py; ./level_2_scripts/hello_app.py; ./level_2_scripts/hello_app.py; ./level_2_scripts/hello_app.py; ./level_2_scripts/hello_app.py + :highlights: 2; 5-7; 9-11; 13; 16; 17; 19; 20; 21; 23 + :enable_run: true + :tab_rows: 4 + :height: 460px + +| + +Now run the app: + +.. lit_tabs:: + :titles: Run on Lightning cloud; Your own hardware + :descriptions: Run to see these 2 components execute on separate machines 🤯; Run it locally without code changes 🤯🤯; + :code_files: ./level_2_scripts/code_run_cloud.bash; ./level_2_scripts/code_run_local.bash + :tab_rows: 7 + :height: 195px + +| + +Now you can develop distributed cloud apps on your laptop 🤯🤯🤯🤯! + +---- + +************* +Now you know: +************* + +Without going out of your way, you're now doing the following: (Hint: Click **visualize** to see an animation describing the code). + +.. 
lit_tabs:: + :titles: Orchestration; Distributed cloud computing; Multi-machine communication; Multi-machine communication; Multi-cloud; + :descriptions: Define orchestration in Python with full control-flow; The two pieces of independent Python code ran on separate machines 🤯🤯; The text "CPU machine 1" was sent from the flow machine to the machine running the TrainComponent; The text "GPU machine 2" was sent from the flow machine to the machine running the AnalyzeComponent; The full Lightning app can move across clusters and clouds + :code_files: ./level_2_scripts/hello_app.py; ./level_2_scripts/hello_app.py; ./level_2_scripts/hello_app.py; ./level_2_scripts/hello_app.py; ./level_2_scripts/multi_cloud.bash + :tab_rows: 4 + :highlights: 19-21; 16-17; 20; 21; 2, 6, 10 + :images: | | | | + :height: 470px + +---- + +********************* +Maintain full control +********************* +Although we've abstracted the infrastructure, you still have full control when you need it: + +.. lit_tabs:: + :titles: Scheduler; Crontab syntax; Auto-scaling; Organized Python; Full terraform control; + :descriptions: Although you can use Python timers, we have a scheduler short-hand; You can also use full cron syntax; Code your own auto-scaling syntax (Lightning plays well with Kubernetes); *Remember* components organize ANY Python code which can even call external non-python scripts such as optimized C++ model servers ;Experts have the option to use terraform to configure Lightning clusters + :code_files: ./level_2_scripts/hello_app_scheduler.py; ./level_2_scripts/hello_app_cron.py; ./level_2_scripts/hello_app_auto_scale.py; ./level_2_scripts/organized_app_python.py; ./level_2_scripts/tr.bash + :tab_rows: 4 + :highlights: 24; 24; 21, 24, 27, 28; 9, 16, 17; 5 + :height: 700px + +---- + +************************* +Next: Review how to debug +************************* +The next level is a 2-minute review to make sure you know how to debug a Lightning app. + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: Level 5: Debug a Lightning App + :description: Learn to debug a lightning app. + :button_link: debug_a_lightning_app.html + :col_css: col-md-12 + :height: 170 + :tag: 10 minutes + +.. raw:: html + +
+
diff --git a/docs/source-app/levels/intermediate/debug_a_lightning_app.rst b/docs/source-app/levels/intermediate/debug_a_lightning_app.rst new file mode 100644 index 0000000..856be5a --- /dev/null +++ b/docs/source-app/levels/intermediate/debug_a_lightning_app.rst @@ -0,0 +1,48 @@ +############################## +Level 5: Debug A Lightning app +############################## +**Audience:** Users who want to debug a distributed app locally. + +**Prereqs:** You must have finished the `Basic levels <../basic/>`_. + +---- + +****************** +Enable breakpoints +****************** +To enable a breakpoint, use `L.pdb.set_trace()` (note direct python pdb support is work in progress and open to contributions). + +.. lit_tabs:: + :descriptions: Toy app; Add a breakpoint. When the program runs, it will stop at this line. + :code_files: ./debug_app_scripts/toy_app_1_component.py; ./debug_app_scripts/toy_app_1_component_pdb.py + :highlights: ; 7 + :enable_run: true + :tab_rows: 3 + :height: 350px + +---- + +********************************* +Next: Run a component in parallel +********************************* +Learn to run components in parallel to enable more powerful workflows. + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: Level 6: Run a Lightning component in parallel + :description: Learn when and how to run Components in parallel (asynchronous). + :button_link: run_lightning_work_in_parallel.html + :col_css: col-md-12 + :height: 150 + :tag: 15 minutes + +.. raw:: html + +
+
diff --git a/docs/source-app/levels/intermediate/debug_app_scripts/debug_app.py b/docs/source-app/levels/intermediate/debug_app_scripts/debug_app.py new file mode 100644 index 0000000..9e3d9c9 --- /dev/null +++ b/docs/source-app/levels/intermediate/debug_app_scripts/debug_app.py @@ -0,0 +1,25 @@ +# app.py +import lightning as L +from lightning.app.runners import MultiProcessRuntime + + +class TrainComponent(L.LightningWork): + def run(self, x): + print(f'train a model on {x}') + +class AnalyzeComponent(L.LightningWork): + def run(self, x): + print(f'analyze model on {x}') + +class WorkflowOrchestrator(L.LightningFlow): + def __init__(self) -> None: + super().__init__() + self.train = TrainComponent() + self.analyze = AnalyzeComponent() + + def run(self): + self.train.run("GPU machine 1") + self.analyze.run("CPU machine 2") + +app = L.LightningApp(WorkflowOrchestrator()) +MultiProcessRuntime(app).dispatch() diff --git a/docs/source-app/levels/intermediate/debug_app_scripts/toy_app.py b/docs/source-app/levels/intermediate/debug_app_scripts/toy_app.py new file mode 100644 index 0000000..44273e6 --- /dev/null +++ b/docs/source-app/levels/intermediate/debug_app_scripts/toy_app.py @@ -0,0 +1,24 @@ +# app.py +import lightning as L + + + +class TrainComponent(L.LightningWork): + def run(self, x): + print(f'train a model on {x}') + +class AnalyzeComponent(L.LightningWork): + def run(self, x): + print(f'analyze model on {x}') + +class WorkflowOrchestrator(L.LightningFlow): + def __init__(self) -> None: + super().__init__() + self.train = TrainComponent() + self.analyze = AnalyzeComponent() + + def run(self): + self.train.run("CPU machine 1") + self.analyze.run("CPU machine 2") + +app = L.LightningApp(WorkflowOrchestrator()) diff --git a/docs/source-app/levels/intermediate/debug_app_scripts/toy_app_1_component.py b/docs/source-app/levels/intermediate/debug_app_scripts/toy_app_1_component.py new file mode 100644 index 0000000..122f38c --- /dev/null +++ 
b/docs/source-app/levels/intermediate/debug_app_scripts/toy_app_1_component.py @@ -0,0 +1,17 @@ +# app.py +import lightning as L + +class Component(L.LightningWork): + def run(self, x): + print(x) + + +class WorkflowOrchestrator(L.LightningFlow): + def __init__(self) -> None: + super().__init__() + self.component = Component() + + def run(self): + self.component.run('i love Lightning') + +app = L.LightningApp(WorkflowOrchestrator()) diff --git a/docs/source-app/levels/intermediate/debug_app_scripts/toy_app_1_component_pdb.py b/docs/source-app/levels/intermediate/debug_app_scripts/toy_app_1_component_pdb.py new file mode 100644 index 0000000..93fef4f --- /dev/null +++ b/docs/source-app/levels/intermediate/debug_app_scripts/toy_app_1_component_pdb.py @@ -0,0 +1,17 @@ +# app.py +import lightning as L + +class Component(L.LightningWork): + def run(self, x): + print(x) + L.pdb.set_trace() + +class WorkflowOrchestrator(L.LightningFlow): + def __init__(self) -> None: + super().__init__() + self.component = Component() + + def run(self): + self.component.run('i love Lightning') + +app = L.LightningApp(WorkflowOrchestrator()) diff --git a/docs/source-app/levels/intermediate/embed_web_ui_into_lightningwork.rst b/docs/source-app/levels/intermediate/embed_web_ui_into_lightningwork.rst new file mode 100644 index 0000000..3be6a9e --- /dev/null +++ b/docs/source-app/levels/intermediate/embed_web_ui_into_lightningwork.rst @@ -0,0 +1,40 @@ +###################################### +Level 9: Embed graphical UIs into work +###################################### +**Audience:** Users who need to embed a Graphical UI in their Lightning Apps. + +**Prereqs:** You have finished `Level 8 `_. + +---- + +.. 
include:: ../../workflows/add_web_ui/index_content.rst + +---- + +******************************************* +Next steps: Practice adapting app templates +******************************************* +One of the most exciting powers of Lightning is the ability +to start an app from a template, replace or add components +and build a powerful system. + +---- + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: Level 10: Practice adapting app templates + :description: Practice starting apps from templates and evolving them by replacing or adding components. + :button_link: start_from_lightning_app_templates.html + :col_css: col-md-12 + :height: 150 + +.. raw:: html + +
+
diff --git a/docs/source-app/levels/intermediate/index.rst b/docs/source-app/levels/intermediate/index.rst new file mode 100644 index 0000000..ed5c391 --- /dev/null +++ b/docs/source-app/levels/intermediate/index.rst @@ -0,0 +1,87 @@ +.. _intermediate_level: + +.. toctree:: + :maxdepth: 1 + :hidden: + + connect_lightning_components + debug_a_lightning_app + run_lightning_work_in_parallel + share_variables_between_lightning_components + share_files_between_components + embed_web_ui_into_lightningwork + start_from_lightning_app_templates + +################### +Intermediate skills +################### +Learn to coordinate 2+ components into workflows which we call Lightning apps. + + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: Level 4: Coordinate 2+ components in a workflow + :description: Learn to coordinate 2+ components in a workflow which we call a Lightning app. + :button_link: connect_lightning_components.html + :col_css: col-md-6 + :height: 170 + :tag: 15 minutes + +.. displayitem:: + :header: Level 5: Debug a Lightning App + :description: Learn to debug a lightning app. + :button_link: debug_a_lightning_app.html + :col_css: col-md-6 + :height: 170 + :tag: 2 minutes + +.. displayitem:: + :header: Level 6: Run a Lightning component in parallel + :description: Learn when and how to run Components in parallel (asynchronous). + :button_link: run_lightning_work_in_parallel.html + :col_css: col-md-6 + :height: 150 + :tag: 10 minutes + +.. displayitem:: + :header: Level 7: Share variables between components + :description: Share variables between Lightning components. + :button_link: share_variables_between_lightning_components.html + :col_css: col-md-6 + :height: 150 + :tag: 15 minutes + +.. displayitem:: + :header: Level 8: Share files between components + :description: Learn how Drives share files between components + :button_link: share_files_between_components.html + :col_css: col-md-6 + :height: 150 + :tag: 20 minutes + +.. displayitem:: + :header: Level 9: Render a web UI with other components + :description: Learn how to embed graphical UIs like react, vue, streamlit and notebook UIs into a lightning workflow. + :button_link: embed_web_ui_into_lightningwork.html + :col_css: col-md-6 + :height: 150 + :tag: 15 minutes + +.. displayitem:: + :header: Level 10: Practice adapting app templates + :description: Practice starting apps from templates and evolving them by replacing or adding components. + :button_link: start_from_lightning_app_templates.html + :col_css: col-md-6 + :height: 150 + :tag: intermediate + +.. raw:: html + +
+
diff --git a/docs/source-app/levels/intermediate/level_12.rst b/docs/source-app/levels/intermediate/level_12.rst new file mode 100644 index 0000000..60c2390 --- /dev/null +++ b/docs/source-app/levels/intermediate/level_12.rst @@ -0,0 +1,12 @@ +:orphan: + +###################### +Level 12: Flow vs Work +###################### +**Audience:** Users who need to do non trivial workloads in their apps. + +**Prereqs:** Level 8+ + +---- + +.. include:: ../../workflows/build_lightning_component/from_scratch_component_content.rst diff --git a/docs/source-app/levels/intermediate/level_2_scripts/code_run_cloud.bash b/docs/source-app/levels/intermediate/level_2_scripts/code_run_cloud.bash new file mode 100644 index 0000000..6594fe0 --- /dev/null +++ b/docs/source-app/levels/intermediate/level_2_scripts/code_run_cloud.bash @@ -0,0 +1 @@ +lightning run app app.py --cloud diff --git a/docs/source-app/levels/intermediate/level_2_scripts/code_run_local.bash b/docs/source-app/levels/intermediate/level_2_scripts/code_run_local.bash new file mode 100644 index 0000000..8a00b45 --- /dev/null +++ b/docs/source-app/levels/intermediate/level_2_scripts/code_run_local.bash @@ -0,0 +1 @@ +lightning run app app.py diff --git a/docs/source-app/levels/intermediate/level_2_scripts/hello_app.py b/docs/source-app/levels/intermediate/level_2_scripts/hello_app.py new file mode 100644 index 0000000..d6ce3ea --- /dev/null +++ b/docs/source-app/levels/intermediate/level_2_scripts/hello_app.py @@ -0,0 +1,23 @@ +# app.py +import lightning as L + + +class TrainComponent(L.LightningWork): + def run(self, x): + print(f'train a model on {x}') + +class AnalyzeComponent(L.LightningWork): + def run(self, x): + print(f'analyze model on {x}') + +class WorkflowOrchestrator(L.LightningFlow): + def __init__(self) -> None: + super().__init__() + self.train = TrainComponent(cloud_compute=L.CloudCompute('cpu')) + self.analyze = AnalyzeComponent(cloud_compute=L.CloudCompute('gpu')) + + def run(self): + self.train.run("CPU 
machine 1") + self.analyze.run("GPU machine 2") + +app = L.LightningApp(WorkflowOrchestrator()) diff --git a/docs/source-app/levels/intermediate/level_2_scripts/hello_app_auto_scale.py b/docs/source-app/levels/intermediate/level_2_scripts/hello_app_auto_scale.py new file mode 100644 index 0000000..b26d49c --- /dev/null +++ b/docs/source-app/levels/intermediate/level_2_scripts/hello_app_auto_scale.py @@ -0,0 +1,30 @@ +# app.py +import lightning as L + + +class TrainComponent(L.LightningWork): + def run(self, x): + print(f'train a model on {x}') + +class AnalyzeComponent(L.LightningWork): + def run(self, x): + print(f'analyze model on {x}') + +class WorkflowOrchestrator(L.LightningFlow): + def __init__(self) -> None: + super().__init__() + self.train = TrainComponent(cloud_compute=L.CloudCompute('cpu')) + self.analyze = AnalyzeComponent(cloud_compute=L.CloudCompute('gpu')) + + def run(self): + # run() starts the machine + self.train.run("GPU machine 1") + + # stop() stops the machine + self.train.stop() + + # run analysis ONLY when machine 1 stopped + if self.train.status.STOPPED: + self.analyze.run("CPU machine 2") + +app = L.LightningApp(WorkflowOrchestrator()) diff --git a/docs/source-app/levels/intermediate/level_2_scripts/hello_app_cron.py b/docs/source-app/levels/intermediate/level_2_scripts/hello_app_cron.py new file mode 100644 index 0000000..a7a3ee6 --- /dev/null +++ b/docs/source-app/levels/intermediate/level_2_scripts/hello_app_cron.py @@ -0,0 +1,27 @@ +# app.py +import lightning as L + + +class TrainComponent(L.LightningWork): + def run(self, x): + print(f'train a model on {x}') + +class AnalyzeComponent(L.LightningWork): + def run(self, x): + print(f'analyze model on {x}') + +class WorkflowOrchestrator(L.LightningFlow): + def __init__(self) -> None: + super().__init__() + self.train = TrainComponent(cloud_compute=L.CloudCompute('cpu')) + self.analyze = AnalyzeComponent(cloud_compute=L.CloudCompute('gpu')) + + def run(self): + # run training once + 
self.train.run("GPU machine 1") + + # run analysis once, then every day at 04:05 again... + if self.schedule("5 4 * * *"): + self.analyze.run("CPU machine 2") + +app = L.LightningApp(WorkflowOrchestrator()) diff --git a/docs/source-app/levels/intermediate/level_2_scripts/hello_app_scheduler.py b/docs/source-app/levels/intermediate/level_2_scripts/hello_app_scheduler.py new file mode 100644 index 0000000..1e655c2 --- /dev/null +++ b/docs/source-app/levels/intermediate/level_2_scripts/hello_app_scheduler.py @@ -0,0 +1,27 @@ +# app.py +import lightning as L + + +class TrainComponent(L.LightningWork): + def run(self, x): + print(f'train a model on {x}') + +class AnalyzeComponent(L.LightningWork): + def run(self, x): + print(f'analyze model on {x}') + +class WorkflowOrchestrator(L.LightningFlow): + def __init__(self) -> None: + super().__init__() + self.train = TrainComponent(cloud_compute=L.CloudCompute('cpu')) + self.analyze = AnalyzeComponent(cloud_compute=L.CloudCompute('gpu')) + + def run(self): + # run training once + self.train.run("GPU machine 1") + + # run analysis once, then every hour again...
+ if self.schedule("hourly"): + self.analyze.run("CPU machine 2") + +app = L.LightningApp(WorkflowOrchestrator()) diff --git a/docs/source-app/levels/intermediate/level_2_scripts/multi_cloud.bash b/docs/source-app/levels/intermediate/level_2_scripts/multi_cloud.bash new file mode 100644 index 0000000..840208d --- /dev/null +++ b/docs/source-app/levels/intermediate/level_2_scripts/multi_cloud.bash @@ -0,0 +1,10 @@ +# run on lightning cloud (fully managed) +lightning run app app.py --cloud + +# run on a cluster you created called pikachu +lightning create cluster pikachu --provider aws --role-arn arn:aws:iam::1234567890:role/lai-byoc +lightning run app app.py --cloud pikachu + +# run on a cluster you created called bolt +lightning create cluster bolt --provider aws --role-arn arn:aws:iam::1234567890:role/lai-byoc +lightning run app app.py --cloud bolt diff --git a/docs/source-app/levels/intermediate/level_2_scripts/organized_app_python.py b/docs/source-app/levels/intermediate/level_2_scripts/organized_app_python.py new file mode 100644 index 0000000..8b174ad --- /dev/null +++ b/docs/source-app/levels/intermediate/level_2_scripts/organized_app_python.py @@ -0,0 +1,36 @@ +# app.py +import subprocess +import lightning as L + + +class ExternalModelServer(L.LightningWork): + def run(self, x): + # compile + process = subprocess.Popen('g++ model_server.cpp -o model_server') + process.wait() + process = subprocess.Popen('./model_server') + process.wait() + +class LocustLoadTester(L.LightningWork): + def run(self, x): + cmd = f'locust --master-host {self.host} --master-port {self.port}' + process = subprocess.Popen(cmd) + process.wait() + +class WorkflowOrchestrator(L.LightningFlow): + def __init__(self) -> None: + super().__init__() + self.serve = ExternalModelServer( + cloud_compute=L.CloudCompute('cpu'), parallel=True + ) + self.load_test = LocustLoadTester(cloud_compute=L.CloudCompute('cpu')) + + def run(self): + # start the server (on a CPU machine 1) + self.serve.run() 
+ + # load testing when the server is up (on a separate cpu machine 2) + if self.serve.state.RUNNING: + self.load_test.run() + +app = L.LightningApp(WorkflowOrchestrator()) diff --git a/docs/source-app/levels/intermediate/level_2_scripts/tr.bash b/docs/source-app/levels/intermediate/level_2_scripts/tr.bash new file mode 100644 index 0000000..30c8d19 --- /dev/null +++ b/docs/source-app/levels/intermediate/level_2_scripts/tr.bash @@ -0,0 +1,5 @@ +# custom control for optimized clusters with tools like terraform +# are only supported on the enterprise tier (support@lightning.ai) + +# once the cluster is created you can run any app on it +lightning run app app.py --cloud my-custom-optimized-cluster diff --git a/docs/source-app/levels/intermediate/level_9.rst b/docs/source-app/levels/intermediate/level_9.rst new file mode 100644 index 0000000..344c321 --- /dev/null +++ b/docs/source-app/levels/intermediate/level_9.rst @@ -0,0 +1,16 @@ +:orphan: + +################### +Level 9: Event loop +################### +**Audience:** Users who want to build reactive Lightning Apps and move beyond DAGs. + +**Prereqs:** Level 8+ + +---- + +Drawing inspiration from modern web frameworks like `React.js `_, the Lightning App runs all flows in an **event loop** (forever), which is triggered several times a second after collecting any works' state change. + +.. figure:: https://pl-public-data.s3.amazonaws.com/assets_lightning/lightning_loop.gif + +When running a Lightning App in the cloud, the ``LightningWork`` run on different machines. LightningWork communicates any state changes to the **event loop** which re-executes the flow with the newly-collected works' state. 
diff --git a/docs/source-app/levels/intermediate/run_lightning_work_in_parallel.rst b/docs/source-app/levels/intermediate/run_lightning_work_in_parallel.rst new file mode 100644 index 0000000..b74fdac --- /dev/null +++ b/docs/source-app/levels/intermediate/run_lightning_work_in_parallel.rst @@ -0,0 +1,38 @@ +############################################## +Level 6: Run a Lightning component in parallel +############################################## +**Audience:** Users who want to run a Lightning Component in parallel (asynchronously). + +**Prereqs:** You must have finished `Level 5 <debug_a_lightning_app.html>`_. + +---- + +.. include:: ../../workflows/run_work_in_parallel_content.rst + +---- + +********************************************** +Next steps: Share variables between components +********************************************** +Now that you know how to run components in parallel, we'll learn to share variables +across components to simplify complex workflows. + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: Level 7: Share variables between components + :description: Learn to connect components + :col_css: col-md-12 + :button_link: share_variables_between_lightning_components.html + :height: 150 + :tag: 10 minutes + +.. raw:: html + +
+
diff --git a/docs/source-app/levels/intermediate/scripts/.storage/a b/docs/source-app/levels/intermediate/scripts/.storage/a new file mode 100644 index 0000000..1c6c4cc Binary files /dev/null and b/docs/source-app/levels/intermediate/scripts/.storage/a differ diff --git a/docs/source-app/levels/intermediate/scripts/.storage/embeddings b/docs/source-app/levels/intermediate/scripts/.storage/embeddings new file mode 100644 index 0000000..af3ee63 Binary files /dev/null and b/docs/source-app/levels/intermediate/scripts/.storage/embeddings differ diff --git a/docs/source-app/levels/intermediate/scripts/a b/docs/source-app/levels/intermediate/scripts/a new file mode 100644 index 0000000..1c6c4cc Binary files /dev/null and b/docs/source-app/levels/intermediate/scripts/a differ diff --git a/docs/source-app/levels/intermediate/scripts/comms_1.py b/docs/source-app/levels/intermediate/scripts/comms_1.py new file mode 100644 index 0000000..0411820 --- /dev/null +++ b/docs/source-app/levels/intermediate/scripts/comms_1.py @@ -0,0 +1,18 @@ +# app.py +import lightning as L + +class Component(L.LightningWork): + def run(self, x): + print(f'MACHINE 1: this string came from machine 0: "{x}"') + print('MACHINE 1: this string is on machine 1') + +class WorkflowOrchestrator(L.LightningFlow): + def __init__(self) -> None: + super().__init__() + self.component = Component() + + def run(self): + x = 'hello from machine 0' + self.component.run(x) + +app = L.LightningApp(WorkflowOrchestrator()) diff --git a/docs/source-app/levels/intermediate/scripts/debug_app.py b/docs/source-app/levels/intermediate/scripts/debug_app.py new file mode 100644 index 0000000..9e3d9c9 --- /dev/null +++ b/docs/source-app/levels/intermediate/scripts/debug_app.py @@ -0,0 +1,25 @@ +# app.py +import lightning as L +from lightning.app.runners import MultiProcessRuntime + + +class TrainComponent(L.LightningWork): + def run(self, x): + print(f'train a model on {x}') + +class AnalyzeComponent(L.LightningWork): + def 
run(self, x): + print(f'analyze model on {x}') + +class WorkflowOrchestrator(L.LightningFlow): + def __init__(self) -> None: + super().__init__() + self.train = TrainComponent() + self.analyze = AnalyzeComponent() + + def run(self): + self.train.run("GPU machine 1") + self.analyze.run("CPU machine 2") + +app = L.LightningApp(WorkflowOrchestrator()) +MultiProcessRuntime(app).dispatch() diff --git a/docs/source-app/levels/intermediate/scripts/embeddings b/docs/source-app/levels/intermediate/scripts/embeddings new file mode 100644 index 0000000..af3ee63 Binary files /dev/null and b/docs/source-app/levels/intermediate/scripts/embeddings differ diff --git a/docs/source-app/levels/intermediate/scripts/toy_app.py b/docs/source-app/levels/intermediate/scripts/toy_app.py new file mode 100644 index 0000000..44273e6 --- /dev/null +++ b/docs/source-app/levels/intermediate/scripts/toy_app.py @@ -0,0 +1,24 @@ +# app.py +import lightning as L + + + +class TrainComponent(L.LightningWork): + def run(self, x): + print(f'train a model on {x}') + +class AnalyzeComponent(L.LightningWork): + def run(self, x): + print(f'analyze model on {x}') + +class WorkflowOrchestrator(L.LightningFlow): + def __init__(self) -> None: + super().__init__() + self.train = TrainComponent() + self.analyze = AnalyzeComponent() + + def run(self): + self.train.run("CPU machine 1") + self.analyze.run("CPU machine 2") + +app = L.LightningApp(WorkflowOrchestrator()) diff --git a/docs/source-app/levels/intermediate/scripts/toy_payload.py b/docs/source-app/levels/intermediate/scripts/toy_payload.py new file mode 100644 index 0000000..f6c744c --- /dev/null +++ b/docs/source-app/levels/intermediate/scripts/toy_payload.py @@ -0,0 +1,31 @@ +# app.py +import lightning as L + + +class EmbeddingProcessor(L.LightningWork): + def __init__(self, *args, **kwargs): + super().__init__(*args, **kwargs) + self.embeddings = None + + def run(self): + print('PROCESSOR: Generating embeddings...') + fake_embeddings = [[1, 2, 3], [2, 
3, 4]] + self.embeddings = L.storage.Payload(fake_embeddings) + +class EmbeddingServer(L.LightningWork): + def run(self, payload): + print('SERVER: Using embeddings from processor', payload) + embeddings = payload.value + print('serving embeddings sent from EmbeddingProcessor: ', embeddings) + +class WorkflowOrchestrator(L.LightningFlow): + def __init__(self) -> None: + super().__init__() + self.processor = EmbeddingProcessor() + self.server = EmbeddingServer() + + def run(self): + self.processor.run() + self.server.run(self.processor.embeddings) + +app = L.LightningApp(WorkflowOrchestrator()) diff --git a/docs/source-app/levels/intermediate/scripts/two_comms_non_ml.py b/docs/source-app/levels/intermediate/scripts/two_comms_non_ml.py new file mode 100644 index 0000000..23e8cd6 --- /dev/null +++ b/docs/source-app/levels/intermediate/scripts/two_comms_non_ml.py @@ -0,0 +1,36 @@ +# app.py +import lightning as L +import time + +class A(L.LightningWork): + def __init__(self, *args, **kwargs): + super().__init__(*args, **kwargs) + self.msg_changed = False + self.new_msg = '' + + def run(self): + # pretend to train and save a checkpoint every 10 steps + for step in (range(1000)): + time.sleep(1.0) + if step % 10 == 0: + self.msg_changed = True + self.new_msg = f'A is at step: {step}' + print(self.new_msg) + +class B(L.LightningWork): + def run(self, msg): + print(f'B: message from A: {msg}') + +class Example(L.LightningFlow): + def __init__(self) -> None: + super().__init__() + self.a = A(parallel=True) + self.b = B(parallel=True) + + def run(self): + self.a.run() + if self.a.msg_changed: + self.a.msg_changed = False + self.b.run(self.a.new_msg) + +app = L.LightningApp(Example()) diff --git a/docs/source-app/levels/intermediate/scripts/two_work_comms.py b/docs/source-app/levels/intermediate/scripts/two_work_comms.py new file mode 100644 index 0000000..5e02b33 --- /dev/null +++ b/docs/source-app/levels/intermediate/scripts/two_work_comms.py @@ -0,0 +1,35 @@ +# app.py 
+import lightning as L +import time + +class TrainComponent(L.LightningWork): + def __init__(self, *args, **kwargs): + super().__init__(*args, **kwargs) + self.last_checkpoint_path = None + + def run(self): + # pretend to train and save a checkpoint every 10 steps + for step in (range(1000)): + time.sleep(1.0) + fake_loss = round(1/(step + 0.00001), 4) + print(f'{step=}: {fake_loss=} ') + if step % 10 == 0: + self.last_checkpoint_path = f'/some/path/{step=}_{fake_loss=}' + print(f'TRAIN COMPONENT: saved new checkpoint: {self.last_checkpoint_path}') + +class ModelDeploymentComponent(L.LightningWork): + def run(self, new_checkpoint): + print(f'DEPLOY COMPONENT: load new model from checkpoint: {new_checkpoint}') + +class ContinuousDeployment(L.LightningFlow): + def __init__(self) -> None: + super().__init__() + self.train = TrainComponent(parallel=True) + self.model_deployment = ModelDeploymentComponent(parallel=True) + + def run(self): + self.train.run() + if self.train.last_checkpoint_path: + self.model_deployment.run(self.train.last_checkpoint_path) + +app = L.LightningApp(ContinuousDeployment()) diff --git a/docs/source-app/levels/intermediate/share_files_between_components.rst b/docs/source-app/levels/intermediate/share_files_between_components.rst new file mode 100644 index 0000000..3fa24de --- /dev/null +++ b/docs/source-app/levels/intermediate/share_files_between_components.rst @@ -0,0 +1,41 @@ +####################################### +Level 8: Share files between components +####################################### +**Audience:** Users who are moving large files such as artifacts or datasets. + +**Prereqs:** Level 6+ + +---- + +**** +TODO +**** +TODO + +---- + +************************************************* +Next steps: Render a web UI with other components +************************************************* +Now that we know the key ways of sharing files and variables, +we'll apply it to embed web UIs alongside components. + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: Level 9: Render a web UI with other components + :description: Learn how to embed graphical UIs like react, vue, streamlit and notebook UIs into a lightning workflow. + :button_link: embed_web_ui_into_lightningwork.html + :col_css: col-md-12 + :height: 150 + :tag: 15 minutes + +.. raw:: html + +
+
diff --git a/docs/source-app/levels/intermediate/share_variables_between_lightning_components.rst b/docs/source-app/levels/intermediate/share_variables_between_lightning_components.rst new file mode 100644 index 0000000..b0ce06d --- /dev/null +++ b/docs/source-app/levels/intermediate/share_variables_between_lightning_components.rst @@ -0,0 +1,162 @@ +########################################### +Level 7: Share variables between components +########################################### +**Audience:** Users who want to share variables and files across Lightning components. + +**Prereqs:** You must have finished `intermediate level 5+ `_. + +---- + +**************************************** +Send a variable from Flow to a Component +**************************************** +When a variable is defined on the LightningFlow (orchestrator), and +then it's passed into functions for the work components, under the hood +Lightning sends the variables across the machines for you automatically. + +.. lit_tabs:: + :descriptions: Remember this component may live on its own machine; The flow may be on a separate machine as well; This variable is on the flow machine; When passed to the work component, it is actually sent across the network under the hood.; When it prints here, it prints on the work component machine (not the flow machine); The second string was directly created on machine 1 + :code_files: ./scripts/comms_1.py; ./scripts/comms_1.py; ./scripts/comms_1.py; ./scripts/comms_1.py; ./scripts/comms_1.py; ./scripts/comms_1.py + :highlights: 4-7; 9-16; 15; 16; 6; 7; + :enable_run: true + :tab_rows: 3 + :height: 380px + +| + +.. collapse:: CLI output + + .. code-block:: + + $ lightning run app app.py --open-ui=false + + Your Lightning App is starting. This won't take long. + INFO: Your app has started. 
View it in your browser: http://127.0.0.1:7501/view + MACHINE 1: this string came from machine 0: "hello from machine 0" + MACHINE 1: this string is on machine 1 + +| + +In this example, we learned that we can send variables to components like in regular Python. +On a local machine, it will behave like Python. When the workflow is distributed on the cloud, +it makes network calls under the hood, but still functions like Python to you. + +---- + +************************************** +Send a variable between two components +************************************** +A majority of workflows (especially in ML), require components to respond to a change in a component +likely running on a separate machine or even cluster. + +Example Continuous deployment: Every time a model saves a checkpoint, we redeploy a model: + +.. lit_tabs:: + :descriptions: Define a component that simulates training; Define a component that simulates deployment; Training will happen in parallel over a long period; The deployment server also runs in parallel forever; Start training in parallel (could take months); Whenever the model has a checkpoint deploy; When the checkpoint is updated, model re-deploys + :code_files: ./scripts/two_work_comms.py; ./scripts/two_work_comms.py; ./scripts/two_work_comms.py; ./scripts/two_work_comms.py; ./scripts/two_work_comms.py; ./scripts/two_work_comms.py; ./scripts/two_work_comms.py + :highlights: 5-18; 20-22; 27; 28; 31; 32, 33; 33 + :enable_run: true + :tab_rows: 3 + :height: 690px + +| + +.. collapse:: CLI output: + + .. code:: + + $ lightning run app app.py --open-ui=false + + Your Lightning App is starting. This won't take long. + INFO: Your app has started. 
View it in your browser: http://127.0.0.1:7501/view + step=0: fake_loss=100000.0 + TRAIN COMPONENT: saved new checkpoint: /some/path/step=0_fake_loss=100000.0 + step=1: fake_loss=1.0 + DEPLOY COMPONENT: load new model from checkpoint: /some/path/step=0_fake_loss=100000.0 + step=2: fake_loss=0.5 + step=3: fake_loss=0.3333 + step=4: fake_loss=0.25 + step=5: fake_loss=0.2 + step=6: fake_loss=0.1667 + step=7: fake_loss=0.1429 + step=8: fake_loss=0.125 + step=9: fake_loss=0.1111 + step=10: fake_loss=0.1 + TRAIN COMPONENT: saved new checkpoint: /some/path/step=10_fake_loss=0.1 + DEPLOY COMPONENT: load new model from checkpoint: /some/path/step=10_fake_loss=0.1 + step=11: fake_loss=0.0909 + step=12: fake_loss=0.0833 + step=13: fake_loss=0.0769 + step=14: fake_loss=0.0714 + step=15: fake_loss=0.0667 + step=16: fake_loss=0.0625 + step=17: fake_loss=0.0588 + step=18: fake_loss=0.0556 + step=19: fake_loss=0.0526 + step=20: fake_loss=0.05 + TRAIN COMPONENT: saved new checkpoint: /some/path/step=20_fake_loss=0.05 + DEPLOY COMPONENT: load new model from checkpoint: /some/path/step=20_fake_loss=0.05 + step=21: fake_loss=0.0476 + +---- + +******************************************** +Send a large variable between two components +******************************************** +For large variables such as arrays, tensors, embeddings and so on, use Payload to enable +transferring them across components. + +.. lit_tabs:: + :descriptions: Let's define a component to simulate generating embeddings (from a DB, feature store, etc...); This component simulates a server that will use the embeddings.; Run the component to generate the embeddings; Simulate embeddings as an array.
Here you would query a DB, load from a feature store or disk or even use a neural network to extract the embedding.; Allow the embeddings to be transferred efficiently by wrapping them in the Payload object.; Pass the variable to the EmbeddingServer (just the pointer).; The data gets transferred once you use the .value attribute in the other component. + :code_files: ./scripts/toy_payload.py; ./scripts/toy_payload.py; ./scripts/toy_payload.py; ./scripts/toy_payload.py; ./scripts/toy_payload.py; ./scripts/toy_payload.py; ./scripts/toy_payload.py; + :highlights: 5-13; 15-19; 28; 12; 13; 29; 18 + :enable_run: true + :tab_rows: 3 + :height: 600px + +| + +.. collapse:: CLI output + + .. code:: + + $ lightning run app app.py --open-ui=false + + Your Lightning App is starting. This won't take long. + INFO: Your app has started. View it in your browser: http://127.0.0.1:7501/view + PROCESSOR: Generating embeddings... + SERVER: Using embeddings from processor + serving embeddings sent from EmbeddingProcessor: [[1, 2, 3], [2, 3, 4]] + +| + +The payload object keeps the data on the machine and passes a pointer +to the data around the app until the data is needed by a component. + +---- + +****************************************** +Next steps: Share files between components +****************************************** +Now that you know how to run components in parallel, we'll learn to share variables +across components to simplify complex workflows. + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: Level 8: Share files between components + :description: Learn to share files between components. + :col_css: col-md-12 + :button_link: share_files_between_components.html + :height: 150 + :tag: 10 minutes + +.. raw:: html + +
+
diff --git a/docs/source-app/levels/intermediate/start_from_lightning_app_templates.rst b/docs/source-app/levels/intermediate/start_from_lightning_app_templates.rst new file mode 100644 index 0000000..ceb497c --- /dev/null +++ b/docs/source-app/levels/intermediate/start_from_lightning_app_templates.rst @@ -0,0 +1,34 @@ +############################################ +Level 10: Start from lightning app templates +############################################ +**Audience:** All users who want to move quickly with Lightning + +**Prereqs:** You have finished `Level 9 `_. + +---- + +**************************************************** +Next step: Learn to build powerful nested components +**************************************************** +Now that you can build powerful apps, learn to build nested components +that can do things like start dynamic works and connect to each other +via networking or CLI commands. + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: Advanced skills + :description: Learn to build nested components with advanced functionality. + :button_link: ../advanced/index.html + :col_css: col-md-12 + :height: 170 + +.. raw:: html + +
+
diff --git a/docs/source-app/make.bat b/docs/source-app/make.bat new file mode 100644 index 0000000..9b56514 --- /dev/null +++ b/docs/source-app/make.bat @@ -0,0 +1,35 @@ +@ECHO OFF + +pushd %~dp0 + +REM Command file for Sphinx documentation + +if "%SPHINXBUILD%" == "" ( + set SPHINXBUILD=sphinx-build +) +set SOURCEDIR=. +set BUILDDIR=../build + +if "%1" == "" goto help + +%SPHINXBUILD% >NUL 2>NUL +if errorlevel 9009 ( + echo. + echo.The 'sphinx-build' command was not found. Make sure you have Sphinx + echo.installed, then set the SPHINXBUILD environment variable to point + echo.to the full path of the 'sphinx-build' executable. Alternatively you + echo.may add the Sphinx directory to PATH. + echo. + echo.If you don't have Sphinx installed, grab it from + echo.http://sphinx-doc.org/ + exit /b 1 +) + +%SPHINXBUILD% -M %1 %SOURCEDIR% %BUILDDIR% %SPHINXOPTS% +goto end + +:help +%SPHINXBUILD% -M help %SOURCEDIR% %BUILDDIR% %SPHINXOPTS% + +:end +popd diff --git a/docs/source-app/moving_to_the_cloud.rst b/docs/source-app/moving_to_the_cloud.rst new file mode 100644 index 0000000..86478fc --- /dev/null +++ b/docs/source-app/moving_to_the_cloud.rst @@ -0,0 +1,122 @@ +:orphan: + +.. _moving_to_the_cloud: + +#################### +Moving to the Cloud +#################### + +.. warning:: This is in progress and not yet fully supported. + +In the :ref:`quick_start` guide, you learned how to implement a simple app +that trains an image classifier and serve it once trained. + +In this tutorial, you'll learn how to extend that application so that it works seamlessly +both locally and in the cloud. + +---- + +******************************** +Step 1: Distributed Application +******************************** + + +Distributed Storage +^^^^^^^^^^^^^^^^^^^ + +When running your application in a fully-distributed setting, the data available on one machine won't necessarily be available on another. 
+ +To solve this problem, Lightning introduces the :class:`~lightning.app.storage.Path` object. +This ensures that your code can run both locally and in the cloud. + +The :class:`~lightning.app.storage.Path` object keeps track of the work which creates +the path. This enables Lightning to transfer the files correctly in a distributed setting. + +Instead of passing a string representing a file or directory, Lightning simply wraps +them into a :class:`~lightning.app.storage.Path` object and makes them an attribute of your LightningWork. + +Without doing this conscientiously for every single path, your application will fail in the cloud. + +In the example below, a file written by **SourceFileWork** is being transferred by the flow +to the **DestinationFileAndServeWork** work. The Path object is the reference to the file. + +.. literalinclude:: ../../examples/app/boring/app.py + :emphasize-lines: 5, 22, 28, 48 + +In the ``scripts/serve.py`` file, we are creating a **FastApi Service** running on port ``1111`` +that returns the content of the file received from **SourceFileWork** when +a post request is sent to ``/file``. + +.. literalinclude:: ../../examples/app/boring/scripts/serve.py + :emphasize-lines: 21, 23-26 + +---- + +Distributed Frontend +^^^^^^^^^^^^^^^^^^^^ + +In the above example, the **FastAPI Service** was running on one machine, +and the frontend UI in another. + +In order to assemble them, you need to do two things: + +* Provide **port** argument to your work's ``__init__`` method to expose a single service. + +Here's how to expose the port: + +.. literalinclude:: ../../examples/app/boring/app.py + :emphasize-lines: 8 + :lines: 33-44 + + +And here's how to expose your services within the ``configure_layout`` flow hook: + +.. literalinclude:: ../../examples/app/boring/app.py + :emphasize-lines: 5 + :lines: 53-57 + +In this example, we're appending ``/file`` to our **FastApi Service** url. 
+This means that our ``Boring Tab`` triggers the ``get_file_content`` from the **FastAPI Service** +and embeds its content as an `IFrame `_. + +.. literalinclude:: ../../examples/app/boring/scripts/serve.py + :lines: 23-26 + + +Here's a visualization of the application described above: + +.. figure:: https://pl-public-data.s3.amazonaws.com/assets_lightning/storage_ui.gif + :alt: Storage API Animation + :width: 100 % + +---- + +***************************** +Step 2: Scalable Application +***************************** + +The benefit of defining long-running code inside a +:class:`~lightning.app.core.work.LightningWork` +component is that you can run it on different hardware +by providing :class:`~lightning.app.utilities.packaging.cloud_compute.CloudCompute` to +the ``__init__`` method of your :class:`~lightning.app.core.work.LightningWork`. + +By adapting the :ref:`quick_start` example as follows, you can easily run your component on multiple GPUs: + + +Without doing much, you’re now running a script on its own cluster of machines! 🤯 + +---- + +***************************** +Step 3: Resilient Application +***************************** + +We designed Lightning with a strong emphasis on supporting failure cases. +The framework shines when the developer embraces our fault-tolerance best practices, +enabling them to create ML applications with a high degree of complexity as well as a strong support +for unhappy cases. + +An entire section would be dedicated to this concept. + +TODO diff --git a/docs/source-app/quickstart.rst b/docs/source-app/quickstart.rst new file mode 100644 index 0000000..6df9b26 --- /dev/null +++ b/docs/source-app/quickstart.rst @@ -0,0 +1,126 @@ +:orphan: + +.. _quick_start: + +############ +Quick Start +############ + +In this guide, we'll run an application that trains +an image classification model with the `MNIST Dataset `_, +and uses `Gradio `_ to serve it. 
+ +---- + +********************** +Step 1 - Installation +********************** + +First, you'll need to install Lightning. You can find the complete guide here. + +Then, you'll need to install the `Lightning Quick Start package `_. + +.. code-block:: bash + + lightning install app lightning/quick-start + +And download the training script used by the App: + + +---- + +********************** +Step 2 - Run the app +********************** + +To run your app, copy the following command to your local terminal: + +.. code-block:: bash + + lightning run app app.py + +And that's it! + +.. admonition:: You should see the app logs in your terminal. + :class: dropdown + + .. code-block:: console + + Your Lightning App is starting. This won't take long. + INFO: Your app has started. View it in your browser: http://127.0.0.1:7501/view + + Global seed set to 42 + + GPU available: True (mps), used: False + TPU available: False, using: 0 TPU cores + IPU available: False, using: 0 IPUs + + | Name | Type | Params | In sizes | Out sizes + ------------------------------------------------------------------ + 0 | model | Net | 1.2 M | [1, 1, 28, 28] | [1, 10] + 1 | val_acc | Accuracy | 0 | ? | ? + ------------------------------------------------------------------ + 1.2 M Trainable params + 0 Non-trainable params + 1.2 M Total params + Epoch 4: 100%|█████████████████████████| 16/16 [00:00<00:00, 32.31it/s, loss=0.0826, v_num=0] + `Trainer.fit` stopped: `max_epochs=5` reached. + + Running on local URL: http://127.0.0.1:62782/ + ... + + +The app will open your browser and show an interactive demo: + +.. figure:: https://pl-public-data.s3.amazonaws.com/assets_lightning/qiuck-start-tensorboard-tab.png + :alt: Quick Start UI - Model Training Tab + :width: 100 % + +.. 
figure:: https://pl-public-data.s3.amazonaws.com/assets_lightning/quick-start-gradio-tab.png + :alt: Quick Start UI - Interactive Demo Tab + :width: 100 % + +---- + +This app behind the scenes +^^^^^^^^^^^^^^^^^^^^^^^^^^^ + +This application has one flow component which coordinates two works executing their own python script. +Once the training is finished, the trained model weights are passed to the serve component. + + +Here is how the components of a Lightning app are structured: + +.. figure:: https://pl-public-data.s3.amazonaws.com/assets_lightning/quick_start_components.gif + :alt: Quick Start Application + :width: 100 % + +Here is the application timeline: + +.. figure:: https://pl-public-data.s3.amazonaws.com/assets_lightning/timeline.gif + :alt: Quick Start Timeline Application + :width: 100 % + +---- + +************************************** +Step 3 - Build your app in the cloud +************************************** + +Simply add ``--cloud`` to run this application in the cloud 🤯 + +.. code-block:: bash + + lightning run app app.py --cloud + +Congratulations! You've now run your first application with Lightning. + +---- + +*********** +Next Steps +*********** + +To learn how to build and modify apps, go to the :ref:`basics`. + +To learn how to create UIs for your apps, read :ref:`ui_and_frontends`. diff --git a/docs/source-app/testing.rst b/docs/source-app/testing.rst new file mode 100644 index 0000000..ed2d6db --- /dev/null +++ b/docs/source-app/testing.rst @@ -0,0 +1,155 @@ +:orphan: + +.. _testing: + +####################### +Productionize your Apps +####################### + +TODO: Cleanup + +At the core of our system is an integration testing framework that will allow for a first-class experience creating integration tests for Lightning Apps. This document will explain how we can create a lightning app test, how we can execute it, and where to find more information.
+ +---- + +*********** +Philosophy +*********** + +Testing a Lightning app is unique. It is a superset of an application that converges machine learning, API development, and UI development. With that in mind, there are several philosophies (or "best practices") that you should adhere to: + + +#. **Control your app state** - With integration and end to end tests, you have the capabilities of controlling your app's state through dependency injection. Use it! +#. **Integration focuses on the work, End to End focuses on the app** - When writing tests, think of the depth and breadth of what you are writing. Write many integration tests since they are relatively cheap, while keeping the end to end tests for holistic app testing. +#. **Don't overthink it** - What needs to be tested? What is the order of risk? These are the questions you should build with before writing your first line of code. Writing tests for the sake of writing tests is an exercise in futility. Write meaningful, impactful tests. +#. **Test Isolation** - Write your tests in an isolated manner. No two tests should ever depend on each other. +#. **Use your framework** - Testing apps should be framework agnostic. +#. **Have fun!** - At the heart of testing is experimentation. Like any experiment, tests begin with a hypothesis of workability, but you can extend that to be more inclusive. Ask the question, write the test to answer your question, and make sure you have fun while doing it. + +---- + +**************************************** +Anatomy of a Lightning integration test +**************************************** + +The following is a PyTest example of an integration test using the ``lightning.app.testing`` module. + +..
code-block:: python + + import os + + from lightning.app import _PROJECT_ROOT + from lightning.app.testing import application_testing, LightningTestApp + from lightning.app.utilities.enum import AppStage + + + class TestLightningAppInt(LightningTestApp): + def run_once(self) -> bool: + if self.root.counter > 1: + print("V0 App End") + self.stage = AppStage.STOPPING + return True + return super().run_once() + + + def test_v0_app_example(): + command_line = [ + os.path.join(_PROJECT_ROOT, "examples/app_v0/app.py"), + "--blocking", + "False", + "--multiprocess", + "--open-ui", + "False", + ] + result = application_testing(TestLightningAppInt, command_line) + assert "V0 App End" in str(result.stdout_bytes) + assert result.exit_code == 0 + +---- + +Setting up the app +^^^^^^^^^^^^^^^^^^ + +Lightning apps are unique in that they represent a full stack model for your machine learning application. To be clear, the integration tests are *NOT* going to touch the UI flow. Instead we inject your application with helper methods that, when executed, can assist in validating your application. + +To get started, you simply need to import the following: + +.. code-block:: python + + from lightning.app.testing import application_testing, LightningTestApp + +We will discuss ``application_testing`` in a bit, but first let's review the structure of ``LightningTestApp``. + +---- + +LightningTestApp +^^^^^^^^^^^^^^^^^ + +The :class:`lightning.app.testing.testing.LightningTestApp` class is available to use for provisioning and setting up your testing needs. Note that you do not need this class to move forward with testing. Any application that inherits ``LightningApp`` should suffice as long as you override the correct methods. Reviewing ``LightningTestApp``, we see some overrides that are already there. Please review the class for more information. + +..
code-block:: python + + class TestLightningAppInt(LightningTestApp): + def run_once(self) -> bool: + if self.root.counter > 1: + print("V0 App End") + self.stage = AppStage.STOPPING + return True + return super().run_once() + +We create a test class overriding the ``run_once`` function. This function helps control the flow of your application and is run first. In this example we are calling ``self.root.counter`` and checking if the job has executed once. If so, we want to print out ``V0 App End`` and set the ``self.stage`` to ``AppStage.STOPPING``. This is how we control the flow through state. Your situation might be different, so experiment and see what you can do! + +Besides ``run_once`` there are a few other overrides available: + + +* ``on_before_run_once`` - This runs before your ``run_once`` function kicks off. You can set up your application pre-conditions here. +* ``on_after_run_once`` - Similar to ``on_before_run_once`` but after the ``run_once`` method is called. + +These methods will skew your tests, so use them when needed. + +---- + +The Test +^^^^^^^^ + +We provide ``application_testing`` as a helper function to get your application up and running for testing. It uses ``click``\ 's invocation tooling underneath. + +.. code-block:: + + command_line = [ + os.path.join(_PROJECT_ROOT, "examples/app_v0/app.py"), + "--blocking", + "False", + "--open-ui", + "False", + ] + +First in the list for ``command_line`` is the location of your script. It is an external file. In this example we have ``_PROJECT_ROOT`` but this is *not* a helper constant for you to utilize. You will need to provide the location yourself. + +Next there are a couple of options you can leverage: + +* ``blocking`` - Blocking is an app status that says "Do not run until I click run in the UI". For our integration test, since we are not using the UI, we are setting this to "False". +* ``open-ui`` - We set this to false since this is the routine that opens a browser for your local execution.
+ +Once you have your commandline ready, you will then be able to kick off the test and gather results: + +.. code-block:: python + + result = application_testing(TestLightningAppInt, command_line) + +As mentioned earlier, ``application_testing`` is a helper method that allows you to inject your ``LightningTestApp`` subclass (with overrides) and the commandline flags. Once the process is done it returns the results back for parsing. + +.. code-block:: python + + assert "V0 App End" in str(result.stdout_bytes) + assert result.exit_code == 0 + +Since we print "V0 App End" at the end of our test flow, finding it in the output confirms that the stage was changed to ``AppStage.STOPPING``, which means the process is done. Finally, we check the result's exit code to make sure that we did not throw an error during execution. + +---- + +************ +End to End +************ + +TODO diff --git a/docs/source-app/ui_and_frontends.rst b/docs/source-app/ui_and_frontends.rst new file mode 100644 index 0000000..53e50cd --- /dev/null +++ b/docs/source-app/ui_and_frontends.rst @@ -0,0 +1,23 @@ +:orphan: + +.. _ui_and_frontends: + +################ +UI and Frontends +################ + + +The Lightning framework allows you to create customized, interactive UIs with the framework of your choice. + +You can easily embed other tools and services (like a GitHub repo, a `FastAPI Service `_, an `arXiv `_ paper or a `Dask Cluster `_ Admin page), or create a complete UI from scratch. + + +To get started, you can use built-in templates for the following frameworks: + +* `React.js `_ +* `StreamLit `_ + + + +To keep learning about Lightning, check out :ref:`moving_to_the_cloud`. +This section covers best practices to seamlessly make your Lightning code work both locally and in the cloud.
diff --git a/docs/source-app/workflows/access_app_state/access_app_state.rst b/docs/source-app/workflows/access_app_state/access_app_state.rst new file mode 100644 index 0000000..1e23328 --- /dev/null +++ b/docs/source-app/workflows/access_app_state/access_app_state.rst @@ -0,0 +1,59 @@ +.. _access_app_state: + +################ +Access App State +################ + +**Audience:** Users who want to know how the App State can be accessed. + +**Level:** Basic + +********************** +What is the App State? +********************** + +In Lightning, each component is stateful and their state is composed of all attributes defined within their **__init__** method. + +The **App State** is the collection of all the components' states forming the App. + +************************************ +What is special about the App State? +************************************ + +The **App State** is always up-to-date, even when running an App in the cloud on multiple machines. +This means that every time an attribute is modified in a Work, that information is automatically +broadcast to the Flow. With this mechanism, any Component can **react** to any other +Component's **state changes** through the Flow and complex systems can be easily implemented. +Lightning requires a state-driven mindset when implementing the Flow. + +*************************************** +When do I need to access the App State? +*************************************** + +As a user, you are interacting with your component attributes, so most likely, +you won't need to access the Component's state directly, but it can be helpful to +understand how the state works under the hood. + +For example, here we define a **Flow** component and **Work** component, where the Work increments a counter indefinitely and the Flow prints its state which contains the Work. + +You can easily check the state of your entire App as follows: + +.. literalinclude:: ../../code_samples/quickstart/app_01.py + +Run the App with: + +..
code-block:: bash + + lightning run app docs/quickstart/app_01.py + +And here's the output you get when running the App using **Lightning CLI**: + +.. code-block:: console + + INFO: Your app has started. View it in your browser: http://127.0.0.1:7501/view + State: {'works': {'w': {'vars': {'counter': 1}}}} + State: {'works': {'w': {'vars': {'counter': 2}}}} + State: {'works': {'w': {'vars': {'counter': 3}}}} + State: {'works': {'w': {'vars': {'counter': 3}}}} + State: {'works': {'w': {'vars': {'counter': 4}}}} + ... diff --git a/docs/source-app/workflows/add_components/index.rst b/docs/source-app/workflows/add_components/index.rst new file mode 100644 index 0000000..ca95e44 --- /dev/null +++ b/docs/source-app/workflows/add_components/index.rst @@ -0,0 +1,31 @@ +:orphan: + +########################### +Add a component to your app +########################### +**Audience:** Users looking to expand the functionality of their Lightning apps. + +---- + +******************* +Install a component +******************* + +Any Lightning component can be installed with: + +.. code:: bash + + lightning install component org/the-component-name + +`Browse all community-built components here `_. + +.. note:: Components are being populated daily + +---- + +********************** +Contribute a component +********************** +One of the first principles of the Lightning community is to code something *once* for the benefit of everyone! + +To contribute a component, `follow this guide <../build_lightning_component/index.html>`_. diff --git a/docs/source-app/workflows/add_server/any_server.rst b/docs/source-app/workflows/add_server/any_server.rst new file mode 100644 index 0000000..2e26b88 --- /dev/null +++ b/docs/source-app/workflows/add_server/any_server.rst @@ -0,0 +1,185 @@ +######################### +Enable any server (basic) +######################### +**Audience:** Users who want to enable an arbitrary server/UI. + +**Prereqs:** Basic python knowledge. 
+ +---- + +***************** +What is a server? +***************** +A server is a program that enables other programs or users to connect to it. As long as your server can listen on a port, +you can enable it with a Lightning App. + +---- + +*************************** +Add a server to a component +*************************** +Any server that listens on a port, can be enabled via a work. For example, here's a plain python server: + +.. code:: python + :emphasize-lines: 11-12 + + import socketserver + from http import HTTPStatus, server + + + class PlainServer(server.SimpleHTTPRequestHandler): + def do_GET(self): + self.send_response(HTTPStatus.OK) + self.end_headers() + # Data must be passed as bytes to the `self.wfile.write` call + html = b"

Hello lit world

" + self.wfile.write(html) + + + httpd = socketserver.TCPServer(("localhost", 3000), PlainServer) + httpd.serve_forever() + +To enable the server inside the component, start the server in the run method and use the ``self.host`` and ``self.port`` properties: + +.. code:: python + :emphasize-lines: 14-15 + + import lightning as L + import socketserver + from http import HTTPStatus, server + + + class PlainServer(server.SimpleHTTPRequestHandler): + def do_GET(self): + self.send_response(HTTPStatus.OK) + self.end_headers() + # Data must be passed as bytes to the `self.wfile.write` call + html = b"

Hello lit world

" + self.wfile.write(html) + + + class LitServer(L.LightningWork): + def run(self): + httpd = socketserver.TCPServer((self.host, self.port), PlainServer) + httpd.serve_forever() + +---- + +************************************** +Route the server in the root component +************************************** +The final step, is to tell the Root component in which tab to render this component's output: +In this case, we render the ``LitServer`` output in the ``home`` tab of the application. + +.. code:: python + :emphasize-lines: 20, 23, 28 + + import lightning as L + import socketserver + from http import HTTPStatus, server + + + class PlainServer(server.SimpleHTTPRequestHandler): + def do_GET(self): + self.send_response(HTTPStatus.OK) + self.end_headers() + # Data must be passed as bytes to the `self.wfile.write` call + html = b"

Hello lit world

" + self.wfile.write(html) + + + class LitServer(L.LightningWork): + def run(self): + httpd = socketserver.TCPServer((self.host, self.port), PlainServer) + httpd.serve_forever() + + + class Root(L.LightningFlow): + def __init__(self): + super().__init__() + self.lit_server = LitServer(parallel=True) + + def run(self): + self.lit_server.run() + + def configure_layout(self): + tab1 = {"name": "home", "content": self.lit_server} + return tab1 + + + app = L.LightningApp(Root()) + +We use the ``parallel=True`` argument of ``LightningWork`` to run the server in parallel +while the rest of the Lightning App runs everything else. + +---- + +*********** +Run the app +*********** +Start the app to see your new UI! + +.. code:: bash + + lightning run app app.py + +To run the app on the cloud, use the ``--cloud`` argument. + +.. code:: bash + + lightning run app app.py --cloud + +---- + +***************************************** +Interact with a component from the server +***************************************** +TODO: how do we do this? + + +---- + +***************************************** +Interact with the server from a component +***************************************** +TODO: how do we do this? + +---- + +******** +Examples +******** +Here are a few example apps that expose a server via a component: + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: Example: Tensorboard + :description: TODO + :col_css: col-md-4 + :button_link: example_app.html + :height: 150 + +.. displayitem:: + :header: Example: Streamlit + :description: TODO + :col_css: col-md-4 + :button_link: example_app.html + :height: 150 + +.. displayitem:: + :header: Example: React + :description: TODO + :col_css: col-md-4 + :button_link: example_app.html + :height: 150 + +.. raw:: html + +
+
diff --git a/docs/source-app/workflows/add_server/flask_basic.rst b/docs/source-app/workflows/add_server/flask_basic.rst new file mode 100644 index 0000000..38ca282 --- /dev/null +++ b/docs/source-app/workflows/add_server/flask_basic.rst @@ -0,0 +1,155 @@ +############################### +Add a web UI with Flask (basic) +############################### +**Audience:** Users who want to enable a flask app within a component. + +**Prereqs:** Basic python knowledge. + +---- + +************** +What is Flask? +************** +Flask is a web framework, that lets you develop web applications in Python easily. + +---- + +************************ +Add Flask to a component +************************ +First, define your flask app as you normally would without Lightning: + +.. code:: python + :emphasize-lines: 9 + + from flask import Flask + + flask_app = Flask(__name__) + + + @flask_app.route("/") + def hello(): + return "Hello, World!" + + + flask_app.run(host="0.0.0.0", port=80) + +To enable the server inside the component, start the Flask server in the run method and use the ``self.host`` and ``self.port`` properties: + +.. code:: python + :emphasize-lines: 12 + + import lightning as L + from flask import Flask + + + class LitFlask(L.LightningWork): + def run(self): + flask_app = Flask(__name__) + + @flask_app.route("/") + def hello(): + return "Hello, World!" + + flask_app.run(host=self.host, port=self.port) + +---- + +************************************** +Route the server in the root component +************************************** +The final step, is to tell the Root component in which tab to render this component's output: +In this case, we render the ``LitFlask`` output in the ``home`` tab of the application. + +.. code:: python + :emphasize-lines: 17, 23 + + import lightning as L + from flask import Flask + + + class LitFlask(L.LightningWork): + def run(self): + flask_app = Flask(__name__) + + @flask_app.route("/") + def hello(): + return "Hello, World!" 
+ + flask_app.run(host=self.host, port=self.port) + + + class Root(L.LightningFlow): + def __init__(self): + super().__init__() + self.lit_flask = LitFlask(parallel=True) + + def run(self): + self.lit_flask.run() + + def configure_layout(self): + tab1 = {"name": "home", "content": self.lit_flask} + return tab1 + + + app = L.LightningApp(Root()) + +We use the ``parallel=True`` argument of ``LightningWork`` to run the server in the background +while the rest of the Lightning App runs everything else. + +---- + +*********** +Run the app +*********** +Start the app to see your new UI! + +.. code:: bash + + lightning run app app.py + +To run the app on the cloud, use the ``--cloud`` argument. + +.. code:: bash + + lightning run app app.py --cloud + +---- + +******** +Examples +******** +Here are a few example apps that expose a Flask server via a component: + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: Example 1 + :description: TODO + :col_css: col-md-4 + :button_link: example_app.html + :height: 150 + +.. displayitem:: + :header: Example 2 + :description: TODO + :col_css: col-md-4 + :button_link: example_app.html + :height: 150 + +.. displayitem:: + :header: Example 3 + :description: TODO + :col_css: col-md-4 + :button_link: example_app.html + :height: 150 + +.. raw:: html + +
+
diff --git a/docs/source-app/workflows/add_server/index.rst b/docs/source-app/workflows/add_server/index.rst new file mode 100644 index 0000000..1429b08 --- /dev/null +++ b/docs/source-app/workflows/add_server/index.rst @@ -0,0 +1,8 @@ +################################### +Run a server within a Lightning App +################################### +Any type of server can run inside a Lightning App. + +---- + +.. include:: index_content.rst diff --git a/docs/source-app/workflows/add_server/index_content.rst b/docs/source-app/workflows/add_server/index_content.rst new file mode 100644 index 0000000..d362369 --- /dev/null +++ b/docs/source-app/workflows/add_server/index_content.rst @@ -0,0 +1,35 @@ +.. toctree:: + :maxdepth: 1 + :hidden: + + any_server + flask_basic + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: Any server + :description: Learn how to enable any server inside a Lightning App. + :col_css: col-md-6 + :button_link: any_server.html + :height: 150 + :tag: basic + +.. displayitem:: + :header: Flask + :description: Learn how to add a Flask server inside a Lightning App. + :col_css: col-md-6 + :button_link: flask_basic.html + :height: 150 + :tag: basic + + +.. raw:: html + +
+
+ diff --git a/docs/source-app/workflows/add_web_link.rst b/docs/source-app/workflows/add_web_link.rst new file mode 100644 index 0000000..01ffdf6 --- /dev/null +++ b/docs/source-app/workflows/add_web_link.rst @@ -0,0 +1,54 @@ +############## +Add a web link +############## +**Audience:** Users who want to link to other pages from their app. + +---- + +************** +Add a URL link +************** +In this example we'll replicate |urls_link|. + +To add a URL link to an app, simply specify it in the ``configure_layout`` method +and connect the UIs. Create a file named **app.py** with this code: + +.. |urls_link| raw:: html + + the app running here + +.. code:: python + :emphasize-lines: 7,11 + + import lightning as L + + class LitApp(L.LightningFlow): + def configure_layout(self): + tab_1 = { + "name": "Logger", + "content": "https://bit.ly/tb-aasae" + } + tab_2 = { + "name": "Paper", + "content": "https://arxiv.org/pdf/2107.12329.pdf" + } + return tab_1, tab_2 + + app = L.LightningApp(LitApp()) + +---- + +*********** +Run the app +*********** +Run the app locally to see it! + +.. code:: bash + + lightning run app app.py + +Now run it on the cloud as well: + +.. code:: bash + + lightning run app app.py --cloud diff --git a/docs/source-app/workflows/add_web_ui/angular_js_intermediate.rst b/docs/source-app/workflows/add_web_ui/angular_js_intermediate.rst new file mode 100644 index 0000000..095dee3 --- /dev/null +++ b/docs/source-app/workflows/add_web_ui/angular_js_intermediate.rst @@ -0,0 +1,6 @@ +:orphan: + +########################################### +Add a web UI with Angular.js (intermediate) +########################################### +coming... 
diff --git a/docs/source-app/workflows/add_web_ui/dash/basic.rst b/docs/source-app/workflows/add_web_ui/dash/basic.rst new file mode 100644 index 0000000..4316fc1 --- /dev/null +++ b/docs/source-app/workflows/add_web_ui/dash/basic.rst @@ -0,0 +1,221 @@ +############################## +Add a web UI with Dash (basic) +############################## +**Audience:** Users who want to add a web UI with Dash by Plotly. + +**Prereqs:** Basic python knowledge. + +---- + +************* +What is Dash? +************* +`Dash `_ is the original low-code framework for rapidly building data apps in Python, R, Julia, and F# (experimental). + +Install Dash with: + +.. code:: bash + + pip install dash + +---- + +************************ +Create the dash demo app +************************ + +To explain how to use Dash with Lightning, let's build a simple app with Dash. + + +.. + To explain how to use Dash with Lightning, let's replicate the |dash_link|. + + .. |dash_link| raw:: html + + example running here + +In the next few sections we'll build an app step-by-step. +First **create a file named app.py** with the app content: + +.. 
code:: python + + import lightning as L + import dash + import plotly.express as px + + class LitDash(L.LightningWork): + def run(self): + dash_app = dash.Dash(__name__) + X = [1, 2, 3, 4, 5, 6] + Y = [2, 4, 8, 16, 32, 64] + fig = px.line(x=X, y=Y) + + dash_app.layout = dash.html.Div(children=[ + dash.html.H1(children='⚡ Hello Dash + Lightning⚡'), + dash.html.Div(children='The Dash framework running inside a ⚡ Lightning App'), + dash.dcc.Graph(id='example-graph', figure=fig) + ]) + + dash_app.run_server(host=self.host, port=self.port) + + class LitApp(L.LightningFlow): + def __init__(self): + super().__init__() + self.lit_dash = LitDash(parallel=True) + + def run(self): + self.lit_dash.run() + + def configure_layout(self): + tab1 = {"name": "home", "content": self.lit_dash} + return tab1 + + app = L.LightningApp(LitApp()) + + +Add 'dash' to a requirements.txt file: + +.. code:: bash + + echo "dash" >> requirements.txt + +This is a best practice to make apps reproducible. + +---- + +*********** +Run the app +*********** +Run the app locally to see it! + +.. code:: bash + + lightning run app app.py + +Now run it on the cloud as well: + +.. code:: bash + + lightning run app app.py --cloud + +---- + +************************ +Step-by-step walkthrough +************************ +In this section, we explain each part of this code in detail. + +---- + +0. Define a Dash app +^^^^^^^^^^^^^^^^^^^^ +First, find the dash app you want to integrate. In this example, that app looks like: + +.. 
code:: python + + import dash + import plotly.express as px + + dash_app = dash.Dash(__name__) + X = [1, 2, 3, 4, 5, 6] + Y = [2, 4, 8, 16, 32, 64] + fig = px.line(x=X, y=Y) + + dash_app.layout = dash.html.Div(children=[ + dash.html.H1(children='⚡ Hello Dash + Lightning⚡'), + dash.html.Div(children='The Dash framework running inside a ⚡ Lightning App'), + dash.dcc.Graph(id='example-graph', figure=fig) + ]) + + dash_app.run_server(host='0.0.0.0', port=80) + +This dash app plots a simple line curve along with some HTML. +`Visit the Dash documentation for the full API `_. + +---- + +1. Add Dash to a component +^^^^^^^^^^^^^^^^^^^^^^^^^^ +Add the dash app to the run method of a ``LightningWork`` component and run the server on that component's **host** and **port**: + +.. code:: python + :emphasize-lines: 6, 18 + + import lightning as L + import dash + import plotly.express as px + + class LitDash(L.LightningWork): + def run(self): + dash_app = dash.Dash(__name__) + X = [1, 2, 3, 4, 5, 6] + Y = [2, 4, 8, 16, 32, 64] + fig = px.line(x=X, y=Y) + + dash_app.layout = dash.html.Div(children=[ + dash.html.H1(children='⚡ Hello Dash + Lightning⚡'), + dash.html.Div(children='The Dash framework running inside a ⚡ Lightning App'), + dash.dcc.Graph(id='example-graph', figure=fig) + ]) + + dash_app.run_server(host=self.host, port=self.port) + + class LitApp(L.LightningFlow): + def __init__(self): + super().__init__() + self.lit_dash = LitDash(parallel=True) + + def run(self): + self.lit_dash.run() + + def configure_layout(self): + tab1 = {"name": "home", "content": self.lit_dash} + return tab1 + + app = L.LightningApp(LitApp()) + +---- + +2. Route the UI in the root component +^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +The final step is to tell the Root component in which tab to render this component's UI. +In this case, we render the ``LitDash`` UI in the ``home`` tab of the application. + +.. 
code:: python + :emphasize-lines: 23, 29 + + import lightning as L + import dash + import plotly.express as px + + class LitDash(L.LightningWork): + def run(self): + dash_app = dash.Dash(__name__) + X = [1, 2, 3, 4, 5, 6] + Y = [2, 4, 8, 16, 32, 64] + fig = px.line(x=X, y=Y) + + dash_app.layout = dash.html.Div(children=[ + dash.html.H1(children='⚡ Hello Dash + Lightning⚡'), + dash.html.Div(children='The Dash framework running inside a ⚡ Lightning App'), + dash.dcc.Graph(id='example-graph', figure=fig) + ]) + + dash_app.run_server(host=self.host, port=self.port) + + class LitApp(L.LightningFlow): + def __init__(self): + super().__init__() + self.lit_dash = LitDash(parallel=True) + + def run(self): + self.lit_dash.run() + + def configure_layout(self): + tab1 = {"name": "home", "content": self.lit_dash} + return tab1 + + app = L.LightningApp(LitApp()) + +We use the ``parallel=True`` argument of ``LightningWork`` to run the server in the background +while the rest of the Lightning App runs everything else. diff --git a/docs/source-app/workflows/add_web_ui/dash/index.rst b/docs/source-app/workflows/add_web_ui/dash/index.rst new file mode 100644 index 0000000..5abb444 --- /dev/null +++ b/docs/source-app/workflows/add_web_ui/dash/index.rst @@ -0,0 +1,84 @@ +:orphan: + +.. toctree:: + :maxdepth: 1 + :hidden: + + basic + intermediate + +###################### +Add a web UI with Dash +###################### + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: 1: Connect Dash + :description: Learn how to connect a Dash app. + :col_css: col-md-6 + :button_link: basic.html + :height: 150 + :tag: basic + +.. displayitem:: + :header: 2: Enable two-way communication + :description: Enable two-way communication between the dash app and a Lightning App. + :col_css: col-md-6 + :button_link: intermediate.html + :height: 150 + :tag: [docs coming soon] + +.. raw:: html + +
+
+ +---- + +******** +Examples +******** +Here are a few example apps that use a Dash web UI. + + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: Example 1 + :description: Show off your work! Contribute an example. + :col_css: col-md-4 + :button_link: ../../../contribute_app.html + :height: 150 + :tag: Waiting for contributed example + +.. displayitem:: + :header: Example 2 + :description: Show off your work! Contribute an example. + :col_css: col-md-4 + :button_link: ../../../contribute_app.html + :height: 150 + :tag: Waiting for contributed example + +.. displayitem:: + :header: Example 3 + :description: Show off your work! Contribute an example. + :col_css: col-md-4 + :button_link: ../../../contribute_app.html + :height: 150 + :tag: Waiting for contributed example + +.. raw:: html + +
+
+ diff --git a/docs/source-app/workflows/add_web_ui/dash/intermediate.rst b/docs/source-app/workflows/add_web_ui/dash/intermediate.rst new file mode 100644 index 0000000..c13b34b --- /dev/null +++ b/docs/source-app/workflows/add_web_ui/dash/intermediate.rst @@ -0,0 +1,42 @@ +##################################### +Add a web UI with Dash (intermediate) +##################################### +**Audience:** Users who want to communicate between the Lightning App and Dash. + +**Prereqs:** Must have read the `dash basic `_ guide. + +---- + +******************************* +Interact with the App from Dash +******************************* + +In the example below, every time you change the selected year on the dashboard, this is directly communicated to the flow +and another work processes the associated data frame with the provided year. + +.. literalinclude:: intermediate_plot.py + +Here is what the app looks like once running: + +.. figure:: https://pl-public-data.s3.amazonaws.com/assets_lightning/dash_plot.gif + +---- + +*********************************** +Interact with Dash from a component +*********************************** + +In the example below, when you click the toggle, the state of the work appears. + +Install the following libraries if you want to run the app. + +.. code:: bash + +    pip install dash_daq dash_renderjson + +.. literalinclude:: intermediate_state.py + + +Here is what the app looks like once running: + +.. 
figure:: https://pl-public-data.s3.amazonaws.com/assets_lightning/dash_state.gif diff --git a/docs/source-app/workflows/add_web_ui/dash/intermediate_plot.py b/docs/source-app/workflows/add_web_ui/dash/intermediate_plot.py new file mode 100644 index 0000000..4d8733b --- /dev/null +++ b/docs/source-app/workflows/add_web_ui/dash/intermediate_plot.py @@ -0,0 +1,86 @@ +from typing import Optional + +import pandas as pd +import plotly.express as px +from dash import Dash, dcc, html, Input, Output + +import lightning as L +from lightning.app.storage import Payload + + +class LitDash(L.LightningWork): + def __init__(self): + super().__init__(parallel=True) + self.df = None + self.selected_year = None + + def run(self): + df = pd.read_csv("https://raw.githubusercontent.com/plotly/datasets/master/gapminderDataFiveYear.csv") + self.df = Payload(df) + + dash_app = Dash(__name__) + + dash_app.layout = html.Div( + [ + dcc.Graph(id="graph-with-slider"), + dcc.Slider( + df["year"].min(), + df["year"].max(), + step=None, + value=df["year"].min(), + marks={str(year): str(year) for year in df["year"].unique()}, + id="year-slider", + ), + ] + ) + + @dash_app.callback(Output("graph-with-slider", "figure"), Input("year-slider", "value")) + def update_figure(selected_year): + self.selected_year = selected_year + filtered_df = df[df.year == selected_year] + + fig = px.scatter( + filtered_df, + x="gdpPercap", + y="lifeExp", + size="pop", + color="continent", + hover_name="country", + log_x=True, + size_max=55, + ) + + fig.update_layout(transition_duration=500) + + return fig + + dash_app.run_server(host=self.host, port=self.port) + + +class Processor(L.LightningWork): + def run(self, df: Payload, selected_year: Optional[str]): + if selected_year: + df = df.value + filtered_df = df[df.year == selected_year] + print(f"[PROCESSOR|selected_year={selected_year}]") + print(filtered_df) + + +class LitApp(L.LightningFlow): + def __init__(self): + super().__init__() + self.lit_dash = LitDash() + 
self.processor = Processor(parallel=True) + + def run(self): + self.lit_dash.run() + + # Launch some processing based on the Dash Dashboard. + self.processor.run(self.lit_dash.df, self.lit_dash.selected_year) + + def configure_layout(self): + tab1 = {"name": "home", "content": self.lit_dash} + return tab1 + + +app = L.LightningApp(LitApp()) diff --git a/docs/source-app/workflows/add_web_ui/dash/intermediate_state.py b/docs/source-app/workflows/add_web_ui/dash/intermediate_state.py new file mode 100644 index 0000000..d2e37a5 --- /dev/null +++ b/docs/source-app/workflows/add_web_ui/dash/intermediate_state.py @@ -0,0 +1,39 @@ +import dash +import dash_daq as daq +import dash_renderjson +from dash import html, Input, Output + +import lightning as L +from lightning.app.utilities.state import AppState + + +class LitDash(L.LightningWork): + def run(self): + dash_app = dash.Dash(__name__) + + dash_app.layout = html.Div([daq.ToggleSwitch(id="my-toggle-switch", value=False), html.Div(id="output")]) + + @dash_app.callback(Output("output", "children"), [Input("my-toggle-switch", "value")]) + def display_output(value): + if value: + state = AppState() + state._request_state() + return dash_renderjson.DashRenderjson(id="input", data=state._state, max_depth=-1, invert_theme=True) + + dash_app.run_server(host=self.host, port=self.port) + + +class LitApp(L.LightningFlow): + def __init__(self): + super().__init__() + self.lit_dash = LitDash(parallel=True) + + def run(self): + self.lit_dash.run() + + def configure_layout(self): + tab1 = {"name": "home", "content": self.lit_dash} + return tab1 + + +app = L.LightningApp(LitApp()) diff --git a/docs/source-app/workflows/add_web_ui/example_app.rst b/docs/source-app/workflows/add_web_ui/example_app.rst new file mode 100644 index 0000000..e5d2cbb --- /dev/null +++ b/docs/source-app/workflows/add_web_ui/example_app.rst @@ -0,0 +1,7 @@ +:orphan: + +########### +Example App +########### + +This is an example app that needs to be built for this 
part of the docs. diff --git a/docs/source-app/workflows/add_web_ui/glossary_front_end.rst b/docs/source-app/workflows/add_web_ui/glossary_front_end.rst new file mode 100644 index 0000000..ce51ef1 --- /dev/null +++ b/docs/source-app/workflows/add_web_ui/glossary_front_end.rst @@ -0,0 +1,9 @@ +######## +Frontend +######## +Web pages visible to users are also known as **front-ends**. Lightning Apps can have multiple +types of Frontends. + +---- + +.. include:: index_content.rst diff --git a/docs/source-app/workflows/add_web_ui/glossary_ui.rst b/docs/source-app/workflows/add_web_ui/glossary_ui.rst new file mode 100644 index 0000000..bc9e4f5 --- /dev/null +++ b/docs/source-app/workflows/add_web_ui/glossary_ui.rst @@ -0,0 +1,9 @@ +################### +UI (User Interface) +################### +We use (UI) as short for a **web page** with interactions. Lightning Apps can have multiple +types of UIs. + +---- + +.. include:: index_content.rst diff --git a/docs/source-app/workflows/add_web_ui/gradio/basic.rst b/docs/source-app/workflows/add_web_ui/gradio/basic.rst new file mode 100644 index 0000000..4f5ab87 --- /dev/null +++ b/docs/source-app/workflows/add_web_ui/gradio/basic.rst @@ -0,0 +1,217 @@ +################################ +Add a web UI with Gradio (basic) +################################ +**Audience:** Users who want to add a web UI written with Python. + +**Prereqs:** Basic python knowledge. + +---- + +*************** +What is Gradio? +*************** +Gradio is a Python library that automatically generates a web interface to demo a machine learning model. + +---- + +***************** +Install gradio +***************** +First, install gradio. + +.. code:: bash + + pip install gradio + +---- + +************************** +Create the gradio demo app +************************** +To explain how to use Gradio with Lightning, let's replicate the |gradio_link|. + +.. 
|gradio_link| raw:: html + + example running here + +In the next few sections we'll build an app step-by-step. +First **create a file named app.py** with the app content: + +.. code:: python + + import lightning as L + from lightning.app.components import ServeGradio + import gradio as gr + + class LitGradio(ServeGradio): + + inputs = gr.inputs.Textbox(default='lightning', label='name input') + outputs = gr.outputs.Textbox(label='output') + examples = [["hello lightning"]] + + def predict(self, input_text): + return self.model(input_text) + + def build_model(self): + fake_model = lambda x: f"hello {x}" + return fake_model + + class RootFlow(L.LightningFlow): + def __init__(self): + super().__init__() + self.lit_gradio = LitGradio() + + def run(self): + self.lit_gradio.run() + + def configure_layout(self): + return [{"name": "home", "content": self.lit_gradio}] + + app = L.LightningApp(RootFlow()) + +Add "gradio" to a requirements.txt file: + +.. code:: bash + + echo 'gradio' >> requirements.txt + +This is a best practice to make apps reproducible. + +---- + +*********** +Run the app +*********** +Run the app locally to see it! + +.. code:: bash + + lightning run app app.py + +Now run it on the cloud as well: + +.. code:: bash + + lightning run app app.py --cloud + +---- + +************************ +Step-by-step walkthrough +************************ +In this section, we explain each part of this code in detail. + +---- + +Create a Gradio component +^^^^^^^^^^^^^^^^^^^^^^^^^ +To create a Gradio component, simply take any Gradio app and subclass it from ``ServeGradio``. +If you haven't created a Gradio demo, you have to implement the following elements: + +1. Input which is text. +2. Output which is text. +3. A build_model function. +4. A predict function. + +| + +Here's an example: + +.. 
code:: python + :emphasize-lines: 4 + + from lightning.app.components import ServeGradio + import gradio as gr + + class LitGradio(ServeGradio): + + inputs = gr.inputs.Textbox(default='lightning', label='name input') + outputs = gr.outputs.Textbox(label='output') + + def predict(self, input_text): + return self.model(input_text) + + def build_model(self): + fake_model = lambda x: f"hello {x}" + return fake_model + +This fake model simply concatenates 2 strings. + +---- + +Route the UI in the root component +^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +Now, tell the Root component in which tab to render this component's UI. +In this case, we render the ``LitGradio`` UI in the ``home`` tab of the application. + +.. code:: python + :emphasize-lines: 21, 27 + + import lightning as L + from lightning.app.components import ServeGradio + import gradio as gr + + class LitGradio(ServeGradio): + + inputs = gr.inputs.Textbox(default='lightning', label='name input') + outputs = gr.outputs.Textbox(label='output') + examples = [["hello lightning"]] + + def predict(self, input_text): + return self.model(input_text) + + def build_model(self): + fake_model = lambda x: f"hello {x}" + return fake_model + + class RootFlow(L.LightningFlow): + def __init__(self): + super().__init__() + self.lit_gradio = LitGradio() + + def run(self): + self.lit_gradio.run() + + def configure_layout(self): + return [{"name": "home", "content": self.lit_gradio}] + + app = L.LightningApp(RootFlow()) + +---- + +Call run +^^^^^^^^ +Finally, don't forget to call run inside the Root Flow to serve the Gradio app. + +.. 
code:: python + :emphasize-lines: 24 + + import lightning as L + from lightning.app.components import ServeGradio + import gradio as gr + + class LitGradio(ServeGradio): + + inputs = gr.inputs.Textbox(default='lightning', label='name input') + outputs = gr.outputs.Textbox(label='output') + examples = [["hello lightning"]] + + def predict(self, input_text): + return self.model(input_text) + + def build_model(self): + fake_model = lambda x: f"hello {x}" + return fake_model + + class RootFlow(L.LightningFlow): + def __init__(self): + super().__init__() + self.lit_gradio = LitGradio() + + def run(self): + self.lit_gradio.run() + + def configure_layout(self): + return [{"name": "home", "content": self.lit_gradio}] + + app = L.LightningApp(RootFlow()) diff --git a/docs/source-app/workflows/add_web_ui/gradio/index.rst b/docs/source-app/workflows/add_web_ui/gradio/index.rst new file mode 100644 index 0000000..740ae93 --- /dev/null +++ b/docs/source-app/workflows/add_web_ui/gradio/index.rst @@ -0,0 +1,84 @@ +:orphan: + +.. toctree:: + :maxdepth: 1 + :hidden: + + basic + intermediate + +######################## +Add a web UI with Gradio +######################## + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: 1: Connect Gradio + :description: Learn how to connect Gradio to a Lightning Component. + :col_css: col-md-6 + :button_link: basic.html + :height: 150 + :tag: basic + +.. displayitem:: + :header: 2: Enable two-way communication + :description: Enable two-way communication between Gradio and a Lightning App. + :col_css: col-md-6 + :button_link: intermediate.html + :height: 150 + :tag: [documentation coming soon] + +.. raw:: html + +
+
+ +---- + +******** +Examples +******** +Here are a few example apps that use a Gradio web UI. + + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: Example 1 + :description: Show off your work! Contribute an example. + :col_css: col-md-4 + :button_link: ../../../contribute_app.html + :height: 150 + :tag: Waiting for contributed example + +.. displayitem:: + :header: Example 2 + :description: Show off your work! Contribute an example. + :col_css: col-md-4 + :button_link: ../../../contribute_app.html + :height: 150 + :tag: Waiting for contributed example + +.. displayitem:: + :header: Example 3 + :description: Show off your work! Contribute an example. + :col_css: col-md-4 + :button_link: ../../../contribute_app.html + :height: 150 + :tag: Waiting for contributed example + +.. raw:: html + +
+
diff --git a/docs/source-app/workflows/add_web_ui/gradio/intermediate.rst b/docs/source-app/workflows/add_web_ui/gradio/intermediate.rst new file mode 100644 index 0000000..bb20d56 --- /dev/null +++ b/docs/source-app/workflows/add_web_ui/gradio/intermediate.rst @@ -0,0 +1,21 @@ +####################################### +Add a web UI with Gradio (intermediate) +####################################### + +.. note:: documentation coming soon. + + +************************************* +Interact with a component from the UI +************************************* + +.. warning:: is there such a thing for this with gradio? + + +---- + +************************************* +Interact with the UI from a component +************************************* + +.. warning:: is there such a thing for this with gradio? diff --git a/docs/source-app/workflows/add_web_ui/html/basic.rst b/docs/source-app/workflows/add_web_ui/html/basic.rst new file mode 100644 index 0000000..cb9bb52 --- /dev/null +++ b/docs/source-app/workflows/add_web_ui/html/basic.rst @@ -0,0 +1,166 @@ +############################## +Add a web UI with HTML (basic) +############################## +**Audience:** Users who want to add a web UI written in HTML. + +**Prereqs:** Basic html knowledge. + +---- + +************* +What is HTML? +************* +HyperText Markup Language (HTML) is the language used to create web pages. Use HTML for simple +web user interfaces that tend to be more static. + +For reactive web applications, we recommend using: React.js, Angular.js or Vue.js + +---- + +******************* +Create an HTML page +******************* +The first step is to create an HTML file named **index.html**: + +.. code:: html + + + + + + +

Hello World

+ + + +---- + +************************ +Create the HTML demo app +************************ + +.. + To explain how to use html with Lightning, let's replicate the |html_app_link|. + + .. |html_app_link| raw:: html + + example running here + +In the next few sections we'll build an app step-by-step. +First **create a file named app.py** with the app content (in the same folder as index.html): + +.. code:: bash + + # app.py + import lightning as L + import lightning.app.frontend as frontend + + + class HelloComponent(L.LightningFlow): + def configure_layout(self): + return frontend.StaticWebFrontend(serve_dir='.') + + + class LitApp(L.LightningFlow): + def __init__(self): + super().__init__() + self.hello_component = HelloComponent() + + def run(self): + self.hello_component.run() + + def configure_layout(self): + tab1 = {"name": "home", "content": self.hello_component} + return tab1 + + + app = L.LightningApp(LitApp()) + +---- + +*********** +Run the app +*********** +Run the app locally to see it! + +.. code:: python + + lightning run app app.py + +Now run it on the cloud as well: + +.. code:: python + + lightning run app app.py --cloud + +---- + +************************ +Step-by-step walkthrough +************************ +In this section, we explain each part of this code in detail. + +---- + +Enable an HTML UI for the component +^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +Give the component an HTML UI, by returning a ``StaticWebFrontend`` object from the ``configure_layout`` method: + +.. 
code:: bash + :emphasize-lines: 6,7 + + # app.py + import lightning as L + import lightning.app.frontend as frontend + + class HelloComponent(L.LightningFlow): + def configure_layout(self): + return frontend.StaticWebFrontend(serve_dir='.') + + class LitApp(L.LightningFlow): + def __init__(self): + super().__init__() + self.hello_component = HelloComponent() + + def run(self): + self.hello_component.run() + + def configure_layout(self): + tab1 = {"name": "home", "content": self.hello_component} + return tab1 + + app = L.LightningApp(LitApp()) + +The folder path given in ``StaticWebFrontend(serve_dir=)`` must point to a folder with an ``index.html`` page. + +---- + +Route the UI in the root component +^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +The final step, is to tell the Root component in which tab to render this component's UI. +In this case, we render the ``HelloComponent`` UI in the ``home`` tab of the application. + +.. code:: python + :emphasize-lines: 18, 19 + + # app.py + import lightning as L + import lightning.app.frontend as frontend + + class HelloComponent(L.LightningFlow): + def configure_layout(self): + return frontend.StaticWebFrontend(serve_dir='.') + + class LitApp(L.LightningFlow): + def __init__(self): + super().__init__() + self.hello_component = HelloComponent() + + def run(self): + self.hello_component.run() + + def configure_layout(self): + tab1 = {"name": "home", "content": self.hello_component} + return tab1 + + app = L.LightningApp(LitApp()) diff --git a/docs/source-app/workflows/add_web_ui/html/index.rst b/docs/source-app/workflows/add_web_ui/html/index.rst new file mode 100644 index 0000000..0eae930 --- /dev/null +++ b/docs/source-app/workflows/add_web_ui/html/index.rst @@ -0,0 +1,87 @@ +:orphan: + +.. toctree:: + :maxdepth: 1 + :hidden: + + basic + intermediate + +###################### +Add a web UI with HTML +###################### +**Audience:** Users who want to add a web UI using plain html. + +**Prereqs:** Basic html knowledge. + +.. 
raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: 1: Connect HTML + :description: Learn how to connect an HTML app. + :col_css: col-md-6 + :button_link: basic.html + :height: 150 + :tag: basic + +.. displayitem:: + :header: 2: Enable two-way communication + :description: Enable two-way communication between HTML and a Lightning App. + :col_css: col-md-6 + :button_link: intermediate.html + :height: 150 + :tag: [docs coming soon] + +.. raw:: html + +
+
+ +---- + +******** +Examples +******** +Here are a few example apps that use an HTML web UI. + + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: Example 1 + :description: Show off your work! Contribute an example. + :col_css: col-md-4 + :button_link: ../../../contribute_app.html + :height: 150 + :tag: Waiting for contributed example + +.. displayitem:: + :header: Example 2 + :description: Show off your work! Contribute an example. + :col_css: col-md-4 + :button_link: ../../../contribute_app.html + :height: 150 + :tag: Waiting for contributed example + +.. displayitem:: + :header: Example 3 + :description: Show off your work! Contribute an example. + :col_css: col-md-4 + :button_link: ../../../contribute_app.html + :height: 150 + :tag: Waiting for contributed example + +.. raw:: html + +
+
diff --git a/docs/source-app/workflows/add_web_ui/html/intermediate.rst b/docs/source-app/workflows/add_web_ui/html/intermediate.rst new file mode 100644 index 0000000..e2d0f96 --- /dev/null +++ b/docs/source-app/workflows/add_web_ui/html/intermediate.rst @@ -0,0 +1,20 @@ +##################################### +Add a web UI with HTML (intermediate) +##################################### +**Audience:** Users who want to add a web UI using plain html. + +**Prereqs:** Must have read the `html basic `_ guide. + +---- + +******************************* +Interact with the App from HTML +******************************* +.. note:: documentation in progress + +---- + +*********************************** +Interact with HTML from a component +*********************************** +.. note:: documentation in progress diff --git a/docs/source-app/workflows/add_web_ui/index.rst b/docs/source-app/workflows/add_web_ui/index.rst new file mode 100644 index 0000000..79c0f16 --- /dev/null +++ b/docs/source-app/workflows/add_web_ui/index.rst @@ -0,0 +1,10 @@ + +############################# +Add a web user interface (UI) +############################# + +**Audience:** Users who want to add a UI to their Lightning Apps + +---- + +.. include:: index_content.rst diff --git a/docs/source-app/workflows/add_web_ui/index_content.rst b/docs/source-app/workflows/add_web_ui/index_content.rst new file mode 100644 index 0000000..f3d516c --- /dev/null +++ b/docs/source-app/workflows/add_web_ui/index_content.rst @@ -0,0 +1,121 @@ +************************************* +Web UIs for non Javascript Developers +************************************* + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: Dash + :description: Learn how to add a web UI built in Python with Dash. + :col_css: col-md-4 + :button_link: ../../workflows/add_web_ui/dash/index.html + :height: 150 + :tag: basic + +.. displayitem:: + :header: Gradio + :description: Learn how to add a web UI built in Python with Gradio. + :col_css: col-md-4 + :button_link: ../../workflows/add_web_ui/gradio/index.html + :height: 150 + :tag: basic + +.. displayitem:: + :header: Panel + :description: Learn how to add a web UI built in Python with Panel. + :col_css: col-md-4 + :button_link: ../../workflows/add_web_ui/panel/index.html + :height: 150 + :tag: basic + +.. displayitem:: + :header: Jupyter Notebook + :description: Learn how to enable a web UI that is a Jupyter Notebook. + :col_css: col-md-4 + :button_link: ../../workflows/add_web_ui/jupyter_basic.html + :height: 150 + :tag: [docs coming soon] + +.. displayitem:: + :header: Streamlit + :description: Learn how to add a web UI built in Python with Streamlit. + :col_css: col-md-4 + :button_link: ../../workflows/add_web_ui/streamlit/index.html + :height: 150 + :tag: basic + +.. displayitem:: + :header: JustPy + :description: Learn how to add a web UI built in Python with JustPy. + :col_css: col-md-4 + :button_link: ../../workflows/add_web_ui/justpy/index.html + :height: 150 + :tag: basic + +.. raw:: html + +
+
+ +---- + +********************************* +Web UIs for Javascript Developers +********************************* + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: Any javascript framework + :description: Learn how to link up any javascript framework to a Lightning app. + :col_css: col-md-4 + :button_link: ../../workflows/add_web_ui/integrate_any_javascript_framework.html + :height: 150 + :tag: advanced + +.. displayitem:: + :header: Angular.js + :description: Learn how to add a web UI built in Javascript with Angular.js + :col_css: col-md-4 + :button_link: ../../workflows/add_web_ui/angular_js_intermediate.html + :height: 150 + :tag: [Docs coming soon] + +.. displayitem:: + :header: HTML + :description: Learn how to add a web UI built with html. + :col_css: col-md-4 + :button_link: ../../workflows/add_web_ui/html/index.html + :height: 150 + :tag: basic + +.. displayitem:: + :header: React.js + :description: Learn how to add a web UI built in Javascript with React.js + :col_css: col-md-4 + :button_link: ../../workflows/add_web_ui/react/index.html + :height: 150 + :tag: intermediate + +.. displayitem:: + :header: Vue.js + :description: Learn how to add a web UI built in Javascript with Vue.js + :col_css: col-md-4 + :button_link: ../../workflows/add_web_ui/vue_js_intermediate.html + :height: 150 + :tag: [Docs coming soon] + +.. raw:: html + +
+
diff --git a/docs/source-app/workflows/add_web_ui/integrate_any_javascript_framework.rst b/docs/source-app/workflows/add_web_ui/integrate_any_javascript_framework.rst new file mode 100644 index 0000000..f1da660 --- /dev/null +++ b/docs/source-app/workflows/add_web_ui/integrate_any_javascript_framework.rst @@ -0,0 +1,164 @@ +:orphan: + +################################## +Integrate any javascript framework +################################## +**Audience:** Advanced web developers with complex apps that may not have been covered by the other tutorials + +**Pre-requisites:** Intermediate knowledge of html and javascript + +---- + +************************ +Import LightningState.js +************************ +To connect any javascript framework, import the `LightningState.js `_ library. +LightningState.js enables two-way communication between a javascript framework and a Lightning app. + +To import this library, add this to your html: + +.. code:: html + + + +Once it's imported, use it inside your app, this example uses it inside a React App: + +.. code-block:: + :emphasize-lines: 1, 5 + + import { useLightningState } from "./hooks/useLightningState"; + import cloneDeep from "lodash/cloneDeep"; + + function App() { + const { lightningState, updateLightningState } = useLightningState(); + + const modify_and_send_back_the_state = async (event: ChangeEvent) => { + if (lightningState) { + const newLightningState = cloneDeep(lightningState); + // Update the state and send it back. + newLightningState.flows.counter += 1 + + updateLightningState(newLightningState); + } + }; + + return ( +
+
+ ); + } + + export default App; + +---- + +************************ +Update the Lightning app +************************ +Use `updateLightningState` to update the lightning app. Here we update a variable called counter. + +.. code-block:: + :emphasize-lines: 11 + + import { useLightningState } from "./hooks/useLightningState"; + import cloneDeep from "lodash/cloneDeep"; + + function App() { + const { lightningState, updateLightningState } = useLightningState(); + + const modify_and_send_back_the_state = async (event: ChangeEvent) => { + if (lightningState) { + const newLightningState = cloneDeep(lightningState); + // Update the state and send it back. + newLightningState.flows.counter += 1 + + updateLightningState(newLightningState); + } + }; + + return ( +
+
+ ); + } + + export default App; + +---- + +************************************** +Receive updates from the Lightning app +************************************** +Whenever a variable in the Lightning app changes, the javascript app will receive those values via `lightningState`. + +Extract any variable from the state and update the javascript app: + +.. code-block:: + :emphasize-lines: 5 + + import { useLightningState } from "./hooks/useLightningState"; + import cloneDeep from "lodash/cloneDeep"; + + function App() { + const { lightningState, updateLightningState } = useLightningState(); + + const modify_and_send_back_the_state = async (event: ChangeEvent) => { + if (lightningState) { + const newLightningState = cloneDeep(lightningState); + // Update the state and send it back. + newLightningState.flows.counter += 1 + + updateLightningState(newLightningState); + } + }; + + return ( +
+
+ ); + } + + export default App; + +---- + +******** +Examples +******** + +See this in action in these examples: + + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: React.js + :description: Explore how React.js uses lightningState.js + :col_css: col-md-4 + :button_link: react/communicate_between_react_and_lightning.html + :height: 150 + :tag: intermediate + +.. displayitem:: + :header: Example 2 + :description: Show off your work! Contribute an example. + :col_css: col-md-4 + :height: 150 + :tag: Waiting for contributed example + +.. displayitem:: + :header: Example 3 + :description: Show off your work! Contribute an example. + :col_css: col-md-4 + :height: 150 + :tag: Waiting for contributed example + +.. raw:: html + +
+
diff --git a/docs/source-app/workflows/add_web_ui/jupyter_basic.rst b/docs/source-app/workflows/add_web_ui/jupyter_basic.rst new file mode 100644 index 0000000..61f58ab --- /dev/null +++ b/docs/source-app/workflows/add_web_ui/jupyter_basic.rst @@ -0,0 +1,70 @@ +:orphan: + +##################################### +Add a Jupyter Notebook web UI (basic) +##################################### +**Audience:** Users who want to enable a Jupyter notebook UI. + +**Prereqs:** Basic python knowledge. + +TODO + +---- + +*************************** +What is a Jupyter Notebook? +*************************** + +TODO + +---- + +******************* +Install Jupyter Lab +******************* + +First, install Jupyter Lab. + +.. code:: bash + + pip install jupyterlab + +---- + +******** +Examples +******** +Here are a few example apps that use Jupyter Lab. + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: Example 1 + :description: TODO + :col_css: col-md-4 + :button_link: angular_js_intermediate.html + :height: 150 + +.. displayitem:: + :header: Example 2 + :description: TODO + :col_css: col-md-4 + :button_link: angular_js_intermediate.html + :height: 150 + +.. displayitem:: + :header: Example 3 + :description: TODO + :col_css: col-md-4 + :button_link: angular_js_intermediate.html + :height: 150 + +.. raw:: html + +
+
diff --git a/docs/source-app/workflows/add_web_ui/justpy/index.rst b/docs/source-app/workflows/add_web_ui/justpy/index.rst new file mode 100644 index 0000000..bf25a18 --- /dev/null +++ b/docs/source-app/workflows/add_web_ui/justpy/index.rst @@ -0,0 +1,92 @@ +:orphan: + +######################## +Add a web UI with JustPy +######################## + + +****** +JustPy +****** + +The `JustPy `_ framework is an object oriented high-level Python Web Framework that requires no JavaScript programming, while at the same time providing the full flexibility of a frontend framework. + +Additionally, it provides a higher level API called `Quasar `_ with stylized components. + + +You can install ``justpy`` from PyPI. + +.. code-block:: + + pip install justpy + +******* +Example +******* + + +In the following example, we are creating a simple UI with 2 buttons. +When clicking the first button, the flow state ``counter`` is incremented and re-rendered on the UI. + + +First of all, you would need to import the ``JustPyFrontend`` and return it from the ``configure_layout`` hook of the flow. + +.. code-block:: + + from typing import Callable + + from lightning import LightningApp, LightningFlow + from lightning.app.frontend import JustPyFrontend + + + class Flow(LightningFlow): + def __init__(self): + super().__init__() + self.counter = 0 + + def run(self): + print(self.counter) + + def configure_layout(self): + return JustPyFrontend(render_fn=render_fn) + +Secondly, you would need to implement a ``render_fn`` that takes as input a ``get_state`` function and returns a function. + + +.. 
code-block:: + + def render_fn(get_state: Callable) -> Callable: + import justpy as jp + + def webpage(): + wp = jp.QuasarPage(dark=True) + # the `a=wp` argument adds the div to the web page + d = jp.Div(classes="q-pa-md q-gutter-sm", a=wp) + container = jp.QBtn(color="primary", text="Counter: 0") + + async def click(*_): + state = get_state() + state.counter += 1 + container.text = f"Counter: {state.counter}" + + button = jp.QBtn(color="primary", text="Click Me!", click=click) + + d.add(button) + d.add(container) + + return wp + + return webpage + + +Finally, you can wrap your flow in a LightningApp. + +.. code-block:: + + app = LightningApp(Flow()) + +Now, you can run the Lightning App with: + +.. code-block:: + + lightning run app app.py diff --git a/docs/source-app/workflows/add_web_ui/panel/basic.rst b/docs/source-app/workflows/add_web_ui/panel/basic.rst new file mode 100644 index 0000000..8e72036 --- /dev/null +++ b/docs/source-app/workflows/add_web_ui/panel/basic.rst @@ -0,0 +1,369 @@ +:orphan: + +############################### +Add a web UI with Panel (basic) +############################### + +**Audience:** Users who want to add a web UI written with Python and Panel. + +**Prereqs:** Basic Python knowledge. + +---- + +************** +What is Panel? +************** + +`Panel`_ and the `HoloViz`_ ecosystem provide unique and powerful +features such as big data visualization using `DataShader`_, easy cross filtering +using `HoloViews`_, streaming and much more. + +* Panel is highly flexible and ties into the PyData and Jupyter ecosystems as you can develop in notebooks and use ipywidgets. You can also develop in .py files. + +* Panel is one of the most popular data app frameworks in Python with `more than 400,000 downloads a month `_. It's especially popular in the scientific community. + +* Panel is used, for example, by Rapids to power `CuxFilter`_, a CuDF based big data visualization framework. 
+ +* Panel can be deployed on your favorite server or cloud including `Lightning`_. + +.. figure:: https://pl-public-data.s3.amazonaws.com/assets_lightning/panel-intro.gif + :alt: Example Panel App + + Example Panel App + +Panel is **particularly well suited for Lightning Apps** that need to display live progress. This is because the Panel server can react +to state changes and asynchronously push messages from the server to the client using web socket communication. + +.. figure:: https://pl-public-data.s3.amazonaws.com/assets_lightning/panel-streaming-intro.gif + :alt: Example Panel Streaming App + + Example Panel Streaming App + +Install Panel with: + +.. code:: bash + + pip install panel + +---- + +********************* +Run a basic Panel App +********************* + +In the next few sections, we'll build an App step-by-step. + +First, create a file named ``app_panel.py`` with the App content: + +.. code:: python + + # app_panel.py + + import panel as pn + + pn.panel("Hello **Panel ⚡** World").servable() + +Then, create a file named ``app.py`` with the following App content: + +.. code:: python + + # app.py + + import lightning as L + from lightning.app.frontend import PanelFrontend + + + class LitPanel(L.LightningFlow): + + def configure_layout(self): + return PanelFrontend("app_panel.py") + + + class LitApp(L.LightningFlow): + def __init__(self): + super().__init__() + self.lit_panel = LitPanel() + + def run(self): + self.lit_panel.run() + + def configure_layout(self): + return {"name": "home", "content": self.lit_panel} + + + app = L.LightningApp(LitApp()) + +Finally, add ``panel`` to your ``requirements.txt`` file: + +.. code:: bash + + echo 'panel' >> requirements.txt + +.. note:: This is a best practice to make Apps reproducible. + +---- + +*********** +Run the App +*********** + +Run the App locally: + +.. code:: bash + + lightning run app app.py + +The App should look like this: + +.. 
figure:: https://pl-public-data.s3.amazonaws.com/assets_lightning/panel-lightning-basic.png + :alt: Basic Panel Lightning App + + Basic Panel Lightning App + +Now, run it on the cloud: + +.. code:: bash + + lightning run app app.py --cloud + +---- + +************************* +Step-by-step walk-through +************************* + +In this section, we explain each part of the code in detail. + +---- + +0. Define a Panel app +^^^^^^^^^^^^^^^^^^^^^ + +First, find the Panel app you want to integrate. In this example, that app looks like: + +.. code:: python + + import panel as pn + + pn.panel("Hello **Panel ⚡** World").servable() + +Refer to the `Panel documentation `_ and `awesome-panel.org `_ for more complex examples. + +---- + +1. Add Panel to a Component +^^^^^^^^^^^^^^^^^^^^^^^^^^^ + +Link this app to the Lightning App by using the ``PanelFrontend`` class which needs to be returned from +the ``configure_layout`` method of the Lightning Component you want to connect to Panel. + +.. code:: python + :emphasize-lines: 7-10 + + import lightning as L + from lightning.app.frontend import PanelFrontend + + + class LitPanel(L.LightningFlow): + + def configure_layout(self): + return PanelFrontend("app_panel.py") + + + class LitApp(L.LightningFlow): + def __init__(self): + super().__init__() + self.lit_panel = LitPanel() + + def run(self): + self.lit_panel.run() + + def configure_layout(self): + return {"name": "home", "content": self.lit_panel} + + + app = L.LightningApp(LitApp()) + +The argument of the ``PanelFrontend`` class, points to the script, notebook, or function that +runs your Panel app. + +---- + +2. Route the UI in the root component +^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + +The second step, is to tell the Root component in which tab to render this component's UI. +In this case, we render the ``LitPanel`` UI in the ``home`` tab of the app. + +.. 
code:: python + :emphasize-lines: 19-20 + + import lightning as L + from lightning.app.frontend import PanelFrontend + + + class LitPanel(L.LightningFlow): + + def configure_layout(self): + return PanelFrontend("app_panel.py") + + + class LitApp(L.LightningFlow): + def __init__(self): + super().__init__() + self.lit_panel = LitPanel() + + def run(self): + self.lit_panel.run() + + def configure_layout(self): + return {"name": "home", "content": self.lit_panel} + + app = L.LightningApp(LitApp()) + +---- + +************* +Tips & Tricks +************* + +0. Use autoreload while developing +^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + +To speed up your development workflow, you can run your Lightning App with Panel **autoreload** by +setting the environment variable ``PANEL_AUTORELOAD`` to ``yes``. + +Try running the following: + +.. code-block:: + + PANEL_AUTORELOAD=yes lightning run app app.py + +.. figure:: https://pl-public-data.s3.amazonaws.com/assets_lightning/panel-lightning-autoreload.gif + :alt: Basic Panel Lightning App with autoreload + + Basic Panel Lightning App with autoreload + +1. Theme your App +^^^^^^^^^^^^^^^^^ + +To theme your App, you can use the Lightning accent color ``#792EE5`` with the `FastListTemplate`_. + +Try replacing the contents of ``app_panel.py`` with the following: + +.. 
code:: bash + + # app_panel.py + + import panel as pn + import plotly.express as px + + ACCENT = "#792EE5" + + pn.extension("plotly", sizing_mode="stretch_width", template="fast") + pn.state.template.param.update( + title="⚡ Hello Panel + Lightning ⚡", accent_base_color=ACCENT, header_background=ACCENT + ) + + pn.config.raw_css.append( + """ + .bk-root:first-of-type { + height: calc( 100vh - 200px ) !important; + } + """ + ) + + + def get_panel_theme(): + """Returns 'default' or 'dark'""" + return pn.state.session_args.get("theme", [b"default"])[0].decode() + + + def get_plotly_template(): + if get_panel_theme() == "dark": + return "plotly_dark" + return "plotly_white" + + + def get_plot(length=5): + xseries = [index for index in range(length + 1)] + yseries = [x**2 for x in xseries] + fig = px.line( + x=xseries, + y=yseries, + template=get_plotly_template(), + color_discrete_sequence=[ACCENT], + range_x=(0, 10), + markers=True, + ) + fig.layout.autosize = True + return fig + + + length = pn.widgets.IntSlider(value=5, start=1, end=10, name="Length") + dynamic_plot = pn.panel( + pn.bind(get_plot, length=length), sizing_mode="stretch_both", config={"responsive": True} + ) + pn.Column(length, dynamic_plot).servable() + + +Install some additional libraries and remember to add the dependencies to the ``requirements.txt`` file: + + +.. code:: bash + + echo 'plotly' >> requirements.txt + echo 'pandas' >> requirements.txt + +Finally run the App + +.. code:: bash + + lightning run app app.py + +.. figure:: https://pl-public-data.s3.amazonaws.com/assets_lightning/panel-lightning-theme.gif + :alt: Basic Panel Plotly Lightning App with theming + + Basic Panel Plotly Lightning App with theming + +.. _Panel: https://panel.holoviz.org/ +.. _FastListTemplate: https://panel.holoviz.org/reference/templates/FastListTemplate.html#templates-gallery-fastlisttemplate +.. _HoloViz: https://holoviz.org/ +.. _DataShader: https://datashader.org/ +.. _HoloViews: https://holoviews.org/ +.. 
_Lightning: https://lightning.ai/ +.. _CuxFilter: https://github.com/rapidsai/cuxfilter +.. _AwesomePanel: https://awesome-panel.org/home + + +---- + +********** +Next Steps +********** + +.. raw:: html + +
+
+ +.. displayitem:: + :header: 2: Enable two-way communication + :description: Enable two-way communication between Panel and a Lightning App. + :col_css: col-md-6 + :button_link: intermediate.html + :height: 150 + :tag: intermediate + +.. displayitem:: + :header: Add a web user interface (UI) + :description: Users who want to add a UI to their Lightning Apps + :col_css: col-md-6 + :button_link: ../index.html + :height: 150 + :tag: intermediate + +.. raw:: html + +
+
diff --git a/docs/source-app/workflows/add_web_ui/panel/index.rst b/docs/source-app/workflows/add_web_ui/panel/index.rst new file mode 100644 index 0000000..0d48a1d --- /dev/null +++ b/docs/source-app/workflows/add_web_ui/panel/index.rst @@ -0,0 +1,85 @@ +:orphan: + +.. toctree:: + :maxdepth: 1 + :hidden: + + basic + intermediate + +####################### +Add a web UI with Panel +####################### + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: 1: Connect Panel + :description: Learn how to connect Panel to a Lightning Component. + :col_css: col-md-6 + :button_link: basic.html + :height: 150 + :tag: basic + +.. displayitem:: + :header: 2: Enable two-way communication + :description: Enable two-way communication between Panel and a Lightning App. + :col_css: col-md-6 + :button_link: intermediate.html + :height: 150 + :tag: intermediate + +.. raw:: html + +
+
+ +---- + +******** +Examples +******** + +Here are a few example apps that use a Panel web UI. + + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: Example 1 + :description: Show off your work! Contribute an example. + :col_css: col-md-4 + :button_link: ../../../contribute_app.html + :height: 150 + :tag: Waiting for contributed example + +.. displayitem:: + :header: Example 2 + :description: Show off your work! Contribute an example. + :col_css: col-md-4 + :button_link: ../../../contribute_app.html + :height: 150 + :tag: Waiting for contributed example + +.. displayitem:: + :header: Example 3 + :description: Show off your work! Contribute an example. + :col_css: col-md-4 + :button_link: ../../../contribute_app.html + :height: 150 + :tag: Waiting for contributed example + +.. raw:: html + +
+
diff --git a/docs/source-app/workflows/add_web_ui/panel/intermediate.rst b/docs/source-app/workflows/add_web_ui/panel/intermediate.rst new file mode 100644 index 0000000..be09e98 --- /dev/null +++ b/docs/source-app/workflows/add_web_ui/panel/intermediate.rst @@ -0,0 +1,210 @@ +:orphan: + +###################################### +Add a web UI with Panel (intermediate) +###################################### + +**Audience:** Users who want to communicate between the Lightning App and Panel. + +**Prereqs:** Must have read the `Panel basic `_ guide. + +---- + +************************************** +Interact with the Component from Panel +************************************** + +The ``PanelFrontend`` enables user interactions with the Lightning App using widgets. +You can modify the state variables of a Lightning Component using the ``AppStateWatcher``. + +For example, here we increase the ``count`` variable of the Lightning Component every time a user +presses a button: + +.. code:: python + + # app_panel.py + + import panel as pn + from lightning.app.frontend import AppStateWatcher + + pn.extension(sizing_mode="stretch_width") + + app = AppStateWatcher() + + submit_button = pn.widgets.Button(name="submit") + + @pn.depends(submit_button, watch=True) + def submit(_): + app.state.count += 1 + + @pn.depends(app.param.state) + def current_count(_): + return f"current count: {app.state.count}" + + pn.Column( + submit_button, + current_count, + ).servable() + + + +.. 
code:: python + + # app.py + + import lightning as L + from lightning.app.frontend import PanelFrontend + + class LitPanel(L.LightningFlow): + def __init__(self): + super().__init__() + self.count = 0 + self.last_count = 0 + + def run(self): + if self.count != self.last_count: + self.last_count = self.count + print("Count changed to: ", self.count) + + def configure_layout(self): + return PanelFrontend("app_panel.py") + + + class LitApp(L.LightningFlow): + def __init__(self): + super().__init__() + self.lit_panel = LitPanel() + + def run(self): + self.lit_panel.run() + + def configure_layout(self): + return {"name": "home", "content": self.lit_panel} + + + app = L.LightningApp(LitApp()) + +.. figure:: https://pl-public-data.s3.amazonaws.com/assets_lightning/panel-lightning-counter-from-frontend.gif + :alt: Panel Lightning App updating a counter from the frontend + + Panel Lightning App updating a counter from the frontend + +---- + +************************************ +Interact with Panel from a Component +************************************ + +To update the `PanelFrontend` from any Lightning Component, update the property in the Component. +Make sure to call the ``run`` method from the parent component. + +In this example, we update the ``count`` value of the Component: + +.. code:: python + + # app_panel.py + + import panel as pn + from lightning.app.frontend import AppStateWatcher + + app = AppStateWatcher() + + pn.extension(sizing_mode="stretch_width") + + def counter(state): + return f"Counter: {state.count}" + + last_update = pn.bind(counter, app.param.state) + + pn.panel(last_update).servable() + +.. 
code:: python + + # app.py + + from datetime import datetime as dt + from lightning.app.frontend import PanelFrontend + + import lightning as L + + + class LitPanel(L.LightningFlow): + def __init__(self): + super().__init__() + self.count = 0 + self._last_update = dt.now() + + def run(self): + now = dt.now() + if (now - self._last_update).microseconds >= 250: + self.count += 1 + self._last_update = now + print("Counter changed to: ", self.count) + + def configure_layout(self): + return PanelFrontend("app_panel.py") + + + class LitApp(L.LightningFlow): + def __init__(self): + super().__init__() + self.lit_panel = LitPanel() + + def run(self): + self.lit_panel.run() + + def configure_layout(self): + tab1 = {"name": "home", "content": self.lit_panel} + return tab1 + + app = L.LightningApp(LitApp()) + +.. figure:: https://pl-public-data.s3.amazonaws.com/assets_lightning/panel-lightning-counter-from-component.gif + :alt: Panel Lightning App updating a counter from the component + + Panel Lightning App updating a counter from the Component + +---- + +************* +Tips & Tricks +************* + +* Caching: Panel provides the easy-to-use, memory-based ``pn.state.cache`` ``dict`` cache. If you are looking for something persistent, try `DiskCache `_; it's really powerful and simple to use. You can use it to communicate large amounts of data between the components and frontend(s). + +* Notifications: Panel provides easy-to-use `notifications `_. You can, for example, use them to provide notifications about runs starting or ending. + +* Tabulator Table: Panel provides the `Tabulator table `_, which features expandable rows. The table is useful to provide, for example, an overview of your runs, and you can dig into the details by clicking and expanding a row. + +* Task Scheduling: Panel provides easy-to-use `task scheduling `_. You can use this to, for example, read and display files created by your components on a scheduled basis.
+ +* Terminal: Panel provides the `Xterm.js terminal `_ which can be used to display live logs from your components and allow you to provide a terminal interface to your component. + +.. figure:: https://pl-public-data.s3.amazonaws.com/assets_lightning/panel-lightning-github-runner.gif + :alt: Panel Lightning App running models on github + + Panel Lightning App running models on GitHub + +---- + +********** +Next Steps +********** + +.. raw:: html + +
+
+ +.. displayitem:: + :header: Add a web user interface (UI) + :description: Users who want to add a UI to their Lightning Apps + :col_css: col-md-6 + :button_link: ../index.html + :height: 150 + :tag: intermediate + +.. raw:: html + +
+
diff --git a/docs/source-app/workflows/add_web_ui/react/communicate_between_react_and_lightning.rst b/docs/source-app/workflows/add_web_ui/react/communicate_between_react_and_lightning.rst new file mode 100644 index 0000000..be92d75 --- /dev/null +++ b/docs/source-app/workflows/add_web_ui/react/communicate_between_react_and_lightning.rst @@ -0,0 +1,58 @@ +####################################### +Communicate Between React and Lightning +####################################### +**Audience:** Anyone who wants to add a web user interface (UI) written in react to their app. + +**pre-requisites:** Make sure you've already connected the React and Lightning app. + +**Difficulty level:** intermediate. + +---- + +************ +Example code +************ +To illustrate how to communicate between a React app and a lightning App, we'll be using the `example_app.py` file +which `lightning init react-ui `_ created: + +.. literalinclude:: ../../../../../src/lightning/app/cli/react-ui-template/example_app.py + +and the App.tsx file also created by `lightning init react-ui `_: + +.. literalinclude:: ../../../../../src/lightning/app/cli/react-ui-template/ui/src/App.tsx + +---- + +****************************** +Update React --> Lightning app +****************************** +To change the Lightning app from the React app, use `updateLightningState`. + +In this example, when you press **Start printing** in the React UI, it toggles +the `react_ui.vars.should_print`: + +.. literalinclude:: ../../../../../src/lightning/app/cli/react-ui-template/ui/src/App.tsx + :emphasize-lines: 20, 21, 23 + +By changing that variable in the Lightning app state, it sets **react_ui.should_print** to True, which enables the +Lightning app to print: + +.. 
literalinclude:: ../../../../../src/lightning/app/cli/react-ui-template/example_app.py + :emphasize-lines: 10, 22 + +---- + +****************************** +Update React <-- Lightning app +****************************** +To change the React app from the Lightning app, use the values from the `lightningState`. + +In this example, when the `react_ui.counter` increases in the Lightning app: + +.. literalinclude:: ../../../../../src/lightning/app/cli/react-ui-template/example_app.py + :emphasize-lines: 18, 24 + +The React UI updates the text on the screen to reflect the count: + +.. literalinclude:: ../../../../../src/lightning/app/cli/react-ui-template/ui/src/App.tsx + :emphasize-lines: 15 diff --git a/docs/source-app/workflows/add_web_ui/react/connect_react_and_lightning.rst b/docs/source-app/workflows/add_web_ui/react/connect_react_and_lightning.rst new file mode 100644 index 0000000..1fb78d1 --- /dev/null +++ b/docs/source-app/workflows/add_web_ui/react/connect_react_and_lightning.rst @@ -0,0 +1,107 @@ +################################ +Connect React to a Lightning app +################################ +**Audience:** Users who already have a react app and want to connect it to a Lightning app. + +**pre-requisites:** Make sure you already have a react app you want to connect. + +**Difficulty level:** intermediate. + +---- + +************ +Example code +************ +To illustrate how to connect a React app and a lightning App, we'll be using the `example_app.py` file +which `lightning init react-ui `_ created: + +.. literalinclude:: ../../../../../src/lightning/app/cli/react-ui-template/example_app.py + +and the App.tsx file also created by `lightning init react-ui `_: + +.. 
literalinclude:: ../../../../../src/lightning/app/cli/react-ui-template/ui/src/App.tsx + +---- + +************************************* +Connect the component to the react UI +************************************* +The first step is to connect the dist folder of the react app using `StaticWebFrontend`: + +.. literalinclude:: ../../../../../src/lightning/app/cli/react-ui-template/example_app.py + :emphasize-lines: 13 + +The dist folder must contain an index.html file, which is generated by the build command `yarn build` that +we'll explore later. + +---- + +********************************** +Connect component to the root flow +********************************** +Next, connect your component to the root flow. Display the react app on the tab of your choice +using `configure_layout`: + +.. literalinclude:: ../../../../../src/lightning/app/cli/react-ui-template/example_app.py + :emphasize-lines: 19, 27 + +---- + +********************************* +Connect React and Lightning state +********************************* +At this point, the React app will render in the Lightning app. Test it out! + +.. code:: bash + + lightning run app example_app.py + +However, to make powerful React+Lightning apps, you must also connect the Lightning App state to the react app. +These lines enable two-way communication between the react app and the Lightning app. + +.. literalinclude:: ../../../../../src/lightning/app/cli/react-ui-template/ui/src/App.tsx + :emphasize-lines: 10, 13 + +---- + +**************** +Component vs App +**************** +Notice that in this guide, we connected a single react app to a single component. + +.. literalinclude:: ../../../../../src/lightning/app/cli/react-ui-template/example_app.py + :emphasize-lines: 6-13 + +You can use this single react app for the FULL Lightning app, or you can specify a React app for EACH component. + +.. 
code:: python + :emphasize-lines: 5, 9, 18-20 + + import lightning as L + + + class ComponentA(L.LightningFlow): + def configure_layout(self): + return L.app.frontend.StaticWebFrontend(Path(__file__).parent / "react_app_1/dist") + + + class ComponentB(L.LightningFlow): + def configure_layout(self): + return L.app.frontend.StaticWebFrontend(Path(__file__).parent / "react_app_2/dist") + + + class HelloLitReact(L.LightningFlow): + def __init__(self): + super().__init__() + self.react_app_1 = ComponentA() + self.react_app_2 = ComponentB() + + def configure_layout(self): + tab_1 = {"name": "App 1", "content": self.react_app_1} + tab_2 = {"name": "App 2", "content": self.react_app_2} + return tab_1, tab_2 + + + app = L.LightningApp(HelloLitReact()) + +This is a powerful idea that allows each Lightning component to have a self-contained web UI. diff --git a/docs/source-app/workflows/add_web_ui/react/create_react_template.rst b/docs/source-app/workflows/add_web_ui/react/create_react_template.rst new file mode 100644 index 0000000..4e48f39 --- /dev/null +++ b/docs/source-app/workflows/add_web_ui/react/create_react_template.rst @@ -0,0 +1,51 @@ +###################################### +Create a React Template (intermediate) +###################################### +**Audience:** Anyone who wants to add a web user interface (UI) written in react to their app. + +---- + +************** +What is react? +************** +`React.js `_ is a JavaScript library for building user interfaces. +A huge number of websites are written in React.js (like Facebook). + +---- + +************************ +Bring your own React app +************************ +If you already have a React.js app, then you don't need the section below. However, it might be helpful +to see our React template so you can understand how to connect it to a Lightning app. 
+ +---- + +**************************** +Create the react-ui template +**************************** +Lightning can generate a react-ui template out of the box (generated with `Vite `_). + +Run this command to set up a react-ui template for a component: + +.. code:: bash + + lightning init react-ui + +If everything was successful, run the example_app.py listed in the output of the command: + +.. code:: bash + + INFO: Checking pre-requisites for react + INFO: + found npm version: 8.5.5 + found node version: 16.15.0 + found yarn version: 1.22.10 + + ... + ... + + ⚡ run the example_app.py to see it live! + lightning run app react-ui/example_app.py + +If the command didn't work, make sure to install `npm+nodejs `_, and `yarn `_. diff --git a/docs/source-app/workflows/add_web_ui/react/index.rst b/docs/source-app/workflows/add_web_ui/react/index.rst new file mode 100644 index 0000000..ba0f8d9 --- /dev/null +++ b/docs/source-app/workflows/add_web_ui/react/index.rst @@ -0,0 +1,106 @@ +:orphan: + +.. toctree:: + :maxdepth: 1 + :hidden: + + create_react_template + connect_react_and_lightning + communicate_between_react_and_lightning + react_development_workflow + +########################## +Add a web UI with React.js +########################## +**Audience:** Anyone who wants to add a web user interface (UI) written in react to their app. + +**Prereqs:** Basic html knowledge. + +---- + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: 1: Create a React project template + :description: Use our React template to start a react app or bring your own. + :col_css: col-md-6 + :button_link: create_react_template.html + :height: 150 + :tag: basic + +.. displayitem:: + :header: 2: Connect a React app and a Lightning app + :description: Learn how to connect a React app to a Lightning app. + :col_css: col-md-6 + :button_link: connect_react_and_lightning.html + :height: 150 + :tag: intermediate + +.. displayitem:: + :header: 3: Communicate between React and Lightning + :description: Learn how to communicate between a React app and a Lightning app. + :col_css: col-md-6 + :button_link: communicate_between_react_and_lightning.html + :height: 150 + :tag: intermediate + +.. displayitem:: + :header: 4: Develop like a React pro + :description: Learn the development workflow of a React developer. + :col_css: col-md-6 + :button_link: react_development_workflow.html + :height: 150 + :tag: intermediate + +.. raw:: html + +
+
+ +---- + +******** +Examples +******** +Here are a few example apps that use a React web UI. + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: Example 1 + :description: Show off your work! Contribute an example. + :col_css: col-md-4 + :button_link: ../../../contribute_app.html + :height: 150 + :tag: Waiting for contributed example + +.. displayitem:: + :header: Example 2 + :description: Show off your work! Contribute an example. + :col_css: col-md-4 + :button_link: ../../../contribute_app.html + :height: 150 + :tag: Waiting for contributed example + +.. displayitem:: + :header: Example 3 + :description: Show off your work! Contribute an example. + :col_css: col-md-4 + :button_link: ../../../contribute_app.html + :height: 150 + :tag: Waiting for contributed example + +.. raw:: html + +
+
diff --git a/docs/source-app/workflows/add_web_ui/react/react_development_workflow.rst b/docs/source-app/workflows/add_web_ui/react/react_development_workflow.rst new file mode 100644 index 0000000..02d855f --- /dev/null +++ b/docs/source-app/workflows/add_web_ui/react/react_development_workflow.rst @@ -0,0 +1,27 @@ +######################################### +Add a web UI with React.js (intermediate) +######################################### +**Audience:** Anyone who wants to add a web user interface (UI) written in react to their app. + +**pre-requisites:** You already have a React app connected with a Lightning app. + +---- + +********************** +Develop your react app +********************** +Every time you make a change to your React.js app, you must call `yarn build` to apply the changes (this is a React.js thing): + +.. code:: bash + + # if you're lost, the right folder has a package.json in it + cd folder-with-ui-folder/ui + yarn build + +This can get very repetitive, there is a "hot reload" command that you can enable with: + +.. code:: bash + + # TODO + +There are many other tricks that React.js developers use to improve their development speed. diff --git a/docs/source-app/workflows/add_web_ui/streamlit/basic.rst b/docs/source-app/workflows/add_web_ui/streamlit/basic.rst new file mode 100644 index 0000000..ced0314 --- /dev/null +++ b/docs/source-app/workflows/add_web_ui/streamlit/basic.rst @@ -0,0 +1,186 @@ +################################### +Add a web UI with Streamlit (basic) +################################### +**Audience:** Users who want to add a web UI written with Python. + +**Prereqs:** Basic python knowledge. + +---- + +****************** +What is Streamlit? +****************** +Streamlit is a web user interface builder for Python developers. Streamlit builds beautiful web pages +directly from Python. + +Install Streamlit with: + +.. 
code:: bash + + pip install streamlit + +---- + +************************* +Run a basic streamlit app +************************* + +.. + To explain how to use Streamlit with Lightning, let's replicate the |st_link|. + + .. |st_link| raw:: html + + example running here + +In the next few sections we'll build an app step-by-step. +First **create a file named app.py** with the app content: + +.. code:: python + + # app.py + import lightning as L + import lightning.app.frontend as frontend + import streamlit as st + + def your_streamlit_app(lightning_app_state): + st.write('hello world') + + class LitStreamlit(L.LightningFlow): + def configure_layout(self): + return frontend.StreamlitFrontend(render_fn=your_streamlit_app) + + class LitApp(L.LightningFlow): + def __init__(self): + super().__init__() + self.lit_streamlit = LitStreamlit() + + def run(self): + self.lit_streamlit.run() + + def configure_layout(self): + tab1 = {"name": "home", "content": self.lit_streamlit} + return tab1 + + app = L.LightningApp(LitApp()) + +add "streamlit" to a requirements.txt file: + +.. code:: bash + + echo 'streamlit' >> requirements.txt + +this is a best practice to make apps reproducible. + +---- + +*********** +Run the app +*********** +Run the app locally to see it! + +.. code:: python + + lightning run app app.py + +Now run it on the cloud as well: + +.. code:: python + + lightning run app app.py --cloud + +---- + +************************ +Step-by-step walkthrough +************************ +In this section, we explain each part of this code in detail. + +---- + +0. Define a streamlit app +^^^^^^^^^^^^^^^^^^^^^^^^^ +First, find the streamlit app you want to integrate. In this example, that app looks like: + +.. code:: python + + import streamlit as st + + def your_streamlit_app(): + st.write('hello world') + +Refer to the `Streamlit documentation `_ for more complex examples. + +---- + +1. 
Add Streamlit to a component +^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +Link this function to the Lightning App by using the ``StreamlitFrontend`` class which needs to be returned from +the ``configure_layout`` method of the Lightning component you want to connect to Streamlit. + +.. code:: python + :emphasize-lines: 9-11 + + # app.py + import lightning as L + import lightning.app.frontend as frontend + import streamlit as st + + def your_streamlit_app(lightning_app_state): + st.write('hello world') + + class LitStreamlit(L.LightningFlow): + def configure_layout(self): + return frontend.StreamlitFrontend(render_fn=your_streamlit_app) + + class LitApp(L.LightningFlow): + def __init__(self): + super().__init__() + self.lit_streamlit = LitStreamlit() + + def run(self): + self.lit_streamlit.run() + + def configure_layout(self): + tab1 = {"name": "home", "content": self.lit_streamlit} + return tab1 + + app = L.LightningApp(LitApp()) + +The ``render_fn`` argument of the ``StreamlitFrontend`` class, points to a function that runs your Streamlit app. +The first argument to the function is the lightning app state. Any changes to the app state update the app. + +---- + +2. Route the UI in the root component +^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +The second step, is to tell the Root component in which tab to render this component's UI. +In this case, we render the ``LitStreamlit`` UI in the ``home`` tab of the application. + +.. 
code:: python + :emphasize-lines: 22 + + # app.py + import lightning as L + import lightning.app.frontend as frontend + import streamlit as st + + def your_streamlit_app(lightning_app_state): + st.write('hello world') + + class LitStreamlit(L.LightningFlow): + def configure_layout(self): + return frontend.StreamlitFrontend(render_fn=your_streamlit_app) + + class LitApp(L.LightningFlow): + def __init__(self): + super().__init__() + self.lit_streamlit = LitStreamlit() + + def run(self): + self.lit_streamlit.run() + + def configure_layout(self): + tab1 = {"name": "home", "content": self.lit_streamlit} + return tab1 + + app = L.LightningApp(LitApp()) diff --git a/docs/source-app/workflows/add_web_ui/streamlit/index.rst b/docs/source-app/workflows/add_web_ui/streamlit/index.rst new file mode 100644 index 0000000..2496729 --- /dev/null +++ b/docs/source-app/workflows/add_web_ui/streamlit/index.rst @@ -0,0 +1,84 @@ +:orphan: + +.. toctree:: + :maxdepth: 1 + :hidden: + + basic + intermediate + +########################### +Add a web UI with Streamlit +########################### + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: 1: Connect Streamlit + :description: Learn how to connect Streamlit to a Lightning Component. + :col_css: col-md-6 + :button_link: basic.html + :height: 150 + :tag: basic + +.. displayitem:: + :header: 2: Enable two-way communication + :description: Enable two-way communication between Streamlit and a Lightning App. + :col_css: col-md-6 + :button_link: intermediate.html + :height: 150 + :tag: intermediate + +.. raw:: html + +
+
+ +---- + +******** +Examples +******** +Here are a few example apps that use a Streamlit web UI. + + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: Example 1 + :description: Show off your work! Contribute an example. + :col_css: col-md-4 + :button_link: ../../../contribute_app.html + :height: 150 + :tag: Waiting for contributed example + +.. displayitem:: + :header: Example 2 + :description: Show off your work! Contribute an example. + :col_css: col-md-4 + :button_link: ../../../contribute_app.html + :height: 150 + :tag: Waiting for contributed example + +.. displayitem:: + :header: Example 3 + :description: Show off your work! Contribute an example. + :col_css: col-md-4 + :button_link: ../../../contribute_app.html + :height: 150 + :tag: Waiting for contributed example + +.. raw:: html + +
+
diff --git a/docs/source-app/workflows/add_web_ui/streamlit/intermediate.rst b/docs/source-app/workflows/add_web_ui/streamlit/intermediate.rst new file mode 100644 index 0000000..bd10fe6 --- /dev/null +++ b/docs/source-app/workflows/add_web_ui/streamlit/intermediate.rst @@ -0,0 +1,105 @@ +########################################## +Add a web UI with Streamlit (intermediate) +########################################## +**Audience:** Users who want to communicate between the Lightning App and Streamlit. + +**Prereqs:** Must have read the `streamlit basic `_ guide. + +---- + +************************************ +Interact with the App from Streamlit +************************************ +The streamlit UI enables user interactions with the Lightning App via UI elements like buttons. +To modify the variables of a Lightning component, access the ``lightning_app_state`` variable in the function passed as ``render_fn``. + +For example, here we increase the count variable of the Lightning Component every time a user presses a button: + +.. 
code:: python + :emphasize-lines: 8, 14 + + # app.py + import lightning as L + import lightning.app.frontend as frontend + import streamlit as st + + + def your_streamlit_app(lightning_app_state): + if st.button("press to increase count"): + lightning_app_state.count += 1 + st.write(f"current count: {lightning_app_state.count}") + + + class LitStreamlit(L.LightningFlow): + def __init__(self): + super().__init__() + self.count = 0 + + def configure_layout(self): + return frontend.StreamlitFrontend(render_fn=your_streamlit_app) + + + class LitApp(L.LightningFlow): + def __init__(self): + super().__init__() + self.lit_streamlit = LitStreamlit() + + def run(self): + self.lit_streamlit.run() + + def configure_layout(self): + tab1 = {"name": "home", "content": self.lit_streamlit} + return tab1 + + + app = L.LightningApp(LitApp()) + +---- + +**************************************** +Interact with Streamlit from a component +**************************************** +To update the streamlit UI from any Lightning component, update the property in the component and make sure to call ``run`` from the +parent component. + +In this example we update the value of the counter from the component: + +.. 
code:: python + :emphasize-lines: 7, 15 + + # app.py + import lightning as L + import lightning.app.frontend as frontend + import streamlit as st + + + def your_streamlit_app(lightning_app_state): + st.write(f"current count: {lightning_app_state.count}") + + + class LitStreamlit(L.LightningFlow): + def __init__(self): + super().__init__() + self.count = 0 + + def run(self): + self.count += 1 + + def configure_layout(self): + return frontend.StreamlitFrontend(render_fn=your_streamlit_app) + + + class LitApp(L.LightningFlow): + def __init__(self): + super().__init__() + self.lit_streamlit = LitStreamlit() + + def run(self): + self.lit_streamlit.run() + + def configure_layout(self): + tab1 = {"name": "home", "content": self.lit_streamlit} + return tab1 + + + app = L.LightningApp(LitApp()) diff --git a/docs/source-app/workflows/add_web_ui/vue_js_intermediate.rst b/docs/source-app/workflows/add_web_ui/vue_js_intermediate.rst new file mode 100644 index 0000000..e8d9f3e --- /dev/null +++ b/docs/source-app/workflows/add_web_ui/vue_js_intermediate.rst @@ -0,0 +1,6 @@ +:orphan: + +####################################### +Add a web UI with Vue.js (intermediate) +####################################### +coming... diff --git a/docs/source-app/workflows/arrange_tabs/arrange_app_basic.rst b/docs/source-app/workflows/arrange_tabs/arrange_app_basic.rst new file mode 100644 index 0000000..91c0e53 --- /dev/null +++ b/docs/source-app/workflows/arrange_tabs/arrange_app_basic.rst @@ -0,0 +1,69 @@ +######################## +Arrange app tabs (basic) +######################## +**Audience:** Users who want to control the layout of their app user interface. + +---- + +***************************** +Enable a full-page single tab +***************************** + +To enable a single tab on the app UI, return a single dictionary from the ``configure_layout`` method: + +.. 
code:: python + :emphasize-lines: 9 + + import lightning as L + + + class DemoComponent(L.demo.dumb_component): + def configure_layout(self): + tab1 = {"name": "THE TAB NAME", "content": self.component_a} + return tab1 + + + app = L.LightningApp(DemoComponent()) + + +The "name" key defines the visible name of the tab on the UI. It also shows up in the URL. +The **"content"** key defines the target component to render in that tab. +When returning a single tab element like shown above, the UI will display it in full-page mode. + + +---- + +******************** +Enable multiple tabs +******************** + +.. code:: python + :emphasize-lines: 7 + + import lightning as L + + + class DemoComponent(L.demo.dumb_component): + def configure_layout(self): + tab1 = {"name": "Tab A", "content": self.component_a} + tab2 = {"name": "Tab B", "content": self.component_b} + return tab1, tab2 + + + app = L.LightningApp(DemoComponent()) + +The order matters! Try any of the following configurations: + +.. 
code:: python + :emphasize-lines: 4, 9 + + def configure_layout(self): + tab1 = {"name": "Tab A", "content": self.component_a} + tab2 = {"name": "Tab B", "content": self.component_b} + return tab1, tab2 + + + def configure_layout(self): + tab1 = {"name": "Tab A", "content": self.component_a} + tab2 = {"name": "Tab B", "content": self.component_b} + return tab2, tab1 diff --git a/docs/source-app/workflows/arrange_tabs/arrange_app_intermediate.rst b/docs/source-app/workflows/arrange_tabs/arrange_app_intermediate.rst new file mode 100644 index 0000000..c87965b --- /dev/null +++ b/docs/source-app/workflows/arrange_tabs/arrange_app_intermediate.rst @@ -0,0 +1,20 @@ +############################### +Arrange app tabs (intermediate) +############################### +TODO: + +---- + +*********************************** +Render components with a defined UI +*********************************** + +component directly + +---- + +************* +Render a link +************* + +tensorboard link diff --git a/docs/source-app/workflows/arrange_tabs/index.rst b/docs/source-app/workflows/arrange_tabs/index.rst new file mode 100644 index 0000000..f639c02 --- /dev/null +++ b/docs/source-app/workflows/arrange_tabs/index.rst @@ -0,0 +1,5 @@ +################ +Arrange App Tabs +################ + +.. include:: index_content.rst diff --git a/docs/source-app/workflows/arrange_tabs/index_content.rst b/docs/source-app/workflows/arrange_tabs/index_content.rst new file mode 100644 index 0000000..66ac932 --- /dev/null +++ b/docs/source-app/workflows/arrange_tabs/index_content.rst @@ -0,0 +1,34 @@ +.. toctree:: + :maxdepth: 1 + :hidden: + + arrange_app_basic + arrange_app_intermediate + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: Basic + :description: Learn how to enable and layout your app UI + :col_css: col-md-6 + :button_link: arrange_app_basic.html + :height: 150 + :tag: basic + +.. displayitem:: + :header: Intermediate + :description: Learn about all the possible ways of rendering a component. + :col_css: col-md-6 + :button_link: arrange_app_intermediate.html + :height: 150 + :tag: intermediate + +.. raw:: html + +
+
diff --git a/docs/source-app/workflows/build_command_line_interface/app.py b/docs/source-app/workflows/build_command_line_interface/app.py new file mode 100644 index 0000000..e5abeee --- /dev/null +++ b/docs/source-app/workflows/build_command_line_interface/app.py @@ -0,0 +1,35 @@ +from commands.notebook.run import RunNotebook, RunNotebookConfig +from lit_jupyter import JupyterLab + +import lightning as L +from lightning.app.structures import Dict + + +class Flow(L.LightningFlow): + def __init__(self): + super().__init__() + self.notebooks = Dict() + + # 1. Annotates the handler input with the Notebook config. + def run_notebook(self, config: RunNotebookConfig): + if config.name in self.notebooks: + return f"The Notebook {config.name} already exists." + else: + # 2. Dynamically creates the Notebook if it doesn't exist and runs it. + self.notebooks[config.name] = JupyterLab( + cloud_compute=L.CloudCompute(config.cloud_compute) + ) + self.notebooks[config.name].run() + return f"The Notebook {config.name} was created." + + def configure_commands(self): + # 3. Returns a list of dictionaries with the format: + # {"command_name": CustomClientCommand(method=self.custom_server_handler)} + return [{"run notebook": RunNotebook(method=self.run_notebook)}] + + def configure_layout(self): + # 4. Dynamically displays the Notebooks in the Lightning App View. + return [{"name": n, "content": w} for n, w in self.notebooks.items()] + + +app = L.LightningApp(Flow()) diff --git a/docs/source-app/workflows/build_command_line_interface/cli.rst b/docs/source-app/workflows/build_command_line_interface/cli.rst new file mode 100644 index 0000000..ffd9bc4 --- /dev/null +++ b/docs/source-app/workflows/build_command_line_interface/cli.rst @@ -0,0 +1,144 @@ +:orphan: + +########################################### +1. Develop a CLI with server side code only +########################################### + +We are going to learn how to create a simple command-line interface. 
+ +Lightning provides a flexible way to create complex CLIs without much effort. + +---- + +************************* +1. Implement a simple CLI +************************* + +To create your first CLI, you need to override the :meth:`~lightning.app.core.flow.LightningFlow.configure_commands` hook and return a list of dictionaries where the keys are the commands and the values are the server side handlers. + +First, create a file ``app.py`` and copy-paste the following code into the file: + +.. literalinclude:: example_command.py + +---- + +************** +2. Run the App +************** + +Execute the following command in a terminal: + +.. code-block:: + + lightning run app app.py + +The following appears in the terminal: + +.. code-block:: + + Your Lightning App is starting. This won't take long. + INFO: Your app has started. View it in your browser: http://127.0.0.1:7501/view + [] + +---- + +*************************** +3. Connect to a running App +*************************** + +In another terminal, connect to the running App. +When you connect to an App, the Lightning CLI is replaced by the App CLI. To exit the App CLI, you need to run ``lightning disconnect``. + +.. code-block:: + + lightning connect localhost + +To see a list of available commands: + +.. code-block:: + + lightning --help + You are connected to the cloud Lightning App: localhost. + Usage: lightning [OPTIONS] COMMAND [ARGS]... + + --help Show this message and exit. + + Lightning App Commands + add Add a name. + +To find the arguments of the commands: + +.. code-block:: + + lightning add --help + You are connected to the cloud Lightning App: localhost. + Usage: lightning add [ARGS]... + + Options + name: Add description + +---- + +******************** +4. Execute a command +******************** + +Trigger the command line exposed by your App: + +.. code-block:: + + lightning add --name=my_name + WARNING: Lightning Command Line Interface is an experimental feature and unannounced changes are likely.
+ +In your first terminal, **Received name: my_name** and **["my_name"]** are printed. + +.. code-block:: + + Your Lightning App is starting. This won't take long. + INFO: Your app has started. View it in your browser: http://127.0.0.1:7501/view + [] + Received name: my_name + ["my_name"] + +---- + +************************** +5. Disconnect from the App +************************** + +To exit the App CLI, you need to run ``lightning disconnect``. + +.. code-block:: + + lightning disconnect + You are disconnected from the local Lightning App. + +---- + +********** +Learn more +********** + +.. raw:: html + +
+
+ +.. displayitem:: + :header: 2. Develop a CLI with server and client code execution + :description: Learn how to develop a complex CLI for your application + :col_css: col-md-6 + :button_link: cli_client.html + :height: 150 + +.. displayitem:: + :header: Develop a RESTful API + :description: Learn how to develop an API for your application. + :col_css: col-md-6 + :button_link: ../build_rest_api/index.html + :height: 150 + +.. raw:: html + +
+
diff --git a/docs/source-app/workflows/build_command_line_interface/cli_client.rst b/docs/source-app/workflows/build_command_line_interface/cli_client.rst new file mode 100644 index 0000000..f97062c --- /dev/null +++ b/docs/source-app/workflows/build_command_line_interface/cli_client.rst @@ -0,0 +1,175 @@ +:orphan: + +###################################################### +2. Develop a CLI with server and client code execution +###################################################### + +We've learned how to create a simple command-line interface. But in real-world use-cases, an App Builder wants to provide more complex functionalities where trusted code is executed on the client side. + +Lightning provides a flexible way to create complex CLI without much effort. + +In this example, we’ll create a CLI to dynamically run Notebooks: + + +---- + +************************** +1. Implement a complex CLI +************************** + +First of all, let's create the following file structure: + +.. code-block:: python + + app_folder/ + commands/ + notebook/ + run.py + app.py + +We'll use the `Jupyter-Component `_. Follow the installation steps on the repo to install the Component. + +Add the following code to ``commands/notebook/run.py``: + +.. literalinclude:: commands/notebook/run.py + +Add the following code to ``app.py``: + +.. literalinclude:: app.py + +---- + +********************************************** +2. Run the App and check the API documentation +********************************************** + +In a terminal, run the following command and open ``http://127.0.0.1:7501/docs`` in a browser. + +.. code-block:: python + + lightning run app app.py + Your Lightning App is starting. This won't take long. + INFO: Your app has started. View it in your browser: http://127.0.0.1:7501/view + +---- + +*************************** +3. Connect to a running App +*************************** + +In another terminal, connect to the running App.
+When you connect to an App, the Lightning CLI is replaced by the App CLI. To exit the App CLI, you need to run ``lightning disconnect``. + +.. code-block:: + + lightning connect localhost + + Storing `run_notebook` under /Users/thomas/.lightning/lightning_connection/commands/run_notebook.py + You can review all the downloaded commands under /Users/thomas/.lightning/lightning_connection/commands folder. + You are connected to the local Lightning App. + +To see a list of available commands: + +.. code-block:: + + lightning --help + + You are connected to the cloud Lightning App: localhost. + Usage: lightning [OPTIONS] COMMAND [ARGS]... + + --help Show this message and exit. + + Lightning App Commands + run notebook Run a Notebook. + + +To find the arguments of the commands: + +.. code-block:: + + lightning run notebook --help + + You are connected to the cloud Lightning App: localhost. + usage: notebook [-h] [--name NAME] [--cloud_compute CLOUD_COMPUTE] + + Run Notebook Parser + + optional arguments: + -h, --help show this help message and exit + --name NAME + --cloud_compute CLOUD_COMPUTE + +---- + +******************** +4. Execute a command +******************** + +And then you can trigger the command-line exposed by your App. + +Run the first Notebook with the following command: + +.. code-block:: python + + lightning run notebook --name="my_notebook" + WARNING: Lightning Command Line Interface is an experimental feature and unannounced changes are likely. + The notebook my_notebook was created. + +And run a second notebook. + +.. code-block:: python + + lightning run notebook --name="my_notebook_2" + WARNING: Lightning Command Line Interface is an experimental feature and unannounced changes are likely. + The notebook my_notebook_2 was created. + +Here is a recording of the Lightning App: + +.. 
video:: https://pl-public-data.s3.amazonaws.com/assets_lightning/commands_1.mp4 + :poster: https://pl-public-data.s3.amazonaws.com/assets_lightning/commands_1.png + :width: 600 + :class: background-video + :autoplay: + :loop: + :muted: + +************************** +5. Disconnect from the App +************************** + +To exit the App CLI, you need to run **lightning disconnect**. + +.. code-block:: + + lightning disconnect + You are disconnected from the local Lightning App. + +---- + +********** +Learn more +********** + +.. raw:: html + +
+
+ +.. displayitem:: + :header: 1. Develop a CLI with server side code only + :description: Learn how to develop a simple CLI for your App. + :col_css: col-md-6 + :button_link: cli.html + :height: 150 + +.. displayitem:: + :header: Develop a RESTful API + :description: Learn how to develop an API for your App. + :col_css: col-md-6 + :button_link: ../build_rest_api/index.html + :height: 150 + +.. raw:: html + +
+
diff --git a/docs/source-app/workflows/build_command_line_interface/commands/__init__.py b/docs/source-app/workflows/build_command_line_interface/commands/__init__.py new file mode 100644 index 0000000..e69de29 diff --git a/docs/source-app/workflows/build_command_line_interface/commands/notebook/__init__.py b/docs/source-app/workflows/build_command_line_interface/commands/notebook/__init__.py new file mode 100644 index 0000000..e69de29 diff --git a/docs/source-app/workflows/build_command_line_interface/commands/notebook/run.py b/docs/source-app/workflows/build_command_line_interface/commands/notebook/run.py new file mode 100644 index 0000000..e0a6463 --- /dev/null +++ b/docs/source-app/workflows/build_command_line_interface/commands/notebook/run.py @@ -0,0 +1,33 @@ +from argparse import ArgumentParser +from uuid import uuid4 + +from pydantic import BaseModel + +from lightning.app.utilities.commands import ClientCommand + + +class RunNotebookConfig(BaseModel): + name: str + cloud_compute: str + + +class RunNotebook(ClientCommand): + description = "Run a Notebook." + + def run(self): + # 1. Define your own argument parser. You can use argparse, click, etc... + parser = ArgumentParser(description='Run Notebook Parser') + parser.add_argument("--name", type=str, default=None) + parser.add_argument("--cloud_compute", type=str, default="cpu") + hparams = parser.parse_args() + + # 2. Invoke the server side handler by sending a payload. + response = self.invoke_handler( + config=RunNotebookConfig( + name=hparams.name or str(uuid4()), + cloud_compute=hparams.cloud_compute, + ), + ) + + # 3. Print the server response. 
+ print(response) diff --git a/docs/source-app/workflows/build_command_line_interface/example_command.py b/docs/source-app/workflows/build_command_line_interface/example_command.py new file mode 100644 index 0000000..4d837fc --- /dev/null +++ b/docs/source-app/workflows/build_command_line_interface/example_command.py @@ -0,0 +1,25 @@ +from lightning import LightningApp, LightningFlow + + +class Flow(LightningFlow): + def __init__(self): + super().__init__() + self.names = [] + + def run(self): + print(self.names) + + def add_name(self, name: str): + """Add a name.""" + print(f"Received name: {name}") + self.names.append(name) + + def configure_commands(self): + # This can be invoked with `lightning add --name=my_name` + commands = [ + {"add": self.add_name}, + ] + return commands + + +app = LightningApp(Flow()) diff --git a/docs/source-app/workflows/build_command_line_interface/index.rst b/docs/source-app/workflows/build_command_line_interface/index.rst new file mode 100644 index 0000000..1f1b1b1 --- /dev/null +++ b/docs/source-app/workflows/build_command_line_interface/index.rst @@ -0,0 +1,55 @@ +############################ +Command-line Interface (CLI) +############################ + +**Audience:** Users looking to create a command line interface (CLI) for their application. + +---- + +************** +What is a CLI? +************** + +A Command-line Interface (CLI) is a user interface (UI) in a terminal to interact with a specific program. + +.. note:: + + The Lightning guideline to build CLI is `lightning ...` or ` ...`. + +As an example, Lightning provides a CLI to interact with your Lightning Apps and the `lightning.ai `_ platform as follows: + +.. code-block:: bash + + main + ├── create - Creates Lightning AI self-managed resources (clusters, etc…) + │ └── cluster - Creates a Lightning AI BYOC compute cluster with your cloud provider credentials.
+ ├── delete - Deletes Lightning AI self-managed resources (clusters, etc…) + │ └── cluster - Deletes a Lightning AI BYOC compute cluster and all associated cloud provider resources. + ├── fork - Forks an App. + ├── init - Initializes a Lightning App and/or Component. + │ ├── app + │ ├── component + │ ├── pl-app - Creates an App from your PyTorch Lightning source files. + │ └── react-ui - Creates a React UI to give a Lightning Component a React.js web UI + ├── install - Installs a Lightning App and/or Component. + │ ├── app + │ └── component + ├── list - Lists Lightning AI self-managed resources (clusters, etc…) + │ ├── apps - Lists your Lightning AI Apps. + │ └── clusters - Lists your Lightning AI BYOC compute clusters. + ├── login - Logs in to your lightning.ai account. + ├── logout - Logs out of your lightning.ai account. + ├── run - Runs a Lightning App locally or on the cloud. + │ └── app - Runs an App from a file. + ├── show - Shows given resource. + │ ├── cluster - Groups cluster commands inside show. + │ │ └── logs - Shows cluster logs. + │ └── logs - Shows cloud application logs. By default prints logs for all currently available Components. + ├── stop - Stops your App. + └── tree - Shows the command tree of your CLI. + +Learn more about `Command-line interfaces here `_. + +---- + +.. include:: index_content.rst diff --git a/docs/source-app/workflows/build_command_line_interface/index_content.rst b/docs/source-app/workflows/build_command_line_interface/index_content.rst new file mode 100644 index 0000000..ced369d --- /dev/null +++ b/docs/source-app/workflows/build_command_line_interface/index_content.rst @@ -0,0 +1,51 @@ +************************************** +Develop a command line interface (CLI) +************************************** + +.. raw:: html + +
+
+ +.. displayitem:: + :header: 1. Develop a CLI with server side code only + :description: Learn how to develop a simple CLI for your application + :col_css: col-md-6 + :button_link: cli.html + :height: 150 + +.. displayitem:: + :header: 2. Develop a CLI with server and client code execution + :description: Learn how to develop a complex CLI for your application + :col_css: col-md-6 + :button_link: cli_client.html + :height: 150 + +.. raw:: html + +
+
+ + +---- + +********** +Learn more +********** + +.. raw:: html + +
+
+ +.. displayitem:: + :header: Develop a RESTful API + :description: Learn how to develop an API for your application. + :col_css: col-md-6 + :button_link: ../build_rest_api/index.html + :height: 150 + +.. raw:: html + +
+
diff --git a/docs/source-app/workflows/build_command_line_interface/post_example.py b/docs/source-app/workflows/build_command_line_interface/post_example.py new file mode 100644 index 0000000..4597b3d --- /dev/null +++ b/docs/source-app/workflows/build_command_line_interface/post_example.py @@ -0,0 +1,26 @@ +import lightning as L +from lightning.app.api import Post + + +class Flow(L.LightningFlow): + # 1. Define the state + def __init__(self): + super().__init__() + self.names = [] + + # 2. Optional, but used to validate names + def run(self): + print(self.names) + + # 3. Method executed when a request is received. + def handle_post(self, name: str): + self.names.append(name) + return f'The name {name} was registered' + + # 4. Defines this Component's Restful API. You can have several routes. + def configure_api(self): + # Your own defined route and handler + return [Post(route="/name", method=self.handle_post)] + + +app = L.LightningApp(Flow()) diff --git a/docs/source-app/workflows/build_lightning_app/from_pytorch_lightning_script.rst b/docs/source-app/workflows/build_lightning_app/from_pytorch_lightning_script.rst new file mode 100644 index 0000000..2fcfb71 --- /dev/null +++ b/docs/source-app/workflows/build_lightning_app/from_pytorch_lightning_script.rst @@ -0,0 +1,109 @@ +####################################################### +Develop a Lightning App from a PyTorch Lightning script +####################################################### + +**Audience:** Users who want to develop a Lightning App (App) from their PyTorch Lightning (PL) scripts. + +---- + +************************************************************* +What developing a Lightning App from a PL script does for you +************************************************************* + +Developing an App from a PL script allows you to immediately run on the cloud and share the progress with friends. 
+Once you're happy with your model, you can immediately expand beyond just model development to things like +making your own inference APIs, research demos, or even speeding up your data pipeline. + +The PyTorch Lightning App is your entry point to the full end-to-end ML lifecycle. + +---- + +****************** +Develop a template +****************** + +To develop a template from a PyTorch Lightning script, use this command: + +.. code:: bash + + lightning init pl-app path/to/the/pl_script.py + + +If your script is not at the root of the project folder, and you'd like to include all source files within that folder, you can specify the root path as the first argument: + +.. code:: bash + + lightning init pl-app path/to/project/root path/to/the/pl_script.py + + +The default trainer App lets you train a model with a beautiful UI locally and on the cloud with zero effort! + +---- + +*********** +Run the App +*********** + +.. note:: This section is under construction. + +Run the App locally: + +.. code:: bash + + lightning run app pl-app/app.py + +Or run the App on the cloud so you can share with collaborators and even use all the cloud GPUs you want. + +.. code:: bash + + lightning run app pl-app/app.py --cloud + + +.. figure:: https://storage.googleapis.com/grid-packages/pytorch-lightning-app/docs-thumbnail.png + :alt: Screenshot of the PyTorch Lightning app running in the cloud + + +---- + +******************* +Modify the template +******************* + +The command above generates an App file like this: + +.. note:: TODO: list the file and show how to extend it + +..
code:: python + + from your_app_name import ComponentA, ComponentB + + import lightning as L + + + class LitApp(L.LightningFlow): + def __init__(self) -> None: + super().__init__() + self.component_a = ComponentA() + self.component_b = ComponentB() + + def run(self): + self.component_a.run() + self.component_b.run() + + + app = L.LightningApp(LitApp()) + +Now you can add your own components as you wish! + +---- + +************ +Known issues +************ + +- The UI takes a couple seconds to load when opening the App, so please be patient. +- The timer resets when refreshing the page. +- The UI for adding new environment variables does not provide an option to delete an entry. +- A bug exists that leaves the script hanging at the start of training when using the DDP strategy. +- DDP-spawn is not supported due to pickling issues. +- It is currently not possible to submit a new run once the script has finished or failed. diff --git a/docs/source-app/workflows/build_lightning_app/from_scratch.rst b/docs/source-app/workflows/build_lightning_app/from_scratch.rst new file mode 100644 index 0000000..9042f10 --- /dev/null +++ b/docs/source-app/workflows/build_lightning_app/from_scratch.rst @@ -0,0 +1,11 @@ +#################################### +Develop a Lightning App from Scratch +#################################### + +**Audience:** Users who want to develop a Lightning App from scratch. + +**Prereqs:** You must have finished the `Basic levels `_. + +---- + +.. include:: from_scratch_content.rst diff --git a/docs/source-app/workflows/build_lightning_app/from_scratch_content.rst b/docs/source-app/workflows/build_lightning_app/from_scratch_content.rst new file mode 100644 index 0000000..7641b4f --- /dev/null +++ b/docs/source-app/workflows/build_lightning_app/from_scratch_content.rst @@ -0,0 +1,60 @@ + +************** +WAIT! 
+************** +Before you build a Lightning App from scratch, see if you can find an app that is similar to what you need +in the `Lightning App Gallery `_. + +Once you find the Lightning App you want, press "Clone & Run" to see it running on the cloud, then download the code +and change what you want! + +---- + +****************** +Build from scratch +****************** +If you didn't find a Lightning App similar to the one you need, simply create a file named **app.py** with these contents: + +.. code:: python + + import lightning as L + + + class WordComponent(L.LightningWork): + def __init__(self, word): + super().__init__() + self.word = word + + def run(self): + print(self.word) + + + class LitApp(L.LightningFlow): + def __init__(self) -> None: + super().__init__() + self.hello = WordComponent("hello") + self.world = WordComponent("world") + + def run(self): + print("This is a simple Lightning app, make a better app!") + self.hello.run() + self.world.run() + + + app = L.LightningApp(LitApp()) + +---- + +Run the Lightning App +^^^^^^^^^^^^^^^^^^^^^ +Run the Lightning App locally: + +.. code:: bash + + lightning run app app.py + +Run the Lightning App on the cloud: + +.. code:: bash + + lightning run app app.py --cloud diff --git a/docs/source-app/workflows/build_lightning_app/index.rst b/docs/source-app/workflows/build_lightning_app/index.rst new file mode 100644 index 0000000..e60f035 --- /dev/null +++ b/docs/source-app/workflows/build_lightning_app/index.rst @@ -0,0 +1,11 @@ +:orphan: + +####################### +Develop a Lightning App +####################### + +A Lightning App (App) is a collection of components interacting together. Learn how to develop a basic App template. + +---- + +.. 
include:: index_content.rst diff --git a/docs/source-app/workflows/build_lightning_app/index_content.rst b/docs/source-app/workflows/build_lightning_app/index_content.rst new file mode 100644 index 0000000..45264d8 --- /dev/null +++ b/docs/source-app/workflows/build_lightning_app/index_content.rst @@ -0,0 +1,32 @@ +.. toctree:: + :maxdepth: 1 + :hidden: + + from_scratch + from_pytorch_lightning_script + +.. raw:: html + +
+
+ +.. displayitem:: + :header: Develop a Lightning App from scratch + :description: Learn how to Develop a Lightning App from scratch + :col_css: col-md-6 + :button_link: from_scratch.html + :height: 150 + :tag: basic + +.. displayitem:: + :header: Develop an App from a PyTorch Lightning script + :description: Share your PyTorch Lightning training on the cloud, run on cloud GPUs, or extend your App + :col_css: col-md-6 + :button_link: from_pytorch_lightning_script.html + :height: 150 + :tag: basic + +.. raw:: html + +
+
diff --git a/docs/source-app/workflows/build_lightning_component/basic.rst b/docs/source-app/workflows/build_lightning_component/basic.rst new file mode 100644 index 0000000..07fac58 --- /dev/null +++ b/docs/source-app/workflows/build_lightning_component/basic.rst @@ -0,0 +1,9 @@ +############################# +Develop a Lightning Component +############################# + +**Audience:** Users who want to develop a Lightning Component. + +---- + +.. include:: from_scratch_component_content.rst diff --git a/docs/source-app/workflows/build_lightning_component/from_scratch_component_content.rst b/docs/source-app/workflows/build_lightning_component/from_scratch_component_content.rst new file mode 100644 index 0000000..a42be9b --- /dev/null +++ b/docs/source-app/workflows/build_lightning_component/from_scratch_component_content.rst @@ -0,0 +1,153 @@ +******************************* +LightningFlow vs. LightningWork +******************************* + +.. _flow_vs_work: + +.. raw:: html + + Choosing between LightningFlow and LightningWork + +There are two types of components in Lightning, **LightningFlow** and **LightningWork**. + +Use a **LightningFlow** component for any programming logic that runs in less than 1 second. + +.. code:: python + + for i in range(10): + print(f"{i}: this kind of code belongs in a LightningFlow") + +Use a **LightningWork** component for any programming logic that takes more than 1 second or requires its own hardware. + +.. code:: python + + from time import sleep + + for i in range(100000): + sleep(2.0) + print(f"{i} LightningWork: work that is long running or may never end (like a server)") + +---- + +************************************************** +What developing a Lightning Component does for you +************************************************** +Lightning Components break up complex systems into modular components. The first obvious benefit is that components +can be reused across other apps. 
This means you can build once, test it and forget it. + +As a researcher it also means that your code can be taken to production without needing a team of engineers to help +productionize it. + +As a machine learning engineer, it means that your cloud system is: + +- fault tolerant +- cloud agnostic +- testable (unlike YAML/CI/CD code) +- version controlled +- enables cross-functional collaboration + +---- + +************** +WAIT! +************** +Before you build a Lightning component from scratch, see if you can find a component that is similar to what you need +in the `Lightning component Gallery `_. + +Once you find the component you want, download the code and change what you want! + +---- + +***************************************** +Build a Lightning component from scratch +***************************************** +If you didn't find a Lightning component similar to the one you need, you can build one from scratch. + +---- + +Build a LightningFlow +^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +To implement a LightningFlow, simply subclass ``LightningFlow`` and define the run method: + +.. code:: python + :emphasize-lines: 5 + + # app.py + import lightning as L + + + class LitFlow(L.LightningFlow): + def run(self): + for i in range(10): + print(f"{i}: this kind of code belongs in a LightningFlow") + + + app = L.LightningApp(LitFlow()) + +run the app + +.. code:: bash + + lightning run app app.py + +---- + +Build a LightningWork +^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +Only implement a LightningWork if this particular piece of code: + +- takes more than 1 second to execute +- requires its own set of cloud resources +- or both + +To implement a LightningWork, simply subclass ``LightningWork`` and define the run method: + +..
code:: python + :emphasize-lines: 6 + + # app.py + from time import sleep + import lightning as L + + + class LitWork(L.LightningWork): + def run(self): + for i in range(100000): + sleep(2.0) + print(f"{i} LightningWork: work that is long running or may never end (like a server)") + +A LightningWork must always be attached to a LightningFlow and explicitly asked to ``run()``: + +.. code:: python + :emphasize-lines: 13, 16 + + from time import sleep + import lightning as L + + + class LitWork(L.LightningWork): + def run(self): + for i in range(100000): + sleep(2.0) + print(f"{i} LightningWork: work that is long running or may never end (like a server)") + + + class LitFlow(L.LightningFlow): + def __init__(self): + super().__init__() + self.lit_work = LitWork() + + def run(self): + self.lit_work.run() + + + app = L.LightningApp(LitFlow()) + +run the app + +.. code:: bash + + lightning run app app.py diff --git a/docs/source-app/workflows/build_lightning_component/index.rst b/docs/source-app/workflows/build_lightning_component/index.rst new file mode 100644 index 0000000..8620a9b --- /dev/null +++ b/docs/source-app/workflows/build_lightning_component/index.rst @@ -0,0 +1,11 @@ +:orphan: + +############################# +Develop a Lightning Component +############################# + +A Lightning App (App) is a collection of components interacting together. Learn how to build a Lightning Component (Component) in this section. + +---- + +.. include:: index_content.rst diff --git a/docs/source-app/workflows/build_lightning_component/index_content.rst b/docs/source-app/workflows/build_lightning_component/index_content.rst new file mode 100644 index 0000000..abf26e3 --- /dev/null +++ b/docs/source-app/workflows/build_lightning_component/index_content.rst @@ -0,0 +1,122 @@ +.. toctree:: + :maxdepth: 1 + :hidden: + + basic + ../add_components/index + +.. toctree:: + :maxdepth: 1 + :hidden: + + intermediate + ../run_work_in_parallel + ../run_work_once + +..
toctree:: + :maxdepth: 1 + :hidden: + + ../enable_fault_tolerance + +****** +Basics +****** +.. raw:: html + +
+
+ +.. displayitem:: + :header: Develop a Lightning Component + :description: Learn the basics of developing a Lightning Component + :col_css: col-md-4 + :button_link: basic.html + :height: 150 + :tag: basic + +.. displayitem:: + :header: Explore community Lightning Components + :description: Discover community-built Lightning Components + :col_css: col-md-4 + :button_link: https://lightning.ai/components + :height: 150 + :tag: basic + +.. raw:: html + +
+
+ +---- + +************ +Intermediate +************ + +.. raw:: html + +
+
+ +.. displayitem:: + :header: Add a UI to a component + :description: Learn about all the possible ways of rendering a component. + :col_css: col-md-4 + :button_link: intermediate.html + :height: 150 + :tag: intermediate + +.. displayitem:: + :header: Run LightningWork in parallel + :description: Learn about running LightningWork in parallel. + :col_css: col-md-4 + :button_link: ../run_work_in_parallel.html + :height: 150 + :tag: intermediate + +.. displayitem:: + :header: Run LightningWork once + :description: Learn about running LightningWork multiple times or once. + :col_css: col-md-4 + :button_link: ../run_work_once.html + :height: 150 + :tag: intermediate + +.. displayitem:: + :header: Publish a Lightning component + :description: Learn the basics of publishing a Lightning component. + :col_css: col-md-4 + :button_link: publish_a_component.html + :height: 150 + :tag: intermediate + +.. raw:: html + +
+
+ + +---- + +******** +Advanced +******** + +.. raw:: html + +
+
+ +.. displayitem:: + :header: Enable fault tolerance + :description: Learn how to make a component fault tolerant. + :col_css: col-md-4 + :button_link: ../enable_fault_tolerance.html + :height: 150 + :tag: advanced + +.. raw:: html + +
+
diff --git a/docs/source-app/workflows/build_lightning_component/intermediate.rst b/docs/source-app/workflows/build_lightning_component/intermediate.rst new file mode 100644 index 0000000..f38f7c7 --- /dev/null +++ b/docs/source-app/workflows/build_lightning_component/intermediate.rst @@ -0,0 +1,71 @@ +############################################ +Develop a Lightning Component (intermediate) +############################################ + +**Audience:** Users who want to connect a UI to a Lightning Component (Component). + +---- + +***************************** +Add a web user interface (UI) +***************************** +Every lightning component can have its own user interface (UI). Lightning components support any kind +of UI interface such as dash, gradio, panel, react.js, streamlit, vue.js, web urls, +etc...(`full list here <../add_web_ui/index.html>`_). + +Let's say that we have a user interface defined in html: + +.. code:: html + + + + + + +

Hello World

+ + + +To *connect* this user interface to the Component, define the configure_layout method: + +.. code:: python + :emphasize-lines: 5, 6 + + import lightning as L + + + class LitHTMLComponent(L.LightningFlow): + def configure_layout(self): + return L.app.frontend.StaticWebFrontend(serve_dir="path/to/folder/with/index.html/inside") + +Finally, route the Component's UI through the root Component's **configure_layout** method: + +.. code:: python + :emphasize-lines: 14 + + # app.py + import lightning as L + + + class LitHTMLComponent(L.LightningFlow): + def configure_layout(self): + return L.app.frontend.StaticWebFrontend(serve_dir="path/to/folder/with/index.html/inside") + + + class LitApp(L.LightningFlow): + def __init__(self): + super().__init__() + self.lit_html_component = LitHTMLComponent() + + def configure_layout(self): + tab1 = {"name": "home", "content": self.lit_html_component} + return tab1 + + + app = L.LightningApp(LitApp()) + +Run your App and you'll see the UI on the Lightning App view: + +.. code:: bash + + lightning run app app.py diff --git a/docs/source-app/workflows/build_lightning_component/publish_a_component.rst b/docs/source-app/workflows/build_lightning_component/publish_a_component.rst new file mode 100644 index 0000000..bb5ec75 --- /dev/null +++ b/docs/source-app/workflows/build_lightning_component/publish_a_component.rst @@ -0,0 +1,59 @@ +############################# +Publish a Lightning Component +############################# + +**Audience:** Users who want to build a Lightning Component (Component) to publish to the Lightning Gallery + +---- + +*********************************** +Develop a Component from a template +*********************************** + +The fastest way to build a Component that is ready to be published to the component Gallery is to use +the default template. + +Generate your Component template with this command: + +..
code:: bash + + lightning init component your-component-name + +---- + +***************** +Run the Component +***************** + +To test that your Component works, first install all dependencies: + +.. code:: bash + + cd your-component + pip install -r requirements.txt + pip install -e . + +Now import your Component and use it in a Lightning App: + +.. code:: python + + # app.py + from your_component import TemplateComponent + import lightning as L + + class LitApp(L.LightningFlow): + def __init__(self) -> None: + super().__init__() + self.your_component = TemplateComponent() + + def run(self): + print('this is a simple Lightning app to verify your component is working as expected') + self.your_component.run() + + app = L.LightningApp(LitApp()) + +and run the app: + +.. code:: bash + + lightning run app app.py diff --git a/docs/source-app/workflows/build_rest_api/add_api.rst b/docs/source-app/workflows/build_rest_api/add_api.rst new file mode 100644 index 0000000..eeb91b0 --- /dev/null +++ b/docs/source-app/workflows/build_rest_api/add_api.rst @@ -0,0 +1,104 @@ +:orphan: + +############################ +Add an API Route to your App +############################ + +In order to add a new route, you need to override the :class:`~lightning.app.core.flow.LightningFlow.configure_api` hook and return a list of :class:`~lightning.app.api.http_methods.HttpMethod` such as :class:`~lightning.app.api.http_methods.Get`, :class:`~lightning.app.api.http_methods.Post`, :class:`~lightning.app.api.http_methods.Put`, :class:`~lightning.app.api.http_methods.Delete`. + +---- + +********************** +1. Create a simple App +********************** + +We're going to create a single route ``/name`` that takes a string input ``name`` and stores the value within the ``names`` attribute of the flow state.
+ +Create a file called ``app.py`` and copy-paste the following code in to the file: + +.. literalinclude:: post_example.py + +---- + +************** +2. Run the App +************** + +Execute the following command in a terminal: + +.. code-block:: + + lightning run app app.py + +The following appears: + +.. code-block:: + + Your Lightning App is starting. This won't take long. + INFO: Your app has started. View it in your browser: http://127.0.0.1:7501/view + +---- + +**************** +3. Check the API +**************** + +The Lightning App framework automatically generates API documentation from your App using `Swagger UI `_. + +You can access it by accessing the following URL: ``http://127.0.0.1:7501/docs`` in your browser and validate your API with the route ``/name`` directly from the documentation page as shown below. + +.. video:: https://pl-public-data.s3.amazonaws.com/assets_lightning/rest_post.mp4 + :poster: https://pl-public-data.s3.amazonaws.com/assets_lightning/rest_png.png + :width: 600 + :class: background-video + :autoplay: + :loop: + :muted: + +Alternatively, you can invoke the route directly from a second terminal using `curl `_. + +.. code-block:: + + curl -X 'POST' \ + 'http://127.0.0.1:7501/name?name=my_name' \ + -H 'accept: application/json' \ + -d '' + + "The name my_name was registered" + +And you can see the following in your first terminal running your App. + +.. code-block:: + + Your Lightning App is starting. This won't take long. + INFO: Your app has started. View it in your browser: http://127.0.0.1:7501/view + [] + ["my_name"] + +************************************** +Develop a command line interface (CLI) +************************************** + +.. raw:: html + +
+
+ +.. displayitem:: + :header: Add Requests Validation + :description: Learn how to use pydantic with your API. + :col_css: col-md-6 + :button_link: request_validation.html + :height: 150 + +.. displayitem:: + :header: Develop a Command Line Interface (CLI) + :description: Learn how to develop a CLI for your App. + :col_css: col-md-6 + :button_link: ../build_command_line_interface/index.html + :height: 150 + +.. raw:: html + +
+
diff --git a/docs/source-app/workflows/build_rest_api/index.rst b/docs/source-app/workflows/build_rest_api/index.rst new file mode 100644 index 0000000..8b9192f --- /dev/null +++ b/docs/source-app/workflows/build_rest_api/index.rst @@ -0,0 +1,34 @@ +:orphan: + +########### +RESTful API +########### + +**Audience:** Users looking to create an API in their App to allow users to activate functionalities from external sources. + +---- + +********************** +What is a RESTful API? +********************** + +A RESTful API is a set of external URL routes exposed by a server that enables clients to trigger some functionalities, such as getting or putting some data, uploading files, etc.. + +This provides great flexibility for users as they can easily discover functionalities made available by the App Builders. + +The Lightning App framework supports the four primary HTTP methods: `GET`, `POST`, `PUT`, `DELETE`. + +These methods are guidelines to organize your RESTful Services and help users understand your functionalities. + +* **`GET`:** Reads data from the server. +* **`POST`:** Creates new resources. +* **`PUT`:** Updates/replaces existing resources. +* **`DELETE`:** Deletes resources. + +Learn more about `HTTP Methods for RESTful Services here `_. + +The Lightning App framework uses the popular `FastAPI `_ and `Pydantic `_ frameworks under the hood. This means you can use all their features while building your App. + +---- + +.. include:: index_content.rst diff --git a/docs/source-app/workflows/build_rest_api/index_content.rst b/docs/source-app/workflows/build_rest_api/index_content.rst new file mode 100644 index 0000000..9f77225 --- /dev/null +++ b/docs/source-app/workflows/build_rest_api/index_content.rst @@ -0,0 +1,50 @@ +************** +Develop an API +************** + +.. raw:: html + +
+
+ +.. displayitem:: + :header: Add an API Route to your App + :description: Learn how to develop a simple API for your App. + :col_css: col-md-6 + :button_link: add_api.html + :height: 150 + +.. displayitem:: + :header: Add Requests Validation + :description: Learn how to use pydantic with your API. + :col_css: col-md-6 + :button_link: request_validation.html + :height: 150 + +.. raw:: html + +
+
+ +---- + +********** +Learn more +********** + +.. raw:: html + +
+
+ +.. displayitem:: + :header: Develop a Command-line Interface + :description: Learn how to develop a CLI for your App. + :col_css: col-md-6 + :button_link: ../build_command_line_interface/index.html + :height: 150 + +.. raw:: html + +
+
diff --git a/docs/source-app/workflows/build_rest_api/models.py b/docs/source-app/workflows/build_rest_api/models.py new file mode 100644 index 0000000..7ebb3ac --- /dev/null +++ b/docs/source-app/workflows/build_rest_api/models.py @@ -0,0 +1,6 @@ +from pydantic import BaseModel + + +# 1. Subclass the BaseModel and defines your payload format. +class NamePostConfig(BaseModel): + name: str diff --git a/docs/source-app/workflows/build_rest_api/post_example.py b/docs/source-app/workflows/build_rest_api/post_example.py new file mode 100644 index 0000000..0ba2405 --- /dev/null +++ b/docs/source-app/workflows/build_rest_api/post_example.py @@ -0,0 +1,25 @@ +import lightning as L +from lightning.app.api import Post + + +class Flow(L.LightningFlow): + # 1. Define the state + def __init__(self): + super().__init__() + self.names = [] + + # 2. Optional, but used to validate names + def run(self): + print(self.names) + + # 3. Method executed when a request is received. + def handle_post(self, name: str): + self.names.append(name) + return f'The name {name} was registered' + + # 4. Defines this Component's Restful API. You can have several routes. + def configure_api(self): + return [Post(route="/name", method=self.handle_post)] + + +app = L.LightningApp(Flow()) diff --git a/docs/source-app/workflows/build_rest_api/post_example_pydantic.py b/docs/source-app/workflows/build_rest_api/post_example_pydantic.py new file mode 100644 index 0000000..f32dc3f --- /dev/null +++ b/docs/source-app/workflows/build_rest_api/post_example_pydantic.py @@ -0,0 +1,32 @@ +from models import NamePostConfig # 2. Import your custom model. + +import lightning as L +from lightning.app.api import Post + + +class Flow(L.LightningFlow): + # 1. Define the state + def __init__(self): + super().__init__() + self.names = [] + + # 2. Optional, but used to validate names + def run(self): + print(self.names) + + # 3. Annotate your input with your custom pydantic model. 
+ def handle_post(self, config: NamePostConfig): + self.names.append(config.name) + return f'The name {config} was registered' + + # 4. Defines this Component's Restful API. You can have several routes. + def configure_api(self): + return [ + Post( + route="/name", + method=self.handle_post, + ) + ] + + +app = L.LightningApp(Flow()) diff --git a/docs/source-app/workflows/build_rest_api/request_validation.rst b/docs/source-app/workflows/build_rest_api/request_validation.rst new file mode 100644 index 0000000..6caaccd --- /dev/null +++ b/docs/source-app/workflows/build_rest_api/request_validation.rst @@ -0,0 +1,69 @@ +:orphan: + +*********************** +Add Requests Validation +*********************** + +The Lightning App framework uses the popular `FastAPI `_ and `Pydantic `_ frameworks under the hood. This means you can use all their features while building your App. + +pydantic enables fast data validation and settings management using Python type annotations and FastAPI is a modern, fast (high-performance), web framework for building APIs. + +You can easily use pydantic by defining your own payload format. + +.. literalinclude:: models.py + +Then, type your handler input with your custom model. + +.. literalinclude:: post_example_pydantic.py + +After running the updated App, the App documentation ``/name`` has changed and takes JSON with ``{"name": ...}`` as input. + +.. figure:: https://pl-public-data.s3.amazonaws.com/assets_lightning/rest_post_pydantic.png + :alt: Rest API with pydantic + :width: 100 % + +You can invoke the RESTful API route ``/name`` with the following command: + +.. code-block:: bash + + curl -X 'POST' \ + 'http://127.0.0.1:7501/name' \ + -H 'accept: application/json' \ + -H 'Content-Type: application/json' \ + -d '{ + "name": "my_name" + }' + +.. note:: + + Using curl, you can pass a JSON payload using the ``-d`` argument. + +---- + +********** +Learn more +********** + +.. raw:: html + +
+
+ +.. displayitem:: + :header: Add an API Route to your App + :description: Learn how to develop a simple API for your App. + :col_css: col-md-6 + :button_link: add_api.html + :height: 150 + +.. displayitem:: + :header: Develop a Command Line Interface (CLI) + :description: Learn how to develop a CLI for your App. + :col_css: col-md-6 + :button_link: ../build_command_line_interface/index.html + :height: 150 + +.. raw:: html + +
+
diff --git a/docs/source-app/workflows/byoc/aws_cli.rst b/docs/source-app/workflows/byoc/aws_cli.rst new file mode 100644 index 0000000..4bfea35 --- /dev/null +++ b/docs/source-app/workflows/byoc/aws_cli.rst @@ -0,0 +1,135 @@ +:orphan: + +.. _aws_cli: + + +############################ +Create AWS role with AWS CLI +############################ + +1. Install AWS CLI (see instructions `here `_). + +2. Protect your role by creating a hard to guess password that will be used to authenticate Lightning (You will need to pass it to Lightning for authentication). In our example we will use `dummy`. + +3. Create a role called `lightning-cloud` using the following command (replace with your own): + +.. code:: bash + + aws iam create-role \ + --role-name lightning-cloud \ + --assume-role-policy-document '{"Statement":[{"Action":"sts:AssumeRole","Effect": "Allow", "Principal": {"AWS": "arn:aws:iam::748115360335:root"}, "Condition": {"StringEquals": {"sts:ExternalId": ""}}}]}' \ + --description " " \ + --max-session-duration 43200 + +4. Create a file `iam-policy.json` with the following permissions required for Lightning to manage cloud infrastructure for you: + +.. 
code:: json + + { + "Version": "2012-10-17", + "Statement": [ + { + "Action": [ + "autoscaling:*", + "cloudwatch:*", + "codebuild:*", + "ec2:*", + "ecr:*", + "eks:*", + "elasticloadbalancing:*", + "events:*", + "guardduty:*", + "iam:*", + "logs:*", + "route53resolver:*", + "s3:*", + "sns:*", + "sqs:*", + "tag:GetResources", + "resource-groups:SearchResources" + ], + "Effect": "Allow", + "Resource": "*" + }, + { + "Effect": "Allow", + "Action": "iam:CreateServiceLinkedRole", + "Resource": "*", + "Condition": { + "StringLike": { + "iam:AWSServiceName": [ + "guardduty.amazonaws.com", + "malware-protection.guardduty.amazonaws.com" + ] + } + } + }, + { + "Effect": "Allow", + "Action": "iam:CreateServiceLinkedRole", + "Resource": "*", + "Condition": { + "StringEquals": { + "iam:AWSServiceName": [ + "autoscaling.amazonaws.com", + "ec2scheduled.amazonaws.com", + "elasticloadbalancing.amazonaws.com", + "spot.amazonaws.com", + "spotfleet.amazonaws.com", + "transitgateway.amazonaws.com" + ] + } + } + } + ] + } + +5. Create a IAM policy and associate it with the role we just created, and pass in the path to your new file: + +.. code:: bash + + aws iam create-policy \ + --policy-name lightning-cloud \ + --description "policy granting lightning controlplane permissions" \ + --policy-document file:///my_dir/iam-policy.json + +6. Fetch the role ARN so you can attach the policy: + +.. code:: bash + + aws iam get-role --role-name lightning-cloud --output json --query Role.Arn + +7. Attach the policy to the IAM role you just created: + +.. code:: bash + + aws iam attach-role-policy \ + --role-name lightning-cloud \ + --policy-arn arn:aws:iam::1234567890:policy/lightning-cloud + +------ + +********************** +Next: Create a cluster +********************** + +You are now ready to create a Lightning cluster! + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: Create cluster + :description: Create an AWS cluster for running Lightning Apps, skip to step 2 + :button_link: create_cluster.html + :col_css: col-md-12 + :height: 170 + +.. raw:: html + +
+
diff --git a/docs/source-app/workflows/byoc/aws_console.rst b/docs/source-app/workflows/byoc/aws_console.rst new file mode 100644 index 0000000..75877f9 --- /dev/null +++ b/docs/source-app/workflows/byoc/aws_console.rst @@ -0,0 +1,101 @@ +:orphan: + +.. _aws_console: + + +########################################### +Create AWS role with AWS management console +########################################### + +See the following video for instructions: + +.. video:: https://lightningaidev.wpengine.com/wp-content/uploads/2022/12/byoc.mp4 + :width: 600 + :autoplay: + :loop: + :muted: + + +1.1- Create a role +------------------ + +The created role will give Lightning AI access (by specifying the Lightning account ID). + +1. Sign in to your AWS account. (If you don’t have an AWS account, create one). + +2. On AWS console search for IAM > Roles > Create role. + + In your new role set the following: + + * Trusted entity type -> AWS account. + + * An AWS account -> Another AWS account -> Account id: 748115360335. (This is Lightning's account id). + +3. Protect your role by creating a hard to guess password that will be used to authenticate Lightning (You will need to pass it to Lightning for authentication). + + * Set Require external ID: + +4. Click "Next" + + +1.2- Create a policy +-------------------- + +1. Click "Create policy" -> A new tab opens to the Create policy page. + +2. Click the JSON tab and copy-paste the `contents of this JSON file ` into the JSON workspace. + +.. note:: Ignore the warnings generated by AWS. + +3. Click "Next:Tags" (you can skip this step) + +4. Complete policy creation by adding a meaningful name and description to the policy. + + For example: + + Name -> "lightning-cloud" + + Description -> "permission to manage EC2 instances" + +5. Add policy to the role: Return to the browser tab that you were using to create a role. +Refresh the policy list and select the custom policy you just created (in this case “lightning-cloud”). 
The policy should appear at the top of the Policy List. + +6. Click "Next". + +7. Provide a meaningful name and description for the role, and click “Create Role”. + + For example: + + Name -> "lightning-cloud" + + Description -> "Role for Lightning cloud permissions" + +Congrats! You now successfully added the set up permissions needed for lightning to create a cluster. + + +------ + +********************** +Next: Create a cluster +********************** + +You are now ready to create a Lightning cluster! + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: Create cluster + :description: Create an AWS cluster for running Lightning Apps, skip to step 2 + :button_link: create_cluster.html + :col_css: col-md-12 + :height: 170 + +.. raw:: html + +
+
diff --git a/docs/source-app/workflows/byoc/create_cluster.rst b/docs/source-app/workflows/byoc/create_cluster.rst new file mode 100644 index 0000000..4e7994b --- /dev/null +++ b/docs/source-app/workflows/byoc/create_cluster.rst @@ -0,0 +1,146 @@ +:orphan: + +.. _create_cluster: + + +################## +Create AWS cluster +################## + +**Audience:** Users looking to create a cluster to run Lightning Apps on their own private cloud infrastructure. + +**Prereqs:** basic familiarity with cloud provider infrastructure management. + +.. note:: This feature is currently available for early access! To create your own cluster `contact us `_. + + +---- + +******************************************* +Step 1- Create roles and permissions on AWS +******************************************* + +In this step you’ll be creating a role on your cloud provider that allows Lightning to manage resources on your behalf (for example, creating EC2 instances for your cluster). +To do this you can use the AWS CLI or the AWS management console. + +You will only have to perform this step once, and the same role can be used to create multiple clusters. + +---- + +.. raw:: html + +
+
+ +.. displayitem:: + :header: Create role with AWS CLI + :description: Create role with AWS CLI + :col_css: col-md-4 + :button_link: aws_cli.html + :height: 180 + :tag: Basic + +.. displayitem:: + :header: Create role with AWS console + :description: Create role with AWS console + :col_css: col-md-4 + :button_link: aws_console.html + :height: 180 + :tag: Basic + +.. raw:: html + +
+
+ + +---- + + +**************************** +Step 2- Get ARN for new role +**************************** + +To start a cluster, Lightning will need the external-id you set in step 1, and the ARN role. Click on your new role to find them (note: you need the ARN listed at the top of the page, not the one in “trusted entitles”). + + +Record the ARN and the external ID. You’ll need them for your next step. + +----- + +************************************** +Step 3-Create a Lightning BYOC cluster +************************************** + +Now that you have created a role and policy on AWS, you can start creating Lightning clusters. + +Create a Lightning BYOC cluster using the following command: + +.. code:: bash + + lightning create cluster --role-arn --external-id + +Here's an example: + +.. code:: bash + + lightning create cluster my-byoc-cluster --role-arn arn:aws:iam::1234567890:role/lai-byoc --external-id dummy + +.. note:: Cluster creation is going to take an hour or more after you run this command. +.. note:: Only us-east-1, us-east-2, us-west-1 and us-west-2 are supported today. + + +Parameters +========== + ++------------------------+----------------------------------------------------------------------------------------------------+ +|Parameter | Description | ++========================+====================================================================================================+ +| cluster_id | The name of the cluster to be created. | +| | | +| | Cluster names can only contain lowercase letters, numbers, and periodic hyphens ( - ). 
| ++------------------------+----------------------------------------------------------------------------------------------------+ +| role-arn | AWS IAM Role ARN used to provision resources | ++------------------------+----------------------------------------------------------------------------------------------------+ +| external-id | AWS IAM Role external ID | +| | | +| | To read more on what the AWS external ID is and why it's useful go | +| | `here `_| ++------------------------+----------------------------------------------------------------------------------------------------+ + +---- + +******************************************* +View a list of your Lightning BYOC clusters +******************************************* + +.. code:: bash + + lightning list clusters + +--- + +****************************** +Next: Run apps on your cluster +****************************** + +Once your cluster is running, you can start running Lightning apps on your cluster. + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: Run apps on your cluster + :description: Learn how to start apps on your Lightning cluster + :button_link: run_on_cluster.html + :col_css: col-md-12 + :height: 170 + +.. raw:: html + +
+
diff --git a/docs/source-app/workflows/byoc/delete_cluster.rst b/docs/source-app/workflows/byoc/delete_cluster.rst new file mode 100644 index 0000000..c71a7c9 --- /dev/null +++ b/docs/source-app/workflows/byoc/delete_cluster.rst @@ -0,0 +1,28 @@ +:orphan: + +.. _delete_cluster: + + +******************************* +Delete a Lightning BYOC cluster +******************************* + +Once you no longer need a Lightning cluster you can delete it with the following command: + +.. code:: bash + + lightning delete cluster + +Deleting a cluster will remove any apps data from Lightning (including logs and metadata) and all resources associated with the cluster. Any artifacts created in the object storage of your cluster will not be deleted. + +.. warning:: Using the ``--force`` parameter when deleting a cluster does not clean up any resources managed by Lightning AI. Check your cloud provider to verify that existing cloud resources are deleted. + +.. warning:: This process may take a few minutes to complete, but once started it CANNOT be rolled back. Deletion permanently removes not only the BYOC cluster from being managed by Lightning AI, but tears down every BYOC resource Lightning AI managed (for that cluster id) in the host cloud. All object stores, container registries, logs, compute nodes, volumes, etc. are deleted and cannot be recovered. + +.. warning:: + + Under the hood the deletion selects cloud provider resources via the tags + `lightning/cluster` and + `kubernetes.io/cluster/` + + Do not use these tags in any cloud resources you create yourself, as they will be subject to deletion when the cluster is deleted. diff --git a/docs/source-app/workflows/byoc/index.rst b/docs/source-app/workflows/byoc/index.rst new file mode 100644 index 0000000..494a700 --- /dev/null +++ b/docs/source-app/workflows/byoc/index.rst @@ -0,0 +1,60 @@ +.. 
_byoc: + +################################# +Run Apps on your own cloud (BYOC) +################################# + +**Audience:** Users looking to run Lightning Apps on their own private cloud infrastructure. + +.. note:: This feature is currently available for early access! To create your own cluster `contact us `_. + + +---- + +.. raw:: html + +
+
+ +.. displayitem:: + :header: Create an AWS cluster + :description: Create an AWS cluster + :col_css: col-md-4 + :button_link: create_cluster.html + :height: 180 + :tag: Basic + +.. displayitem:: + :header: Run app on your cluster + :description: How to run apps on your Lightning Cluster + :col_css: col-md-4 + :button_link: run_on_cluster.html + :height: 180 + :tag: Basic + +.. displayitem:: + :header: Delete a cluster + :description: Delete a cluster + :col_css: col-md-4 + :button_link: delete_cluster.html + :height: 180 + :tag: Basic + +.. raw:: html + +
+
+ + +---- + + + +******************** +Why create a cluster +******************** + +You can use Lightning clusters to run Lightning apps on your own cloud provider account in order to protect your data and use your cloud provider's credits. The control for these clusters runs on the Lightning managed cloud, but the data plane, including the clusters, services, and apps, is located within your own cloud provider account. + +Once the cluster is created, Lightning Cloud controlplane will take over, +managing the lifecycle of the cloud infrastructure required to run Lightning Apps. diff --git a/docs/source-app/workflows/byoc/run_on_cluster.rst b/docs/source-app/workflows/byoc/run_on_cluster.rst new file mode 100644 index 0000000..209ab41 --- /dev/null +++ b/docs/source-app/workflows/byoc/run_on_cluster.rst @@ -0,0 +1,27 @@ +:orphan: + +.. _run_on_cluster: + + +********************************* +Run app on your Lightning Cluster +********************************* + +Once your cluster is running, you can run any Lightning App on your cluster. To run an App on the Lightning BYOC cluster, use ``--cloud --cluster-id <cluster-id>`` in the command: + +.. code:: bash + + lightning run app app.py --cloud --cluster-id <cluster-id> + +Here’s an example: + +.. code:: bash + + lightning run app app.py --cloud --cluster-id my-byoc-cluster + + +View the status of your App using the following command: + +.. 
code:: bash + + lightning list apps diff --git a/docs/source-app/workflows/debug_locally.rst b/docs/source-app/workflows/debug_locally.rst new file mode 100644 index 0000000..cd5a5a8 --- /dev/null +++ b/docs/source-app/workflows/debug_locally.rst @@ -0,0 +1,5 @@ +:orphan: + +##################################### +Debug a Distributed Cloud App Locally +##################################### diff --git a/docs/source-app/workflows/enable_fault_tolerance.rst b/docs/source-app/workflows/enable_fault_tolerance.rst new file mode 100644 index 0000000..b1630d4 --- /dev/null +++ b/docs/source-app/workflows/enable_fault_tolerance.rst @@ -0,0 +1,5 @@ +:orphan: + +###################### +Enable Fault Tolerance +###################### diff --git a/docs/source-app/workflows/extend_app.rst b/docs/source-app/workflows/extend_app.rst new file mode 100644 index 0000000..2e17af4 --- /dev/null +++ b/docs/source-app/workflows/extend_app.rst @@ -0,0 +1,59 @@ +###################### +Extend an Existing App +###################### +You can extend a Lightning App by using community components or building your own. + +---- + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: Add more Components + :description: Extend an App by adding a prebuilt component. + :col_css: col-md-4 + :button_link: add_components/index.html + :height: 150 + :tag: basic + +.. displayitem:: + :header: Add a web user interface (UI) + :description: Extend an App by adding a web user interface (UI) + :col_css: col-md-4 + :button_link: add_web_ui/index.html + :height: 150 + :tag: basic + +.. displayitem:: + :header: Add a URL link + :description: Extend an App by adding a web URL link + :col_css: col-md-4 + :button_link: add_web_link.html + :height: 150 + :tag: basic + +.. displayitem:: + :header: Build a Component + :description: Extend an App by building a Component + :col_css: col-md-4 + :button_link: build_lightning_component/index.html + :height: 150 + :tag: basic + +.. displayitem:: + :header: Add a server + :description: Extend an App by adding a server to a Component. + :col_css: col-md-4 + :button_link: add_server/index.html + :height: 150 + :tag: Intermediate + + +.. raw:: html + +
+
diff --git a/docs/source-app/workflows/index.rst b/docs/source-app/workflows/index.rst new file mode 100644 index 0000000..801c6cc --- /dev/null +++ b/docs/source-app/workflows/index.rst @@ -0,0 +1,202 @@ +.. toctree:: + :maxdepth: 1 + :hidden: + + access_app_state/access_app_state + add_web_ui/index + add_web_link + secrets <../glossary/secrets> + arrange_tabs/index + connect components <../levels/intermediate/connect_lightning_components> + build components <../levels/basic/build_a_lightning_component> + run_work_once + cloud compute <../core_api/lightning_work/compute> + build_command_line_interface/index + rest API <../glossary/restful_api/restful_api> + extend_app + build_lightning_component/publish_a_component + byoc/index + ssh/index + add_server/index + run_app_on_cloud/index + run_work_in_parallel + drive <../glossary/storage/drive> + share_app + share_files_between_components + +####### +How to: +####### + +.. raw:: html + +
+
+ +.. displayitem:: + :header: Access the App State + :description: Learn to work with the app state + :col_css: col-md-4 + :button_link: access_app_state/access_app_state.html + :height: 180 + +.. displayitem:: + :header: Add a web user interface + :description: Learn how to add React, StreamLit, Dash to your App. + :col_css: col-md-4 + :button_link: add_web_ui/index.html + :height: 180 + +.. displayitem:: + :header: Add a web link + :description: Learn how to embed external websites + :col_css: col-md-4 + :button_link: add_web_link.html + :height: 180 + +.. displayitem:: + :header: Add encrypted secrets + :description: Learn how to organize your UI + :col_css: col-md-4 + :button_link: ../glossary/secrets.html + :height: 180 + +.. displayitem:: + :header: Arrange App tabs + :description: Learn how to organize your UI + :col_css: col-md-4 + :button_link: arrange_tabs/index.html + :height: 180 + +.. displayitem:: + :header: Build a Lightning App + :description: Simple App to get started + :col_css: col-md-4 + :button_link: ../levels/basic/connect_lightning_components.html + :height: 180 + +.. displayitem:: + :header: Build a Lightning Component + :description: Understand how to separated the glue from the actual work + :col_css: col-md-4 + :button_link: ../levels/basic/build_a_lightning_component.html + :height: 180 + +.. displayitem:: + :header: Cache Work run calls + :description: Understand how to trigger a work run method + :col_css: col-md-4 + :button_link: run_work_once.html + :height: 180 + +.. displayitem:: + :header: Customize your cloud compute + :description: Select machines to run on + :col_css: col-md-4 + :button_link: ../core_api/lightning_work/compute.html + :height: 180 + +.. displayitem:: + :header: Develop a Command Line Interface (CLI) + :description: Learn to develop a CLI + :col_css: col-md-4 + :button_link: build_command_line_interface/index.html + :height: 180 + +.. 
displayitem:: + :header: Develop a Lightning App + :description: Learn to connect components together into a Lightning App + :col_css: col-md-4 + :button_link: ../levels/basic/connect_lightning_components.html + :height: 180 + +.. displayitem:: + :header: Develop a REST API + :description: Learn to deploy a model behind a REST API + :col_css: col-md-4 + :button_link: ../glossary/restful_api/restful_api.html + :height: 180 + +.. displayitem:: + :header: Extend an existing App + :description: Learn where to go next with an App + :col_css: col-md-4 + :button_link: extend_app.html + :height: 180 + +.. displayitem:: + :header: Publish a Lightning Component + :description: Share your components with others + :col_css: col-md-4 + :button_link: build_lightning_component/publish_a_component.html + :height: 180 + +.. displayitem:: + :header: Run Apps on your cloud account (BYOC) + :description: Share your components with others + :col_css: col-md-4 + :button_link: byoc/index.html + :height: 180 + +.. displayitem:: + :header: Run a server within a Lightning App + :description: Lightning Work can be infinite jobs + :col_css: col-md-4 + :button_link: add_server/index.html + :height: 180 + +.. displayitem:: + :header: Run an App on the cloud + :description: Learn how to get things done in the cloud with ease + :col_css: col-md-4 + :button_link: run_app_on_cloud/index.html + :height: 180 + +.. displayitem:: + :header: Run Works in parallel + :description: Learn how to make your Work non blocking + :col_css: col-md-4 + :button_link: run_work_in_parallel.html + :height: 180 + +.. displayitem:: + :header: Save files + :description: Learn how to save files in a work by using Drive + :col_css: col-md-4 + :button_link: ../glossary/storage/drive.html + :height: 180 + +.. displayitem:: + :header: Share an App + :description: Learn how to share your work with others + :col_css: col-md-4 + :button_link: share_app.html + :height: 180 + +.. 
displayitem:: + :header: Share files between components + :description: Learn how Lightning Storage emulates a single filesystem in a distributed setting + :col_css: col-md-4 + :button_link: share_files_between_components.html + :height: 180 + +.. displayitem:: + :header: Debug cloud apps via SSH + :description: Learn how to get SSH access to your App + :col_css: col-md-4 + :button_link: ssh/index.html + :height: 180 + +.. displayitem:: + :header: Mount Cloud Data + :description: Learn how Lightning Mounts are used to make the contents of an cloud object store bucket available on disk when running in the cloud. + :col_css: col-md-4 + :button_link: mount_cloud_object_store.html + :height: 180 + + + +.. raw:: html + +
+
diff --git a/docs/source-app/workflows/mount_cloud_object_store.rst b/docs/source-app/workflows/mount_cloud_object_store.rst new file mode 100644 index 0000000..72e6fa0 --- /dev/null +++ b/docs/source-app/workflows/mount_cloud_object_store.rst @@ -0,0 +1,141 @@ +:orphan: + +############## +Add Cloud Data +############## + +**Audience:** Users who want to read files stored in a Cloud Object Bucket in an app. + +****************************** +Mounting Public AWS S3 Buckets +****************************** + +=================== +Add Mount to a Work +=================== + +To mount data from a cloud bucket to your app compute, initialize a :class:`~lightning.app.storage.mount.Mount` +object with the source path of the s3 bucket and the absolute directory path where it should be mounted and +pass the :class:`~lightning.app.storage.mount.Mount` to the :class:`~lightning.app.utilities.packaging.cloud_compute.CloudCompute` +of the :class:`~lightning.app.core.work.LightningWork` it should be mounted on. + +In this example, we will mount an S3 bucket: ``s3://ryft-public-sample-data/esRedditJson/`` to ``/content/esRedditJson/``. + +.. code-block:: python + + from lightning.app import CloudCompute + from lightning.app.storage import Mount + + self.my_work = MyWorkClass( + cloud_compute=CloudCompute( + mounts=Mount( + source="s3://ryft-public-sample-data/esRedditJson/", + mount_path="/content/esRedditJson/", + ), + ) + ) + +You can also pass multiple mounts to a single work by passing a ``List[Mount(...), ...]`` to the +``CloudCompute(mounts=...)`` argument. + +.. note:: + + * Mounts supported up to 1 Million files, 5GB per file. Need larger mounts? Contact support@lightning.ai + * When adding multiple mounts, each one should have a unique ``mount_path``. + * A maximum of 10 :class:`~lightning.app.storage.mount.Mount`\s can be added to a :class:`~lightning.app.core.work.LightningWork`. 
+ +======================= +Read Files From a Mount +======================= + +Once a :class:`~lightning.app.storage.mount.Mount` object is passed to :class:`~lightning.app.utilities.packaging.cloud_compute.CloudCompute`, +you can access, list, or read any file from the mount under the specified ``mount_path``, just like you would if it +was on your local machine. + +Assuming your ``mount_path`` is ``"/content/esRedditJson/"`` you can do the following: + +---------- +Read Files +---------- + +.. code-block:: python + + with open("/content/esRedditJson/esRedditJson1", "r") as f: + some_data = f.read() + + # do something with "some_data"... + +---------- +List Files +---------- + +.. code-block:: python + + files = os.listdir("/content/esRedditJson/") + +-------------------- +See the Full Example +-------------------- + +.. code-block:: python + :emphasize-lines: 10,15 + + import os + + import lightning as L + from lightning.app import CloudCompute + from lightning.app.storage import Mount + + class ReadMount(L.LightningWork): + def run(self): + # Print a list of files stored in the mounted S3 Bucket. + files = os.listdir("/content/esRedditJson/") + for file in files: + print(file) + + # Read the contents of a particular file in the bucket "esRedditJson1" + with open("/content/esRedditJson/esRedditJson1", "r") as f: + some_data = f.read() + # do something with "some_data"... + + class Flow(L.LightningFlow): + def __init__(self): + super().__init__() + self.my_work = ReadMount( + cloud_compute=CloudCompute( + mounts=Mount( + source="s3://ryft-public-sample-data/esRedditJson/", + mount_path="/content/esRedditJson/", + ), + ) + ) + + def run(self): + self.my_work.run() + +.. note:: + + When running a Lightning App on your local machine, any :class:`~lightning.app.utilities.packaging.cloud_compute.CloudCompute` + configuration (including a :class:`~lightning.app.storage.mount.Mount`) is ignored at runtime.
If you need access to + these files on your local disk, you should download a copy of them to your machine. + +.. note:: + + Mounted files from an S3 bucket are ``read-only``. Any modifications, additions, or deletions + to files in the mounted directory will not be reflected in the cloud object store. + +---- + +********************************************** +Mounting Private AWS S3 Buckets - Coming Soon! +********************************************** + +We'll Let you know when this feature is ready! + +---- + +************************************************ +Mounting Google Cloud GCS Buckets - Coming Soon! +************************************************ + +We'll Let you know when this feature is ready! diff --git a/docs/source-app/workflows/run_app_on_cloud/cloud_files.rst b/docs/source-app/workflows/run_app_on_cloud/cloud_files.rst new file mode 100644 index 0000000..dfef0dc --- /dev/null +++ b/docs/source-app/workflows/run_app_on_cloud/cloud_files.rst @@ -0,0 +1,69 @@ +.. _ignore: + +################################## +Configure Your Lightning Cloud App +################################## + +**Audience:** Users who want to control Lightning App files on the cloud. + +---- + +************************************** +Ignore file uploads to Lightning cloud +************************************** +Running Lightning Apps on the cloud will upload the source code of your app to the cloud. You can use ``.lightningignore`` file(s) to ignore files or directories while uploading. The `.lightningignore` file follows the same format as a `.gitignore` +file. + +For example, the source code directory below with the ``.lightningignore`` file will ignore the file named +``model.pt`` and directory named ``data_dir``. + +.. code:: bash + + . + ├── README.md + ├── app.py + ├── data_dir + │ ├── image1.png + │ ├── image2.png + │ └── ... + ├── .lightningignore + ├── requirements.txt + └── model.pt + +.. 
code:: bash + + ~/project/home ❯ cat .lightningignore + model.pt + data_dir + +A sample ``.lightningignore`` file can be found `here `_. + +If you are a component author and your component creates local files that you want to ignore, you can do: + +.. code-block:: python + + class MyComponent(L.LightningWork): # or L.LightningFlow + def __init__(self): + super().__init__() + self.lightningignore = ("model.pt", "data_dir") + + +This has the benefit that the files will be ignored automatically for all the component users, making an easier +transition between running locally vs in the cloud. + +---- + +******************* +Structure app files +******************* + +We recommend your app contain the following files: + +.. code:: bash + + . + ├── .lightning (auto-generated- contains Lightning configuration) + ├── .lightningignore (contains files not to upload to the cloud) + ├── app.py + ├── README.md (optional- a markdown description of your app) + └── requirements.txt (optional- contains all your app dependencies) diff --git a/docs/source-app/workflows/run_app_on_cloud/index.rst b/docs/source-app/workflows/run_app_on_cloud/index.rst new file mode 100644 index 0000000..55bc3b6 --- /dev/null +++ b/docs/source-app/workflows/run_app_on_cloud/index.rst @@ -0,0 +1,5 @@ +##################### +Run apps on the cloud +##################### + +.. include:: index_content.rst diff --git a/docs/source-app/workflows/run_app_on_cloud/index_content.rst b/docs/source-app/workflows/run_app_on_cloud/index_content.rst new file mode 100644 index 0000000..b0f6757 --- /dev/null +++ b/docs/source-app/workflows/run_app_on_cloud/index_content.rst @@ -0,0 +1,115 @@ +.. _run_app_in_cloud: + +.. toctree:: + :maxdepth: 1 + :hidden: + + cloud_files + lightning_cloud + on_prem + on_your_own_machine + +**Audience:** Users who want to share or scale Lightning Apps.
+ +---- + +***************************** +Run on Lightning Public Cloud +***************************** + +You can run Lightning Apps for free on the Public Lightning cloud with a single flag! + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: Run on Lightning Cloud + :description: Learn how to run on the Lightning public cloud + :col_css: col-md-4 + :button_link: lightning_cloud.html + :height: 150 + :tag: basic + +.. displayitem:: + :header: Choose Hardware + :description: Configure your app cloud resources + :col_css: col-md-4 + :button_link: ../../core_api/lightning_work/compute.html + :height: 150 + :tag: Basic + +.. displayitem:: + :header: Set Environment Variables + :description: Manage your environment variables in the cloud + :col_css: col-md-4 + :button_link: ../../glossary/environment_variables.html + :height: 150 + :tag: Basic + +.. displayitem:: + :header: Configure Your Lightning Cloud App + :description: Customize your cloud apps files + :col_css: col-md-4 + :button_link: cloud_files.html + :height: 150 + :tag: Intermediate + +.. displayitem:: + :header: Manage App Dependencies + :description: Configure your python requirements or use a custom docker image + :col_css: col-md-4 + :button_link: ../../glossary/build_config/build_config.html + :height: 150 + :tag: Intermediate + +.. displayitem:: + :header: Share Files Between Works + :description: Learn more about data transferring + :col_css: col-md-4 + :button_link: ../../glossary/storage/storage.html + :height: 150 + :tag: Intermediate + +.. raw:: html + +
+
+ +---- + +************ +Other Clouds +************ + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: Run On Your Own Machine + :description: Run Lightning Apps on any machine + :col_css: col-md-4 + :button_link: on_your_own_machine.html + :height: 150 + :tag: basic + +.. displayitem:: + :header: Run On Your Private Cloud + :description: Run Lightning Apps on your own cloud + :col_css: col-md-4 + :button_link: on_prem.html + :height: 150 + :tag: basic + + +.. raw:: html + +
+
diff --git a/docs/source-app/workflows/run_app_on_cloud/lightning_cloud.rst b/docs/source-app/workflows/run_app_on_cloud/lightning_cloud.rst new file mode 100644 index 0000000..aaa9d7b --- /dev/null +++ b/docs/source-app/workflows/run_app_on_cloud/lightning_cloud.rst @@ -0,0 +1,67 @@ +####################### +Run an App on the Cloud +####################### + +**Audience:** Users who want to share their apps or run on specialized hardware (like GPUs). + +---- + +********************************* +Run on the public Lightning cloud +********************************* +To run any app on the public lightning cloud use the ``--cloud`` argument: + +.. code:: bash + + lightning run app app.py --cloud + + +.. note:: + By default, running your apps on the public Lightning cloud is free of charge using default CPUs, and any app uploaded to the Lightning cloud will be shared with the community (source code and app view will be public). If you would like to make your apps private please `contact us `_. + +If your app contains ``LightningWork`` components that require more compute resources, such as larger CPUs or **GPUs**, you'll need to add credits to your Lightning AI account. + + +---- + +************************** +Add dependencies to my app +************************** + + +Add all dependencies required to run your app to a `requirements.txt` file in your app's directory. Read :ref:`build_config` for more details. + + + +---- + + +******** +Name app +******** + +Simply use the ``--name`` flag when running your app, for example: + +.. code:: bash + + lightning run app app.py --cloud --name my-awesome-app + +Alternatively, you can change the name of the app in the ``.lightning`` file: + +.. code:: bash + + ~/project/home ❯ cat .lightning + name: my-awesome-app + +The ``.lightning`` file is a general configuration file. +To learn more about optional configuration file parameters, see :class:`~lightning.utilities.packaging.app_config.AppConfig`. 
+ +------ + +******************** +Choose Cloud Compute +******************** + +You can configure the hardware your app is running on by setting a :class:`~lightning.app.utilities.packaging.cloud_compute.CloudCompute` object on the ``cloud_compute`` property of your work. + +Learn more with the :ref:`cloud_compute` guide diff --git a/docs/source-app/workflows/run_app_on_cloud/on_prem.rst b/docs/source-app/workflows/run_app_on_cloud/on_prem.rst new file mode 100644 index 0000000..be0a954 --- /dev/null +++ b/docs/source-app/workflows/run_app_on_cloud/on_prem.rst @@ -0,0 +1,6 @@ +########################### +Run an App on Private Cloud +########################### + + +To run Lightning apps on a private or on-prem cluster, `contact us `_. diff --git a/docs/source-app/workflows/run_app_on_cloud/on_your_own_machine.rst b/docs/source-app/workflows/run_app_on_cloud/on_your_own_machine.rst new file mode 100644 index 0000000..8226a1a --- /dev/null +++ b/docs/source-app/workflows/run_app_on_cloud/on_your_own_machine.rst @@ -0,0 +1,26 @@ +####################### +Run on your own machine +####################### + +**Audience:** Users who want to run a Lightning App on a remote machine. + +---- + +*********** +Run via ssh +*********** +To run a Lightning App on any machine, simply ssh to the machine and run the app directly + +.. code:: bash + + # Copy over credentials from your local machine to your cloud machine + scp ~/.lightning/credentials.json your_name@your_cloud_machine:~/.lightning + + # log into your cloud machine + ssh your_name@your_cloud_machine + + # get your code on the machine and install deps + ... + + # start the app + lightning run app app.py diff --git a/docs/source-app/workflows/run_app_snippet.rst b/docs/source-app/workflows/run_app_snippet.rst new file mode 100644 index 0000000..57d2ae0 --- /dev/null +++ b/docs/source-app/workflows/run_app_snippet.rst @@ -0,0 +1,33 @@ +:orphan: + +*********** +Run the app +*********** + +.. raw:: html + +
+
+ +Run the app with the ``run`` command + +.. code:: bash + + lightning run app app.py + +.. raw:: html + +
+
+ + +Add the ``--cloud`` argument to run on the `lightning cloud `_. + +.. code:: bash + + lightning run app app.py --cloud + +.. raw:: html + +
+
diff --git a/docs/source-app/workflows/run_components_on_different_hardware.rst b/docs/source-app/workflows/run_components_on_different_hardware.rst new file mode 100644 index 0000000..9685c34 --- /dev/null +++ b/docs/source-app/workflows/run_components_on_different_hardware.rst @@ -0,0 +1,5 @@ +:orphan: + +#################################### +Run components on different hardware +#################################### diff --git a/docs/source-app/workflows/run_on_private_cloud.rst b/docs/source-app/workflows/run_on_private_cloud.rst new file mode 100644 index 0000000..84d64e9 --- /dev/null +++ b/docs/source-app/workflows/run_on_private_cloud.rst @@ -0,0 +1,26 @@ +:orphan: + +###################### +Run on a private cloud +###################### +**Audience:** Users looking to run Lightning apps on their private cloud accounts. + +---- + +****************************** +Run on a private cloud account +****************************** +For enterprise, startup, and university use cases, Lightning AI can run on your own AWS account (with your own credentials), with all the infrastructure fully managed by us. +To enable this, contact our support team to get started: + +onprem@lightning.ai + +---- + + +*********** +Run on-prem +*********** +For enterprise-level security with full control of the Lightning AI system on your own on-prem cluster, contact our support team to get started: + +onprem@lightning.ai diff --git a/docs/source-app/workflows/run_work_in_parallel.rst b/docs/source-app/workflows/run_work_in_parallel.rst new file mode 100644 index 0000000..90c7b7b --- /dev/null +++ b/docs/source-app/workflows/run_work_in_parallel.rst @@ -0,0 +1,10 @@ +############################# +Run LightningWork in parallel +############################# +**Audience:** Users who want to run a LightningWork in parallel (asynchronously). + +**Prereqs:** You must have finished the `Basic levels <../basic/>`_. + +---- + +.. 
include:: run_work_in_parallel_content.rst diff --git a/docs/source-app/workflows/run_work_in_parallel_content.rst b/docs/source-app/workflows/run_work_in_parallel_content.rst new file mode 100644 index 0000000..1c8d5b3 --- /dev/null +++ b/docs/source-app/workflows/run_work_in_parallel_content.rst @@ -0,0 +1,41 @@ + + + +************************************ +When to run a Component in parallel +************************************ +Run LightningWork in parallel when you want to execute work in the background or at the same time as another work. +An example of when this comes up in machine learning is when data streams in while a model trains. + +---- + +************ +Toy example +************ +By default, a Component must complete before the next one runs. We can enable one +component to start in parallel which allows the code to proceed without having +to wait for the first one to finish. + +.. lit_tabs:: + :descriptions: No parallel components; Allow the train component to run in parallel; When the component runs, it will run in parallel; The next component is unblocked and can now immediately run. + :code_files: /workflows/scripts/parallel/toy_app.py; /workflows/scripts/parallel/toy_parallel.py; /workflows/scripts/parallel/toy_parallel.py; /workflows/scripts/parallel/toy_parallel.py; + :highlights: ; 18; 23; 24; + :enable_run: true + :tab_rows: 3 + :height: 540px + +---- + +******************************* +Multiple components in parallel +******************************* +In this example, we start all 3 components at once. The first two start in parallel, which +allows the third component to run without waiting for the others to finish. + +.. lit_tabs:: + :descriptions: No parallel components; Enable 2 components to run in parallel; Start both components together in parallel; Last component is not blocked and can start immediately.
+ :code_files: /workflows/scripts/parallel/toy_two_parallel_not_started.py; /workflows/scripts/parallel/toy_two_parallel.py; /workflows/scripts/parallel/toy_two_parallel.py; /workflows/scripts/parallel/toy_two_parallel.py + :highlights: ; 18, 19; 23, 24; 25 + :enable_run: true + :tab_rows: 3 + :height: 540px diff --git a/docs/source-app/workflows/run_work_once.rst b/docs/source-app/workflows/run_work_once.rst new file mode 100644 index 0000000..240cde3 --- /dev/null +++ b/docs/source-app/workflows/run_work_once.rst @@ -0,0 +1,13 @@ +########################## +Cache LightningWork Runs +########################## + +**Audience:** Users who want to know how ``LightningWork`` works. + +**Level:** Advanced + +**Prereqs**: Level 16+ and read the `Event Loop guide <../glossary/event_loop.html>`_. + +---- + +.. include:: run_work_once_content.rst diff --git a/docs/source-app/workflows/run_work_once_content.rst b/docs/source-app/workflows/run_work_once_content.rst new file mode 100644 index 0000000..c1890fe --- /dev/null +++ b/docs/source-app/workflows/run_work_once_content.rst @@ -0,0 +1,151 @@ + +******************************************************** +What caching the calls of Work's run method does for you +******************************************************** + +By default, the run method in a LightningWork (Work) "remembers" (caches) the input arguments it is getting called with and does not execute again if called with the same arguments again. +In other words, the run method only executes when the input arguments have never been seen before. + +You can turn caching on or off: + +.. code-block:: python + + # Run only when the input arguments change (default) + work = MyWork(cache_calls=True) + + # Run everytime regardless of whether input arguments change or not + work = MyWork(cache_calls=False) + +To better understand this, imagine that every day you want to sequentially download and process some data and then train a model on that data. 
+As explained in the `Event Loop guide <../glossary/event_loop.html>`_, the Lightning App runs within an infinite while loop, so the pseudo-code of your application might look like this: + +.. code-block:: python + + from datetime import datetime + + # Lightning code + while True: # This is the Lightning Event Loop + + # Your code + today = datetime.now().strftime("%D") # '05/25/22' + data_processor.run(today) + train_model.run(data_processor.data) + +In this scenario, you want your components to run ``once`` a day, and no more than that! But your code is running within an infinite loop, how can this even work? +This is where the Work's internal caching mechanism comes in. By default, Lightning caches a hash of the input provided to its run method and won't re-execute the method if the same input is provided again. +In the example above, the **data_processor** component run method receives the string **"05/25/22"**. It runs one time and any further execution during the day is skipped until tomorrow is reached and the work run method receives **"05/26/22"**. This logic applies every day. +This caching mechanism is inspired by how `React.js Components and Props `_ render websites. Only changes to the inputs re-trigger execution. + +*************** +Caching Example +*************** + +Here's an example of this behavior with LightningWork: + +.. code:: python + :emphasize-lines: 11, 17 + + import lightning as L + + + class ExampleWork(L.LightningWork): + def run(self, *args, **kwargs): + print(f"I received the following props: args: {args} kwargs: {kwargs}") + + + work = ExampleWork() + work.run(value=1) + + # Providing the same value. This won't run as already cached. + work.run(value=1) + work.run(value=1) + work.run(value=1) + work.run(value=1) + + # Changing the provided value. This isn't cached and will run again. + work.run(value=10) + +And you should see the following by running the code above: + +.. 
code-block:: console + + $ python example.py + INFO: Your app has started. View it in your browser: http://127.0.0.1:7501/view + # After you have clicked `run` on the UI. + I received the following props: args: () kwargs: {'value': 1} + I received the following props: args: () kwargs: {'value': 10} + +As you can see, the intermediate runs didn't execute, as we would expect when ``cache_calls=True``. + +*********************************** +Implications of turning caching off +*********************************** + +By setting ``cache_calls=False``, Lightning won't cache the return value and will re-execute the run method on every call. + +.. code:: python + :emphasize-lines: 7 + + from lightning.app import LightningWork + + + class ExampleWork(LightningWork): + def run(self, *args, **kwargs): + print(f"I received the following props: args: {args} kwargs: {kwargs}") + + + work = ExampleWork(cache_calls=False) + work.run(value=1) + + # Providing the same value. Caching is off, so every call runs again. + work.run(value=1) + work.run(value=1) + work.run(value=1) + work.run(value=1) + + # Changing the provided value. This isn't cached and will run again. + work.run(value=10) + +.. code-block:: console + + $ python example.py + INFO: Your app has started. View it in your browser: http://127.0.0.1:7501/view + # After you have clicked `run` on the UI. + I received the following props: args: () kwargs: {'value': 1} + I received the following props: args: () kwargs: {'value': 1} + I received the following props: args: () kwargs: {'value': 1} + I received the following props: args: () kwargs: {'value': 1} + I received the following props: args: () kwargs: {'value': 1} + I received the following props: args: () kwargs: {'value': 10} + +Be aware that when setting both ``cache_calls=False`` and ``parallel=False`` on a work, the code after the ``self.work.run()`` is unreachable +as the work continuously executes in a blocking way. + +.. 
code-block:: python + :emphasize-lines: 9-10 + + from lightning.app import LightningApp, LightningFlow, LightningWork + + + class Flow(LightningFlow): + def __init__(self): + super().__init__() + + self.work = Work(cache_calls=False, parallel=False) + + def run(self): + print("HERE BEFORE") + self.work.run() + print("HERE AFTER") + + + app = LightningApp(Flow()) + +.. code-block:: console + + $ lightning run app app.py + INFO: Your app has started. View it in your browser: http://127.0.0.1:7501/view + print("HERE BEFORE") + print("HERE BEFORE") + print("HERE BEFORE") + ... diff --git a/docs/source-app/workflows/schedule_apps.rst b/docs/source-app/workflows/schedule_apps.rst new file mode 100644 index 0000000..7b596cd --- /dev/null +++ b/docs/source-app/workflows/schedule_apps.rst @@ -0,0 +1,5 @@ +:orphan: + +################# +Schedule App Runs +################# diff --git a/docs/source-app/workflows/scripts/parallel/toy_app.py b/docs/source-app/workflows/scripts/parallel/toy_app.py new file mode 100644 index 0000000..05f25fd --- /dev/null +++ b/docs/source-app/workflows/scripts/parallel/toy_app.py @@ -0,0 +1,27 @@ +# app.py +import lightning as L + + +class TrainComponent(L.LightningWork): + def run(self, message): + for i in range(100000000000): + print(message, i) + +class AnalyzeComponent(L.LightningWork): + def run(self, message): + for i in range(100000000000): + print(message, i) + +class LitWorkflow(L.LightningFlow): + def __init__(self) -> None: + super().__init__() + self.train = TrainComponent(cloud_compute=L.CloudCompute('cpu')) + self.analyze = AnalyzeComponent(cloud_compute=L.CloudCompute('cpu')) + + + def run(self): + self.train.run("machine A counting") + self.analyze.run("machine B counting") + + +app = L.LightningApp(LitWorkflow()) diff --git a/docs/source-app/workflows/scripts/parallel/toy_parallel.py b/docs/source-app/workflows/scripts/parallel/toy_parallel.py new file mode 100644 index 0000000..00d6178 --- /dev/null +++ 
b/docs/source-app/workflows/scripts/parallel/toy_parallel.py @@ -0,0 +1,27 @@ +# app.py +import lightning as L + + +class TrainComponent(L.LightningWork): + def run(self, message): + for i in range(100000000000): + print(message, i) + +class AnalyzeComponent(L.LightningWork): + def run(self, message): + for i in range(100000000000): + print(message, i) + +class LitWorkflow(L.LightningFlow): + def __init__(self) -> None: + super().__init__() + self.train = TrainComponent(cloud_compute=L.CloudCompute('cpu'), parallel=True) + self.analyze = AnalyzeComponent(cloud_compute=L.CloudCompute('cpu')) + + + def run(self): + self.train.run("machine A counting") + self.analyze.run("machine B counting") + + +app = L.LightningApp(LitWorkflow()) diff --git a/docs/source-app/workflows/scripts/parallel/toy_two_parallel.py b/docs/source-app/workflows/scripts/parallel/toy_two_parallel.py new file mode 100644 index 0000000..1b04e4e --- /dev/null +++ b/docs/source-app/workflows/scripts/parallel/toy_two_parallel.py @@ -0,0 +1,27 @@ +# app.py +import lightning as L + + +class TrainComponent(L.LightningWork): + def run(self, message): + for i in range(100000000000): + print(message, i) + +class AnalyzeComponent(L.LightningWork): + def run(self, message): + for i in range(100000000000): + print(message, i) + +class LitWorkflow(L.LightningFlow): + def __init__(self) -> None: + super().__init__() + self.train = TrainComponent(cloud_compute=L.CloudCompute('cpu'), parallel=True) + self.baseline_1 = TrainComponent(cloud_compute=L.CloudCompute('cpu'), parallel=True) + self.analyze = AnalyzeComponent(cloud_compute=L.CloudCompute('cpu')) + + def run(self): + self.train.run("machine A counting") + self.baseline_1.run("machine C counting") + self.analyze.run("machine B counting") + +app = L.LightningApp(LitWorkflow()) diff --git a/docs/source-app/workflows/scripts/parallel/toy_two_parallel_not_started.py b/docs/source-app/workflows/scripts/parallel/toy_two_parallel_not_started.py new file mode 100644 
index 0000000..61fc9d1 --- /dev/null +++ b/docs/source-app/workflows/scripts/parallel/toy_two_parallel_not_started.py @@ -0,0 +1,27 @@ +# app.py +import lightning as L + + +class TrainComponent(L.LightningWork): + def run(self, message): + for i in range(100000000000): + print(message, i) + +class AnalyzeComponent(L.LightningWork): + def run(self, message): + for i in range(100000000000): + print(message, i) + +class LitWorkflow(L.LightningFlow): + def __init__(self) -> None: + super().__init__() + self.train = TrainComponent(cloud_compute=L.CloudCompute('cpu')) + self.baseline_1 = TrainComponent(cloud_compute=L.CloudCompute('cpu')) + self.analyze = AnalyzeComponent(cloud_compute=L.CloudCompute('cpu')) + + def run(self): + self.train.run("machine A counting") + self.baseline_1.run("machine C counting") + self.analyze.run("machine B counting") + +app = L.LightningApp(LitWorkflow()) diff --git a/docs/source-app/workflows/share_app.rst b/docs/source-app/workflows/share_app.rst new file mode 100644 index 0000000..87045bd --- /dev/null +++ b/docs/source-app/workflows/share_app.rst @@ -0,0 +1,33 @@ +############ +Share an App +############ +**Audience:** Users who want to show off their work. + +---- + +*********************************** +Option 1: Run on the cloud to share +*********************************** +To share an app, simply run your app on the cloud: + +.. code:: bash + + lightning run app app.py --cloud + +Then share the link that's generated (`like this one `_). + +---- + +********************************** +Option 2: Expose a tunnel to share +********************************** +If you'd like to host the app yourself, feel free to run it in local mode +and expose the app's URL. + +Run locally: + +.. code:: bash + + lightning run app app.py + +And then, use one of the many guides to `expose a tunnel `_.
diff --git a/docs/source-app/workflows/share_files_between_components.rst b/docs/source-app/workflows/share_files_between_components.rst new file mode 100644 index 0000000..4eddc68 --- /dev/null +++ b/docs/source-app/workflows/share_files_between_components.rst @@ -0,0 +1,120 @@ +:orphan: + +############################## +Share Files Between Components +############################## + +.. note:: The contents of this page are still in progress! + +**Audience:** Users who want to share files between components. + +---- + +********************************** +Why do I need distributed storage? +********************************** +In a Lightning App some components can be executed on their own hardware. Distributed storage +enables a file saved by a component on one machine to be used by components on other machines (transparently). + +If you've asked the question "how do I use the checkpoint from this model to deploy this other thing", you've +needed distributed storage. + +---- + +************ +Write a file +************ +To write a file, first create a reference to the file with the :class:`~lightning.app.storage.Path` class, then write to it: + +.. code:: python + + from lightning.app.storage import Path + + # file reference + boring_file_reference = Path("boring_file.txt") + + # write to that file + with open(boring_file_reference, "w") as f: + f.write("yolo") + + +---- + +********** +Use a file +********** +To use a file, pass the reference to the file: + +.. code:: python + + f = open(boring_file_reference, "r") + print(f.read()) + +---- + +.. + ******************************** + Create a directory - coming soon + ******************************** + + + ---- + + ****************************** + Use a directory - coming soon + ****************************** + TODO + + ---- + +********************************* +Example: Share a model checkpoint +********************************* +A common workflow in ML is to use a checkpoint created by another component.
+First, define a component that saves a checkpoint: + +.. literalinclude:: ./share_files_between_components/app.py + :lines: -19 + +Next, define a component that needs the checkpoints: + +.. literalinclude:: ./share_files_between_components/app.py + :lines: 20-31 + +Link both components via a parent component: + +.. literalinclude:: ./share_files_between_components/app.py + :lines: 32- + + +Run the app above with the following command: + +.. code-block:: bash + + lightning run app docs/source/workflows/share_files_between_components/app.py + +.. code-block:: console + + Your Lightning App is starting. This won't take long. + INFO: Your app has started. View it in your browser: http://127.0.0.1:7501/view + Loaded checkpoint_1: tensor([0, 1, 2, 3, 4]) + Loaded checkpoint_2: tensor([0, 1, 2, 3, 4]) + + +For example, here we save a file on one component and use it in another component: + +.. code:: python + + from lightning.app.storage import Path + + + class ComponentA(LightningWork): + def __init__(self): + super().__init__() + self.boring_path = None + + def run(self): + # This should be used as a REFERENCE to the file. 
+ self.boring_path = Path("boring_file.txt") + with open(self.boring_path, "w") as f: + f.write(FILE_CONTENT) diff --git a/docs/source-app/workflows/share_files_between_components/app.py b/docs/source-app/workflows/share_files_between_components/app.py new file mode 100644 index 0000000..6b89248 --- /dev/null +++ b/docs/source-app/workflows/share_files_between_components/app.py @@ -0,0 +1,48 @@ +import os + +import torch + +import lightning as L +from lightning.app.storage import Path + + +class ModelTraining(L.LightningWork): + def __init__(self, *args, **kwargs): + super().__init__(*args, **kwargs) + self.checkpoints_path = Path("./checkpoints") + + def run(self): + # make fake checkpoints + checkpoint_1 = torch.tensor([0, 1, 2, 3, 4]) + checkpoint_2 = torch.tensor([0, 1, 2, 3, 4]) + os.makedirs(self.checkpoints_path, exist_ok=True) + checkpoint_path = str(self.checkpoints_path / "checkpoint_{}.ckpt") + torch.save(checkpoint_1, str(checkpoint_path).format("1")) + torch.save(checkpoint_2, str(checkpoint_path).format("2")) + + +class ModelDeploy(L.LightningWork): + def __init__(self, ckpt_path, *args, **kwargs): + super().__init__() + self.ckpt_path = ckpt_path + + def run(self): + ckpts = os.listdir(self.ckpt_path) + checkpoint_1 = torch.load(os.path.join(self.ckpt_path, ckpts[0])) + checkpoint_2 = torch.load(os.path.join(self.ckpt_path, ckpts[1])) + print(f"Loaded checkpoint_1: {checkpoint_1}") + print(f"Loaded checkpoint_2: {checkpoint_2}") + + +class LitApp(L.LightningFlow): + def __init__(self): + super().__init__() + self.train = ModelTraining() + self.deploy = ModelDeploy(ckpt_path=self.train.checkpoints_path) + + def run(self): + self.train.run() + self.deploy.run() + + +app = L.LightningApp(LitApp()) diff --git a/docs/source-app/workflows/ssh/index.rst b/docs/source-app/workflows/ssh/index.rst new file mode 100644 index 0000000..e0bcbc1 --- /dev/null +++ b/docs/source-app/workflows/ssh/index.rst @@ -0,0 +1,119 @@ + +######################## +Debug cloud 
apps via SSH +######################## + +**Audience:** Users that want to debug their cloud apps on their own machine. + +SSH allows you to access Lightning components running on Lightning cloud in real-time using your own local machine. +This can be used for debugging apps running on the cloud: inspecting file system or monitoring the runtime environment. +This is often the case with applications that rely on GPUs. + +You can inspect the entire file system and monitor the runtime environment. + +---- + +************************ +Add SSH key to Lightning +************************ + +Before you can SSH to cloud machines, you will need to generate a new private SSH key, add it to the SSH agent, and add the public SSH key to your account on Lightning. +The following steps are one-time setup to allow you to SSH into your cloud machines. + + +Step 1: Create an SSH key +========================== + +Open a terminal and run the following command (replace email with the address you used in your lightning.ai account): + +.. code:: bash + + # make the ssh key (if you don't have one) + $ ssh-keygen -t ed25519 -C "your_email@example.com" + +This creates a new SSH key, using the provided email as a label. + +At the prompt, type a secure passphrase. + +.. code:: bash + + > Enter passphrase (empty for no passphrase): [Type a passphrase] + > Enter same passphrase again: [Type passphrase again] + + +Step 2: Add your key to Lightning +================================= + +You can add SSH keys using Lightning.ai website (Lightning.ai > Profile > Keys) or via this CLI command: + +.. code:: bash + + $ lightning create ssh-key --public-key ~/.ssh/id_ed25519.pub + +You are now ready to access your Lightning Flow and Work containers. + +---- + +********************************************************** +SSH to your cloud app +********************************************************** + +Ensure you have a running Lightning application in the cloud: + +.. 
code:: bash + + $ lightning run app app.py --cloud --name my-app + + +Next, start your ssh-agent in the background: + +.. code:: bash + + # add the key to the ssh-agent (to avoid having to explicitly state key on each connection) + # to start the agent, run the following + $ eval "$(ssh-agent -s)" + > Agent pid 12345 + +Add your generated ssh key: + +.. code:: bash + + $ ssh-add ~/.ssh/id_ed25519 + +Verify your ssh-key is properly loaded: + +.. code:: bash + + $ ssh-add -L + ssh-ed25519 AAAAC3NzaC1lZDI1NTE5AAAAIAn8mYRnRG1banQcfXPCUC6R8FvQS+YgfIsl70/dD3Te your_email@example.com + + +You can now SSH into any app you are running on the cloud. + +To view all apps, simply use the following: + +.. code:: bash + + $ lightning list apps + +Or, to select an app via a prompt: + +.. code:: bash + + $ lightning ssh + +To connect to a specific app flow use: + +.. code:: bash + + $ lightning list apps + $ lightning ssh --app-name <app-name> # taken from previous app listing + +To connect to a LightningWork component use: + +.. code:: bash + + $ lightning ssh --app-name <app-name> --component-name <component-name> + +The component name is the variable name of your LightningWork instances in Python. +If you want to access your flow, use "flow" as the component name. diff --git a/docs/source-app/workflows/test_an_app.rst b/docs/source-app/workflows/test_an_app.rst new file mode 100644 index 0000000..c51ae3a --- /dev/null +++ b/docs/source-app/workflows/test_an_app.rst @@ -0,0 +1,5 @@ +:orphan: + +########### +Test an App +########### diff --git a/docs/source-fabric/Makefile b/docs/source-fabric/Makefile new file mode 100644 index 0000000..268e095 --- /dev/null +++ b/docs/source-fabric/Makefile @@ -0,0 +1,19 @@ +# Minimal makefile for Sphinx documentation +# + +# You can set these variables from the command line. +SPHINXOPTS = -T -W +SPHINXBUILD = sphinx-build +SOURCEDIR = . +BUILDDIR = ../build + +# Put it first so that "make" without argument is like "make help". 
+help: + @$(SPHINXBUILD) -M help "$(SOURCEDIR)" "$(BUILDDIR)" $(SPHINXOPTS) $(O) + +.PHONY: help Makefile + +# Catch-all target: route all unknown targets to Sphinx using the new +# "make mode" option. $(O) is meant as a shortcut for $(SPHINXOPTS). +%: Makefile + @$(SPHINXBUILD) -M $@ "$(SOURCEDIR)" "$(BUILDDIR)" $(SPHINXOPTS) $(O) diff --git a/docs/source-fabric/_static/copybutton.js b/docs/source-fabric/_static/copybutton.js new file mode 100644 index 0000000..453363c --- /dev/null +++ b/docs/source-fabric/_static/copybutton.js @@ -0,0 +1,64 @@ +/* Copied from the official Python docs: https://docs.python.org/3/_static/copybutton.js */ +$(document).ready(function() { + /* Add a [>>>] button on the top-right corner of code samples to hide + * the >>> and ... prompts and the output and thus make the code + * copyable. */ + var div = $('.highlight-python .highlight,' + + '.highlight-python3 .highlight,' + + '.highlight-pycon .highlight,' + + '.highlight-default .highlight'); + var pre = div.find('pre'); + + // get the styles from the current theme + pre.parent().parent().css('position', 'relative'); + var hide_text = 'Hide the prompts and output'; + var show_text = 'Show the prompts and output'; + var border_width = pre.css('border-top-width'); + var border_style = pre.css('border-top-style'); + var border_color = pre.css('border-top-color'); + var button_styles = { + 'cursor':'pointer', 'position': 'absolute', 'top': '0', 'right': '0', + 'border-color': border_color, 'border-style': border_style, + 'border-width': border_width, 'color': border_color, 'text-size': '75%', + 'font-family': 'monospace', 'padding-left': '0.2em', 'padding-right': '0.2em', + 'border-radius': '0 3px 0 0' + } + + // create and add the button to all the code blocks that contain >>> + div.each(function(index) { + var jthis = $(this); + if (jthis.find('.gp').length > 0) { + var button = $('>>>'); + button.css(button_styles) + button.attr('title', hide_text); + button.data('hidden', 'false'); + 
jthis.prepend(button); + } + // tracebacks (.gt) contain bare text elements that need to be + // wrapped in a span to work with .nextUntil() (see later) + jthis.find('pre:has(.gt)').contents().filter(function() { + return ((this.nodeType == 3) && (this.data.trim().length > 0)); + }).wrap(''); + }); + + // define the behavior of the button when it's clicked + $('.copybutton').click(function(e){ + e.preventDefault(); + var button = $(this); + if (button.data('hidden') === 'false') { + // hide the code output + button.parent().find('.go, .gp, .gt').hide(); + button.next('pre').find('.gt').nextUntil('.gp, .go').css('visibility', 'hidden'); + button.css('text-decoration', 'line-through'); + button.attr('title', show_text); + button.data('hidden', 'true'); + } else { + // show the code output + button.parent().find('.go, .gp, .gt').show(); + button.next('pre').find('.gt').nextUntil('.gp, .go').css('visibility', 'visible'); + button.css('text-decoration', 'none'); + button.attr('title', hide_text); + button.data('hidden', 'false'); + } + }); +}); diff --git a/docs/source-fabric/_static/images/icon.svg b/docs/source-fabric/_static/images/icon.svg new file mode 100644 index 0000000..e88fc19 --- /dev/null +++ b/docs/source-fabric/_static/images/icon.svg @@ -0,0 +1,9 @@ + + + + + + + + + diff --git a/docs/source-fabric/_static/images/logo-large.svg b/docs/source-fabric/_static/images/logo-large.svg new file mode 100644 index 0000000..39531f9 --- /dev/null +++ b/docs/source-fabric/_static/images/logo-large.svg @@ -0,0 +1,9 @@ + + + + + + + + + diff --git a/docs/source-fabric/_static/images/logo-small.svg b/docs/source-fabric/_static/images/logo-small.svg new file mode 100644 index 0000000..1f523a5 --- /dev/null +++ b/docs/source-fabric/_static/images/logo-small.svg @@ -0,0 +1,9 @@ + + + + + + + + + diff --git a/docs/source-fabric/_static/images/logo.png b/docs/source-fabric/_static/images/logo.png new file mode 100644 index 0000000..392c965 Binary files /dev/null and 
b/docs/source-fabric/_static/images/logo.png differ diff --git a/docs/source-fabric/_static/images/logo.svg b/docs/source-fabric/_static/images/logo.svg new file mode 100644 index 0000000..7c0920c --- /dev/null +++ b/docs/source-fabric/_static/images/logo.svg @@ -0,0 +1,21 @@ + + + + + + + + + + + + + + + + + + + + + diff --git a/source/_static/main.css b/docs/source-fabric/_static/main.css similarity index 100% rename from source/_static/main.css rename to docs/source-fabric/_static/main.css diff --git a/docs/_static/autosummary/module.rst b/docs/source-fabric/_templates/autosummary/module.rst similarity index 100% rename from docs/_static/autosummary/module.rst rename to docs/source-fabric/_templates/autosummary/module.rst diff --git a/docs/source-fabric/_templates/classtemplate.rst b/docs/source-fabric/_templates/classtemplate.rst new file mode 100644 index 0000000..482db13 --- /dev/null +++ b/docs/source-fabric/_templates/classtemplate.rst @@ -0,0 +1,14 @@ +.. role:: hidden + :class: hidden-section +.. currentmodule:: {{ module }} + + +{{ name | underline }} + +.. autoclass:: {{ name }} + :members: + + +.. + autogenerated from source-fabric/_templates/classtemplate.rst + note it does not have :inherited-members: diff --git a/docs/source-fabric/_templates/classtemplate_no_index.rst b/docs/source-fabric/_templates/classtemplate_no_index.rst new file mode 100644 index 0000000..858c37b --- /dev/null +++ b/docs/source-fabric/_templates/classtemplate_no_index.rst @@ -0,0 +1,12 @@ +:orphan: + +.. role:: hidden + :class: hidden-section +.. currentmodule:: {{ module }} + + +{{ name | underline }} + +.. 
autoclass:: {{ name }} + :members: + :noindex: diff --git a/docs/_static/layout.html b/docs/source-fabric/_templates/layout.html similarity index 100% rename from docs/_static/layout.html rename to docs/source-fabric/_templates/layout.html diff --git a/docs/source-fabric/_templates/theme_variables.jinja b/docs/source-fabric/_templates/theme_variables.jinja new file mode 100644 index 0000000..cce7263 --- /dev/null +++ b/docs/source-fabric/_templates/theme_variables.jinja @@ -0,0 +1,15 @@ +{%- set external_urls = { + 'github': 'https://github.com/Lightning-AI/lightning', + 'github_issues': 'https://github.com/Lightning-AI/lightning/issues', + 'contributing': 'https://github.com/Lightning-AI/lightning/blob/master/.github/CONTRIBUTING.md', + 'governance': 'https://lightning.ai/docs/pytorch/latest/community/governance.html', + 'docs': 'https://lightning.ai/docs/fabric/', + 'twitter': 'https://twitter.com/LightningAI', + 'home': 'https://lightning.ai/docs/fabric/', + 'get_started': '', + 'blog': 'https://lightning.ai/pages/blog/', + 'support': '', + 'community': 'https://www.pytorchlightning.ai/community', + 'forums': 'https://lightning.ai/forums/', +} +-%} diff --git a/docs/source-fabric/advanced/distributed_communication.rst b/docs/source-fabric/advanced/distributed_communication.rst new file mode 100644 index 0000000..83aac5c --- /dev/null +++ b/docs/source-fabric/advanced/distributed_communication.rst @@ -0,0 +1,286 @@ +########################################### +Communication between distributed processes +########################################### + +With Fabric, you can easily access information about a process or send data between processes with a standardized API and agnostic to the distributed strategy. + + +---- + + +******************* +Rank and world size +******************* + +The rank assigned to a process is a zero-based index in the range of *0, ..., world size - 1*, where *world size* is the total number of distributed processes. 
+If you are using multi-GPU, think of the rank as the *GPU ID* or *GPU index*, although rank generally extends to distributed processing. + +The rank is unique across all processes, regardless of how they are distributed across machines, and it is therefore also called **global rank**. +We can also identify processes by their **local rank**, which is unique among processes running on the same machine but is not unique globally across all machines. +Finally, each process is associated with a **node rank** in the range *0, ..., num nodes - 1*, which identifies which machine (node) the process is running on. + +.. figure:: https://pl-public-data.s3.amazonaws.com/assets_lightning/fabric_collectives_ranks.jpeg + :alt: The different type of process ranks: Local, global, node. + :width: 100% + +Here is how you launch multiple processes in Fabric: + +.. code-block:: python + + from lightning.fabric import Fabric + + # Devices and num_nodes determine how many processes there are + fabric = Fabric(devices=2, num_nodes=3) + fabric.launch() + +Learn more about :doc:`launching distributed training <../fundamentals/launch>`. +And here is how you access all rank and world size information: + +.. code-block:: python + + # The total number of processes running across all devices and nodes + fabric.world_size # 2 * 3 = 6 + + # The global index of the current process across all devices and nodes + fabric.global_rank # -> {0, 1, 2, 3, 4, 5} + + # The index of the current process among the processes running on the local node + fabric.local_rank # -> {0, 1} + + # The index of the current node + fabric.node_rank # -> {0, 1, 2} + + # Do something only on rank 0 + if fabric.global_rank == 0: + ... + + +.. _race conditions: + +Avoid race conditions +===================== + +Access to the rank information helps you avoid *race conditions* which could crash your script or lead to corrupted data. 
+Such conditions can occur when multiple processes try to write to the same file simultaneously, for example, writing a checkpoint file or downloading a dataset. +Avoid this from happening by guarding your logic with a rank check: + +.. code-block:: python + + # Only write files from one process (rank 0) ... + if fabric.global_rank == 0: + with open("output.txt", "w") as file: + file.write(...) + + # ... or save from all processes but don't write to the same file + with open(f"output-{fabric.global_rank}.txt", "w") as file: + file.write(...) + + # Multi-node: download a dataset, the filesystem between nodes is shared + if fabric.global_rank == 0: + download_dataset() + + # Multi-node: download a dataset, the filesystem between nodes is NOT shared + if fabric.local_rank == 0: + download_dataset() + +Another type of race condition is when one or multiple processes try to access a resource before it is available. +For example, when rank 0 downloads a dataset, all other processes should *wait* for the download to complete before they start reading the contents. +This can be achieved with a **barrier**. + + +---- + + +******* +Barrier +******* + +The barrier forces every process to wait until all processes have reached it. +In other words, it is a **synchronization**. + +.. figure:: https://pl-public-data.s3.amazonaws.com/assets_lightning/fabric_collectives_barrier.jpeg + :alt: The barrier for process synchronization + :width: 100% + +A barrier is needed when processes do different amounts of work and as a result fall out of sync. + +.. code-block:: python + + fabric = Fabric(accelerator="cpu", devices=4) + fabric.launch() + + # Simulate each process taking a different amount of time + sleep(2 * fabric.global_rank) + print(f"Process {fabric.global_rank} is done.") + + # Wait for all processes to reach the barrier + fabric.barrier() + print("All processes reached the barrier!") + + +A more realistic scenario is when downloading data. 
+Here, we need to ensure that processes only start to load the data once it has completed downloading. +Since downloading should be done on rank 0 only to :ref:`avoid race conditions <race conditions>`, we need a barrier: + +.. code-block:: python + + if fabric.global_rank == 0: + print("Downloading dataset. This can take a while ...") + download_dataset("http://...") + + # All other processes wait here until rank 0 is done with downloading: + fabric.barrier() + + # After everyone reached the barrier, they can access the downloaded files: + dataset = load_dataset() + + +Specifically for the use case of downloading and reading data, there is a convenience context manager that combines both the rank-check and the barrier: + +.. code-block:: python + + with fabric.rank_zero_first(): + if not dataset_exists(): + download_dataset("http://...") + dataset = load_dataset() + +With :meth:`~lightning.fabric.fabric.Fabric.rank_zero_first`, it is guaranteed that process 0 executes the code block first before all others can enter it. + + +---- + +.. _broadcast collective: + +********* +Broadcast +********* + +.. figure:: https://pl-public-data.s3.amazonaws.com/assets_lightning/fabric_collectives_broadcast.jpeg + :alt: The broadcast collective operation + :width: 100% + +The broadcast operation sends a tensor of data from one process to all other processes so that all end up with the same data. + +.. code-block:: python + + fabric = Fabric(...) + + # Transfer a tensor from one process to all the others + result = fabric.broadcast(tensor) + + # By default, the source is the process rank 0 ... + result = fabric.broadcast(tensor, src=0) + + # ... which can be changed to a different rank + result = fabric.broadcast(tensor, src=3) + + +Full example: + +.. 
code-block:: python + + fabric = Fabric(devices=4, accelerator="cpu") + fabric.launch() + + # Data is different on each process + learning_rate = torch.rand(1) + print("Before broadcast:", learning_rate) + + # Transfer the tensor from one process to all the others + learning_rate = fabric.broadcast(learning_rate) + print("After broadcast:", learning_rate) + + +---- + + +****** +Gather +****** + +.. figure:: https://pl-public-data.s3.amazonaws.com/assets_lightning/fabric_collectives_all-gather.jpeg + :alt: The All-gather collective operation + :width: 100% + +The gather operation transfers the tensors from each process to every other process and stacks the results. +As opposed to the :ref:`broadcast <broadcast collective>`, every process gets the data from every other process, not just from a particular rank. + +.. code-block:: python + + fabric = Fabric(...) + + # Gather the data from all processes + result = fabric.all_gather(tensor) + + # Tip: Turn off gradient syncing if you don't need to back-propagate through it + with torch.no_grad(): + result = fabric.all_gather(tensor) + + # Also works with a (nested) collection of tensors (dict, list, tuple): + collection = {"loss": torch.tensor(...), "data": ...} + gathered_collection = fabric.all_gather(collection) + + +Full example: + +.. code-block:: python + + fabric = Fabric(devices=4, accelerator="cpu") + fabric.launch() + + # Data is different in each process + data = torch.tensor(10 * fabric.global_rank) + + # Every process gathers the tensors from all other processes + # and stacks the result: + result = fabric.all_gather(data) + print("Result of all-gather:", result) # tensor([ 0, 10, 20, 30]) + + +---- + + +****** +Reduce +****** + +.. figure:: https://pl-public-data.s3.amazonaws.com/assets_lightning/fabric_collectives_all-reduce.jpeg + :alt: The All-reduce collective operation + :width: 100% + + +The reduction is an operation that takes multiple values (tensors) as input and returns a single value. 
+An example of a reduction is *summation*, e.g., ``torch.sum()``. +The :meth:`~lightning.fabric.fabric.Fabric.all_reduce` operation allows you to apply a reduction across multiple processes: + +.. code-block:: python + + fabric = Fabric(...) + + # Compute the mean of a tensor across processes: + result = fabric.all_reduce(tensor, reduce_op="mean") + + # Or the sum: + result = fabric.all_reduce(tensor, reduce_op="sum") + + # Also works with a (nested) collection of tensors (dict, list, tuple): + collection = {"loss": torch.tensor(...), "data": ...} + reduced_collection = fabric.all_reduce(collection) + +The support of options for ``reduce_op`` depends on the strategy used, but all strategies support *sum* and *mean*. + +Full example: + +.. code-block:: python + + fabric = Fabric(devices=4, accelerator="cpu") + fabric.launch() + + # Data is different in each process + data = torch.tensor(10 * fabric.global_rank) + + # Sum the tensors from every process + result = fabric.all_reduce(data, reduce_op="sum") + + # sum(0 + 10 + 20 + 30) = tensor(60) + print("Result of all-reduce:", result) diff --git a/docs/source-fabric/advanced/gradient_accumulation.rst b/docs/source-fabric/advanced/gradient_accumulation.rst new file mode 100644 index 0000000..0fb5a31 --- /dev/null +++ b/docs/source-fabric/advanced/gradient_accumulation.rst @@ -0,0 +1,55 @@ +############################### +Efficient Gradient Accumulation +############################### + +Gradient accumulation works the same way with Fabric as in PyTorch. +You are in control of which model accumulates and at what frequency: + +.. code-block:: python + + for iteration, batch in enumerate(dataloader): + # Accumulate gradient 8 batches at a time + is_accumulating = iteration % 8 != 0 + + output = model(input) + loss = ... + + # .backward() accumulates when .zero_grad() wasn't called + fabric.backward(loss) + ... 
+ + if not is_accumulating: + # Step the optimizer after the accumulation phase is over + optimizer.step() + optimizer.zero_grad() + + +However, in a distributed setting, for example, when training across multiple GPUs or machines, doing it this way can significantly slow down your training loop. +To optimize this code, we should skip the synchronization in ``.backward()`` during the accumulation phase. +We only need to synchronize the gradients when the accumulation phase is over! +This can be achieved by adding the :meth:`~lightning.fabric.fabric.Fabric.no_backward_sync` context manager over the :meth:`~lightning.fabric.fabric.Fabric.backward` call: + +.. code-block:: diff + + for iteration, batch in enumerate(dataloader): + + # Accumulate gradient 8 batches at a time + is_accumulating = iteration % 8 != 0 + + + with fabric.no_backward_sync(model, enabled=is_accumulating): + output = model(input) + loss = ... + + # .backward() accumulates when .zero_grad() wasn't called + fabric.backward(loss) + + ... + + if not is_accumulating: + # Step the optimizer after accumulation phase is over + optimizer.step() + optimizer.zero_grad() + + +For those strategies that don't support it, a warning is emitted. For single-device strategies, it is a no-op. +Both the model's ``.forward()`` and the ``fabric.backward()`` call need to run under this context. diff --git a/docs/source-fabric/advanced/model_parallel/fsdp.rst b/docs/source-fabric/advanced/model_parallel/fsdp.rst new file mode 100644 index 0000000..5035554 --- /dev/null +++ b/docs/source-fabric/advanced/model_parallel/fsdp.rst @@ -0,0 +1,520 @@ +########################################### +Training models with billions of parameters +########################################### + +Use Fully Sharded Data Parallel (FSDP) to train large models with billions or trillions of parameters efficiently on multiple GPUs and across multiple machines. + +.. note:: This is an experimental feature. 
+ + +Today, large models with billions of parameters are trained with many GPUs across several machines in parallel. +Even a single A100 GPU with 80 GB of VRAM (the biggest today) is not enough to train just a 30B parameter model (even with batch size 1 and 16-bit precision). +The memory consumption for training is generally made up of + +1. the model parameters, +2. the optimizer states (e.g., Adam has two additional exponential averages per parameter), +3. the layer activations (forward) and +4. the gradients (backward). + +| + +When the sum of these memory components exceeds the VRAM of a single GPU, regular data-parallel training (DDP) can no longer be employed. +One of the methods that can alleviate this limitation is called **model-parallel** training, known as **FSDP** in PyTorch. In this guide, you will learn how to effectively scale large models with it. + + +---- + + +*************************** +Checklist: When to use FSDP +*************************** + +| + +✅ I have multiple GPUs + +✅ I have tried regular DDP training with batch size 1 but I run out of memory + +✅ I have PyTorch 2.0 or newer installed + + +---- + + +********************* +Enable FSDP in Fabric +********************* + + +To enable model-parallel training with FSDP in a single-line change, set ``strategy="fsdp"``: + +.. code-block:: python + + fabric = L.Fabric(accelerator="cuda", devices=2, strategy="fsdp") + +As we will see in the next sections, there are many settings we can tune to optimize memory usage and throughput, scaling to massively large models. +This is equivalent to the above, but will let us configure additional settings later: + +.. code-block:: python + + from lightning.fabric.strategies import FSDPStrategy + + fabric = L.Fabric(accelerator="cuda", devices=2, strategy=FSDPStrategy()) + + +Here is a full code example: + +.. 
code-block:: python + + import torch + import torch.nn as nn + import torch.nn.functional as F + + import lightning as L + from lightning.fabric.strategies import FSDPStrategy + from lightning.pytorch.demos import Transformer, WikiText2 + + fabric = L.Fabric(accelerator="cuda", devices=2, strategy=FSDPStrategy()) + fabric.launch() + + fabric.seed_everything(42) + + with fabric.rank_zero_first(): + dataset = WikiText2() + + # 1B parameters + model = Transformer(vocab_size=dataset.vocab_size, nlayers=32, nhid=4096, ninp=1024, nhead=64) + optimizer = torch.optim.Adam(model.parameters(), lr=0.1) + + model, optimizer = fabric.setup(model, optimizer) + + for i in range(10): + input, target = fabric.to_device(dataset[i]) + output = model(input.unsqueeze(0), target.unsqueeze(0)) + loss = F.nll_loss(output, target.view(-1)) + fabric.backward(loss) + optimizer.step() + optimizer.zero_grad() + fabric.print(loss.item()) + + fabric.print(torch.cuda.memory_summary()) + + +We will reuse this Transformer example throughout the guide, optimize speed and memory usage, and compare it to regular DDP training. + + +---- + + +********************* +Identify large layers +********************* + +Models that have many large layers like linear layers in LLMs, ViTs, etc. with >100M parameters will benefit the most from FSDP because the memory they consume through parameters, activations and corresponding optimizer states can be evenly split across all GPUs. +However, one should avoid splitting small layers that have a few thousand parameters because communication overhead would dominate and slow the training down. +We can specify a list of layer classes in the **wrapping policy** to inform FSDP which parameters it should wrap: + +.. code-block:: python + + # 1. Define a set of layers that FSDP should manage + # Here we are choosing the large encoder and decoder layers + policy = {nn.TransformerEncoderLayer, nn.TransformerDecoderLayer} + + # 2. 
Pass the policy to the FSDPStrategy object + strategy = FSDPStrategy(auto_wrap_policy=policy) + + fabric = L.Fabric(..., strategy=strategy) + +.. collapse:: Alternative ways to define the policy (Lightning < 2.1) + + The ``auto_wrap_policy`` argument also accepts the old-style function-policies. For example: + + .. code-block:: python + + from functools import partial + + # 1. Import a suiting wrapping policy from PyTorch + from torch.distributed.fsdp.wrap import size_based_auto_wrap_policy + + # 2. Configure the policy + policy = partial(size_based_auto_wrap_policy, min_num_params=10000) + + # 3. Pass it to the FSDPStrategy object + strategy = FSDPStrategy(auto_wrap_policy=policy) + + PyTorch provides several of these functional policies under :mod:`torch.distributed.fsdp.wrap`. + +| + +Verify that FSDP works with your model by comparing the peak memory usage printed in the CUDA memory summary (see example above) with regular DDP training. +You should see a decrease in allocated memory and a slight increase in iteration time: + +.. list-table:: + :widths: 25 25 25 + :header-rows: 1 + + * - + - DDP + - FSDP + * - Memory (MB) + - 26’953 + - 11’578 + * - Iteration time (sec) + - 0.26 + - 0.36 + +---- + + +***************************** +Speed up model initialization +***************************** + +The standard practice in PyTorch is to put all model parameters into CPU memory first and then in a second step move them to the GPU device. +However, the larger the model the longer these two steps take. With the :meth:`~lightning.fabric.fabric.Fabric.init_module` context manager, you can initialize very large models quickly and reduce memory peaks. + +Before: + +.. code-block:: python + + # Slow: Places the model on CPU first + model = Transformer(vocab_size=dataset.vocab_size) + +After: + +.. 
code-block:: python + + # Fast: Creates the model on the GPU directly + with fabric.init_module(): + model = Transformer(vocab_size=dataset.vocab_size) + + +---- + + +****************************** +Optimize the sharding strategy +****************************** + +By default, FSDP will automatically shard 1) the model weights 2) the gradients during backward and 3) the optimizer states across all GPUs of the corresponding layers selected by the auto-wrap-policy. +You can configure the following options to trade-off memory for speed: + +.. code-block:: python + + strategy = FSDPStrategy( + # Default: Shard weights, gradients, optimizer state (1 + 2 + 3) + sharding_strategy="FULL_SHARD", + # Shard gradients, optimizer state (2 + 3) + sharding_strategy="SHARD_GRAD_OP", + # Don't shard anything (similar to DDP) + sharding_strategy="NO_SHARD", + ) + fabric = L.Fabric(..., strategy=strategy) + + +**Recipe for choosing a sharding strategy:** + +1. Try the default settings first (FULL_SHARD). This is the slowest but will save you the most memory. +2. Try SHARD_GRAD_OP. If you run out of memory, revert back to the default (FULL_SHARD). Otherwise you should expect to see an increase in iteration speed. + +| + +Here is the memory and speed impact for each option when configured in our example code: + +.. list-table:: + :widths: 25 25 25 25 25 + :header-rows: 1 + + * - + - DDP + - NO_SHARD + - SHARD_GRAD_OP + - FULL_SHARD + * - Memory (MB) + - 26’953 + - 23’181 + - 11’815 + - 11’578 + * - Iteration time (sec) + - 0.26 + - 0.30 + - 0.31 + - 0.36 + + +---- + + +************************** +Trade-off speed for memory +************************** + +If you are short on GPU memory because you are training large models with 10+ billion parameters or require extreme batch sizes, consider trading off speed for more memory by enabling activation checkpointing or CPU offload. 
+ + +Activation checkpointing +======================== + +Activations, the intermediate outputs of layers, are stored during the forward pass and needed during the backward pass to compute the gradients. +By enabling activation checkpointing, we can choose to discard and recompute selected layer activations dynamically during the backward pass when they are required, instead of storing them throughout the forward pass. +While this approach may slightly reduce training speed, it significantly reduces memory consumption. +The freed-up memory can then be allocated to increase the model's capacity or accommodate larger batch sizes, resulting in potential performance improvements. + +To enable activation checkpointing, pass in the list of layers to checkpoint. +This is typically your transformer block (including attention + feed-forward): + +.. code-block:: python + + strategy = FSDPStrategy( + # Enable activation checkpointing on these layers + activation_checkpointing_policy={ + nn.TransformerEncoderLayer, + nn.TransformerDecoderLayer, + }, + ) + fabric = L.Fabric(..., strategy=strategy) + + +Offload parameters to CPU +========================= + +The most drastic GPU memory savings can be achieved by offloading parameters to the CPU: + +.. code-block:: python + + # 1. Set `cpu_offload=True` + strategy = FSDPStrategy(..., cpu_offload=True) + fabric = L.Fabric(..., strategy=strategy) + + # 2. Set `move_to_device=False` (won't be required in future versions) + model, optimizer = fabric.setup(model, optimizer, move_to_device=False) + +The drawback is a much slower training speed due to the added communication between CPU and GPU for transferring parameters in every forward pass. +You should use this only if you have enough CPU memory and other scaling methods don’t give you enough memory savings. +In our example, we see a 4x memory saving, but a 10x increase in iteration time: + +.. 
list-table:: + :widths: 25 25 25 25 + :header-rows: 1 + + * - + - DDP + - FSDP + - FSDP + CPU offload + * - Memory (MB) + - 26’953 + - 11’578 + - 2’825 + * - Iteration time (sec) + - 0.26 + - 0.36 + - 3.24 + + +---- + + +***************** +Save a checkpoint +***************** + +Since training large models can be very expensive, it is best practice to include checkpointing logic into the training loop to save the progress periodically in case it gets interrupted unexpectedly. +Fabric offers a convenient and efficient method to save large model checkpoints and other state to a checkpoint file. +Simply add the following calls to your training loop: + +.. code-block:: python + + # 1. Define model, optimizer, and other training loop state + state = {"model": model, "optimizer": optimizer, "iter": iteration} + + # DON'T do this (inefficient): + # state = {"model": model.state_dict(), "optimizer": optimizer.state_dict(), ...} + + # 2. Save using Fabric's method + fabric.save("path/to/checkpoint/file", state) + + # DON'T do this (inefficient): + # torch.save(state, "path/to/checkpoint/file") + +To reduce memory peaks and speed up the saving to disk, each process/GPU will save its own file into a folder at the given path by default. +The resulting checkpoint folder will have this structure: + +.. code-block:: text + + path/to/checkpoint/file + ├── .metadata + ├── __0_0.distcp + ├── __1_0.distcp + └── meta.pt + +The “sharded” checkpoint format is the most efficient to save and load in Fabric. +However, if you prefer to have a single consolidated file instead, you can configure this by setting the ``state_dict_type`` flag in the strategy: + +.. 
code-block:: python + + # Default: Save individual files with state from each process + strategy = FSDPStrategy(state_dict_type="sharded") + + # Save a single, consolidated checkpoint file + strategy = FSDPStrategy(state_dict_type="full") + + +**Which checkpoint format should I use?** + +- ``state_dict_type="sharded"``: Use for pre-training very large models. It is fast and uses less memory, but it is less portable - you can’t easily load the checkpoint in raw PyTorch (in the future, Lightning will provide utilities to convert the checkpoint though). +- ``state_dict_type="full"``: Use when pre-training small to moderately large models (less than 10B parameters), when fine-tuning, and when portability is required. + + +---- + + +***************** +Load a checkpoint +***************** + +You can easily load checkpoints saved by Fabric to resume training: + +.. code-block:: python + + # 1. Define model, optimizer, and other training loop state + state = {"model": model, "optimizer": optimizer, "iter": iteration} + + # 2. Load using Fabric's method + fabric.load("path/to/checkpoint/file", state) + + # DON'T do this (inefficient): + # model.load_state_dict(torch.load("path/to/checkpoint/file")) + +Fabric will automatically recognize whether the provided path contains a checkpoint saved with ``state_dict_type="full"`` or ``state_dict_type="sharded"``. + +.. warning:: + + Loading a full-state checkpoint will replicate the file in CPU RAM for every GPU. + For very large checkpoints/models, you may run out of memory and your program will crash. + If this happens, save using the “sharded” checkpoint format instead (default). + + +---- + + +********************************** +Advanced performance optimizations +********************************** + +If you’ve reached a good understanding of how the different FSDP settings impact the memory usage and speed of your model, here are a few more to squeeze out the last bit of performance. 
+These settings really depend on the specific use cases, so you will have to turn them on and off to see the impact on your model. + +Overlap backward and optimizer’s step +===================================== + +Fabric provides a context manager that allows you to overlap the backward and optimizer step to save significant memory and speed up the iteration time too. +By overlapping the two, we eliminate the need to store all gradients at once in memory. +Instead, the optimizer step updates are applied directly during backward as gradients become available, and the memory for gradients is immediately freed up. + +Here is the recipe: + +.. code-block:: python + + # 1. Import the context manager + from lightning.fabric.strategies.fsdp import fsdp_overlap_step_with_backward + + # 2. Create one optimizer instance per parameter + optimizers = [torch.optim.Adam([p], ...) for p in model.parameters()] + model, *optimizers = fabric.setup(model, *optimizers) + + ... + + for i in range(max_iters): + loss = ... + + # 3. Instead of calling `optimizer.step()`, call `fabric.backward(loss)` + # within the context manager + with fsdp_overlap_step_with_backward(optimizers, model): + fabric.backward(loss) + + # optimizer.step() + + +.. collapse:: Full example + + .. 
code-block:: python + + import torch + import torch.nn as nn + import torch.nn.functional as F + + import lightning as L + from lightning.fabric.strategies.fsdp import FSDPStrategy, fsdp_overlap_step_with_backward + from lightning.pytorch.demos import Transformer, WikiText2 + + policy = {nn.TransformerEncoderLayer, nn.TransformerDecoderLayer} + strategy = FSDPStrategy(auto_wrap_policy=policy) + fabric = L.Fabric(accelerator="cuda", devices=2, strategy=strategy) + fabric.launch() + + fabric.seed_everything(42) + + with fabric.rank_zero_first(): + dataset = WikiText2() + + # 1B parameters + model = Transformer(vocab_size=dataset.vocab_size, nlayers=32, nhid=4096, ninp=1024, nhead=64) + optimizers = [torch.optim.Adam([p], lr=0.1) for p in model.parameters()] + + model, *optimizers = fabric.setup(model, *optimizers) + + for i in range(10): + input, target = fabric.to_device(dataset[i]) + output = model(input.unsqueeze(0), target.unsqueeze(0)) + loss = F.nll_loss(output, target.view(-1)) + + with fsdp_overlap_step_with_backward(optimizers, model): + fabric.backward(loss) + # no `optimizer.step()` here! + + fabric.print(loss.item()) + + fabric.print(torch.cuda.memory_summary()) + +| + +`Read the detailed blog post here `_. +Note that this feature cannot work with gradient accumulation! + + +Disable foreach in the optimizer +================================ + +The commonly used optimizers in PyTorch have a setting ``foreach=True|False`` that speeds up the parameter and state updates when enabled. +However, you might see a slight memory peak and the larger the model is, the more noticeable it can be. +Consider disabling the ``foreach`` option if undesired memory patterns occur: + +.. code-block:: python + + optimizer = torch.optim.AdamW(model.parameters(), foreach=False) + +`See the full list of optimizers that support this `_. + + +Limit all-gathers +================= + +If you are running training close to the max. 
+GPU memory limit, you might be getting so-called CUDA malloc retries. +This is essentially the GPU running out of memory but before crashing completely, it tries to find some unused or cached memory it can free. +When they happen frequently, these retries can have a significant impact on speed. +Normally, you would decrease the batch size slightly to avoid it. +With FSDP, you have one more knob you can tweak to combat the issue, by setting ``limit_all_gathers=True``: + +.. code-block:: python + + strategy = FSDPStrategy( + # Default: The CPU will schedule the transfer of weights between GPUs + # at will, sometimes too aggressively + limit_all_gathers=False, + # Enable this if you are close to the max. GPU memory usage + limit_all_gathers=True, + ) + fabric = L.Fabric(..., strategy=strategy) + +You can monitor CUDA malloc retries in the output of ``torch.cuda.memory_summary()`` for example, or through the PyTorch profiler. diff --git a/docs/source-fabric/advanced/multiple_setup.rst b/docs/source-fabric/advanced/multiple_setup.rst new file mode 100644 index 0000000..1ecdcc9 --- /dev/null +++ b/docs/source-fabric/advanced/multiple_setup.rst @@ -0,0 +1,116 @@ +:orphan: + +############################## +Multiple Models and Optimizers +############################## + +Fabric makes it very easy to work with multiple models and/or optimizers at once in your training workflow. +Examples of where this comes in handy are Generative Adversarial Networks (GANs), Auto-encoders, meta-learning and more. + + +---- + +************************ +One model, one optimizer +************************ + +Fabric has a simple guideline you should follow: +If you have an optimizer, you should set it up together with the model to make your code truly strategy-agnostic. + +.. 
code-block:: python + + import torch + from lightning.fabric import Fabric + + fabric = Fabric() + + # Instantiate model and optimizer + model = LitModel() + optimizer = torch.optim.Adam(model.parameters()) + + # Set up the model and optimizer together + model, optimizer = fabric.setup(model, optimizer) + + +Depending on the selected strategy, the :meth:`~lightning.fabric.fabric.Fabric.setup` method will wrap and link the model with the optimizer. + + +---- + + +****************************** +One model, multiple optimizers +****************************** + +You can also have multiple optimizers over a single model. +This is useful if you need specific optimizers or learning rates for parts of the model. + +.. code-block:: python + + # Instantiate model and optimizers + model = LitModel() + optimizer1 = torch.optim.SGD(model.layer1.parameters(), lr=0.003) + optimizer2 = torch.optim.SGD(model.layer2.parameters(), lr=0.01) + + # Set up the model and optimizers together + model, optimizer1, optimizer2 = fabric.setup(model, optimizer1, optimizer2) + + + +---- + + +****************************** +Multiple models, one optimizer +****************************** + +Using a single optimizer to update multiple models is possible too. +The best way to do this is to group all your individual models under one top level ``nn.Module``: + +.. code-block:: python + + class AutoEncoder(torch.nn.Module): + def __init__(self): + super().__init__() + + # Group all models under a common nn.Module + self.encoder = Encoder() + self.decoder = Decoder() + +Now all of these models can be treated as a single one: + +.. code-block:: python + + # Instantiate the big model + autoencoder = AutoEncoder() + optimizer = ... 
+ + # Set up the model(s) and optimizer together + autoencoder, optimizer = fabric.setup(autoencoder, optimizer) + + +---- + + +************************************ +Multiple models, multiple optimizers +************************************ + +You can pair up as many models and optimizers as you want. For example, two models with one optimizer each: + +.. code-block:: python + + # Two models + generator = Generator() + discriminator = Discriminator() + + # Two optimizers + optimizer_gen = torch.optim.SGD(generator.parameters(), lr=0.01) + optimizer_dis = torch.optim.SGD(discriminator.parameters(), lr=0.001) + + # Set up generator + generator, optimizer_gen = fabric.setup(generator, optimizer_gen) + # Set up discriminator + discriminator, optimizer_dis = fabric.setup(discriminator, optimizer_dis) + +For a full example of this use case, see our `GAN example `_. diff --git a/docs/source-fabric/api/accelerators.rst b/docs/source-fabric/api/accelerators.rst new file mode 100644 index 0000000..7e8444d --- /dev/null +++ b/docs/source-fabric/api/accelerators.rst @@ -0,0 +1,22 @@ +.. include:: ../links.rst + +############################# +lightning.fabric.accelerators +############################# + + +Accelerators +^^^^^^^^^^^^ + +.. currentmodule:: lightning.fabric.accelerators + +.. autosummary:: + :toctree: ./generated + :nosignatures: + :template: classtemplate.rst + + Accelerator + CPUAccelerator + CUDAAccelerator + MPSAccelerator + XLAAccelerator diff --git a/docs/source-fabric/api/collectives.rst b/docs/source-fabric/api/collectives.rst new file mode 100644 index 0000000..21a7734 --- /dev/null +++ b/docs/source-fabric/api/collectives.rst @@ -0,0 +1,23 @@ +.. include:: ../links.rst + +#################################### +lightning.fabric.plugins.collectives +#################################### + +.. warning:: + This is an `experimental `__ feature. + + +Collectives +^^^^^^^^^^^ + +.. currentmodule:: lightning.fabric.plugins.collectives + +.. 
autosummary:: + :toctree: ./generated + :nosignatures: + :template: classtemplate.rst + + Collective + TorchCollective + SingleDeviceCollective diff --git a/docs/source-fabric/api/environments.rst b/docs/source-fabric/api/environments.rst new file mode 100644 index 0000000..f824ed8 --- /dev/null +++ b/docs/source-fabric/api/environments.rst @@ -0,0 +1,25 @@ +.. include:: ../links.rst + +##################################### +lightning.fabric.plugins.environments +##################################### + + +Environments +^^^^^^^^^^^^ + +.. currentmodule:: lightning.fabric.plugins.environments + +.. autosummary:: + :toctree: ./generated + :nosignatures: + :template: classtemplate_noindex.rst + + ~cluster_environment.ClusterEnvironment + ~kubeflow.KubeflowEnvironment + ~lightning.LightningEnvironment + ~lsf.LSFEnvironment + ~mpi.MPIEnvironment + ~slurm.SLURMEnvironment + ~torchelastic.TorchElasticEnvironment + ~xla.XLAEnvironment diff --git a/docs/source-fabric/api/fabric.rst b/docs/source-fabric/api/fabric.rst new file mode 100644 index 0000000..41036e3 --- /dev/null +++ b/docs/source-fabric/api/fabric.rst @@ -0,0 +1,18 @@ +.. include:: ../links.rst + +####################### +lightning.fabric.Fabric +####################### + + +Fabric +^^^^^^ + +.. currentmodule:: lightning.fabric.fabric + +.. autosummary:: + :toctree: ./generated + :nosignatures: + :template: classtemplate.rst + + Fabric diff --git a/docs/source-fabric/api/fabric_args.rst b/docs/source-fabric/api/fabric_args.rst new file mode 100644 index 0000000..b285fc2 --- /dev/null +++ b/docs/source-fabric/api/fabric_args.rst @@ -0,0 +1,228 @@ +################ +Fabric Arguments +################ + + +accelerator +=========== + +Choose one of ``"cpu"``, ``"gpu"``, ``"tpu"``, ``"auto"``. + +.. 
code-block:: python + + # CPU accelerator + fabric = Fabric(accelerator="cpu") + + # Running with GPU Accelerator using 2 GPUs + fabric = Fabric(devices=2, accelerator="gpu") + + # Running with TPU Accelerator using 8 TPU cores + fabric = Fabric(devices=8, accelerator="tpu") + + # Running with GPU Accelerator using the DistributedDataParallel strategy + fabric = Fabric(devices=4, accelerator="gpu", strategy="ddp") + +The ``"auto"`` option recognizes the machine you are on and selects the available accelerator. + +.. code-block:: python + + # If your machine has GPUs, it will use the GPU Accelerator + fabric = Fabric(devices=2, accelerator="auto") + + +See also: :doc:`../fundamentals/accelerators` + + +strategy +======== + +Choose a training strategy: ``"dp"``, ``"ddp"``, ``"ddp_spawn"``, ``"xla"``, ``"deepspeed"``, ``"fsdp"``. + +.. code-block:: python + + # Running with the DistributedDataParallel strategy on 4 GPUs + fabric = Fabric(strategy="ddp", accelerator="gpu", devices=4) + + # Running with the DDP Spawn strategy using 4 CPU processes + fabric = Fabric(strategy="ddp_spawn", accelerator="cpu", devices=4) + + +Additionally, you can pass in your custom strategy by configuring additional parameters. + +.. code-block:: python + + from lightning.fabric.strategies import DeepSpeedStrategy + + fabric = Fabric(strategy=DeepSpeedStrategy(stage=2), accelerator="gpu", devices=2) + +See also: :doc:`../fundamentals/launch` + + +devices +======= + +Configure the devices to run on. Can be of type: + +- int: the number of devices (e.g., GPUs) to train on +- list of int: which device index (e.g., GPU ID) to train on (0-indexed) +- str: a string representation of one of the above + +.. 
code-block:: python + + # default used by Fabric, i.e., use the CPU + fabric = Fabric(devices=None) + + # equivalent + fabric = Fabric(devices=0) + + # int: run on two GPUs + fabric = Fabric(devices=2, accelerator="gpu") + + # list: run on the 2nd (idx 1) and 5th (idx 4) GPUs (by bus ordering) + fabric = Fabric(devices=[1, 4], accelerator="gpu") + fabric = Fabric(devices="1, 4", accelerator="gpu") # equivalent + + # -1: run on all GPUs + fabric = Fabric(devices=-1, accelerator="gpu") + fabric = Fabric(devices="-1", accelerator="gpu") # equivalent + +See also: :doc:`../fundamentals/launch` + + +num_nodes +========= + + +The number of cluster nodes for distributed operation. + +.. code-block:: python + + # Default used by Fabric + fabric = Fabric(num_nodes=1) + + # Run on 8 nodes + fabric = Fabric(num_nodes=8) + + +Learn more about :ref:`distributed multi-node training on clusters `. + + +precision +========= + +There are two different techniques to set the precision: "True" precision and "Mixed" precision. +For an extensive guide into their differences, please see: :doc:`../fundamentals/precision` + +Fabric supports doing floating point operations in 64-bit precision ("double"), 32-bit precision ("full"), or 16-bit precision ("half", with both regular and `bfloat16 `_). +The selected precision will have a direct impact on the performance and memory usage based on your hardware. +Automatic mixed precision settings are denoted by a ``"-mixed"`` suffix, while "true" precision settings have a ``"-true"`` suffix: + +.. 
code-block:: python + + # Default used by the Fabric + fabric = Fabric(precision="32-true", devices=1) + + # the same as: + fabric = Fabric(precision="32", devices=1) + + # 16-bit mixed precision (model weights remain in torch.float32) + fabric = Fabric(precision="16-mixed", devices=1) + + # 16-bit bfloat mixed precision (model weights remain in torch.float32) + fabric = Fabric(precision="bf16-mixed", devices=1) + + # 8-bit mixed precision via TransformerEngine (model weights remain in torch.float32) + fabric = Fabric(precision="transformer-engine", devices=1) + + # 16-bit precision (model weights get cast to torch.float16) + fabric = Fabric(precision="16-true", devices=1) + + # 16-bit bfloat precision (model weights get cast to torch.bfloat16) + fabric = Fabric(precision="bf16-true", devices=1) + + # 64-bit (double) precision (model weights get cast to torch.float64) + fabric = Fabric(precision="64-true", devices=1) + + +plugins +======= + +Plugins allow you to connect arbitrary backends, precision libraries, clusters, etc. For example: +To define your own behavior, subclass the relevant class and pass it in. Here's an example linking up your own +:class:`~lightning.fabric.plugins.environments.ClusterEnvironment`. + +.. code-block:: python + + from lightning.fabric.plugins.environments import ClusterEnvironment + + + class MyCluster(ClusterEnvironment): + @property + def main_address(self): + return your_main_address + + @property + def main_port(self): + return your_main_port + + def world_size(self): + return the_world_size + + + fabric = Fabric(plugins=[MyCluster()], ...) + + +callbacks +========= + +A callback class is a collection of methods that the training loop can call at a specific time, for example, at the end of an epoch. +Add callbacks to Fabric to inject logic into your training loop from an external callback class. + +.. code-block:: python + + class MyCallback: + def on_train_epoch_end(self, results): + ... 
+ +You can then register this callback or multiple ones directly in Fabric: + +.. code-block:: python + + fabric = Fabric(callbacks=[MyCallback()]) + + +Then, in your training loop, you can call a hook by its name. Any callback objects that have this hook will execute it: + +.. code-block:: python + + # Call any hook by name + fabric.call("on_train_epoch_end", results={...}) + +See also: :doc:`../guide/callbacks` + + +loggers +======= + +Attach one or several loggers/experiment trackers to Fabric for convenient metrics logging. + +.. code-block:: python + + # Default used by Fabric; no loggers are active + fabric = Fabric(loggers=[]) + + # Log to a single logger + fabric = Fabric(loggers=TensorBoardLogger(...)) + + # Or multiple instances + fabric = Fabric(loggers=[logger1, logger2, ...]) + +Anywhere in your training loop, you can log metrics to all loggers at once: + +.. code-block:: python + + fabric.log("loss", loss) + fabric.log_dict({"loss": loss, "accuracy": acc}) + + +See also: :doc:`../guide/logging` diff --git a/docs/source-fabric/api/fabric_methods.rst b/docs/source-fabric/api/fabric_methods.rst new file mode 100644 index 0000000..9411966 --- /dev/null +++ b/docs/source-fabric/api/fabric_methods.rst @@ -0,0 +1,429 @@ +############## +Fabric Methods +############## + +launch +====== + +With :meth:`~lightning.fabric.fabric.Fabric.launch` you can conveniently launch your script or a function +into multiple processes for distributed training on a single machine. + +.. code-block:: python + + # Launch the script on 2 devices and init distributed backend + fabric = Fabric(devices=2) + fabric.launch() + +The same can be done with code inside a function: + +.. code-block:: python + + def run(fabric): + # Your distributed code here + ... 
+ + + # Launch a function on 2 devices and init distributed backend + fabric = Fabric(devices=2) + fabric.launch(run) + +For example, you can use the latter for multi-GPU training inside a :doc:`Jupyter notebook <../fundamentals/notebooks>`. +For launching distributed training with the CLI, multi-node cluster, or cloud, see :doc:`../fundamentals/launch`. + +setup +===== + +Set up a model and corresponding optimizer(s). If you need to set up multiple models, call ``setup()`` on each of them. +Moves the model and optimizer to the correct device automatically. + +.. code-block:: python + + model = nn.Linear(32, 64) + optimizer = torch.optim.SGD(model.parameters(), lr=0.001) + + # Set up model and optimizer for accelerated training + model, optimizer = fabric.setup(model, optimizer) + + # If you don't want Fabric to set the device + model, optimizer = fabric.setup(model, optimizer, move_to_device=False) + + +The setup method also prepares the model for the selected precision choice so that operations during ``forward()`` get +cast automatically. + +setup_dataloaders +================= + +Set up one or multiple data loaders for accelerated operation. If you run a distributed strategy (e.g., DDP), Fabric +automatically replaces the sampler. In addition, the data loader will be configured to move the returned +data tensors to the correct device automatically. + +.. code-block:: python + + train_data = torch.utils.data.DataLoader(train_dataset, ...) + test_data = torch.utils.data.DataLoader(test_dataset, ...) 
+ + train_data, test_data = fabric.setup_dataloaders(train_data, test_data) + + # If you don't want Fabric to move the data to the device + train_data, test_data = fabric.setup_dataloaders(train_data, test_data, move_to_device=False) + + # If you don't want Fabric to replace the sampler in the context of distributed training + train_data, test_data = fabric.setup_dataloaders(train_data, test_data, use_distributed_sampler=False) + + +backward +======== + +This replaces any occurrences of ``loss.backward()`` and makes your code accelerator and precision agnostic. + +.. code-block:: python + + output = model(input) + loss = loss_fn(output, target) + + # loss.backward() + fabric.backward(loss) + + +clip_gradients +============== + +Clip the gradients of the model to a given max value or max norm. +This is useful if your model experiences *exploding gradients* during training. + +.. code-block:: python + + # Clip gradients to a max value of +/- 0.5 + fabric.clip_gradients(model, optimizer, clip_val=0.5) + + # Clip gradients such that their total norm is no bigger than 2.0 + fabric.clip_gradients(model, optimizer, max_norm=2.0) + + # By default, clipping by norm uses the 2-norm + fabric.clip_gradients(model, optimizer, max_norm=2.0, norm_type=2) + + # You can also choose the infinity-norm, which clips the largest + # element among all + fabric.clip_gradients(model, optimizer, max_norm=2.0, norm_type="inf") + +The :meth:`~lightning.fabric.fabric.Fabric.clip_gradients` method is agnostic to the precision and strategy being used. +Note: Gradient clipping with FSDP is not yet fully supported. + + +to_device +========= + +Use :meth:`~lightning.fabric.fabric.Fabric.to_device` to move models, tensors, or collections of tensors to +the current device. 
By default :meth:`~lightning.fabric.fabric.Fabric.setup` and +:meth:`~lightning.fabric.fabric.Fabric.setup_dataloaders` already move the model and data to the correct +device, so calling this method is only necessary for manual operation when needed. + +.. code-block:: python + + data = torch.load("dataset.pt") + data = fabric.to_device(data) + + +seed_everything +=============== + +Make your code reproducible by calling this method at the beginning of your run. + +.. code-block:: python + + # Instead of `torch.manual_seed(...)`, call: + fabric.seed_everything(1234) + + +This covers PyTorch, NumPy, and Python random number generators. In addition, Fabric takes care of properly initializing +the seed of data loader worker processes (can be turned off by passing ``workers=False``). + +init_module +=========== + +Instantiating a ``nn.Module`` in PyTorch creates all parameters on CPU in float32 precision by default. +To speed up initialization, you can force PyTorch to create the model directly on the target device and with the desired precision without changing your model code. + +.. code-block:: python + + fabric = Fabric(accelerator="cuda", precision="16-true") + + with fabric.init_module(): + # models created here will be on GPU and in float16 + model = MyModel() + +This eliminates the waiting time to transfer the model parameters from the CPU to the device. +For strategies that handle large sharded models (FSDP, DeepSpeed), the :meth:`~lightning.fabric.fabric.Fabric.init_module` method will allocate the model parameters on the meta device first before sharding. +This makes it possible to work with models that are larger than the memory of a single device. + +When loading a model from a checkpoint, for example when fine-tuning, set ``empty_init=True`` to avoid expensive +and redundant memory initialization: + +.. 
code-block:: python + + with fabric.init_module(empty_init=True): + # creation of the model is very fast + # and depending on the strategy allocates no memory, or uninitialized memory + model = MyModel() + + # weights get loaded into the model + model.load_state_dict(checkpoint["state_dict"]) + + +autocast +======== + +Let the precision backend autocast the block of code under this context manager. This is optional and already done by +Fabric for the model's forward method (once the model was :meth:`~lightning.fabric.fabric.Fabric.setup`). +You need this only if you wish to autocast more operations outside the ones in model forward: + +.. code-block:: python + + model, optimizer = fabric.setup(model, optimizer) + + # Fabric handles precision automatically for the model + output = model(inputs) + + with fabric.autocast(): # optional + loss = loss_function(output, target) + + fabric.backward(loss) + ... + +See also: :doc:`../fundamentals/precision` + + +print +===== + +Print to the console via the built-in print function, but only on the main process. +This avoids excessive printing and logs when running on multiple devices/nodes. + + +.. code-block:: python + + # Print only on the main process + fabric.print(f"{epoch}/{num_epochs}| Train Epoch Loss: {loss}") + + +save +==== + +Save the state of objects to a checkpoint file. +Replaces all occurrences of ``torch.save(...)`` in your code. +Fabric will handle the saving part correctly, whether running a single device, multi-devices, or multi-nodes. + +.. code-block:: python + + # Define the state of your program/loop + state = { + "model1": model1, + "model2": model2, + "optimizer": optimizer, + "iteration": iteration, + } + + # Instead of `torch.save(...)` + fabric.save("path/to/checkpoint.ckpt", state) + +You should pass the model and optimizer objects directly into the dictionary so Fabric can unwrap them and automatically retrieve their *state-dict*. 
+ +See also: :doc:`../guide/checkpoint` + + +load +==== + +Load checkpoint contents from a file and restore the state of objects in your program. +Replaces all occurrences of ``torch.load(...)`` in your code. +Fabric will handle the loading part correctly, whether running a single device, multi-device, or multi-node. + +.. code-block:: python + + # Define the state of your program/loop + state = { + "model1": model1, + "model2": model2, + "optimizer": optimizer, + "iteration": iteration, + } + + # Restore the state of objects (in-place) + fabric.load("path/to/checkpoint.ckpt", state) + + # Or load everything and restore your objects manually + checkpoint = fabric.load("./checkpoints/version_2/checkpoint.ckpt") + model.load_state_dict(checkpoint["model"]) + ... + + +To load the state of your model or optimizer from a raw PyTorch checkpoint (not saved with Fabric), use :meth:`~lightning.fabric.fabric.Fabric.load_raw` instead. +See also: :doc:`../guide/checkpoint` + + +load_raw +======== + +Load the state-dict of a model or optimizer from a raw PyTorch checkpoint not saved by Fabric. + +.. code-block:: python + + model = MyModel() + + # A model weights file saved by your friend who doesn't use Fabric + fabric.load_raw("path/to/model.pt", model) + + # Equivalent to this: + # model.load_state_dict(torch.load("path/to/model.pt")) + + +See also: :doc:`../guide/checkpoint` + + +barrier +======= + +Call this if you want all processes to wait and synchronize. Once all processes have entered this call, +execution continues. Useful for example, when you want to download data on one process and make all others wait until +the data is written to disk. + +.. code-block:: python + + if fabric.global_rank == 0: + print("Downloading dataset. 
This can take a while ...") + download_dataset("http://...") + + # All other processes wait here until rank 0 is done with downloading: + fabric.barrier() + + # After everyone reached the barrier, they can access the downloaded files: + load_dataset() + +See also: :doc:`../advanced/distributed_communication` + + +all_gather, all_reduce, broadcast +================================= + +You can send tensors and other data between processes using collective operations. +The three most common ones, :meth:`~lightning.fabric.fabric.Fabric.broadcast`, :meth:`~lightning.fabric.fabric.Fabric.all_gather` and :meth:`~lightning.fabric.fabric.Fabric.all_reduce` are available directly on the Fabric object for convenience: + +- :meth:`~lightning.fabric.fabric.Fabric.broadcast`: Send a tensor from one process to all others. +- :meth:`~lightning.fabric.fabric.Fabric.all_gather`: Gather tensors from every process and stack them. +- :meth:`~lightning.fabric.fabric.Fabric.all_reduce`: Apply a reduction function on tensors across processes (sum, mean, etc.). + +.. code-block:: python + + # Send the value of a tensor from rank 0 to all others + result = fabric.broadcast(tensor, src=0) + + # Every process gets the stack of tensors from everybody else + all_tensors = fabric.all_gather(tensor) + + # Sum a tensor across processes (everyone gets the result) + reduced_tensor = fabric.all_reduce(tensor, reduce_op="sum") + + # Also works with a collection of tensors (dict, list, tuple): + collection = {"loss": torch.tensor(...), "data": ...} + gathered_collection = fabric.all_gather(collection, ...) + reduced_collection = fabric.all_reduce(collection, ...) + + +.. important:: + + Every process needs to enter the collective calls, and tensors need to have the same shape across all processes. + Otherwise, the program will hang! + +Learn more about :doc:`distributed communication <../advanced/distributed_communication>`. 
+ + +no_backward_sync +================ + +Use this context manager when performing gradient accumulation and using a distributed strategy (e.g., DDP). +It will speed up your training loop by cutting redundant communication between processes during the accumulation phase. + +.. code-block:: python + + # Accumulate gradient 8 batches at a time + is_accumulating = batch_idx % 8 != 0 + + with fabric.no_backward_sync(model, enabled=is_accumulating): + output = model(input) + loss = ... + fabric.backward(loss) + ... + + # Step the optimizer every 8 batches + if not is_accumulating: + optimizer.step() + optimizer.zero_grad() + +Both the model's `.forward()` and the `fabric.backward()` call need to run under this context as shown in the example above. +For single-device strategies, it is a no-op. Some strategies don't support this: + +- deepspeed +- dp +- xla + +For these, the context manager falls back to a no-op and emits a warning. + + +call +==== + +Use this to run all registered callback hooks with a given name and inputs. +It is useful when building a Trainer that allows the user to run arbitrary code at fixed points in the training loop. + +.. code-block:: python + + class MyCallback: + def on_train_start(self): + ... + + def on_train_epoch_end(self, model, results): + ... + + + fabric = Fabric(callbacks=[MyCallback()]) + + # Call any hook by name + fabric.call("on_train_start") + + # Pass in additional arguments that the hook requires + fabric.call("on_train_epoch_end", model=..., results={...}) + + # Only the callbacks that have this method defined will be executed + fabric.call("undefined") + + +See also: :doc:`../guide/callbacks` + + +log and log_dict +================ + +These methods allow you to send scalar metrics to a logger registered in Fabric. + +.. 
code-block:: python + + # Set the logger in Fabric + fabric = Fabric(loggers=TensorBoardLogger(...)) + + # Anywhere in your training loop or model: + fabric.log("loss", loss) + + # Or send multiple metrics at once: + fabric.log_dict({"loss": loss, "accuracy": acc}) + +If no loggers are given to Fabric (default), ``log`` and ``log_dict`` won't do anything. +Here is what's happening under the hood (pseudo code) when you call ``.log()`` or ``log_dict``: + +.. code-block:: python + + # When you call .log() or .log_dict(), we do this: + for logger in fabric.loggers: + logger.log_metrics(metrics=metrics, step=step) + +See also: :doc:`../guide/logging` diff --git a/docs/source-fabric/api/io.rst b/docs/source-fabric/api/io.rst new file mode 100644 index 0000000..8253a4b --- /dev/null +++ b/docs/source-fabric/api/io.rst @@ -0,0 +1,24 @@ +.. include:: ../links.rst + +########################### +lightning.fabric.plugins.io +########################### + + +.. warning:: + This is an `experimental `__ feature. + + +IO +^^ + +.. currentmodule:: lightning.fabric.plugins.io + +.. autosummary:: + :toctree: ./generated + :nosignatures: + :template: classtemplate.rst + + ~checkpoint_io.CheckpointIO + ~torch_io.TorchCheckpointIO + ~xla.XLACheckpointIO diff --git a/docs/source-fabric/api/loggers.rst b/docs/source-fabric/api/loggers.rst new file mode 100644 index 0000000..3c4936c --- /dev/null +++ b/docs/source-fabric/api/loggers.rst @@ -0,0 +1,20 @@ +.. include:: ../links.rst + +######################## +lightning.fabric.loggers +######################## + + +Loggers +^^^^^^^ + +.. currentmodule:: lightning.fabric.loggers + +.. autosummary:: + :toctree: ./generated + :nosignatures: + :template: classtemplate.rst + + Logger + CSVLogger + TensorBoardLogger diff --git a/docs/source-fabric/api/precision.rst b/docs/source-fabric/api/precision.rst new file mode 100644 index 0000000..b48d397 --- /dev/null +++ b/docs/source-fabric/api/precision.rst @@ -0,0 +1,25 @@ +.. 
include:: ../links.rst + +################################## +lightning.fabric.plugins.precision +################################## + + +Precision +^^^^^^^^^ + +.. TODO(fabric): include DeepSpeedPrecision + +.. currentmodule:: lightning.fabric.plugins.precision + +.. autosummary:: + :toctree: ./generated + :nosignatures: + :template: classtemplate.rst + + Precision + DoublePrecision + MixedPrecision + XLAPrecision + XLABf16Precision + FSDPPrecision diff --git a/docs/source-fabric/api/strategies.rst b/docs/source-fabric/api/strategies.rst new file mode 100644 index 0000000..3547483 --- /dev/null +++ b/docs/source-fabric/api/strategies.rst @@ -0,0 +1,26 @@ +.. include:: ../links.rst + +########################### +lightning.fabric.strategies +########################### + + +Strategies +^^^^^^^^^^ + +.. TODO(fabric): include DeepSpeedStrategy, XLAStrategy + +.. currentmodule:: lightning.fabric.strategies + +.. autosummary:: + :toctree: ./generated + :nosignatures: + :template: classtemplate.rst + + Strategy + DDPStrategy + DataParallelStrategy + FSDPStrategy + ParallelStrategy + SingleDeviceStrategy + SingleDeviceXLAStrategy diff --git a/docs/source-fabric/conf.py b/docs/source-fabric/conf.py new file mode 100644 index 0000000..5c6028f --- /dev/null +++ b/docs/source-fabric/conf.py @@ -0,0 +1,383 @@ +# Configuration file for the Sphinx documentation builder. +# +# This file does only contain a selection of the most common options. For a +# full list see the documentation: +# http://www.sphinx-doc.org/en/master/config + +# -- Path setup -------------------------------------------------------------- + +# If extensions (or modules to document with autodoc) are in another directory, +# add these directories to sys.path here. If the directory is relative to the +# documentation root, use os.path.abspath to make it absolute, like shown here. 
+ +import glob +import inspect +import os +import shutil +import sys + +import pt_lightning_sphinx_theme +from lightning_utilities.docs import fetch_external_assets + +import lightning + +_PATH_HERE = os.path.abspath(os.path.dirname(__file__)) +_PATH_ROOT = os.path.realpath(os.path.join(_PATH_HERE, "..", "..")) +sys.path.insert(0, os.path.abspath(_PATH_ROOT)) + +SPHINX_MOCK_REQUIREMENTS = int(os.environ.get("SPHINX_MOCK_REQUIREMENTS", True)) + +# -- Project information ----------------------------------------------------- + +# this name shall match the project name in Github as it is used for linking to code +project = "lightning" +copyright = lightning.__copyright__ +author = lightning.__author__ + +# The short X.Y version +version = lightning.__version__ +# The full version, including alpha/beta/rc tags +release = lightning.__version__ + +# Options for the linkcode extension +# ---------------------------------- +github_user = "Lightning-AI" +github_repo = project + +# -- Project documents ------------------------------------------------------- + +fetch_external_assets( + docs_folder=_PATH_HERE, + assets_folder="_static/fetched-s3-assets", + retrieve_pattern=r"https?://[-a-zA-Z0-9_]+\.s3\.[-a-zA-Z0-9()_\\+.\\/=]+", +) + +# -- General configuration --------------------------------------------------- + +# If your documentation needs a minimal Sphinx version, state it here. + +needs_sphinx = "4.5" + +# Add any Sphinx extension module names here, as strings. They can be +# extensions coming with Sphinx (named 'sphinx.ext.*') or your custom +# ones. +extensions = [ + "sphinx.ext.autodoc", + "sphinx.ext.doctest", + "sphinx.ext.intersphinx", + "sphinx_toolbox.collapse", + "sphinx.ext.todo", + "sphinx.ext.coverage", + "sphinx.ext.viewcode", + "sphinx.ext.autosummary", + "sphinx.ext.napoleon", + "sphinx.ext.imgmath", + "sphinx.ext.autosectionlabel", + # 'sphinxcontrib.mockautodoc', # raises error: directive 'automodule' is already registered ... 
+ # 'sphinxcontrib.fulltoc', # breaks pytorch-theme with unexpected kw argument 'titles_only' + "sphinxcontrib.video", + "myst_parser", + "sphinx_autodoc_typehints", + "sphinx_copybutton", + "sphinx_paramlinks", + "sphinx_togglebutton", + # "lai_sphinx_theme.extensions.lightning", + "pt_lightning_sphinx_theme.extensions.lightning", +] + +# Add any paths that contain templates here, relative to this directory. +templates_path = ["_templates"] + +# myst-parser, forcing to parse all html pages with mathjax +# https://github.com/executablebooks/MyST-Parser/issues/394 +myst_update_mathjax = False +# https://myst-parser.readthedocs.io/en/latest/syntax/optional.html?highlight=anchor#auto-generated-header-anchors +myst_heading_anchors = 3 + +# https://berkeley-stat159-f17.github.io/stat159-f17/lectures/14-sphinx..html#conf.py-(cont.) +# https://stackoverflow.com/questions/38526888/embed-ipython-notebook-in-sphinx-document +# I execute the notebooks manually in advance. If notebooks test the code, +# they should be run at build time. +nbsphinx_execute = "never" +nbsphinx_allow_errors = True +nbsphinx_requirejs_path = "" + +# The suffix(es) of source filenames. +# You can specify multiple suffix as a list of string: +# +# source_suffix = ['.rst', '.md'] +# source_suffix = ['.rst', '.md', '.ipynb'] +source_suffix = { + ".rst": "restructuredtext", + ".txt": "markdown", + ".md": "markdown", + ".ipynb": "nbsphinx", +} + +# The master toctree document. +master_doc = "index" + +# The language for content autogenerated by Sphinx. Refer to documentation +# for a list of supported languages. +# +# This is also used if you do content translation via gettext catalogs. +# Usually you set "language" from the command line for these cases. +language = "en" + +# List of patterns, relative to source directory, that match files and +# directories to ignore when looking for source files. +# This pattern also affects html_static_path and html_extra_path. 
+exclude_patterns = [ + "PULL_REQUEST_TEMPLATE.md", + "**/README.md/*", + "readme.md", + "_templates", + "code_samples/convert_pl_to_app/requirements.txt", + "**/_static/*", +] + +# The name of the Pygments (syntax highlighting) style to use. +pygments_style = None + +# -- Options for HTML output ------------------------------------------------- + +# The theme to use for HTML and HTML Help pages. See the documentation for +# a list of builtin themes. +# +# html_theme = "lai_sphinx_theme" +html_theme = "pt_lightning_sphinx_theme" +html_theme_path = [os.environ.get("LIT_SPHINX_PATH", pt_lightning_sphinx_theme.get_html_theme_path())] + +# Theme options are theme-specific and customize the look and feel of a theme +# further. For a list of options available for each theme, see the +# documentation. + +html_theme_options = { + "pytorch_project": lightning.__homepage__, + "analytics_id": "G-D3Q2ESCTZR", + "canonical_url": lightning.__homepage__, + "collapse_navigation": False, + "display_version": True, + "logo_only": False, +} + +html_favicon = "_static/images/icon.svg" + +# Add any paths that contain custom static files (such as style sheets) here, +# relative to this directory. They are copied after the builtin static files, +# so a file named "default.css" will overwrite the builtin "default.css". +html_static_path = ["_templates", "_static"] + +# Custom sidebar templates, must be a dictionary that maps document names +# to template names. +# +# The default sidebars (for documents that don't match any pattern) are +# defined by theme itself. Builtin themes are using these templates by +# default: ``['localtoc.html', 'relations.html', 'sourcelink.html', +# 'searchbox.html']``. +# +# html_sidebars = {} + +# -- Options for HTMLHelp output --------------------------------------------- + +# Output file base name for HTML help builder. 
+htmlhelp_basename = project + "-doc" + +# -- Options for LaTeX output ------------------------------------------------ + +latex_elements = { + # The paper size ('letterpaper' or 'a4paper'). + # 'papersize': 'letterpaper', + # The font size ('10pt', '11pt' or '12pt'). + # 'pointsize': '10pt', + # Additional stuff for the LaTeX preamble. + # 'preamble': '', + # Latex figure (float) alignment + "figure_align": "htbp", +} + +# Grouping the document tree into LaTeX files. List of tuples +# (source start file, target name, title, +# author, documentclass [howto, manual, or own class]). +latex_documents = [ + (master_doc, project + ".tex", project + " Documentation", author, "manual"), +] + +# -- Options for manual page output ------------------------------------------ + +# One entry per manual page. List of tuples +# (source start file, name, description, authors, manual section). +man_pages = [(master_doc, project, project + " Documentation", [author], 1)] + +# -- Options for Texinfo output ---------------------------------------------- + +# Grouping the document tree into Texinfo files. List of tuples +# (source start file, target name, title, author, +# dir menu entry, description, category) +texinfo_documents = [ + ( + master_doc, + project, + project + " Documentation", + author, + project, + lightning.__docs__, + "Miscellaneous", + ), +] + +# -- Options for Epub output ------------------------------------------------- + +# Bibliographic Dublin Core info. +epub_title = project + +# The unique identifier of the text. This can be a ISBN number +# or the project homepage. +# +# epub_identifier = '' + +# A unique identification for the text. +# +# epub_uid = '' + +# A list of files that should not be packed into the epub file. 
epub_exclude_files = ["search.html"]

# -- Extension configuration -------------------------------------------------

# -- Options for intersphinx extension ---------------------------------------

# Example configuration for intersphinx: refer to the Python standard library.
intersphinx_mapping = {
    "python": ("https://docs.python.org/3", None),
    "torch": ("https://pytorch.org/docs/stable/", None),
    "pytorch_lightning": ("https://lightning.ai/docs/pytorch/stable/", None),
}

# -- Options for todo extension ----------------------------------------------

# If true, `todo` and `todoList` produce output, else they produce nothing.
todo_include_todos = True


def setup(app):
    """Register the extra JavaScript and CSS static files on the Sphinx application ``app``."""
    # this is for hiding doctest decoration,
    # see: http://z4r.github.io/python/2011/12/02/hides-the-prompts-and-output/
    app.add_js_file("copybutton.js")
    app.add_css_file("main.css")


# Ignoring Third-party packages
# https://stackoverflow.com/questions/15889621/sphinx-how-to-exclude-imports-in-automodule
def _package_list_from_file(file):
    """Return the bare package names listed in a pip requirements file.

    Every line is cut at the first character that cannot be part of a package name, so
    version specifiers (``==``, ``>=``, ``~=``, ``!=``, ...), extras (``pkg[extra]``),
    environment markers (``pkg; python_version < "3.9"``), direct references
    (``pkg @ https://...``) and inline comments are all dropped. Blank lines, comment-only
    lines and pip option lines (``-r other.txt``, ``-e .``) contribute nothing.

    Args:
        file: path of the requirements file to read.

    Returns:
        The package names in file order, without surrounding whitespace.

    """
    # characters that terminate the package name on a requirement line
    delimiters = ",=<>#~!;[@ \t"
    list_pkgs = []
    with open(file) as fp:
        for ln in fp:
            ln = ln.strip()
            # pip options are not packages and must not end up in the mock list
            if not ln or ln.startswith("-"):
                continue
            found = [ln.index(ch) for ch in delimiters if ch in ln]
            pkg = ln[: min(found)] if found else ln
            # a comment-only line is cut at index 0 and leaves an empty name
            if pkg:
                list_pkgs.append(pkg)
    return list_pkgs


# define mapping from PyPI names to python imports
PACKAGE_MAPPING = {
    "PyYAML": "yaml",
}
MOCK_PACKAGES = []
if SPHINX_MOCK_REQUIREMENTS:
    # mock also base packages when we are on RTD since we don't install them there
    MOCK_PACKAGES += _package_list_from_file(os.path.join(_PATH_ROOT, "requirements.txt"))
MOCK_PACKAGES = [PACKAGE_MAPPING.get(pkg, pkg) for pkg in MOCK_PACKAGES]

autodoc_mock_imports = MOCK_PACKAGES


# Resolve function
# This function is used to populate the (source) links in the API
def linkcode_resolve(domain, info):
    """Build the GitHub URL pointing at the source of a documented Python object.

    Args:
        domain: documentation domain of the object; anything other than ``"py"`` is ignored.
        info: mapping with the keys ``"module"`` (dotted module name) and ``"fullname"``
            (dotted attribute path of the object inside that module).

    Returns:
        The ``https://github.com/<user>/<repo>/blob/...`` URL, or ``None`` when the domain is
        not ``"py"`` or no module is given.

    """

    def find_source():
        # try to find the file and line number, based on code from numpy:
        # https://github.com/numpy/numpy/blob/master/doc/source/conf.py#L286
        obj = sys.modules[info["module"]]
        for part in info["fullname"].split("."):
            obj = getattr(obj, part)
        fname = inspect.getsourcefile(obj)
        # https://github.com/rtfd/readthedocs.org/issues/5735
        if any(s in fname for s in ("readthedocs", "rtfd", "checkouts")):
            # /home/docs/checkouts/readthedocs.org/user_builds/pytorch_lightning/checkouts/
            # devel/pytorch_lightning/utilities/cls_experiment.py#L26-L176
            path_top = os.path.abspath(os.path.join("..", "..", ".."))
            fname = os.path.relpath(fname, start=path_top)
        else:
            # Local build, imitate master
            fname = "master/" + os.path.relpath(fname, start=os.path.abspath(".."))
        source, lineno = inspect.getsourcelines(obj)
        return fname, lineno, lineno + len(source) - 1

    if domain != "py" or not info["module"]:
        return None
    try:
        filename = "%s#L%d-L%d" % find_source()
    except Exception:
        # any failure while locating the source falls back to a path derived from the module name
        # NOTE(review): here the first path component is the top-level package name rather than a
        # branch, so the URL built below carries no branch segment - confirm this is intended
        filename = info["module"].replace(".", "/") + ".py"
    # import subprocess
    # tag = subprocess.Popen(['git', 'rev-parse', 'HEAD'], stdout=subprocess.PIPE,
    #                        universal_newlines=True).communicate()[0][:-1]
    branch = filename.split("/")[0]
    # do mapping from latest tags to master
    branch = {"latest": "master", "stable": "master"}.get(branch, branch)
    filename = "/".join([branch] + filename.split("/")[1:])
    return f"https://github.com/{github_user}/{github_repo}/blob/{filename}"


autosummary_generate = True

autodoc_member_order = "groupwise"
autoclass_content = "both"
# the options are fixed and will be soon in release,
# see https://github.com/sphinx-doc/sphinx/issues/5459
autodoc_default_options = {
    "members": None,
    "methods": None,
    # 'attributes': None,
    "special-members": "__call__",
    "exclude-members": "_abc_impl",
    "show-inheritance": True,
    "private-members": True,
    "noindex": True,
}

# Sphinx will add “permalinks” for each heading and description environment as paragraph signs that
# become visible when the mouse
hovers over them. +# This value determines the text for the permalink; it defaults to "¶". Set it to None or the empty +# string to disable permalinks. +# https://www.sphinx-doc.org/en/master/usage/configuration.html#confval-html_permalinks +# html_add_permalinks = "¶" +# True to prefix each section label with the name of the document it is in, followed by a colon. +# For example, index:Introduction for a section called Introduction that appears in document index.rst. +# Useful for avoiding ambiguity when the same section heading appears in different documents. +# http://www.sphinx-doc.org/en/master/usage/extensions/autosectionlabel.html +autosectionlabel_prefix_document = True + +# only run doctests marked with a ".. doctest::" directive +doctest_test_doctest_blocks = "" +doctest_global_setup = """ +import importlib +import os +import lightning as L + +from lightning_utilities.core.imports import package_available +from lightning import LightningModule, Trainer +from lightning.fabric.loggers.tensorboard import _TENSORBOARD_AVAILABLE, _TENSORBOARDX_AVAILABLE + +_TORCHVISION_AVAILABLE = package_available("torchvision") +""" +coverage_skip_undoc_in_source = True + +# skip false positive linkcheck errors from anchors +linkcheck_anchors = False + +# ignore all links in any CHANGELOG file +linkcheck_exclude_documents = [r"^(.*\/)*CHANGELOG.*$"] diff --git a/docs/source-fabric/examples/index.rst b/docs/source-fabric/examples/index.rst new file mode 100644 index 0000000..3936f2e --- /dev/null +++ b/docs/source-fabric/examples/index.rst @@ -0,0 +1,74 @@ +######## +Examples +######## + +.. raw:: html + +
+
+ +.. displayitem:: + :header: Image Classification + :description: Train an image classifier on the MNIST dataset + :button_link: https://github.com/Lightning-AI/lightning/blob/master/examples/fabric/image_classifier + :col_css: col-md-4 + :height: 150 + :tag: basic + +.. displayitem:: + :header: Transformer Language Model + :description: A simple language model that learns to predict the next word in a sentence + :button_link: https://github.com/Lightning-AI/lightning/blob/master/examples/fabric/language_model + :col_css: col-md-4 + :height: 150 + :tag: basic + +.. displayitem:: + :header: GAN + :description: Train a GAN that generates realistic human faces + :button_link: https://github.com/Lightning-AI/lightning/blob/master/examples/fabric/dcgan + :col_css: col-md-4 + :height: 150 + :tag: intermediate + +.. displayitem:: + :header: Meta-Learning + :description: Distributed training with the MAML algorithm on the Omniglot and MiniImagenet datasets + :button_link: https://github.com/Lightning-AI/lightning/blob/master/examples/fabric/meta_learning + :col_css: col-md-4 + :height: 150 + :tag: intermediate + +.. displayitem:: + :header: Large Language Models + :description: Pre-train a GPT-2 language model on OpenWebText data + :button_link: https://github.com/Lightning-AI/nanoGPT/blob/master/train_fabric.py + :col_css: col-md-4 + :height: 150 + :tag: advanced + +.. displayitem:: + :header: Reinforcement Learning + :description: Implementation of the Proximal Policy Optimization (PPO) algorithm with multi-GPU support + :button_link: https://github.com/Lightning-AI/lightning/blob/master/examples/fabric/reinforcement_learning + :col_css: col-md-4 + :height: 150 + +.. displayitem:: + :header: K-Fold Cross Validation + :description: Cross validation helps you estimate the generalization error of a model and select the best one. + :button_link: https://github.com/Lightning-AI/lightning/tree/master/examples/fabric/kfold_cv + :col_css: col-md-4 + :height: 150 + +.. 
displayitem:: + :header: Active Learning + :description: Coming soon + :col_css: col-md-4 + :height: 150 + + +.. raw:: html + +
+
diff --git a/docs/source-fabric/fundamentals/accelerators.rst b/docs/source-fabric/fundamentals/accelerators.rst new file mode 100644 index 0000000..c1496a0 --- /dev/null +++ b/docs/source-fabric/fundamentals/accelerators.rst @@ -0,0 +1,78 @@ +################################ +Accelerate your code with Fabric +################################ + + +.. video:: https://pl-public-data.s3.amazonaws.com/assets_lightning/fabric/animations/accelerators.mp4 + :width: 800 + :autoplay: + :loop: + :muted: + :nocontrols: + + +*************************** +Set accelerator and devices +*************************** + +Fabric enables you to take full advantage of the hardware on your system. It supports + +- CPU +- GPU (NVIDIA, AMD, Apple Silicon) +- TPU + +By default, Fabric tries to maximize the hardware utilization of your system + +.. code-block:: python + + # Default settings + fabric = Fabric(accelerator="auto", devices="auto", strategy="auto") + + # Same as + fabric = Fabric() + +This is the most flexible option and makes your code run on most systems. +You can also explicitly set which accelerator to use: + +.. code-block:: python + + # CPU (slow) + fabric = Fabric(accelerator="cpu") + + # GPU + fabric = Fabric(accelerator="gpu", devices=1) + + # GPU (multiple) + fabric = Fabric(accelerator="gpu", devices=8) + + # GPU: Apple M1/M2 only + fabric = Fabric(accelerator="mps") + + # GPU: NVIDIA CUDA only + fabric = Fabric(accelerator="cuda", devices=8) + + # TPU + fabric = Fabric(accelerator="tpu", devices=8) + + +For running on multiple devices in parallel, also known as "distributed", read our guide for :doc:`Launching Multiple Processes <./launch>`. + + +---- + + +***************** +Access the Device +***************** + +You can access the device anytime through ``fabric.device``. +This lets you replace boilerplate code like this: + +.. 
code-block:: diff + + - if torch.cuda.is_available(): + - device = torch.device("cuda") + - else: + - device = torch.device("cpu") + + + device = fabric.device diff --git a/docs/source-fabric/fundamentals/code_structure.rst b/docs/source-fabric/fundamentals/code_structure.rst new file mode 100644 index 0000000..36b11ff --- /dev/null +++ b/docs/source-fabric/fundamentals/code_structure.rst @@ -0,0 +1,168 @@ +###################################### +How to structure your code with Fabric +###################################### + +Fabric is flexible enough to adapt to any project structure, regardless of whether you are experimenting with a simple script or an extensive framework, because it makes no assumptions about how your code is organized. +Despite the ultimate freedom, this page is meant to give beginners a template for how to organize a typical training script with Fabric: +We also have several :doc:`examples <../examples/index>` that you can take inspiration from. + + +---- + + +***************** +The Main Function +***************** + +At the highest level, every Python script should contain the following boilerplate code to guard the entry point for the main function: + +.. code-block:: python + + def main(): + # Here goes all the rest of the code + ... + + + if __name__ == "__main__": + # This is the entry point of your program + main() + + +This ensures that any form of multiprocessing will work properly (for example, ``DataLoader(num_workers=...)`` etc.) + + +---- + + +************** +Model Training +************** + +Here is a skeleton for training a model in a function ``train()``: + +.. code-block:: python + + import lightning as L + + + def train(fabric, model, optimizer, dataloader): + # Training loop + model.train() + for epoch in range(num_epochs): + for i, batch in enumerate(dataloader): + ... + + + def main(): + # (Optional) Parse command line options + args = parse_args() + + # Configure Fabric + fabric = L.Fabric(...) 
+ + # Instantiate objects + model = ... + optimizer = ... + train_dataloader = ... + + # Set up objects + model, optimizer = fabric.setup(model, optimizer) + train_dataloader = fabric.setup_dataloaders(train_dataloader) + + # Run training loop + train(fabric, model, optimizer, train_dataloader) + + + if __name__ == "__main__": + main() + + +---- + + +***************************** +Training, Validation, Testing +***************************** + +Often it is desired to evaluate the ability of the model to generalize on unseen data. +Here is how the code would be structured if we did that periodically during training (called validation) and after training (called testing). + + +.. code-block:: python + + import lightning as L + + + def train(fabric, model, optimizer, train_dataloader, val_dataloader): + # Training loop with validation every few epochs + model.train() + for epoch in range(num_epochs): + for i, batch in enumerate(train_dataloader): + ... + + if epoch % validate_every_n_epoch == 0: + validate(fabric, model, val_dataloader) + + + def validate(fabric, model, dataloader): + # Validation loop + model.eval() + for i, batch in enumerate(dataloader): + ... + + + def test(fabric, model, dataloader): + # Test/Prediction loop + model.eval() + for i, batch in enumerate(dataloader): + ... + + + def main(): + ... + + # Run training loop with validation + train(fabric, model, optimizer, train_dataloader, val_dataloader) + + # Test on unseen data + test(fabric, model, test_dataloader) + + + if __name__ == "__main__": + main() + + + +---- + + +************ +Full Trainer +************ + +Building a fully-fledged, personalized Trainer can be a lot of work. +To get started quickly, copy `this `_ Trainer template and adapt it to your needs. 
+ +- Only ~500 lines of code, all in one file +- Relies on Fabric to configure accelerator, devices, strategy +- Simple epoch based training with validation loop +- Only essential features included: Checkpointing, loggers, progress bar, callbacks, gradient accumulation + + +.. raw:: html + +
+
+ +.. displayitem:: + :header: Trainer Template + :description: Take our Fabric Trainer template and customize it for your needs + :button_link: https://github.com/Lightning-AI/lightning/tree/master/examples/fabric/build_your_own_trainer + :col_css: col-md-4 + :height: 150 + :tag: intermediate + +.. raw:: html + +
+
diff --git a/docs/source-fabric/fundamentals/convert.rst b/docs/source-fabric/fundamentals/convert.rst new file mode 100644 index 0000000..8b80cb4 --- /dev/null +++ b/docs/source-fabric/fundamentals/convert.rst @@ -0,0 +1,129 @@ +############################## +Convert PyTorch code to Fabric +############################## + +Here are five easy steps to let :class:`~lightning.fabric.fabric.Fabric` scale your PyTorch models. + +**Step 1:** Create the :class:`~lightning.fabric.fabric.Fabric` object at the beginning of your training code. + +.. code-block:: python + + from lightning.fabric import Fabric + + fabric = Fabric() + +**Step 2:** Call :meth:`~lightning.fabric.fabric.Fabric.launch` if you intend to use multiple devices (e.g., multi-GPU). + +.. code-block:: python + + fabric.launch() + +**Step 3:** Call :meth:`~lightning.fabric.fabric.Fabric.setup` on each model and optimizer pair and :meth:`~lightning.fabric.fabric.Fabric.setup_dataloaders` on all your data loaders. + +.. code-block:: python + + model, optimizer = fabric.setup(model, optimizer) + dataloader = fabric.setup_dataloaders(dataloader) + +**Step 4:** Remove all ``.to`` and ``.cuda`` calls since :class:`~lightning.fabric.fabric.Fabric` will take care of it. + +.. code-block:: diff + + - model.to(device) + - batch.to(device) + +**Step 5:** Replace ``loss.backward()`` by ``fabric.backward(loss)``. + +.. code-block:: diff + + - loss.backward() + + fabric.backward(loss) + + +These are all code changes required to prepare your script for Fabric. +You can now simply run from the terminal: + +.. code-block:: bash + + python path/to/your/script.py + +| + +All steps combined, this is how your code will change: + +.. 
code-block:: diff + + import torch + from lightning.pytorch.demos import WikiText2, Transformer + + import lightning as L + + - device = torch.device("cuda" if torch.cuda.is_available() else "cpu") + + fabric = L.Fabric(accelerator="cuda", devices=8, strategy="ddp") + + fabric.launch() + + dataset = WikiText2() + dataloader = torch.utils.data.DataLoader(dataset) + model = Transformer(vocab_size=dataset.vocab_size) + optimizer = torch.optim.SGD(model.parameters(), lr=0.1) + + - model = model.to(device) + + model, optimizer = fabric.setup(model, optimizer) + + dataloader = fabric.setup_dataloaders(dataloader) + + model.train() + for epoch in range(20): + for batch in dataloader: + input, target = batch + - input, target = input.to(device), target.to(device) + optimizer.zero_grad() + output = model(input, target) + loss = torch.nn.functional.nll_loss(output, target.view(-1)) + - loss.backward() + + fabric.backward(loss) + optimizer.step() + + +That's it! You can now train on any device at any scale with a switch of a flag. +Check out our before-and-after example for `image classification `_ and many more :doc:`examples <../examples/index>` that use Fabric. + + +---- + + +********** +Next steps +********** + +.. raw:: html + +
+
+ +.. displayitem:: + :header: Examples + :description: See examples across computer vision, NLP, RL, etc. + :col_css: col-md-4 + :button_link: ../examples/index.html + :height: 150 + :tag: basic + +.. displayitem:: + :header: Accelerators + :description: Take advantage of your hardware with a switch of a flag + :button_link: accelerators.html + :col_css: col-md-4 + :height: 150 + :tag: basic + +.. displayitem:: + :header: Build your own Trainer + :description: Learn how to build a trainer tailored for you + :col_css: col-md-4 + :button_link: ../levels/intermediate + :height: 150 + :tag: intermediate + +.. raw:: html + +
+
diff --git a/docs/source-fabric/fundamentals/installation.rst b/docs/source-fabric/fundamentals/installation.rst new file mode 100644 index 0000000..f7c35f7 --- /dev/null +++ b/docs/source-fabric/fundamentals/installation.rst @@ -0,0 +1,77 @@ +################# +Install Lightning +################# + +Fabric is part of the `Lightning `_ package. Here is how you get it! + +| + +.. raw:: html + +
+
+ +**Pip users** + +.. code-block:: bash + + pip install lightning + +.. raw:: html + +
+
+ +**Conda users** + +.. code-block:: bash + + conda install lightning -c conda-forge + +.. raw:: html + +
+
+ +| + + +If you don't already have it, this command will also install the latest `stable PyTorch version `_. + +You can find the list of supported PyTorch versions in our `compatibility matrix `__. + + +---- + + +********** +Next steps +********** + +With the installation done, let's get your PyTorch code to the next level. + +.. raw:: html + +
+
+ +.. displayitem:: + :header: From PyTorch to Fabric + :description: Learn how to add Fabric to your PyTorch code + :button_link: ./convert.html + :col_css: col-md-4 + :height: 150 + :tag: basic + +.. displayitem:: + :header: Examples + :description: See examples across computer vision, NLP, RL, etc. + :col_css: col-md-4 + :button_link: ../examples/index.html + :height: 150 + :tag: basic + +.. raw:: html + +
+
diff --git a/docs/source-fabric/fundamentals/launch.rst b/docs/source-fabric/fundamentals/launch.rst new file mode 100644 index 0000000..bc4a5ba --- /dev/null +++ b/docs/source-fabric/fundamentals/launch.rst @@ -0,0 +1,243 @@ +########################### +Launch distributed training +########################### + +To run your code distributed across many devices and many machines, you need to do two things: + +1. Configure Fabric with the number of devices and number of machines you want to use +2. Launch your code in multiple processes + + +---- + + +************* +Simple Launch +************* + +.. video:: https://pl-public-data.s3.amazonaws.com/assets_lightning/fabric/animations/launch.mp4 + :width: 800 + :autoplay: + :loop: + :muted: + :nocontrols: + +You can configure and launch processes on your machine directly with Fabric's :meth:`~lightning.fabric.fabric.Fabric.launch` method: + +.. code-block:: python + + # train.py + ... + + # Configure accelerator, devices, num_nodes, etc. + fabric = Fabric(devices=4, ...) + + # This launches itself into multiple processes + fabric.launch() + + +In the command line, you run this like any other Python script: + +.. code-block:: bash + + python train.py + + +This is the recommended way for running on a single machine and is the most convenient method for development and debugging. + +It is also possible to use Fabric in a Jupyter notebook (including Google Colab, Kaggle, etc.) and launch multiple processes there. +You can learn more about it :ref:`here `. + + +---- + + +******************* +Launch with the CLI +******************* + +.. video:: https://pl-public-data.s3.amazonaws.com/assets_lightning/fabric/animations/launch-cli.mp4 + :width: 800 + :autoplay: + :loop: + :muted: + :nocontrols: + +An alternative way to launch your Python script in multiple processes is to use the dedicated command line interface (CLI): + +.. 
code-block:: bash + + lightning run model path/to/your/script.py + +This is essentially the same as running ``python path/to/your/script.py``, but it also lets you configure the following settings externally without changing your code: + +- ``--accelerator``: The accelerator to use +- ``--devices``: The number of devices to use (per machine) +- ``--num_nodes``: The number of machines (nodes) to use +- ``--precision``: Which type of precision to use +- ``--strategy``: The strategy (communication layer between processes) + + +.. code-block:: bash + + lightning run model --help + + Usage: lightning run model [OPTIONS] SCRIPT [SCRIPT_ARGS]... + + Run a Lightning Fabric script. + + SCRIPT is the path to the Python script with the code to run. The script + must contain a Fabric object. + + SCRIPT_ARGS are the remaining arguments that you can pass to the script + itself and are expected to be parsed there. + + Options: + --accelerator [cpu|gpu|cuda|mps|tpu] + The hardware accelerator to run on. + --strategy [ddp|dp|deepspeed] Strategy for how to run across multiple + devices. + --devices TEXT Number of devices to run on (``int``), which + devices to run on (``list`` or ``str``), or + ``'auto'``. The value applies per node. + --num-nodes, --num_nodes INTEGER + Number of machines (nodes) for distributed + execution. + --node-rank, --node_rank INTEGER + The index of the machine (node) this command + gets started on. Must be a number in the + range 0, ..., num_nodes - 1. + --main-address, --main_address TEXT + The hostname or IP address of the main + machine (usually the one with node_rank = + 0). + --main-port, --main_port INTEGER + The main port to connect to the main + machine. + --precision [16-mixed|bf16-mixed|32-true|64-true|64|32|16|bf16] + Double precision (``64-true`` or ``64``), + full precision (``32-true`` or ``32``), half + precision (``16-mixed`` or ``16``) or + bfloat16 precision (``bf16-mixed`` or + ``bf16``) + --help Show this message and exit. 
+ + + +Here is how you run DDP with 8 GPUs and `torch.bfloat16 `_ precision: + +.. code-block:: bash + + lightning run model ./path/to/train.py \ + --strategy=ddp \ + --devices=8 \ + --accelerator=cuda \ + --precision="bf16" + +Or `DeepSpeed Zero3 `_ with mixed precision: + +.. code-block:: bash + + lightning run model ./path/to/train.py \ + --strategy=deepspeed_stage_3 \ + --devices=8 \ + --accelerator=cuda \ + --precision=16 + +:class:`~lightning.fabric.fabric.Fabric` can also figure it out automatically for you! + +.. code-block:: bash + + lightning run model ./path/to/train.py \ + --devices=auto \ + --accelerator=auto \ + --precision=16 + + +---- + + +.. _Fabric Cluster: + +******************* +Launch on a Cluster +******************* + +Fabric enables distributed training across multiple machines in several ways. +Choose from the following options based on your expertise level and available infrastructure. + +.. raw:: html + +
+
+ +.. displayitem:: + :header: Lightning Cloud + :description: The easiest way to scale models in the cloud. No infrastructure setup required. + :col_css: col-md-4 + :button_link: ../guide/multi_node/cloud.html + :height: 160 + :tag: basic + +.. displayitem:: + :header: SLURM Managed Cluster + :description: Most popular for academic and private enterprise clusters. + :col_css: col-md-4 + :button_link: ../guide/multi_node/slurm.html + :height: 160 + :tag: intermediate + +.. displayitem:: + :header: Bare Bones Cluster + :description: Train across machines on a network using `torchrun`. + :col_css: col-md-4 + :button_link: ../guide/multi_node/barebones.html + :height: 160 + :tag: advanced + +.. displayitem:: + :header: Other Cluster Environments + :description: MPI, LSF, Kubeflow + :col_css: col-md-4 + :button_link: ../guide/multi_node/other.html + :height: 160 + :tag: advanced + +.. raw:: html + +
+
+ + +---- + + +********** +Next steps +********** + +.. raw:: html + +
+
+ +.. displayitem:: + :header: Mixed Precision Training + :description: Save memory and speed up training using mixed precision + :col_css: col-md-4 + :button_link: ../fundamentals/precision.html + :height: 160 + :tag: basic + +.. displayitem:: + :header: Distributed Communication + :description: Learn all about communication primitives for distributed operation. Gather, reduce, broadcast, etc. + :button_link: ../advanced/distributed_communication.html + :col_css: col-md-4 + :height: 160 + :tag: advanced + +.. raw:: html + +
+
diff --git a/docs/source-fabric/fundamentals/notebooks.rst b/docs/source-fabric/fundamentals/notebooks.rst new file mode 100644 index 0000000..7cc9fab --- /dev/null +++ b/docs/source-fabric/fundamentals/notebooks.rst @@ -0,0 +1,28 @@ +.. _Fabric in Notebooks: + +################### +Fabric in Notebooks +################### + +Fabric works the same way in notebooks (Jupyter, Google Colab, Kaggle, etc.) if you only run in a single process or GPU. +If you want to use multiprocessing, for example, multi-GPU, you can put your code in a function and pass that function to the +:meth:`~lightning.fabric.fabric.Fabric.launch` method: + + +.. code-block:: python + + + # Notebook Cell + def train(fabric): + model = ... + optimizer = ... + model, optimizer = fabric.setup(model, optimizer) + ... + + + # Notebook Cell + fabric = Fabric(accelerator="cuda", devices=2) + fabric.launch(train) # Launches the `train` function on two GPUs + + +As you can see, this function accepts one argument, the ``Fabric`` object, and it gets launched on as many devices as specified. diff --git a/docs/source-fabric/fundamentals/precision.rst b/docs/source-fabric/fundamentals/precision.rst new file mode 100644 index 0000000..0ab7d46 --- /dev/null +++ b/docs/source-fabric/fundamentals/precision.rst @@ -0,0 +1,235 @@ +################################ +Save memory with mixed precision +################################ + +.. video:: https://pl-public-data.s3.amazonaws.com/assets_lightning/fabric/animations/precision.mp4 + :width: 800 + :autoplay: + :loop: + :muted: + :nocontrols: + + +************************ +What is Mixed Precision? +************************ + +Like most deep learning frameworks, PyTorch runs on 32-bit floating-point (FP32) arithmetic by default. +However, many deep learning models do not require this to reach complete accuracy during training. 
+Mixed precision training delivers significant computational speedup by conducting operations in half-precision while keeping minimum information in single-precision to maintain as much information as possible in crucial areas of the network. +Switching to mixed precision has resulted in considerable training speedups since the introduction of Tensor Cores in the Volta and Turing architectures. +It combines FP32 and lower-bit floating points (such as FP16) to reduce memory footprint and increase performance during model training and evaluation. +It accomplishes this by recognizing the steps that require complete accuracy and employing a 32-bit floating point for those steps only while using a 16-bit floating point for the rest. +Compared to complete precision training, mixed precision training delivers all these benefits while ensuring no task-specific accuracy is lost `[1] `_. + +This is how you select the precision in Fabric: + +.. code-block:: python + + from lightning.fabric import Fabric + + # This is the default + fabric = Fabric(precision="32-true") + + # Also FP32 (legacy) + fabric = Fabric(precision=32) + + # FP32 as well (legacy) + fabric = Fabric(precision="32") + + # Float16 mixed precision + fabric = Fabric(precision="16-mixed") + + # Float16 true half precision + fabric = Fabric(precision="16-true") + + # BFloat16 mixed precision (Volta GPUs and later) + fabric = Fabric(precision="bf16-mixed") + + # BFloat16 true half precision (Volta GPUs and later) + fabric = Fabric(precision="bf16-true") + + # 8-bit mixed precision via TransformerEngine (Hopper GPUs and later) + fabric = Fabric(precision="transformer-engine") + + # Double precision + fabric = Fabric(precision="64-true") + + # Or (legacy) + fabric = Fabric(precision="64") + + # Or (legacy) + fabric = Fabric(precision=64) + + +The same values can also be set through the :doc:`command line interface <launch>`: + +.. code-block:: bash + + lightning run model train.py --precision=bf16-mixed + + +.. 
note:: + + In some cases, it is essential to remain in FP32 for numerical stability, so keep this in mind when using mixed precision. + For example, when running scatter operations during the forward pass (such as torchpoint3d), the computation must remain in FP32. + + +---- + + +******************** +FP16 Mixed Precision +******************** + +In most cases, mixed precision uses FP16. +Supported `PyTorch operations `_ automatically run in FP16, saving memory and improving throughput on the supported accelerators. +Since computation happens in FP16, which has a very limited "dynamic range", there is a chance of numerical instability during training. +This is handled internally by a dynamic grad scaler which skips invalid steps and adjusts the scaler to ensure subsequent steps fall within a finite range. +For more information `see the autocast docs `_. + +This is how you enable FP16 in Fabric: + +.. code-block:: python + + # Select FP16 mixed precision + fabric = Fabric(precision="16-mixed") + +.. note:: + + When using TPUs, setting ``precision="16-mixed"`` will enable bfloat16 based mixed precision, the only supported half-precision type on TPUs. + + +---- + + +************************ +BFloat16 Mixed Precision +************************ + +BFloat16 Mixed precision is similar to FP16 mixed precision. However, it maintains more of the "dynamic range" that FP32 offers. +This means it can offer better numerical stability than FP16 mixed precision. +For more information, see `this TPU performance blog post `_. + +.. code-block:: python + + # Select BF16 precision + fabric = Fabric(precision="bf16-mixed") + + +Under the hood, we use `torch.autocast `__ with the dtype set to ``bfloat16``, with no gradient scaling. +It is also possible to use BFloat16 mixed precision on the CPU, relying on MKLDNN. + +.. note:: + + BFloat16 may not provide significant speedups or memory improvements, but it offers better numerical stability. 
+ For GPUs, the most significant benefits require `Ampere `_ based GPUs or newer, such as A100s or 3090s. + + +---- + + +***************************************************** +Float8 Mixed Precision via Nvidia's TransformerEngine +***************************************************** + +`Transformer Engine `__ (TE) is a library for accelerating models on the +latest NVIDIA GPUs using 8-bit floating point (FP8) precision on Hopper GPUs, to provide better performance with lower +memory utilization in both training and inference. It offers improved performance over half precision with no degradation in accuracy. + +Using TE requires replacing some of the layers in your model. Fabric automatically replaces the :class:`torch.nn.Linear` +and :class:`torch.nn.LayerNorm` layers in your model with their TE alternatives, however, TE also offers +`fused layers `__ +to squeeze out all the possible performance. If Fabric detects that any layer has been replaced already, automatic +replacement is not done. + +This plugin is a mix of "mixed" and "true" precision. The computation is downcasted to FP8 precision on the fly, but +the model and inputs can be kept in true full or half precision. + +.. code-block:: python + + # Select 8bit mixed precision via TransformerEngine + fabric = Fabric(precision="transformer-engine") + + # Customize the fp8 recipe or set a different base precision: + from lightning.fabric.plugins.precision import TransformerEnginePrecision + + recipe = {"fp8_format": "HYBRID", "amax_history_len": 16, "amax_compute_algo": "max"} + precision = TransformerEnginePrecision(dtype=torch.bfloat16, recipe=recipe) + fabric = Fabric(plugins=precision) + + +Under the hood, we use `transformer_engine.pytorch.fp8_autocast `__ with the default fp8 recipe. + +.. note:: + + This requires `Hopper `_ based GPUs or newer, such as the H100. 
+ + +---- + + +******************* +True Half Precision +******************* + +As mentioned before, for numerical stability mixed precision keeps the model weights in full float32 precision while casting only supported operations to lower bit precision. +However, in some cases it is indeed possible to train completely in half precision. Similarly, for inference the model weights can often be cast to half precision without a loss in accuracy (even when trained with mixed precision). + +.. code-block:: python + + # Select FP16 precision + fabric = Fabric(precision="16-true") + model = MyModel() + model = fabric.setup(model) # model gets cast to torch.float16 + + # Select BF16 precision + fabric = Fabric(precision="bf16-true") + model = MyModel() + model = fabric.setup(model) # model gets cast to torch.bfloat16 + +Tip: For faster initialization, you can create model parameters with the desired dtype directly on the device: + +.. code-block:: python + + fabric = Fabric(precision="bf16-true") + + # init the model directly on the device and with parameters in half-precision + with fabric.init_module(): + model = MyModel() + + model = fabric.setup(model) + + +---- + + +************************************ +Control where precision gets applied +************************************ + +Fabric automatically casts the data type and operations in the ``forward`` of your model: + +.. code-block:: python + + fabric = Fabric(precision="bf16-mixed") + + model = ... + optimizer = ... 
+ + # Here, Fabric sets up the `model.forward` for precision auto-casting + model, optimizer = fabric.setup(model, optimizer) + + # Precision casting gets handled in your forward, no code changes required + output = model.forward(input) + + # Precision does NOT get applied here (only in forward) + loss = loss_function(output, target) + +If you want to enable operations in lower bit-precision **outside** your model's ``forward()``, you can use the :meth:`~lightning.fabric.fabric.Fabric.autocast` context manager: + +.. code-block:: python + + # Precision now gets also handled in this part of the code: + with fabric.autocast(): + loss = loss_function(output, target) diff --git a/docs/source-fabric/glossary/index.rst b/docs/source-fabric/glossary/index.rst new file mode 100644 index 0000000..4b23fce --- /dev/null +++ b/docs/source-fabric/glossary/index.rst @@ -0,0 +1,185 @@ +######## +Glossary +######## + + +.. raw:: html + +
+
+ +.. displayitem:: + :header: Accelerator + :button_link: ../fundamentals/accelerators.html + :col_css: col-md-4 + +.. displayitem:: + :header: Apple Silicon + :button_link: ../fundamentals/accelerators.html + :col_css: col-md-4 + +.. displayitem:: + :header: Autocast + :button_link: ../fundamentals/precision.html + :col_css: col-md-4 + +.. displayitem:: + :header: Barrier + :button_link: ../advanced/distributed_communication.html + :col_css: col-md-4 + +.. displayitem:: + :header: Broadcast + :button_link: ../advanced/distributed_communication.html + :col_css: col-md-4 + +.. displayitem:: + :header: Callback + :button_link: ../guide/callbacks.html + :col_css: col-md-4 + +.. displayitem:: + :header: Checkpoint + :button_link: ../guide/checkpoint.html + :col_css: col-md-4 + +.. displayitem:: + :header: CLI + :button_link: ../fundamentals/launch.html + :col_css: col-md-4 + +.. displayitem:: + :header: Cloud + :button_link: ../guide/multi_node/cloud.html + :col_css: col-md-4 + +.. displayitem:: + :header: Collective + :button_link: ../advanced/distributed_communication.html + :col_css: col-md-4 + +.. displayitem:: + :header: CUDA + :button_link: ../fundamentals/accelerators.html + :col_css: col-md-4 + +.. displayitem:: + :header: FSDP + :button_link: ../advanced/model_parallel/fsdp.html + :col_css: col-md-4 + +.. displayitem:: + :header: Gather + :button_link: ../advanced/distributed_communication.html + :col_css: col-md-4 + +.. displayitem:: + :header: Gradient Accumulation + :button_link: ../advanced/gradient_accumulation.html + :col_css: col-md-4 + +.. displayitem:: + :header: GPU + :button_link: ../fundamentals/accelerators.html + :col_css: col-md-4 + +.. displayitem:: + :header: Jupyter + :button_link: ../fundamentals/notebooks.html + :col_css: col-md-4 + +.. displayitem:: + :header: Launch + :button_link: ../fundamentals/launch.html + :col_css: col-md-4 + +.. 
displayitem:: + :header: LightningModule + :button_link: ../guide/lightning_module.html + :col_css: col-md-4 + +.. displayitem:: + :header: Logger + :button_link: ../guide/logging.html + :col_css: col-md-4 + +.. displayitem:: + :header: Mixed Precision + :button_link: ../fundamentals/precision.html + :col_css: col-md-4 + +.. displayitem:: + :header: MPI + :button_link: ../guide/multi_node/other.html + :col_css: col-md-4 + +.. displayitem:: + :header: MPS + :button_link: ../fundamentals/accelerators.html + :col_css: col-md-4 + +.. displayitem:: + :header: Multi-GPU + :button_link: ../fundamentals/launch.html + :col_css: col-md-4 + +.. displayitem:: + :header: Multi-Node + :button_link: ../fundamentals/launch.html + :col_css: col-md-4 + +.. displayitem:: + :header: Notebook + :button_link: ../fundamentals/notebooks.html + :col_css: col-md-4 + +.. displayitem:: + :header: Optimizers + :button_link: ../advanced/multiple_setup.html + :col_css: col-md-4 + +.. displayitem:: + :header: Precision + :button_link: ../fundamentals/precision.html + :col_css: col-md-4 + +.. displayitem:: + :header: Reduce + :button_link: ../advanced/distributed_communication.html + :col_css: col-md-4 + +.. displayitem:: + :header: SLURM + :button_link: ../guide/multi_node/slurm.html + :col_css: col-md-4 + +.. displayitem:: + :header: TensorBoard + :button_link: ../guide/logging.html + :col_css: col-md-4 + +.. displayitem:: + :header: TorchElastic + :button_link: ../guide/multi_node/barebones.html + :col_css: col-md-4 + +.. displayitem:: + :header: TorchRun + :button_link: ../guide/multi_node/barebones.html + :col_css: col-md-4 + +.. displayitem:: + :header: TPU + :button_link: ../fundamentals/accelerators.html + :col_css: col-md-4 + +.. displayitem:: + :header: Trainer + :button_link: ../guide/trainer_template.html + :col_css: col-md-4 + + +.. raw:: html + +
+
diff --git a/docs/source-fabric/guide/callbacks.rst b/docs/source-fabric/guide/callbacks.rst new file mode 100644 index 0000000..87fd58e --- /dev/null +++ b/docs/source-fabric/guide/callbacks.rst @@ -0,0 +1,113 @@ +######### +Callbacks +######### + +Callbacks enable you, or the users of your code, to add new behavior to the training loop without needing to modify the source code. + + +---- + + +************************************* +Add a callback interface to your loop +************************************* + +Suppose we want to enable anyone to run some arbitrary code at the end of a training iteration. +Here is how that gets done in Fabric: + +.. code-block:: python + :caption: my_callbacks.py + + class MyCallback: + def on_train_batch_end(self, loss, output): + # Here, put any code you want to run at the end of a training step + ... + + +.. code-block:: python + :caption: train.py + :emphasize-lines: 4,7,18 + + from lightning.fabric import Fabric + + # The code of a callback can live anywhere, away from the training loop + from my_callbacks import MyCallback + + # Add one or several callbacks: + fabric = Fabric(callbacks=[MyCallback()]) + + ... + + for iteration, batch in enumerate(train_dataloader): + ... + fabric.backward(loss) + optimizer.step() + + # Let a callback add some arbitrary processing at the appropriate place + # Give the callback access to some variables + fabric.call("on_train_batch_end", loss=loss, output=...) + + +As you can see, the code inside the callback method is completely decoupled from the trainer code. +This enables flexibility in extending the loop in arbitrary ways. + +**Exercise**: Implement a callback that computes and prints the time to complete an iteration. + + +---- + + +****************** +Multiple callbacks +****************** + +The callback system is designed to easily run multiple callbacks at the same time. +You can pass a list to Fabric: + +.. 
code-block:: python + + # Add multiple callback implementations in a list + callback1 = LearningRateMonitor() + callback2 = Profiler() + fabric = Fabric(callbacks=[callback1, callback2]) + + # Let Fabric call the implementations (if they exist) + fabric.call("any_callback_method", arg1=..., arg2=...) + + # fabric.call is the same as doing this + callback1.any_callback_method(arg1=..., arg2=...) + callback2.any_callback_method(arg1=..., arg2=...) + + +The :meth:`~lightning.fabric.fabric.Fabric.call` calls the callback objects in the order they were given to Fabric. +Not all objects registered via ``Fabric(callbacks=...)`` must implement a method with the given name. +The ones that have a matching method name will get called. + + +---- + + +********** +Next steps +********** + +Callbacks are a powerful tool for building a Trainer. +See a real example of how they can be integrated in our Trainer template based on Fabric: + +.. raw:: html + +
+
+ +.. displayitem:: + :header: Trainer Template + :description: Take our Fabric Trainer template and customize it for your needs + :button_link: https://github.com/Lightning-AI/lightning/tree/master/examples/fabric/build_your_own_trainer + :col_css: col-md-4 + :height: 150 + :tag: intermediate + +.. raw:: html + +
+
diff --git a/docs/source-fabric/guide/checkpoint.rst b/docs/source-fabric/guide/checkpoint.rst new file mode 100644 index 0000000..50e4cf5 --- /dev/null +++ b/docs/source-fabric/guide/checkpoint.rst @@ -0,0 +1,204 @@ +############################## +Saving and Loading Checkpoints +############################## + +Fabric makes it easy and efficient to save the state of your training loop into a checkpoint file, no matter how large your model is. + +---- + + +******************************** +Define the state of your program +******************************** + +To save and resume your training, you need to define which variables in your program you want to have saved. +Put everything into a dictionary, including models and optimizers and whatever metadata you have: + +.. code-block:: python + + # Define the state of your program/loop + state = {"model1": model1, "model2": model2, "optimizer": optimizer, "iteration": iteration, "hparams": ...} + + +---- + + +***************** +Save a checkpoint +***************** + +To save the state to the filesystem, pass it to the :meth:`~lightning.fabric.fabric.Fabric.save` method: + +.. code-block:: python + + fabric.save("path/to/checkpoint.ckpt", state) + +This will unwrap your model and optimizer and automatically convert their ``state_dict`` for you. +Fabric and the underlying strategy will decide in which format your checkpoint gets saved. +For example, ``strategy="ddp"`` saves a single file on rank 0, while ``strategy="fsdp"`` saves multiple files from all ranks. + + +---- + + +************************* +Restore from a checkpoint +************************* + +From a checkpoint saved by Fabric +================================= + +You can restore the state by loading a saved checkpoint back with :meth:`~lightning.fabric.fabric.Fabric.load`: + +.. code-block:: python + + fabric.load("path/to/checkpoint.ckpt", state) + +Fabric will replace the state of your objects in-place. 
+You can also request only to restore a portion of the checkpoint. +For example, you want only to restore the model weights in your inference script: + +.. code-block:: python + + state = {"model1": model1} + remainder = fabric.load("path/to/checkpoint.ckpt", state) + +The remainder of the checkpoint that wasn't restored gets returned in case you want to do something else with it. +If you want to be in complete control of how states get restored, you can omit passing a state and get the entire raw checkpoint dictionary returned: + +.. code-block:: python + + # Request the raw checkpoint + full_checkpoint = fabric.load("path/to/checkpoint.ckpt") + + model.load_state_dict(full_checkpoint["model"]) + optimizer.load_state_dict(full_checkpoint["optimizer"]) + ... + + +From a raw state-dict file +========================== + +You can load a raw weights file into a model directly using the :meth:`~lightning.fabric.fabric.Fabric.load_raw` method: + +.. code-block:: python + + model = MyModel() + + # A model weights file saved by your friend who doesn't use Fabric + fabric.load_raw("path/to/model.pt", model) + + # Equivalent to this: + # model.load_state_dict(torch.load("path/to/model.pt")) + + # Also supports optimizers + optimizer = torch.optim.Adam(model.parameters()) + fabric.load_raw("path/to/optimizer.pt", optimizer) + +The file to load must contain a valid state-dict for the model/optimizer. +If your checkpoint has a different format, you will have to convert it manually first. + + +---- + + +************************* +Load a partial checkpoint +************************* + +Loading a checkpoint is normally "strict", meaning parameter names in the checkpoint must match the parameter names in the model. +However, when loading checkpoints for fine-tuning or transfer learning, it can happen that only a portion of the parameters match the model. +For this case, you can disable strict loading to avoid errors: + +.. 
code-block:: python + + state = {"model": model} + + # strict loading is the default + fabric.load("path/to/checkpoint.ckpt", state, strict=True) + + # disable strict loading + fabric.load("path/to/checkpoint.ckpt", state, strict=False) + + +Here is a trivial example to illustrate how it works: + +.. code-block:: python + + import torch + import lightning as L + + fabric = L.Fabric() + + # Save a checkpoint of a trained model + model1 = torch.nn.Linear(2, 2, bias=True) + state = {"model": model1} + fabric.save("state.ckpt", state) + + # Later on, make a new model that misses a parameter + model2 = torch.nn.Linear(2, 2, bias=False) + state = {"model": model2} + + # `strict=True` would lead to an error, because the bias + # parameter is missing, but we can load the rest of the + # parameters successfully + fabric.load("state.ckpt", state, strict=False) + + +The :meth:`~lightning.fabric.fabric.Fabric.load_raw` method also supports the ``strict`` argument. +See also: `Saving and loading models in PyTorch `_. + + +---- + +************************* +Save a partial checkpoint +************************* + +When saving a checkpoint using Fabric, you have the flexibility to choose which parameters to include in the saved file. +This can be useful in scenarios such as fine-tuning, where you only want to save a subset of the parameters, reducing +the size of the checkpoint and saving disk space. + +To accomplish this, you can use filters during the saving process. The filter is a function that determines whether +an item should be saved (returning ``True``) or excluded (returning ``False``). +The filter operates on dictionary objects and evaluates each key-value pair individually. + +Here's an example of using a filter when saving a checkpoint: + +.. 
code-block:: python + + state = {"model": model, "optimizer": optimizer, "foo": 123} + + # save only the model weights + filter = {"model": lambda k, v: "weight" in k} + fabric.save("path/to/checkpoint.ckpt", state, filter=filter) + # This will save {"model": {"layer.weight": ...}, "optimizer": ..., "foo": 123} + # note that the optimizer params corresponding to the excluded model params are not filtered + + +---- + + +********** +Next steps +********** + +Learn from our template how Fabric's checkpoint mechanism can be integrated into a full Trainer: + +.. raw:: html + +
+
+ +.. displayitem:: + :header: Trainer Template + :description: Take our Fabric Trainer template and customize it for your needs + :button_link: https://github.com/Lightning-AI/lightning/tree/master/examples/fabric/build_your_own_trainer + :col_css: col-md-4 + :height: 150 + :tag: intermediate + +.. raw:: html + +
+
diff --git a/docs/source-fabric/guide/index.rst b/docs/source-fabric/guide/index.rst new file mode 100644 index 0000000..4d68aa7 --- /dev/null +++ b/docs/source-fabric/guide/index.rst @@ -0,0 +1,171 @@ +############# +How-to Guides +############# + + +****** +Basics +****** + + +.. raw:: html + +
+
+ +.. displayitem:: + :header: Convert to Fabric in 5 minutes + :description: Learn how to add Fabric to your PyTorch code + :button_link: ../fundamentals/convert.html + :col_css: col-md-4 + :height: 150 + :tag: basic + +.. displayitem:: + :header: Scale your model with Accelerators + :description: Take advantage of your hardware with a switch of a flag + :button_link: ../fundamentals/accelerators.html + :col_css: col-md-4 + :height: 150 + :tag: basic + +.. displayitem:: + :header: Structure your Fabric code + :description: Best practices for setting up your training script with Fabric + :button_link: ../fundamentals/code_structure.html + :col_css: col-md-4 + :height: 150 + :tag: basic + +.. displayitem:: + :header: Launch distributed training + :description: Launch a Python script on multiple devices and machines + :button_link: ../fundamentals/launch.html + :col_css: col-md-4 + :height: 150 + :tag: basic + +.. displayitem:: + :header: Launch Fabric in a notebook + :description: Launch on multiple devices from within a Jupyter notebook + :button_link: ../fundamentals/notebooks.html + :col_css: col-md-4 + :height: 150 + :tag: basic + +.. displayitem:: + :header: Improve performance with Mixed-Precision training + :description: Save memory and speed up training using mixed precision + :button_link: ../fundamentals/precision.html + :col_css: col-md-4 + :height: 150 + :tag: basic + +.. raw:: html + +
+
+ + + +********************** +Build your own Trainer +********************** + +.. raw:: html + +
+
+ +.. displayitem:: + :header: Organize your model code with LightningModule + :description: Organize your code in a LightningModule and use it with Fabric + :button_link: lightning_module.html + :col_css: col-md-4 + :height: 170 + :tag: intermediate + +.. displayitem:: + :header: Encapsulate code into Callbacks + :description: Make use of the Callback system in Fabric + :button_link: callbacks.html + :col_css: col-md-4 + :height: 170 + :tag: intermediate + +.. displayitem:: + :header: Track and visualize experiments + :description: Learn how Fabric helps you remove boilerplate code for tracking metrics with a logger + :button_link: logging.html + :col_css: col-md-4 + :height: 170 + :tag: intermediate + +.. displayitem:: + :header: Save and load model progress + :description: Efficient saving and loading of model weights, training state, hyperparameters and more. + :button_link: checkpoint.html + :col_css: col-md-4 + :height: 170 + :tag: intermediate + +.. displayitem:: + :header: Build your own Trainer + :description: Take our Fabric Trainer template and customize it for your needs + :button_link: https://github.com/Lightning-AI/lightning/tree/master/examples/fabric/build_your_own_trainer + :col_css: col-md-4 + :height: 170 + :tag: intermediate + +.. raw:: html + +
+
+ + +*************** +Advanced Topics +*************** + + +.. raw:: html + +
+
+ +.. displayitem:: + :header: Use efficient gradient accumulation + :description: Learn how to perform efficient gradient accumulation in distributed settings + :button_link: ../advanced/gradient_accumulation.html + :col_css: col-md-4 + :height: 160 + :tag: advanced + +.. displayitem:: + :header: Distribute communication + :description: Learn all about communication primitives for distributed operation. Gather, reduce, broadcast, etc. + :button_link: ../advanced/distributed_communication.html + :col_css: col-md-4 + :height: 160 + :tag: advanced + +.. displayitem:: + :header: Use multiple models and optimizers + :description: See how flexible Fabric is to work with multiple models and optimizers! + :button_link: ../advanced/multiple_setup.html + :col_css: col-md-4 + :height: 160 + :tag: advanced + +.. displayitem:: + :header: Train models with billions of parameters + :description: Train the largest models with FSDP across multiple GPUs and machines + :button_link: ../advanced/model_parallel/fsdp.html + :col_css: col-md-4 + :height: 160 + :tag: advanced + +.. raw:: html + +
+
diff --git a/docs/source-fabric/guide/lightning_module.rst b/docs/source-fabric/guide/lightning_module.rst new file mode 100644 index 0000000..6140a97 --- /dev/null +++ b/docs/source-fabric/guide/lightning_module.rst @@ -0,0 +1,148 @@ +################## +Organize Your Code +################## + +Any raw PyTorch can be converted to Fabric with zero refactoring required, giving maximum flexibility in how you want to organize your projects. + +However, when developing a project in a team or sharing the code publicly, it can be beneficial to conform to a standard format of how core pieces of the code are organized. +This is what the `LightningModule `_ was made for! + +Here is how you can neatly separate the research code (model, loss, optimization, etc.) from the "trainer" code (training loop, checkpointing, logging, etc.). + + +---- + + +************************************************* +Step 1: Move your code into LightningModule hooks +************************************************* + +Take these main ingredients and put them in a LightningModule: + +- The PyTorch model(s) as an attribute (e.g. ``self.model``) +- The forward, including loss computation, goes into ``training_step()`` +- Setup of optimizer(s) goes into ``configure_optimizers()`` +- Setup of the training data loader goes into ``train_dataloader()`` + + +.. code-block:: python + + import lightning as L + + + class LitModel(L.LightningModule): + def __init__(self): + super().__init__() + self.model = ... + + def training_step(self, batch, batch_idx): + # Main forward, loss computation, and metrics goes here + x, y = batch + y_hat = self.model(x) + loss = self.loss_fn(y, y_hat) + acc = self.accuracy(y, y_hat) + ... + return loss + + def configure_optimizers(self): + # Return one or several optimizers + return torch.optim.Adam(self.parameters(), ...) + + def train_dataloader(self): + # Return your dataloader for training + return DataLoader(...) 
+ + def on_train_start(self): + # Do something at the beginning of training + ... + + def any_hook_you_like(self, *args, **kwargs): + ... + + +This is a minimal LightningModule, but there are `many other useful hooks `_ you can use. + + +---- + + +**************************************** +Step 2: Call hooks from your Fabric code +**************************************** + +In your Fabric training loop, you can now call the hooks of the LightningModule interface. +It is up to you to call everything in the right place. + +.. code-block:: python + + import lightning as L + + fabric = L.Fabric(...) + + # Instantiate the LightningModule + model = LitModel() + + # Get the optimizer(s) from the LightningModule + optimizer = model.configure_optimizers() + + # Get the training data loader from the LightningModule + train_dataloader = model.train_dataloader() + + # Set up objects + model, optimizer = fabric.setup(model, optimizer) + train_dataloader = fabric.setup_dataloaders(train_dataloader) + + # Call the hooks at the right time + model.on_train_start() + + model.train() + for epoch in range(num_epochs): + for i, batch in enumerate(train_dataloader): + optimizer.zero_grad() + loss = model.training_step(batch, i) + fabric.backward(loss) + optimizer.step() + + # Control when hooks are called + if condition: + model.any_hook_you_like() + + +Your code is now modular. You can switch out the entire LightningModule implementation for another one, and you don't need to touch the training loop: + +.. code-block:: diff + + # Instantiate the LightningModule + - model = LitModel() + + model = DopeModel() + + ... + + +---- + + +************************************ +Access Fabric inside LightningModule +************************************ + +You can access the Fabric instance in any of the LightningModule hooks via ``self.fabric``, provided that you called +``fabric.setup()`` on the module. + +.. 
code-block:: python + + import lightning as L + + + class LitModel(L.LightningModule): + def on_train_start(self): + # Access Fabric and its attributes + print(self.fabric.world_size) + + + fabric = L.Fabric() + model = fabric.setup(LitModel()) + model.on_train_start() + +To maximize compatibility with LightningModules written for the Lightning Trainer, ``self.trainer`` is also available and will +reroute to ``self.fabric``. diff --git a/docs/source-fabric/guide/logging.rst b/docs/source-fabric/guide/logging.rst new file mode 100644 index 0000000..36b9513 --- /dev/null +++ b/docs/source-fabric/guide/logging.rst @@ -0,0 +1,123 @@ +############################### +Track and Visualize Experiments +############################### + +******************************* +Why do I need to track metrics? +******************************* + +In model development, we track values of interest, such as the *validation_loss* to visualize the learning process for our models. +Model development is like driving a car without windows. Charts and logs provide the *windows* to know where to drive the car. + +With Lightning, you can visualize virtually anything you can think of: numbers, text, images, and audio. + +---- + +************* +Track metrics +************* + +Metric visualization is the most basic but powerful way to understand how your model is doing throughout development. +To track a metric, add the following: + +**Step 1:** Pick a logger. + +.. code-block:: python + + from lightning.fabric import Fabric + from lightning.fabric.loggers import TensorBoardLogger + + # Pick a logger and add it to Fabric + logger = TensorBoardLogger(root_dir="logs") + fabric = Fabric(loggers=logger) + + +Built-in loggers you can choose from: + +- :class:`~lightning.fabric.loggers.TensorBoardLogger` +- :class:`~lightning.fabric.loggers.CSVLogger` + +| + +**Step 2:** Add :meth:`~lightning.fabric.fabric.Fabric.log` calls in your code. + +.. code-block:: python + + value = ... 
# Python scalar or tensor scalar + fabric.log("some_value", value) + + +To log multiple metrics at once, use :meth:`~lightning.fabric.fabric.Fabric.log_dict`: + +.. code-block:: python + + values = {"loss": loss, "acc": acc, "other": other} + fabric.log_dict(values) + + +---- + + +******************* +View logs dashboard +******************* + +How you can view the metrics depends on the individual logger you choose. +Most have a dashboard that lets you browse everything you log in real time. + +For the :class:`~lightning.fabric.loggers.tensorboard.TensorBoardLogger` shown above, you can open it by running + +.. code-block:: bash + + tensorboard --logdir=./logs + +If you're using a notebook environment such as *Google Colab* or *Kaggle* or *Jupyter*, launch TensorBoard with this command + +.. code-block:: bash + + %reload_ext tensorboard + %tensorboard --logdir=./logs + + +---- + + +************************* +Control logging frequency +************************* + +Logging a metric in every iteration can slow down the training. +Reduce the added overhead by logging less frequently: + +.. code-block:: python + :emphasize-lines: 3 + + for iteration in range(num_iterations): + if iteration % log_every_n_steps == 0: + value = ... + fabric.log("some_value", value) + + +---- + + +******************** +Use multiple loggers +******************** + +You can add as many loggers as you want without changing the logging code in your loop. + +.. 
code-block:: python + :emphasize-lines: 8 + + from lightning.fabric import Fabric + from lightning.fabric.loggers import CSVLogger, TensorBoardLogger + + tb_logger = TensorBoardLogger(root_dir="logs/tensorboard") + csv_logger = CSVLogger(root_dir="logs/csv") + + # Add multiple loggers in a list + fabric = Fabric(loggers=[tb_logger, csv_logger]) + + # Calling .log() or .log_dict() always logs to all loggers simultaneously + fabric.log("some_value", value) diff --git a/docs/source-fabric/guide/multi_node/barebones.rst b/docs/source-fabric/guide/multi_node/barebones.rst new file mode 100644 index 0000000..825f150 --- /dev/null +++ b/docs/source-fabric/guide/multi_node/barebones.rst @@ -0,0 +1,161 @@ +:orphan: + +################## +Bare Bones Cluster +################## + +**Audience**: Users who want to train on multiple machines that aren't part of a managed cluster. + +This guide shows how to run a training job on a general-purpose cluster. +It assumes that you can log in to each machine and run commands. + +Don't want to maintain your own infrastructure? Try the :doc:`Lightning cloud <./cloud>` instead. + + +---- + + +************ +Requirements +************ + +To set up a multi-node computing cluster, you need the following: + +1. Multiple computers with Lightning installed +2. Network connectivity between the machines with firewall rules that allow traffic flow on a specified port. + +| + +We highly recommend setting up a shared filesystem to avoid the cumbersome copying of files between machines. + + +---- + + +*************************** +Prepare the training script +*************************** + +.. code-block:: python + :caption: train.py + + from lightning.fabric import Fabric + + fabric = Fabric() + + # The rest of the training script + ... + +We intentionally omit ``strategy``, ``devices``, and ``num_nodes`` here because these settings will get supplied through the CLI in the later steps. +You can still hard-code other options if you like. 
+ + +---- + + +********************************* +Launch the script on your cluster +********************************* + +**Step 1**: Upload the training script and all needed files to the cluster. +Each node needs access to the same files. +If the nodes don't attach to a shared network drive, you'll need to upload the files to each node separately. + +**Step 2**: Pick one of the nodes as your main node and write down its IP address. +Example: 10.10.10.16 + +**Step 3**: Launch the script on each node using the Lightning CLI. + +In this example, we want to launch training across two nodes, each with 8 GPUs. +Log in to the **first node** and run this command: + +.. code-block:: bash + :emphasize-lines: 2,3 + + lightning run model \ + --node-rank=0 \ + --main-address=10.10.10.16 \ + --accelerator=cuda \ + --devices=8 \ + --num-nodes=2 \ + train.py + +Log in to the **second node** and run this command: + +.. code-block:: bash + :emphasize-lines: 2,3 + + lightning run model \ + --node-rank=1 \ + --main-address=10.10.10.16 \ + --accelerator=cuda \ + --devices=8 \ + --num-nodes=2 \ + train.py + +Note: The only difference between the two commands is the ``--node-rank`` setting, which identifies each node. +After executing these commands, you should immediately see an output like this: + +.. code-block:: + + Initializing distributed: GLOBAL_RANK: 0, MEMBER: 1/16 + Initializing distributed: GLOBAL_RANK: 1, MEMBER: 2/16 + ... + + +---- + + +*************** +Troubleshooting +*************** + + +**My program is stuck initializing at startup. What is causing this?** + +You are seeing a message like this in the logs, but nothing happens: + +.. code-block:: + + Initializing distributed: GLOBAL_RANK: 0, MEMBER: 1/4 + +The most likely reasons and how to fix it: + +- **Wrong network interface:** Some servers have multiple network interfaces. + There is usually only one that can send and receive traffic from the network of the other nodes, but sometimes it is not set as the default. 
+ In this case, you need to set it manually: + + .. code-block:: bash + + export GLOO_SOCKET_IFNAME=eno1 + export NCCL_SOCKET_IFNAME=eno1 + lightning run model ... + + You can find the interface name by parsing the output of the ``ifconfig`` command. + The name of this interface **may differ on each node**. + +- **NCCL can't communicate between the nodes:** + + Follow the steps in the `NCCL troubleshooting guide `_. + In particular, take note of the network section that describes restricting the port range and firewall rules. + + .. code-block:: bash + + echo "net.ipv4.ip_local_port_range = 50000 51000" >> /etc/sysctl.conf + sysctl --system + ufw allow 50000:51000/tcp + + +**My program crashes with an NCCL error, but it is not helpful** + +Launch your command by prepending ``NCCL_DEBUG=INFO`` to get more info. + +.. code-block:: bash + + NCCL_DEBUG=INFO lightning run model ... + + +---- + +If you are sick of troubleshooting cluster problems, give :doc:`Lightning cloud <./cloud>` a try! +For other questions, please don't hesitate to join the `Discord `_. diff --git a/docs/source-fabric/guide/multi_node/cloud.rst b/docs/source-fabric/guide/multi_node/cloud.rst new file mode 100644 index 0000000..833bb92 --- /dev/null +++ b/docs/source-fabric/guide/multi_node/cloud.rst @@ -0,0 +1,115 @@ +:orphan: + +########################## +Run in the Lightning Cloud +########################## + +**Audience**: Users who don't want to waste time on cluster configuration and maintenance. + + +The Lightning AI cloud is a platform where you can build, train, finetune and deploy models without worrying about infrastructure, cost management, scaling, and other technical headaches. +In this guide, and within just 10 minutes, you will learn how to run a Fabric training script across multiple nodes in the cloud. + + +---- + + +************* +Initial Setup +************* + +First, create a free `Lightning AI account `_. +Then, log in from the CLI: + +.. 
code-block:: bash + + lightning login + +A page opens in your browser where you can follow the instructions to complete the setup. + + +---- + + +*************************************** +Launch multi-node training in the cloud +*************************************** + +**Step 1:** Put your code inside a :class:`~lightning_app.core.work.LightningWork`: + +.. code-block:: python + :emphasize-lines: 5 + :caption: app.py + + import lightning as L + from lightning.app.components import FabricMultiNode + + + # 1. Put your code inside a LightningWork + class MyTrainingComponent(L.LightningWork): + def run(self): + # Set up Fabric + # The `devices` and `num_nodes` get set by Lightning automatically + fabric = L.Fabric(strategy="ddp", precision="16-mixed") + + # Your training code + model = ... + optimizer = ... + model, optimizer = fabric.setup(model, optimizer) + ... + +**Step 2:** Init a :class:`~lightning_app.core.app.LightningApp` with the ``FabricMultiNode`` component. +Configure the number of nodes, the number of GPUs per node, and the type of GPU: + +.. code-block:: python + :emphasize-lines: 5,7 + :caption: app.py + + # 2. Create the app with the FabricMultiNode component inside + app = L.LightningApp( + FabricMultiNode( + MyTrainingComponent, + # Run with 2 nodes + num_nodes=2, + # Each with 4 x V100 GPUs, total 8 GPUs + cloud_compute=L.CloudCompute("gpu-fast-multi"), + ) + ) + + +**Step 3:** Run your code from the CLI: + +.. code-block:: bash + + lightning run app app.py --cloud + +This command will upload your Python file and then open the app admin view, where you can see the logs of what's happening. + +.. figure:: https://pl-public-data.s3.amazonaws.com/assets_lightning/fabric/fabric-multi-node-admin.png + :alt: The Lightning AI admin page of an app running a multi-node fabric training script + :width: 100% + + +---- + + +********** +Next steps +********** + +.. raw:: html + +
+
+ +.. displayitem:: + :header: Lightning Platform + :description: Develop, Train and Deploy models on the cloud + :col_css: col-md-4 + :button_link: https://lightning.ai + :height: 150 + +.. raw:: html + +
+
diff --git a/docs/source-fabric/guide/multi_node/other.rst b/docs/source-fabric/guide/multi_node/other.rst new file mode 100644 index 0000000..6bddf04 --- /dev/null +++ b/docs/source-fabric/guide/multi_node/other.rst @@ -0,0 +1,66 @@ +:orphan: + +########################## +Other Cluster Environments +########################## + +**Audience**: Users who want to run on a cluster that launches the training script via MPI, LSF, Kubeflow, etc. + +Lightning automates the details behind training on the most common cluster environments. +While :doc:`SLURM <./slurm>` is the most popular choice for on-prem clusters, there are other systems that Lightning can detect automatically. + +Don't have access to an enterprise cluster? Try the :doc:`Lightning cloud <./cloud>`. + + +---- + + +*** +MPI +*** + +`MPI (Message Passing Interface) `_ is a communication system for parallel computing. +There are many implementations available, the most popular among them are `OpenMPI `_ and `MPICH `_. +To support all these, Lightning relies on the `mpi4py package `_: + +.. code-block:: bash + + pip install mpi4py + +If the package is installed and the Python script gets launched by MPI, Fabric will automatically detect it and parse the process information from the environment. +There is nothing you have to change in your code: + +.. code-block:: python + + fabric = Fabric(...) # automatically detects MPI + print(fabric.world_size) # world size provided by MPI + print(fabric.global_rank) # rank provided by MPI + ... + +If you want to bypass the automatic detection, you can explicitly set the MPI environment as a plugin: + +.. code-block:: python + + from lightning.fabric.plugins.environments import MPIEnvironment + + fabric = Fabric(..., plugins=[MPIEnvironment()]) + + +---- + + +*** +LSF +*** + +Coming soon. + + +---- + + +******** +Kubeflow +******** + +Coming soon. 
diff --git a/docs/source-fabric/guide/multi_node/slurm.rst b/docs/source-fabric/guide/multi_node/slurm.rst new file mode 100644 index 0000000..62025ce --- /dev/null +++ b/docs/source-fabric/guide/multi_node/slurm.rst @@ -0,0 +1,136 @@ +:orphan: + +############################## +Run on a SLURM Managed Cluster +############################## + +**Audience**: Users who need to run on an academic or enterprise private cluster. + +Lightning automates the details behind training on a SLURM-powered cluster. +Unlike the :doc:`general-purpose cluster <./barebones>`, with SLURM the users don't need to start the jobs manually on each node but instead submit it to SLURM, which schedules the resources and time for which the job is allowed to run. + +Don't have access to an enterprise cluster? Try the :doc:`Lightning cloud <./cloud>`. + +---- + + +********************************* +Submit a training script to SLURM +********************************* + +To train a model using multiple nodes, do the following: + +**Step 1:** Set the number of devices per node and how many nodes the training will run on. + +.. code-block:: python + + from lightning.fabric import Fabric + + # Train on 32 GPUs across 4 nodes + fabric = Fabric(accelerator="gpu", devices=8, num_nodes=4) + +By default, this will run classic *distributed data-parallel*. +Optionally, explore other strategies too: + +.. code-block:: python + + # DeepSpeed + fabric = Fabric(accelerator="gpu", devices=8, num_nodes=4, strategy="deepspeed") + + # Fully Sharded Data Parallel (FSDP) + fabric = Fabric(accelerator="gpu", devices=8, num_nodes=4, strategy="fsdp") + + +**Step 2:** Call :meth:`~lightning.fabric.fabric.Fabric.launch` to initialize the communication between devices and nodes. + +.. code-block:: python + + fabric = Fabric(...) + fabric.launch() + + +**Step 3:** Create the appropriate SLURM job configuration: + +.. 
code-block:: bash + :caption: submit.sh + :emphasize-lines: 4,5,21 + + #!/bin/bash -l + + # SLURM SUBMIT SCRIPT + #SBATCH --nodes=4 # This needs to match Fabric(num_nodes=...) + #SBATCH --ntasks-per-node=8 # This needs to match Fabric(devices=...) + #SBATCH --gres=gpu:8 # Request N GPUs per machine + #SBATCH --mem=0 + #SBATCH --time=0-02:00:00 + + # Activate conda environment + source activate $1 + + # Debugging flags (optional) + export NCCL_DEBUG=INFO + export PYTHONFAULTHANDLER=1 + + # On your cluster you might need this: + # export NCCL_SOCKET_IFNAME=^docker0,lo + + # Run your training script + srun python train.py + + +**Step 4:** Submit the job to SLURM + +.. code-block:: bash + + sbatch submit.sh + + +---- + + +**************** +Interactive Mode +**************** + +You can also let SLURM schedule a machine for you and then log in to the machine to run scripts manually. +This is useful for development and debugging. +If you set the job name to *bash* or *interactive*, and then log in and run scripts, Lightning's SLURM auto-detection will get bypassed and it can launch processes normally: + +.. code-block:: bash + + # make sure to set `--job-name "interactive"` + srun --account --pty bash --job-name "interactive" ... + + # now run scripts normally + python train.py ... + + +---- + + +*************** +Troubleshooting +*************** + +**My program is stuck initializing at startup. What is causing this?** + +You are seeing a message like this in the logs, but nothing happens: + +.. code-block:: + + Initializing distributed: GLOBAL_RANK: 0, MEMBER: 1/4 + + +The most likely reasons and how to fix it: + +- You forgot to run the ``python train.py`` command with ``srun``: + Please have a look at the SLURM template script above, which includes the ``srun`` at the bottom of the script. 
+ +- The number of nodes or the number of devices per node is misconfigured: + Two parameters in the SLURM submission script determine how many processes will run your training, the ``#SBATCH --nodes=X`` setting and ``#SBATCH --ntasks-per-node=Y`` settings. + The numbers there need to match what is configured in Fabric in the code: ``Fabric(num_nodes=X, devices=Y)``. + If you change the numbers, update them in BOTH places. + + +If you are sick of troubleshooting SLURM settings, give :doc:`Lightning cloud <./cloud>` a try! +For other questions, please don't hesitate to join the `Discord `_. diff --git a/docs/source-fabric/guide/trainer_template.rst b/docs/source-fabric/guide/trainer_template.rst new file mode 100644 index 0000000..f13eccf --- /dev/null +++ b/docs/source-fabric/guide/trainer_template.rst @@ -0,0 +1,7 @@ +:orphan: + +################ +Template Trainer +################ + +TODO: Write a guide explaining how to build a template like the one in https://github.com/Lightning-AI/lightning/tree/master/examples/fabric/build_your_own_trainer diff --git a/docs/source-fabric/index.rst b/docs/source-fabric/index.rst new file mode 100644 index 0000000..08d37e8 --- /dev/null +++ b/docs/source-fabric/index.rst @@ -0,0 +1,158 @@ +.. include:: links.rst + +#################### +Welcome to ⚡ Fabric +#################### + +Fabric is the fast and lightweight way to scale PyTorch models without boilerplate code. + +- Easily switch from running on CPU to GPU (Apple Silicon, CUDA, ...), TPU, multi-GPU or even multi-node training +- State-of-the-art distributed training strategies (DDP, FSDP, DeepSpeed) and mixed precision out of the box +- Handles all the boilerplate device logic for you +- Brings useful tools to help you build a trainer (callbacks, logging, checkpoints, ...) +- Designed with multi-billion parameter models in mind + +| + +.. 
code-block:: diff + + import torch + from lightning.pytorch.demos import WikiText2, Transformer + + import lightning as L + + - device = torch.device("cuda" if torch.cuda.is_available() else "cpu") + + fabric = L.Fabric(accelerator="cuda", devices=8, strategy="ddp") + + fabric.launch() + + dataset = WikiText2() + dataloader = torch.utils.data.DataLoader(dataset) + model = Transformer(vocab_size=dataset.vocab_size) + optimizer = torch.optim.SGD(model.parameters(), lr=0.1) + + - model = model.to(device) + + model, optimizer = fabric.setup(model, optimizer) + + dataloader = fabric.setup_dataloaders(dataloader) + + model.train() + for epoch in range(20): + for batch in dataloader: + input, target = batch + - input, target = input.to(device), target.to(device) + optimizer.zero_grad() + output = model(input, target) + loss = torch.nn.functional.nll_loss(output, target.view(-1)) + - loss.backward() + + fabric.backward(loss) + optimizer.step() + + +---- + + +*********** +Why Fabric? +*********** + +| +| + +.. figure:: https://pl-public-data.s3.amazonaws.com/assets_lightning/fabric/PyTorch-to-Fabric-Spectrum-2.svg + :alt: Fabric spans across a large spectrum - from raw PyTorch all the way to high-level PyTorch Lightning + :width: 100% + +| +| + +Fabric differentiates itself from a fully-fledged trainer like Lightning's `Trainer`_ in these key aspects: + +**Fast to implement** +There is no need to restructure your code: Just change a few lines in the PyTorch script and you'll be able to leverage Fabric features. + +**Maximum Flexibility** +Write your own training and/or inference logic down to the individual optimizer calls. +You aren't forced to conform to a standardized epoch-based training loop like the one in Lightning `Trainer`_. +You can do flexible iteration based training, meta-learning, cross-validation and other types of optimization algorithms without digging into framework internals. 
+This also makes it super easy to adopt Fabric in existing PyTorch projects to speed up and scale your models without committing to large refactors. +Just remember: With great power comes great responsibility. + +**Maximum Control** +The Lightning `Trainer`_ has many built-in features to make research simpler with less boilerplate, but debugging it requires some familiarity with the framework internals. +In Fabric, everything is opt-in. Think of it as a toolbox: You take out the tools (Fabric functions) you need and leave the other ones behind. +This makes it easier to develop and debug your PyTorch code as you gradually add more features to it. +Fabric provides important tools to remove undesired boilerplate code (distributed, hardware, checkpoints, logging, ...), but leaves the design and orchestration fully up to you. + + +---- + +************ +Installation +************ + +Fabric ships directly with Lightning. Install it with + +.. code-block:: bash + + pip install lightning + +For alternative ways to install, read the :doc:`installation guide `. + + + +.. raw:: html + +
+ +.. toctree:: + :maxdepth: 1 + :name: start + :caption: Home + + self + Install + + +.. toctree:: + :maxdepth: 1 + :caption: Get started in steps + + Basic skills + Intermediate skills + Advanced skills + + +.. toctree:: + :maxdepth: 1 + :caption: Core API Reference + + Fabric Arguments + Fabric Methods + + +.. toctree:: + :maxdepth: 1 + :caption: Full API Reference + + Accelerators + Collectives + Environments + Fabric + IO + Loggers + Precision + Strategies + + +.. toctree:: + :maxdepth: 1 + :name: more + :caption: More + + Examples + Glossary + How-tos + Style Guide + + +.. raw:: html + +
diff --git a/docs/source-fabric/levels/advanced.rst b/docs/source-fabric/levels/advanced.rst new file mode 100644 index 0000000..b8fb45d --- /dev/null +++ b/docs/source-fabric/levels/advanced.rst @@ -0,0 +1,55 @@ +.. toctree:: + :maxdepth: 1 + :hidden: + + <../advanced/gradient_accumulation> + <../advanced/distributed_communication> + <../advanced/multiple_setup> + <../advanced/model_parallel/fsdp> + + +############### +Advanced skills +############### + +.. raw:: html + +
+
+ +.. displayitem:: + :header: Use efficient gradient accumulation + :description: Learn how to perform efficient gradient accumulation in distributed settings + :button_link: ../advanced/gradient_accumulation.html + :col_css: col-md-4 + :height: 170 + :tag: advanced + +.. displayitem:: + :header: Distribute communication + :description: Learn all about communication primitives for distributed operation. Gather, reduce, broadcast, etc. + :button_link: ../advanced/distributed_communication.html + :col_css: col-md-4 + :height: 170 + :tag: advanced + +.. displayitem:: + :header: Use multiple models and optimizers + :description: See how flexible Fabric is to work with multiple models and optimizers! + :button_link: ../advanced/multiple_setup.html + :col_css: col-md-4 + :height: 170 + :tag: advanced + +.. displayitem:: + :header: Train models with billions of parameters + :description: Train the largest models with FSDP across multiple GPUs and machines + :button_link: ../advanced/model_parallel/fsdp.html + :col_css: col-md-4 + :height: 170 + :tag: advanced + +.. raw:: html + +
+
diff --git a/docs/source-fabric/levels/basic.rst b/docs/source-fabric/levels/basic.rst new file mode 100644 index 0000000..cf53eff --- /dev/null +++ b/docs/source-fabric/levels/basic.rst @@ -0,0 +1,74 @@ +.. toctree:: + :maxdepth: 1 + :hidden: + + <../fundamentals/convert> + <../fundamentals/accelerators> + <../fundamentals/code_structure> + <../fundamentals/launch> + <../fundamentals/notebooks> + <../fundamentals/precision> + + +############ +Basic skills +############ + + +.. raw:: html + +
+
+ +.. displayitem:: + :header: Convert to Fabric in 5 minutes + :description: Learn how to add Fabric to your PyTorch code + :button_link: ../fundamentals/convert.html + :col_css: col-md-4 + :height: 150 + :tag: basic + +.. displayitem:: + :header: Scale your model with Accelerators + :description: Take advantage of your hardware with a switch of a flag + :button_link: ../fundamentals/accelerators.html + :col_css: col-md-4 + :height: 150 + :tag: basic + +.. displayitem:: + :header: Structure your Fabric code + :description: Best practices for setting up your training script with Fabric + :button_link: ../fundamentals/code_structure.html + :col_css: col-md-4 + :height: 150 + :tag: basic + +.. displayitem:: + :header: Launch distributed training + :description: Launch a Python script on multiple devices and machines + :button_link: ../fundamentals/launch.html + :col_css: col-md-4 + :height: 150 + :tag: basic + +.. displayitem:: + :header: Launch Fabric in a notebook + :description: Launch on multiple devices from within a Jupyter notebook + :button_link: ../fundamentals/notebooks.html + :col_css: col-md-4 + :height: 150 + :tag: basic + +.. displayitem:: + :header: Improve performance with Mixed-Precision training + :description: Save memory and speed up training using mixed precision + :button_link: ../fundamentals/precision.html + :col_css: col-md-4 + :height: 150 + :tag: basic + +.. raw:: html + +
+
diff --git a/docs/source-fabric/levels/intermediate.rst b/docs/source-fabric/levels/intermediate.rst new file mode 100644 index 0000000..2d2037a --- /dev/null +++ b/docs/source-fabric/levels/intermediate.rst @@ -0,0 +1,64 @@ +.. toctree:: + :maxdepth: 1 + :hidden: + + <../guide/lightning_module> + <../guide/callbacks> + <../guide/logging> + <../guide/checkpoint> + <../guide/trainer_template> + + +################### +Intermediate skills +################### + +.. raw:: html + +
+
+ +.. displayitem:: + :header: Organize your model code with LightningModule + :description: Organize your code in a LightningModule and use it with Fabric + :button_link: ../guide/lightning_module.html + :col_css: col-md-4 + :height: 180 + :tag: intermediate + +.. displayitem:: + :header: Encapsulate code into Callbacks + :description: Make use of the Callback system in Fabric + :button_link: ../guide/callbacks.html + :col_css: col-md-4 + :height: 180 + :tag: intermediate + +.. displayitem:: + :header: Track and visualize experiments + :description: Learn how Fabric helps you remove boilerplate code for tracking metrics with a logger + :button_link: ../guide/logging.html + :col_css: col-md-4 + :height: 180 + :tag: intermediate + +.. displayitem:: + :header: Save and load model progress + :description: Efficient saving and loading of model weights, training state, hyperparameters and more. + :button_link: ../guide/checkpoint.html + :col_css: col-md-4 + :height: 180 + :tag: intermediate + +.. displayitem:: + :header: Build your own Trainer + :description: Take our Fabric Trainer template and customize it for your needs + :button_link: https://github.com/Lightning-AI/lightning/tree/master/examples/fabric/build_your_own_trainer + :col_css: col-md-4 + :height: 180 + :tag: intermediate + +.. raw:: html + +
+
diff --git a/docs/source-fabric/links.rst b/docs/source-fabric/links.rst new file mode 100644 index 0000000..d8e1d12 --- /dev/null +++ b/docs/source-fabric/links.rst @@ -0,0 +1,3 @@ +.. _PyTorchJob: https://www.kubeflow.org/docs/components/training/pytorch/ +.. _Kubeflow: https://www.kubeflow.org +.. _Trainer: https://lightning.ai/docs/pytorch/stable/common/trainer.html diff --git a/docs/source-fabric/make.bat b/docs/source-fabric/make.bat new file mode 100644 index 0000000..9b56514 --- /dev/null +++ b/docs/source-fabric/make.bat @@ -0,0 +1,35 @@ +@ECHO OFF + +pushd %~dp0 + +REM Command file for Sphinx documentation + +if "%SPHINXBUILD%" == "" ( + set SPHINXBUILD=sphinx-build +) +set SOURCEDIR=. +set BUILDDIR=../build + +if "%1" == "" goto help + +%SPHINXBUILD% >NUL 2>NUL +if errorlevel 9009 ( + echo. + echo.The 'sphinx-build' command was not found. Make sure you have Sphinx + echo.installed, then set the SPHINXBUILD environment variable to point + echo.to the full path of the 'sphinx-build' executable. Alternatively you + echo.may add the Sphinx directory to PATH. + echo. + echo.If you don't have Sphinx installed, grab it from + echo.http://sphinx-doc.org/ + exit /b 1 +) + +%SPHINXBUILD% -M %1 %SOURCEDIR% %BUILDDIR% %SPHINXOPTS% +goto end + +:help +%SPHINXBUILD% -M help %SOURCEDIR% %BUILDDIR% %SPHINXOPTS% + +:end +popd diff --git a/docs/source-pytorch/Makefile b/docs/source-pytorch/Makefile new file mode 100644 index 0000000..68be4c9 --- /dev/null +++ b/docs/source-pytorch/Makefile @@ -0,0 +1,19 @@ +# Minimal makefile for Sphinx documentation +# + +# You can set these variables from the command line. +SPHINXOPTS = +SPHINXBUILD = sphinx-build +SOURCEDIR = . +BUILDDIR = ../build + +# Put it first so that "make" without argument is like "make help". +help: + @$(SPHINXBUILD) -M help "$(SOURCEDIR)" "$(BUILDDIR)" $(SPHINXOPTS) $(O) + +.PHONY: help Makefile + +# Catch-all target: route all unknown targets to Sphinx using the new +# "make mode" option. 
$(O) is meant as a shortcut for $(SPHINXOPTS). +%: Makefile + @$(SPHINXBUILD) -M $@ "$(SOURCEDIR)" "$(BUILDDIR)" $(SPHINXOPTS) $(O) diff --git a/docs/source-pytorch/_static/copybutton.js b/docs/source-pytorch/_static/copybutton.js new file mode 100644 index 0000000..453363c --- /dev/null +++ b/docs/source-pytorch/_static/copybutton.js @@ -0,0 +1,64 @@ +/* Copied from the official Python docs: https://docs.python.org/3/_static/copybutton.js */ +$(document).ready(function() { + /* Add a [>>>] button on the top-right corner of code samples to hide + * the >>> and ... prompts and the output and thus make the code + * copyable. */ + var div = $('.highlight-python .highlight,' + + '.highlight-python3 .highlight,' + + '.highlight-pycon .highlight,' + + '.highlight-default .highlight'); + var pre = div.find('pre'); + + // get the styles from the current theme + pre.parent().parent().css('position', 'relative'); + var hide_text = 'Hide the prompts and output'; + var show_text = 'Show the prompts and output'; + var border_width = pre.css('border-top-width'); + var border_style = pre.css('border-top-style'); + var border_color = pre.css('border-top-color'); + var button_styles = { + 'cursor':'pointer', 'position': 'absolute', 'top': '0', 'right': '0', + 'border-color': border_color, 'border-style': border_style, + 'border-width': border_width, 'color': border_color, 'text-size': '75%', + 'font-family': 'monospace', 'padding-left': '0.2em', 'padding-right': '0.2em', + 'border-radius': '0 3px 0 0' + } + + // create and add the button to all the code blocks that contain >>> + div.each(function(index) { + var jthis = $(this); + if (jthis.find('.gp').length > 0) { + var button = $('>>>'); + button.css(button_styles) + button.attr('title', hide_text); + button.data('hidden', 'false'); + jthis.prepend(button); + } + // tracebacks (.gt) contain bare text elements that need to be + // wrapped in a span to work with .nextUntil() (see later) + 
jthis.find('pre:has(.gt)').contents().filter(function() { + return ((this.nodeType == 3) && (this.data.trim().length > 0)); + }).wrap(''); + }); + + // define the behavior of the button when it's clicked + $('.copybutton').click(function(e){ + e.preventDefault(); + var button = $(this); + if (button.data('hidden') === 'false') { + // hide the code output + button.parent().find('.go, .gp, .gt').hide(); + button.next('pre').find('.gt').nextUntil('.gp, .go').css('visibility', 'hidden'); + button.css('text-decoration', 'line-through'); + button.attr('title', show_text); + button.data('hidden', 'true'); + } else { + // show the code output + button.parent().find('.go, .gp, .gt').show(); + button.next('pre').find('.gt').nextUntil('.gp, .go').css('visibility', 'visible'); + button.css('text-decoration', 'none'); + button.attr('title', hide_text); + button.data('hidden', 'false'); + } + }); +}); diff --git a/docs/_images/profiler.png b/docs/source-pytorch/_static/images/accelerator/ipus/profiler.png similarity index 100% rename from docs/_images/profiler.png rename to docs/source-pytorch/_static/images/accelerator/ipus/profiler.png diff --git a/docs/_images/figure-parity-times.png b/docs/source-pytorch/_static/images/benchmarks/figure-parity-times.png similarity index 100% rename from docs/_images/figure-parity-times.png rename to docs/source-pytorch/_static/images/benchmarks/figure-parity-times.png diff --git a/docs/_static/images/general/PTL101_youtube_thumbnail.jpg b/docs/source-pytorch/_static/images/general/PTL101_youtube_thumbnail.jpg similarity index 100% rename from docs/_static/images/general/PTL101_youtube_thumbnail.jpg rename to docs/source-pytorch/_static/images/general/PTL101_youtube_thumbnail.jpg diff --git a/docs/_static/images/general/fast_2.gif b/docs/source-pytorch/_static/images/general/fast_2.gif similarity index 100% rename from docs/_static/images/general/fast_2.gif rename to docs/source-pytorch/_static/images/general/fast_2.gif diff --git 
a/docs/_static/images/general/pl_overview.gif b/docs/source-pytorch/_static/images/general/pl_overview.gif similarity index 100% rename from docs/_static/images/general/pl_overview.gif rename to docs/source-pytorch/_static/images/general/pl_overview.gif diff --git a/docs/_static/images/general/pl_overview_flat.jpg b/docs/source-pytorch/_static/images/general/pl_overview_flat.jpg similarity index 100% rename from docs/_static/images/general/pl_overview_flat.jpg rename to docs/source-pytorch/_static/images/general/pl_overview_flat.jpg diff --git a/docs/_static/images/general/pl_quick_start_full_compressed.gif b/docs/source-pytorch/_static/images/general/pl_quick_start_full_compressed.gif similarity index 100% rename from docs/_static/images/general/pl_quick_start_full_compressed.gif rename to docs/source-pytorch/_static/images/general/pl_quick_start_full_compressed.gif diff --git a/docs/_static/images/general/tf_loss.jpg b/docs/source-pytorch/_static/images/general/tf_loss.jpg similarity index 100% rename from docs/_static/images/general/tf_loss.jpg rename to docs/source-pytorch/_static/images/general/tf_loss.jpg diff --git a/docs/_static/images/general/tf_tags.jpg b/docs/source-pytorch/_static/images/general/tf_tags.jpg similarity index 100% rename from docs/_static/images/general/tf_tags.jpg rename to docs/source-pytorch/_static/images/general/tf_tags.jpg diff --git a/docs/_static/images/general/tutorial_cover.jpg b/docs/source-pytorch/_static/images/general/tutorial_cover.jpg similarity index 100% rename from docs/_static/images/general/tutorial_cover.jpg rename to docs/source-pytorch/_static/images/general/tutorial_cover.jpg diff --git a/docs/_static/images/icon.svg b/docs/source-pytorch/_static/images/icon.svg similarity index 100% rename from docs/_static/images/icon.svg rename to docs/source-pytorch/_static/images/icon.svg diff --git a/docs/_static/images/lightning_lite/lite.gif b/docs/source-pytorch/_static/images/lightning_lite/lite.gif similarity index 100% 
rename from docs/_static/images/lightning_lite/lite.gif rename to docs/source-pytorch/_static/images/lightning_lite/lite.gif diff --git a/docs/_static/images/lightning_module/pt_to_pl.png b/docs/source-pytorch/_static/images/lightning_module/pt_to_pl.png similarity index 100% rename from docs/_static/images/lightning_module/pt_to_pl.png rename to docs/source-pytorch/_static/images/lightning_module/pt_to_pl.png diff --git a/docs/_static/images/lightning_module/pt_trainer.png b/docs/source-pytorch/_static/images/lightning_module/pt_trainer.png similarity index 100% rename from docs/_static/images/lightning_module/pt_trainer.png rename to docs/source-pytorch/_static/images/lightning_module/pt_trainer.png diff --git a/docs/_static/images/logo.png b/docs/source-pytorch/_static/images/logo.png similarity index 100% rename from docs/_static/images/logo.png rename to docs/source-pytorch/_static/images/logo.png diff --git a/docs/_static/images/logo.svg b/docs/source-pytorch/_static/images/logo.svg similarity index 100% rename from docs/_static/images/logo.svg rename to docs/source-pytorch/_static/images/logo.svg diff --git a/docs/_static/images/logo_light.svg b/docs/source-pytorch/_static/images/logo_light.svg similarity index 100% rename from docs/_static/images/logo_light.svg rename to docs/source-pytorch/_static/images/logo_light.svg diff --git a/docs/_static/images/mnist_imgs/mnist_cpu_bar.png b/docs/source-pytorch/_static/images/mnist_imgs/mnist_cpu_bar.png similarity index 100% rename from docs/_static/images/mnist_imgs/mnist_cpu_bar.png rename to docs/source-pytorch/_static/images/mnist_imgs/mnist_cpu_bar.png diff --git a/docs/_static/images/mnist_imgs/mnist_gpu.png b/docs/source-pytorch/_static/images/mnist_imgs/mnist_gpu.png similarity index 100% rename from docs/_static/images/mnist_imgs/mnist_gpu.png rename to docs/source-pytorch/_static/images/mnist_imgs/mnist_gpu.png diff --git a/docs/_static/images/mnist_imgs/mnist_tb.png 
b/docs/source-pytorch/_static/images/mnist_imgs/mnist_tb.png similarity index 100% rename from docs/_static/images/mnist_imgs/mnist_tb.png rename to docs/source-pytorch/_static/images/mnist_imgs/mnist_tb.png diff --git a/docs/_static/images/mnist_imgs/pt_to_pl.jpg b/docs/source-pytorch/_static/images/mnist_imgs/pt_to_pl.jpg similarity index 100% rename from docs/_static/images/mnist_imgs/pt_to_pl.jpg rename to docs/source-pytorch/_static/images/mnist_imgs/pt_to_pl.jpg diff --git a/docs/_static/images/mnist_imgs/restart_runtime.png b/docs/source-pytorch/_static/images/mnist_imgs/restart_runtime.png similarity index 100% rename from docs/_static/images/mnist_imgs/restart_runtime.png rename to docs/source-pytorch/_static/images/mnist_imgs/restart_runtime.png diff --git a/docs/_static/images/mnist_imgs/runtime_tpu.png b/docs/source-pytorch/_static/images/mnist_imgs/runtime_tpu.png similarity index 100% rename from docs/_static/images/mnist_imgs/runtime_tpu.png rename to docs/source-pytorch/_static/images/mnist_imgs/runtime_tpu.png diff --git a/docs/_static/images/mnist_imgs/tpu_fast.png b/docs/source-pytorch/_static/images/mnist_imgs/tpu_fast.png similarity index 100% rename from docs/_static/images/mnist_imgs/tpu_fast.png rename to docs/source-pytorch/_static/images/mnist_imgs/tpu_fast.png diff --git a/docs/_static/images/mnist_imgs/tpu_start.png b/docs/source-pytorch/_static/images/mnist_imgs/tpu_start.png similarity index 100% rename from docs/_static/images/mnist_imgs/tpu_start.png rename to docs/source-pytorch/_static/images/mnist_imgs/tpu_start.png diff --git a/docs/_images/lr_finder.png b/docs/source-pytorch/_static/images/trainer/lr_finder.png similarity index 100% rename from docs/_images/lr_finder.png rename to docs/source-pytorch/_static/images/trainer/lr_finder.png diff --git a/docs/source-pytorch/_static/main.css b/docs/source-pytorch/_static/main.css new file mode 100644 index 0000000..82aa8b3 --- /dev/null +++ b/docs/source-pytorch/_static/main.css @@ 
-0,0 +1,3 @@ +col { + width: 50% !important; +} diff --git a/source/_templates/autosummary/module.rst b/docs/source-pytorch/_templates/autosummary/module.rst similarity index 100% rename from source/_templates/autosummary/module.rst rename to docs/source-pytorch/_templates/autosummary/module.rst diff --git a/docs/source-pytorch/_templates/classtemplate.rst b/docs/source-pytorch/_templates/classtemplate.rst new file mode 100644 index 0000000..dc11b74 --- /dev/null +++ b/docs/source-pytorch/_templates/classtemplate.rst @@ -0,0 +1,14 @@ +.. role:: hidden + :class: hidden-section +.. currentmodule:: {{ module }} + + +{{ name | underline }} + +.. autoclass:: {{ name }} + :members: + + +.. + autogenerated from source-pytorch/_templates/classtemplate.rst + note it does not have :inherited-members: diff --git a/source/_templates/layout.html b/docs/source-pytorch/_templates/layout.html similarity index 100% rename from source/_templates/layout.html rename to docs/source-pytorch/_templates/layout.html diff --git a/docs/source-pytorch/_templates/theme_variables.jinja b/docs/source-pytorch/_templates/theme_variables.jinja new file mode 100644 index 0000000..912c188 --- /dev/null +++ b/docs/source-pytorch/_templates/theme_variables.jinja @@ -0,0 +1,20 @@ +{%- set external_urls = { + 'github': 'https://github.com/Lightning-AI/lightning', + 'github_issues': 'https://github.com/Lightning-AI/lightning/issues', + 'contributing': 'https://github.com/Lightning-AI/lightning/blob/master/.github/CONTRIBUTING.md', + 'governance': 'https://lightning.ai/docs/pytorch/latest/community/governance.html', + 'docs': 'https://lightning.ai/docs/pytorch/latest/', + 'twitter': 'https://twitter.com/LightningAI', + 'discuss': 'https://www.pytorchlightning.ai/community', + 'tutorials': 'https://lightning.ai/docs/pytorch/latest/#tutorials', + 'home': 'https://lightning.ai/docs/pytorch/latest/', + 'get_started': 'https://lightning.ai/docs/pytorch/latest/starter/introduction.html', + 'features': 
'https://lightning.ai/docs/pytorch/latest/', + 'blog': 'https://lightning.ai/pages/blog/', + 'resources': 'https://lightning.ai/docs/pytorch/latest/#community-examples', + 'support': 'https://lightning.ai/docs/pytorch/latest/', + 'community': 'https://www.pytorchlightning.ai/community', + 'forums': 'https://lightning.ai/forums/', + 'versions': 'https://lightning.ai/docs/pytorch/latest/past_versions.html' +} +-%} diff --git a/source/accelerators/accelerator_prepare.rst b/docs/source-pytorch/accelerators/accelerator_prepare.rst similarity index 86% rename from source/accelerators/accelerator_prepare.rst rename to docs/source-pytorch/accelerators/accelerator_prepare.rst index 38921f4..4035443 100644 --- a/source/accelerators/accelerator_prepare.rst +++ b/docs/source-pytorch/accelerators/accelerator_prepare.rst @@ -31,10 +31,10 @@ Delete any calls to .cuda() or .to(device). ---- -********************************************** -Init tensors using type_as and register_buffer -********************************************** -When you need to create a new tensor, use ``type_as``. +************************************************ +Init tensors using Tensor.to and register_buffer +************************************************ +When you need to create a new tensor, use ``Tensor.to``. This will make your code scale to any arbitrary number of GPUs or TPUs with Lightning. .. testcode:: @@ -48,9 +48,9 @@ This will make your code scale to any arbitrary number of GPUs or TPUs with Ligh # with lightning def forward(self, x): z = torch.Tensor(2, 3) - z = z.type_as(x) + z = z.to(x) -The :class:`~pytorch_lightning.core.lightning.LightningModule` knows what device it is on. You can access the reference via ``self.device``. +The :class:`~lightning.pytorch.core.module.LightningModule` knows what device it is on. You can access the reference via ``self.device``. Sometimes it is necessary to store tensors as module attributes. 
However, if they are not parameters they will remain on the CPU even if the module gets moved to a new device. To prevent that and remain device agnostic, register the tensor as a buffer in your modules' ``__init__`` method with :meth:`~torch.nn.Module.register_buffer`. @@ -105,19 +105,27 @@ Note if you use any built in metrics or custom metrics that use `TorchMetrics +
+ +.. displayitem:: + :header: Train 1 trillion+ parameter models + :description: + :col_css: col-md-4 + :button_link: ../advanced/model_parallel.html + :height: 150 + :tag: advanced + + +.. raw:: html + +
+ diff --git a/docs/source-pytorch/accelerators/gpu_basic.rst b/docs/source-pytorch/accelerators/gpu_basic.rst new file mode 100644 index 0000000..25b026b --- /dev/null +++ b/docs/source-pytorch/accelerators/gpu_basic.rst @@ -0,0 +1,113 @@ +:orphan: + +.. _gpu_basic: + +GPU training (Basic) +==================== +**Audience:** Users looking to save money and run large models faster using single or multiple + +---- + +What is a GPU? +-------------- +A Graphics Processing Unit (GPU), is a specialized hardware accelerator designed to speed up mathematical computations used in gaming and deep learning. + +---- + +.. _multi_gpu: + +Train on GPUs +------------- + +The Trainer will run on all available GPUs by default. Make sure you're running on a machine with at least one GPU. +There's no need to specify any NVIDIA flags as Lightning will do it for you. + +.. code-block:: python + + # run on as many GPUs as available by default + trainer = Trainer(accelerator="auto", devices="auto", strategy="auto") + # equivalent to + trainer = Trainer() + + # run on one GPU + trainer = Trainer(accelerator="gpu", devices=1) + # run on multiple GPUs + trainer = Trainer(accelerator="gpu", devices=8) + # choose the number of devices automatically + trainer = Trainer(accelerator="gpu", devices="auto") + +.. note:: + Setting ``accelerator="gpu"`` will also automatically choose the "mps" device on Apple sillicon GPUs. + If you want to avoid this, you can set ``accelerator="cuda"`` instead. + +Choosing GPU devices +^^^^^^^^^^^^^^^^^^^^ + +You can select the GPU devices using ranges, a list of indices or a string containing +a comma separated list of GPU ids: + +.. testsetup:: + + k = 1 + +.. 
testcode:: + :skipif: torch.cuda.device_count() < 2 + + # DEFAULT (int) specifies how many GPUs to use per node + Trainer(accelerator="gpu", devices=k) + + # Above is equivalent to + Trainer(accelerator="gpu", devices=list(range(k))) + + # Specify which GPUs to use (don't use when running on cluster) + Trainer(accelerator="gpu", devices=[0, 1]) + + # Equivalent using a string + Trainer(accelerator="gpu", devices="0, 1") + + # To use all available GPUs put -1 or '-1' + # equivalent to `list(range(torch.cuda.device_count())) and `"auto"` + Trainer(accelerator="gpu", devices=-1) + +The table below lists examples of possible input formats and how they are interpreted by Lightning. + ++------------------+-----------+---------------------+---------------------------------+ +| `devices` | Type | Parsed | Meaning | ++==================+===========+=====================+=================================+ +| 3 | int | [0, 1, 2] | first 3 GPUs | ++------------------+-----------+---------------------+---------------------------------+ +| -1 | int | [0, 1, 2, ...] | all available GPUs | ++------------------+-----------+---------------------+---------------------------------+ +| [0] | list | [0] | GPU 0 | ++------------------+-----------+---------------------+---------------------------------+ +| [1, 3] | list | [1, 3] | GPU index 1 and 3 (0-based) | ++------------------+-----------+---------------------+---------------------------------+ +| "3" | str | [0, 1, 2] | first 3 GPUs | ++------------------+-----------+---------------------+---------------------------------+ +| "1, 3" | str | [1, 3] | GPU index 1 and 3 (0-based) | ++------------------+-----------+---------------------+---------------------------------+ +| "-1" | str | [0, 1, 2, ...] 
| all available GPUs | ++------------------+-----------+---------------------+---------------------------------+ + + +Find usable CUDA devices +^^^^^^^^^^^^^^^^^^^^^^^^ + +If you want to run several experiments at the same time on your machine, for example for a hyperparameter sweep, then you can +use the following utility function to pick GPU indices that are "accessible", without having to change your code every time. + +.. code-block:: python + + from lightning.pytorch.accelerators import find_usable_cuda_devices + + # Find two GPUs on the system that are not already occupied + trainer = Trainer(accelerator="cuda", devices=find_usable_cuda_devices(2)) + + from lightning.fabric.accelerators import find_usable_cuda_devices + + # Works with Fabric too + fabric = Fabric(accelerator="cuda", devices=find_usable_cuda_devices(2)) + + +This is especially useful when GPUs are configured to be in "exclusive compute mode", such that only one process at a time is allowed access to the device. +This special mode is often enabled on server GPUs or systems shared among multiple users. diff --git a/source/accelerators/gpu_expert.rst b/docs/source-pytorch/accelerators/gpu_expert.rst similarity index 87% rename from source/accelerators/gpu_expert.rst rename to docs/source-pytorch/accelerators/gpu_expert.rst index a2178a3..9ef4e0e 100644 --- a/source/accelerators/gpu_expert.rst +++ b/docs/source-pytorch/accelerators/gpu_expert.rst @@ -6,16 +6,20 @@ GPU training (Expert) ===================== **Audience:** Experts creating new scaling techniques such as Deepspeed or FSDP +.. warning:: This is an :ref:`experimental ` feature. + ---- Lightning enables experts focused on researching new ways of optimizing distributed training/inference strategies to create new strategies and plug them into Lightning. For example, Lightning worked closely with the Microsoft team to develop a Deepspeed integration and with the Facebook(Meta) team to develop a FSDP integration. + ---- -.. 
include:: ../advanced/strategy_registry.rst +.. include:: ../extensions/strategy.rst + ---- -.. include:: ../extensions/strategy.rst +.. include:: ../advanced/strategy_registry.rst diff --git a/docs/source-pytorch/accelerators/gpu_faq.rst b/docs/source-pytorch/accelerators/gpu_faq.rst new file mode 100644 index 0000000..605cfb3 --- /dev/null +++ b/docs/source-pytorch/accelerators/gpu_faq.rst @@ -0,0 +1,77 @@ +:orphan: + +.. _gpu_faq: + +GPU training (FAQ) +================== + +****************************************************************** +How should I adjust the learning rate when using multiple devices? +****************************************************************** + +When using distributed training make sure to modify your learning rate according to your effective +batch size. + +Let's say you have a batch size of 7 in your dataloader. + +.. testcode:: + + class LitModel(LightningModule): + def train_dataloader(self): + return Dataset(..., batch_size=7) + +Whenever you use multiple devices and/or nodes, your effective batch size will be 7 * devices * num_nodes. + +.. code-block:: python + + # effective batch size = 7 * 8 + Trainer(accelerator="gpu", devices=8, strategy=...) + + # effective batch size = 7 * 8 * 10 + Trainer(accelerator="gpu", devices=8, num_nodes=10, strategy=...) + + +.. note:: Huge batch sizes are actually really bad for convergence. Check out: + `Accurate, Large Minibatch SGD: Training ImageNet in 1 Hour `_ + +---- + + +********************************************************* +How do I use multiple GPUs on Jupyter or Colab notebooks? +********************************************************* + +To use multiple GPUs on notebooks, use the *DDP_NOTEBOOK* mode. + +.. code-block:: python + + Trainer(accelerator="gpu", devices=4, strategy="ddp_notebook") + +If you want to use other strategies, please launch your training via the command-shell. 
+ +---- + +***************************************************** +I'm getting errors related to Pickling. What do I do? +***************************************************** + +Pickle is Python's mechanism for serializing and unserializing data. Some distributed modes require that your code is fully pickle compliant. If you run into an issue with pickling, try the following to figure out the issue. + +.. code-block:: python + + import pickle + + model = YourModel() + pickle.dumps(model) + +For example, the `ddp_spawn` strategy has the pickling requirement. This is a limitation of Python. + +.. code-block:: python + + Trainer(accelerator="gpu", devices=4, strategy="ddp_spawn") + +If you use `ddp`, your code doesn't need to be pickled: + +.. code-block:: python + + Trainer(accelerator="gpu", devices=4, strategy="ddp") diff --git a/docs/source-pytorch/accelerators/gpu_intermediate.rst b/docs/source-pytorch/accelerators/gpu_intermediate.rst new file mode 100644 index 0000000..9baec7b --- /dev/null +++ b/docs/source-pytorch/accelerators/gpu_intermediate.rst @@ -0,0 +1,284 @@ +:orphan: + +.. _gpu_intermediate: + +GPU training (Intermediate) +=========================== +**Audience:** Users looking to train across machines or experiment with different scaling techniques. + +---- + +Distributed Training strategies +------------------------------- +Lightning supports multiple ways of doing distributed training. + +.. video:: ../_static/fetched-s3-assets/Trainer+flags+4-+multi+node+training_3.mp4 + :poster: ../_static/fetched-s3-assets/thumb_multi_gpus.png + :width: 400 + +- DistributedDataParallel (multiple-gpus across many machines) + - Regular (``strategy='ddp'``) + - Spawn (``strategy='ddp_spawn'``) + - Notebook/Fork (``strategy='ddp_notebook'``) + +.. note:: + If you request multiple GPUs or nodes without setting a strategy, DDP will be automatically used. + +For a deeper understanding of what Lightning is doing, feel free to read this +`guide `_. 
+ + +Distributed Data Parallel +^^^^^^^^^^^^^^^^^^^^^^^^^ +:class:`~torch.nn.parallel.DistributedDataParallel` (DDP) works as follows: + +1. Each GPU across each node gets its own process. + +2. Each GPU gets visibility into a subset of the overall dataset. It will only ever see that subset. + +3. Each process inits the model. + +4. Each process performs a full forward and backward pass in parallel. + +5. The gradients are synced and averaged across all processes. + +6. Each process updates its optimizer. + +.. code-block:: python + + # train on 8 GPUs (same machine (ie: node)) + trainer = Trainer(accelerator="gpu", devices=8, strategy="ddp") + + # train on 32 GPUs (4 nodes) + trainer = Trainer(accelerator="gpu", devices=8, strategy="ddp", num_nodes=4) + +This Lightning implementation of DDP calls your script under the hood multiple times with the correct environment +variables: + +.. code-block:: bash + + # example for 3 GPUs DDP + MASTER_ADDR=localhost MASTER_PORT=random() WORLD_SIZE=3 NODE_RANK=0 LOCAL_RANK=0 python my_file.py --accelerator 'gpu' --devices 3 --etc + MASTER_ADDR=localhost MASTER_PORT=random() WORLD_SIZE=3 NODE_RANK=1 LOCAL_RANK=0 python my_file.py --accelerator 'gpu' --devices 3 --etc + MASTER_ADDR=localhost MASTER_PORT=random() WORLD_SIZE=3 NODE_RANK=2 LOCAL_RANK=0 python my_file.py --accelerator 'gpu' --devices 3 --etc + +We use DDP this way because `ddp_spawn` has a few limitations (due to Python and PyTorch): + +1. Since `.spawn()` trains the model in subprocesses, the model on the main process does not get updated. +2. Dataloader(num_workers=N), where N is large, bottlenecks training with DDP... ie: it will be VERY slow or won't work at all. This is a PyTorch limitation. +3. Forces everything to be picklable. + +There are cases in which it is NOT possible to use DDP. Examples are: + +- Jupyter Notebook, Google COLAB, Kaggle, etc. 
+- You have a nested script without a root package + +In these situations you should use `ddp_notebook` or `dp` instead. + +Distributed Data Parallel Spawn +^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +`ddp_spawn` is exactly like `ddp` except that it uses .spawn to start the training processes. + +.. warning:: It is STRONGLY recommended to use `DDP` for speed and performance. + +.. code-block:: python + + mp.spawn(self.ddp_train, nprocs=self.num_processes, args=(model,)) + +If your script does not support being called from the command line (ie: it is nested without a root +project module) you can use the following method: + +.. code-block:: python + + # train on 8 GPUs (same machine (ie: node)) + trainer = Trainer(accelerator="gpu", devices=8, strategy="ddp_spawn") + +We STRONGLY discourage this use because it has limitations (due to Python and PyTorch): + +1. The model you pass in will not update. Please save a checkpoint and restore from there. +2. Set Dataloader(num_workers=0) or it will bottleneck training. + +`ddp` is MUCH faster than `ddp_spawn`. We recommend you + +1. Install a top-level module for your project using setup.py + +.. code-block:: python + + # setup.py + #!/usr/bin/env python + + from setuptools import setup, find_packages + + setup( + name="src", + version="0.0.1", + description="Describe Your Cool Project", + author="", + author_email="", + url="https://github.com/YourSeed", # REPLACE WITH YOUR OWN GITHUB PROJECT LINK + install_requires=["lightning"], + packages=find_packages(), + ) + +2. Setup your project like so: + +.. code-block:: bash + + /project + /src + some_file.py + /or_a_folder + setup.py + +3. Install as a root-level package + +.. code-block:: bash + + cd /project + pip install -e . + +You can then call your scripts anywhere + +.. 
code-block:: bash + + cd /project/src + python some_file.py --accelerator 'gpu' --devices 8 --strategy 'ddp' + + +Distributed Data Parallel in Notebooks +^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + +DDP Notebook/Fork is an alternative to Spawn that can be used in interactive Python and Jupyter notebooks, Google Colab, Kaggle notebooks, and so on: +The Trainer enables it by default when such environments are detected. + +.. code-block:: python + + # train on 8 GPUs in a Jupyter notebook + trainer = Trainer(accelerator="gpu", devices=8) + + # can be set explicitly + trainer = Trainer(accelerator="gpu", devices=8, strategy="ddp_notebook") + + # can also be used in non-interactive environments + trainer = Trainer(accelerator="gpu", devices=8, strategy="ddp_fork") + +Among the native distributed strategies, regular DDP (``strategy="ddp"``) is still recommended as the go-to strategy over Spawn and Fork/Notebook for its speed and stability but it can only be used with scripts. + + +Comparison of DDP variants and tradeoffs +**************************************** + +.. list-table:: DDP variants and their tradeoffs + :widths: 40 20 20 20 + :header-rows: 1 + + * - + - DDP + - DDP Spawn + - DDP Notebook/Fork + * - Works in Jupyter notebooks / IPython environments + - No + - No + - Yes + * - Supports multi-node + - Yes + - Yes + - Yes + * - Supported platforms + - Linux, Mac, Win + - Linux, Mac, Win + - Linux, Mac + * - Requires all objects to be picklable + - No + - Yes + - No + * - Limitations in the main process + - None + - The state of objects is not up-to-date after returning to the main process (`Trainer.fit()` etc). Only the model parameters get transferred over. + - GPU operations such as moving tensors to the GPU or calling ``torch.cuda`` functions before invoking ``Trainer.fit`` is not allowed. 
+ * - Process creation time + - Slow + - Slow + - Fast + + +Distributed and 16-bit precision +^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + +Below are the possible configurations we support. + ++-------+---------+-----+--------+-----------------------------------------------------------------------+ +| 1 GPU | 1+ GPUs | DDP | 16-bit | command | ++=======+=========+=====+========+=======================================================================+ +| Y | | | | `Trainer(accelerator="gpu", devices=1)` | ++-------+---------+-----+--------+-----------------------------------------------------------------------+ +| Y | | | Y | `Trainer(accelerator="gpu", devices=1, precision=16)` | ++-------+---------+-----+--------+-----------------------------------------------------------------------+ +| | Y | Y | | `Trainer(accelerator="gpu", devices=k, strategy='ddp')` | ++-------+---------+-----+--------+-----------------------------------------------------------------------+ +| | Y | Y | Y | `Trainer(accelerator="gpu", devices=k, strategy='ddp', precision=16)` | ++-------+---------+-----+--------+-----------------------------------------------------------------------+ + +DDP can also be used with 1 GPU, but there's no reason to do so other than debugging distributed-related issues. + + +Implement Your Own Distributed (DDP) training +^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +If you need your own way to init PyTorch DDP you can override :meth:`lightning.pytorch.strategies.ddp.DDPStrategy.setup_distributed`. + +If you also need to use your own DDP implementation, override :meth:`lightning.pytorch.strategies.ddp.DDPStrategy.configure_ddp`. + +---------- + +Torch Distributed Elastic +------------------------- +Lightning supports the use of Torch Distributed Elastic to enable fault-tolerant and elastic distributed job scheduling. To use it, specify the 'ddp' backend and the number of GPUs you want to use in the trainer. + +.. 
code-block:: python + + Trainer(accelerator="gpu", devices=8, strategy="ddp") + +To launch a fault-tolerant job, run the following on all nodes. + +.. code-block:: bash + + python -m torch.distributed.run + --nnodes=NUM_NODES + --nproc_per_node=TRAINERS_PER_NODE + --rdzv_id=JOB_ID + --rdzv_backend=c10d + --rdzv_endpoint=HOST_NODE_ADDR + YOUR_LIGHTNING_TRAINING_SCRIPT.py (--arg1 ... train script args...) + +To launch an elastic job, run the following on at least ``MIN_SIZE`` nodes and at most ``MAX_SIZE`` nodes. + +.. code-block:: bash + + python -m torch.distributed.run + --nnodes=MIN_SIZE:MAX_SIZE + --nproc_per_node=TRAINERS_PER_NODE + --rdzv_id=JOB_ID + --rdzv_backend=c10d + --rdzv_endpoint=HOST_NODE_ADDR + YOUR_LIGHTNING_TRAINING_SCRIPT.py (--arg1 ... train script args...) + +See the official `Torch Distributed Elastic documentation `_ for details +on installation and more use cases. + +Optimize multi-machine communication +------------------------------------ + +By default, Lightning will select the ``nccl`` backend over ``gloo`` when running on GPUs. +Find more information about PyTorch's supported backends `here `__. + +Lightning allows explicitly specifying the backend via the `process_group_backend` constructor argument on the relevant Strategy classes. By default, Lightning will select the appropriate process group backend based on the hardware used. + +.. 
code-block:: python + + from lightning.pytorch.strategies import DDPStrategy + + # Explicitly specify the process group backend if you choose to + ddp = DDPStrategy(process_group_backend="nccl") + + # Configure the strategy on the Trainer + trainer = Trainer(strategy=ddp, accelerator="gpu", devices=8) diff --git a/source/accelerators/ipu.rst b/docs/source-pytorch/accelerators/ipu.rst similarity index 100% rename from source/accelerators/ipu.rst rename to docs/source-pytorch/accelerators/ipu.rst diff --git a/source/accelerators/ipu_advanced.rst b/docs/source-pytorch/accelerators/ipu_advanced.rst similarity index 94% rename from source/accelerators/ipu_advanced.rst rename to docs/source-pytorch/accelerators/ipu_advanced.rst index 1dc4e71..98c1de5 100644 --- a/source/accelerators/ipu_advanced.rst +++ b/docs/source-pytorch/accelerators/ipu_advanced.rst @@ -6,6 +6,8 @@ Accelerator: IPU training ========================= **Audience:** Users looking to customize IPU training for massive models. +.. warning:: This is an :ref:`experimental ` feature. + ---- Advanced IPU options @@ -19,8 +21,8 @@ IPUs provide further optimizations to speed up training. By using the ``IPUStrat .. code-block:: python - import pytorch_lightning as pl - from pytorch_lightning.strategies import IPUStrategy + import lightning.pytorch as pl + from lightning_graphcore import IPUStrategy model = MyLightningModule() trainer = pl.Trainer(accelerator="ipu", devices=8, strategy=IPUStrategy(device_iterations=32)) @@ -31,8 +33,8 @@ Note that by default we return the last device iteration loss. You can override .. code-block:: python import poptorch - import pytorch_lightning as pl - from pytorch_lightning.strategies import IPUStrategy + import lightning.pytorch as pl + from lightning_graphcore import IPUStrategy model = MyLightningModule() inference_opts = poptorch.Options() @@ -71,7 +73,7 @@ Below is an example using the block annotation in a LightningModule. .. 
code-block:: python - import pytorch_lightning as pl + import lightning.pytorch as pl import poptorch @@ -104,7 +106,7 @@ You can also use the block context manager within the forward function, or any o .. code-block:: python - import pytorch_lightning as pl + import lightning.pytorch as pl import poptorch @@ -120,7 +122,6 @@ You can also use the block context manager within the forward function, or any o self.softmax = torch.nn.Softmax(dim=1) def forward(self, x): - with poptorch.Block(ipu_id=0): x = self.act(self.layer1(x)) diff --git a/docs/source-pytorch/accelerators/ipu_basic.rst b/docs/source-pytorch/accelerators/ipu_basic.rst new file mode 100644 index 0000000..8381b26 --- /dev/null +++ b/docs/source-pytorch/accelerators/ipu_basic.rst @@ -0,0 +1,72 @@ +:orphan: + +.. _ipu_basic: + +Accelerator: IPU training +========================= +**Audience:** Users looking to save money and run large models faster using single or multiple IPU devices. + +.. warning:: This is an :ref:`experimental ` feature. + +---- + +What is an IPU? +--------------- + +The Graphcore `Intelligence Processing Unit (IPU) `__, built for Artificial Intelligence and Machine Learning, consists of many individual cores, called *tiles*, allowing highly parallel computation. Due to the high bandwidth between tiles, IPUs facilitate machine learning loads where parallelization is essential. + +Because computation is heavily parallelized, IPUs operate in a different way to conventional accelerators such as CPU/GPUs. IPUs do not require large batch sizes for maximum parallelization, can provide optimizations across the compiled graph and rely on model parallelism to fully utilize tiles for larger models. + +IPUs are used to build IPU-PODs, rack-based systems of IPU-Machines for larger workloads. See the `IPU Architecture `__ for more information. + +See the `Graphcore Glossary `__ for the definitions of other IPU-specific terminology. 
+ +---- + +Run on IPU +---------- + +To enable PyTorch Lightning to utilize the IPU accelerator, simply provide ``accelerator="ipu"`` parameter to the Trainer class. + +To use multiple IPUs set the devices to a number that is a power of 2 (i.e: 2, 4, 8, 16, ...) + +.. code-block:: python + + # run on as many IPUs as available by default + trainer = Trainer(accelerator="auto", devices="auto", strategy="auto") + # equivalent to + trainer = Trainer() + + # run on one IPU + trainer = Trainer(accelerator="ipu", devices=1) + # run on multiple IPUs + trainer = Trainer(accelerator="ipu", devices=8) + # choose the number of devices automatically + trainer = Trainer(accelerator="ipu", devices="auto") + +---- + +How to access IPUs +------------------ + +To use IPUs you must have access to a system with IPU devices. To get access see `get started `__. + +You must ensure that the IPU system has enabled the PopART and Poplar packages from the SDK. Instructions are in the Get Started guide for your IPU system, on the Graphcore `documents portal `__. + +---- + +.. _known-limitations: + +Known limitations +----------------- + +Currently there are some known limitations that are being addressed in the near future to make the experience seamless when moving from different devices. + +Please see the `MNIST example `__ which displays most of the limitations and how to overcome them till they are resolved. + +* ``self.log`` is not supported in the ``training_step``, ``validation_step``, ``test_step`` or ``predict_step``. This is due to the step function being traced and sent to the IPU devices. +* Since the step functions are traced, branching logic or any form of primitive values are traced into constants. Be mindful as this could lead to errors in your custom code. +* Clipping gradients is not supported. +* It is not possible to use :class:`torch.utils.data.BatchSampler` in your dataloaders if you are using multiple IPUs. 
+* IPUs handle the data transfer to the device on the host, hence the hooks :meth:`~lightning.pytorch.core.hooks.ModelHooks.transfer_batch_to_device` and + :meth:`~lightning.pytorch.core.hooks.ModelHooks.on_after_batch_transfer` do not apply here and if you have overridden any of them, an exception will be raised. diff --git a/source/accelerators/ipu_intermediate.rst b/docs/source-pytorch/accelerators/ipu_intermediate.rst similarity index 86% rename from source/accelerators/ipu_intermediate.rst rename to docs/source-pytorch/accelerators/ipu_intermediate.rst index 68c866e..251004f 100644 --- a/source/accelerators/ipu_intermediate.rst +++ b/docs/source-pytorch/accelerators/ipu_intermediate.rst @@ -6,6 +6,8 @@ Accelerator: IPU training ========================= **Audience:** IPU users looking to increase performance via mixed precision and analysis tools. +.. warning:: This is an :ref:`experimental ` feature. + ---- Mixed precision & 16 bit precision @@ -20,7 +22,7 @@ set the precision flag. .. code-block:: python - import pytorch_lightning as pl + import lightning.pytorch as pl model = MyLightningModule() trainer = pl.Trainer(accelerator="ipu", devices=8, precision=16) @@ -30,8 +32,8 @@ You can also use pure 16-bit training, where the weights are also in 16-bit prec .. code-block:: python - import pytorch_lightning as pl - from pytorch_lightning.strategies import IPUStrategy + import lightning.pytorch as pl + from lightning_graphcore import IPUStrategy model = MyLightningModule() model = model.half() @@ -53,11 +55,11 @@ Lightning supports dumping all reports to a directory to open using the tool. .. 
code-block:: python - import pytorch_lightning as pl - from pytorch_lightning.strategies import IPUStrategy + import lightning.pytorch as pl + from lightning_graphcore import IPUStrategy model = MyLightningModule() trainer = pl.Trainer(accelerator="ipu", devices=8, strategy=IPUStrategy(autoreport_dir="report_dir/")) trainer.fit(model) -This will dump all reports to ``report_dir/`` which can then be opened using the Graph Analyser Tool, see `Opening Reports `__. +This will dump all reports to ``report_dir/`` which can then be opened using the Graph Analyser Tool, see `Opening Reports `__. diff --git a/docs/source-pytorch/accelerators/mps.rst b/docs/source-pytorch/accelerators/mps.rst new file mode 100644 index 0000000..53e8609 --- /dev/null +++ b/docs/source-pytorch/accelerators/mps.rst @@ -0,0 +1,32 @@ +.. _mps: + +Accelerator: Apple Silicon training +=================================== + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: Prepare your code (Optional) + :description: Prepare your code to run on any hardware + :col_css: col-md-4 + :button_link: accelerator_prepare.html + :height: 150 + :tag: basic + +.. displayitem:: + :header: Basic + :description: Learn the basics of Apple silicon gpu training. + :col_css: col-md-4 + :button_link: mps_basic.html + :height: 150 + :tag: basic + +.. raw:: html + +
+
diff --git a/docs/source-pytorch/accelerators/mps_basic.rst b/docs/source-pytorch/accelerators/mps_basic.rst new file mode 100644 index 0000000..eec8967 --- /dev/null +++ b/docs/source-pytorch/accelerators/mps_basic.rst @@ -0,0 +1,63 @@ +:orphan: + +.. _mps_basic: + +MPS training (basic) +==================== +**Audience:** Users looking to train on their Apple silicon GPUs. + +.. warning:: + + Both the MPS accelerator and the PyTorch backend are still experimental. + As such, not all operations are currently supported. However, with ongoing development from the PyTorch team, an increasingly large number of operations are becoming available. + You can use ``PYTORCH_ENABLE_MPS_FALLBACK=1 python your_script.py`` to fall back to cpu for unsupported operations. + + +---- + +What is Apple silicon? +---------------------- +Apple silicon chips are a unified system on a chip (SoC) developed by Apple based on the ARM design. +Among other things, they feature CPU-cores, GPU-cores, a neural engine and shared memory between all of these features. + +---- + +So it's a CPU? +-------------- +Apple silicon includes CPU-cores among several other features. However, the full potential for the hardware acceleration of which the M-Socs are capable is unavailable when running on the ``CPUAccelerator``. This is because they also feature a GPU and a neural engine. + +To use them, Lightning supports the ``MPSAccelerator``. + +---- + +Run on Apple silicon gpus +------------------------- +Enable the following Trainer arguments to run on Apple silicon gpus (MPS devices). + +.. code-block:: python + + trainer = Trainer(accelerator="mps", devices=1) + +.. note:: + The ``MPSAccelerator`` only supports 1 device at a time. Currently there are no machines with multiple MPS-capable GPUs. + +---- + +What does MPS stand for? +------------------------ +MPS is short for `Metal Performance Shaders `_ which is the technology used in the back for gpu communication and computing. 
+ +---- + +Troubleshooting +--------------- + + +If Lightning can't detect the Apple Silicon hardware, it will raise this exception: + +.. code:: + + MisconfigurationException: `MPSAccelerator` can not run on your system since the accelerator is not available. + +If you are seeing this despite running on an ARM-enabled Mac, the most likely cause is that your Python is being emulated and thinks it is running on an Intel CPU. +To solve this, re-install your python executable (and if using environment managers like conda, you have to reinstall these as well) by downloading the Apple M1/M2 build (not Intel!), for example `here `_. diff --git a/source/accelerators/tpu.rst b/docs/source-pytorch/accelerators/tpu.rst similarity index 97% rename from source/accelerators/tpu.rst rename to docs/source-pytorch/accelerators/tpu.rst index 6809277..f8ca8f5 100644 --- a/source/accelerators/tpu.rst +++ b/docs/source-pytorch/accelerators/tpu.rst @@ -46,7 +46,7 @@ Accelerator: TPU training :header: FAQ :description: Frequently asked questions about TPU training. :col_css: col-md-4 - :button_link: gpu_faq.html + :button_link: tpu_faq.html :height: 150 .. raw:: html diff --git a/docs/source-pytorch/accelerators/tpu_advanced.rst b/docs/source-pytorch/accelerators/tpu_advanced.rst new file mode 100644 index 0000000..e410c6e --- /dev/null +++ b/docs/source-pytorch/accelerators/tpu_advanced.rst @@ -0,0 +1,64 @@ +:orphan: + +TPU training (Advanced) +======================= +**Audience:** Users looking to apply advanced performance techniques to TPU training. + +.. warning:: This is an :ref:`experimental ` feature. + +---- + +Weight Sharing/Tying +-------------------- +Weight Tying/Sharing is a technique wherein the module weights are shared among two or more layers. +This is a common method to reduce memory consumption and is utilized in many State of the Art +architectures today. + +PyTorch XLA requires these weights to be tied/shared after moving the model to the XLA device. 
+To support this requirement, Lightning automatically finds these weights and ties them after +the modules are moved to the XLA device under the hood. It will ensure that the weights among +the modules are shared but not copied independently. + +PyTorch Lightning has an inbuilt check which verifies that the model parameter lengths +match once the model is moved to the device. If the lengths do not match Lightning +throws a warning message. + +Example: + +.. code-block:: python + + from lightning.pytorch.core.module import LightningModule + from torch import nn + from lightning.pytorch.trainer.trainer import Trainer + + + class WeightSharingModule(LightningModule): + def __init__(self): + super().__init__() + self.layer_1 = nn.Linear(32, 10, bias=False) + self.layer_2 = nn.Linear(10, 32, bias=False) + self.layer_3 = nn.Linear(32, 10, bias=False) + # Lightning automatically ties these weights after moving to the XLA device, + # so all you need is to write the following just like on other accelerators. + self.layer_3.weight = self.layer_1.weight + + def forward(self, x): + x = self.layer_1(x) + x = self.layer_2(x) + x = self.layer_3(x) + return x + + + model = WeightSharingModule() + trainer = Trainer(max_epochs=1, accelerator="tpu") + +See `XLA Documentation `_ + +---- + +XLA +--- +XLA is the library that interfaces PyTorch with the TPUs. +For more information check out `XLA `_. + +Guide for `troubleshooting XLA `_ diff --git a/docs/source-pytorch/accelerators/tpu_basic.rst b/docs/source-pytorch/accelerators/tpu_basic.rst new file mode 100644 index 0000000..36cd478 --- /dev/null +++ b/docs/source-pytorch/accelerators/tpu_basic.rst @@ -0,0 +1,114 @@ +:orphan: + +TPU training (Basic) +==================== +**Audience:** Users looking to train on single or multiple TPU cores. + +.. warning:: This is an :ref:`experimental ` feature. + +---- + +.. 
video:: ../_static/fetched-s3-assets/tpu_cores.mp4 + :poster: ../_static/fetched-s3-assets/thumb_tpus.png + :width: 400 + :muted: + +Lightning supports running on TPUs. At this moment, TPUs are available +on Google Cloud (GCP), Google Colab and Kaggle Environments. For more information on TPUs +`watch this video `_. + +---------------- + +What is a TPU? +-------------- +Tensor Processing Unit (TPU) is an AI accelerator application-specific integrated circuit (ASIC) developed by Google specifically for neural networks. + +A TPU has 8 cores where each core is optimized for 128x128 matrix multiplies. In general, a single TPU is about as fast as 5 V100 GPUs! + +A TPU pod hosts many TPUs on it. Currently, TPU v3 Pod has up to 2048 TPU cores and 32 TiB of memory! +You can request a full pod from Google cloud or a "slice" which gives you +some subset of those 2048 cores. + +---- + +Run on TPU cores +---------------- + +To run on different cores, modify the ``devices`` argument. + +.. code-block:: python + + # run on as many TPUs as available by default + trainer = Trainer(accelerator="auto", devices="auto", strategy="auto") + # equivalent to + trainer = Trainer() + + # run on one TPU core + trainer = Trainer(accelerator="tpu", devices=1) + # run on multiple TPU cores + trainer = Trainer(accelerator="tpu", devices=8) + # run on one specific TPU core: the 2nd core (index 1) + trainer = Trainer(accelerator="tpu", devices=[1]) + # choose the number of cores automatically + trainer = Trainer(accelerator="tpu", devices="auto") + +---- + +How to access TPUs +------------------ +To access TPUs, there are three main ways. + +Google Colab +^^^^^^^^^^^^ +Colab is like a jupyter notebook with a free GPU or TPU +hosted on GCP. + +To get a TPU on colab, follow these steps: + +1. Go to `Google Colab `_. + +2. Click "new notebook" (bottom right of pop-up). + +3. Click runtime > change runtime settings. Select Python 3, and hardware accelerator "TPU". 
+ This will give you a TPU with 8 cores. + +4. Next, insert this code into the first cell and execute. + This will install the xla library that interfaces between PyTorch and the TPU. + + .. code-block:: + + !pip install cloud-tpu-client https://storage.googleapis.com/tpu-pytorch/wheels/torch_xla-1.13-cp38-cp38m-linux_x86_64.whl + +5. Once the above is done, install PyTorch Lightning. + + .. code-block:: + + !pip install lightning + +6. Then set up your LightningModule as normal. + +Google Cloud (GCP) +^^^^^^^^^^^^^^^^^^ +You could refer to this `page `_ for getting started with Cloud TPU resources on GCP. + +---- + +Optimize Performance +-------------------- + +The TPU was designed for specific workloads and operations to carry out large volumes of matrix multiplication, +convolution operations and other commonly used ops in applied deep learning. +The specialization makes it a strong choice for NLP tasks, sequential convolutional networks, and under low precision operation. +There are cases in which training on TPUs is slower when compared with GPUs, for possible reasons listed: + +- Too small batch size. +- Explicit evaluation of tensors during training, e.g. ``tensor.item()`` +- Tensor shapes (e.g. model inputs) change often during training. +- Limited resources when using TPU's with PyTorch `Link `_ +- XLA Graph compilation during the initial steps `Reference `_ +- Some tensor ops are not fully supported on TPU, or not supported at all. These operations will be performed on CPU (context switch). + +The official PyTorch XLA `performance guide `_ +has more detailed information on how PyTorch code can be optimized for TPU. In particular, the +`metrics report `_ allows +one to identify operations that lead to context switching. 
diff --git a/docs/source-pytorch/accelerators/tpu_faq.rst b/docs/source-pytorch/accelerators/tpu_faq.rst new file mode 100644 index 0000000..8a26899 --- /dev/null +++ b/docs/source-pytorch/accelerators/tpu_faq.rst @@ -0,0 +1,117 @@ +:orphan: + +.. _tpu_faq: + +TPU training (FAQ) +================== + +***************************** +XLA configuration is missing? +***************************** + +.. code-block:: + + File "/usr/local/lib/python3.8/dist-packages/torch_xla/core/xla_model.py", line 18, in + _DEVICES = xu.LazyProperty(lambda: torch_xla._XLAC._xla_get_devices()) + RuntimeError: tensorflow/compiler/xla/xla_client/computation_client.cc:273 : Missing XLA configuration + Traceback (most recent call last): + ... + File "/home/kaushikbokka/pytorch-lightning/pytorch_lightning/utilities/device_parser.py", line 125, in parse_tpu_cores + raise MisconfigurationException('No TPU devices were found.') + lightning.pytorch.utilities.exceptions.MisconfigurationException: No TPU devices were found. + +This means the system is missing XLA configuration. You would need to set up XRT TPU device configuration. + +For TPUVM architecture, you could set it in your terminal by: + +.. code-block:: bash + + export XRT_TPU_CONFIG="localservice;0;localhost:51011" + +And for the old TPU + 2VM architecture, you could set it by: + +.. code-block:: bash + + export TPU_IP_ADDRESS=10.39.209.42 # You could get the IP Address in the GCP TPUs section + export XRT_TPU_CONFIG="tpu_worker;0;$TPU_IP_ADDRESS:8470" + +---- + +********************************************************** +How to clear up the programs using TPUs in the background? +********************************************************** + +.. code-block:: bash + + pgrep python | xargs -r kill -9 + +Sometimes, there can still be old programs running on the TPUs, which would make the TPUs unavailable to use. You could use the above command in the terminal to kill the running processes. 
+ +---- + +************************************* +How to resolve the replication issue? +************************************* + +.. code-block:: + + File "/usr/local/lib/python3.6/dist-packages/torch_xla/core/xla_model.py", line 200, in set_replication + replication_devices = xla_replication_devices(devices) + File "/usr/local/lib/python3.6/dist-packages/torch_xla/core/xla_model.py", line 187, in xla_replication_devices + .format(len(local_devices), len(kind_devices))) + RuntimeError: Cannot replicate if number of devices (1) is different from 8 + +This error is raised when the XLA device is called outside the spawn process. Internally in the XLA-Strategy for training on multiple tpu cores, we use XLA's `xmp.spawn`. +Don't use ``xm.xla_device()`` while working on Lightning + TPUs! + +---- + +************************************** +Unsupported datatype transfer to TPUs? +************************************** + +.. code-block:: + + File "/usr/local/lib/python3.8/dist-packages/torch_xla/utils/utils.py", line 205, in _for_each_instance_rewrite + v = _for_each_instance_rewrite(result.__dict__[k], select_fn, fn, rwmap) + File "/usr/local/lib/python3.8/dist-packages/torch_xla/utils/utils.py", line 206, in _for_each_instance_rewrite + result.__dict__[k] = v + TypeError: 'mappingproxy' object does not support item assignment + +PyTorch XLA only supports Tensor objects for CPU to TPU data transfer. Might cause issues if the User is trying to send some non-tensor objects through the DataLoader or during saving states. + +---- + +************************************************* +How to setup the debug mode for Training on TPUs? +************************************************* + +.. code-block:: python + + import lightning.pytorch as pl + + my_model = MyLightningModule() + trainer = pl.Trainer(accelerator="tpu", devices=8, strategy="xla_debug") + trainer.fit(my_model) + +Example Metrics report: + +.. 
code-block:: + + Metric: CompileTime + TotalSamples: 202 + Counter: 06m09s401ms746.001us + ValueRate: 778ms572.062us / second + Rate: 0.425201 / second + Percentiles: 1%=001ms32.778us; 5%=001ms61.283us; 10%=001ms79.236us; 20%=001ms110.973us; 50%=001ms228.773us; 80%=001ms339.183us; 90%=001ms434.305us; 95%=002ms921.063us; 99%=21s102ms853.173us + + +A lot of PyTorch operations aren't lowered to XLA, which could lead to significant slowdown of the training process. +These operations are moved to the CPU memory and evaluated, and then the results are transferred back to the XLA device(s). +By using the `xla_debug` Strategy, users could create a metrics report to diagnose issues. + +The report includes things like (`XLA Reference `_): + +* how many times we issue XLA compilations and time spent on issuing. +* how many times we execute and time spent on execution +* how many device data handles we create/destroy etc. diff --git a/docs/source-pytorch/accelerators/tpu_intermediate.rst b/docs/source-pytorch/accelerators/tpu_intermediate.rst new file mode 100644 index 0000000..579d2cc --- /dev/null +++ b/docs/source-pytorch/accelerators/tpu_intermediate.rst @@ -0,0 +1,122 @@ +:orphan: + +TPU training (Intermediate) +=========================== +**Audience:** Users looking to use cloud TPUs. + +.. warning:: This is an :ref:`experimental ` feature. + +---- + +DistributedSamplers +------------------- +Lightning automatically inserts the correct samplers - no need to do this yourself! + +Usually, with TPUs (and DDP), you would need to define a DistributedSampler to move the right +chunk of data to the appropriate TPU. As mentioned, this is not needed in Lightning + +.. note:: Don't add distributedSamplers. Lightning does this automatically + +If for some reason you still need to, this is how to construct the sampler +for TPU use + +.. 
code-block:: python + + import torch_xla.core.xla_model as xm + + + def train_dataloader(self): + dataset = MNIST(os.getcwd(), train=True, download=True, transform=transforms.ToTensor()) + + # required for TPU support + sampler = None + if use_tpu: + sampler = torch.utils.data.distributed.DistributedSampler( + dataset, num_replicas=xm.xrt_world_size(), rank=xm.get_ordinal(), shuffle=True + ) + + loader = DataLoader(dataset, sampler=sampler, batch_size=32) + + return loader + +Configure the number of TPU cores in the trainer. You can only choose 1 or 8. +To use a full TPU pod skip to the TPU pod section. + +.. code-block:: python + + import lightning.pytorch as pl + + my_model = MyLightningModule() + trainer = pl.Trainer(accelerator="tpu", devices=8) + trainer.fit(my_model) + +That's it! Your model will train on all 8 TPU cores. + +---------------- + +TPU VM +------ +Lightning supports training on the new Cloud TPU VMs. +Previously, we needed separate VMs to connect to the TPU machines, but as +Cloud TPU VMs run on the TPU Host machines, it allows direct SSH access +for the users. Hence, this architecture upgrade leads to cheaper and significantly +better performance and usability while working with TPUs. + +The TPUVMs come pre-installed with latest versions of PyTorch and PyTorch XLA. +After connecting to the VM and before running your Lightning code, you would need +to set the `XRT TPU device configuration `__. + +.. code-block:: bash + + export XRT_TPU_CONFIG="localservice;0;localhost:51011" + + # Set the environment variable to visible devices. + # You might need to change the value depending on how many chips you have + export TPU_NUM_DEVICES=4 + + # Allow LIBTPU LOAD by multiple processes + export ALLOW_MULTIPLE_LIBTPU_LOAD=1 + +You can learn more about the Cloud TPU VM architecture `here `_ + +---------------- + +TPU Pod +------- +To train on more than the number of cores in a node, your code actually doesn't change! 
+ +All TPU VMs in a Pod setup are required to access the model code and data. +One easy way to achieve this is to use the following startup script when creating the TPU VM pod. +It will perform the data downloading on all TPU VMs. Note that you need to export the corresponding environment variables following the instruction in Create TPU Node. + +.. code-block:: bash + + gcloud alpha compute tpus tpu-vm create ${TPU_POD_NAME} --zone ${ZONE} --project ${PROJECT_ID} --accelerator-type ${ACCELERATOR_TYPE} --version ${RUNTIME_VERSION} --metadata startup-script=setup.py + +Then you could ssh to any TPU worker, e.g. worker 0, check if data/model downloading is finished and +start the training after generating the ssh-keys to ssh between VM workers on a pod. +All you need to do is submit the following command: + +.. code-block:: bash + + python3 -m torch_xla.distributed.xla_dist --tpu=$TPU_POD_NAME -- python3 train.py --max_epochs=5 --batch_size=32 + +See `this guide `_ +on how to set up the instance groups and VMs needed to run TPU Pods. + +---------------- + +16 bit precision +---------------- +Lightning also supports training in 16-bit precision with TPUs. +By default, TPU training will use 32-bit precision. To enable 16-bit precision, do: + +.. code-block:: python + + import lightning.pytorch as pl + + my_model = MyLightningModule() + trainer = pl.Trainer(accelerator="tpu", precision="16-mixed") + trainer.fit(my_model) + +Under the hood the xla library will use the `bfloat16 type `_. diff --git a/docs/source-pytorch/advanced/finetuning.rst b/docs/source-pytorch/advanced/finetuning.rst new file mode 100644 index 0000000..4809e6e --- /dev/null +++ b/docs/source-pytorch/advanced/finetuning.rst @@ -0,0 +1 @@ +.. include:: transfer_learning.rst diff --git a/docs/source-pytorch/advanced/model_parallel.rst b/docs/source-pytorch/advanced/model_parallel.rst new file mode 100644 index 0000000..3f40241 --- /dev/null +++ b/docs/source-pytorch/advanced/model_parallel.rst @@ -0,0 +1,922 @@ +.. 
_model-parallel: + +################################## +Train 1 trillion+ parameter models +################################## + +When training large models, fitting larger batch sizes, or trying to increase throughput using multi-GPU compute, Lightning provides advanced optimized distributed training strategies to support these cases and offer substantial improvements in memory usage. + +Note that some of the extreme memory saving configurations will affect the speed of training. This Speed/Memory trade-off in most cases can be adjusted. + +Some of these memory-efficient strategies rely on offloading onto other forms of memory, such as CPU RAM or NVMe. This means you can even see memory benefits on a **single GPU**, using a strategy such as :ref:`deepspeed-zero-stage-3-offload`. + +Check out this amazing video explaining model parallelism and how it works behind the scenes: + +.. raw:: html + + + + +********************************************* +Choosing an Advanced Distributed GPU Strategy +********************************************* + +If you would like to stick with PyTorch DDP, see :ref:`ddp-optimizations`. + +Unlike :class:`~torch.nn.parallel.DistributedDataParallel` (DDP) where the maximum trainable model size and batch size do not change with respect to the number of GPUs, memory-optimized strategies can accommodate bigger models and larger batches as more GPUs are used. This means as you scale up the number of GPUs, you can reach the number of model parameters you'd like to train. + +There are many considerations when choosing a strategy as described below. In addition, check out the visualization of various strategy benchmarks using `minGPT `__ `here `__. + +Pre-training vs Fine-tuning +=========================== + +When fine-tuning, we often use a magnitude less data compared to pre-training a model. This is important when choosing a distributed strategy as usually for pre-training, **we are compute-bound**. 
+This means we cannot sacrifice throughput as much as if we were fine-tuning, because in fine-tuning the data requirement is smaller. + +Overall: + +* When **fine-tuning** a model, use advanced memory efficient strategies such as :ref:`fully-sharded-training`, :ref:`deepspeed-zero-stage-3` or :ref:`deepspeed-zero-stage-3-offload`, allowing you to fine-tune larger models if you are limited on compute +* When **pre-training** a model, use simpler optimizations such as :ref:`deepspeed-zero-stage-2`, scaling the number of GPUs to reach larger parameter sizes +* For both fine-tuning and pre-training, use :ref:`deepspeed-activation-checkpointing` as the throughput degradation is not significant + +For example when using 128 GPUs, you can **pre-train** large 10 to 20 Billion parameter models using :ref:`deepspeed-zero-stage-2` without having to take a performance hit with a more advanced optimized multi-GPU strategy. + +But for **fine-tuning** a model, you can reach 10 to 20 Billion parameter models using :ref:`deepspeed-zero-stage-3-offload` on a **single GPU**. This does come with a significant throughput hit, which needs to be weighed accordingly. + +When Shouldn't I use an Optimized Distributed Strategy? +======================================================= + +Sharding techniques help when model sizes are fairly large; roughly 500M+ parameters is where we've seen benefits. However, in the following cases, we recommend sticking to ordinary distributed strategies: + +* When your model is small (ResNet50 of around 80M Parameters), unless you are using unusually large batch sizes or inputs. +* Due to high distributed communication between devices, if running on a slow network/interconnect, the training might be much slower than expected and then it's up to you to determine the tradeoff here. + + +Cutting-edge and third-party Strategies +======================================= + +Cutting-edge Lightning strategies are being developed by third-parties outside of Lightning. 
+ +If you want to try some of the latest and greatest features for model-parallel training, check out the :doc:`Colossal-AI Strategy <../integrations/strategies/colossalai>` integration. + +Another integration is :doc:`Bagua Strategy <../integrations/strategies/bagua>`, a deep learning training acceleration framework for PyTorch, with advanced distributed training algorithms and system optimizations. + +For training on unreliable mixed GPUs across the internet check out the :doc:`Hivemind Strategy <../integrations/strategies/hivemind>` integration. + +---- + + +************************ +Efficient initialization +************************ + +Instantiating a ``nn.Module`` in PyTorch creates all parameters on CPU in float32 precision by default. +To speed up initialization, you can force PyTorch to create the model directly on the target device and with the desired precision without changing your model code. + +.. code-block:: python + + trainer = Trainer(accelerator="cuda", precision="16-true") + + with trainer.init_module(): + # models created here will be on GPU and in float16 + model = MyModel() + + trainer.fit(model) + +This eliminates the waiting time to transfer the model parameters from the CPU to the device. + +When loading a model from a checkpoint, for example when fine-tuning, set ``empty_init=True`` to avoid expensive +and redundant memory initialization: + +.. code-block:: python + + with trainer.init_module(empty_init=True): + # creation of the model is very fast + model = MyModel.load_from_checkpoint("my/checkpoint/path.ckpt") + + trainer.fit(model) + +For strategies that handle large sharded models (FSDP, DeepSpeed), the :meth:`~lightning.pytorch.trainer.trainer.Trainer.init_module` +should not be used; instead, override the :meth:`~lightning.pytorch.core.hooks.ModelHooks.configure_model` hook: + +..
code-block:: python + + class MyModel(LightningModule): + def __init__(self): + super().__init__() + # don't instantiate layers here + # move the creation of layers to `configure_model` + + def configure_model(self): + # create all your layers here + self.layers = nn.Sequential(...) + +This makes it possible to work with models that are larger than the memory of a single device. + + +.. _fully-sharded-training: + +********************** +Fully Sharded Training +********************** + +PyTorch has its own version of `FSDP `_ which is upstreamed from their `fairscale `__ project. +It was introduced in their `v1.11.0 release `_ but it is recommended to use it with PyTorch v1.12 or newer and that's what +Lightning supports. + +.. warning:: This is an :ref:`experimental ` feature. + +Auto Wrapping +============= + +Model layers should be wrapped in FSDP in a nested way to save peak memory and enable communication and computation overlapping. The +simplest way to do it is auto wrapping, which can serve as a drop-in replacement for DDP without changing the rest of the code. You don't +have to ``wrap`` layers manually as in the case of manual wrapping. + +.. note:: + For users of PyTorch < 2.0: While initializing the optimizers inside the ``configure_optimizers`` hook, make sure to use ``self.trainer.model.parameters()``, else + PyTorch will raise an error. This is required because when you use auto-wrap, the model layers are sharded and your + ``lightning_module.parameters()`` will return a generator with no params. + +.. code-block:: python + + model = BoringModel() + trainer = Trainer(accelerator="gpu", devices=4, strategy="fsdp", precision=16) + trainer.fit(model) + + +You can customize the strategy configuration by adjusting the arguments of :class:`~lightning.pytorch.strategies.FSDPStrategy` and passing that to the ``strategy`` argument inside the ``Trainer``. + +..
code-block:: python + + from lightning.pytorch import Trainer + from lightning.pytorch.strategies import FSDPStrategy + + # equivalent to passing `"fsdp_cpu_offload"` + fsdp = FSDPStrategy(cpu_offload=True) + trainer = Trainer(strategy=fsdp, accelerator="gpu", devices=4) + + # configure the wrapping condition + fsdp = FSDPStrategy(auto_wrap_policy={MyTransformerBlock}) + trainer = Trainer(strategy=fsdp, accelerator="gpu", devices=4) + + +Read more `here `__. + + +Manual Wrapping +=============== + +Manual wrapping can be useful to explore complex sharding strategies by applying ``wrap`` selectively to some parts of the model. To activate +parameter sharding with manual wrapping, you can wrap your model using the ``wrap`` function. Internally in Lightning, we enable a context manager around the ``configure_model`` hook to make sure the ``wrap`` parameters are passed correctly. + +When not using Fully Sharded, these ``wrap`` calls are a no-op. This means once the changes have been made, there is no need to remove the changes for other strategies. + +``wrap`` simply wraps the module with a Fully Sharded Parallel class with the correct parameters from the Lightning context manager. + +Here's an example that uses ``wrap`` to create your model: + +.. code-block:: python + + import torch + import torch.nn as nn + import lightning.pytorch as pl + from lightning.pytorch import Trainer + from torch.distributed.fsdp.wrap import wrap + + + class MyModel(pl.LightningModule): + def configure_model(self): + self.linear_layer = nn.Linear(32, 32) + self.block = nn.Sequential(nn.Linear(32, 32), nn.Linear(32, 32)) + + # modules are sharded across processes + # as soon as they are wrapped with `wrap`. + # During the forward/backward passes, weights get synced across processes + # and de-allocated once computation is complete, saving memory.
+ + # Wraps the layer in a Fully Sharded Wrapper automatically + linear_layer = wrap(self.linear_layer) + + for i, layer in enumerate(self.block): + self.block[i] = wrap(layer) + + self.model = nn.Sequential(linear_layer, nn.ReLU(), self.block) + + def configure_optimizers(self): + return torch.optim.AdamW(self.model.parameters()) + + + model = MyModel() + trainer = Trainer(accelerator="gpu", devices=4, strategy="fsdp", precision=16) + trainer.fit(model) + +In this case, Lightning will not re-wrap your model, so you don't need to set ``FSDPStrategy(auto_wrap_policy=...)``. + +Check out `this tutorial `__ to learn more about it. + +---- + + +Activation Checkpointing +======================== + +Activation checkpointing reduces GPU memory usage by avoiding the storage of intermediate activation tensors in +selected layers. The tradeoff is that computation cost for the backpropagation increases, as the dropped activations +need to be recomputed. + +Enable checkpointing on large layers (like Transformers) by providing a policy: + +.. code-block:: python + + from lightning.pytorch.strategies import FSDPStrategy + + fsdp = FSDPStrategy(activation_checkpointing_policy={MyTransformerBlock}) + trainer = pl.Trainer(strategy=fsdp, accelerator="gpu", devices=4) + + +You could also configure activation checkpointing manually inside the ``configure_model`` hook: + +.. code-block:: python + + from torch.distributed.algorithms._checkpoint.checkpoint_wrapper import apply_activation_checkpointing + + + class MyModel(pl.LightningModule): + ... + + def configure_model(self): + # Same code as in the "Manual wrapping" snippet above + ... + apply_activation_checkpointing(self.model) + +In this case, Lightning will not re-configure activation checkpointing, so you don't need to set ``FSDPStrategy(activation_checkpointing=...)``. + + +---- + + +.. 
_deepspeed_advanced: + +********* +DeepSpeed +********* + +`DeepSpeed `__ is a deep learning training optimization library, providing the means to train massive billion parameter models at scale. +Using the DeepSpeed strategy, we were able to **train model sizes of 10 Billion parameters and above**, with a lot of useful information in this `benchmark `_ and the `DeepSpeed docs `__. +DeepSpeed also offers lower level training optimizations, and efficient optimizers such as `1-bit Adam `_. We recommend using DeepSpeed in environments where speed and memory optimizations are important (such as training large billion parameter models). + +.. warning:: This is an :ref:`experimental ` feature. + +Below is a summary of all the configurations of DeepSpeed. + +* :ref:`deepspeed-zero-stage-1` - **Shard optimizer states**, remains at speed parity with DDP whilst providing memory improvement + +* :ref:`deepspeed-zero-stage-2` - **Shard optimizer states and gradients**, remains at speed parity with DDP whilst providing even more memory improvement + +* :ref:`deepspeed-zero-stage-2-offload` - **Offload optimizer states and gradients to CPU**. Increases distributed communication volume and GPU-CPU device transfer, but provides significant memory improvement + +* :ref:`deepspeed-zero-stage-3` - **Shard optimizer states, gradients, parameters and optionally activations**. Increases distributed communication volume, but provides even more memory improvement + +* :ref:`deepspeed-zero-stage-3-offload` - **Offload optimizer states, gradients, parameters and optionally activations to CPU**. Increases distributed communication volume and GPU-CPU device transfer, but even more significant memory improvement. + +* :ref:`deepspeed-activation-checkpointing` - **Free activations after forward pass**. Increases computation, but provides memory improvement for all stages. + +To use DeepSpeed, you first need to install DeepSpeed using the commands below. + +.. 
code-block:: bash + + pip install deepspeed + +If you run into an issue with the install or later in training, ensure that the CUDA version of the PyTorch you've installed matches your locally installed CUDA (you can see which one has been recognized by running ``nvcc --version``). + +.. note:: + + DeepSpeed currently only supports single optimizer, single scheduler within the training loop. + + When saving a checkpoint we rely on DeepSpeed which saves a directory containing the model and various components. + + +.. _deepspeed-zero-stage-1: + +DeepSpeed ZeRO Stage 1 +====================== + +`DeepSpeed ZeRO Stage 1 `_ partitions your optimizer states (Stage 1) across your GPUs to reduce memory. + +It is recommended to skip Stage 1 and use Stage 2, which comes with larger memory improvements and still remains efficient. Stage 1 is useful to pair with certain optimizations such as `Torch ORT `__. + +.. code-block:: python + + from lightning.pytorch import Trainer + + model = MyModel() + trainer = Trainer(accelerator="gpu", devices=4, strategy="deepspeed_stage_1", precision=16) + trainer.fit(model) + + +.. _deepspeed-zero-stage-2: + +DeepSpeed ZeRO Stage 2 +====================== + +`DeepSpeed ZeRO Stage 2 `_ partitions your optimizer states (Stage 1) and your gradients (Stage 2) across your GPUs to reduce memory. In most cases, this is more efficient or at parity with DDP, primarily due to the optimized custom communications written by the DeepSpeed team. +As a result, benefits can also be seen on a single GPU. Do note that the default bucket sizes allocate around ``3.6GB`` of VRAM to use during distributed communications, which can be tweaked when instantiating the strategy described in a few sections below. + +.. code-block:: python + + from lightning.pytorch import Trainer + + model = MyModel() + trainer = Trainer(accelerator="gpu", devices=4, strategy="deepspeed_stage_2", precision=16) + trainer.fit(model) + +.. 
code-block:: bash + + python train.py --strategy deepspeed_stage_2 --precision 16 --accelerator 'gpu' --devices 4 + + +.. _deepspeed-zero-stage-2-offload: + +DeepSpeed ZeRO Stage 2 Offload +------------------------------ + +Below we show an example of running `ZeRO-Offload `_. ZeRO-Offload leverages the host CPU to offload optimizer memory/computation, reducing the overall memory consumption. + +.. code-block:: python + + from lightning.pytorch import Trainer + + model = MyModel() + trainer = Trainer(accelerator="gpu", devices=4, strategy="deepspeed_stage_2_offload", precision=16) + trainer.fit(model) + + +This can also be done via the command line using a PyTorch Lightning script: + +.. code-block:: bash + + python train.py --strategy deepspeed_stage_2_offload --precision 16 --accelerator 'gpu' --devices 4 + + +You can also modify the ZeRO-Offload parameters via the strategy as below. + +.. code-block:: python + + from lightning.pytorch import Trainer + from lightning.pytorch.strategies import DeepSpeedStrategy + + model = MyModel() + trainer = Trainer( + accelerator="gpu", + devices=4, + strategy=DeepSpeedStrategy(offload_optimizer=True, allgather_bucket_size=5e8, reduce_bucket_size=5e8), + precision=16, + ) + trainer.fit(model) + + +.. note:: + We suggest tuning the ``allgather_bucket_size`` parameter and ``reduce_bucket_size`` parameter to find optimum parameters based on your model size. + These control how large a buffer we limit the model to using when reducing gradients/gathering updated parameters. Smaller values will result in less memory, but tradeoff with speed. + + DeepSpeed allocates a reduce buffer size `multiplied by 1.5x `_ so take that into consideration when tweaking the parameters. + + The strategy sets a reasonable default of ``2e8``, which should work for most low VRAM GPUs (less than ``7GB``), allocating roughly ``3.6GB`` of VRAM as buffer. Higher VRAM GPUs should aim for values around ``5e8``. 
+ +For even more speed benefit, DeepSpeed offers an optimized CPU version of Adam called `DeepSpeedCPUAdam `_ to run the offloaded computation, which is faster than the standard PyTorch implementation. + +.. code-block:: python + + import lightning.pytorch as pl + from lightning.pytorch import Trainer + from deepspeed.ops.adam import DeepSpeedCPUAdam + + + class MyModel(pl.LightningModule): + ... + + def configure_optimizers(self): + # DeepSpeedCPUAdam provides 5x to 7x speedup over torch.optim.adam(w) + return DeepSpeedCPUAdam(self.parameters()) + + + model = MyModel() + trainer = Trainer(accelerator="gpu", devices=4, strategy="deepspeed_stage_2_offload", precision=16) + trainer.fit(model) + + +.. _deepspeed-zero-stage-3: + +DeepSpeed ZeRO Stage 3 +====================== + +DeepSpeed ZeRO Stage 3 shards the optimizer states, gradients and the model parameters (also optionally activations). Sharding model parameters and activations comes with an increase in distributed communication, but it allows you to scale your models massively from one GPU to multiple GPUs. +**The DeepSpeed team report the ability to fine-tune models with over 40B parameters on a single GPU and over 2 Trillion parameters on 512 GPUs.** For more information we suggest checking the `DeepSpeed ZeRO-3 Offload documentation `__. + +We've run benchmarks for all these features and given a simple example of how all these features work in Lightning, which you can see at `minGPT `_. + +To reach the highest memory efficiency or model size, you must: + +1. Use the DeepSpeed strategy with the stage 3 parameter +2. Use CPU Offloading to offload weights to CPU, plus have a reasonable amount of CPU RAM to offload onto +3. Use DeepSpeed Activation Checkpointing to shard activations + +Below we describe how to enable all of these to see benefit. **With all these improvements we reached 45 Billion parameters training a GPT model on 8 GPUs with ~1TB of CPU RAM available**.
+ +Also please have a look at our :ref:`deepspeed-zero-stage-3-tips` which contains a lot of helpful information when configuring your own models. + +.. note:: + + When saving a model using DeepSpeed and Stage 3, model states and optimizer states will be saved in separate sharded states (based on the world size). See :ref:`deepspeed-zero-stage-3-single-file` to obtain a single checkpoint file. + +.. code-block:: python + + from lightning.pytorch import Trainer + from deepspeed.ops.adam import FusedAdam + + + class MyModel(pl.LightningModule): + ... + + def configure_optimizers(self): + return FusedAdam(self.parameters()) + + + model = MyModel() + trainer = Trainer(accelerator="gpu", devices=4, strategy="deepspeed_stage_3", precision=16) + trainer.fit(model) + + trainer.test() + trainer.predict() + + +You can also use the Lightning Trainer to run predict or evaluate with DeepSpeed once the model has been trained. + +.. code-block:: python + + from lightning.pytorch import Trainer + + + class MyModel(pl.LightningModule): + ... + + + model = MyModel() + trainer = Trainer(accelerator="gpu", devices=4, strategy="deepspeed_stage_3", precision=16) + trainer.test(ckpt_path="my_saved_deepspeed_checkpoint.ckpt") + + +Shard Model Instantly to Reduce Initialization Time/Memory +---------------------------------------------------------- + +When instantiating really large models, it is sometimes necessary to shard the model layers instantly. + +This is the case if layers may not fit in a single machine's CPU or GPU memory, but would fit once sharded across multiple machines. +We expose a hook in which layers are sharded instantly, on a per-layer basis, as they are initialized, allowing you to instantly shard models. + +This reduces the time taken to initialize very large models, and ensures we do not run out of memory when instantiating larger models. For more information you can refer to the DeepSpeed docs for `Constructing Massive Models `_. + +..
code-block:: python + + import torch.nn as nn + from lightning.pytorch import Trainer + from deepspeed.ops.adam import FusedAdam + + + class MyModel(pl.LightningModule): + ... + + def configure_model(self): + # Created within sharded model context, modules are instantly sharded across processes + # as soon as they are made. + self.block = nn.Sequential(nn.Linear(32, 32), nn.ReLU()) + + def configure_optimizers(self): + return FusedAdam(self.parameters()) + + + model = MyModel() + trainer = Trainer(accelerator="gpu", devices=4, strategy="deepspeed_stage_3", precision=16) + trainer.fit(model) + + trainer.test() + trainer.predict() + + +.. _deepspeed-zero-stage-3-offload: + +DeepSpeed ZeRO Stage 3 Offload +------------------------------ + +DeepSpeed ZeRO Stage 3 Offloads optimizer state, gradients to the host CPU to reduce memory usage as ZeRO Stage 2 does, however additionally allows you to offload the parameters as well for even more memory saving. + +.. note:: + + When saving a model using DeepSpeed and Stage 3, model states and optimizer states will be saved in separate sharded states (based on the world size). See :ref:`deepspeed-zero-stage-3-single-file` to obtain a single checkpoint file. + +.. 
code-block:: python + + from lightning.pytorch import Trainer + from lightning.pytorch.strategies import DeepSpeedStrategy + + # Enable CPU Offloading + model = MyModel() + trainer = Trainer(accelerator="gpu", devices=4, strategy="deepspeed_stage_3_offload", precision=16) + trainer.fit(model) + + # Enable CPU Offloading, and offload parameters to CPU + model = MyModel() + trainer = Trainer( + accelerator="gpu", + devices=4, + strategy=DeepSpeedStrategy( + stage=3, + offload_optimizer=True, + offload_parameters=True, + ), + precision=16, + ) + trainer.fit(model) + + +DeepSpeed Infinity (NVMe Offloading) +------------------------------------ + +Additionally, DeepSpeed supports offloading to NVMe drives for even larger models, utilizing the large memory space found in NVMes. DeepSpeed `reports `__ the ability to fine-tune 1 Trillion+ parameters using NVMe Offloading on one 8 GPU machine. Below shows how to enable this, assuming the NVMe drive is mounted in a directory called ``/local_nvme``. + +.. code-block:: python + + from lightning.pytorch import Trainer + from lightning.pytorch.strategies import DeepSpeedStrategy + + # Enable CPU Offloading + model = MyModel() + trainer = Trainer(accelerator="gpu", devices=4, strategy="deepspeed_stage_3_offload", precision=16) + trainer.fit(model) + + # Enable CPU Offloading, and offload parameters to CPU + model = MyModel() + trainer = Trainer( + accelerator="gpu", + devices=4, + strategy=DeepSpeedStrategy( + stage=3, + offload_optimizer=True, + offload_parameters=True, + remote_device="nvme", + offload_params_device="nvme", + offload_optimizer_device="nvme", + nvme_path="/local_nvme", + ), + precision=16, + ) + trainer.fit(model) + +When offloading to NVMe you may notice that the speed is slow. There are parameters that need to be tuned based on the drives that you are using. Running the `aio_bench_perf_sweep.py `__ script can help you to find optimum parameters. 
See the `issue `__ for more information on how to parse the information. + +.. _deepspeed-activation-checkpointing: + +DeepSpeed Activation Checkpointing +---------------------------------- + +Activation checkpointing frees activations from memory as soon as they are not needed during the forward pass. +They are then re-computed for the backwards pass as needed. + +Activation checkpointing is very useful when you have intermediate layers that produce large activations. + +This saves memory when training larger models, however requires using a checkpoint function to run modules as shown below. + +.. warning:: + + Ensure to not wrap the entire model with activation checkpointing. This is not the intended usage of activation checkpointing, and will lead to failures as seen in `this discussion `__. + +.. code-block:: python + + from lightning.pytorch import Trainer + import deepspeed + + + class MyModel(LightningModule): + ... + + def __init__(self): + super().__init__() + self.block_1 = nn.Sequential(nn.Linear(32, 32), nn.ReLU()) + self.block_2 = torch.nn.Linear(32, 2) + + def forward(self, x): + # Use the DeepSpeed checkpointing function instead of calling the module directly + # checkpointing self.block_1 means the activations are deleted after use, + # and re-calculated during the backward passes + x = deepspeed.checkpointing.checkpoint(self.block_1, x) + return self.block_2(x) + + +.. code-block:: python + + from lightning.pytorch import Trainer + from lightning.pytorch.strategies import DeepSpeedStrategy + import deepspeed + + + class MyModel(pl.LightningModule): + ... 
+ + def configure_model(self): + self.block_1 = nn.Sequential(nn.Linear(32, 32), nn.ReLU()) + self.block_2 = torch.nn.Linear(32, 2) + + def forward(self, x): + # Use the DeepSpeed checkpointing function instead of calling the module directly + x = deepspeed.checkpointing.checkpoint(self.block_1, x) + return self.block_2(x) + + + model = MyModel() + + trainer = Trainer(accelerator="gpu", devices=4, strategy="deepspeed_stage_3_offload", precision=16) + + # Enable CPU Activation Checkpointing + trainer = Trainer( + accelerator="gpu", + devices=4, + strategy=DeepSpeedStrategy( + stage=3, + offload_optimizer=True, # Enable CPU Offloading + cpu_checkpointing=True, # (Optional) offload activations to CPU + ), + precision=16, + ) + trainer.fit(model) + + +.. _deepspeed-zero-stage-3-tips: + +DeepSpeed ZeRO Stage 3 Tips +--------------------------- + +Here is some helpful information when setting up DeepSpeed ZeRO Stage 3 with Lightning. + +* If you're using Adam or AdamW, ensure to use FusedAdam or DeepSpeedCPUAdam (for CPU Offloading) rather than the default torch optimizers as they come with large speed benefits +* Treat your GPU/CPU memory as one large pool. In some cases, you may not want to offload certain things (like activations) to provide even more space to offload model parameters +* When offloading to the CPU, make sure to bump up the batch size as GPU memory will be freed +* We also support sharded checkpointing. By passing ``save_full_weights=False`` to the ``DeepSpeedStrategy``, we'll save shards of the model which allows you to save extremely large models. However to load the model and run test/validation/predict you must use the Trainer object. + +.. _deepspeed-zero-stage-3-single-file: + +Collating Single File Checkpoint for DeepSpeed ZeRO Stage 3 +----------------------------------------------------------- + +After training using ZeRO Stage 3, you'll notice that your checkpoints are a directory of sharded model and optimizer states. 
If you'd like to collate a single file from the checkpoint directory please use the below command, which handles all the Lightning states additionally when collating the file. + +.. code-block:: python + + from lightning.pytorch.utilities.deepspeed import convert_zero_checkpoint_to_fp32_state_dict + + # lightning deepspeed has saved a directory instead of a file + save_path = "lightning_logs/version_0/checkpoints/epoch=0-step=0.ckpt/" + output_path = "lightning_model.pt" + convert_zero_checkpoint_to_fp32_state_dict(save_path, output_path) + + +.. warning:: + + This single file checkpoint does not include the optimizer/lr-scheduler states. This means we cannot restore training via the ``trainer.fit(ckpt_path=)`` call. Ensure to keep the sharded checkpoint directory if this is required. + +Custom DeepSpeed Config +======================= + +In some cases you may want to define your own DeepSpeed Config, to access all parameters defined. We've exposed most of the important parameters, however, there may be debugging parameters to enable. Also, DeepSpeed allows the use of custom DeepSpeed optimizers and schedulers defined within a config file that is supported. + +.. note:: + All strategy default parameters will be ignored when a config object is passed. + All compatible arguments can be seen in the `DeepSpeed docs `_. + +.. 
code-block:: python + + from lightning.pytorch import Trainer + from lightning.pytorch.strategies import DeepSpeedStrategy + + deepspeed_config = { + "zero_allow_untested_optimizer": True, + "optimizer": { + "type": "OneBitAdam", + "params": { + "lr": 3e-5, + "betas": [0.998, 0.999], + "eps": 1e-5, + "weight_decay": 1e-9, + "cuda_aware": True, + }, + }, + "scheduler": { + "type": "WarmupLR", + "params": { + "last_batch_iteration": -1, + "warmup_min_lr": 0, + "warmup_max_lr": 3e-5, + "warmup_num_steps": 100, + }, + }, + "zero_optimization": { + "stage": 2, # Enable Stage 2 ZeRO (Optimizer/Gradient state partitioning) + "offload_optimizer": {"device": "cpu"}, # Enable Offloading optimizer state/calculation to the host CPU + "contiguous_gradients": True, # Reduce gradient fragmentation. + "overlap_comm": True, # Overlap reduce/backward operation of gradients for speed. + "allgather_bucket_size": 2e8, # Number of elements to all gather at once. + "reduce_bucket_size": 2e8, # Number of elements we reduce/allreduce at once. + }, + } + + model = MyModel() + trainer = Trainer(accelerator="gpu", devices=4, strategy=DeepSpeedStrategy(config=deepspeed_config), precision=16) + trainer.fit(model) + + +We support taking the config as a JSON-formatted file: + +.. code-block:: python + + from lightning.pytorch import Trainer + from lightning.pytorch.strategies import DeepSpeedStrategy + + model = MyModel() + trainer = Trainer( + accelerator="gpu", devices=4, strategy=DeepSpeedStrategy(config="/path/to/deepspeed_config.json"), precision=16 + ) + trainer.fit(model) + + +You can also use an environment variable via your PyTorch Lightning script: + +.. code-block:: bash + + PL_DEEPSPEED_CONFIG_PATH=/path/to/deepspeed_config.json python train.py --strategy deepspeed + +---------- + +..
_ddp-optimizations: + +***************** +DDP Optimizations +***************** + + +DDP Static Graph +================ + +`DDP static graph `__ assumes that your model +employs the same set of used/unused parameters in every iteration, so that it can deterministically know the flow of +training and apply special optimizations during runtime. + +.. note:: + DDP static graph support requires PyTorch>=1.11.0 + +.. code-block:: python + + from lightning.pytorch import Trainer + from lightning.pytorch.strategies import DDPStrategy + + trainer = Trainer(devices=4, strategy=DDPStrategy(static_graph=True)) + + +When Using DDP on a Multi-node Cluster, Set NCCL Parameters +=========================================================== + +`NCCL `__ is the NVIDIA Collective Communications Library that is used by PyTorch to handle communication across nodes and GPUs. There are reported benefits in terms of speedups when adjusting NCCL parameters as seen in this `issue `__. In the issue, we see a 30% speed improvement when training the Transformer XLM-RoBERTa and a 15% improvement in training with Detectron2. + +NCCL parameters can be adjusted via environment variables. + +.. note:: + + AWS and GCP already set default values for these on their clusters. This is typically useful for custom cluster setups. + +* `NCCL_NSOCKS_PERTHREAD `__ +* `NCCL_SOCKET_NTHREADS `__ +* `NCCL_MIN_NCHANNELS `__ + +.. code-block:: bash + + export NCCL_NSOCKS_PERTHREAD=4 + export NCCL_SOCKET_NTHREADS=2 + + +Gradients as Bucket View +======================== + +Enabling ``gradient_as_bucket_view=True`` in the ``DDPStrategy`` will make gradient views point to different offsets of the ``allreduce`` communication buckets. See :class:`~torch.nn.parallel.DistributedDataParallel` for more information. + +This can reduce peak memory usage and improve throughput: the saved memory will be equal to the total gradient memory, and it removes the need to copy gradients to the ``allreduce`` communication buckets. + +..
note:: + + When ``gradient_as_bucket_view=True`` you cannot call ``detach_()`` on gradients. If hitting such errors, please fix it by referring to the :meth:`~torch.optim.Optimizer.zero_grad` function in ``torch/optim/optimizer.py`` as a solution (`source `__). + +.. code-block:: python + + from lightning.pytorch import Trainer + from lightning.pytorch.strategies import DDPStrategy + + model = MyModel() + trainer = Trainer(accelerator="gpu", devices=4, strategy=DDPStrategy(gradient_as_bucket_view=True)) + trainer.fit(model) + + +DDP Communication Hooks +======================= + +DDP Communication hooks is an interface to control how gradients are communicated across workers, overriding the standard allreduce in DistributedDataParallel. This allows you to enable performance improving communication hooks when using multiple nodes. + +Enable `FP16 Compress Hook for multi-node throughput improvement `__: + +.. code-block:: python + + from lightning.pytorch import Trainer + from lightning.pytorch.strategies import DDPStrategy + from torch.distributed.algorithms.ddp_comm_hooks import default_hooks as default + + model = MyModel() + trainer = Trainer(accelerator="gpu", devices=4, strategy=DDPStrategy(ddp_comm_hook=default.fp16_compress_hook)) + trainer.fit(model) + +Enable `PowerSGD for multi-node throughput improvement `__: + +.. note:: + + PowerSGD typically requires extra memory of the same size as the model’s gradients to enable error feedback, which can compensate for biased compressed communication and improve accuracy (`source `__). + +.. 
code-block:: python + + from lightning.pytorch import Trainer + from lightning.pytorch.strategies import DDPStrategy + from torch.distributed.algorithms.ddp_comm_hooks import powerSGD_hook as powerSGD + + model = MyModel() + trainer = Trainer( + accelerator="gpu", + devices=4, + strategy=DDPStrategy( + ddp_comm_state=powerSGD.PowerSGDState( + process_group=None, + matrix_approximation_rank=1, + start_powerSGD_iter=5000, + ), + ddp_comm_hook=powerSGD.powerSGD_hook, + ), + ) + trainer.fit(model) + + +Combine hooks for accumulated benefit: + +.. code-block:: python + + from lightning.pytorch import Trainer + from lightning.pytorch.strategies import DDPStrategy + from torch.distributed.algorithms.ddp_comm_hooks import ( + default_hooks as default, + powerSGD_hook as powerSGD, + ) + + model = MyModel() + trainer = Trainer( + accelerator="gpu", + devices=4, + strategy=DDPStrategy( + ddp_comm_state=powerSGD.PowerSGDState( + process_group=None, + matrix_approximation_rank=1, + start_powerSGD_iter=5000, + ), + ddp_comm_hook=powerSGD.powerSGD_hook, + ddp_comm_wrapper=default.fp16_compress_wrapper, + ), + ) + trainer.fit(model) + + +When using Post-localSGD, you must also pass ``model_averaging_period`` to allow for model parameter averaging: + +.. 
code-block:: python + + from lightning.pytorch import Trainer + from lightning.pytorch.strategies import DDPStrategy + from torch.distributed.algorithms.ddp_comm_hooks import post_localSGD_hook as post_localSGD + + model = MyModel() + trainer = Trainer( + accelerator="gpu", + devices=4, + strategy=DDPStrategy( + ddp_comm_state=post_localSGD.PostLocalSGDState( + process_group=None, + subgroup=None, + start_localSGD_iter=8, + ), + ddp_comm_hook=post_localSGD.post_localSGD_hook, + model_averaging_period=4, + ), + ) + trainer.fit(model) diff --git a/docs/source-pytorch/advanced/post_training_quantization.rst b/docs/source-pytorch/advanced/post_training_quantization.rst new file mode 100644 index 0000000..611014e --- /dev/null +++ b/docs/source-pytorch/advanced/post_training_quantization.rst @@ -0,0 +1,185 @@ +:orphan: + +.. _post_training_quantization: + +########################## +Post-training Quantization +########################## + +Most deep learning applications are using 32-bits of floating-point precision for inference. But low precision data types, especially INT8, are attracting more attention due to significant performance margin. One of the essential concerns of adopting low precision is how to easily mitigate the possible accuracy loss and reach predefined accuracy requirements. + +Intel® Neural Compressor, is an open-source Python library that runs on Intel CPUs and GPUs, which could address the aforementioned concern by extending the PyTorch Lightning model with accuracy-driven automatic quantization tuning strategies to help users quickly find out the best-quantized model on Intel hardware. It also supports multiple popular network compression technologies such as sparse, pruning, and knowledge distillation. + +**Audience** : Machine learning engineers optimizing models for a better model inference speed and lower memory usage. + +Visit the Intel® Neural Compressor online document website at: ``_. 
+ +****************** +Model Quantization +****************** + +Model quantization is an efficient model optimization tool that can accelerate the model inference speed and decrease the memory load while still maintaining the model accuracy. + +Intel® Neural Compressor provides a convenient model quantization API to quantize the already-trained Lightning module with Post-training Quantization and Quantization Aware Training. This extension API exhibits the merits of an ease-of-use coding environment and multi-functional quantization options. The user can easily quantize their fine-tuned model by adding a few clauses to their original code. We only introduce post-training quantization in this document. + +There are two post-training quantization types in Intel® Neural Compressor: post-training static quantization and post-training dynamic quantization. Post-training dynamic quantization is a recommended starting point because it provides reduced memory usage and faster computation without additional calibration datasets. This type of quantization statically quantizes only the weights from floating point to integer at conversion time. This optimization provides latencies close to post-training static quantization. But the outputs of ops are still stored in floating point, so the increased speed of dynamic-quantized ops is less than a static-quantized computation. + +Post-training static quantization stores the outputs of ops in INT8. It can tackle the accuracy and latency loss caused by "quant" and "dequant" operations. For Post-training static quantization, the user needs to estimate the min-max range of all FP32 tensors in the model. Unlike constant tensors such as weights and biases, variable tensors such as model input, activations and model output cannot be calibrated unless the model runs a few inference cycles. As a result, the converter requires a calibration dataset to estimate that range. 
This dataset can be a small subset (default 100 samples) of the training or the validation data. + +************ +Installation +************ + +Prerequisites +============= + +Python version: 3.8, 3.9, 3.10 + +Install Intel® Neural Compressor +================================ + +Release binary install: + +.. code-block:: bash + + # Install stable basic version from pip + pip install neural-compressor + # Or install stable full version from pip (including GUI) + pip install neural-compressor-full + +More installation methods can be found in the `Installation Guide `_. + +***** +Usage +***** + +Minor code changes are required for the user to get started with Intel® Neural Compressor quantization API. To construct the quantization process, users can specify the below settings via the Python code: + +1. Calibration Dataloader (Needed for post-training static quantization) +2. Evaluation Dataloader and Metric + +The code changes that are required for Intel® Neural Compressor are highlighted with comments in the line above. + +PyTorch Lightning model +======================= + +Load the pretrained model with PyTorch Lightning: + +.. code-block:: python + + import torch + from lightning.pytorch import LightningModule + from transformers import AutoConfig, AutoModelForSequenceClassification, AutoTokenizer + + + # BERT Model definition + class GLUETransformer(LightningModule): + def __init__(self): + self.config = AutoConfig.from_pretrained(model_name_or_path, num_labels=num_labels) + self.model = AutoModelForSequenceClassification.from_pretrained(model_name_or_path, config=self.config) + + def forward(self, **inputs): + return self.model(**inputs) + + + model = GLUETransformer(model_name_or_path="Intel/bert-base-uncased-mrpc") + +The fine-tuned model from Intel could be downloaded from `Intel Hugging Face repository `_. 
+ +Accuracy-driven quantization config +=================================== + +Intel® Neural Compressor supports accuracy-driven automatic tuning to generate the optimal INT8 model which meets a predefined accuracy goal. The default tolerance of accuracy loss in the accuracy criterion is 0.01, and the maximum trial number of quantization is 600. The user can specifically define their own criteria by: + +.. code-block:: python + + from neural_compressor.config import PostTrainingQuantConfig, TuningCriterion, AccuracyCriterion + + accuracy_criterion = AccuracyCriterion(tolerable_loss=0.01) + tuning_criterion = TuningCriterion(max_trials=600) + conf = PostTrainingQuantConfig( + approach="static", backend="default", tuning_criterion=tuning_criterion, accuracy_criterion=accuracy_criterion + ) + +The "approach" parameter in PostTrainingQuantConfig lets the user choose between post-training static quantization and post-training dynamic quantization by passing "static" or "dynamic". + +Quantize the model +================== + +The model can be quantized by Intel® Neural Compressor with: + +.. code-block:: python + + from neural_compressor.quantization import fit + + q_model = fit(model=model.model, conf=conf, calib_dataloader=val_dataloader(), eval_func=eval_func) + +Users can define the evaluation function "eval_func" by themselves. + +At last, the quantized model can be saved by: + +.. code-block:: python + + q_model.save("./saved_model/") + +***************** +Hands-on Examples +***************** + +Based on the `given example code `_, we show how Intel Neural Compressor conducts model quantization on PyTorch Lightning. We first define the basic config of the quantization process. + +.. 
code-block:: python + + from neural_compressor.quantization import fit as fit + from neural_compressor.config import PostTrainingQuantConfig + + + def eval_func_for_nc(model_n, trainer_n): + setattr(model, "model", model_n) + result = trainer_n.validate(model=model, dataloaders=dm.val_dataloader()) + return result[0]["accuracy"] + + + def eval_func(model): + return eval_func_for_nc(model, trainer) + + + conf = PostTrainingQuantConfig() + q_model = fit(model=model.model, conf=conf, calib_dataloader=dm.val_dataloader(), eval_func=eval_func) + + q_model.save("./saved_model/") + +We define the evaluation function as: + +.. code-block:: python + + def eval_func_for_nc(model_n, trainer_n): + setattr(model, "model", model_n) + result = trainer_n.validate(model=model, dataloaders=dm.val_dataloader()) + return result[0]["accuracy"] + + + def eval_func(model): + return eval_func_for_nc(model, trainer) + +Following is the performance comparison between FP32 model and INT8 model: + + ++-------------+-----------------+------------------+ +| Info Type | Baseline FP32 | Quantized INT8 | ++=============+=================+==================+ +| Accuracy | 0.8603 | 0.8578 | ++-------------+-----------------+------------------+ +| Duration(s) | 5.8973 | 3.5952 | ++-------------+-----------------+------------------+ +| Memory(MB) | 417.73 | 113.28 | ++-------------+-----------------+------------------+ + + +For more model quantization performance, please refer to `our model list `_ + +***************** +Technical Support +***************** + +Welcome to visit Intel® Neural Compressor website at: https://intel.github.io/neural-compressor to find technical support or contribute your code. diff --git a/docs/source-pytorch/advanced/pretrained.rst b/docs/source-pytorch/advanced/pretrained.rst new file mode 100644 index 0000000..4809e6e --- /dev/null +++ b/docs/source-pytorch/advanced/pretrained.rst @@ -0,0 +1 @@ +.. 
include:: transfer_learning.rst diff --git a/docs/source-pytorch/advanced/pruning_quantization.rst b/docs/source-pytorch/advanced/pruning_quantization.rst new file mode 100644 index 0000000..f8b0996 --- /dev/null +++ b/docs/source-pytorch/advanced/pruning_quantization.rst @@ -0,0 +1,54 @@ +.. _pruning_quantization: + +######################## +Pruning and Quantization +######################## + +Pruning and Quantization are techniques to compress model size for deployment, allowing inference speed up and energy saving without significant accuracy losses. + +******* +Pruning +******* + +.. warning:: This is an :ref:`experimental ` feature. + +Pruning is a technique which focuses on eliminating some of the model weights to reduce the model size and decrease inference requirements. + +Pruning has been shown to achieve significant efficiency improvements while minimizing the drop in model performance (prediction quality). Model pruning is recommended for cloud endpoints, deploying models on edge devices, or mobile inference (among others). + +To enable pruning during training in Lightning, simply pass in the :class:`~lightning.pytorch.callbacks.ModelPruning` callback to the Lightning Trainer. PyTorch's native pruning implementation is used under the hood. + +This callback supports multiple pruning functions: pass any `torch.nn.utils.prune `_ function as a string to select which weights to prune (`random_unstructured `_, `RandomStructured `_, etc) or implement your own by subclassing `BasePruningMethod `_. + +.. code-block:: python + + from lightning.pytorch.callbacks import ModelPruning + + # set the amount to be the fraction of parameters to prune + trainer = Trainer(callbacks=[ModelPruning("l1_unstructured", amount=0.5)]) + +You can also perform iterative pruning, apply the `lottery ticket hypothesis `__, and more! + +.. 
code-block:: python + + def compute_amount(epoch): + # the sum of all returned values needs to be smaller than 1 + if epoch == 10: + return 0.5 + + elif epoch == 50: + return 0.25 + + elif 75 < epoch < 99: + return 0.01 + + + # the amount can also be a callable + trainer = Trainer(callbacks=[ModelPruning("l1_unstructured", amount=compute_amount)]) + + + +Post-training Quantization +========================== + +If you want to quantize a fine-tuned model with PTQ, it is recommended to use a third-party API named Intel® Neural Compressor (read more :doc:`here <./post_training_quantization>`), which provides a convenient tool for accelerating the model inference speed on Intel CPUs and GPUs. diff --git a/source/guides/speed.rst b/docs/source-pytorch/advanced/speed.rst similarity index 90% rename from source/guides/speed.rst rename to docs/source-pytorch/advanced/speed.rst index 1020755..1cbbf86 100644 --- a/source/guides/speed.rst +++ b/docs/source-pytorch/advanced/speed.rst @@ -2,7 +2,7 @@ .. testsetup:: * - from pytorch_lightning.callbacks.early_stopping import EarlyStopping + from lightning.pytorch.callbacks.early_stopping import EarlyStopping .. _training-speedup: @@ -27,9 +27,9 @@ GPU Training Lightning supports a variety of plugins to speed up distributed GPU training. Most notably: -* :class:`~pytorch_lightning.strategies.DDPStrategy` -* :class:`~pytorch_lightning.strategies.DDPShardedStrategy` -* :class:`~pytorch_lightning.strategies.DeepSpeedStrategy` +* :class:`~lightning.pytorch.strategies.DDPStrategy` +* :class:`~lightning.pytorch.strategies.FSDPStrategy` +* :class:`~lightning.pytorch.strategies.DeepSpeedStrategy` .. code-block:: python @@ -49,27 +49,14 @@ GPU Training Speedup Tips When training on single or multiple GPU machines, Lightning offers a host of advanced optimizations to improve throughput, memory efficiency, and model scaling. Refer to :doc:`Advanced GPU Optimized Training for more details <../advanced/model_parallel>`. 
-Prefer DDP Over DP -^^^^^^^^^^^^^^^^^^ -:class:`~pytorch_lightning.strategies.dp.DataParallelStrategy` performs three GPU transfers for EVERY batch: - -1. Copy the model to the device. -2. Copy the data to the device. -3. Copy the outputs of each device back to the main device. - -.. image:: https://pl-public-data.s3.amazonaws.com/docs/static/images/distributed_training/dp.gif - :alt: Animation showing DP execution. - :width: 500 - :align: center - | -Whereas :class:`~pytorch_lightning.strategies.ddp.DDPStrategy` only performs two transfer operations, making DDP much faster than DP: +:class:`~lightning.pytorch.strategies.ddp.DDPStrategy` only performs two transfer operations for each step, making it the simplest distributed training strategy: 1. Moving data to the device. 2. Transfer and sync gradients. -.. image:: https://pl-public-data.s3.amazonaws.com/docs/static/images/distributed_training/ddp.gif +.. image:: ../_static/fetched-s3-assets/ddp.gif :alt: Animation showing DDP execution. :width: 500 :align: center @@ -110,7 +97,7 @@ For debugging purposes or for dataloaders that load very small datasets, it is d warnings.filterwarnings("ignore", ".*Consider increasing the value of the `num_workers` argument*") # or to ignore all warnings that could be false positives - from pytorch_lightning.utilities.warnings import PossibleUserWarning + from lightning.pytorch.utilities.warnings import PossibleUserWarning warnings.filterwarnings("ignore", category=PossibleUserWarning) @@ -174,7 +161,7 @@ Early Stopping ************** Usually, long training epochs can lead to either overfitting or no major improvements in your metrics due to no limited convergence. -Here :class:`~pytorch_lightning.callbacks.early_stopping.EarlyStopping` callback can help you stop the training entirely by monitoring a metric of your choice. +Here :class:`~lightning.pytorch.callbacks.early_stopping.EarlyStopping` callback can help you stop the training entirely by monitoring a metric of your choice. 
You can read more about it :ref:`here `. @@ -196,11 +183,9 @@ less memory bandwidth and run match operations much faster on GPUs that support * Your optimization algorithm (training_step) is numerically stable. * You want to be the cool person in the lab :p -.. raw:: html - - +.. video:: ../_static/fetched-s3-assets/Trainer+flags+9+-+precision_1.mp4 + :width: 400 + :poster: ../_static/fetched-s3-assets/thumb_precision.png | @@ -352,8 +337,8 @@ Here is an explanation of what it does: When performing gradient accumulation, there is no need to perform grad synchronization during the accumulation phase. Setting ``sync_grad`` to ``False`` will block this synchronization and improve your training speed. -:class:`~pytorch_lightning.core.optimizer.LightningOptimizer` provides a -:meth:`~pytorch_lightning.core.optimizer.LightningOptimizer.toggle_model` function as a +:class:`~lightning.pytorch.core.optimizer.LightningOptimizer` provides a +:meth:`~lightning.pytorch.core.optimizer.LightningOptimizer.toggle_model` function as a :func:`contextlib.contextmanager` for advanced users. Here is an example of an advanced use case: @@ -422,15 +407,16 @@ Here is an example of an advanced use case: Set Grads to None ***************** -In order to improve performance, you can override :meth:`~pytorch_lightning.core.lightning.LightningModule.optimizer_zero_grad`. +In order to improve performance, you can override :meth:`~lightning.pytorch.core.module.LightningModule.optimizer_zero_grad`. For a more detailed explanation of the pros / cons of this technique, read the documentation for :meth:`~torch.optim.Optimizer.zero_grad` by the PyTorch team. +This is enabled by default on ``torch>=2.0.0``. .. 
testcode:: class Model(LightningModule): - def optimizer_zero_grad(self, epoch, batch_idx, optimizer, optimizer_idx): + def optimizer_zero_grad(self, epoch, batch_idx, optimizer): optimizer.zero_grad(set_to_none=True) diff --git a/source/advanced/strategy_registry.rst b/docs/source-pytorch/advanced/strategy_registry.rst similarity index 78% rename from source/advanced/strategy_registry.rst rename to docs/source-pytorch/advanced/strategy_registry.rst index d92069a..1a66890 100644 --- a/source/advanced/strategy_registry.rst +++ b/docs/source-pytorch/advanced/strategy_registry.rst @@ -1,8 +1,6 @@ Strategy Registry ================= -.. warning:: The Strategy Registry is experimental and subject to change. - Lightning includes a registry that holds information about Training strategies and allows for the registration of new custom strategies. The Strategies are assigned strings that identify them, such as "ddp", "deepspeed_stage_2_offload", and so on. @@ -11,21 +9,21 @@ It also returns the optional description and parameters for initialising the Str .. code-block:: python - # Training with the DDP Strategy with `find_unused_parameters` as False - trainer = Trainer(strategy="ddp_find_unused_parameters_false", accelerator="gpu", devices=4) + # Training with the DDP Strategy + trainer = Trainer(strategy="ddp", accelerator="gpu", devices=4) # Training with DeepSpeed ZeRO Stage 3 and CPU Offload trainer = Trainer(strategy="deepspeed_stage_3_offload", accelerator="gpu", devices=3) # Training with the TPU Spawn Strategy with `debug` as True - trainer = Trainer(strategy="tpu_spawn_debug", accelerator="tpu", devices=8) + trainer = Trainer(strategy="xla_debug", accelerator="tpu", devices=8) Additionally, you can pass your custom registered training strategies to the ``strategy`` argument. .. 
code-block:: python - from pytorch_lightning.strategies import DDPStrategy, StrategyRegistry, CheckpointIO + from lightning.pytorch.strategies import DDPStrategy, StrategyRegistry, CheckpointIO class CustomCheckpointIO(CheckpointIO): diff --git a/docs/source-pytorch/advanced/training_tricks.rst b/docs/source-pytorch/advanced/training_tricks.rst new file mode 100644 index 0000000..a5c3bfc --- /dev/null +++ b/docs/source-pytorch/advanced/training_tricks.rst @@ -0,0 +1,438 @@ +.. testsetup:: * + + from lightning.pytorch.callbacks import StochasticWeightAveraging + +.. _training_tricks: + +############################# +Effective Training Techniques +############################# + +Lightning implements various techniques that can help make training smoother. + +---------- + +******************** +Accumulate Gradients +******************** + +.. include:: ../common/gradient_accumulation.rst + +---------- + +***************** +Gradient Clipping +***************** + +Gradient clipping can be enabled to avoid exploding gradients. By default, this will clip the gradient norm by calling +:func:`torch.nn.utils.clip_grad_norm_` computed over all model parameters together. +If the Trainer's ``gradient_clip_algorithm`` is set to ``'value'`` (``'norm'`` by default), this will use +:func:`torch.nn.utils.clip_grad_value_` for each parameter instead. + +.. note:: + If using mixed precision, the ``gradient_clip_val`` does not need to be changed as the gradients are unscaled + before applying the clipping function. + +.. seealso:: :class:`~lightning.pytorch.trainer.trainer.Trainer` + +.. 
testcode:: + + # DEFAULT (ie: don't clip) + trainer = Trainer(gradient_clip_val=0) + + # clip gradients' global norm to <=0.5 using gradient_clip_algorithm='norm' by default + trainer = Trainer(gradient_clip_val=0.5) + + # clip gradients' maximum magnitude to <=0.5 + trainer = Trainer(gradient_clip_val=0.5, gradient_clip_algorithm="value") + +Read more about :ref:`Configuring Gradient Clipping ` for advanced use-cases. + +---------- + +*************************** +Stochastic Weight Averaging +*************************** + +Stochastic Weight Averaging (SWA) can make your models generalize better at virtually no additional cost. +This can be used with both non-trained and trained models. The SWA procedure smooths the loss landscape thus making +it harder to end up in a local minimum during optimization. + +For a more detailed explanation of SWA and how it works, +read `this post `__ by the PyTorch team. + +.. seealso:: The :class:`~lightning.pytorch.callbacks.StochasticWeightAveraging` callback + +.. testcode:: + + # Enable Stochastic Weight Averaging using the callback + trainer = Trainer(callbacks=[StochasticWeightAveraging(swa_lrs=1e-2)]) + +---------- + +.. _batch_size_finder: + +***************** +Batch Size Finder +***************** + +Auto-scaling of batch size can be enabled to find the largest batch size that fits into +memory. Large batch size often yields a better estimation of the gradients, but may also result in +longer training time. Inspired by https://github.com/BlackHC/toma. + +.. seealso:: :class:`~lightning.pytorch.tuner.tuning.Tuner` + +.. code-block:: python + + from lightning.pytorch.tuner import Tuner + + # Create a tuner for the trainer + trainer = Trainer(...) 
+ tuner = Tuner(trainer) + + # Auto-scale batch size by growing it exponentially (default) + tuner.scale_batch_size(model, mode="power") + + # Auto-scale batch size with binary search + tuner.scale_batch_size(model, mode="binsearch") + + # Fit as normal with new batch size + trainer.fit(model) + + +Currently, this feature supports two modes ``'power'`` scaling and ``'binsearch'`` +scaling. In ``'power'`` scaling, starting from a batch size of 1 keeps doubling +the batch size until an out-of-memory (OOM) error is encountered. Setting the +argument to ``'binsearch'`` will initially also try doubling the batch size until +it encounters an OOM, after which it will do a binary search that will finetune the +batch size. Additionally, it should be noted that the batch size scaler cannot +search for batch sizes larger than the size of the training dataset. + +.. note:: + + This feature expects that a ``batch_size`` field is either located as a model attribute + i.e. ``model.batch_size`` or as a field in your ``hparams`` i.e. ``model.hparams.batch_size``. + Similarly it can work with datamodules too. The field should exist and will be updated by + the results of this algorithm. Additionally, your ``train_dataloader()`` method should depend + on this field for this feature to work i.e. + + .. code-block:: python + + # using LightningModule + class LitModel(LightningModule): + def __init__(self, batch_size): + super().__init__() + self.save_hyperparameters() + # or + self.batch_size = batch_size + + def train_dataloader(self): + return DataLoader(train_dataset, batch_size=self.batch_size | self.hparams.batch_size) + + + model = LitModel(batch_size=32) + trainer = Trainer(...) 
+ tuner = Tuner(trainer) + tuner.scale_batch_size(model) + + + # using LightningDataModule + class LitDataModule(LightningDataModule): + def __init__(self, batch_size): + super().__init__() + self.save_hyperparameters() + # or + self.batch_size = batch_size + + def train_dataloader(self): + return DataLoader(train_dataset, batch_size=self.batch_size | self.hparams.batch_size) + + + model = MyModel() + datamodule = LitDataModule(batch_size=32) + + trainer = Trainer(...) + tuner = Tuner(trainer) + tuner.scale_batch_size(model, datamodule=datamodule) + + Note that the ``train_dataloader`` can be either part of + the ``LightningModule`` or ``LightningDataModule`` + as shown above. If both the ``LightningModule`` + and the ``LightningDataModule`` contain a ``train_dataloader``, + the ``LightningDataModule`` takes precedence. + +The algorithm in short works by: + 1. Dumping the current state of the model and trainer + 2. Iteratively until convergence or maximum number of tries ``max_trials`` (default 25) has been reached: + - Call ``fit()`` method of trainer. This evaluates ``steps_per_trial`` (default 3) number of + optimization steps. Each training step can trigger an OOM error if the tensors + (training batch, weights, gradients, etc.) allocated during the steps have a + too large memory footprint. + - If an OOM error is encountered, decrease batch size else increase it. + How much the batch size is increased/decreased is determined by the chosen + strategy. + 3. The found batch size is saved to either ``model.batch_size`` or ``model.hparams.batch_size`` + 4. Restore the initial state of model and trainer + +.. warning:: Batch size finder is not yet supported for DDP or any of its variations, it is coming soon. + + +Customizing Batch Size Finder +============================= + +.. warning:: This is an :ref:`experimental ` feature. + +1. 
You can also customize the :class:`~lightning.pytorch.callbacks.batch_size_finder.BatchSizeFinder` callback to run + at different epochs. This feature is useful while fine-tuning models since you can't always use the same batch size after + unfreezing the backbone. + +.. code-block:: python + + from lightning.pytorch.callbacks import BatchSizeFinder + + + class FineTuneBatchSizeFinder(BatchSizeFinder): + def __init__(self, milestones, *args, **kwargs): + super().__init__(*args, **kwargs) + self.milestones = milestones + + def on_fit_start(self, *args, **kwargs): + return + + def on_train_epoch_start(self, trainer, pl_module): + if trainer.current_epoch in self.milestones or trainer.current_epoch == 0: + self.scale_batch_size(trainer, pl_module) + + + trainer = Trainer(callbacks=[FineTuneBatchSizeFinder(milestones=(5, 10))]) + trainer.fit(...) + + +2. Run batch size finder for ``validate``/``test``/``predict``. + +.. code-block:: python + + from lightning.pytorch.callbacks import BatchSizeFinder + + + class EvalBatchSizeFinder(BatchSizeFinder): + def __init__(self, *args, **kwargs): + super().__init__(*args, **kwargs) + + def on_fit_start(self, *args, **kwargs): + return + + def on_test_start(self, trainer, pl_module): + self.scale_batch_size(trainer, pl_module) + + + trainer = Trainer(callbacks=[EvalBatchSizeFinder()]) + trainer.test(...) + + +---------- + +.. _learning_rate_finder: + +******************** +Learning Rate Finder +******************** + +For training deep neural networks, selecting a good learning rate is essential +for both better performance and faster convergence. Even optimizers such as +:class:`~torch.optim.Adam` that are self-adjusting the learning rate can benefit from more optimal +choices. + +To reduce the amount of guesswork concerning choosing a good initial learning +rate, a `learning rate finder` can be used. 
As described in `this paper `_ +a learning rate finder does a small run where the learning rate is increased +after each processed batch and the corresponding loss is logged. The result of +this is a ``lr`` vs. ``loss`` plot that can be used as guidance for choosing an optimal +initial learning rate. + +.. warning:: + + For the moment, this feature only works with models having a single optimizer. + + +.. note:: + + With DDP: Since all the processes run in isolation, only process with ``global_rank=0`` will make the decision to stop the + learning rate finder and broadcast its results to all other ranks. That means, at the end of LR finder, each process will be running with + the learning rate found on ``global_rank=0``. + + +Using Lightning's built-in LR finder +==================================== + +To enable the learning rate finder, your :doc:`lightning module <../common/lightning_module>` needs to +have a ``learning_rate`` or ``lr`` attribute (or as a field in your ``hparams`` i.e. +``hparams.learning_rate`` or ``hparams.lr``). Then, create the :class:`~lightning.pytorch.tuner.tuning.Tuner` via ``tuner = Tuner(trainer)`` +and call ``tuner.lr_find(model)`` to run the LR finder. +The suggested ``learning_rate`` will be written to the console and will be automatically +set to your :doc:`lightning module <../common/lightning_module>`, which can be accessed +via ``self.learning_rate`` or ``self.lr``. + +.. code-block:: python + + from lightning.pytorch.tuner import Tuner + + + class LitModel(LightningModule): + def __init__(self, learning_rate): + super().__init__() + self.learning_rate = learning_rate + self.model = Model(...) + + def configure_optimizers(self): + return Adam(self.parameters(), lr=(self.lr or self.learning_rate)) + + + model = LitModel() + trainer = Trainer(...) 
+ + # Create a Tuner + tuner = Tuner(trainer) + + # finds learning rate automatically + # sets hparams.lr or hparams.learning_rate to that learning rate + tuner.lr_find(model) + + +If your model uses an arbitrary attribute name instead of ``self.lr`` or ``self.learning_rate``, pass that name to ``lr_find``: + +.. code-block:: python + + model = LitModel() + trainer = Trainer(...) + tuner = Tuner(trainer) + + # to set to your own hparams.my_value + tuner.lr_find(model, attr_name="my_value") + + +You can also inspect the results of the learning rate finder or just play around +with the parameters of the algorithm. A typical example of this would look like: + +.. code-block:: python + + model = MyModelClass(hparams) + trainer = Trainer() + tuner = Tuner(trainer) + + # Run learning rate finder + lr_finder = tuner.lr_find(model) + + # Results can be found in + print(lr_finder.results) + + # Plot with + fig = lr_finder.plot(suggest=True) + fig.show() + + # Pick point based on plot, or get suggestion + new_lr = lr_finder.suggestion() + + # update hparams of the model + model.hparams.lr = new_lr + + # Fit model + trainer.fit(model) + +The figure produced by ``lr_finder.plot()`` should look something like the figure +below. It is recommended to not pick the learning rate that achieves the lowest +loss, but instead something in the middle of the sharpest downward slope (red point). +This is the point returned by ``lr_finder.suggestion()``. + + +Customizing Learning Rate Finder +================================ + +.. warning:: This is an :ref:`experimental ` feature. + +You can also customize the :class:`~lightning.pytorch.callbacks.lr_finder.LearningRateFinder` callback to run at different epochs. This feature is useful while fine-tuning models. + +.. 
code-block:: python + + from lightning.pytorch.callbacks import LearningRateFinder + + + class FineTuneLearningRateFinder(LearningRateFinder): + def __init__(self, milestones, *args, **kwargs): + super().__init__(*args, **kwargs) + self.milestones = milestones + + def on_fit_start(self, *args, **kwargs): + return + + def on_train_epoch_start(self, trainer, pl_module): + if trainer.current_epoch in self.milestones or trainer.current_epoch == 0: + self.lr_find(trainer, pl_module) + + + trainer = Trainer(callbacks=[FineTuneLearningRateFinder(milestones=(5, 10))]) + trainer.fit(...) + + +.. figure:: ../_static/images/trainer/lr_finder.png + +---------- + +************************** +Advanced GPU Optimizations +************************** + +When training on single or multiple GPU machines, Lightning offers a host of advanced optimizations to improve throughput, memory efficiency, and model scaling. +Refer to :doc:`Advanced GPU Optimized Training <../advanced/model_parallel>` for more details. + +---------- + + +.. _ddp_spawn_shared_memory: + +****************************************** +Sharing Datasets Across Process Boundaries +****************************************** + +The :class:`~lightning.pytorch.core.datamodule.LightningDataModule` class provides an organized way to decouple data loading from training logic, with :meth:`~lightning.pytorch.core.hooks.DataHooks.prepare_data` being used for downloading and pre-processing the dataset on a single process, and :meth:`~lightning.pytorch.core.hooks.DataHooks.setup` loading the pre-processed data for each process individually: + +.. 
code-block:: python + + class MNISTDataModule(pl.LightningDataModule): + def prepare_data(self): + MNIST(self.data_dir, download=True) + + def setup(self, stage: str): + self.mnist = MNIST(self.data_dir) + + def train_loader(self): + return DataLoader(self.mnist, batch_size=128) + +However, for in-memory datasets, that means that each process will hold a (redundant) replica of the dataset in memory, which may be impractical when using many processes while utilizing datasets that nearly fit into CPU memory, as the memory consumption will scale up linearly with the number of processes. +For example, when training Graph Neural Networks, a common strategy is to load the entire graph into CPU memory for fast access to the entire graph structure and its features, and to then perform neighbor sampling to obtain mini-batches that fit onto the GPU. + +A simple way to prevent redundant dataset replicas is to rely on :obj:`torch.multiprocessing` to share the `data automatically between spawned processes via shared memory `_. +For this, all data pre-loading should be done on the main process inside :meth:`DataModule.__init__`. As a result, all tensor-data will get automatically shared when using the ``'ddp_spawn'`` strategy. + +.. warning:: + + :obj:`torch.multiprocessing` will send a handle of each individual tensor to other processes. + In order to prevent any errors due to too many open file handles, try to reduce the number of tensors to share, *e.g.*, by stacking your data into a single tensor. + +.. code-block:: python + + class MNISTDataModule(pl.LightningDataModule): + def __init__(self, data_dir: str): + self.mnist = MNIST(data_dir, download=True, transform=T.ToTensor()) + + def train_loader(self): + return DataLoader(self.mnist, batch_size=128) + + + model = Model(...) 
+ datamodule = MNISTDataModule("data/MNIST") + + trainer = Trainer(accelerator="gpu", devices=2, strategy="ddp_spawn") + trainer.fit(model, datamodule) + +See the `graph-level `_ and `node-level `_ prediction examples in PyTorch Geometric for practical use-cases. diff --git a/source/advanced/transfer_learning.rst b/docs/source-pytorch/advanced/transfer_learning.rst similarity index 98% rename from source/advanced/transfer_learning.rst rename to docs/source-pytorch/advanced/transfer_learning.rst index caa739b..102555b 100644 --- a/source/advanced/transfer_learning.rst +++ b/docs/source-pytorch/advanced/transfer_learning.rst @@ -62,7 +62,7 @@ Example: Imagenet (Computer Vision) super().__init__() # init a pretrained resnet - backbone = models.resnet50(pretrained=True) + backbone = models.resnet50(weights="DEFAULT") num_filters = backbone.fc.in_features layers = list(backbone.children())[:-1] self.feature_extractor = nn.Sequential(*layers) @@ -120,7 +120,6 @@ Here's a model that uses `Huggingface transformers `__. + + +---- + +Find performance bottlenecks +============================= + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: Find bottlenecks in your models + :description: Benchmark your own Lightning models + :button_link: ../tuning/profiler.html + :col_css: col-md-3 + :height: 180 + :tag: basic + +.. raw:: html + +
+
diff --git a/docs/source-pytorch/cli/lightning_cli.rst b/docs/source-pytorch/cli/lightning_cli.rst new file mode 100644 index 0000000..e3220a6 --- /dev/null +++ b/docs/source-pytorch/cli/lightning_cli.rst @@ -0,0 +1,121 @@ +:orphan: + +.. _lightning-cli: + +###################################### +Configure hyperparameters from the CLI +###################################### + +************* +Why use a CLI +************* + +When running deep learning experiments, there are a couple of good practices that are recommended to follow: + +- Separate configuration from source code +- Guarantee reproducibility of experiments + +Implementing a command line interface (CLI) makes it possible to execute an experiment from a shell terminal. By having +a CLI, there is a clear separation between the Python source code and what hyperparameters are used for a particular +experiment. If the CLI corresponds to a stable version of the code, reproducing an experiment can be achieved by +installing the same version of the code plus dependencies and running with the same configuration (CLI arguments). + +---- + +********* +Basic use +********* + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: 1: Control it all from the CLI + :description: Learn to control a LightningModule and LightningDataModule from the CLI + :col_css: col-md-4 + :button_link: lightning_cli_intermediate.html + :height: 150 + :tag: intermediate + +.. displayitem:: + :header: 2: Mix models, datasets and optimizers + :description: Support multiple models, datasets, optimizers and learning rate schedulers + :col_css: col-md-4 + :button_link: lightning_cli_intermediate_2.html + :height: 150 + :tag: intermediate + +.. displayitem:: + :header: 3: Control it all via YAML + :description: Enable composable YAMLs + :col_css: col-md-4 + :button_link: lightning_cli_advanced.html + :height: 150 + :tag: advanced + +.. raw:: html + +
+
+ +---- + +************ +Advanced use +************ + +.. raw:: html + +
+
+ +.. displayitem:: + :header: YAML for production + :description: Use the Lightning CLI with YAMLs for production environments + :col_css: col-md-4 + :button_link: lightning_cli_advanced_2.html + :height: 150 + :tag: advanced + +.. displayitem:: + :header: Customize for complex projects + :description: Learn how to implement CLIs for complex projects + :col_css: col-md-4 + :button_link: lightning_cli_advanced_3.html + :height: 150 + :tag: advanced + +.. displayitem:: + :header: Extend the Lightning CLI + :description: Customize the Lightning CLI + :col_css: col-md-4 + :button_link: lightning_cli_expert.html + :height: 150 + :tag: expert + +---- + +************* +Miscellaneous +************* + +.. raw:: html + +
+
+ +.. displayitem:: + :header: FAQ + :description: Frequently asked questions about working with the Lightning CLI and YAML files + :col_css: col-md-6 + :button_link: lightning_cli_faq.html + :height: 150 + +.. raw:: html + +
+
diff --git a/docs/source-pytorch/cli/lightning_cli_advanced.rst b/docs/source-pytorch/cli/lightning_cli_advanced.rst new file mode 100644 index 0000000..e64b961 --- /dev/null +++ b/docs/source-pytorch/cli/lightning_cli_advanced.rst @@ -0,0 +1,259 @@ +:orphan: + +################################################# +Configure hyperparameters from the CLI (Advanced) +################################################# +**Audience:** Users looking to modularize their code for a professional project. + +**Pre-reqs:** You must have read :doc:`(Mix models and datasets) `. + +As a project becomes more complex, the number of configurable options becomes very large, making it inconvenient to +control through individual command line arguments. To address this, CLIs implemented using +:class:`~lightning.pytorch.cli.LightningCLI` always support receiving input from configuration files. The default format +used for config files is YAML. + +.. tip:: + + If you are unfamiliar with YAML, it is recommended that you first read :ref:`what-is-a-yaml-config-file`. + + +---- + +*********************** +Run using a config file +*********************** +To run the CLI using a yaml config, do: + +.. code:: bash + + python main.py fit --config config.yaml + +Individual arguments can be given to override options in the config file: + +.. code:: bash + + python main.py fit --config config.yaml --trainer.max_epochs 100 + +---- + +************************ +Automatic save of config +************************ + +To ease experiment reporting and reproducibility, by default ``LightningCLI`` automatically saves the full YAML +configuration in the log directory. After multiple fit runs with different hyperparameters, each one will have in its +respective log directory a ``config.yaml`` file. These files can be used to trivially reproduce an experiment, e.g.: + +.. 
code:: bash + + python main.py fit --config lightning_logs/version_7/config.yaml + +The automatic saving of the config is done by the special callback :class:`~lightning.pytorch.cli.SaveConfigCallback`. +This callback is automatically added to the ``Trainer``. To disable the save of the config, instantiate ``LightningCLI`` +with ``save_config_callback=None``. + +.. tip:: + + To change the file name of the saved configs to e.g. ``name.yaml``, do: + + .. code:: python + + cli = LightningCLI(..., save_config_kwargs={"config_filename": "name.yaml"}) + +It is also possible to extend the :class:`~lightning.pytorch.cli.SaveConfigCallback` class, for instance to additionally +save the config in a logger. An example of this is: + + .. code:: python + + class LoggerSaveConfigCallback(SaveConfigCallback): + def save_config(self, trainer: Trainer, pl_module: LightningModule, stage: str) -> None: + if isinstance(trainer.logger, Logger): + config = self.parser.dump(self.config, skip_none=False) # Required for proper reproducibility + trainer.logger.log_hyperparams({"config": config}) + + + cli = LightningCLI(..., save_config_callback=LoggerSaveConfigCallback) + +.. tip:: + + If you want to disable the standard behavior of saving the config to the ``log_dir``, then you can either implement + ``__init__`` and call ``super().__init__(*args, save_to_log_dir=False, **kwargs)`` or instantiate the + ``LightningCLI`` as: + + .. code:: python + + cli = LightningCLI(..., save_config_kwargs={"save_to_log_dir": False}) + +.. note:: + + The ``save_config`` method is only called on rank zero. This allows implementing a custom save config without having + to worry about ranks or race conditions. Since it only runs on rank zero, any collective call will make the process + hang waiting for a broadcast. If you need to make collective calls, implement the ``setup`` method instead. 
+ + +---- + +********************************* +Prepare a config file for the CLI +********************************* +The ``--help`` option of the CLIs can be used to learn which configuration options are available and how to use them. +However, writing a config from scratch can be time-consuming and error-prone. To alleviate this, the CLIs have the +``--print_config`` argument, which prints to stdout the configuration without running the command. + +For a CLI implemented as ``LightningCLI(DemoModel, BoringDataModule)``, executing: + +.. code:: bash + + python main.py fit --print_config + +generates a config with all default values like the following: + +.. code:: bash + + seed_everything: null + trainer: + logger: true + ... + model: + out_dim: 10 + learning_rate: 0.02 + data: + data_dir: ./ + ckpt_path: null + +Other command line arguments can be given and considered in the printed configuration. A use case for this is CLIs that +accept multiple models. By default, no model is selected, meaning the printed config will not include model settings. To +get a config with the default values of a particular model would be: + +.. code:: bash + + python main.py fit --model DemoModel --print_config + +which generates a config like: + +.. code:: bash + + seed_everything: null + trainer: + ... + model: + class_path: lightning.pytorch.demos.boring_classes.DemoModel + init_args: + out_dim: 10 + learning_rate: 0.02 + ckpt_path: null + +.. tip:: + + A standard procedure to run experiments can be: + + .. code:: bash + + # Print a configuration to have as reference + python main.py fit --print_config > config.yaml + # Modify the config to your liking - you can remove all default arguments + nano config.yaml + # Fit your model using the edited configuration + python main.py fit --config config.yaml + +Configuration items can be either simple Python objects such as int and str, +or complex objects comprised of a ``class_path`` and ``init_args`` arguments. 
The ``class_path`` refers +to the complete import path of the item class, while ``init_args`` are the arguments to be passed +to the class constructor. For example, your model is defined as: + +.. code:: python + + # model.py + class MyModel(pl.LightningModule): + def __init__(self, criterion: torch.nn.Module): + self.criterion = criterion + +Then the config would be: + +.. code:: yaml + + model: + class_path: model.MyModel + init_args: + criterion: + class_path: torch.nn.CrossEntropyLoss + init_args: + reduction: mean + ... + +``LightningCLI`` uses `jsonargparse `_ under the hood for parsing +configuration files and automatic creation of objects, so you don't need to do it yourself. + +.. note:: + + Lightning automatically registers all subclasses of :class:`~lightning.pytorch.core.module.LightningModule`, + so the complete import path is not required for them and can be replaced by the class name. + +.. note:: + + Parsers make a best effort to determine the correct names and types that the parser should accept. + However, there can be cases not yet supported or cases for which it would be impossible to support. + To somewhat overcome these limitations, there is a special key ``dict_kwargs`` that can be used + to provide arguments that will not be validated during parsing, but will be used for class instantiation. + + For example, when using the ``pytorch_lightning.profilers.PyTorchProfiler`` profiler, + the ``profile_memory`` argument has a type that is determined dynamically. As a result, it's not possible + to know the expected type during parsing. To account for this, your config file should be set up like this: + + .. code:: yaml + + trainer: + profiler: + class_path: pytorch_lightning.profilers.PyTorchProfiler + dict_kwargs: + profile_memory: true + +---- + +******************** +Compose config files +******************** +Multiple config files can be provided, and they will be parsed sequentially. Let's say we have two configs with common +settings: + +.. 
code:: yaml + + # config_1.yaml + trainer: + max_epochs: 10 + ... + + # config_2.yaml + trainer: + max_epochs: 20 + ... + +The value from the last config will be used, ``max_epochs = 20`` in this case: + +.. code-block:: bash + + $ python main.py fit --config config_1.yaml --config config_2.yaml + +---- + +********************* +Use groups of options +********************* +Groups of options can also be given as independent config files. For configs like: + +.. code:: yaml + + # trainer.yaml + max_epochs: 10 + + # model.yaml + out_dim: 7 + + # data.yaml + data_dir: ./data + +a fit command can be run as: + +.. code-block:: bash + + $ python main.py fit --trainer trainer.yaml --model model.yaml --data data.yaml [...] diff --git a/docs/source-pytorch/cli/lightning_cli_advanced_2.rst b/docs/source-pytorch/cli/lightning_cli_advanced_2.rst new file mode 100644 index 0000000..749ce9e --- /dev/null +++ b/docs/source-pytorch/cli/lightning_cli_advanced_2.rst @@ -0,0 +1,209 @@ +:orphan: + +.. testsetup:: * + :skipif: not _JSONARGPARSE_AVAILABLE + + import torch + from unittest import mock + from typing import List + import lightning.pytorch.cli as pl_cli + from lightning.pytorch import LightningModule, LightningDataModule, Trainer, Callback + + + class NoFitTrainer(Trainer): + def fit(self, *_, **__): + pass + + + class LightningCLI(pl_cli.LightningCLI): + def __init__(self, *args, trainer_class=NoFitTrainer, run=False, **kwargs): + super().__init__(*args, trainer_class=trainer_class, run=run, **kwargs) + + + class MyModel(LightningModule): + def __init__( + self, + encoder_layers: int = 12, + decoder_layers: List[int] = [2, 4], + batch_size: int = 8, + ): + pass + + + class MyDataModule(LightningDataModule): + def __init__(self, batch_size: int = 8): + self.num_classes = 5 + + + mock_argv = mock.patch("sys.argv", ["any.py"]) + mock_argv.start() + +.. 
testcleanup:: * + + mock_argv.stop() + +################################################# +Configure hyperparameters from the CLI (Advanced) +################################################# + +********************************* +Customize arguments by subcommand +********************************* +To customize arguments by subcommand, pass the config *before* the subcommand: + +.. code-block:: bash + + $ python main.py [before] [subcommand] [after] + $ python main.py ... fit ... + +For example, here we set the Trainer arguments [max_steps = 100] for the full training routine and [max_epochs = 10] for +testing: + +.. code-block:: bash + + # config.yaml + fit: + trainer: + max_steps: 100 + test: + trainer: + max_epochs: 10 + +now you can toggle this behavior by subcommand: + +.. code-block:: bash + + # full routine with max_steps = 100 + $ python main.py --config config.yaml fit + + # test only with max_epochs = 10 + $ python main.py --config config.yaml test + +---- + +*************************** +Run from cloud yaml configs +*************************** +For certain enterprise workloads, Lightning CLI supports running from hosted configs: + +.. code-block:: bash + + $ python main.py [subcommand] --config s3://bucket/config.yaml + +For more options, refer to :doc:`Remote filesystems <../common/remote_fs>`. + +---- + +************************************** +Use a config via environment variables +************************************** +For certain CI/CD systems, it's useful to pass in raw yaml config as environment variables: + +.. code-block:: bash + + $ python main.py fit --trainer "$TRAINER_CONFIG" --model "$MODEL_CONFIG" [...] + +---- + +*************************************** +Run from environment variables directly +*************************************** +The Lightning CLI can convert every possible CLI flag into an environment variable. To enable this, add to +``parser_kwargs`` the ``default_env`` argument: + +.. 
code:: python + + cli = LightningCLI(..., parser_kwargs={"default_env": True}) + +now use the ``--help`` CLI flag with any subcommand: + +.. code:: bash + + $ python main.py fit --help + +which will show you ALL possible environment variables that can be set: + +.. code:: bash + + usage: main.py [options] fit [-h] [-c CONFIG] + ... + + optional arguments: + ... + ARG: --model.out_dim OUT_DIM + ENV: PL_FIT__MODEL__OUT_DIM + (type: int, default: 10) + ARG: --model.learning_rate LEARNING_RATE + ENV: PL_FIT__MODEL__LEARNING_RATE + (type: float, default: 0.02) + +now you can customize the behavior via environment variables: + +.. code:: bash + + # set the options via env vars + $ export PL_FIT__MODEL__LEARNING_RATE=0.01 + $ export PL_FIT__MODEL__OUT_DIM=5 + + $ python main.py fit + +---- + +************************ +Set default config files +************************ +To set a path to a config file of defaults, use the ``default_config_files`` argument: + +.. testcode:: + + cli = LightningCLI(MyModel, MyDataModule, parser_kwargs={"default_config_files": ["my_cli_defaults.yaml"]}) + +or if you want defaults per subcommand: + +.. testcode:: + + cli = LightningCLI(MyModel, MyDataModule, parser_kwargs={"fit": {"default_config_files": ["my_fit_defaults.yaml"]}}) + +---- + +***************************** +Enable variable interpolation +***************************** +In certain cases where multiple settings need to share a value, consider using variable interpolation. For instance: + +.. code-block:: yaml + + model: + encoder_layers: 12 + decoder_layers: + - ${model.encoder_layers} + - 4 + +To enable variable interpolation, first install omegaconf: + +.. code:: bash + + pip install omegaconf + +Then set omegaconf when instantiating the ``LightningCLI`` class: + +.. code:: python + + cli = LightningCLI(MyModel, parser_kwargs={"parser_mode": "omegaconf"}) + +After this, the CLI will automatically perform interpolation in yaml files: + +.. 
code:: bash + + python main.py --model.encoder_layers=12 + +For more details about the interpolation support and its limitations, have a look at the `jsonargparse +`__ and the `omegaconf +`__ documentations. + +.. note:: + + There are many use cases in which variable interpolation is not the correct approach. When a parameter **must + always** be derived from other settings, it shouldn't be up to the CLI user to do this in a config file. For + example, if the data and model both require ``batch_size`` and must be the same value, then + :ref:`cli_link_arguments` should be used instead of interpolation. diff --git a/docs/source-pytorch/cli/lightning_cli_advanced_3.rst b/docs/source-pytorch/cli/lightning_cli_advanced_3.rst new file mode 100644 index 0000000..06e5d70 --- /dev/null +++ b/docs/source-pytorch/cli/lightning_cli_advanced_3.rst @@ -0,0 +1,393 @@ +:orphan: + +.. testsetup:: * + :skipif: not _JSONARGPARSE_AVAILABLE + + import torch + from unittest import mock + from typing import List + import lightning.pytorch.cli as pl_cli + from lightning.pytorch import LightningModule, LightningDataModule, Trainer, Callback + + + class NoFitTrainer(Trainer): + def fit(self, *_, **__): + pass + + + class LightningCLI(pl_cli.LightningCLI): + def __init__(self, *args, trainer_class=NoFitTrainer, run=False, **kwargs): + super().__init__(*args, trainer_class=trainer_class, run=run, **kwargs) + + + class MyModel(LightningModule): + def __init__( + self, + encoder_layers: int = 12, + decoder_layers: List[int] = [2, 4], + batch_size: int = 8, + ): + pass + + + class MyDataModule(LightningDataModule): + def __init__(self, batch_size: int = 8): + self.num_classes = 5 + + + MyModelBaseClass = MyModel + MyDataModuleBaseClass = MyDataModule + + mock_argv = mock.patch("sys.argv", ["any.py"]) + mock_argv.start() + +.. 
testcleanup:: * + + mock_argv.stop() + +################################################# +Configure hyperparameters from the CLI (Advanced) +################################################# + +Instantiation only mode +^^^^^^^^^^^^^^^^^^^^^^^ + +The CLI is designed to start fitting with minimal code changes. On class instantiation, the CLI will automatically call +the trainer function associated with the subcommand provided, so you don't have to do it. To avoid this, you can set the +following argument: + +.. testcode:: + + cli = LightningCLI(MyModel, run=False) # True by default + # you'll have to call fit yourself: + cli.trainer.fit(cli.model) + +In this mode, subcommands are **not** added to the parser. This can be useful to implement custom logic without having +to subclass the CLI, but still, use the CLI's instantiation and argument parsing capabilities. + + +Trainer Callbacks and arguments with class type +^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + +A very important argument of the :class:`~lightning.pytorch.trainer.trainer.Trainer` class is the ``callbacks``. In +contrast to simpler arguments that take numbers or strings, ``callbacks`` expects a list of instances of subclasses of +:class:`~lightning.pytorch.callbacks.Callback`. To specify this kind of argument in a config file, each callback must be +given as a dictionary, including a ``class_path`` entry with an import path of the class and optionally an ``init_args`` +entry with arguments to use to instantiate. Therefore, a simple configuration file that defines two callbacks is the +following: + +.. code-block:: yaml + + trainer: + callbacks: + - class_path: lightning.pytorch.callbacks.EarlyStopping + init_args: + patience: 5 + - class_path: lightning.pytorch.callbacks.LearningRateMonitor + init_args: + ... 
+ +Similar to the callbacks, any parameter in :class:`~lightning.pytorch.trainer.trainer.Trainer` and user extended +:class:`~lightning.pytorch.core.module.LightningModule` and +:class:`~lightning.pytorch.core.datamodule.LightningDataModule` classes that have as type hint a class, can be +configured the same way using ``class_path`` and ``init_args``. If the package that defines a subclass is imported +before the :class:`~lightning.pytorch.cli.LightningCLI` class is run, the name can be used instead of the full import +path. + +From command line the syntax is the following: + +.. code-block:: bash + + $ python ... \ + --trainer.callbacks+={CALLBACK_1_NAME} \ + --trainer.callbacks.{CALLBACK_1_ARGS_1}=... \ + --trainer.callbacks.{CALLBACK_1_ARGS_2}=... \ + ... + --trainer.callbacks+={CALLBACK_N_NAME} \ + --trainer.callbacks.{CALLBACK_N_ARGS_1}=... \ + ... + +Note the use of ``+`` to append a new callback to the list and that the ``init_args`` are applied to the previous +callback appended. Here is an example: + +.. code-block:: bash + + $ python ... \ + --trainer.callbacks+=EarlyStopping \ + --trainer.callbacks.patience=5 \ + --trainer.callbacks+=LearningRateMonitor \ + --trainer.callbacks.logging_interval=epoch + +.. note:: + + Serialized config files (e.g. ``--print_config`` or :class:`~lightning.pytorch.cli.SaveConfigCallback`) always have + the full ``class_path``, even when class name shorthand notation is used in the command line or in input config + files. + + +Multiple models and/or datasets +^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + +A CLI can be written such that a model and/or a datamodule is specified by an import path and init arguments. For +example, with a tool implemented as: + +.. code-block:: python + + cli = LightningCLI(MyModelBaseClass, MyDataModuleBaseClass, subclass_mode_model=True, subclass_mode_data=True) + +A possible config file could be as follows: + +.. 
code-block:: yaml + + model: + class_path: mycode.mymodels.MyModel + init_args: + decoder_layers: + - 2 + - 4 + encoder_layers: 12 + data: + class_path: mycode.mydatamodules.MyDataModule + init_args: + ... + trainer: + callbacks: + - class_path: lightning.pytorch.callbacks.EarlyStopping + init_args: + patience: 5 + ... + +Only model classes that are a subclass of ``MyModelBaseClass`` would be allowed, and similarly, only subclasses of +``MyDataModuleBaseClass``. If as base classes :class:`~lightning.pytorch.core.module.LightningModule` and +:class:`~lightning.pytorch.core.datamodule.LightningDataModule` is given, then the CLI would allow any lightning module +and data module. + +.. tip:: + + Note that with the subclass modes, the ``--help`` option does not show information for a specific subclass. To get + help for a subclass, the options ``--model.help`` and ``--data.help`` can be used, followed by the desired class + path. Similarly, ``--print_config`` does not include the settings for a particular subclass. To include them, the + class path should be given before the ``--print_config`` option. Examples for both help and print config are: + + .. code-block:: bash + + $ python trainer.py fit --model.help mycode.mymodels.MyModel + $ python trainer.py fit --model mycode.mymodels.MyModel --print_config + + +Models with multiple submodules +^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + +Many use cases require to have several modules, each with its own configurable options. One possible way to handle this +with ``LightningCLI`` is to implement a single module having as init parameters each of the submodules. This is known as +`dependency injection `__ which is a good approach to improve +decoupling in your code base. + +Since the init parameters of the model have as a type hint a class, in the configuration, these would be specified with +``class_path`` and ``init_args`` entries. For instance, a model could be implemented as: + +.. 
testcode:: + + class MyMainModel(LightningModule): + def __init__(self, encoder: nn.Module, decoder: nn.Module): + """Example encoder-decoder submodules model + + Args: + encoder: Instance of a module for encoding + decoder: Instance of a module for decoding + """ + super().__init__() + self.encoder = encoder + self.decoder = decoder + +If the CLI is implemented as ``LightningCLI(MyMainModel)`` the configuration would be as follows: + +.. code-block:: yaml + + model: + encoder: + class_path: mycode.myencoders.MyEncoder + init_args: + ... + decoder: + class_path: mycode.mydecoders.MyDecoder + init_args: + ... + +It is also possible to combine ``subclass_mode_model=True`` and submodules, thereby having two levels of ``class_path``. + + +Fixed optimizer and scheduler +^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + +In some cases, fixing the optimizer and/or learning scheduler might be desired instead of allowing multiple. For this, +you can manually add the arguments for specific classes by subclassing the CLI. The following code snippet shows how to +implement it: + +.. testcode:: + + class MyLightningCLI(LightningCLI): + def add_arguments_to_parser(self, parser): + parser.add_optimizer_args(torch.optim.Adam) + parser.add_lr_scheduler_args(torch.optim.lr_scheduler.ExponentialLR) + +With this, in the config, the ``optimizer`` and ``lr_scheduler`` groups would accept all of the options for the given +classes, in this example, ``Adam`` and ``ExponentialLR``. Therefore, the config file would be structured like: + +.. code-block:: yaml + + optimizer: + lr: 0.01 + lr_scheduler: + gamma: 0.2 + model: + ... + trainer: + ... + +where the arguments can be passed directly through the command line without specifying the class. For example: + +.. 
code-block:: bash + + $ python trainer.py fit --optimizer.lr=0.01 --lr_scheduler.gamma=0.2 + + +Multiple optimizers and schedulers +^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + +By default, the CLIs support multiple optimizers and/or learning schedulers, automatically implementing +``configure_optimizers``. This behavior can be disabled by providing ``auto_configure_optimizers=False`` on +instantiation of :class:`~lightning.pytorch.cli.LightningCLI`. This would be required for example to support multiple +optimizers, for each selecting a particular optimizer class. Similar to multiple submodules, this can be done via +`dependency injection `__. Unlike the submodules, it is not possible +to expect an instance of a class, because optimizers require the module's parameters to optimize, which are only +available after instantiation of the module. Learning schedulers are a similar situation, requiring an optimizer +instance. For these cases, dependency injection involves providing a function that instantiates the respective class +when called. + +An example of a model that uses two optimizers is the following: + +.. code-block:: python + + from typing import Callable, Iterable + from torch.optim import Optimizer + + + OptimizerCallable = Callable[[Iterable], Optimizer] + + + class MyModel(LightningModule): + def __init__(self, optimizer1: OptimizerCallable, optimizer2: OptimizerCallable): + super().__init__() + self.optimizer1 = optimizer1 + self.optimizer2 = optimizer2 + + def configure_optimizers(self): + optimizer1 = self.optimizer1(self.parameters()) + optimizer2 = self.optimizer2(self.parameters()) + return [optimizer1, optimizer2] + + + cli = MyLightningCLI(MyModel, auto_configure_optimizers=False) + +Note the type ``Callable[[Iterable], Optimizer]``, which denotes a function that receives a single argument, some +learnable parameters, and returns an optimizer instance. 
With this, from the command line it is possible to select the +class and init arguments for each of the optimizers, as follows: + +.. code-block:: bash + + $ python trainer.py fit \ + --model.optimizer1=Adam \ + --model.optimizer1.lr=0.01 \ + --model.optimizer2=AdamW \ + --model.optimizer2.lr=0.0001 + +In the example above, the ``OptimizerCallable`` type alias was created to illustrate what the type hint means. For +convenience, this type alias and one for learning schedulers is available in the ``cli`` module. An example of a model +that uses dependency injection for an optimizer and a learning scheduler is: + +.. code-block:: python + + from lightning.pytorch.cli import OptimizerCallable, LRSchedulerCallable, LightningCLI + + + class MyModel(LightningModule): + def __init__( + self, + optimizer: OptimizerCallable = torch.optim.Adam, + scheduler: LRSchedulerCallable = torch.optim.lr_scheduler.ConstantLR, + ): + super().__init__() + self.optimizer = optimizer + self.scheduler = scheduler + + def configure_optimizers(self): + optimizer = self.optimizer(self.parameters()) + scheduler = self.scheduler(optimizer) + return {"optimizer": optimizer, "lr_scheduler": scheduler} + + + cli = MyLightningCLI(MyModel, auto_configure_optimizers=False) + +Note that for this example, classes are used as defaults. This is compatible with the type hints, since they are also +callables that receive the same first argument and return an instance of the class. Classes that have more than one +required argument will not work as default. For these cases a lambda function can be used, e.g. ``optimizer: +OptimizerCallable = lambda p: torch.optim.SGD(p, lr=0.01)``. + + +Run from Python +^^^^^^^^^^^^^^^ + +Even though the :class:`~lightning.pytorch.cli.LightningCLI` class is designed to help in the implementation of command +line tools, for some use cases it is desired to run directly from Python. To allow this there is the ``args`` parameter. 
+An example could be to first implement a normal CLI script, but adding an ``args`` parameter with default ``None`` to +the main function as follows: + +.. code:: python + + from lightning.pytorch.cli import ArgsType, LightningCLI + + + def cli_main(args: ArgsType = None): + cli = LightningCLI(MyModel, ..., args=args) + ... + + + if __name__ == "__main__": + cli_main() + +Then it is possible to import the ``cli_main`` function to run it. Executing in a shell ``my_cli.py +--trainer.max_epochs=100 --model.encoder_layers=24`` would be equivalent to: + +.. code:: python + + from my_module.my_cli import cli_main + + cli_main(["--trainer.max_epochs=100", "--model.encoder_layers=24"]) + +All the features that are supported from the command line can be used when giving ``args`` as a list of strings. It is +also possible to provide a ``dict`` or `jsonargparse.Namespace +`__. For example in a jupyter notebook someone +might do: + +.. code:: python + + args = { + "trainer": { + "max_epochs": 100, + }, + "model": {}, + } + + args["model"]["encoder_layers"] = 8 + cli_main(args) + args["model"]["encoder_layers"] = 12 + cli_main(args) + args["trainer"]["max_epochs"] = 200 + cli_main(args) + +.. note:: + + The ``args`` parameter must be ``None`` when running from command line so that ``sys.argv`` is used as arguments. + Also, note that the purpose of ``trainer_defaults`` is different to ``args``. It is okay to use ``trainer_defaults`` + in the ``cli_main`` function to modify the defaults of some trainer parameters. diff --git a/docs/source-pytorch/cli/lightning_cli_expert.rst b/docs/source-pytorch/cli/lightning_cli_expert.rst new file mode 100644 index 0000000..eff4093 --- /dev/null +++ b/docs/source-pytorch/cli/lightning_cli_expert.rst @@ -0,0 +1,267 @@ +:orphan: + +.. 
testsetup:: * + :skipif: not _JSONARGPARSE_AVAILABLE + + import torch + from unittest import mock + from typing import List + import lightning.pytorch.cli as pl_cli + from lightning.pytorch import LightningModule, LightningDataModule, Trainer, Callback + + + class NoFitTrainer(Trainer): + def fit(self, *_, **__): + pass + + + class LightningCLI(pl_cli.LightningCLI): + def __init__(self, *args, trainer_class=NoFitTrainer, run=False, **kwargs): + super().__init__(*args, trainer_class=trainer_class, run=run, **kwargs) + + + class MyModel(LightningModule): + def __init__( + self, + encoder_layers: int = 12, + decoder_layers: List[int] = [2, 4], + batch_size: int = 8, + ): + pass + + + class MyClassModel(LightningModule): + def __init__(self, num_classes: int): + pass + + + class MyDataModule(LightningDataModule): + def __init__(self, batch_size: int = 8): + self.num_classes = 5 + + + def send_email(address, message): + pass + + + mock_argv = mock.patch("sys.argv", ["any.py"]) + mock_argv.start() + +.. testcleanup:: * + + mock_argv.stop() + +############################################### +Configure hyperparameters from the CLI (Expert) +############################################### +**Audience:** Users who already understand the LightningCLI and want to customize it. + +---- + +************************** +Customize the LightningCLI +************************** + +The init parameters of the :class:`~lightning.pytorch.cli.LightningCLI` class can be used to customize some things, +e.g., the description of the tool, enabling parsing of environment variables, and additional arguments to instantiate +the trainer and configuration parser. + +Nevertheless, the init arguments are not enough for many use cases. For this reason, the class is designed so that it +can be extended to customize different parts of the command line tool. 
The argument parser class used by +:class:`~lightning.pytorch.cli.LightningCLI` is :class:`~lightning.pytorch.cli.LightningArgumentParser`, which is an +extension of python's argparse, thus adding arguments can be done using the :func:`add_argument` method. In contrast to +argparse, it has additional methods to add arguments. For example :func:`add_class_arguments` adds all arguments from the +init of a class. For more details, see the `respective documentation +<https://jsonargparse.readthedocs.io/en/stable/#classes-methods-and-functions>`_. + +The :class:`~lightning.pytorch.cli.LightningCLI` class has the +:meth:`~lightning.pytorch.cli.LightningCLI.add_arguments_to_parser` method, which can be implemented to include more arguments. +After parsing, the configuration is stored in the ``config`` attribute of the class instance. The +:class:`~lightning.pytorch.cli.LightningCLI` class also has two methods that can be used to run code before and after +the trainer runs: ``before_<subcommand>`` and ``after_<subcommand>``. A realistic example of this would be to send an +email before and after the execution. The code for the ``fit`` subcommand would be something like this: + +.. testcode:: + + class MyLightningCLI(LightningCLI): + def add_arguments_to_parser(self, parser): + parser.add_argument("--notification_email", default="will@email.com") + + def before_fit(self): + send_email(address=self.config["notification_email"], message="trainer.fit starting") + + def after_fit(self): + send_email(address=self.config["notification_email"], message="trainer.fit finished") + + + cli = MyLightningCLI(MyModel) + +Note that the config object ``self.config`` is a namespace whose keys are global options or groups of options. It has +the same structure as the YAML format described previously. This means that the parameters used for instantiating the +trainer class can be found in ``self.config['fit']['trainer']``. + +.. tip:: + + Have a look at the :class:`~lightning.pytorch.cli.LightningCLI` class API reference to learn about other methods + that can be extended to customize a CLI.
+ +---- + +************************** +Configure forced callbacks +************************** +As explained previously, any Lightning callback can be added by passing it through the command line or including it in +the config via ``class_path`` and ``init_args`` entries. + +However, certain callbacks **must** be coupled with a model so they are always present and configurable. This can be +implemented as follows: + +.. testcode:: + + from lightning.pytorch.callbacks import EarlyStopping + + + class MyLightningCLI(LightningCLI): + def add_arguments_to_parser(self, parser): + parser.add_lightning_class_args(EarlyStopping, "my_early_stopping") + parser.set_defaults({"my_early_stopping.monitor": "val_loss", "my_early_stopping.patience": 5}) + + + cli = MyLightningCLI(MyModel) + +To change the parameters for ``EarlyStopping`` in the config it would be: + +.. code-block:: yaml + + model: + ... + trainer: + ... + my_early_stopping: + patience: 5 + +.. note:: + + The example above overrides a default in ``add_arguments_to_parser``. This is included to show that defaults can be + changed if needed. However, note that overriding defaults in the source code is not intended to be used to store the + best hyperparameters for a task after experimentation. To guarantee reproducibility, the source code should be + stable. It is better to practice storing the best hyperparameters for a task in a configuration file independent + from the source code. + +---- + +******************* +Class type defaults +******************* + +The support for classes as type hints allows to try many possibilities with the same CLI. This is a useful feature, but +it is tempting to use an instance of a class as a default. For example: + +.. testcode:: + + class MyMainModel(LightningModule): + def __init__( + self, + backbone: torch.nn.Module = MyModel(encoder_layers=24), # BAD PRACTICE! + ): + super().__init__() + self.backbone = backbone + +Normally classes are mutable, as in this case. 
The instance of ``MyModel`` would be created the moment that the module +that defines ``MyMainModel`` is first imported. This means that the default of ``backbone`` will be initialized before +the CLI class runs ``seed_everything``, making it non-reproducible. Furthermore, if ``MyMainModel`` is used more than +once in the same Python process and the ``backbone`` parameter is not overridden, the same instance would be used in +multiple places. Most likely, this is not what the developer intended. Having an instance as default also makes it +impossible to generate the complete config file since it is not known which arguments were used to instantiate it for +arbitrary classes. + +An excellent solution to these problems is not to have a default or set the default to a unique value (e.g., a string). +Then check this value and instantiate it in the ``__init__`` body. If a class parameter has no default and the CLI is +subclassed, then a default can be set as follows: + +.. testcode:: + + default_backbone = { + "class_path": "import.path.of.MyModel", + "init_args": { + "encoder_layers": 24, + }, + } + + + class MyLightningCLI(LightningCLI): + def add_arguments_to_parser(self, parser): + parser.set_defaults({"model.backbone": default_backbone}) + +A more compact version that avoids writing a dictionary would be: + +.. testcode:: + + from jsonargparse import lazy_instance + + + class MyLightningCLI(LightningCLI): + def add_arguments_to_parser(self, parser): + parser.set_defaults({"model.backbone": lazy_instance(MyModel, encoder_layers=24)}) + +---- + +.. _cli_link_arguments: + +**************** +Argument linking +**************** +Another case in which it might be desired to extend :class:`~lightning.pytorch.cli.LightningCLI` is when the model and +data module depend on a common parameter. For example, in some cases, both classes need to know the ``batch_size``. +It is a burden and error-prone to give the same value twice in a config file.
To avoid this, the parser can be +configured so that a value is only given once and then propagated accordingly. With a tool implemented like the one +shown below, the ``batch_size`` only has to be provided in the ``data`` section of the config. + +.. testcode:: + + class MyLightningCLI(LightningCLI): + def add_arguments_to_parser(self, parser): + parser.link_arguments("data.batch_size", "model.batch_size") + + + cli = MyLightningCLI(MyModel, MyDataModule) + +The linking of arguments is observed in the help of the tool, which for this example would look like: + +.. code-block:: bash + + $ python trainer.py fit --help + ... + --data.batch_size BATCH_SIZE + Number of samples in a batch (type: int, default: 8) + + Linked arguments: + data.batch_size --> model.batch_size + Number of samples in a batch (type: int) + +Sometimes a parameter value is only available after class instantiation. An example could be that your model requires +the number of classes to instantiate its fully connected layer (for a classification task). But the value is not +available until the data module has been instantiated. The code below illustrates how to address this. + +.. testcode:: + + class MyLightningCLI(LightningCLI): + def add_arguments_to_parser(self, parser): + parser.link_arguments("data.num_classes", "model.num_classes", apply_on="instantiate") + + + cli = MyLightningCLI(MyClassModel, MyDataModule) + +Instantiation links are used to automatically determine the order of instantiation, in this case data first. + +.. note:: + + The linking of arguments is intended for things that are meant to be non-configurable. This improves the CLI user + experience since it avoids the need to provide more parameters. A related concept is a variable interpolation that + keeps things configurable. + +.. tip:: + + The linking of arguments can be used for more complex cases. For example to derive a value via a function that takes + multiple settings as input. 
For more details have a look at the API of `link_arguments + <https://jsonargparse.readthedocs.io/en/stable/>`_. diff --git a/docs/source-pytorch/cli/lightning_cli_faq.rst b/docs/source-pytorch/cli/lightning_cli_faq.rst new file mode 100644 index 0000000..6ebd78d --- /dev/null +++ b/docs/source-pytorch/cli/lightning_cli_faq.rst @@ -0,0 +1,122 @@ +:orphan: + +########################################### +Frequently asked questions for LightningCLI +########################################### + +************************ +What does CLI stand for? +************************ +CLI is short for command line interface. This means it is a tool intended to be run from a terminal, similar to commands +like ``git``. + +---- + +.. _what-is-a-yaml-config-file: + +*************************** +What is a yaml config file? +*************************** +YAML is a standard for configuration files used to describe parameters for sections of a program. It is a common tool +in engineering and has recently started to gain popularity in machine learning. An example of a YAML file is the +following: + +.. code:: yaml + + # file.yaml + car: + max_speed: 100 + max_passengers: 2 + plane: + fuel_capacity: 50 + class_3: + option_1: 'x' + option_2: 'y' + +If you are unfamiliar with YAML, the short introduction at `realpython.com#yaml-syntax +<https://realpython.com/python-yaml/#yaml-syntax>`__ might be a good starting point. + +---- + +********************* +What is a subcommand? +********************* +A subcommand is the action the LightningCLI applies to the script: + +.. code:: bash + + python main.py [subcommand] + +See the available subcommands with: + +.. code:: bash + + python main.py --help + +which prints: + +.. code:: bash + + ... + + fit Runs the full optimization routine. + validate Perform one evaluation epoch over the validation set. + test Perform one evaluation epoch over the test set. + predict Run inference on your data. + +use a subcommand as follows: + +..
code:: bash + + python main.py fit + python main.py test + +---- + +******************************************************* +What is the relation between LightningCLI and argparse? +******************************************************* + +:class:`~lightning.pytorch.cli.LightningCLI` makes use of `jsonargparse <https://github.com/omni-us/jsonargparse>`__ +which is an extension of `argparse <https://docs.python.org/3/library/argparse.html>`__. Due to this, +:class:`~lightning.pytorch.cli.LightningCLI` follows the same arguments style as many POSIX command line tools. Long +options are prefixed with two dashes and their corresponding values are separated by space or an equal sign, as ``--option +value`` or ``--option=value``. Command line options are parsed from left to right, therefore if a setting appears +multiple times, the rightmost value will override the previous ones. + +---- + +******************************************* +What is the override order of LightningCLI? +******************************************* + +The final configuration of CLIs implemented with :class:`~lightning.pytorch.cli.LightningCLI` can depend on default +config files (if defined), environment variables (if enabled) and command line arguments. The override order between +these is the following: + +1. Defaults defined in the source code. +2. Existing default config files in the order defined in ``default_config_files``, e.g. ``~/.myapp.yaml``. +3. Entire config environment variable, e.g. ``PL_FIT__CONFIG``. +4. Individual argument environment variables, e.g. ``PL_FIT__SEED_EVERYTHING``. +5. Command line arguments in order left to right (might include config files). + +---- + +**************************** +How do I troubleshoot a CLI? +**************************** +The standard behavior for CLIs, when they fail, is to terminate the process with a non-zero exit code and a short +message to hint the user about the cause. This is problematic while developing the CLI since there is no information to +track down the root of the problem.
To troubleshoot, set the environment variable ``JSONARGPARSE_DEBUG`` to any value +before running the CLI: + +.. code:: bash + + export JSONARGPARSE_DEBUG=true + python main.py fit + +.. note:: + + When asking about problems and reporting issues, please set the ``JSONARGPARSE_DEBUG`` environment variable and include the stack trace + in your description. With this, users are more likely to help identify the cause without needing to create a + reproducible script. diff --git a/docs/source-pytorch/cli/lightning_cli_intermediate.rst b/docs/source-pytorch/cli/lightning_cli_intermediate.rst new file mode 100644 index 0000000..b43a838 --- /dev/null +++ b/docs/source-pytorch/cli/lightning_cli_intermediate.rst @@ -0,0 +1,156 @@ +:orphan: + +##################################################### +Configure hyperparameters from the CLI (Intermediate) +##################################################### +**Audience:** Users who want advanced modularity via a command line interface (CLI). + +**Pre-reqs:** You must already understand how to use the command line and :doc:`LightningDataModule <../data/datamodule>`. + +---- + +************************* +LightningCLI requirements +************************* + +The :class:`~lightning.pytorch.cli.LightningCLI` class is designed to significantly ease the implementation of CLIs. To +use this class, an additional Python requirement is necessary beyond what the minimal installation of Lightning provides. To +enable, either install all extras: + +.. code:: bash + + pip install "pytorch-lightning[extra]" + +or if only interested in ``LightningCLI``, just install jsonargparse: + +.. code:: bash + + pip install "jsonargparse[signatures]" + +---- + +****************** +Implementing a CLI +****************** +Implementing a CLI is as simple as instantiating a :class:`~lightning.pytorch.cli.LightningCLI` object giving as +arguments classes for a ``LightningModule`` and optionally a ``LightningDataModule``: + +..
code:: python + + # main.py + from lightning.pytorch.cli import LightningCLI + + # simple demo classes for your convenience + from lightning.pytorch.demos.boring_classes import DemoModel, BoringDataModule + + + def cli_main(): + cli = LightningCLI(DemoModel, BoringDataModule) + # note: don't call fit!! + + + if __name__ == "__main__": + cli_main() + # note: it is good practice to implement the CLI in a function and call it in the main if block + +Now your model can be managed via the CLI. To see the available commands type: + +.. code:: bash + + $ python main.py --help + +which prints out: + +.. code:: bash + + usage: main.py [-h] [-c CONFIG] [--print_config [={comments,skip_null,skip_default}+]] + {fit,validate,test,predict} ... + + pytorch-lightning trainer command line tool + + optional arguments: + -h, --help Show this help message and exit. + -c CONFIG, --config CONFIG + Path to a configuration file in json or yaml format. + --print_config [={comments,skip_null,skip_default}+] + Print configuration and exit. + + subcommands: + For more details of each subcommand add it as argument followed by --help. + + {fit,validate,test,predict} + fit Runs the full optimization routine. + validate Perform one evaluation epoch over the validation set. + test Perform one evaluation epoch over the test set. + predict Run inference on your data. + + +The message tells us that we have a few available subcommands: + +.. code:: bash + + python main.py [subcommand] + +which you can use depending on your use case: + +.. code:: bash + + $ python main.py fit + $ python main.py validate + $ python main.py test + $ python main.py predict + +---- + +************************** +Train a model with the CLI +************************** +To train a model, use the ``fit`` subcommand: + +.. code:: bash + + python main.py fit + +View all available options with the ``--help`` argument given after the subcommand: + +.. 
code:: bash + + $ python main.py fit --help + + usage: main.py [options] fit [-h] [-c CONFIG] + [--seed_everything SEED_EVERYTHING] [--trainer CONFIG] + ... + [--ckpt_path CKPT_PATH] + --trainer.logger LOGGER + + optional arguments: + : + --model.out_dim OUT_DIM + (type: int, default: 10) + --model.learning_rate LEARNING_RATE + (type: float, default: 0.02) + : + --data CONFIG Path to a configuration file. + --data.data_dir DATA_DIR + (type: str, default: ./) + +With the Lightning CLI enabled, you can now change the parameters without touching your code: + +.. code:: bash + + # change the learning_rate + python main.py fit --model.learning_rate 0.1 + + # change the output dimensions also + python main.py fit --model.out_dim 10 --model.learning_rate 0.1 + + # change trainer and data arguments too + python main.py fit --model.out_dim 2 --model.learning_rate 0.1 --data.data_dir '~/' --trainer.logger False + +.. tip:: + + The options that become available in the CLI are the ``__init__`` parameters of the ``LightningModule`` and + ``LightningDataModule`` classes. Thus, to make hyperparameters configurable, just add them to your class's + ``__init__``. It is highly recommended that these parameters are described in the docstring so that the CLI shows + them in the help. Also, the parameters should have accurate type hints so that the CLI can fail early and give + understandable error messages when incorrect values are given. diff --git a/docs/source-pytorch/cli/lightning_cli_intermediate_2.rst b/docs/source-pytorch/cli/lightning_cli_intermediate_2.rst new file mode 100644 index 0000000..db06f85 --- /dev/null +++ b/docs/source-pytorch/cli/lightning_cli_intermediate_2.rst @@ -0,0 +1,276 @@ +:orphan: + +##################################################### +Configure hyperparameters from the CLI (Intermediate) +##################################################### +**Audience:** Users who have multiple models and datasets per project. 
+ +**Pre-reqs:** You must have read :doc:`(Control it all from the CLI) <lightning_cli_intermediate>`. + +---- + +*************************** +Why mix models and datasets +*************************** +Lightning projects usually begin with one model and one dataset. As the project grows in complexity and you introduce +more models and more datasets, it becomes desirable to mix any model with any dataset directly from the command line +without changing your code. + +.. code:: bash + + # Mix and match anything + $ python main.py fit --model=GAN --data=MNIST + $ python main.py fit --model=Transformer --data=MNIST + +``LightningCLI`` makes this very simple. Otherwise, this kind of configuration requires a significant amount of +boilerplate that often looks like this: + +.. code:: python + + # choose model + if args.model == "gan": + model = GAN(args.feat_dim) + elif args.model == "transformer": + model = Transformer(args.feat_dim) + ... + + # choose datamodule + if args.data == "MNIST": + datamodule = MNIST() + elif args.data == "imagenet": + datamodule = Imagenet() + ... + + # mix them! + trainer.fit(model, datamodule) + +It is highly recommended that you avoid writing this kind of boilerplate and use ``LightningCLI`` instead. + +---- + +************************* +Multiple LightningModules +************************* +To support multiple models, when instantiating ``LightningCLI`` omit the ``model_class`` parameter: + +.. code:: python + + # main.py + from lightning.pytorch.cli import LightningCLI + from lightning.pytorch.demos.boring_classes import DemoModel, BoringDataModule + + + class Model1(DemoModel): + def configure_optimizers(self): + print("⚡", "using Model1", "⚡") + return super().configure_optimizers() + + + class Model2(DemoModel): + def configure_optimizers(self): + print("⚡", "using Model2", "⚡") + return super().configure_optimizers() + + + cli = LightningCLI(datamodule_class=BoringDataModule) + +Now you can choose between any model from the CLI: + +..
code:: bash + + # use Model1 + python main.py fit --model Model1 + + # use Model2 + python main.py fit --model Model2 + +.. tip:: + + Instead of omitting the ``model_class`` parameter, you can give a base class and ``subclass_mode_model=True``. This + will make the CLI only accept models which are a subclass of the given base class. + +---- + +***************************** +Multiple LightningDataModules +***************************** +To support multiple data modules, when instantiating ``LightningCLI`` omit the ``datamodule_class`` parameter: + +.. code:: python + + # main.py + import torch + from lightning.pytorch.cli import LightningCLI + from lightning.pytorch.demos.boring_classes import DemoModel, BoringDataModule + + + class FakeDataset1(BoringDataModule): + def train_dataloader(self): + print("⚡", "using FakeDataset1", "⚡") + return torch.utils.data.DataLoader(self.random_train) + + + class FakeDataset2(BoringDataModule): + def train_dataloader(self): + print("⚡", "using FakeDataset2", "⚡") + return torch.utils.data.DataLoader(self.random_train) + + + cli = LightningCLI(DemoModel) + +Now you can choose between any dataset at runtime: + +.. code:: bash + + # use FakeDataset1 + python main.py fit --data FakeDataset1 + + # use FakeDataset2 + python main.py fit --data FakeDataset2 + +.. tip:: + + Instead of omitting the ``datamodule_class`` parameter, you can give a base class and ``subclass_mode_data=True``. + This will make the CLI only accept data modules that are a subclass of the given base class. + +---- + +******************* +Multiple optimizers +******************* +Standard optimizers from ``torch.optim`` work out of the box: + +.. code:: bash + + python main.py fit --optimizer AdamW + +If the optimizer you want needs other arguments, add them via the CLI (no need to change your code)! + +.. code:: bash + + python main.py fit --optimizer SGD --optimizer.lr=0.01 + +Furthermore, any custom subclass of :class:`torch.optim.Optimizer` can be used as an optimizer: + +..
code:: python + + # main.py + import torch + from lightning.pytorch.cli import LightningCLI + from lightning.pytorch.demos.boring_classes import DemoModel, BoringDataModule + + + class LitAdam(torch.optim.Adam): + def step(self, closure): + print("⚡", "using LitAdam", "⚡") + super().step(closure) + + + class FancyAdam(torch.optim.Adam): + def step(self, closure): + print("⚡", "using FancyAdam", "⚡") + super().step(closure) + + + cli = LightningCLI(DemoModel, BoringDataModule) + +Now you can choose between any optimizer at runtime: + +.. code:: bash + + # use LitAdam + python main.py fit --optimizer LitAdam + + # use FancyAdam + python main.py fit --optimizer FancyAdam + +---- + +******************* +Multiple schedulers +******************* +Standard learning rate schedulers from ``torch.optim.lr_scheduler`` work out of the box: + +.. code:: bash + + python main.py fit --optimizer=Adam --lr_scheduler CosineAnnealingLR + +Please note that ``--optimizer`` must be added for ``--lr_scheduler`` to have an effect. + +If the scheduler you want needs other arguments, add them via the CLI (no need to change your code)! + +.. code:: bash + + python main.py fit --optimizer=Adam --lr_scheduler=ReduceLROnPlateau --lr_scheduler.monitor=epoch + +Furthermore, any custom subclass of ``torch.optim.lr_scheduler.LRScheduler`` can be used as learning rate scheduler: + +.. code:: python + + # main.py + import torch + from lightning.pytorch.cli import LightningCLI + from lightning.pytorch.demos.boring_classes import DemoModel, BoringDataModule + + + class LitLRScheduler(torch.optim.lr_scheduler.CosineAnnealingLR): + def step(self): + print("⚡", "using LitLRScheduler", "⚡") + super().step() + + + cli = LightningCLI(DemoModel, BoringDataModule) + +Now you can choose between any learning rate scheduler at runtime: + +.. 
code:: bash + + # LitLRScheduler + python main.py fit --optimizer=Adam --lr_scheduler LitLRScheduler + + +---- + +************************ +Classes from any package +************************ +In the previous sections, custom classes to select were defined in the same python file where the ``LightningCLI`` class +is run. To select classes from any package by using only the class name, import the respective package: + +.. code:: python + + from lightning.pytorch.cli import LightningCLI + import my_code.models # noqa: F401 + import my_code.data_modules # noqa: F401 + import my_code.optimizers # noqa: F401 + + cli = LightningCLI() + +Now use any of the classes: + +.. code:: bash + + python main.py fit --model Model1 --data FakeDataset1 --optimizer LitAdam --lr_scheduler LitLRScheduler + +The ``# noqa: F401`` comment avoids a linter warning that the import is unused. + +It is also possible to select subclasses that have not been imported by giving the full import path: + +.. code:: bash + + python main.py fit --model my_code.models.Model1 + +---- + +************************* +Help for specific classes +************************* +When multiple models or datasets are accepted, the main help of the CLI does not include their specific parameters. To +show this specific help, additional help arguments expect the class name or its import path. For example: + +.. 
code:: bash + + python main.py fit --model.help Model1 + python main.py fit --data.help FakeDataset2 + python main.py fit --optimizer.help Adagrad + python main.py fit --lr_scheduler.help StepLR diff --git a/source/clouds/cluster.rst b/docs/source-pytorch/clouds/cluster.rst similarity index 100% rename from source/clouds/cluster.rst rename to docs/source-pytorch/clouds/cluster.rst diff --git a/docs/source-pytorch/clouds/cluster_advanced.rst b/docs/source-pytorch/clouds/cluster_advanced.rst new file mode 100644 index 0000000..0bcadfa --- /dev/null +++ b/docs/source-pytorch/clouds/cluster_advanced.rst @@ -0,0 +1,177 @@ +#################################### +Run on an on-prem cluster (advanced) +#################################### + +.. _slurm: + +---- + +****************************** +Run on a SLURM managed cluster +****************************** +Lightning automates the details behind training on a SLURM-powered cluster. In contrast to the general purpose +cluster above, the user does not start the jobs manually on each node and instead submits it to SLURM which +schedules the resources and time for which the job is allowed to run. + +---- + +*************************** +Design your training script +*************************** + +To train a model using multiple nodes, do the following: + +1. Design your :ref:`lightning_module` (no need to add anything specific here). + +2. Enable DDP in the trainer + + .. code-block:: python + + # train on 32 GPUs across 4 nodes + trainer = Trainer(accelerator="gpu", devices=8, num_nodes=4, strategy="ddp") + +3. It's a good idea to structure your training script like this: + + .. testcode:: + + # train.py + def main(args): + model = YourLightningModule(args) + + trainer = Trainer(accelerator="gpu", devices=8, num_nodes=4, strategy="ddp") + + trainer.fit(model) + + + if __name__ == "__main__": + args = ... # you can use your CLI parser of choice, or the `LightningCLI` + # TRAIN + main(args) + +4. 
Create the appropriate SLURM job: + + .. code-block:: bash + + # (submit.sh) + #!/bin/bash -l + + # SLURM SUBMIT SCRIPT + #SBATCH --nodes=4 # This needs to match Trainer(num_nodes=...) + #SBATCH --gres=gpu:8 + #SBATCH --ntasks-per-node=8 # This needs to match Trainer(devices=...) + #SBATCH --mem=0 + #SBATCH --time=0-02:00:00 + + # activate conda env + source activate $1 + + # debugging flags (optional) + export NCCL_DEBUG=INFO + export PYTHONFAULTHANDLER=1 + + # on your cluster you might need these: + # set the network interface + # export NCCL_SOCKET_IFNAME=^docker0,lo + + # might need the latest CUDA + # module load NCCL/2.4.7-1-cuda.10.0 + + # run script from above + srun python3 train.py + +5. If you want auto-resubmit (read below), add this line to the submit.sh script + + .. code-block:: bash + + #SBATCH --signal=SIGUSR1@90 + +6. Submit the SLURM job + + .. code-block:: bash + + sbatch submit.sh + +---- + +*********************************** +Enable auto wall-time resubmissions +*********************************** +When you use Lightning in a SLURM cluster, it automatically detects when it is about +to run into the wall time and does the following: + +1. Saves a temporary checkpoint. +2. Requeues the job. +3. When the job starts, it loads the temporary checkpoint. + +To get this behavior, make sure to add the correct signal to your SLURM script: + +.. code-block:: bash + + # 90 seconds before training ends + #SBATCH --signal=SIGUSR1@90 + +You can change this signal if your environment requires the use of a different one, for example: + +.. code-block:: bash + + #SBATCH --signal=SIGHUP@90 + +Then, when you make your trainer, pass the ``requeue_signal`` option to the :class:`~lightning.pytorch.plugins.environments.slurm_environment.SLURMEnvironment` plugin: + +..
code-block:: python + + trainer = Trainer(plugins=[SLURMEnvironment(requeue_signal=signal.SIGHUP)]) + +If auto-resubmit is not desired, it can be turned off in the :class:`~lightning.pytorch.plugins.environments.slurm_environment.SLURMEnvironment` plugin: + +.. code-block:: python + + from lightning.pytorch.plugins.environments import SLURMEnvironment + + trainer = Trainer(plugins=[SLURMEnvironment(auto_requeue=False)]) + +---- + + +**************** +Interactive Mode +**************** + +You can also let SLURM schedule a machine for you and then log in to the machine to run scripts manually. +This is useful for development and debugging. +If you set the job name to *bash* or *interactive*, and then log in and run scripts, Lightning's SLURM auto-detection will get bypassed and it can launch processes normally: + +.. code-block:: bash + + # make sure to set `--job-name "interactive"` + srun --account <your-account> --pty bash --job-name "interactive" ... + + # now run scripts normally + python train.py ... + + +---- + + +*************** +Troubleshooting +*************** + +**The Trainer is stuck initializing at startup, what is causing this?** + +You are seeing a message like this in the logs but nothing happens: + +.. code-block:: + + Initializing distributed: GLOBAL_RANK: 0, MEMBER: 1/4 + + +The most likely reasons and how to fix them: + +- You forgot to run the ``python train.py`` command with ``srun``: + Please have a look at the SLURM template script above which includes the ``srun`` at the bottom of the script. + +- The number of nodes or number of devices per node is configured incorrectly: + There are two parameters in the SLURM submission script that determine how many processes will run your training, the ``#SBATCH --nodes=X`` setting and the ``#SBATCH --ntasks-per-node=Y`` setting. + The numbers there need to match what is configured in your Trainer in the code: ``Trainer(num_nodes=X, devices=Y)``. + If you change the numbers, update them in BOTH places.
diff --git a/docs/source-pytorch/clouds/cluster_expert.rst b/docs/source-pytorch/clouds/cluster_expert.rst new file mode 100644 index 0000000..4306b3f --- /dev/null +++ b/docs/source-pytorch/clouds/cluster_expert.rst @@ -0,0 +1,51 @@ +:orphan: + +################################## +Run on an on-prem cluster (expert) +################################## + +.. _custom-cluster: + +---- + +************************** +Integrate your own cluster +************************** + +Lightning provides an interface for providing your own definition of a cluster environment. It mainly consists of +parsing the right environment variables to access information such as world size, global and local rank (process id), +and node rank (node id). Here is an example of a custom +:class:`~lightning.pytorch.plugins.environments.cluster_environment.ClusterEnvironment`: + +.. code-block:: python + + import os + from lightning.pytorch.plugins.environments import ClusterEnvironment + + + class MyClusterEnvironment(ClusterEnvironment): + @property + def creates_processes_externally(self) -> bool: + """Return True if the cluster is managed (you don't launch processes yourself)""" + return True + + def world_size(self) -> int: + return int(os.environ["WORLD_SIZE"]) + + def global_rank(self) -> int: + return int(os.environ["RANK"]) + + def local_rank(self) -> int: + return int(os.environ["LOCAL_RANK"]) + + def node_rank(self) -> int: + return int(os.environ["NODE_RANK"]) + + def main_address(self) -> str: + return os.environ["MASTER_ADDRESS"] + + def main_port(self) -> int: + return int(os.environ["MASTER_PORT"]) + + + trainer = Trainer(plugins=[MyClusterEnvironment()]) diff --git a/source/clouds/cluster_intermediate_1.rst b/docs/source-pytorch/clouds/cluster_intermediate_1.rst similarity index 77% rename from source/clouds/cluster_intermediate_1.rst rename to docs/source-pytorch/clouds/cluster_intermediate_1.rst index c2d92e2..d668b2b 100644 --- a/source/clouds/cluster_intermediate_1.rst +++ 
b/docs/source-pytorch/clouds/cluster_intermediate_1.rst @@ -24,7 +24,7 @@ PyTorch Lightning follows the design of `PyTorch distributed communication packa - *MASTER_PORT* - required; has to be a free port on machine with NODE_RANK 0 - *MASTER_ADDR* - required (except for NODE_RANK 0); address of NODE_RANK 0 node -- *WORLD_SIZE* - required; how many nodes are in the cluster +- *WORLD_SIZE* - required; the total number of GPUs/processes that you will use - *NODE_RANK* - required; id of the node in the cluster .. _training_script_setup: @@ -68,32 +68,3 @@ Set the ``NCCL_DEBUG=INFO`` environment variable to see the ACTUAL error. .. code-block:: bash NCCL_DEBUG=INFO python train.py ... - ----- - -******** -Get help -******** -Setting up a cluster for distributed training is not trivial. Lightning offers lightning-grid which allows you to configure a cluster easily and run experiments via the CLI and web UI. - -Try it out for free today: - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Train models on the cloud - :description: Learn to run a model in the background on a cloud machine. - :col_css: col-md-6 - :button_link: cloud_training.html - :height: 150 - :tag: intermediate - -.. raw:: html - -
-
`__ provides helper functions to setup distributed environment variables from the `PyTorch distributed communication package `__ that need to be defined on each node. + +Once the script is set up as described in :ref:`Training Script Setup <training_script_setup>`, you can run the below command across your nodes to start multi-node training. + +Like a custom cluster, you have to ensure that there is network connectivity between the nodes with firewall rules that allow traffic flow on a specified *MASTER_PORT*. + +Finally, you'll need to decide which node you'd like to be the main node (*MASTER_ADDR*), and the ranks of each node (*NODE_RANK*). + +For example: + +* *MASTER_ADDR* 10.10.10.16 +* *MASTER_PORT* 29500 +* *NODE_RANK* 0 for the first node, 1 for the second node + +Run the below command with the appropriate variables set on each node. + +.. code-block:: bash + + python -m torch.distributed.run + --nnodes=2 # number of nodes you'd like to run with + --master_addr <MASTER_ADDR> + --master_port <MASTER_PORT> + --node_rank <NODE_RANK> + train.py (--arg1 ... train script args...) + +.. note:: + + ``torch.distributed.run`` assumes that you'd like to spawn a process per GPU if GPU devices are found on the node. This can be adjusted with ``--nproc_per_node``. diff --git a/docs/source-pytorch/common/checkpointing.rst b/docs/source-pytorch/common/checkpointing.rst new file mode 100644 index 0000000..fdb4e85 --- /dev/null +++ b/docs/source-pytorch/common/checkpointing.rst @@ -0,0 +1,78 @@ +.. _checkpointing: + +############# +Checkpointing +############# + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: Saving and loading checkpoints + :description: Learn to save and load checkpoints + :col_css: col-md-4 + :button_link: checkpointing_basic.html + :height: 150 + :tag: basic + +.. displayitem:: + :header: Customize checkpointing behavior + :description: Learn how to change the behavior of checkpointing + :col_css: col-md-4 + :button_link: checkpointing_intermediate.html + :height: 150 + :tag: intermediate + +.. displayitem:: + :header: Upgrading checkpoints + :description: Learn how to upgrade old checkpoints to the newest Lightning version + :col_css: col-md-4 + :button_link: checkpointing_migration.html + :height: 150 + :tag: intermediate + +.. displayitem:: + :header: Cloud-based checkpoints + :description: Enable cloud-based checkpointing and composable checkpoints. + :col_css: col-md-4 + :button_link: checkpointing_advanced.html + :height: 150 + :tag: advanced + +.. displayitem:: + :header: Distributed checkpoints + :description: Customize checkpointing for custom distributed strategies and accelerators. + :col_css: col-md-4 + :button_link: checkpointing_expert.html + :height: 150 + :tag: expert + +.. raw:: html + +
+
+ +---- + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: ModelCheckpoint API + :description: Dig into the ModelCheckpoint API + :col_css: col-md-4 + :button_link: ../api/lightning.pytorch.callbacks.ModelCheckpoint.html + :height: 150 + +.. raw:: html + +
+
diff --git a/source/common/checkpointing_advanced.rst b/docs/source-pytorch/common/checkpointing_advanced.rst similarity index 85% rename from source/common/checkpointing_advanced.rst rename to docs/source-pytorch/common/checkpointing_advanced.rst index 561ca95..80b10e1 100644 --- a/source/common/checkpointing_advanced.rst +++ b/docs/source-pytorch/common/checkpointing_advanced.rst @@ -1,8 +1,8 @@ .. _checkpointing_advanced: -######################## -Checkpointing (advanced) -######################## +################################## +Cloud-based checkpoints (advanced) +################################## ***************** @@ -52,7 +52,7 @@ Checkpoints can also save the state of :doc:`datamodules <../extensions/datamodu **************************** Modify a checkpoint anywhere **************************** -When you need to change the components of a checkpoint before saving or loading, use the :meth:`~pytorch_lightning.core.hooks.CheckpointHooks.on_save_checkpoint` and :meth:`~pytorch_lightning.core.hooks.CheckpointHooks.on_load_checkpoint` of your ``LightningModule``. +When you need to change the components of a checkpoint before saving or loading, use the :meth:`~lightning.pytorch.core.hooks.CheckpointHooks.on_save_checkpoint` and :meth:`~lightning.pytorch.core.hooks.CheckpointHooks.on_load_checkpoint` of your ``LightningModule``. .. code:: python @@ -63,7 +63,7 @@ When you need to change the components of a checkpoint before saving or loading, def on_load_checkpoint(self, checkpoint): my_cool_pickable_object = checkpoint["something_cool_i_want_to_save"] -Use the above approach when you need to couple this behavior to your LightningModule for reproducibility reasons. 
Otherwise, Callbacks also have the :meth:`~pytorch_lightning.callbacks.base.Callback.on_save_checkpoint` and :meth:`~pytorch_lightning.callbacks.base.Callback.on_load_checkpoint` which you should use instead: +Use the above approach when you need to couple this behavior to your LightningModule for reproducibility reasons. Otherwise, Callbacks also have the :meth:`~lightning.pytorch.callbacks.callback.Callback.on_save_checkpoint` and :meth:`~lightning.pytorch.callbacks.callback.Callback.on_load_checkpoint` which you should use instead: .. code:: python diff --git a/source/common/checkpointing_basic.rst b/docs/source-pytorch/common/checkpointing_basic.rst similarity index 92% rename from source/common/checkpointing_basic.rst rename to docs/source-pytorch/common/checkpointing_basic.rst index 899de91..ab45d93 100644 --- a/source/common/checkpointing_basic.rst +++ b/docs/source-pytorch/common/checkpointing_basic.rst @@ -2,9 +2,9 @@ .. _checkpointing_basic: -##################### -Checkpointing (basic) -##################### +###################################### +Saving and loading checkpoints (basic) +###################################### **Audience:** All users ---- @@ -35,8 +35,9 @@ Inside a Lightning checkpoint you'll find: - State of all learning rate schedulers - State of all callbacks (for stateful callbacks) - State of datamodule (for stateful datamodules) -- The hyperparameters used for that model if passed in as hparams (Argparse.Namespace) -- State of Loops (if using Fault-Tolerant training) +- The hyperparameters (init arguments) with which the model was created +- The hyperparameters (init arguments) with which the datamodule was created +- State of Loops ---- @@ -105,8 +106,8 @@ The LightningModule also has access to the Hyperparameters ---- -Initalize with other parameters -=============================== +Initialize with other parameters +================================ If you used the *self.save_hyperparameters()* method in the init of the 
LightningModule, you can initialize the model with different hyperparameters. .. code-block:: python @@ -185,5 +186,5 @@ If you don't just want to load weights, but instead restore the full training, d model = LitModel() trainer = Trainer() - # automatically restores model, epoch, step, LR schedulers, apex, etc... + # automatically restores model, epoch, step, LR schedulers, etc... trainer.fit(model, ckpt_path="some/path/to/my_checkpoint.ckpt") diff --git a/docs/source-pytorch/common/checkpointing_expert.rst b/docs/source-pytorch/common/checkpointing_expert.rst new file mode 100644 index 0000000..721066d --- /dev/null +++ b/docs/source-pytorch/common/checkpointing_expert.rst @@ -0,0 +1,126 @@ +:orphan: + +.. _checkpointing_expert: + +################################ +Distributed checkpoints (expert) +################################ + +********************************* +Writing your own Checkpoint class +********************************* + +We provide ``Checkpoint`` class, for easier subclassing. Users may want to subclass this class in case of writing custom ``ModelCheckpoint`` callback, so that the ``Trainer`` recognizes the custom class as a checkpointing callback. + + +*********************** +Customize Checkpointing +*********************** + +.. warning:: This is an :ref:`experimental ` feature. + +Lightning supports modifying the checkpointing save/load functionality through the ``CheckpointIO``. This encapsulates the save/load logic +that is managed by the ``Strategy``. ``CheckpointIO`` is different from :meth:`~lightning.pytorch.core.hooks.CheckpointHooks.on_save_checkpoint` +and :meth:`~lightning.pytorch.core.hooks.CheckpointHooks.on_load_checkpoint` methods as it determines how the checkpoint is saved/loaded to storage rather than +what's saved in the checkpoint. + + +TODO: I don't understand this... + +****************************** +Built-in Checkpoint IO Plugins +****************************** + +.. 
list-table:: Built-in Checkpoint IO Plugins + :widths: 25 75 + :header-rows: 1 + + * - Plugin + - Description + * - :class:`~lightning.pytorch.plugins.io.TorchCheckpointIO` + - CheckpointIO that utilizes :func:`torch.save` and :func:`torch.load` to save and load checkpoints + respectively, common for most use cases. + * - :class:`~lightning.pytorch.plugins.io.XLACheckpointIO` + - CheckpointIO that utilizes :func:`xm.save` to save checkpoints for TPU training strategies. + * - :class:`~lightning.pytorch.plugins.io.AsyncCheckpointIO` + - ``AsyncCheckpointIO`` enables saving the checkpoints asynchronously in a thread. + + +*************************** +Custom Checkpoint IO Plugin +*************************** + +``CheckpointIO`` can be extended to include your custom save/load functionality to and from a path. The ``CheckpointIO`` object can be passed to either a ``Trainer`` directly or a ``Strategy`` as shown below: + +.. code-block:: python + + from lightning.pytorch import Trainer + from lightning.pytorch.callbacks import ModelCheckpoint + from lightning.pytorch.plugins import CheckpointIO + from lightning.pytorch.strategies import SingleDeviceStrategy + + + class CustomCheckpointIO(CheckpointIO): + def save_checkpoint(self, checkpoint, path, storage_options=None): + ... + + def load_checkpoint(self, path, storage_options=None): + ... + + def remove_checkpoint(self, path): + ... + + + custom_checkpoint_io = CustomCheckpointIO() + + # Either pass into the Trainer object + model = MyModel() + trainer = Trainer( + plugins=[custom_checkpoint_io], + callbacks=ModelCheckpoint(save_last=True), + ) + trainer.fit(model) + + # or pass into Strategy + model = MyModel() + device = torch.device("cpu") + trainer = Trainer( + strategy=SingleDeviceStrategy(device, checkpoint_io=custom_checkpoint_io), + callbacks=ModelCheckpoint(save_last=True), + ) + trainer.fit(model) + +.. 
note:: + + Some strategies, like ``DeepSpeedStrategy``, do not support custom ``CheckpointIO`` as checkpointing logic is not modifiable. + + +************************** +Asynchronous Checkpointing +************************** + +.. warning:: This is an :ref:`experimental ` feature. + +To enable saving the checkpoints asynchronously without blocking your training, you can pass the +:class:`~lightning.pytorch.plugins.io.async_plugin.AsyncCheckpointIO` plugin to the ``Trainer``. + +.. code-block:: python + + from lightning.pytorch.plugins.io import AsyncCheckpointIO + + + async_ckpt_io = AsyncCheckpointIO() + trainer = Trainer(plugins=[async_ckpt_io]) + + +It uses its base ``CheckpointIO`` plugin's saving logic to save the checkpoint but performs this operation asynchronously. +By default, this base ``CheckpointIO`` will be set up for you and all you need to provide is the ``AsyncCheckpointIO`` instance to the ``Trainer``. +But if you want the plugin to use your own custom base ``CheckpointIO`` and want the base to behave asynchronously, pass it as an argument while initializing ``AsyncCheckpointIO``. + +.. code-block:: python + + from lightning.pytorch.plugins.io import AsyncCheckpointIO + + base_ckpt_io = MyCustomCheckpointIO() + async_ckpt_io = AsyncCheckpointIO(checkpoint_io=base_ckpt_io) + trainer = Trainer(plugins=[async_ckpt_io]) diff --git a/source/common/checkpointing_intermediate.rst b/docs/source-pytorch/common/checkpointing_intermediate.rst similarity index 75% rename from source/common/checkpointing_intermediate.rst rename to docs/source-pytorch/common/checkpointing_intermediate.rst index 7796575..c6b1951 100644 --- a/source/common/checkpointing_intermediate.rst +++ b/docs/source-pytorch/common/checkpointing_intermediate.rst @@ -1,10 +1,10 @@ :orphan: -.. _checkpointing_intermediate: +..
_checkpointing_intermediate_1: -############################ -Checkpointing (intermediate) -############################ +############################################### +Customize checkpointing behavior (intermediate) +############################################### **Audience:** Users looking to customize the checkpointing behavior ---- @@ -12,11 +12,11 @@ Checkpointing (intermediate) ***************************** Modify checkpointing behavior ***************************** -For fine-grain control over checkpointing behavior, use the :class:`~pytorch_lightning.callbacks.ModelCheckpoint` object +For fine-grained control over checkpointing behavior, use the :class:`~lightning.pytorch.callbacks.ModelCheckpoint` object .. code-block:: python - from pytorch_lightning.callbacks import ModelCheckpoint + from lightning.pytorch.callbacks import ModelCheckpoint checkpoint_callback = ModelCheckpoint(dirpath="my/path/", save_top_k=2, monitor="val_loss") trainer = Trainer(callbacks=[checkpoint_callback]) @@ -40,15 +40,15 @@ Any value that has been logged via *self.log* in the LightningModule can be moni ***************************** Save checkpoints by condition ***************************** -To save checkpoints based on a (*when/which/what/where*) condition (for example *when* the validation_loss is lower) modify the :class:`~pytorch_lightning.callbacks.ModelCheckpoint` properties. +To save checkpoints based on a (*when/which/what/where*) condition (for example *when* the validation_loss is lower) modify the :class:`~lightning.pytorch.callbacks.ModelCheckpoint` properties. When ==== -- When using iterative training which doesn't have an epoch, you can checkpoint at every ``N`` training steps by specifying ``every_n_training_steps=N``. -- You can also control the interval of epochs between checkpoints using ``every_n_epochs`` between checkpoints, to avoid slowdowns. 
-- You can checkpoint at a regular time interval using ``train_time_interval`` argument independent of the steps or epochs. -- In case you are monitoring a training metrics, we'd suggest using ``save_on_train_epoch_end=True`` to ensure the required metric is being accumulated correctly for creating a checkpoint. +- When using iterative training which doesn't have an epoch, you can checkpoint at every ``N`` training steps by specifying ``every_n_train_steps=N``. +- You can also control the interval of epochs between checkpoints using ``every_n_epochs``, to avoid slowdowns. +- You can checkpoint at a regular time interval using the ``train_time_interval`` argument independent of the steps or epochs. +- In case you are monitoring a training metric, we'd suggest using ``save_on_train_epoch_end=True`` to ensure the required metric is being accumulated correctly for creating a checkpoint. Which @@ -61,7 +61,7 @@ Which .. testcode:: - from pytorch_lightning.callbacks import ModelCheckpoint + from lightning.pytorch.callbacks import ModelCheckpoint # saves top-K checkpoints based on "val_loss" metric @@ -89,7 +89,7 @@ Which .. testcode:: - from pytorch_lightning.callbacks import ModelCheckpoint + from lightning.pytorch.callbacks import ModelCheckpoint class LitAutoEncoder(LightningModule): @@ -120,13 +120,13 @@ What Where ===== -- It gives you the ability to specify the ``dirpath`` and ``filename`` for your checkpoints. Filename can also be dynamic so you can inject the metrics that are being logged using :meth:`~pytorch_lightning.core.lightning.LightningModule.log`. +- By default, the ``ModelCheckpoint`` will save files into the ``Trainer.log_dir``. It gives you the ability to specify the ``dirpath`` and ``filename`` for your checkpoints. Filename can also be dynamic so you can inject the metrics that are being logged using :meth:`~lightning.pytorch.core.module.LightningModule.log`. | .. 
testcode:: - from pytorch_lightning.callbacks import ModelCheckpoint + from lightning.pytorch.callbacks import ModelCheckpoint # saves a file like: my/path/sample-mnist-epoch=02-val_loss=0.32.ckpt @@ -137,7 +137,7 @@ Where | -The :class:`~pytorch_lightning.callbacks.ModelCheckpoint` callback is very robust and should cover 99% of the use-cases. If you find a use-case that is not configured yet, feel free to open an issue with a feature request on GitHub +The :class:`~lightning.pytorch.callbacks.ModelCheckpoint` callback is very robust and should cover 99% of the use-cases. If you find a use-case that is not configured yet, feel free to open an issue with a feature request on GitHub and the Lightning Team will be happy to integrate/help integrate it. ---- @@ -146,8 +146,8 @@ and the Lightning Team will be happy to integrate/help integrate it. Save checkpoints manually ************************* -You can manually save checkpoints and restore your model from the checkpointed state using :meth:`~pytorch_lightning.trainer.trainer.Trainer.save_checkpoint` -and :meth:`~pytorch_lightning.core.saving.ModelIO.load_from_checkpoint`. +You can manually save checkpoints and restore your model from the checkpointed state using :meth:`~lightning.pytorch.trainer.trainer.Trainer.save_checkpoint` +and :meth:`~lightning.pytorch.core.module.LightningModule.load_from_checkpoint`. .. code-block:: python @@ -170,6 +170,6 @@ In distributed training cases where a model is running across many machines, Lig # Saves only on the main process trainer.save_checkpoint("example.ckpt") -Not using :meth:`~pytorch_lightning.trainer.trainer.Trainer.save_checkpoint` can lead to unexpected behavior and potential deadlock. Using other saving functions will result in all devices attempting to save the checkpoint. As a result, we highly recommend using the Trainer's save functionality. 
-If using custom saving functions cannot be avoided, we recommend using the :func:`~pytorch_lightning.utilities.rank_zero.rank_zero_only` decorator to ensure saving occurs only on the main process. Note that this will only work if all ranks hold the exact same state and won't work when using +Not using :meth:`~lightning.pytorch.trainer.trainer.Trainer.save_checkpoint` can lead to unexpected behavior and potential deadlock. Using other saving functions will result in all devices attempting to save the checkpoint. As a result, we highly recommend using the Trainer's save functionality. +If using custom saving functions cannot be avoided, we recommend using the :func:`~lightning.pytorch.utilities.rank_zero.rank_zero_only` decorator to ensure saving occurs only on the main process. Note that this will only work if all ranks hold the exact same state and won't work when using model parallel distributed strategies such as deepspeed or sharded training. diff --git a/docs/source-pytorch/common/checkpointing_migration.rst b/docs/source-pytorch/common/checkpointing_migration.rst new file mode 100644 index 0000000..5c536cc --- /dev/null +++ b/docs/source-pytorch/common/checkpointing_migration.rst @@ -0,0 +1,51 @@ +:orphan: + +.. _checkpointing_intermediate_2: + +#################################### +Upgrading checkpoints (intermediate) +#################################### +**Audience:** Users who are upgrading Lightning and their code and want to reuse their old checkpoints. + +---- + +************************************** +Resume training from an old checkpoint +************************************** + +Next to the model weights and trainer state, a Lightning checkpoint contains the version number of Lightning with which the checkpoint was saved. +When you load a checkpoint file, either by resuming training + +.. code-block:: python + + trainer = Trainer(...) 
+ trainer.fit(model, ckpt_path="path/to/checkpoint.ckpt") + +or by loading the state directly into your model, + +.. code-block:: python + + model = LitModel.load_from_checkpoint("path/to/checkpoint.ckpt") + +Lightning will automatically recognize that it is from an older version and migrates the internal structure so it can be loaded properly. +This is done without any action required by the user. + +---- + +************************************ +Upgrade checkpoint files permanently +************************************ + +When Lightning loads a checkpoint, it applies the version migration on-the-fly as explained above, but it does not modify your checkpoint files. +You can upgrade checkpoint files permanently with the following command + +.. code-block:: + + python -m lightning.pytorch.utilities.upgrade_checkpoint path/to/model.ckpt + + +or a folder with multiple files: + +.. code-block:: + + python -m lightning.pytorch.utilities.upgrade_checkpoint /path/to/checkpoints/folder diff --git a/source/common/child_modules.rst b/docs/source-pytorch/common/child_modules.rst similarity index 96% rename from source/common/child_modules.rst rename to docs/source-pytorch/common/child_modules.rst index d3c1832..ab6e395 100644 --- a/source/common/child_modules.rst +++ b/docs/source-pytorch/common/child_modules.rst @@ -61,7 +61,7 @@ and we can train this using the ``Trainer``: trainer = Trainer() trainer.fit(lightning_module, train_dataloader, val_dataloader) -And remember that the forward method should define the practical use of a :class:`~pytorch_lightning.core.lightning.LightningModule`. +And remember that the forward method should define the practical use of a :class:`~lightning.pytorch.core.module.LightningModule`. In this case, we want to use the ``LitAutoEncoder`` to extract image representations: .. 
code-block:: python diff --git a/source/common/console_logs.rst b/docs/source-pytorch/common/console_logs.rst similarity index 86% rename from source/common/console_logs.rst rename to docs/source-pytorch/common/console_logs.rst index 6761432..210f14b 100644 --- a/source/common/console_logs.rst +++ b/docs/source-pytorch/common/console_logs.rst @@ -17,10 +17,10 @@ or redirect output for certain modules to log files: import logging # configure logging at the root level of Lightning - logging.getLogger("pytorch_lightning").setLevel(logging.ERROR) + logging.getLogger("lightning.pytorch").setLevel(logging.ERROR) # configure logging on module level, redirect to file - logger = logging.getLogger("pytorch_lightning.core") + logger = logging.getLogger("lightning.pytorch.core") logger.addHandler(logging.FileHandler("core.log")) Read more about custom Python logging `here `_. diff --git a/docs/source-pytorch/common/early_stopping.rst b/docs/source-pytorch/common/early_stopping.rst new file mode 100644 index 0000000..c1dc00b --- /dev/null +++ b/docs/source-pytorch/common/early_stopping.rst @@ -0,0 +1,98 @@ +.. testsetup:: * + + from lightning.pytorch.callbacks.early_stopping import EarlyStopping + +.. _early_stopping: + + +############## +Early Stopping +############## + +.. video:: ../_static/fetched-s3-assets/Trainer+flags+19-+early+stopping_1.mp4 + :poster: ../_static/fetched-s3-assets/thumb_earlystop.png + :width: 400 + :muted: + + +*********************** +Stopping an Epoch Early +*********************** + +You can stop and skip the rest of the current epoch early by overriding :meth:`~lightning.pytorch.core.hooks.ModelHooks.on_train_batch_start` to return ``-1`` when some condition is met. + +If you do this repeatedly, for every epoch you had originally requested, then this will stop your entire training. 
+ + +********************** +EarlyStopping Callback +********************** + +The :class:`~lightning.pytorch.callbacks.early_stopping.EarlyStopping` callback can be used to monitor a metric and stop the training when no improvement is observed. + +To enable it: + +- Import the :class:`~lightning.pytorch.callbacks.early_stopping.EarlyStopping` callback. +- Log the metric you want to monitor using the :meth:`~lightning.pytorch.core.module.LightningModule.log` method. +- Init the callback, and set ``monitor`` to the logged metric of your choice. +- Set the ``mode`` based on the metric that needs to be monitored. +- Pass the :class:`~lightning.pytorch.callbacks.early_stopping.EarlyStopping` callback to the :class:`~lightning.pytorch.trainer.trainer.Trainer` callbacks flag. + +.. code-block:: python + + from lightning.pytorch.callbacks.early_stopping import EarlyStopping + + + class LitModel(LightningModule): + def validation_step(self, batch, batch_idx): + loss = ... + self.log("val_loss", loss) + + + model = LitModel() + trainer = Trainer(callbacks=[EarlyStopping(monitor="val_loss", mode="min")]) + trainer.fit(model) + +You can customize the callback's behavior by changing its parameters. + +.. testcode:: + + early_stop_callback = EarlyStopping(monitor="val_accuracy", min_delta=0.00, patience=3, verbose=False, mode="max") + trainer = Trainer(callbacks=[early_stop_callback]) + + +Additional parameters that stop training at extreme points: + +- ``stopping_threshold``: Stops training immediately once the monitored quantity reaches this threshold. + It is useful when we know that going beyond a certain optimal value does not further benefit us. +- ``divergence_threshold``: Stops training as soon as the monitored quantity becomes worse than this threshold. + When reaching a value this bad, we believe the model cannot recover anymore and it is better to stop early and run with different initial conditions.
+- ``check_finite``: When turned on, it stops training if the monitored metric becomes NaN or infinite. +- ``check_on_train_epoch_end``: When turned on, it checks the metric at the end of a training epoch. Use this only when you are monitoring any metric logged within + training-specific hooks on epoch-level. + + +In case you need early stopping in a different part of training, subclass :class:`~lightning.pytorch.callbacks.early_stopping.EarlyStopping` +and change where it is called: + +.. testcode:: + + class MyEarlyStopping(EarlyStopping): + def on_validation_end(self, trainer, pl_module): + # override this to disable early stopping at the end of val loop + pass + + def on_train_end(self, trainer, pl_module): + # instead, do it at the end of training loop + self._run_early_stopping_check(trainer) + +.. note:: + The :class:`~lightning.pytorch.callbacks.early_stopping.EarlyStopping` callback runs + at the end of every validation epoch by default. However, the frequency of validation + can be modified by setting various parameters in the :class:`~lightning.pytorch.trainer.trainer.Trainer`, + for example :paramref:`~lightning.pytorch.trainer.trainer.Trainer.check_val_every_n_epoch` + and :paramref:`~lightning.pytorch.trainer.trainer.Trainer.val_check_interval`. + It must be noted that the ``patience`` parameter counts the number of + validation checks with no improvement, and not the number of training epochs. + Therefore, with parameters ``check_val_every_n_epoch=10`` and ``patience=3``, the trainer + will perform at least 40 training epochs before being stopped. 
diff --git a/source/common/evaluation.rst b/docs/source-pytorch/common/evaluation.rst similarity index 100% rename from source/common/evaluation.rst rename to docs/source-pytorch/common/evaluation.rst diff --git a/source/common/evaluation_basic.rst b/docs/source-pytorch/common/evaluation_basic.rst similarity index 90% rename from source/common/evaluation_basic.rst rename to docs/source-pytorch/common/evaluation_basic.rst index 5f933ee..80da873 100644 --- a/source/common/evaluation_basic.rst +++ b/docs/source-pytorch/common/evaluation_basic.rst @@ -24,10 +24,12 @@ Datasets come with two splits. Refer to the dataset documentation to find the *t import torch.utils.data as data from torchvision import datasets + import torchvision.transforms as transforms # Load data sets - train_set = datasets.MNIST(root="MNIST", download=True, train=True) - test_set = datasets.MNIST(root="MNIST", download=True, train=False) + transform = transforms.ToTensor() + train_set = datasets.MNIST(root="MNIST", download=True, train=True, transform=transform) + test_set = datasets.MNIST(root="MNIST", download=True, train=False, transform=transform) ---- @@ -107,8 +109,8 @@ To add a validation loop, implement the **validation_step** method of the Lightn x = x.view(x.size(0), -1) z = self.encoder(x) x_hat = self.decoder(z) - test_loss = F.mse_loss(x_hat, x) - self.log("val_loss", test_loss) + val_loss = F.mse_loss(x_hat, x) + self.log("val_loss", val_loss) ---- @@ -120,9 +122,9 @@ To run the validation loop, pass in the validation set to **.fit** from torch.utils.data import DataLoader - train_set = DataLoader(train_set) - val_set = DataLoader(val_set) + train_loader = DataLoader(train_set) + valid_loader = DataLoader(valid_set) # train with both splits trainer = Trainer() - trainer.fit(model, train_set, val_set) + trainer.fit(model, train_loader, valid_loader) diff --git a/source/common/evaluation_intermediate.rst b/docs/source-pytorch/common/evaluation_intermediate.rst similarity index 84% 
rename from source/common/evaluation_intermediate.rst rename to docs/source-pytorch/common/evaluation_intermediate.rst index 7c0ca00..91f018c 100644 --- a/source/common/evaluation_intermediate.rst +++ b/docs/source-pytorch/common/evaluation_intermediate.rst @@ -22,12 +22,12 @@ Testing ******* Lightning allows the user to test their models with any compatible test dataloaders. This can be done before/after training -and is completely agnostic to :meth:`~pytorch_lightning.trainer.trainer.Trainer.fit` call. The logic used here is defined under -:meth:`~pytorch_lightning.core.lightning.LightningModule.test_step`. +and is completely agnostic to :meth:`~lightning.pytorch.trainer.trainer.Trainer.fit` call. The logic used here is defined under +:meth:`~lightning.pytorch.core.module.LightningModule.test_step`. Testing is performed using the ``Trainer`` object's ``.test()`` method. -.. automethod:: pytorch_lightning.trainer.Trainer.test +.. automethod:: lightning.pytorch.trainer.Trainer.test :noindex: @@ -44,10 +44,13 @@ To run the test set after training completes, use this method. # (1) load the best checkpoint automatically (lightning tracks this for you) trainer.test(ckpt_path="best") - # (2) test using a specific checkpoint + # (2) load the last available checkpoint + trainer.test(ckpt_path="last") + + # (3) test using a specific checkpoint trainer.test(ckpt_path="/path/to/my_checkpoint.ckpt") - # (3) test with an explicit model (will use this model and not load a checkpoint) + # (4) test with an explicit model (will use this model and not load a checkpoint) trainer.test(model) .. warning:: @@ -82,7 +85,7 @@ To run the test set on a pre-trained model, use this method. 
model = MyLightningModule.load_from_checkpoint( checkpoint_path="/path/to/pytorch_checkpoint.ckpt", - hparams_file="/path/to/test_tube/experiment/version/hparams.yaml", + hparams_file="/path/to/experiment/version/hparams.yaml", map_location=None, ) @@ -99,7 +102,7 @@ running the test set (ie: 16-bit, dp, ddp, etc...) Test with Additional DataLoaders ================================ -You can still run inference on a test dataset even if the :meth:`~pytorch_lightning.core.hooks.DataHooks.test_dataloader` method hasn't been +You can still run inference on a test dataset even if the :meth:`~lightning.pytorch.core.hooks.DataHooks.test_dataloader` method hasn't been defined within your :doc:`lightning module <../common/lightning_module>` instance. This would be the case when your test data is not available at the time your model was declared. @@ -138,13 +141,13 @@ Validation ********** Lightning allows the user to validate their models with any compatible ``val dataloaders``. This can be done before/after training. -The logic associated to the validation is defined within the :meth:`~pytorch_lightning.core.lightning.LightningModule.validation_step`. +The logic associated to the validation is defined within the :meth:`~lightning.pytorch.core.module.LightningModule.validation_step`. -Apart from this ``.validate`` has same API as ``.test``, but would rely respectively on :meth:`~pytorch_lightning.core.lightning.LightningModule.validation_step` and :meth:`~pytorch_lightning.core.lightning.LightningModule.test_step`. +Apart from this ``.validate`` has same API as ``.test``, but would rely respectively on :meth:`~lightning.pytorch.core.module.LightningModule.validation_step` and :meth:`~lightning.pytorch.core.module.LightningModule.test_step`. .. note:: ``.validate`` method uses the same validation logic being used under validation happening within - :meth:`~pytorch_lightning.trainer.trainer.Trainer.fit` call. + :meth:`~lightning.pytorch.trainer.trainer.Trainer.fit` call. .. 
warning:: @@ -153,5 +156,5 @@ Apart from this ``.validate`` has same API as ``.test``, but would rely respecti make sure all devices have same batch size in case of uneven inputs. This is helpful to make sure benchmarking for research papers is done the right way. -.. automethod:: pytorch_lightning.trainer.Trainer.validate +.. automethod:: lightning.pytorch.trainer.Trainer.validate :noindex: diff --git a/docs/source-pytorch/common/gradient_accumulation.rst b/docs/source-pytorch/common/gradient_accumulation.rst new file mode 100644 index 0000000..2a71d56 --- /dev/null +++ b/docs/source-pytorch/common/gradient_accumulation.rst @@ -0,0 +1,33 @@ +Accumulated gradients run K small batches of size ``N`` before doing an optimizer step. The effect is a large effective batch size of ``KxN``, where ``N`` is the batch size. +Internally, it doesn't stack up the batches and do a single forward pass; rather, it accumulates the gradients for K batches and then does an ``optimizer.step`` to make sure the +effective batch size is increased but there is no memory overhead. + +.. warning:: + + When using distributed training, e.g. DDP, with, let's say, ``P`` devices, each device accumulates independently, i.e. it stores the gradients + after each ``loss.backward()`` and doesn't sync the gradients across the devices until we call ``optimizer.step()``. So for each accumulation + step, the effective batch size on each device will remain ``N*K``, but right before the ``optimizer.step()``, the gradient sync will make the effective + batch size ``P*N*K``. For DP, since the batch is split across devices, the final effective batch size will be ``N*K``. + +.. 
testcode:: + + # DEFAULT (ie: no accumulated grads) + trainer = Trainer(accumulate_grad_batches=1) + + # Accumulate gradients for 7 batches + trainer = Trainer(accumulate_grad_batches=7) + +Optionally, you can make the ``accumulate_grad_batches`` value change over time by using the :class:`~lightning.pytorch.callbacks.gradient_accumulation_scheduler.GradientAccumulationScheduler`. +Pass in a scheduling dictionary, where the key represents the epoch at which the value for gradient accumulation should be updated. + +.. testcode:: + + from lightning.pytorch.callbacks import GradientAccumulationScheduler + + # till 5th epoch, it will accumulate every 8 batches. From 5th epoch + # till 9th epoch it will accumulate every 4 batches and after that no accumulation + # will happen. Note that you need to use zero-indexed epoch keys here + accumulator = GradientAccumulationScheduler(scheduling={0: 8, 4: 4, 8: 1}) + trainer = Trainer(callbacks=accumulator) + +Note: Not all strategies and accelerators support variable gradient accumulation windows. diff --git a/docs/source-pytorch/common/hyperparameters.rst b/docs/source-pytorch/common/hyperparameters.rst new file mode 100644 index 0000000..ce35627 --- /dev/null +++ b/docs/source-pytorch/common/hyperparameters.rst @@ -0,0 +1,52 @@ +:orphan: + +Configure hyperparameters from the CLI +-------------------------------------- + +You can use any CLI tool you want with Lightning. +For beginners, we recommend using Python's built-in argument parser. + + +---- + + +ArgumentParser +^^^^^^^^^^^^^^ + +The :class:`~argparse.ArgumentParser` is a built-in feature in Python that lets you build CLI programs. +You can use it to make hyperparameters and other training settings available from the command line: + +.. 
code-block:: python + + from argparse import ArgumentParser + + parser = ArgumentParser() + + # Trainer arguments + parser.add_argument("--devices", type=int, default=2) + + # Hyperparameters for the model + parser.add_argument("--layer_1_dim", type=int, default=128) + + # Parse the user inputs and defaults (returns a argparse.Namespace) + args = parser.parse_args() + + # Use the parsed arguments in your program + trainer = Trainer(devices=args.devices) + model = MyModel(layer_1_dim=args.layer_1_dim) + +This allows you to call your program like so: + +.. code-block:: bash + + python trainer.py --layer_1_dim 64 --devices 1 + +---- + + +LightningCLI +^^^^^^^^^^^^ + +Python's argument parser works well for simple use cases, but it can become cumbersome to maintain for larger projects. +For example, every time you add, change, or delete an argument from your model, you will have to add, edit, or remove the corresponding ``parser.add_argument`` code. +The :doc:`Lightning CLI <../cli/lightning_cli>` provides a seamless integration with the Trainer and LightningModule for which the CLI arguments get generated automatically for you! diff --git a/docs/source-pytorch/common/index.rst b/docs/source-pytorch/common/index.rst new file mode 100644 index 0000000..b5f44f7 --- /dev/null +++ b/docs/source-pytorch/common/index.rst @@ -0,0 +1,200 @@ +.. 
toctree:: + :maxdepth: 1 + :hidden: + + evaluation + ../model/build_model + ../cli/lightning_cli + progress_bar + ../deploy/production + ../advanced/training_tricks + ../tuning/profiler + Manage experiments <../visualize/logging_intermediate> + Organize existing PyTorch into Lightning <../starter/converting> + ../clouds/cluster + Save and load model progress + Save memory with half-precision + ../advanced/model_parallel + Train on single or multiple GPUs <../accelerators/gpu> + Train on single or multiple HPUs <../integrations/hpu/index> + Train on single or multiple IPUs <../accelerators/ipu> + Train on single or multiple TPUs <../accelerators/tpu> + Train on MPS <../accelerators/mps> + Use a pretrained model <../advanced/pretrained> + ../data/data + ../model/own_your_loop + +############# +How-to Guides +############# + +.. raw:: html + +
+
+ +.. displayitem:: + :header: Avoid overfitting + :description: Learn how to add validation and test loops + :button_link: ../common/evaluation.html + :col_css: col-md-4 + :height: 180 + +.. displayitem:: + :header: Build a model + :description: Step by step guide to build your model + :button_link: ../model/build_model.html + :col_css: col-md-4 + :height: 180 + +.. displayitem:: + :header: Configure hyperparameters from the CLI + :description: Make your experiments modular via command line interface + :button_link: ../cli/lightning_cli.html + :col_css: col-md-4 + :height: 180 + +.. displayitem:: + :header: Customize the progress bar + :description: Change the progress bar monitoring and tracking + :button_link: ../common/progress_bar.html + :col_css: col-md-4 + :height: 180 + +.. displayitem:: + :header: Deploy models into production + :description: Deploy models with different levels of scale + :button_link: ../deploy/production.html + :col_css: col-md-4 + :height: 180 + +.. displayitem:: + :header: Optimize training + :description: Explore advanced training techniques + :button_link: ../advanced/training_tricks.html + :col_css: col-md-4 + :height: 180 + +.. displayitem:: + :header: Find bottlenecks in your code + :description: Learn how to profile your experiments to find bottlenecks + :button_link: ../tuning/profiler.html + :col_css: col-md-4 + :height: 180 + +.. displayitem:: + :header: Finetune a model + :description: Learn how to use pretrained models + :col_css: col-md-4 + :button_link: ../advanced/transfer_learning.html + :height: 180 + +.. displayitem:: + :header: Manage data + :description: How to use basic to advanced data techniques + :button_link: ../data/data.html + :col_css: col-md-4 + :height: 180 + +.. displayitem:: + :header: Manage experiments + :description: Learn to track and visualize with experiment managers + :button_link: ../visualize/logging_intermediate.html + :col_css: col-md-4 + :height: 180 + +.. 
displayitem:: + :header: Organize existing PyTorch into Lightning + :description: Convert your vanilla PyTorch to Lightning + :button_link: ../starter/converting.html + :col_css: col-md-4 + :height: 180 + +.. displayitem:: + :header: Run on an on-prem cluster + :description: Learn to run on your own cluster + :button_link: ../clouds/cluster.html + :col_css: col-md-4 + :height: 180 + +.. displayitem:: + :header: Save and load model progress + :description: Save and load progress with checkpoints + :button_link: ../common/checkpointing.html + :col_css: col-md-4 + :height: 180 + +.. displayitem:: + :header: Save memory with half-precision + :description: Use precision techniques to train faster and save memory + :button_link: ../common/precision.html + :col_css: col-md-4 + :height: 180 + +.. displayitem:: + :header: Train 1 trillion+ parameter models + :description: Scale GPU training to 1 trillion + parameter models + :button_link: ../advanced/model_parallel.html + :col_css: col-md-4 + :height: 180 + +.. displayitem:: + :header: Train on single or multiple GPUs + :description: Train models faster with GPU accelerators + :button_link: ../accelerators/gpu.html + :col_css: col-md-4 + :height: 180 + +.. displayitem:: + :header: Train on single or multiple HPUs + :description: Train models faster with HPU accelerators + :button_link: ../integrations/hpu/index.html + :col_css: col-md-4 + :height: 180 + +.. displayitem:: + :header: Train on single or multiple IPUs + :description: Train models faster with IPU accelerators + :button_link: ../accelerators/ipu.html + :col_css: col-md-4 + :height: 180 + +.. displayitem:: + :header: Train on single or multiple TPUs + :description: Train models faster with TPU accelerators + :button_link: ../accelerators/tpu.html + :col_css: col-md-4 + :height: 180 + +.. 
displayitem:: + :header: Train on MPS + :description: Train models faster with Apple Silicon GPUs + :button_link: ../accelerators/mps.html + :col_css: col-md-4 + :height: 180 + +.. displayitem:: + :header: Track and Visualize Experiments + :description: Learn to track and visualize experiments + :col_css: col-md-4 + :button_link: ../visualize/logging_intermediate.html + :height: 180 + +.. displayitem:: + :header: Use a pretrained model + :description: Improve results with transfer learning on pretrained models + :button_link: ../advanced/pretrained.html + :col_css: col-md-4 + :height: 180 + +.. displayitem:: + :header: Use a pure PyTorch training loop + :description: Run your pure PyTorch loop with Lightning + :button_link: ../model/own_your_loop.html + :col_css: col-md-4 + :height: 180 + +.. raw:: html + +
+
diff --git a/docs/source-pytorch/common/lightning_module.rst b/docs/source-pytorch/common/lightning_module.rst new file mode 100644 index 0000000..4b42375 --- /dev/null +++ b/docs/source-pytorch/common/lightning_module.rst @@ -0,0 +1,1442 @@ +.. role:: hidden + :class: hidden-section + +.. _lightning_module: + +############### +LightningModule +############### + +A :class:`~lightning.pytorch.core.module.LightningModule` organizes your PyTorch code into 6 sections: + +- Initialization (``__init__`` and :meth:`~lightning.pytorch.core.hooks.ModelHooks.setup`). +- Train Loop (:meth:`~lightning.pytorch.core.module.LightningModule.training_step`) +- Validation Loop (:meth:`~lightning.pytorch.core.module.LightningModule.validation_step`) +- Test Loop (:meth:`~lightning.pytorch.core.module.LightningModule.test_step`) +- Prediction Loop (:meth:`~lightning.pytorch.core.module.LightningModule.predict_step`) +- Optimizers and LR Schedulers (:meth:`~lightning.pytorch.core.module.LightningModule.configure_optimizers`) + +When you convert to use Lightning, the code IS NOT abstracted - just organized. +All the other code that's not in the :class:`~lightning.pytorch.core.module.LightningModule` +has been automated for you by the :class:`~lightning.pytorch.trainer.trainer.Trainer`. + +| + + .. code-block:: python + + net = MyLightningModuleNet() + trainer = Trainer() + trainer.fit(net) + +There are no ``.cuda()`` or ``.to(device)`` calls required. Lightning does these for you. + +| + + .. code-block:: python + + # don't do in Lightning + x = torch.Tensor(2, 3) + x = x.cuda() + x = x.to(device) + + # do this instead + x = x # leave it alone! + + # or to init a new tensor + new_x = torch.Tensor(2, 3) + new_x = new_x.to(x) + +When running under a distributed strategy, Lightning handles the distributed sampler for you by default. + +| + + .. code-block:: python + + # Don't do in Lightning... + data = MNIST(...) 
+ sampler = DistributedSampler(data) + DataLoader(data, sampler=sampler) + + # do this instead + data = MNIST(...) + DataLoader(data) + +A :class:`~lightning.pytorch.core.module.LightningModule` is a :class:`torch.nn.Module` but with added functionality. Use it as such! + +| + + .. code-block:: python + + net = Net.load_from_checkpoint(PATH) + net.freeze() + out = net(x) + +Thus, to use Lightning, you just need to organize your code which takes about 30 minutes, +(and let's be real, you probably should do anyway). + +------------ + +*************** +Starter Example +*************** + +Here are the only required methods. + +.. code-block:: python + + import lightning.pytorch as pl + import torch.nn as nn + import torch.nn.functional as F + + + class LitModel(pl.LightningModule): + def __init__(self): + super().__init__() + self.l1 = nn.Linear(28 * 28, 10) + + def forward(self, x): + return torch.relu(self.l1(x.view(x.size(0), -1))) + + def training_step(self, batch, batch_idx): + x, y = batch + y_hat = self(x) + loss = F.cross_entropy(y_hat, y) + return loss + + def configure_optimizers(self): + return torch.optim.Adam(self.parameters(), lr=0.02) + +Which you can train by doing: + +.. code-block:: python + + train_loader = DataLoader(MNIST(os.getcwd(), download=True, transform=transforms.ToTensor())) + trainer = pl.Trainer(max_epochs=1) + model = LitModel() + + trainer.fit(model, train_dataloaders=train_loader) + +The LightningModule has many convenience methods, but the core ones you need to know about are: + +.. 
list-table:: + :widths: 50 50 + :header-rows: 1 + + * - Name + - Description + * - ``__init__`` and :meth:`~lightning.pytorch.core.hooks.ModelHooks.setup` + - Define initialization here + * - :meth:`~lightning.pytorch.core.module.LightningModule.forward` + - To run data through your model only (separate from ``training_step``) + * - :meth:`~lightning.pytorch.core.module.LightningModule.training_step` + - the complete training step + * - :meth:`~lightning.pytorch.core.module.LightningModule.validation_step` + - the complete validation step + * - :meth:`~lightning.pytorch.core.module.LightningModule.test_step` + - the complete test step + * - :meth:`~lightning.pytorch.core.module.LightningModule.predict_step` + - the complete prediction step + * - :meth:`~lightning.pytorch.core.module.LightningModule.configure_optimizers` + - define optimizers and LR schedulers + +---------- + +******** +Training +******** + +Training Loop +============= + +To activate the training loop, override the :meth:`~lightning.pytorch.core.module.LightningModule.training_step` method. + +.. code-block:: python + + class LitClassifier(pl.LightningModule): + def __init__(self, model): + super().__init__() + self.model = model + + def training_step(self, batch, batch_idx): + x, y = batch + y_hat = self.model(x) + loss = F.cross_entropy(y_hat, y) + return loss + +Under the hood, Lightning does the following (pseudocode): + +.. code-block:: python + + # put model in train mode and enable gradient calculation + model.train() + torch.set_grad_enabled(True) + + for batch_idx, batch in enumerate(train_dataloader): + loss = training_step(batch, batch_idx) + + # clear gradients + optimizer.zero_grad() + + # backward + loss.backward() + + # update parameters + optimizer.step() + + +Train Epoch-level Metrics +========================= + +If you want to calculate epoch-level metrics and log them, use :meth:`~lightning.pytorch.core.module.LightningModule.log`. + +.. 
code-block:: python + + def training_step(self, batch, batch_idx): + x, y = batch + y_hat = self.model(x) + loss = F.cross_entropy(y_hat, y) + + # logs metrics for each training_step, + # and the average across the epoch, to the progress bar and logger + self.log("train_loss", loss, on_step=True, on_epoch=True, prog_bar=True, logger=True) + return loss + +The :meth:`~lightning.pytorch.core.module.LightningModule.log` method automatically reduces the +requested metrics across a complete epoch and devices. Here's the pseudocode of what it does under the hood: + +.. code-block:: python + + outs = [] + for batch_idx, batch in enumerate(train_dataloader): + # forward + loss = training_step(batch, batch_idx) + outs.append(loss.detach()) + + # clear gradients + optimizer.zero_grad() + # backward + loss.backward() + # update parameters + optimizer.step() + + # note: in reality, we do this incrementally, instead of keeping all outputs in memory + epoch_metric = torch.mean(torch.stack(outs)) + +Train Epoch-level Operations +============================ + +In the case that you need to make use of all the outputs from each :meth:`~lightning.pytorch.LightningModule.training_step`, +override the :meth:`~lightning.pytorch.LightningModule.on_train_epoch_end` method. + +.. code-block:: python + + def __init__(self): + super().__init__() + self.training_step_outputs = [] + + + def training_step(self, batch, batch_idx): + x, y = batch + y_hat = self.model(x) + loss = F.cross_entropy(y_hat, y) + preds = ... + self.training_step_outputs.append(preds) + return loss + + + def on_train_epoch_end(self): + all_preds = torch.stack(self.training_step_outputs) + # do something with all preds + ... + self.training_step_outputs.clear() # free memory + + +------------------ + +********** +Validation +********** + +Validation Loop +=============== + +To activate the validation loop while training, override the :meth:`~lightning.pytorch.core.module.LightningModule.validation_step` method. + +.. 
code-block:: python + + class LitModel(pl.LightningModule): + def validation_step(self, batch, batch_idx): + x, y = batch + y_hat = self.model(x) + loss = F.cross_entropy(y_hat, y) + self.log("val_loss", loss) + +Under the hood, Lightning does the following (pseudocode): + +.. code-block:: python + + # ... + for batch_idx, batch in enumerate(train_dataloader): + loss = model.training_step(batch, batch_idx) + loss.backward() + # ... + + if validate_at_some_point: + # disable grads + batchnorm + dropout + torch.set_grad_enabled(False) + model.eval() + + # ----------------- VAL LOOP --------------- + for val_batch_idx, val_batch in enumerate(val_dataloader): + val_out = model.validation_step(val_batch, val_batch_idx) + # ----------------- VAL LOOP --------------- + + # enable grads + batchnorm + dropout + torch.set_grad_enabled(True) + model.train() + +You can also run just the validation loop on your validation dataloaders by overriding :meth:`~lightning.pytorch.core.module.LightningModule.validation_step` +and calling :meth:`~lightning.pytorch.trainer.trainer.Trainer.validate`. + +.. code-block:: python + + model = Model() + trainer = Trainer() + trainer.validate(model) + +.. note:: + + It is recommended to validate on single device to ensure each sample/batch gets evaluated exactly once. + This is helpful to make sure benchmarking for research papers is done the right way. Otherwise, in a + multi-device setting, samples could occur duplicated when :class:`~torch.utils.data.distributed.DistributedSampler` + is used, for eg. with ``strategy="ddp"``. It replicates some samples on some devices to make sure all devices have + same batch size in case of uneven inputs. + + +Validation Epoch-level Metrics +============================== + +In the case that you need to make use of all the outputs from each :meth:`~lightning.pytorch.LightningModule.validation_step`, +override the :meth:`~lightning.pytorch.LightningModule.on_validation_epoch_end` method. 
+Note that this method is called before :meth:`~lightning.pytorch.LightningModule.on_train_epoch_end`. + +.. code-block:: python + + def __init__(self): + super().__init__() + self.validation_step_outputs = [] + + + def validation_step(self, batch, batch_idx): + x, y = batch + y_hat = self.model(x) + loss = F.cross_entropy(y_hat, y) + pred = ... + self.validation_step_outputs.append(pred) + return pred + + + def on_validation_epoch_end(self): + all_preds = torch.stack(self.validation_step_outputs) + # do something with all preds + ... + self.validation_step_outputs.clear() # free memory + +---------------- + +******* +Testing +******* + +Test Loop +========= + +The process for enabling a test loop is the same as the process for enabling a validation loop. Please refer to +the section above for details. For this you need to override the :meth:`~lightning.pytorch.core.module.LightningModule.test_step` method. + +The only difference is that the test loop is only called when :meth:`~lightning.pytorch.trainer.trainer.Trainer.test` is used. + +.. code-block:: python + + model = Model() + trainer = Trainer() + trainer.fit(model) + + # automatically loads the best weights for you + trainer.test(model) + +There are two ways to call ``test()``: + +.. code-block:: python + + # call after training + trainer = Trainer() + trainer.fit(model) + + # automatically auto-loads the best weights from the previous run + trainer.test(dataloaders=test_dataloader) + + # or call with pretrained model + model = MyLightningModule.load_from_checkpoint(PATH) + trainer = Trainer() + trainer.test(model, dataloaders=test_dataloader) + +.. note:: + + It is recommended to validate on single device to ensure each sample/batch gets evaluated exactly once. + This is helpful to make sure benchmarking for research papers is done the right way. Otherwise, in a + multi-device setting, samples could occur duplicated when :class:`~torch.utils.data.distributed.DistributedSampler` + is used, for eg. 
with ``strategy="ddp"``. It replicates some samples on some devices to make sure all devices have + same batch size in case of uneven inputs. + + +---------- + +********* +Inference +********* + +Prediction Loop +=============== + +By default, the :meth:`~lightning.pytorch.core.module.LightningModule.predict_step` method runs the +:meth:`~lightning.pytorch.core.module.LightningModule.forward` method. In order to customize this behaviour, +simply override the :meth:`~lightning.pytorch.core.module.LightningModule.predict_step` method. + +For the example let's override ``predict_step`` and try out `Monte Carlo Dropout `_: + +.. code-block:: python + + class LitMCdropoutModel(pl.LightningModule): + def __init__(self, model, mc_iteration): + super().__init__() + self.model = model + self.dropout = nn.Dropout() + self.mc_iteration = mc_iteration + + def predict_step(self, batch, batch_idx): + # enable Monte Carlo Dropout + self.dropout.train() + + # take average of `self.mc_iteration` iterations + pred = torch.vstack([self.dropout(self.model(x)).unsqueeze(0) for _ in range(self.mc_iteration)]).mean(dim=0) + return pred + +Under the hood, Lightning does the following (pseudocode): + +.. code-block:: python + + # disable grads + batchnorm + dropout + torch.set_grad_enabled(False) + model.eval() + all_preds = [] + + for batch_idx, batch in enumerate(predict_dataloader): + pred = model.predict_step(batch, batch_idx) + all_preds.append(pred) + +There are two ways to call ``predict()``: + +.. 
code-block:: python + + # call after training + trainer = Trainer() + trainer.fit(model) + + # automatically auto-loads the best weights from the previous run + predictions = trainer.predict(dataloaders=predict_dataloader) + + # or call with pretrained model + model = MyLightningModule.load_from_checkpoint(PATH) + trainer = Trainer() + predictions = trainer.predict(model, dataloaders=test_dataloader) + +Inference in Research +===================== + +If you want to perform inference with the system, you can add a ``forward`` method to the LightningModule. + +.. note:: When using forward, you are responsible to call :func:`~torch.nn.Module.eval` and use the :func:`~torch.no_grad` context manager. + +.. code-block:: python + + class Autoencoder(pl.LightningModule): + def forward(self, x): + return self.decoder(x) + + + model = Autoencoder() + model.eval() + with torch.no_grad(): + reconstruction = model(embedding) + +The advantage of adding a forward is that in complex systems, you can do a much more involved inference procedure, +such as text generation: + +.. code-block:: python + + class Seq2Seq(pl.LightningModule): + def forward(self, x): + embeddings = self(x) + hidden_states = self.encoder(embeddings) + for h in hidden_states: + # decode + ... + return decoded + +In the case where you want to scale your inference, you should be using +:meth:`~lightning.pytorch.core.module.LightningModule.predict_step`. + +.. code-block:: python + + class Autoencoder(pl.LightningModule): + def forward(self, x): + return self.decoder(x) + + def predict_step(self, batch, batch_idx, dataloader_idx=0): + # this calls forward + return self(batch) + + + data_module = ... + model = Autoencoder() + trainer = Trainer(accelerator="gpu", devices=2) + trainer.predict(model, data_module) + +Inference in Production +======================= + +For cases like production, you might want to iterate different models inside a LightningModule. + +.. 
code-block:: python + + from torchmetrics.functional import accuracy + + + class ClassificationTask(pl.LightningModule): + def __init__(self, model): + super().__init__() + self.model = model + + def training_step(self, batch, batch_idx): + x, y = batch + y_hat = self.model(x) + loss = F.cross_entropy(y_hat, y) + return loss + + def validation_step(self, batch, batch_idx): + loss, acc = self._shared_eval_step(batch, batch_idx) + metrics = {"val_acc": acc, "val_loss": loss} + self.log_dict(metrics) + return metrics + + def test_step(self, batch, batch_idx): + loss, acc = self._shared_eval_step(batch, batch_idx) + metrics = {"test_acc": acc, "test_loss": loss} + self.log_dict(metrics) + return metrics + + def _shared_eval_step(self, batch, batch_idx): + x, y = batch + y_hat = self.model(x) + loss = F.cross_entropy(y_hat, y) + acc = accuracy(y_hat, y) + return loss, acc + + def predict_step(self, batch, batch_idx, dataloader_idx=0): + x, y = batch + y_hat = self.model(x) + return y_hat + + def configure_optimizers(self): + return torch.optim.Adam(self.model.parameters(), lr=0.02) + +Then pass in any arbitrary model to be fit with this task + +.. code-block:: python + + for model in [resnet50(), vgg16(), BidirectionalRNN()]: + task = ClassificationTask(model) + + trainer = Trainer(accelerator="gpu", devices=2) + trainer.fit(task, train_dataloaders=train_dataloader, val_dataloaders=val_dataloader) + +Tasks can be arbitrarily complex such as implementing GAN training, self-supervised or even RL. + +.. code-block:: python + + class GANTask(pl.LightningModule): + def __init__(self, generator, discriminator): + super().__init__() + self.generator = generator + self.discriminator = discriminator + + ... + +When used like this, the model can be separated from the Task and thus used in production without needing to keep it in +a ``LightningModule``. + +The following example shows how you can run inference in the Python runtime: + +.. 
code-block:: python + + task = ClassificationTask(model) + trainer = Trainer(accelerator="gpu", devices=2) + trainer.fit(task, train_dataloader, val_dataloader) + trainer.save_checkpoint("best_model.ckpt") + + # use model after training or load weights and drop into the production system + model = ClassificationTask.load_from_checkpoint("best_model.ckpt") + x = ... + model.eval() + with torch.no_grad(): + y_hat = model(x) + +Check out :ref:`Inference in Production ` guide to learn about the possible ways to perform inference in production. + + +----------- + + +******************** +Save Hyperparameters +******************** + +Often times we train many versions of a model. You might share that model or come back to it a few months later at which +point it is very useful to know how that model was trained (i.e.: what learning rate, neural network, etc...). + +Lightning has a standardized way of saving the information for you in checkpoints and YAML files. The goal here is to +improve readability and reproducibility. + +save_hyperparameters +==================== + +Use :meth:`~lightning.pytorch.core.module.LightningModule.save_hyperparameters` within your +:class:`~lightning.pytorch.core.module.LightningModule`'s ``__init__`` method. It will enable Lightning to store all the +provided arguments under the ``self.hparams`` attribute. These hyperparameters will also be stored within the model +checkpoint, which simplifies model re-instantiation after training. + +.. code-block:: python + + class LitMNIST(LightningModule): + def __init__(self, layer_1_dim=128, learning_rate=1e-2): + super().__init__() + # call this to save (layer_1_dim=128, learning_rate=1e-2) to the checkpoint + self.save_hyperparameters() + + # equivalent + self.save_hyperparameters("layer_1_dim", "learning_rate") + + # Now possible to access layer_1_dim from hparams + self.hparams.layer_1_dim + + +In addition, loggers that support it will automatically log the contents of ``self.hparams``. 
+ +Excluding hyperparameters +========================= + +By default, every parameter of the ``__init__`` method will be considered a hyperparameter to the LightningModule. +However, sometimes some parameters need to be excluded from saving, for example when they are not serializable. Those +parameters should be provided back when reloading the LightningModule. In this case, exclude them explicitly: + +.. code-block:: python + + class LitMNIST(LightningModule): + def __init__(self, loss_fx, generator_network, layer_1_dim=128): + super().__init__() + self.layer_1_dim = layer_1_dim + self.loss_fx = loss_fx + + # call this to save only (layer_1_dim=128) to the checkpoint + self.save_hyperparameters("layer_1_dim") + + # equivalent + self.save_hyperparameters(ignore=["loss_fx", "generator_network"]) + + +load_from_checkpoint +==================== + +LightningModules that have hyperparameters automatically saved with +:meth:`~lightning.pytorch.core.module.LightningModule.save_hyperparameters` can conveniently be loaded and instantiated +directly from a checkpoint with :meth:`~lightning.pytorch.core.module.LightningModule.load_from_checkpoint`: + +.. code-block:: python + + # to load specify the other args + model = LitMNIST.load_from_checkpoint(PATH, loss_fx=torch.nn.SomeOtherLoss, generator_network=MyGenerator()) + + +If parameters were excluded, they need to be provided at the time of loading: + +.. code-block:: python + + # the excluded parameters were `loss_fx` and `generator_network` + model = LitMNIST.load_from_checkpoint(PATH, loss_fx=torch.nn.SomeOtherLoss, generator_network=MyGenerator()) + + +----------- + + +************* +Child Modules +************* + +.. include:: ../common/child_modules.rst + +----------- + +******************* +LightningModule API +******************* + + +Methods +======= + +all_gather +~~~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.all_gather + :noindex: + +configure_callbacks +~~~~~~~~~~~~~~~~~~~ + +.. 
automethod:: lightning.pytorch.core.module.LightningModule.configure_callbacks + :noindex: + +configure_optimizers +~~~~~~~~~~~~~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.configure_optimizers + :noindex: + +forward +~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.forward + :noindex: + +freeze +~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.freeze + :noindex: + +.. _lm-log: + +log +~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.log + :noindex: + +log_dict +~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.log_dict + :noindex: + +lr_schedulers +~~~~~~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.lr_schedulers + :noindex: + +manual_backward +~~~~~~~~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.manual_backward + :noindex: + +optimizers +~~~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.optimizers + :noindex: + +print +~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.print + :noindex: + +predict_step +~~~~~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.predict_step + :noindex: + +save_hyperparameters +~~~~~~~~~~~~~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.save_hyperparameters + :noindex: + +toggle_optimizer +~~~~~~~~~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.toggle_optimizer + :noindex: + +test_step +~~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.test_step + :noindex: + +to_onnx +~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.to_onnx + :noindex: + +to_torchscript +~~~~~~~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.to_torchscript + :noindex: + +training_step +~~~~~~~~~~~~~ + +.. 
automethod:: lightning.pytorch.core.module.LightningModule.training_step + :noindex: + +unfreeze +~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.unfreeze + :noindex: + +untoggle_optimizer +~~~~~~~~~~~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.untoggle_optimizer + :noindex: + +validation_step +~~~~~~~~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.validation_step + :noindex: + +----------- + +Properties +========== + +These are properties available in a LightningModule. + +current_epoch +~~~~~~~~~~~~~ + +The number of epochs run. + +.. code-block:: python + + def training_step(self, batch, batch_idx): + if self.current_epoch == 0: + ... + +device +~~~~~~ + +The device the module is on. Use it to keep your code device agnostic. + +.. code-block:: python + + def training_step(self, batch, batch_idx): + z = torch.rand(2, 3, device=self.device) + +global_rank +~~~~~~~~~~~ + +The ``global_rank`` is the index of the current process across all nodes and devices. +Lightning will perform some operations such as logging, weight checkpointing only when ``global_rank=0``. You +usually do not need to use this property, but it is useful to know how to access it if needed. + +.. code-block:: python + + def training_step(self, batch, batch_idx): + if self.global_rank == 0: + # do something only once across all the nodes + ... + +global_step +~~~~~~~~~~~ + +The number of optimizer steps taken (does not reset each epoch). +This includes multiple optimizers (if enabled). + +.. code-block:: python + + def training_step(self, batch, batch_idx): + self.logger.experiment.log_image(..., step=self.global_step) + +hparams +~~~~~~~ + +The arguments passed through ``LightningModule.__init__()`` and saved by calling +:meth:`~lightning.pytorch.core.mixins.hparams_mixin.HyperparametersMixin.save_hyperparameters` could be accessed by the ``hparams`` attribute. + +.. 
code-block:: python + + def __init__(self, learning_rate): + self.save_hyperparameters() + + + def configure_optimizers(self): + return Adam(self.parameters(), lr=self.hparams.learning_rate) + +logger +~~~~~~ + +The current logger being used (tensorboard or other supported logger) + +.. code-block:: python + + def training_step(self, batch, batch_idx): + # the generic logger (same no matter if tensorboard or other supported logger) + self.logger + + # the particular logger + tensorboard_logger = self.logger.experiment + +loggers +~~~~~~~ + +The list of loggers currently being used by the Trainer. + +.. code-block:: python + + def training_step(self, batch, batch_idx): + # List of Logger objects + loggers = self.loggers + for logger in loggers: + logger.log_metrics({"foo": 1.0}) + +local_rank +~~~~~~~~~~~ + +The ``local_rank`` is the index of the current process across all the devices for the current node. +You usually do not need to use this property, but it is useful to know how to access it if needed. +For example, if using 10 machines (or nodes), the GPU at index 0 on each machine has local_rank = 0. + +.. code-block:: python + + def training_step(self, batch, batch_idx): + if self.local_rank == 0: + # do something only once across each node + ... + +precision +~~~~~~~~~ + +The type of precision used: + +.. code-block:: python + + def training_step(self, batch, batch_idx): + if self.precision == 16: + ... + +trainer +~~~~~~~ + +Pointer to the trainer + +.. code-block:: python + + def training_step(self, batch, batch_idx): + max_steps = self.trainer.max_steps + any_flag = self.trainer.any_flag + +prepare_data_per_node +~~~~~~~~~~~~~~~~~~~~~ + +If set to ``True`` will call ``prepare_data()`` on LOCAL_RANK=0 for every node. +If set to ``False`` will only call from NODE_RANK=0, LOCAL_RANK=0. + +.. 
testcode:: + + class LitModel(LightningModule): + def __init__(self): + super().__init__() + self.prepare_data_per_node = True + +automatic_optimization +~~~~~~~~~~~~~~~~~~~~~~ + +When set to ``False``, Lightning does not automate the optimization process. This means you are responsible for handling +your optimizers. However, we do take care of precision and any accelerators used. + +See :ref:`manual optimization ` for details. + +.. code-block:: python + + def __init__(self): + self.automatic_optimization = False + + + def training_step(self, batch, batch_idx): + opt = self.optimizers(use_pl_optimizer=True) + + loss = ... + opt.zero_grad() + self.manual_backward(loss) + opt.step() + +Manual optimization is most useful for research topics like reinforcement learning, sparse coding, and GAN research. +It is required when you are using 2+ optimizers because with automatic optimization, you can only use one optimizer. + +.. code-block:: python + + def __init__(self): + self.automatic_optimization = False + + + def training_step(self, batch, batch_idx): + # access your optimizers with use_pl_optimizer=False. Default is True + opt_a, opt_b = self.optimizers(use_pl_optimizer=True) + + gen_loss = ... + opt_a.zero_grad() + self.manual_backward(gen_loss) + opt_a.step() + + disc_loss = ... + opt_b.zero_grad() + self.manual_backward(disc_loss) + opt_b.step() + +example_input_array +~~~~~~~~~~~~~~~~~~~ + +Set and access example_input_array, which basically represents a single batch. + +.. code-block:: python + + def __init__(self): + self.example_input_array = ... + self.generator = ... + + + def on_train_epoch_end(self): + # generate some images using the example_input_array + gen_images = self.generator(self.example_input_array) + +-------------- + +.. _lightning_hooks: + +Hooks +===== + +This is the pseudocode to describe the structure of :meth:`~lightning.pytorch.trainer.Trainer.fit`. +The inputs and outputs of each function are not represented for simplicity. 
Please check each function's API reference +for more information. + +.. code-block:: python + + def fit(self): + if global_rank == 0: + # prepare data is called on GLOBAL_ZERO only + prepare_data() + + configure_callbacks() + + with parallel(devices): + # devices can be GPUs, TPUs, ... + train_on_device(model) + + + def train_on_device(model): + # called PER DEVICE + setup("fit") + configure_optimizers() + on_fit_start() + + # the sanity check runs here + + on_train_start() + for epoch in epochs: + fit_loop() + on_train_end() + + on_fit_end() + teardown("fit") + + + def fit_loop(): + model.train() + torch.set_grad_enabled(True) + + on_train_epoch_start() + + for batch in train_dataloader(): + on_train_batch_start() + + on_before_batch_transfer() + transfer_batch_to_device() + on_after_batch_transfer() + + out = training_step() + + on_before_zero_grad() + optimizer_zero_grad() + + on_before_backward() + backward() + on_after_backward() + + on_before_optimizer_step() + configure_gradient_clipping() + optimizer_step() + + on_train_batch_end(out, batch, batch_idx) + + if should_check_val: + val_loop() + + on_train_epoch_end() + + + def val_loop(): + on_validation_model_eval() # calls `model.eval()` + torch.set_grad_enabled(False) + + on_validation_start() + on_validation_epoch_start() + + for batch_idx, batch in enumerate(val_dataloader()): + on_validation_batch_start(batch, batch_idx) + + batch = on_before_batch_transfer(batch) + batch = transfer_batch_to_device(batch) + batch = on_after_batch_transfer(batch) + + out = validation_step(batch, batch_idx) + + on_validation_batch_end(out, batch, batch_idx) + + on_validation_epoch_end() + on_validation_end() + + # set up for train + on_validation_model_train() # calls `model.train()` + torch.set_grad_enabled(True) + +backward +~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.backward + :noindex: + +on_before_backward +~~~~~~~~~~~~~~~~~~ + +.. 
automethod:: lightning.pytorch.core.module.LightningModule.on_before_backward + :noindex: + +on_after_backward +~~~~~~~~~~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.on_after_backward + :noindex: + +on_before_zero_grad +~~~~~~~~~~~~~~~~~~~ +.. automethod:: lightning.pytorch.core.module.LightningModule.on_before_zero_grad + :noindex: + +on_fit_start +~~~~~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.on_fit_start + :noindex: + +on_fit_end +~~~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.on_fit_end + :noindex: + + +on_load_checkpoint +~~~~~~~~~~~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.on_load_checkpoint + :noindex: + +on_save_checkpoint +~~~~~~~~~~~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.on_save_checkpoint + :noindex: + +load_from_checkpoint +~~~~~~~~~~~~~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.load_from_checkpoint + :noindex: + +on_train_start +~~~~~~~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.on_train_start + :noindex: + +on_train_end +~~~~~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.on_train_end + :noindex: + +on_validation_start +~~~~~~~~~~~~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.on_validation_start + :noindex: + +on_validation_end +~~~~~~~~~~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.on_validation_end + :noindex: + +on_test_batch_start +~~~~~~~~~~~~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.on_test_batch_start + :noindex: + +on_test_batch_end +~~~~~~~~~~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.on_test_batch_end + :noindex: + +on_test_epoch_start +~~~~~~~~~~~~~~~~~~~ + +.. 
automethod:: lightning.pytorch.core.module.LightningModule.on_test_epoch_start + :noindex: + +on_test_epoch_end +~~~~~~~~~~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.on_test_epoch_end + :noindex: + +on_test_start +~~~~~~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.on_test_start + :noindex: + +on_test_end +~~~~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.on_test_end + :noindex: + +on_predict_batch_start +~~~~~~~~~~~~~~~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.on_predict_batch_start + :noindex: + +on_predict_batch_end +~~~~~~~~~~~~~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.on_predict_batch_end + :noindex: + +on_predict_epoch_start +~~~~~~~~~~~~~~~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.on_predict_epoch_start + :noindex: + +on_predict_epoch_end +~~~~~~~~~~~~~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.on_predict_epoch_end + :noindex: + +on_predict_start +~~~~~~~~~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.on_predict_start + :noindex: + +on_predict_end +~~~~~~~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.on_predict_end + :noindex: + +on_train_batch_start +~~~~~~~~~~~~~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.on_train_batch_start + :noindex: + +on_train_batch_end +~~~~~~~~~~~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.on_train_batch_end + :noindex: + +on_train_epoch_start +~~~~~~~~~~~~~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.on_train_epoch_start + :noindex: + +on_train_epoch_end +~~~~~~~~~~~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.on_train_epoch_end + :noindex: + +on_validation_batch_start +~~~~~~~~~~~~~~~~~~~~~~~~~ + +.. 
automethod:: lightning.pytorch.core.module.LightningModule.on_validation_batch_start + :noindex: + +on_validation_batch_end +~~~~~~~~~~~~~~~~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.on_validation_batch_end + :noindex: + +on_validation_epoch_start +~~~~~~~~~~~~~~~~~~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.on_validation_epoch_start + :noindex: + +on_validation_epoch_end +~~~~~~~~~~~~~~~~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.on_validation_epoch_end + :noindex: + +configure_model +~~~~~~~~~~~~~~~~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.configure_model + :noindex: + +on_validation_model_eval +~~~~~~~~~~~~~~~~~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.on_validation_model_eval + :noindex: + +on_validation_model_train +~~~~~~~~~~~~~~~~~~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.on_validation_model_train + :noindex: + +on_test_model_eval +~~~~~~~~~~~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.on_test_model_eval + :noindex: + +on_test_model_train +~~~~~~~~~~~~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.on_test_model_train + :noindex: + +on_before_optimizer_step +~~~~~~~~~~~~~~~~~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.on_before_optimizer_step + :noindex: + +configure_gradient_clipping +~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.configure_gradient_clipping + :noindex: + +optimizer_step +~~~~~~~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.optimizer_step + :noindex: + +optimizer_zero_grad +~~~~~~~~~~~~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.optimizer_zero_grad + :noindex: + +prepare_data +~~~~~~~~~~~~ + +.. 
automethod:: lightning.pytorch.core.module.LightningModule.prepare_data + :noindex: + +setup +~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.setup + :noindex: + +teardown +~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.teardown + :noindex: + +train_dataloader +~~~~~~~~~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.train_dataloader + :noindex: + +val_dataloader +~~~~~~~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.val_dataloader + :noindex: + +test_dataloader +~~~~~~~~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.test_dataloader + :noindex: + +predict_dataloader +~~~~~~~~~~~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.predict_dataloader + :noindex: + +transfer_batch_to_device +~~~~~~~~~~~~~~~~~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.transfer_batch_to_device + :noindex: + +on_before_batch_transfer +~~~~~~~~~~~~~~~~~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.on_before_batch_transfer + :noindex: + +on_after_batch_transfer +~~~~~~~~~~~~~~~~~~~~~~~ + +.. automethod:: lightning.pytorch.core.module.LightningModule.on_after_batch_transfer + :noindex: diff --git a/docs/source-pytorch/common/optimization.rst b/docs/source-pytorch/common/optimization.rst new file mode 100644 index 0000000..d29415b --- /dev/null +++ b/docs/source-pytorch/common/optimization.rst @@ -0,0 +1,173 @@ +:orphan: + +.. _optimization: + +############ +Optimization +############ + +Lightning offers two modes for managing the optimization process: + +- Manual Optimization +- Automatic Optimization + +For the majority of research cases, **automatic optimization** will do the right thing for you and it is what most +users should use. + +For more advanced use cases like multiple optimizers, esoteric optimization schedules or techniques, use **manual optimization**. + +.. 
_manual_optimization: + +---- + +.. include:: ../model/manual_optimization.rst + +----- + +********************** +Automatic Optimization +********************** + +With Lightning, most users don't have to think about when to call ``.zero_grad()``, ``.backward()`` and ``.step()`` +since Lightning automates that for you. + +Under the hood, Lightning does the following: + +.. code-block:: python + + for epoch in epochs: + for batch in data: + + def closure(): + loss = model.training_step(batch, batch_idx) + optimizer.zero_grad() + loss.backward() + return loss + + optimizer.step(closure) + + lr_scheduler.step() + +As can be seen in the code snippet above, Lightning defines a closure with ``training_step()``, ``optimizer.zero_grad()`` +and ``loss.backward()`` for the optimization. This mechanism is in place to support optimizers which operate on the +output of the closure (e.g. the loss) or need to call the closure several times (e.g. :class:`~torch.optim.LBFGS`). + +Should you still require the flexibility of calling ``.zero_grad()``, ``.backward()``, or ``.step()`` yourself, you can +always switch to :ref:`manual optimization `. +Manual optimization is required if you wish to work with multiple optimizers. + + +.. _gradient_accumulation: + +Gradient Accumulation +===================== + +.. include:: ../common/gradient_accumulation.rst + + +Access your Own Optimizer +========================= + +The provided ``optimizer`` is a :class:`~lightning.pytorch.core.optimizer.LightningOptimizer` object wrapping your own optimizer +configured in your :meth:`~lightning.pytorch.core.module.LightningModule.configure_optimizers`. +You can access your own optimizer with ``optimizer.optimizer``. However, if you use your own optimizer +to perform a step, Lightning won't be able to support accelerators, precision and profiling for you. + +.. 
testcode:: python + + # function hook in LightningModule + def optimizer_step( + self, + epoch, + batch_idx, + optimizer, + optimizer_closure, + ): + optimizer.step(closure=optimizer_closure) + + + # `optimizer` is a `LightningOptimizer` wrapping the optimizer. + # To access it, do the following. + # However, it won't work on TPU, AMP, etc... + def optimizer_step( + self, + epoch, + batch_idx, + optimizer, + optimizer_closure, + ): + optimizer = optimizer.optimizer + optimizer.step(closure=optimizer_closure) + +----- + + +Bring your own Custom Learning Rate Schedulers +============================================== + +Lightning allows using custom learning rate schedulers that aren't available in `PyTorch natively `_. +One good example is `Timm Schedulers `_. When using custom learning rate schedulers +relying on a different API from Native PyTorch ones, you should override the :meth:`~lightning.pytorch.core.module.LightningModule.lr_scheduler_step` with your desired logic. +If you are using native PyTorch schedulers, there is no need to override this hook since Lightning will handle it automatically by default. + +.. code-block:: python + + from timm.scheduler import TanhLRScheduler + + + def configure_optimizers(self): + optimizer = ... + scheduler = TanhLRScheduler(optimizer, ...) + return [optimizer], [{"scheduler": scheduler, "interval": "epoch"}] + + + def lr_scheduler_step(self, scheduler, metric): + scheduler.step(epoch=self.current_epoch) # timm's scheduler need the epoch value + + +.. _configure_gradient_clipping: + +Configure Gradient Clipping +=========================== + +To configure custom gradient clipping, consider overriding +the :meth:`~lightning.pytorch.core.module.LightningModule.configure_gradient_clipping` method. +The attributes ``gradient_clip_val`` and ``gradient_clip_algorithm`` from Trainer will be passed in the +respective arguments here and Lightning will handle gradient clipping for you. 
In case you want to set +different values for your arguments of your choice and let Lightning handle the gradient clipping, you can +use the inbuilt :meth:`~lightning.pytorch.core.module.LightningModule.clip_gradients` method and pass +the arguments along with your optimizer. + +.. warning:: + Make sure to not override :meth:`~lightning.pytorch.core.module.LightningModule.clip_gradients` + method. If you want to customize gradient clipping, consider using + :meth:`~lightning.pytorch.core.module.LightningModule.configure_gradient_clipping` method. + +For example, here we will apply a stronger gradient clipping after a certain number of epochs: + +.. testcode:: python + + def configure_gradient_clipping(self, optimizer, gradient_clip_val, gradient_clip_algorithm): + if self.current_epoch > 5: + gradient_clip_val = gradient_clip_val * 2 + + # Lightning will handle the gradient clipping + self.clip_gradients(optimizer, gradient_clip_val=gradient_clip_val, gradient_clip_algorithm=gradient_clip_algorithm) + + +Total Stepping Batches +====================== + +You can use the built-in trainer property :paramref:`~lightning.pytorch.trainer.trainer.Trainer.estimated_stepping_batches` to compute +the total number of stepping batches for the complete training. The property takes the gradient accumulation factor and the +distributed setting into consideration, so you don't have to derive it manually. One good example where this can be helpful is while using the +:class:`~torch.optim.lr_scheduler.OneCycleLR` scheduler, which requires pre-computed ``total_steps`` during initialization. + +.. code-block:: python + + def configure_optimizers(self): + optimizer = ...
+ scheduler = torch.optim.lr_scheduler.OneCycleLR( + optimizer, max_lr=1e-3, total_steps=self.trainer.estimated_stepping_batches + ) + return optimizer, scheduler diff --git a/source/common/precision.rst b/docs/source-pytorch/common/precision.rst similarity index 100% rename from source/common/precision.rst rename to docs/source-pytorch/common/precision.rst diff --git a/docs/source-pytorch/common/precision_basic.rst b/docs/source-pytorch/common/precision_basic.rst new file mode 100644 index 0000000..033f580 --- /dev/null +++ b/docs/source-pytorch/common/precision_basic.rst @@ -0,0 +1,104 @@ +:orphan: + +.. _precision_basic: + +####################### +N-Bit Precision (Basic) +####################### +**Audience:** Users looking to train models faster and consume less memory. + +---- + +If you're looking to run models faster or consume less memory, consider tweaking the precision settings of your models. + +Lower precision, such as 16-bit floating-point, requires less memory and enables training and deploying larger models. +Higher precision, such as the 64-bit floating-point, can be used for highly sensitive use-cases. + +---- + +**************** +16-bit Precision +**************** + +Use 16-bit mixed precision to lower your memory consumption by up to half so that you can train and deploy larger models. If your GPUs are [`Tensor Core `_] GPUs, you can also get a ~3x speed improvement. Half precision can sometimes lead to unstable training. + +.. code:: + + Trainer(precision='16-mixed') + +---- + +**************** +32-bit Precision +**************** + +32-bit precision is the default used across all models and research. This precision is known to be stable in contrast to lower precision settings. + +.. testcode:: + + Trainer(precision="32-true") + + # or + Trainer(precision="32") + + # or + Trainer(precision=32) + +---- + +**************** +64-bit Precision +**************** + +For certain scientific computations, 64-bit precision enables more accurate models. 
However, doubling the precision from 32 to 64 bit also doubles the memory requirements. + +.. testcode:: + + Trainer(precision="64-true") + + # or + Trainer(precision="64") + + # or + Trainer(precision=64) + +.. note:: + + In deep learning, memory is always a bottleneck, especially when dealing with a large volume of data and with limited resources. + Single precision is therefore recommended for better speed, although you can still use 64-bit precision if your particular use-case requires it. + +---- + +******************************** +Precision support by accelerator +******************************** + +.. list-table:: Precision with Accelerators + :widths: 20 20 20 20 20 + :header-rows: 1 + + * - Precision + - CPU + - GPU + - TPU + - IPU + * - 16 Mixed + - No + - Yes + - No + - Yes + * - BFloat16 Mixed + - Yes + - Yes + - Yes + - No + * - 32 True + - Yes + - Yes + - Yes + - Yes + * - 64 True + - Yes + - Yes + - No + - No diff --git a/source/common/precision_expert.rst b/docs/source-pytorch/common/precision_expert.rst similarity index 87% rename from source/common/precision_expert.rst rename to docs/source-pytorch/common/precision_expert.rst index 34bc955..a450297 100644 --- a/source/common/precision_expert.rst +++ b/docs/source-pytorch/common/precision_expert.rst @@ -12,7 +12,7 @@ N-Bit Precision (Expert) Precision Plugins ***************** -You can also customize and pass your own Precision Plugin by subclassing the :class:`~pytorch_lightning.plugins.precision.precision_plugin.PrecisionPlugin` class. +You can also customize and pass your own Precision Plugin by subclassing the :class:`~lightning.pytorch.plugins.precision.precision_plugin.PrecisionPlugin` class. - Perform pre and post backward/optimizer step operations such as scaling gradients. - Provide context managers for forward, training_step, etc. @@ -20,7 +20,7 @@ You can also customize and pass your own Precision Plugin by subclassing the :cl ..
code-block:: python class CustomPrecisionPlugin(PrecisionPlugin): - precision = 16 + precision = "16-mixed" ... diff --git a/docs/source-pytorch/common/precision_intermediate.rst b/docs/source-pytorch/common/precision_intermediate.rst new file mode 100644 index 0000000..e0590df --- /dev/null +++ b/docs/source-pytorch/common/precision_intermediate.rst @@ -0,0 +1,113 @@ +:orphan: + +.. _precision_intermediate: + +############################## +N-Bit Precision (Intermediate) +############################## +**Audience:** Users looking to scale larger models or take advantage of optimized accelerators. + +---- + +************************ +What is Mixed Precision? +************************ + +PyTorch, like most deep learning frameworks, trains on 32-bit floating-point (FP32) arithmetic by default. However, many deep learning models do not require this to reach complete accuracy. By conducting +operations in half-precision format while keeping minimum information in single-precision to maintain as much information as possible in crucial areas of the network, mixed precision training delivers +significant computational speedup. Switching to mixed precision has resulted in considerable training speedups since the introduction of Tensor Cores in the Volta and Turing architectures. It combines +FP32 and lower-bit floating-points (such as FP16) to reduce memory footprint and increase performance during model training and evaluation. It accomplishes this by recognizing the steps that require +complete accuracy and employing a 32-bit floating-point for those steps only, while using a 16-bit floating-point for the rest. When compared to complete precision training, mixed precision training +delivers all of these benefits while ensuring that no task-specific accuracy is lost. [`2 `_]. + +.. note:: + + In some cases, it is essential to remain in FP32 for numerical stability, so keep this in mind when using mixed precision. 
+ For example, when running scatter operations during the forward (such as torchpoint3d), computation must remain in FP32. + +.. warning:: + + Do not cast anything to other dtypes manually using ``torch.autocast`` or ``tensor.half()`` when using native precision because + this can bring instability. + + .. code-block:: python + + class LitModel(LightningModule): + def training_step(self, batch, batch_idx): + outs = self(batch) + + a_float32 = torch.rand((8, 8), device=self.device, dtype=self.dtype) + b_float32 = torch.rand((8, 4), device=self.device, dtype=self.dtype) + + # casting to float16 manually + with torch.autocast(device_type=self.device.type): + c_float16 = torch.mm(a_float32, b_float32) + target = self.layer(c_float16.flatten()[None]) + + # here outs is of type float32 and target is of type float16 + loss = torch.mm(target @ outs).float() + return loss + + + trainer = Trainer(accelerator="gpu", devices=1, precision=32) + +---- + +******************** +FP16 Mixed Precision +******************** + +In most cases, mixed precision uses FP16. Supported `PyTorch operations `__ automatically run in FP16, saving memory and improving throughput on the supported accelerators. +Since computation happens in FP16, there is a chance of numerical instability during training. This is handled internally by a dynamic grad scaler which skips invalid steps and adjusts the scaler to ensure subsequent steps fall within a finite range. For more information `see the autocast docs `__. + + +.. note:: + + When using TPUs, setting ``precision='16-mixed'`` will enable bfloat16, the only supported half precision type on TPUs. + +.. testcode:: + :skipif: not torch.cuda.is_available() + + Trainer(accelerator="gpu", devices=1, precision=16) + +************************ +BFloat16 Mixed Precision +************************ + +.. warning:: + + BFloat16 may not provide significant speedups or memory improvements or offer better numerical stability. 
+ Do note for GPUs, the most significant benefits require `Ampere `__ based GPUs, such as A100s or 3090s. + +BFloat16 Mixed precision is similar to FP16 mixed precision; however, it maintains more of the "dynamic range" that FP32 offers. This means it can offer better numerical stability than FP16 mixed precision. For more information, see `this TPU performance blogpost `__. + +Under the hood, we use `torch.autocast `__ with the dtype set to ``bfloat16``, with no gradient scaling. + +.. testcode:: + :skipif: not torch.cuda.is_available() + + Trainer(accelerator="gpu", devices=1, precision="bf16") + +It is also possible to use BFloat16 mixed precision on the CPU, relying on MKLDNN under the hood. + +.. testcode:: + + Trainer(precision="bf16") + +---- + +*************** +8-bit Optimizer +*************** + +It is possible to further reduce the precision using third-party libraries like `bitsandbytes `_. Although +Lightning doesn't support it out of the box yet, you can still use it by configuring it in your LightningModule and setting ``Trainer(precision=32)``. + +.. code-block:: python + + import bitsandbytes as bnb + + + # in your LightningModule, return the 8-bit optimizer + def configure_optimizers(self): + return bnb.optim.Adam8bit(self.parameters(), lr=0.001, betas=(0.9, 0.995)) diff --git a/docs/source-pytorch/common/progress_bar.rst b/docs/source-pytorch/common/progress_bar.rst new file mode 100644 index 0000000..385d17e --- /dev/null +++ b/docs/source-pytorch/common/progress_bar.rst @@ -0,0 +1,138 @@ +.. testsetup:: * + + from lightning.pytorch.trainer.trainer import Trainer + +.. _progress_bar: + + +Customize the progress bar +========================== + +Lightning supports two different types of progress bars (`tqdm `_ and `rich `_). 
:class:`~lightning.pytorch.callbacks.TQDMProgressBar` is used by default, +but you can override it by passing a custom :class:`~lightning.pytorch.callbacks.TQDMProgressBar` or :class:`~lightning.pytorch.callbacks.RichProgressBar` to the ``callbacks`` argument of the :class:`~lightning.pytorch.trainer.trainer.Trainer`. + +You could also use the :class:`~lightning.pytorch.callbacks.ProgressBar` class to implement your own progress bar. + +------------- + +TQDMProgressBar +--------------- + +The :class:`~lightning.pytorch.callbacks.TQDMProgressBar` uses the `tqdm `_ library internally and is the default progress bar used by Lightning. +It prints to ``stdout`` and shows up to four different bars: + +- **sanity check progress:** the progress during the sanity check run +- **train progress:** shows the training progress. It will pause if validation starts and will resume when it ends, and also accounts for multiple validation runs during training when :paramref:`~lightning.pytorch.trainer.trainer.Trainer.val_check_interval` is used. +- **validation progress:** only visible during validation; shows total progress over all validation datasets. +- **test progress:** only active when testing; shows total progress over all test datasets. + +For infinite datasets, the progress bar never ends. + +You can update ``refresh_rate`` (the number of batches between progress bar updates) for :class:`~lightning.pytorch.callbacks.TQDMProgressBar` by: + +.. code-block:: python + + from lightning.pytorch.callbacks import TQDMProgressBar + + trainer = Trainer(callbacks=[TQDMProgressBar(refresh_rate=10)]) + +If you want to customize the default :class:`~lightning.pytorch.callbacks.TQDMProgressBar` used by Lightning, you can override +specific methods of the callback class and pass your custom implementation to the :class:`~lightning.pytorch.trainer.trainer.Trainer`. + +.. 
code-block:: python + + class LitProgressBar(TQDMProgressBar): + def init_validation_tqdm(self): + bar = super().init_validation_tqdm() + bar.set_description("running validation...") + return bar + + + trainer = Trainer(callbacks=[LitProgressBar()]) + +.. seealso:: + - :class:`~lightning.pytorch.callbacks.TQDMProgressBar` docs. + - `tqdm library `__ + +---------------- + +RichProgressBar +--------------- + +`Rich `_ is a Python library for rich text and beautiful formatting in the terminal. +To use the :class:`~lightning.pytorch.callbacks.RichProgressBar` as your progress bar, first install the package: + +.. code-block:: bash + + pip install rich + +Then configure the callback and pass it to the :class:`~lightning.pytorch.trainer.trainer.Trainer`: + +.. code-block:: python + + from lightning.pytorch.callbacks import RichProgressBar + + trainer = Trainer(callbacks=[RichProgressBar()]) + +Customize the theme for your :class:`~lightning.pytorch.callbacks.RichProgressBar` like this: + +.. code-block:: python + + from lightning.pytorch.callbacks import RichProgressBar + from lightning.pytorch.callbacks.progress.rich_progress import RichProgressBarTheme + + # create your own theme! + progress_bar = RichProgressBar( + theme=RichProgressBarTheme( + description="green_yellow", + progress_bar="green1", + progress_bar_finished="green1", + progress_bar_pulse="#6206E0", + batch_progress="green_yellow", + time="grey82", + processing_speed="grey82", + metrics="grey82", + ) + ) + + trainer = Trainer(callbacks=progress_bar) + +You can customize the components used within :class:`~lightning.pytorch.callbacks.RichProgressBar` with ease by overriding the +:func:`~lightning.pytorch.callbacks.RichProgressBar.configure_columns` method. + +.. 
code-block:: python + + from rich.progress import TextColumn + + custom_column = TextColumn("[progress.description]Custom Rich Progress Bar!") + + + class CustomRichProgressBar(RichProgressBar): + def configure_columns(self, trainer): + return [custom_column] + + + progress_bar = CustomRichProgressBar() + +If you wish for a new progress bar to be displayed at the end of every epoch, you should enable +:paramref:`RichProgressBar.leave ` by passing ``True`` + +.. code-block:: python + + from lightning.pytorch.callbacks import RichProgressBar + + trainer = Trainer(callbacks=[RichProgressBar(leave=True)]) + +.. seealso:: + - :class:`~lightning.pytorch.callbacks.RichProgressBar` docs. + - :class:`~lightning.pytorch.callbacks.RichModelSummary` docs to customize the model summary table. + - `Rich library `__. + + +.. note:: + + Progress bar is automatically enabled with the Trainer, and to disable it, one should do this: + + .. code-block:: python + + trainer = Trainer(enable_progress_bar=False) diff --git a/source/common/remote_fs.rst b/docs/source-pytorch/common/remote_fs.rst similarity index 91% rename from source/common/remote_fs.rst rename to docs/source-pytorch/common/remote_fs.rst index 29a4fe7..1b842ca 100644 --- a/source/common/remote_fs.rst +++ b/docs/source-pytorch/common/remote_fs.rst @@ -17,11 +17,12 @@ Working with different filesystems can be accomplished by appending a protocol l trainer = Trainer(default_root_dir="s3://my_bucket/data/") trainer.fit(model) -You could pass custom paths to loggers for logging data. + +For logging, remote filesystem support depends on the particular logger integration being used. Consult :ref:`the documentation of the individual logger ` for more details. .. 
code-block:: python - from pytorch_lightning.loggers import TensorBoardLogger + from lightning.pytorch.loggers import TensorBoardLogger logger = TensorBoardLogger(save_dir="s3://my_bucket/logs/") diff --git a/docs/source-pytorch/common/trainer.rst b/docs/source-pytorch/common/trainer.rst new file mode 100644 index 0000000..742555b --- /dev/null +++ b/docs/source-pytorch/common/trainer.rst @@ -0,0 +1,1355 @@ +.. role:: hidden + :class: hidden-section + +.. testsetup:: * + + import os + from lightning.pytorch import Trainer, LightningModule, seed_everything + +.. _trainer: + +Trainer +======= + +Once you've organized your PyTorch code into a :class:`~lightning.pytorch.core.module.LightningModule`, the ``Trainer`` automates everything else. + +The ``Trainer`` achieves the following: + +1. You maintain control over all aspects via PyTorch code in your :class:`~lightning.pytorch.core.module.LightningModule`. + +2. The trainer uses best practices embedded by contributors and users + from top AI labs such as Facebook AI Research, NYU, MIT, Stanford, etc... + +3. The trainer allows disabling any key part that you don't want automated. + +| + +----------- + +Basic use +--------- + +This is the basic use of the trainer: + +.. code-block:: python + + model = MyLightningModule() + + trainer = Trainer() + trainer.fit(model, train_dataloader, val_dataloader) + +-------- + +Under the hood +-------------- + +The Lightning ``Trainer`` does much more than just "training". Under the hood, it handles all loop details for you, some examples include: + +- Automatically enabling/disabling grads +- Running the training, validation and test dataloaders +- Calling the Callbacks at the appropriate times +- Putting batches and computations on the correct devices + +Here's the pseudocode for what the trainer does under the hood (showing the train loop only) + +.. 
code-block:: python + + # put model in train mode + model.train() + torch.set_grad_enabled(True) + + losses = [] + for batch in train_dataloader: + # calls hooks like this one + on_train_batch_start() + + # train step + loss = training_step(batch) + + # clear gradients + optimizer.zero_grad() + + # backward + loss.backward() + + # update parameters + optimizer.step() + + losses.append(loss) + + +-------- + +Trainer in Python scripts +------------------------- +In Python scripts, it's recommended you use a main function to call the Trainer. + +.. code-block:: python + + from argparse import ArgumentParser + + + def main(hparams): + model = LightningModule() + trainer = Trainer(accelerator=hparams.accelerator, devices=hparams.devices) + trainer.fit(model) + + + if __name__ == "__main__": + parser = ArgumentParser() + parser.add_argument("--accelerator", default=None) + parser.add_argument("--devices", default=None) + args = parser.parse_args() + + main(args) + +So you can run it like so: + +.. code-block:: bash + + python main.py --accelerator 'gpu' --devices 2 + +.. note:: + + Pro-tip: You don't need to define all flags manually. + You can let the :doc:`LightningCLI <../cli/lightning_cli>` create the Trainer and model with arguments supplied from the CLI. + + +If you want to stop a training run early, you can press "Ctrl + C" on your keyboard. +The trainer will catch the ``KeyboardInterrupt`` and attempt a graceful shutdown. The trainer object will also set +an attribute ``interrupted`` to ``True`` in such cases. If you have a callback which shuts down compute +resources, for example, you can conditionally run the shutdown logic for only uninterrupted runs by overriding :meth:`lightning.pytorch.Callback.on_exception`. + +------------ + +Validation +---------- +You can perform an evaluation epoch over the validation set, outside of the training loop, +using :meth:`~lightning.pytorch.trainer.trainer.Trainer.validate`. 
This might be +useful if you want to collect new metrics from a model right at its initialization +or after it has already been trained. + +.. code-block:: python + + trainer.validate(model=model, dataloaders=val_dataloaders) + +------------ + +Testing +------- +Once you're done training, feel free to run the test set! +(Only right before publishing your paper or pushing to production) + +.. code-block:: python + + trainer.test(dataloaders=test_dataloaders) + +------------ + +Reproducibility +--------------- + +To ensure full reproducibility from run to run you need to set seeds for pseudo-random generators, +and set ``deterministic`` flag in ``Trainer``. + +Example:: + + from lightning.pytorch import Trainer, seed_everything + + seed_everything(42, workers=True) + # sets seeds for numpy, torch and python.random. + model = Model() + trainer = Trainer(deterministic=True) + + +By setting ``workers=True`` in :func:`~lightning.pytorch.seed_everything`, Lightning derives +unique seeds across all dataloader workers and processes for :mod:`torch`, :mod:`numpy` and stdlib +:mod:`random` number generators. When turned on, it ensures that e.g. data augmentations are not repeated across workers. + +------- + +.. _trainer_flags: + +Trainer flags +------------- + +accelerator +^^^^^^^^^^^ + +Supports passing different accelerator types (``"cpu", "gpu", "tpu", "ipu", "auto"``) +as well as custom accelerator instances. + +.. code-block:: python + + # CPU accelerator + trainer = Trainer(accelerator="cpu") + + # Training with GPU Accelerator using 2 GPUs + trainer = Trainer(devices=2, accelerator="gpu") + + # Training with TPU Accelerator using 8 tpu cores + trainer = Trainer(devices=8, accelerator="tpu") + + # Training with GPU Accelerator using the DistributedDataParallel strategy + trainer = Trainer(devices=4, accelerator="gpu", strategy="ddp") + +.. note:: The ``"auto"`` option recognizes the machine you are on, and selects the appropriate ``Accelerator``. + +.. 
code-block:: python + + # If your machine has GPUs, it will use the GPU Accelerator for training + trainer = Trainer(devices=2, accelerator="auto") + +You can also modify hardware behavior by subclassing an existing accelerator to adjust for your needs. + +Example:: + + class MyOwnAcc(CPUAccelerator): + ... + + Trainer(accelerator=MyOwnAcc()) + +.. note:: + + If the ``devices`` flag is not defined, it will assume ``devices`` to be ``"auto"`` and fetch the ``auto_device_count`` + from the accelerator. + + .. code-block:: python + + # This is part of the built-in `CUDAAccelerator` + class CUDAAccelerator(Accelerator): + """Accelerator for GPU devices.""" + + @staticmethod + def auto_device_count() -> int: + """Get the devices when set to auto.""" + return torch.cuda.device_count() + + + # Training with GPU Accelerator using total number of gpus available on the system + Trainer(accelerator="gpu") + +accumulate_grad_batches +^^^^^^^^^^^^^^^^^^^^^^^ + +Accumulates gradients over k batches before stepping the optimizer. + +.. testcode:: + + # default used by the Trainer (no accumulation) + trainer = Trainer(accumulate_grad_batches=1) + +Example:: + + # accumulate every 4 batches (effective batch size is batch*4) + trainer = Trainer(accumulate_grad_batches=4) + +See also: :ref:`gradient_accumulation` to enable more fine-grained accumulation schedules. + + +benchmark +^^^^^^^^^ + +.. video:: ../_static/fetched-s3-assets/benchmark.mp4 + :poster: ../_static/fetched-s3-assets/benchmark.jpg + :width: 400 + :muted: + +The value (``True`` or ``False``) to set ``torch.backends.cudnn.benchmark`` to. The value for +``torch.backends.cudnn.benchmark`` set in the current session will be used (``False`` if not manually set). +If :paramref:`~lightning.pytorch.trainer.Trainer.deterministic` is set to ``True``, this will default to ``False``. 
+You can read more about the interaction of ``torch.backends.cudnn.benchmark`` and ``torch.backends.cudnn.deterministic`` +`here `__ + +Setting this flag to ``True`` can increase the speed of your system if your input sizes don't +change. However, if they do, then it might make your system slower. The CUDNN auto-tuner will try to find the best +algorithm for the hardware when a new input size is encountered. This might also increase the memory usage. +Read more about it `here `__. + +Example:: + + # Will use whatever the current value for torch.backends.cudnn.benchmark, normally False + trainer = Trainer(benchmark=None) # default + + # you can overwrite the value + trainer = Trainer(benchmark=True) + +deterministic +^^^^^^^^^^^^^ + +.. video:: ../_static/fetched-s3-assets/deterministic.mp4 + :poster: ../_static/fetched-s3-assets/deterministic.jpg + :width: 400 + :muted: + +This flag sets the ``torch.backends.cudnn.deterministic`` flag. +Might make your system slower, but ensures reproducibility. + +For more info check `PyTorch docs `_. + +Example:: + + # default used by the Trainer + trainer = Trainer(deterministic=False) + +callbacks +^^^^^^^^^ + +This argument can be used to add a :class:`~lightning.pytorch.callbacks.callback.Callback` or a list of them. +Callbacks run sequentially in the order defined here +with the exception of :class:`~lightning.pytorch.callbacks.model_checkpoint.ModelCheckpoint` callbacks which run +after all others to ensure all states are saved to the checkpoints. + +.. 
code-block:: python + + # single callback + trainer = Trainer(callbacks=PrintCallback()) + + # a list of callbacks + trainer = Trainer(callbacks=[PrintCallback()]) + +Example:: + + from lightning.pytorch.callbacks import Callback + + class PrintCallback(Callback): + def on_train_start(self, trainer, pl_module): + print("Training is started!") + def on_train_end(self, trainer, pl_module): + print("Training is done.") + + +Model-specific callbacks can also be added inside the ``LightningModule`` through +:meth:`~lightning.pytorch.core.module.LightningModule.configure_callbacks`. +Callbacks returned in this hook will extend the list initially given to the ``Trainer`` argument, and replace +the trainer callbacks should there be two or more of the same type. +:class:`~lightning.pytorch.callbacks.model_checkpoint.ModelCheckpoint` callbacks always run last. + + +check_val_every_n_epoch +^^^^^^^^^^^^^^^^^^^^^^^ + +.. video:: ../_static/fetched-s3-assets/check_val_every_n_epoch.mp4 + :poster: ../_static/fetched-s3-assets/check_val_every_n_epoch.jpg + :width: 400 + :muted: + +Check val every n train epochs. + +Example:: + + # default used by the Trainer + trainer = Trainer(check_val_every_n_epoch=1) + + # run val loop every 10 training epochs + trainer = Trainer(check_val_every_n_epoch=10) + + +default_root_dir +^^^^^^^^^^^^^^^^ + +.. video:: ../_static/fetched-s3-assets/default_root_dir.mp4 + :poster: ../_static/fetched-s3-assets/default%E2%80%A8_root_dir.jpg + :width: 400 + :muted: + +Default path for logs and weights when no logger or +:class:`lightning.pytorch.callbacks.ModelCheckpoint` callback passed. On +certain clusters you might want to separate where logs and checkpoints are +stored. If you don't then use this argument for convenience. Paths can be local +paths or remote paths such as ``s3://bucket/path`` or ``hdfs://path/``. Credentials +will need to be set up to use remote filepaths. + +.. 
testcode:: + + # default used by the Trainer + trainer = Trainer(default_root_dir=os.getcwd()) + +devices +^^^^^^^ + +Number of devices to train on (``int``), which devices to train on (``list`` or ``str``), or ``"auto"``. + +.. code-block:: python + + # Training with CPU Accelerator using 2 processes + trainer = Trainer(devices=2, accelerator="cpu") + + # Training with GPU Accelerator using GPUs 1 and 3 + trainer = Trainer(devices=[1, 3], accelerator="gpu") + + # Training with TPU Accelerator using 8 tpu cores + trainer = Trainer(devices=8, accelerator="tpu") + +.. tip:: The ``"auto"`` option recognizes the devices to train on, depending on the ``Accelerator`` being used. + +.. code-block:: python + + # Use whatever hardware your machine has available + trainer = Trainer(devices="auto", accelerator="auto") + + # Training with CPU Accelerator using 1 process + trainer = Trainer(devices="auto", accelerator="cpu") + + # Training with TPU Accelerator using 8 tpu cores + trainer = Trainer(devices="auto", accelerator="tpu") + + # Training with IPU Accelerator using 4 ipus + trainer = Trainer(devices="auto", accelerator="ipu") + +.. note:: + + If the ``devices`` flag is not defined, it will assume ``devices`` to be ``"auto"`` and fetch the ``auto_device_count`` + from the accelerator. + + .. code-block:: python + + # This is part of the built-in `CUDAAccelerator` + class CUDAAccelerator(Accelerator): + """Accelerator for GPU devices.""" + + @staticmethod + def auto_device_count() -> int: + """Get the devices when set to auto.""" + return torch.cuda.device_count() + + + # Training with GPU Accelerator using total number of gpus available on the system + Trainer(accelerator="gpu") + +enable_checkpointing +^^^^^^^^^^^^^^^^^^^^ + +By default Lightning saves a checkpoint for you in your current working directory, with the state of your last training epoch, +Checkpoints capture the exact value of all parameters used by a model. 
+To disable automatic checkpointing, set this to ``False``. + +.. code-block:: python + + # default used by Trainer, saves the most recent model to a single checkpoint after each epoch + trainer = Trainer(enable_checkpointing=True) + + # turn off automatic checkpointing + trainer = Trainer(enable_checkpointing=False) + + +You can override the default behavior by initializing the :class:`~lightning.pytorch.callbacks.ModelCheckpoint` +callback, and adding it to the :paramref:`~lightning.pytorch.trainer.trainer.Trainer.callbacks` list. +See :doc:`Saving and Loading Checkpoints <../common/checkpointing>` for how to customize checkpointing. + +.. testcode:: + + from lightning.pytorch.callbacks import ModelCheckpoint + + # Init ModelCheckpoint callback, monitoring 'val_loss' + checkpoint_callback = ModelCheckpoint(monitor="val_loss") + + # Add your callback to the callbacks list + trainer = Trainer(callbacks=[checkpoint_callback]) + +fast_dev_run +^^^^^^^^^^^^ + +.. video:: ../_static/fetched-s3-assets/fast_dev_run.mp4 + :poster: ../_static/fetched-s3-assets/fast_dev_run.jpg + :width: 400 + :muted: + +Runs ``n`` batch(es) if set to ``n`` (int), or 1 batch if set to ``True``, to ensure your code will execute without errors. This +applies to fitting, validating, testing, and predicting. This flag is **only** recommended for debugging purposes and +should not be used to limit the number of batches to run. + +.. code-block:: python + + # default used by the Trainer + trainer = Trainer(fast_dev_run=False) + + # runs only 1 training and 1 validation batch and the program ends + trainer = Trainer(fast_dev_run=True) + trainer.fit(...) + + # runs 7 predict batches and program ends + trainer = Trainer(fast_dev_run=7) + trainer.predict(...) + +This argument is different from ``limit_{train,val,test,predict}_batches`` because side effects are avoided to reduce the +impact on subsequent runs. These are the changes enabled: + +- Sets ``Trainer(max_epochs=1)``. 
+- Sets ``Trainer(max_steps=...)`` to 1 or the number passed. +- Sets ``Trainer(num_sanity_val_steps=0)``. +- Sets ``Trainer(val_check_interval=1.0)``. +- Sets ``Trainer(check_val_every_n_epoch=1)``. +- Disables all loggers. +- Disables passing logged metrics to loggers. +- The :class:`~lightning.pytorch.callbacks.model_checkpoint.ModelCheckpoint` callbacks will not trigger. +- The :class:`~lightning.pytorch.callbacks.early_stopping.EarlyStopping` callbacks will not trigger. +- Sets ``limit_{train,val,test,predict}_batches`` to 1 or the number passed. +- Disables the tuning callbacks (:class:`~lightning.pytorch.callbacks.batch_size_finder.BatchSizeFinder`, :class:`~lightning.pytorch.callbacks.lr_finder.LearningRateFinder`). +- If using the CLI, the configuration file is not saved. + + +gradient_clip_val +^^^^^^^^^^^^^^^^^ + +.. video:: ../_static/fetched-s3-assets/gradient_clip_val.mp4 + :poster: ../_static/fetched-s3-assets/gradient+_clip_val.jpg + :width: 400 + :muted: + +Gradient clipping value + +.. testcode:: + + # default used by the Trainer + trainer = Trainer(gradient_clip_val=None) + +limit_train_batches +^^^^^^^^^^^^^^^^^^^ + +.. video:: ../_static/fetched-s3-assets/limit_batches.mp4 + :poster: ../_static/fetched-s3-assets/limit_train_batches.jpg + :width: 400 + :muted: + +How much of the training dataset to check. +Useful when debugging or testing something that happens at the end of an epoch. + +.. testcode:: + + # default used by the Trainer + trainer = Trainer(limit_train_batches=1.0) + +Example:: + + # default used by the Trainer + trainer = Trainer(limit_train_batches=1.0) + + # run through only 25% of the training set each epoch + trainer = Trainer(limit_train_batches=0.25) + + # run through only 10 batches of the training set each epoch + trainer = Trainer(limit_train_batches=10) + +limit_test_batches +^^^^^^^^^^^^^^^^^^ + +.. 
video:: ../_static/fetched-s3-assets/limit_batches.mp4 + :poster: ../_static/fetched-s3-assets/limit_test_batches.jpg + :width: 400 + :muted: + +How much of test dataset to check. + +.. testcode:: + + # default used by the Trainer + trainer = Trainer(limit_test_batches=1.0) + + # run through only 25% of the test set each epoch + trainer = Trainer(limit_test_batches=0.25) + + # run for only 10 batches + trainer = Trainer(limit_test_batches=10) + +In the case of multiple test dataloaders, the limit applies to each dataloader individually. + +limit_val_batches +^^^^^^^^^^^^^^^^^ + +.. video:: ../_static/fetched-s3-assets/limit_batches.mp4 + :poster: ../_static/fetched-s3-assets/limit_val_batches.jpg + :width: 400 + :muted: + +How much of validation dataset to check. +Useful when debugging or testing something that happens at the end of an epoch. + +.. testcode:: + + # default used by the Trainer + trainer = Trainer(limit_val_batches=1.0) + + # run through only 25% of the validation set each epoch + trainer = Trainer(limit_val_batches=0.25) + + # run for only 10 batches + trainer = Trainer(limit_val_batches=10) + + # disable validation + trainer = Trainer(limit_val_batches=0) + +In the case of multiple validation dataloaders, the limit applies to each dataloader individually. + +log_every_n_steps +^^^^^^^^^^^^^^^^^ + +.. video:: ../_static/fetched-s3-assets/log_every_n_steps.mp4 + :poster: ../_static/fetched-s3-assets/log_every_n_steps.jpg + :width: 400 + :muted: + +How often to add logging rows (does not write to disk) + +.. testcode:: + + # default used by the Trainer + trainer = Trainer(log_every_n_steps=50) + +See Also: + - :doc:`logging <../extensions/logging>` + +logger +^^^^^^ + +:doc:`Logger <../visualize/loggers>` (or iterable collection of loggers) for experiment tracking. A ``True`` value uses the default ``TensorBoardLogger`` shown below. ``False`` will disable logging. + +.. 
testcode:: + :skipif: not _TENSORBOARD_AVAILABLE and not _TENSORBOARDX_AVAILABLE + + from lightning.pytorch.loggers import TensorBoardLogger + + # default logger used by trainer (if tensorboard is installed) + logger = TensorBoardLogger(save_dir=os.getcwd(), version=1, name="lightning_logs") + Trainer(logger=logger) + +max_epochs +^^^^^^^^^^ + +.. video:: ../_static/fetched-s3-assets/min_max_epochs.mp4 + :poster: ../_static/fetched-s3-assets/max_epochs.jpg + :width: 400 + :muted: + +Stop training once this number of epochs is reached. + +.. testcode:: + + # default used by the Trainer + trainer = Trainer(max_epochs=1000) + +If neither ``max_epochs`` nor ``max_steps`` is specified, ``max_epochs`` will default to ``1000``. +To enable infinite training, set ``max_epochs = -1``. + +min_epochs +^^^^^^^^^^ + +.. video:: ../_static/fetched-s3-assets/min_max_epochs.mp4 + :poster: ../_static/fetched-s3-assets/min_epochs.jpg + :width: 400 + :muted: + +Force training for at least this many epochs. + +.. testcode:: + + # default used by the Trainer + trainer = Trainer(min_epochs=1) + +max_steps +^^^^^^^^^ + +.. video:: ../_static/fetched-s3-assets/min_max_steps.mp4 + :poster: ../_static/fetched-s3-assets/max_steps.jpg + :width: 400 + :muted: + +Stop training after this number of :ref:`global steps `. +Training will stop as soon as either ``max_steps`` or ``max_epochs`` is reached, whichever comes first. + +.. testcode:: + + # Default (disabled) + trainer = Trainer(max_steps=-1) + + # Stop after 100 steps + trainer = Trainer(max_steps=100) + +If ``max_steps`` is not specified, ``max_epochs`` will be used instead (and ``max_epochs`` defaults to +``1000`` if ``max_epochs`` is not specified). To disable this default, set ``max_steps = -1``. + +min_steps +^^^^^^^^^ + +.. video:: ../_static/fetched-s3-assets/min_max_steps.mp4 + :poster: ../_static/fetched-s3-assets/min_steps.jpg + :width: 400 + :muted: + +Force training for at least this number of :ref:`global steps `. 
+Trainer will train model for at least min_steps or min_epochs (latest). + +.. testcode:: + + # Default (disabled) + trainer = Trainer(min_steps=None) + + # Run at least for 100 steps (disable min_epochs) + trainer = Trainer(min_steps=100, min_epochs=0) + +max_time +^^^^^^^^ + +Set the maximum amount of time for training. Training will get interrupted mid-epoch. +For customizable options use the :class:`~lightning.pytorch.callbacks.timer.Timer` callback. + +.. testcode:: + + # Default (disabled) + trainer = Trainer(max_time=None) + + # Stop after 12 hours of training or when reaching 10 epochs (string) + trainer = Trainer(max_time="00:12:00:00", max_epochs=10) + + # Stop after 1 day and 5 hours (dict) + trainer = Trainer(max_time={"days": 1, "hours": 5}) + +In case ``max_time`` is used together with ``min_steps`` or ``min_epochs``, the ``min_*`` requirement +always has precedence. + +num_nodes +^^^^^^^^^ + +.. video:: ../_static/fetched-s3-assets/num_nodes.mp4 + :poster: ../_static/fetched-s3-assets/num_nodes.jpg + :width: 400 + :muted: + +Number of GPU nodes for distributed training. + +.. testcode:: + + # default used by the Trainer + trainer = Trainer(num_nodes=1) + + # to train on 8 nodes + trainer = Trainer(num_nodes=8) + + +num_sanity_val_steps +^^^^^^^^^^^^^^^^^^^^ + +.. video:: ../_static/fetched-s3-assets/num_sanity_val_steps.mp4 + :poster: ../_static/fetched-s3-assets/num_sanity%E2%80%A8_val_steps.jp + :width: 400 + :muted: + +Sanity check runs n batches of val before starting the training routine. +This catches any bugs in your validation without having to wait for the first validation check. +The Trainer uses 2 steps by default. Turn it off or modify it here. + +.. 
testcode:: + + # default used by the Trainer + trainer = Trainer(num_sanity_val_steps=2) + + # turn it off + trainer = Trainer(num_sanity_val_steps=0) + + # check all validation data + trainer = Trainer(num_sanity_val_steps=-1) + + +This option will reset the validation dataloader unless ``num_sanity_val_steps=0``. + +overfit_batches +^^^^^^^^^^^^^^^ + +.. video:: ../_static/fetched-s3-assets/overfit_batches.mp4 + :poster: ../_static/fetched-s3-assets/overfit_batches.jpg + :width: 400 + :muted: + +Uses this much data of the training & validation set. +If the training & validation dataloaders have ``shuffle=True``, Lightning will automatically disable it. + +Useful for quickly debugging or trying to overfit on purpose. + +.. testcode:: + + # default used by the Trainer + trainer = Trainer(overfit_batches=0.0) + + # use only 1% of the train & val set + trainer = Trainer(overfit_batches=0.01) + + # overfit on 10 of the same batches + trainer = Trainer(overfit_batches=10) + +plugins +^^^^^^^ + +:ref:`Plugins` allow you to connect arbitrary backends, precision libraries, clusters etc. For example: + +- :ref:`Checkpoint IO ` +- `TorchElastic `_ +- :ref:`Precision Plugins ` + +To define your own behavior, subclass the relevant class and pass it in. Here's an example linking up your own +:class:`~lightning.pytorch.plugins.environments.ClusterEnvironment`. + +.. code-block:: python + + from lightning.pytorch.plugins.environments import ClusterEnvironment + + + class MyCluster(ClusterEnvironment): + def main_address(self): + return your_main_address + + def main_port(self): + return your_main_port + + def world_size(self): + return the_world_size + + + trainer = Trainer(plugins=[MyCluster()], ...) + +precision +^^^^^^^^^ + +Lightning supports either double (64), float (32), bfloat16 (bf16), or half (16) precision training. + +Half precision, or mixed precision, is the combined use of 32 and 16 bit floating points to reduce memory footprint during model training. 
This can result in improved performance, achieving +3X speedups on modern GPUs. + +.. testcode:: + :skipif: not torch.cuda.is_available() + + # default used by the Trainer + trainer = Trainer(precision=32) + + # 16-bit precision + trainer = Trainer(precision="16-mixed", accelerator="gpu", devices=1) # works only on CUDA + + # bfloat16 precision + trainer = Trainer(precision="bf16-mixed") + + # 64-bit precision + trainer = Trainer(precision=64) + + +.. note:: When running on TPUs, torch.bfloat16 will be used but tensor printing will still show torch.float32. + +profiler +^^^^^^^^ + +.. video:: ../_static/fetched-s3-assets/profiler.mp4 + :poster: ../_static/fetched-s3-assets/profiler.jpg + :width: 400 + :muted: + +Profiles individual steps during training to assist in identifying bottlenecks. + +See the :doc:`profiler documentation <../tuning/profiler>` for more details. + +.. testcode:: + + from lightning.pytorch.profilers import SimpleProfiler, AdvancedProfiler + + # default used by the Trainer + trainer = Trainer(profiler=None) + + # to profile standard training events, equivalent to `profiler=SimpleProfiler()` + trainer = Trainer(profiler="simple") + + # advanced profiler for function-level stats, equivalent to `profiler=AdvancedProfiler()` + trainer = Trainer(profiler="advanced") + +enable_progress_bar +^^^^^^^^^^^^^^^^^^^ + +Whether to enable or disable the progress bar. Defaults to True. + +.. testcode:: + + # default used by the Trainer + trainer = Trainer(enable_progress_bar=True) + + # disable progress bar + trainer = Trainer(enable_progress_bar=False) + +reload_dataloaders_every_n_epochs +^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + +.. video:: ../_static/fetched-s3-assets/reload_dataloaders_every_epoch.mp4 + :poster: ../_static/fetched-s3-assets/reload_%E2%80%A8dataloaders_%E2%80%A8every_epoch.jpg + :width: 400 + :muted: + +Set to a positive integer to reload dataloaders every n epochs from your currently used data source. 
+DataSource can be a ``LightningModule`` or a ``LightningDataModule``. + + +.. code-block:: python + + # if 0 (default) + train_loader = model.train_dataloader() + # or if using data module: datamodule.train_dataloader() + for epoch in epochs: + for batch in train_loader: + ... + + # if a positive integer + for epoch in epochs: + if not epoch % reload_dataloaders_every_n_epochs: + train_loader = model.train_dataloader() + # or if using data module: datamodule.train_dataloader() + for batch in train_loader: + ... + +The pseudocode applies also to the ``val_dataloader``. + +.. _replace-sampler-ddp: + +use_distributed_sampler +^^^^^^^^^^^^^^^^^^^^^^^ + +See :paramref:`lightning.pytorch.trainer.Trainer.params.use_distributed_sampler`. + +.. testcode:: + + # default used by the Trainer + trainer = Trainer(use_distributed_sampler=True) + +By setting to False, you have to add your own distributed sampler: + +.. code-block:: python + + # in your LightningModule or LightningDataModule + def train_dataloader(self): + dataset = ... + # default used by the Trainer + sampler = torch.utils.data.DistributedSampler(dataset, shuffle=True) + dataloader = DataLoader(dataset, batch_size=32, sampler=sampler) + return dataloader + + +strategy +^^^^^^^^ + +Supports passing different training strategies with aliases (ddp, fsdp, etc) as well as configured strategies. + +.. code-block:: python + + # Data-parallel training with the DDP strategy on 4 GPUs + trainer = Trainer(strategy="ddp", accelerator="gpu", devices=4) + + # Model-parallel training with the FSDP strategy on 4 GPUs + trainer = Trainer(strategy="fsdp", accelerator="gpu", devices=4) + +Additionally, you can pass a strategy object. + +.. code-block:: python + + from lightning.pytorch.strategies import DDPStrategy + + trainer = Trainer(strategy=DDPStrategy(static_graph=True), accelerator="gpu", devices=2) + +See Also: + - :ref:`Multi GPU Training `. + - :doc:`Model Parallel GPU training guide <../advanced/model_parallel>`. 
+ - :doc:`TPU training guide <../accelerators/tpu>`. + + +sync_batchnorm +^^^^^^^^^^^^^^ + +.. video:: ../_static/fetched-s3-assets/sync_batchnorm.mp4 + :poster: ../_static/fetched-s3-assets/sync_batchnorm.jpg + :width: 400 + :muted: + +Enable synchronization between batchnorm layers across all GPUs. + +.. testcode:: + + trainer = Trainer(sync_batchnorm=True) + + +val_check_interval +^^^^^^^^^^^^^^^^^^ + +.. video:: ../_static/fetched-s3-assets/val_check_interval.mp4 + :poster: ../_static/fetched-s3-assets/val_check_interval.jpg + :width: 400 + :muted: + +How often within one training epoch to check the validation set. +Can specify as float or int. + +- pass a ``float`` in the range [0.0, 1.0] to check after a fraction of the training epoch. +- pass an ``int`` to check after a fixed number of training batches. An ``int`` value can only be higher than the number of training + batches when ``check_val_every_n_epoch=None``, which validates after every ``N`` training batches across epochs or iteration-based training. + +.. testcode:: + + # default used by the Trainer + trainer = Trainer(val_check_interval=1.0) + + # check validation set 4 times during a training epoch + trainer = Trainer(val_check_interval=0.25) + + # check validation set every 1000 training batches in the current epoch + trainer = Trainer(val_check_interval=1000) + + # check validation set every 1000 training batches across complete epochs or during iteration-based training + # use this when using iterableDataset and your dataset has no length + # (ie: production cases with streaming data) + trainer = Trainer(val_check_interval=1000, check_val_every_n_epoch=None) + + +.. code-block:: python + + # Here is the computation to estimate the total number of batches seen within an epoch. 
+ + # Find the total number of train batches + total_train_batches = total_train_samples // (train_batch_size * world_size) + + # Compute how many times we will call validation during the training loop + val_check_batch = max(1, int(total_train_batches * val_check_interval)) + val_checks_per_epoch = total_train_batches / val_check_batch + + # Find the total number of validation batches + total_val_batches = total_val_samples // (val_batch_size * world_size) + + # Total number of batches run + total_fit_batches = total_train_batches + total_val_batches + + +enable_model_summary +^^^^^^^^^^^^^^^^^^^^ + +Whether to enable or disable the model summarization. Defaults to True. + +.. testcode:: + + # default used by the Trainer + trainer = Trainer(enable_model_summary=True) + + # disable summarization + trainer = Trainer(enable_model_summary=False) + + # enable custom summarization + from lightning.pytorch.callbacks import ModelSummary + + trainer = Trainer(enable_model_summary=True, callbacks=[ModelSummary(max_depth=-1)]) + + +inference_mode +^^^^^^^^^^^^^^ + +Whether to use :func:`torch.inference_mode` or :func:`torch.no_grad` mode during evaluation +(``validate``/``test``/``predict``) + +.. testcode:: + + # default used by the Trainer + trainer = Trainer(inference_mode=True) + + # Use `torch.no_grad` instead + trainer = Trainer(inference_mode=False) + + +With :func:`torch.inference_mode` disabled, you can enable the grad of your model layers if required. + +.. code-block:: python + + class LitModel(LightningModule): + def validation_step(self, batch, batch_idx): + preds = self.layer1(batch) + with torch.enable_grad(): + grad_preds = preds.requires_grad_() + preds2 = self.layer2(grad_preds) + + + model = LitModel() + trainer = Trainer(inference_mode=False) + trainer.validate(model) + + +----- + +Trainer class API +----------------- + +Methods +^^^^^^^ + +init +**** + +.. automethod:: lightning.pytorch.trainer.Trainer.__init__ + :noindex: + +fit +**** + +.. 
automethod:: lightning.pytorch.trainer.Trainer.fit + :noindex: + +validate +******** + +.. automethod:: lightning.pytorch.trainer.Trainer.validate + :noindex: + +test +**** + +.. automethod:: lightning.pytorch.trainer.Trainer.test + :noindex: + +predict +******* + +.. automethod:: lightning.pytorch.trainer.Trainer.predict + :noindex: + + +Properties +^^^^^^^^^^ + +callback_metrics +**************** + +The metrics available to callbacks. + +This includes metrics logged via :meth:`~lightning.pytorch.core.module.LightningModule.log`. + +.. code-block:: python + + def training_step(self, batch, batch_idx): + self.log("a_val", 2.0) + + + callback_metrics = trainer.callback_metrics + assert callback_metrics["a_val"] == 2.0 + +logged_metrics +************** + +The metrics sent to the loggers. + +This includes metrics logged via :meth:`~lightning.pytorch.core.module.LightningModule.log` with the +:paramref:`~lightning.pytorch.core.module.LightningModule.log.logger` argument set. + +progress_bar_metrics +******************** + +The metrics sent to the progress bar. + +This includes metrics logged via :meth:`~lightning.pytorch.core.module.LightningModule.log` with the +:paramref:`~lightning.pytorch.core.module.LightningModule.log.prog_bar` argument set. + +current_epoch +************* + +The current epoch, updated after the epoch end hooks are run. + +datamodule +********** + +The current datamodule, which is used by the trainer. + +.. code-block:: python + + used_datamodule = trainer.datamodule + +is_last_batch +************* + +Whether trainer is executing the last batch. + +global_step +*********** + +The number of optimizer steps taken (does not reset each epoch). + +This includes multiple optimizers (if enabled). + +logger +******* + +The first :class:`~lightning.pytorch.loggers.logger.Logger` being used. + +loggers +******** + +The list of :class:`~lightning.pytorch.loggers.logger.Logger` used. + +.. 
code-block:: python + + for logger in trainer.loggers: + logger.log_metrics({"foo": 1.0}) + +log_dir +******* + +The directory for the current experiment. Use this to save images to, etc... + +.. code-block:: python + + def training_step(self, batch, batch_idx): + img = ... + save_img(img, self.trainer.log_dir) + +is_global_zero +************** + +Whether this process is the global zero in multi-node training. + +.. code-block:: python + + def training_step(self, batch, batch_idx): + if self.trainer.is_global_zero: + print("in node 0, accelerator 0") + +estimated_stepping_batches +************************** + +The estimated number of batches that will ``optimizer.step()`` during training. + +This accounts for gradient accumulation and the current trainer configuration. This might set up your training +dataloader if it hadn't been set up already. + +.. code-block:: python + + def configure_optimizers(self): + optimizer = ... + stepping_batches = self.trainer.estimated_stepping_batches + scheduler = torch.optim.lr_scheduler.OneCycleLR(optimizer, max_lr=1e-3, total_steps=stepping_batches) + return [optimizer], [scheduler] + +state +***** + +The current state of the Trainer, including the current function that is running, the stage of +execution within that function, and the status of the Trainer. + +.. code-block:: python + + # fn in ("fit", "validate", "test", "predict") + trainer.state.fn + # status in ("initializing", "running", "finished", "interrupted") + trainer.state.status + # stage in ("train", "sanity_check", "validate", "test", "predict") + trainer.state.stage + +should_stop +*********** + +If you want to terminate the training during ``.fit``, you can set ``trainer.should_stop=True`` to terminate the training +as soon as possible. Note that, it will respect the arguments ``min_steps`` and ``min_epochs`` to check whether to stop.
If these +arguments are set and the ``current_epoch`` or ``global_step`` don't meet these minimum conditions, training will continue until +both conditions are met. If any of these arguments is not set, it won't be considered for the final decision. + + +.. code-block:: python + + # setting `trainer.should_stop` at any point of training will terminate it + class LitModel(LightningModule): + def training_step(self, *args, **kwargs): + self.trainer.should_stop = True + + + trainer = Trainer() + model = LitModel() + trainer.fit(model) + +.. code-block:: python + + # setting `trainer.should_stop` will stop training only after at least 5 epochs have run + class LitModel(LightningModule): + def training_step(self, *args, **kwargs): + if self.current_epoch == 2: + self.trainer.should_stop = True + + + trainer = Trainer(min_epochs=5, max_epochs=100) + model = LitModel() + trainer.fit(model) + +.. code-block:: python + + # setting `trainer.should_stop` will stop training only after at least 5 steps have run + class LitModel(LightningModule): + def training_step(self, *args, **kwargs): + if self.global_step == 2: + self.trainer.should_stop = True + + + trainer = Trainer(min_steps=5, max_epochs=100) + model = LitModel() + trainer.fit(model) + +.. code-block:: python + + # setting `trainer.should_stop` will stop training only after both min_steps and min_epochs are satisfied + class LitModel(LightningModule): + def training_step(self, *args, **kwargs): + if self.global_step == 7: + self.trainer.should_stop = True + + + trainer = Trainer(min_steps=5, min_epochs=5, max_epochs=100) + model = LitModel() + trainer.fit(model) + +sanity_checking +*************** + +Indicates if the trainer is currently running sanity checking. This property can be useful to disable some hooks, +logging or callbacks during the sanity checking. + +.. code-block:: python + + def validation_step(self, batch, batch_idx): + ...
+ if not self.trainer.sanity_checking: + self.log("value", value) + +num_training_batches +******************** + +The number of training batches that will be used during ``trainer.fit()``. + +num_sanity_val_batches +********************** + +The number of validation batches that will be used during the sanity-checking part of ``trainer.fit()``. + +num_val_batches +*************** + +The number of validation batches that will be used during ``trainer.fit()`` or ``trainer.validate()``. + +num_test_batches +**************** + +The number of test batches that will be used during ``trainer.test()``. + +num_predict_batches +******************* + +The number of prediction batches that will be used during ``trainer.predict()``. + +train_dataloader +**************** + +The training dataloader(s) used during ``trainer.fit()``. + +val_dataloaders +*************** + +The validation dataloader(s) used during ``trainer.fit()`` or ``trainer.validate()``. + +test_dataloaders +**************** + +The test dataloader(s) used during ``trainer.test()``. + +predict_dataloaders +******************* + +The prediction dataloader(s) used during ``trainer.predict()``. diff --git a/source/common_usecases.rst b/docs/source-pytorch/common_usecases.rst similarity index 94% rename from source/common_usecases.rst rename to docs/source-pytorch/common_usecases.rst index 606eea9..263fb34 100644 --- a/source/common_usecases.rst +++ b/docs/source-pytorch/common_usecases.rst @@ -6,10 +6,6 @@ Common Workflows Customize and extend Lightning for things like custom hardware or distributed strategies. -.. join_slack:: - :align: left - ----- .. raw:: html @@ -116,13 +112,6 @@ Customize and extend Lightning for things like custom hardware or distributed st :button_link: advanced/model_parallel.html :height: 100 -.. displayitem:: - :header: Train on the cloud - :description: Run models on the cloud. - :col_css: col-md-12 - :button_link: clouds/cloud_training.html - :height: 100 - .. 
displayitem:: :header: Train on single or multiple GPUs :description: Train models faster with GPUs. @@ -134,7 +123,7 @@ Customize and extend Lightning for things like custom hardware or distributed st :header: Train on single or multiple HPUs :description: Train models faster with HPUs. :col_css: col-md-12 - :button_link: accelerators/hpu.html + :button_link: integrations/hpu/index.html :height: 100 .. displayitem:: diff --git a/docs/source-pytorch/community/governance.rst b/docs/source-pytorch/community/governance.rst new file mode 100644 index 0000000..3530664 --- /dev/null +++ b/docs/source-pytorch/community/governance.rst @@ -0,0 +1,71 @@ +.. _governance: + +Lightning Governance +#################### + +This document describes governance processes we follow in developing PyTorch Lightning. + +Persons of Interest +******************* + +.. _governance_bdfl: + +BDFL +---- +Role: All final decisions related to Lightning. + +- William Falcon (`williamFalcon `_) (Lightning founder) + +Maintainers +----------- +- Adrian Wälchli (`awaelchli `_) +- Carlos Mocholí (`carmocca `_) +- Jirka Borovec (`Borda `_) +- Justus Schock (`justusschock `_) + + +Emeritus Maintainers +-------------------- +- Ethan Harris (`ethanwharris `_) (Torchbearer founder) +- Nicki Skafte (`SkafteNicki `_) +- Thomas Chaton (`tchaton `_) + + +Alumni +------ +- Akihiro Nitta (`akihironitta `_) +- Ananth Subramaniam (`ananthsub `_) +- Danielle Pintz (`daniellepintz `_) +- Jeff Ling (`jeffling `_) +- Jeff Yang (`ydcjeff `_) +- Jeremy Jordan (`jeremyjordan `_) +- Kaushik Bokka (`kaushikb11 `_) +- Kushashwa Ravi Shrimali (`krshrimali `_) +- Lezwon Castelino (`lezwon `_) +- Matthew Painter (`MattPainter01 `_) (Torchbearer founder) +- Nate Raw (`nateraw `_) +- Nic Eggert (`neggert `_) +- Ota Jasek (`otaj `_) +- Peter Yu (`yukw777 `_) +- Roger Shieh (`s-rog `_) +- Rohit Gupta (`rohitgr7 `_) +- Sean Narenthiran (`SeanNaren `_) +- Siyu Wang (`four4fish `_) +- Teddy Koker (`teddykoker `_) +- Tullie Murrell 
(`tullie `_) + + +Project Management and Decision Making +************************************** + +The decision on what goes into a release is governed by the maintainers of ``lightning.pytorch``. +Whenever possible, discussion happens publicly on GitHub and includes the whole community. +For controversial changes, it is mandatory to seek consultation from :ref:`governance_bdfl` for a final decision. +When a consensus is reached, maintainers assign milestones and labels to the issue and/or pull request +and start tracking the development. It is possible that priorities change over time. + +Commits to the project are exclusively to be added by pull requests on GitHub and anyone in the community is welcome to +review them. However, reviews submitted by +`code owners `_ +have higher weight and it is necessary to get the approval of code owners before a pull request can be merged. +Additional requirements may apply case by case. diff --git a/docs/source-pytorch/community/index.rst b/docs/source-pytorch/community/index.rst new file mode 100644 index 0000000..95f30a6 --- /dev/null +++ b/docs/source-pytorch/community/index.rst @@ -0,0 +1,75 @@ + +.. toctree:: + :maxdepth: 1 + :hidden: + + ../generated/CODE_OF_CONDUCT.md + ../generated/CONTRIBUTING.md + ../generated/BECOMING_A_CORE_CONTRIBUTOR.md + governance + ../versioning + ../past_versions + ../generated/CHANGELOG.md + +######### +Community +######### + +.. raw:: html + +
+
+ +.. displayitem:: + :header: Code of conduct + :description: Contributor Covenant Code of Conduct + :col_css: col-md-12 + :button_link: ../generated/CODE_OF_CONDUCT.html + :height: 100 + +.. displayitem:: + :header: Contribution guide + :description: How to contribute to PyTorch Lightning + :col_css: col-md-12 + :button_link: ../generated/CONTRIBUTING.html + :height: 100 + +.. displayitem:: + :header: How to Become a core contributor + :description: Steps to be a core contributor + :col_css: col-md-12 + :button_link: ../generated/BECOMING_A_CORE_CONTRIBUTOR.html + :height: 100 + +.. displayitem:: + :header: Lightning Governance + :description: The governance processes we follow + :col_css: col-md-12 + :button_link: governance.html + :height: 100 + +.. displayitem:: + :header: Versioning + :description: PyTorch Lightning's versioning policy + :col_css: col-md-12 + :button_link: ../versioning.html + :height: 100 + +.. displayitem:: + :header: Past PyTorch Lightning versions + :description: Docs and upgrade guide for past versions + :col_css: col-md-12 + :button_link: ../past_versions.html + :height: 100 + +.. displayitem:: + :header: Changelog + :description: All notable changes to PyTorch Lightning + :col_css: col-md-12 + :button_link: ../generated/CHANGELOG.html + :height: 100 + +.. raw:: html + +
+
diff --git a/docs/source-pytorch/conf.py b/docs/source-pytorch/conf.py new file mode 100644 index 0000000..4a65e2e --- /dev/null +++ b/docs/source-pytorch/conf.py @@ -0,0 +1,451 @@ +# +# Configuration file for the Sphinx documentation builder. +# +# This file does only contain a selection of the most common options. For a +# full list see the documentation: +# http://www.sphinx-doc.org/en/master/config + +# -- Path setup -------------------------------------------------------------- + +# If extensions (or modules to document with autodoc) are in another directory, +# add these directories to sys.path here. If the directory is relative to the +# documentation root, use os.path.abspath to make it absolute, like shown here. + +import glob +import os +import shutil +import warnings +from importlib.util import module_from_spec, spec_from_file_location +from types import ModuleType + +import pt_lightning_sphinx_theme +from lightning_utilities.docs import fetch_external_assets +from lightning_utilities.docs.formatting import _transform_changelog + +import lightning + +# ----------------------- +# VARIABLES WHEN WORKING ON DOCS... 
MAKE THIS TRUE TO BUILD FASTER +# ----------------------- +_PL_FAST_DOCS_DEV = bool(int(os.getenv("PL_FAST_DOCS_DEV", 0))) + +# ----------------------- +# BUILD stuff +# ----------------------- +_PATH_HERE = os.path.abspath(os.path.dirname(__file__)) +_PATH_ROOT = os.path.join(_PATH_HERE, "..", "..") +_PATH_RAW_NB = os.path.join(_PATH_ROOT, "_notebooks") +_SHOULD_COPY_NOTEBOOKS = True + + +def _load_py_module(name: str, location: str) -> ModuleType: + """Load the Python file at ``location`` as a module called ``name``, execute it and return the module object.""" + spec = spec_from_file_location(name, location) + py = module_from_spec(spec) + spec.loader.exec_module(py) + return py + + +assist_local = _load_py_module("assistant", os.path.join(_PATH_ROOT, ".actions", "assistant.py")) + +if os.path.isdir(os.path.join(_PATH_RAW_NB, ".actions")): + assist_nb = _load_py_module("assistant", os.path.join(_PATH_RAW_NB, ".actions", "assistant.py")) +else: + _SHOULD_COPY_NOTEBOOKS = False + warnings.warn("To build the code, please run: `git submodule update --init --recursive`", stacklevel=2) + +FOLDER_GENERATED = "generated" +SPHINX_MOCK_REQUIREMENTS = int(os.environ.get("SPHINX_MOCK_REQUIREMENTS", True)) + +# -- Project documents ------------------------------------------------------- + +if _SHOULD_COPY_NOTEBOOKS: + assist_nb.AssistantCLI.copy_notebooks( + _PATH_RAW_NB, + _PATH_HERE, + "notebooks", + patterns=[".", "course_UvA-DL", "lightning_examples"], + ) + # TODO: Complete converting the missing items and add them back + ignore = [ + "course_UvA-DL/13-contrastive-learning", + "lightning_examples/augmentation_kornia", + "lightning_examples/finetuning-scheduler", + "lightning_examples/reinforce-learning-DQN", + "lightning_examples/text-transformers", + "lightning_examples/warp-drive", + ] + for file in ignore: + file = os.path.join(_PATH_HERE, "notebooks", file) + if os.path.exists(file): + os.remove(file) + + +os.makedirs(os.path.join(_PATH_HERE, FOLDER_GENERATED), exist_ok=True) +# copy all documents from GH templates like contribution guide +for md in
glob.glob(os.path.join(_PATH_ROOT, ".github", "*.md")): + shutil.copy(md, os.path.join(_PATH_HERE, FOLDER_GENERATED, os.path.basename(md))) +# DISABLE CHANGELOG for KR-site +# copy also the changelog +# _transform_changelog( + # os.path.join(_PATH_ROOT, "src", "lightning", "fabric", "CHANGELOG.md"), + # os.path.join(_PATH_HERE, FOLDER_GENERATED, "CHANGELOG.md"), +# ) + + +assist_local.AssistantCLI.pull_docs_files( + gh_user_repo="Lightning-AI/lightning-Habana", + target_dir="docs/source-pytorch/integrations/hpu", + checkout="tags/1.0.0", +) + +if not _PL_FAST_DOCS_DEV: + fetch_external_assets( + docs_folder=_PATH_HERE, + assets_folder="_static/fetched-s3-assets", + retrieve_pattern=r"https?://[-a-zA-Z0-9_]+\.s3\.[-a-zA-Z0-9()_\\+.\\/=]+", + ) + + +# -- Project information ----------------------------------------------------- + +project = "PyTorch Lightning & PyTorch Korea User Group" +copyright = lightning.__copyright__ +author = lightning.__author__ + +# The short X.Y version +version = lightning.__version__ +# The full version, including alpha/beta/rc tags +release = lightning.__version__ + +# -- General configuration --------------------------------------------------- + +# If your documentation needs a minimal Sphinx version, state it here. + +needs_sphinx = "4.5" + +# Add any Sphinx extension module names here, as strings. They can be +# extensions coming with Sphinx (named 'sphinx.ext.*') or your custom +# ones. +extensions = [ + "sphinx.ext.autodoc", + "sphinx.ext.doctest", + "sphinx.ext.intersphinx", + "sphinx_toolbox.collapse", + "sphinx.ext.todo", + "sphinx.ext.coverage", + "sphinx.ext.viewcode", + "sphinx.ext.autosummary", + "sphinx.ext.napoleon", + "sphinx.ext.imgmath", + "sphinx.ext.autosectionlabel", + # 'sphinxcontrib.mockautodoc', # raises error: directive 'automodule' is already registered ... 
+ # 'sphinxcontrib.fulltoc', # breaks pytorch-theme with unexpected kw argument 'titles_only' + "sphinxcontrib.video", + "myst_parser", + "nbsphinx", + "sphinx_autodoc_typehints", + "sphinx_copybutton", + "sphinx_paramlinks", + "sphinx_togglebutton", + "pt_lightning_sphinx_theme.extensions.lightning", +] + +# Suppress warnings about duplicate labels (needed for PL tutorials) +suppress_warnings = [ + "autosectionlabel.*", +] + +copybutton_prompt_text = ">>> " +copybutton_prompt_text1 = "... " +copybutton_exclude = ".linenos" + +copybutton_only_copy_prompt_lines = True + +# Add any paths that contain templates here, relative to this directory. +templates_path = ["_templates"] + +# https://berkeley-stat159-f17.github.io/stat159-f17/lectures/14-sphinx..html#conf.py-(cont.) +# https://stackoverflow.com/questions/38526888/embed-ipython-notebook-in-sphinx-document +# I execute the notebooks manually in advance. If notebooks test the code, +# they should be run at build time. +nbsphinx_execute = "never" +nbsphinx_allow_errors = True +nbsphinx_requirejs_path = "" + +# myst-parser, forcing to parse all html pages with mathjax +# https://github.com/executablebooks/MyST-Parser/issues/394 +myst_update_mathjax = False +# https://myst-parser.readthedocs.io/en/latest/syntax/optional.html?highlight=anchor#auto-generated-header-anchors +myst_heading_anchors = 3 + +# The suffix(es) of source filenames. +# You can specify multiple suffix as a list of string: +# +source_parsers = {".rst": "restructuredtext", ".txt": "markdown", ".md": "markdown", ".ipynb": "nbsphinx"} + +# The master toctree document. +master_doc = "index" + +# The language for content autogenerated by Sphinx. Refer to documentation +# for a list of supported languages. +# +# This is also used if you do content translation via gettext catalogs. +# Usually you set "language" from the command line for these cases. 
+language = "ko" + +# List of patterns, relative to source directory, that match files and +# directories to ignore when looking for source files. +# This pattern also affects html_static_path and html_extra_path. +exclude_patterns = [ + f"{FOLDER_GENERATED}/PULL_REQUEST_TEMPLATE.md", + "notebooks/sample-template*", +] + +if _PL_FAST_DOCS_DEV: + exclude_patterns.append("notebooks/*") + exclude_patterns.append("tutorials.rst") + + +# The name of the Pygments (syntax highlighting) style to use. +pygments_style = None + +# -- Options for HTML output ------------------------------------------------- + +# The theme to use for HTML and HTML Help pages. See the documentation for +# a list of builtin themes. +# http://www.sphinx-doc.org/en/master/usage/theming.html#builtin-themes +# html_theme = 'bizstyle' +# https://sphinx-themes.org +html_theme = "pt_lightning_sphinx_theme" +html_theme_path = [os.environ.get("LIT_SPHINX_PATH", pt_lightning_sphinx_theme.get_html_theme_path())] + +# Theme options are theme-specific and customize the look and feel of a theme +# further. For a list of options available for each theme, see the +# documentation. + +html_theme_options = { + "pytorch_project": "https://lightning.ai", + "canonical_url": lightning.__docs_url__, + "collapse_navigation": False, + "display_version": True, + "logo_only": False, +} + +html_logo = "_static/images/logo.svg" + +html_favicon = "_static/images/icon.svg" + +# Add any paths that contain custom static files (such as style sheets) here, +# relative to this directory. They are copied after the builtin static files, +# so a file named "default.css" will overwrite the builtin "default.css". +html_static_path = ["_templates", "_static"] + +# Custom sidebar templates, must be a dictionary that maps document names +# to template names. +# +# The default sidebars (for documents that don't match any pattern) are +# defined by theme itself. 
Builtin themes are using these templates by +# default: ``['localtoc.html', 'relations.html', 'sourcelink.html', +# 'searchbox.html']``. +# +# html_sidebars = {} + +# -- Options for HTMLHelp output --------------------------------------------- + +# Output file base name for HTML help builder. +htmlhelp_basename = project + "-doc" + +# -- Options for LaTeX output ------------------------------------------------ + +latex_elements = { + # The paper size ('letterpaper' or 'a4paper'). + # 'papersize': 'letterpaper', + # The font size ('10pt', '11pt' or '12pt'). + # 'pointsize': '10pt', + # Additional stuff for the LaTeX preamble. + # 'preamble': '', + # Latex figure (float) alignment + "figure_align": "htbp" +} + +# Grouping the document tree into LaTeX files. List of tuples +# (source start file, target name, title, +# author, documentclass [howto, manual, or own class]). +latex_documents = [(master_doc, project + ".tex", project + " Documentation", author, "manual")] + +# -- Options for manual page output ------------------------------------------ + +# One entry per manual page. List of tuples +# (source start file, name, description, authors, manual section). +man_pages = [(master_doc, project, project + " Documentation", [author], 1)] + +# -- Options for Texinfo output ---------------------------------------------- + +# Grouping the document tree into Texinfo files. List of tuples +# (source start file, target name, title, author, +# dir menu entry, description, category) +texinfo_documents = [ + ( + master_doc, + project, + project + " Documentation", + author, + project, + "One line description of project.", + "Miscellaneous", + ) +] + +# -- Options for Epub output ------------------------------------------------- + +# Bibliographic Dublin Core info. +epub_title = project + +# The unique identifier of the text. This can be a ISBN number +# or the project homepage. +# +# epub_identifier = '' + +# A unique identification for the text. 
+# +# epub_uid = '' + +# A list of files that should not be packed into the epub file. +epub_exclude_files = ["search.html"] + +# -- Extension configuration ------------------------------------------------- + +# -- Options for intersphinx extension --------------------------------------- + +intersphinx_mapping = { + "python": ("https://docs.python.org/3", None), + "torch": ("https://pytorch.org/docs/stable/", None), + "numpy": ("https://numpy.org/doc/stable/", None), + "PIL": ("https://pillow.readthedocs.io/en/stable/", None), + "torchmetrics": ("https://torchmetrics.readthedocs.io/en/stable/", None), + "graphcore": ("https://docs.graphcore.ai/en/latest/", None), + "habana": ("https://lightning-ai.github.io/lightning-Habana/", None), +} + +# -- Options for todo extension ---------------------------------------------- + +# If true, `todo` and `todoList` produce output, else they produce nothing. +# todo_include_todos = True +todo_include_todos = False + + +def setup(app): + """Register the ``copybutton.js`` script and the ``main.css`` stylesheet with the Sphinx application ``app``.""" + # this is for hiding doctest decoration, + # see: http://z4r.github.io/python/2011/12/02/hides-the-prompts-and-output/ + app.add_js_file("copybutton.js") + app.add_css_file("main.css") + + +# copy all notebooks to local folder +# path_nbs = os.path.join(PATH_HERE, 'notebooks') +# if not os.path.isdir(path_nbs): +# os.mkdir(path_nbs) +# for path_ipynb in glob.glob(os.path.join(PATH_ROOT, 'notebooks', '*.ipynb')): +# path_ipynb2 = os.path.join(path_nbs, os.path.basename(path_ipynb)) +# shutil.copy(path_ipynb, path_ipynb2) + + +# Ignoring Third-party packages +# https://stackoverflow.com/questions/15889621/sphinx-how-to-exclude-imports-in-automodule +def package_list_from_file(file): + """Return the package names listed in the requirements file ``file``, cut at the first version specifier, extras bracket or comment; lines that end up empty are skipped.""" + mocked_packages = [] + with open(file) as fp: + for ln in fp.readlines(): + # Example: `tqdm>=4.41.0` => `tqdm` + # `[` is for package with extras + found = [ln.index(ch) for ch in list(",=<>#[") if ch in ln] + pkg = ln[:
min(found)] if found else ln + if pkg.rstrip(): + mocked_packages.append(pkg.rstrip()) + return mocked_packages + + +# define mapping from PyPI names to python imports +PACKAGE_MAPPING = { + "Pillow": "PIL", + "opencv-python": "cv2", + "PyYAML": "yaml", + "hydra-core": "hydra", +} +MOCK_PACKAGES = [] +if SPHINX_MOCK_REQUIREMENTS: + _path_require = lambda fname: os.path.join(_PATH_ROOT, "requirements", "pytorch", fname) + # mock also base packages when we are on RTD since we don't install them there + MOCK_PACKAGES += package_list_from_file(_path_require("base.txt")) + MOCK_PACKAGES += package_list_from_file(_path_require("extra.txt")) + MOCK_PACKAGES += package_list_from_file(_path_require("strategies.txt")) +MOCK_PACKAGES = [PACKAGE_MAPPING.get(pkg, pkg) for pkg in MOCK_PACKAGES] + +autodoc_mock_imports = MOCK_PACKAGES + +autosummary_generate = True + +autodoc_member_order = "groupwise" + +autoclass_content = "both" + +autodoc_default_options = { + "members": True, + "methods": True, + "special-members": "__call__", + "exclude-members": "_abc_impl", + "show-inheritance": True, +} + +# Sphinx will add “permalinks” for each heading and description environment as paragraph signs that +# become visible when the mouse hovers over them. +# This value determines the text for the permalink; it defaults to "¶". Set it to None or the empty +# string to disable permalinks. +# https://www.sphinx-doc.org/en/master/usage/configuration.html#confval-html_add_permalinks +html_permalinks = True +html_permalinks_icon = "¶" + +# True to prefix each section label with the name of the document it is in, followed by a colon. +# For example, index:Introduction for a section called Introduction that appears in document index.rst. +# Useful for avoiding ambiguity when the same section heading appears in different documents. +# http://www.sphinx-doc.org/en/master/usage/extensions/autosectionlabel.html +autosectionlabel_prefix_document = True + +# only run doctests marked with a ".. 
doctest::" directive +doctest_test_doctest_blocks = "" +doctest_global_setup = """ +import importlib +import os +import sys +from typing import Optional + +import torch +import lightning.pytorch as pl +from torch import nn +from torch.utils.data import IterableDataset, DataLoader, Dataset +from lightning.pytorch import LightningDataModule, LightningModule, Trainer, seed_everything +from lightning.pytorch.callbacks import Callback +from lightning.pytorch.cli import _JSONARGPARSE_SIGNATURES_AVAILABLE as _JSONARGPARSE_AVAILABLE +from lightning.pytorch.utilities import _TORCHVISION_AVAILABLE +from lightning.fabric.loggers.tensorboard import _TENSORBOARD_AVAILABLE, _TENSORBOARDX_AVAILABLE +from lightning.pytorch.loggers.neptune import _NEPTUNE_AVAILABLE +from lightning.pytorch.loggers.comet import _COMET_AVAILABLE +from lightning.pytorch.loggers.mlflow import _MLFLOW_AVAILABLE +from lightning.pytorch.loggers.wandb import _WANDB_AVAILABLE +""" +coverage_skip_undoc_in_source = True + +# skip false positive linkcheck errors from anchors +linkcheck_anchors = False + +# ignore all links in any CHANGELOG file +linkcheck_exclude_documents = [r"^(.*\/)*CHANGELOG.*$"] + +# ignore the following relative links (false positive errors during linkcheck) +linkcheck_ignore = [ + r"^starter/installation.html$", + r"^installation.html$", + r"^../cli/lightning_cli.html$", + r"^../common/trainer.html#trainer-flags$", +] diff --git a/source/debug/debugging.rst b/docs/source-pytorch/debug/debugging.rst similarity index 100% rename from source/debug/debugging.rst rename to docs/source-pytorch/debug/debugging.rst diff --git a/source/debug/debugging_advanced.rst b/docs/source-pytorch/debug/debugging_advanced.rst similarity index 99% rename from source/debug/debugging_advanced.rst rename to docs/source-pytorch/debug/debugging_advanced.rst index 0c1685a..444e947 100644 --- a/source/debug/debugging_advanced.rst +++ b/docs/source-pytorch/debug/debugging_advanced.rst @@ -25,7 +25,6 @@ or use regular 
print statements. class LitModel(LightningModule): def training_step(self, batch, batch_idx): - debugging_message = ... print(f"RANK - {self.trainer.global_rank}: {debugging_message}") diff --git a/source/debug/debugging_basic.rst b/docs/source-pytorch/debug/debugging_basic.rst similarity index 82% rename from source/debug/debugging_basic.rst rename to docs/source-pytorch/debug/debugging_basic.rst index 147285f..09075c1 100644 --- a/source/debug/debugging_basic.rst +++ b/docs/source-pytorch/debug/debugging_basic.rst @@ -5,13 +5,13 @@ ######################## Debug your model (basic) ######################## -**Audience**: Users who want to learn the basics of debugging models. -.. raw:: html +**Audience**: Users who want to learn the basics of debugging models. - +.. video:: ../_static/fetched-s3-assets/Trainer+flags+7-+debugging_1.mp4 + :poster: ../_static/fetched-s3-assets/thumb_debugging.png + :width: 400 + :muted: ---- @@ -36,7 +36,7 @@ A breakpoint stops your code execution so you can inspect variables, etc... and import pdb pdb.set_trace() - y = x ** 2 + y = x**2 In this example, the code will stop before executing the ``y = x**2`` line. @@ -47,7 +47,7 @@ Run all your model code once quickly ************************************ If you've ever trained a model for days only to crash during validation or testing then this trainer argument is about to become your best friend. -The :paramref:`~pytorch_lightning.trainer.trainer.Trainer.fast_dev_run` argument in the trainer runs 5 batch of training, validation, test and prediction data through your trainer to see if there are any bugs: +The :paramref:`~lightning.pytorch.trainer.trainer.Trainer.fast_dev_run` argument in the trainer runs 5 batch of training, validation, test and prediction data through your trainer to see if there are any bugs: .. code:: python @@ -63,8 +63,8 @@ To change how many batches to use, change the argument to an integer. Here we ru .. 
note:: This argument will disable tuner, checkpoint callbacks, early stopping callbacks, - loggers and logger callbacks like :class:`~pytorch_lightning.callbacks.lr_monitor.LearningRateMonitor` and - :class:`~pytorch_lightning.callbacks.device_stats_monitor.DeviceStatsMonitor`. + loggers and logger callbacks like :class:`~lightning.pytorch.callbacks.lr_monitor.LearningRateMonitor` and + :class:`~lightning.pytorch.callbacks.device_stats_monitor.DeviceStatsMonitor`. ---- @@ -92,8 +92,8 @@ Run a Sanity Check Lightning runs **2** steps of validation in the beginning of training. This avoids crashing in the validation loop sometime deep into a lengthy training loop. -(See: :paramref:`~pytorch_lightning.trainer.trainer.Trainer.num_sanity_val_steps` -argument of :class:`~pytorch_lightning.trainer.trainer.Trainer`) +(See: :paramref:`~lightning.pytorch.trainer.trainer.Trainer.num_sanity_val_steps` +argument of :class:`~lightning.pytorch.trainer.trainer.Trainer`) .. testcode:: @@ -120,14 +120,24 @@ this generate a table like: 1 | net.0 | Linear | 131 K 2 | net.1 | BatchNorm1d | 1.0 K -To add the child modules to the summary add a :class:`~pytorch_lightning.callbacks.model_summary.ModelSummary`: +To add the child modules to the summary add a :class:`~lightning.pytorch.callbacks.model_summary.ModelSummary`: .. testcode:: - from pytorch_lightning.callbacks import ModelSummary + from lightning.pytorch.callbacks import ModelSummary trainer = Trainer(callbacks=[ModelSummary(max_depth=-1)]) +To print the model summary if ``.fit()`` is not called: + +.. code-block:: python + + from lightning.pytorch.utilities.model_summary import ModelSummary + + model = LitModel() + summary = ModelSummary(model, max_depth=-1) + print(summary) + To turn off the autosummary use: .. 
code:: python diff --git a/docs/source-pytorch/debug/debugging_intermediate.rst b/docs/source-pytorch/debug/debugging_intermediate.rst new file mode 100644 index 0000000..9895223 --- /dev/null +++ b/docs/source-pytorch/debug/debugging_intermediate.rst @@ -0,0 +1,90 @@ +:orphan: + +.. _debugging_intermediate: + + +############################### +Debug your model (intermediate) +############################### +**Audience**: Users who want to debug their ML code + +---- + +*************************** +Why should I debug ML code? +*************************** +Machine learning code requires debugging mathematical correctness, which is not something non-ML code has to deal with. Lightning implements a few best-practice techniques to give all users, expert level ML debugging abilities. + +---- + +************************************** +Overfit your model on a Subset of Data +************************************** +A good debugging technique is to take a tiny portion of your data (say 2 samples per class), +and try to get your model to overfit. If it can't, it's a sign it won't work with large datasets. + +(See: :paramref:`~lightning.pytorch.trainer.trainer.Trainer.overfit_batches` +argument of :class:`~lightning.pytorch.trainer.trainer.Trainer`) + +.. testcode:: + + # use only 1% of training data (and turn off validation) + trainer = Trainer(overfit_batches=0.01) + + # similar, but with a fixed 10 batches + trainer = Trainer(overfit_batches=10) + +When using this argument, the validation loop will be disabled. We will also replace the sampler +in the training set to turn off shuffle for you. + +---- + +******************************** +Look-out for exploding gradients +******************************** +One major problem that plagues models is exploding gradients. +Gradient clipping is one technique that can help keep gradients from exploding. + +You can keep an eye on the gradient norm by logging it in your LightningModule: + +.. 
code-block:: python + + from lightning.pytorch.utilities import grad_norm + + + def on_before_optimizer_step(self, optimizer): + # Compute the 2-norm for each layer + # If using mixed precision, the gradients are already unscaled here + norms = grad_norm(self.layer, norm_type=2) + self.log_dict(norms) + + +This will plot the 2-norm of each layer to your experiment manager. +If you notice the norm is going up, there's a good chance your gradients will explode. + +One technique to stop exploding gradients is to clip the gradient when the norm is above a certain threshold: + +.. testcode:: + + # DEFAULT (ie: don't clip) + trainer = Trainer(gradient_clip_val=0) + + # clip gradients' global norm to <=0.5 using gradient_clip_algorithm='norm' by default + trainer = Trainer(gradient_clip_val=0.5) + + # clip gradients' maximum magnitude to <=0.5 + trainer = Trainer(gradient_clip_val=0.5, gradient_clip_algorithm="value") + +---- + +************************* +Detect autograd anomalies +************************* +Lightning helps you detect anomalies in the PyTorch autograd engine via PyTorch's built-in +`Anomaly Detection Context-manager `_. + +Enable it via the **detect_anomaly** trainer argument: + +.. testcode:: + + trainer = Trainer(detect_anomaly=True) diff --git a/source/deploy/production.rst b/docs/source-pytorch/deploy/production.rst similarity index 100% rename from source/deploy/production.rst rename to docs/source-pytorch/deploy/production.rst diff --git a/docs/source-pytorch/deploy/production_advanced.rst b/docs/source-pytorch/deploy/production_advanced.rst new file mode 100644 index 0000000..5e02423 --- /dev/null +++ b/docs/source-pytorch/deploy/production_advanced.rst @@ -0,0 +1,78 @@ +######################################## +Deploy models into production (advanced) +######################################## +**Audience**: Machine learning engineers optimizing models for enterprise-scale production environments.
+ +---- + +************************** +Compile your model to ONNX +************************** +`ONNX `_ is a package developed by Microsoft to optimize inference. ONNX allows the model to be independent of PyTorch and run on any ONNX Runtime. + +To export your model to ONNX format call the :meth:`~lightning.pytorch.core.module.LightningModule.to_onnx` function on your :class:`~lightning.pytorch.core.module.LightningModule` with the ``filepath`` and ``input_sample``. + +.. code-block:: python + + class SimpleModel(LightningModule): + def __init__(self): + super().__init__() + self.l1 = torch.nn.Linear(in_features=64, out_features=4) + + def forward(self, x): + return torch.relu(self.l1(x.view(x.size(0), -1))) + + + # create the model + model = SimpleModel() + filepath = "model.onnx" + input_sample = torch.randn((1, 64)) + model.to_onnx(filepath, input_sample, export_params=True) + +You can also skip passing the input sample if the ``example_input_array`` property is specified in your :class:`~lightning.pytorch.core.module.LightningModule`. + +.. code-block:: python + + class SimpleModel(LightningModule): + def __init__(self): + super().__init__() + self.l1 = torch.nn.Linear(in_features=64, out_features=4) + self.example_input_array = torch.randn(7, 64) + + def forward(self, x): + return torch.relu(self.l1(x.view(x.size(0), -1))) + + + # create the model + model = SimpleModel() + filepath = "model.onnx" + model.to_onnx(filepath, export_params=True) + +Once you have the exported model, you can run it on your ONNX runtime in the following way: + +.. code-block:: python + + import onnxruntime + + ort_session = onnxruntime.InferenceSession(filepath) + input_name = ort_session.get_inputs()[0].name + ort_inputs = {input_name: np.random.randn(1, 64)} + ort_outs = ort_session.run(None, ort_inputs) + +---- + +**************************** +Validate a Model Is Servable +**************************** + +.. warning:: This is an :ref:`experimental ` feature. 
+ +Production ML Engineers would argue that a model shouldn't be trained if it can't be deployed reliably and in a fully automated manner. + +In order to ease transition from training to production, PyTorch Lightning provides a way for you to validate a model can be served even before starting training. + +In order to do so, your LightningModule needs to subclass the :class:`~lightning.pytorch.serve.servable_module.ServableModule`, implement its hooks, and pass a :class:`~lightning.pytorch.serve.servable_module_validator.ServableModuleValidator` callback to the Trainer. + +Below you can find an example of how the serving of a resnet18 can be validated. + +.. literalinclude:: ../../../examples/pytorch/servable_module/production.py diff --git a/source/deploy/production_advanced_2.rst b/docs/source-pytorch/deploy/production_advanced_2.rst similarity index 90% rename from source/deploy/production_advanced_2.rst rename to docs/source-pytorch/deploy/production_advanced_2.rst index e86aee8..09014d2 100644 --- a/source/deploy/production_advanced_2.rst +++ b/docs/source-pytorch/deploy/production_advanced_2.rst @@ -11,7 +11,7 @@ Deploy models into production (advanced) Compile your model to TorchScript ********************************* `TorchScript `_ allows you to serialize your models in a way that it can be loaded in non-Python environments. -The ``LightningModule`` has a handy method :meth:`~pytorch_lightning.core.lightning.LightningModule.to_torchscript` that returns a scripted module which you +The ``LightningModule`` has a handy method :meth:`~lightning.pytorch.core.module.LightningModule.to_torchscript` that returns a scripted module which you can save or directly use. .. testcode:: python @@ -34,7 +34,7 @@ can save or directly use. It is recommended that you install the latest supported version of PyTorch to use this feature without limitations.
-Once you have the exported model, you can run it in Pytorch or C++ runtime: +Once you have the exported model, you can run it in PyTorch or C++ runtime: .. code-block:: python diff --git a/docs/source-pytorch/deploy/production_basic.rst b/docs/source-pytorch/deploy/production_basic.rst new file mode 100644 index 0000000..e03a2b5 --- /dev/null +++ b/docs/source-pytorch/deploy/production_basic.rst @@ -0,0 +1,102 @@ +##################################### +Deploy models into production (basic) +##################################### +**Audience**: All users. + +---- + +***************************** +Load a checkpoint and predict +***************************** +The easiest way to use a model for predictions is to load the weights using **load_from_checkpoint** found in the LightningModule. + +.. code-block:: python + + model = LitModel.load_from_checkpoint("best_model.ckpt") + model.eval() + x = torch.randn(1, 64) + + with torch.no_grad(): + y_hat = model(x) + +---- + +************************************** +Predict step with your LightningModule +************************************** +Loading a checkpoint and predicting still leaves you with a lot of boilerplate around the predict epoch. The **predict step** in the LightningModule removes this boilerplate. + +.. code-block:: python + + class MyModel(LightningModule): + def predict_step(self, batch, batch_idx, dataloader_idx=0): + return self(batch) + +And pass in any dataloader to the Lightning Trainer: + +.. code-block:: python + + data_loader = DataLoader(...) + model = MyModel() + trainer = Trainer() + predictions = trainer.predict(model, data_loader) + +---- + +******************************** +Enable complicated predict logic +******************************** +When you need to add complicated pre-processing or post-processing logic to your data use the predict step. For example here we do `Monte Carlo Dropout `_ for predictions: + +.. 
code-block:: python + + class LitMCdropoutModel(pl.LightningModule): + def __init__(self, model, mc_iteration): + super().__init__() + self.model = model + self.dropout = nn.Dropout() + self.mc_iteration = mc_iteration + + def predict_step(self, batch, batch_idx): + # enable Monte Carlo Dropout + self.dropout.train() + + # take average of `self.mc_iteration` iterations + pred = [self.dropout(self.model(x)).unsqueeze(0) for _ in range(self.mc_iteration)] + pred = torch.vstack(pred).mean(dim=0) + return pred + +---- + +**************************** +Enable distributed inference +**************************** +By using the predict step in Lightning you get free distributed inference using :class:`~lightning.pytorch.callbacks.prediction_writer.BasePredictionWriter`. + +.. code-block:: python + + import torch + from lightning.pytorch.callbacks import BasePredictionWriter + + + class CustomWriter(BasePredictionWriter): + def __init__(self, output_dir, write_interval): + super().__init__(write_interval) + self.output_dir = output_dir + + def write_on_epoch_end(self, trainer, pl_module, predictions, batch_indices): + # this will create N (num processes) files in `output_dir` each containing + # the predictions of its respective rank + torch.save(predictions, os.path.join(self.output_dir, f"predictions_{trainer.global_rank}.pt")) + + # optionally, you can also save `batch_indices` to get the information about the data index + # from your prediction data + torch.save(batch_indices, os.path.join(self.output_dir, f"batch_indices_{trainer.global_rank}.pt")) + + + # or you can set `write_interval="batch"` and override `write_on_batch_end` to save + # predictions at batch level + pred_writer = CustomWriter(output_dir="pred_path", write_interval="epoch") + trainer = Trainer(accelerator="gpu", strategy="ddp", devices=8, callbacks=[pred_writer]) + model = BoringModel() + trainer.predict(model, return_predictions=False) diff --git a/source/deploy/production_intermediate.rst
b/docs/source-pytorch/deploy/production_intermediate.rst similarity index 89% rename from source/deploy/production_intermediate.rst rename to docs/source-pytorch/deploy/production_intermediate.rst index eacb03d..61034b7 100644 --- a/source/deploy/production_intermediate.rst +++ b/docs/source-pytorch/deploy/production_intermediate.rst @@ -14,16 +14,15 @@ If you prefer to use PyTorch directly, feel free to use any Lightning checkpoint import torch - model = torch.load("path/to/lightning/checkpoint.ckpt") - model.eval() -You can also pull out the specific modules you want out of the checkpoint: + class MyModel(nn.Module): + ... -.. code-block:: python - model = torch.load("path/to/lightning/checkpoint.ckpt") - encoder = model["encoder"] - encoder.eval() + model = MyModel() + checkpoint = torch.load("path/to/lightning/checkpoint.ckpt") + model.load_state_dict(checkpoint["state_dict"]) + model.eval() ---- @@ -85,7 +84,7 @@ from your LightningModule ``init`` and ``forward`` method. # if you want to restore any hyperparameters, you can pass them too model = AutoEncoderProd(**hyper_parameters) - state_dict = checkpoint["state_dict"] + model_weights = checkpoint["state_dict"] # update keys by dropping `auto_encoder.` for key in list(model_weights): diff --git a/source/ecosystem/asr_nlp_tts.rst b/docs/source-pytorch/ecosystem/asr_nlp_tts.rst similarity index 99% rename from source/ecosystem/asr_nlp_tts.rst rename to docs/source-pytorch/ecosystem/asr_nlp_tts.rst index b624696..09d5bb0 100644 --- a/source/ecosystem/asr_nlp_tts.rst +++ b/docs/source-pytorch/ecosystem/asr_nlp_tts.rst @@ -48,7 +48,7 @@ so that each can be configured from .yaml or the Hydra CLI. .. note:: Every NeMo model has an example configuration file and a corresponding script that contains all configurations needed for training. -The end result of using NeMo, Pytorch Lightning, and Hydra is that +The end result of using NeMo, PyTorch Lightning, and Hydra is that NeMo models all have the same look and feel. 
This makes it easy to do Conversational AI research across multiple domains. NeMo models are also fully compatible with the PyTorch ecosystem. @@ -719,6 +719,7 @@ be customized with PyTorch Lightning since every NeMo model is a LightningModule """ ... + # NeMo models come with neural type checking @typecheck( input_types={ diff --git a/source/ecosystem/bolts.rst b/docs/source-pytorch/ecosystem/bolts.rst similarity index 98% rename from source/ecosystem/bolts.rst rename to docs/source-pytorch/ecosystem/bolts.rst index 56c7768..a82184d 100644 --- a/source/ecosystem/bolts.rst +++ b/docs/source-pytorch/ecosystem/bolts.rst @@ -83,7 +83,7 @@ We also have a collection of callbacks. .. code-block:: python from pl_bolts.callbacks import PrintTableMetricsCallback - import pytorch_lightning as pl + import lightning.pytorch as pl trainer = pl.Trainer(callbacks=[PrintTableMetricsCallback()]) diff --git a/source/ecosystem/community_examples.rst b/docs/source-pytorch/ecosystem/community_examples.rst similarity index 93% rename from source/ecosystem/community_examples.rst rename to docs/source-pytorch/ecosystem/community_examples.rst index f535857..bd95f21 100644 --- a/source/ecosystem/community_examples.rst +++ b/docs/source-pytorch/ecosystem/community_examples.rst @@ -4,8 +4,8 @@ Community Examples ================== -- `Lightning Bolts: Deep Learning components for extending PyTorch Lightning `_. -- `Lightning Flash: Your PyTorch AI Factory - Flash enables you to easily configure and run complex AI recipes `_. +- `Lightning Bolts: Deep Learning components for extending PyTorch Lightning `_. +- `Lightning Flash: Your PyTorch AI Factory - Flash enables you to easily configure and run complex AI recipes `_. 
- `Contextual Emotion Detection (DoubleDistilBert) `_ - `Cotatron: Transcription-Guided Speech Encoder `_ - `FasterRCNN object detection + Hydra `_ @@ -33,4 +33,4 @@ PyTorch Ecosystem Examples ========================== - `PyTorch Geometric: Deep learning on graphs and other irregular structures `_. -- `TorchIO, MONAI and Lightning for 3D medical image segmentation `_. +- `TorchIO, MONAI and Lightning for 3D medical image segmentation `_. diff --git a/source/ecosystem/ecosystem-ci.rst b/docs/source-pytorch/ecosystem/ecosystem-ci.rst similarity index 81% rename from source/ecosystem/ecosystem-ci.rst rename to docs/source-pytorch/ecosystem/ecosystem-ci.rst index 04ff342..5a4d7b0 100644 --- a/source/ecosystem/ecosystem-ci.rst +++ b/docs/source-pytorch/ecosystem/ecosystem-ci.rst @@ -3,7 +3,7 @@ Ecosystem CI ============ -`Ecosystem CI `_ automates issue discovery for your projects against Lightning nightly and releases. +`Ecosystem CI `_ automates issue discovery for your projects against Lightning nightly and releases. It is a lightweight repository that provides easy configuration of Continues Integration running on CPUs and GPUs. Any user who wants to keep their project aligned with current and future Lightning releases can use the EcoSystem CI to configure their integrations. Read more: `Stay Ahead of Breaking Changes with the New Lightning Ecosystem CI `_ @@ -23,8 +23,7 @@ Follow the instructions below to add a new project to the PyTorch Lightning ecos For GPU integrations, you only add the path to the config (OS/Linux and Python version is fixed) to be running with Azure pipelines. 4. Add a Contact to the ``.github/CODEOWNERS`` list for your organization folder or just a single project. 5. Create a Draft PR with all mentioned requirements. -6. Join our `Slack `_ (Optional) channel ``#alerts-ecosystem-ci`` to be notified if your project is breaking. +6. Join our `Discord `_ (Optional) channel ``#alerts-ecosystem-ci`` to be notified if your project is breaking. 
- -To learn more about Ecosystem CI, please refer to the `Ecosystem CI repo `_. +To learn more about Ecosystem CI, please refer to the `Ecosystem CI repo `_. Also, note that some particular implementation details described above may evolve over time. diff --git a/source/ecosystem/flash.rst b/docs/source-pytorch/ecosystem/flash.rst similarity index 100% rename from source/ecosystem/flash.rst rename to docs/source-pytorch/ecosystem/flash.rst diff --git a/source/ecosystem/metrics.rst b/docs/source-pytorch/ecosystem/metrics.rst similarity index 100% rename from source/ecosystem/metrics.rst rename to docs/source-pytorch/ecosystem/metrics.rst diff --git a/source/expertise_levels.rst b/docs/source-pytorch/expertise_levels.rst similarity index 82% rename from source/expertise_levels.rst rename to docs/source-pytorch/expertise_levels.rst index 9b563f7..3f98c8e 100644 --- a/source/expertise_levels.rst +++ b/docs/source-pytorch/expertise_levels.rst @@ -4,11 +4,6 @@ Level up ======== Learn enough Lightning to match the level of expertise required by your research or job. -.. join_slack:: - :align: left - :margin: 30 - ----- Basic skills ------------ @@ -97,15 +92,7 @@ Learn to scale up your models and enable collaborative model development at acad :tag: intermediate .. displayitem:: - :header: Level 8: Train in the background on the cloud - :description: Learn how to run models on the cloud in the background. - :button_link: levels/intermediate_level_8.html - :col_css: col-md-6 - :height: 150 - :tag: intermediate - -.. displayitem:: - :header: Level 9: Modularize your projects + :header: Level 8: Modularize your projects :description: Create DataModules to enable dataset reusability. :col_css: col-md-6 :button_link: levels/intermediate_level_9.html @@ -113,7 +100,7 @@ Learn to scale up your models and enable collaborative model development at acad :tag: intermediate .. 
displayitem:: - :header: Level 10: Understand your model + :header: Level 9: Understand your model :description: Use advanced visuals to find the best performing model. :col_css: col-md-6 :button_link: levels/intermediate_level_10.html @@ -121,7 +108,7 @@ Learn to scale up your models and enable collaborative model development at acad :tag: intermediate .. displayitem:: - :header: Level 11: Explore SOTA scaling techniques + :header: Level 10: Explore SOTA scaling techniques :description: Explore SOTA techniques to help convergence, stability and scalability. :col_css: col-md-6 :button_link: levels/intermediate_level_11.html @@ -129,7 +116,7 @@ Learn to scale up your models and enable collaborative model development at acad :tag: intermediate .. displayitem:: - :header: Level 12: Deploy your models + :header: Level 11: Deploy your models :description: Learn how to deploy your models with optimizations like ONNX and torchscript. :col_css: col-md-6 :button_link: levels/intermediate_level_12.html @@ -137,7 +124,7 @@ Learn to scale up your models and enable collaborative model development at acad :tag: intermediate .. displayitem:: - :header: Level 13: Optimize training speed + :header: Level 12: Optimize training speed :description: Use advanced profilers to mixed precision to train bigger models, faster. :col_css: col-md-6 :button_link: levels/intermediate_level_13.html @@ -145,7 +132,7 @@ Learn to scale up your models and enable collaborative model development at acad :tag: intermediate .. displayitem:: - :header: Level 14: Run on on-prem clusters + :header: Level 13: Run on on-prem clusters :description: Run on a custom on-prem cluster or SLURM cluster. :col_css: col-md-6 :button_link: levels/intermediate_level_14.html @@ -171,7 +158,7 @@ Configure all aspects of Lightning for advanced usecases. .. Add callout items below this line .. 
displayitem:: - :header: Level 15: Customize configs to run in production + :header: Level 14: Customize configs to run in production :description: Enable composable YAMLs :col_css: col-md-6 :button_link: levels/advanced_level_15.html @@ -179,7 +166,7 @@ Configure all aspects of Lightning for advanced usecases. :tag: advanced .. displayitem:: - :header: Level 16: Customize the trainer + :header: Level 15: Customize the trainer :description: Inject custom code into the trainer and modify the progress bar. :col_css: col-md-6 :button_link: levels/advanced_level_16.html @@ -187,7 +174,7 @@ Configure all aspects of Lightning for advanced usecases. :tag: advanced .. displayitem:: - :header: Level 17: Own the training loop + :header: Level 16: Own the training loop :description: Learn all the ways of owning your raw PyTorch loops with Lighting. :col_css: col-md-6 :button_link: levels/advanced_level_17.html @@ -195,7 +182,7 @@ Configure all aspects of Lightning for advanced usecases. :tag: advanced .. displayitem:: - :header: Level 18: Enable advanced checkpointing + :header: Level 17: Enable advanced checkpointing :description: Enable composable or cloud based checkpoints. :col_css: col-md-6 :button_link: levels/advanced_level_18.html @@ -203,7 +190,7 @@ Configure all aspects of Lightning for advanced usecases. :tag: advanced .. displayitem:: - :header: Level 19: Explore IPUs + :header: Level 18: Explore IPUs :description: Explore Intelligence Processing Unit (IPU) for model scaling. :col_css: col-md-6 :button_link: levels/advanced_level_19.html @@ -211,7 +198,7 @@ Configure all aspects of Lightning for advanced usecases. :tag: advanced .. displayitem:: - :header: Level 20: Explore HPUs + :header: Level 19: Explore HPUs :description: Explore Havana Gaudi Processing Unit (HPU) for model scaling. :col_css: col-md-6 :button_link: levels/advanced_level_20.html @@ -219,7 +206,7 @@ Configure all aspects of Lightning for advanced usecases. :tag: advanced .. 
displayitem:: - :header: Level 21: Master TPUs + :header: Level 20: Master TPUs :description: Master TPUs and run on cloud TPUs. :col_css: col-md-6 :button_link: levels/advanced_level_21.html @@ -227,7 +214,7 @@ Configure all aspects of Lightning for advanced usecases. :tag: advanced .. displayitem:: - :header: Level 22: Reach 1 trillion parameters on GPUs + :header: Level 21: Reach 1 trillion parameters on GPUs :description: Scale to 1 trillion params on GPUs. :col_css: col-md-6 :button_link: levels/advanced_level_22.html @@ -253,7 +240,7 @@ Customize and extend Lightning for things like custom hardware or distributed st .. Add callout items below this line .. displayitem:: - :header: Level 23: Extend the Lightning CLI + :header: Level 22: Extend the Lightning CLI :description: Extend the functionality of the Lightning CLI. :col_css: col-md-6 :button_link: levels/expert_level_23.html @@ -261,7 +248,7 @@ Customize and extend Lightning for things like custom hardware or distributed st :tag: expert .. displayitem:: - :header: Level 24: Integrate a custom cluster + :header: Level 23: Integrate a custom cluster :description: Integrate a custom cluster into Lightning. :col_css: col-md-6 :button_link: levels/expert_level_24.html @@ -269,15 +256,7 @@ Customize and extend Lightning for things like custom hardware or distributed st :tag: expert .. displayitem:: - :header: Level 25: Explore fault-tolerance in-depth - :description: Understand the details of fault-tolerance. - :col_css: col-md-6 - :button_link: clouds/fault_tolerant_training_faq.html - :height: 150 - :tag: expert - -.. displayitem:: - :header: Level 26: Make your own profiler + :header: Level 24: Make your own profiler :description: Make your own profiler. :col_css: col-md-6 :button_link: tuning/profiler_expert.html @@ -285,7 +264,7 @@ Customize and extend Lightning for things like custom hardware or distributed st :tag: expert .. 
displayitem:: - :header: Level 27: Add a new accelerator or Strategy + :header: Level 25: Add a new accelerator or Strategy :description: Integrate a new accelerator or distributed strategy. :col_css: col-md-6 :button_link: levels/expert_level_27.html diff --git a/source/extensions/accelerator.rst b/docs/source-pytorch/extensions/accelerator.rst similarity index 85% rename from source/extensions/accelerator.rst rename to docs/source-pytorch/extensions/accelerator.rst index dd5a067..fb71d37 100644 --- a/source/extensions/accelerator.rst +++ b/docs/source-pytorch/extensions/accelerator.rst @@ -4,19 +4,20 @@ Accelerator ########### -The Accelerator connects a Lightning Trainer to arbitrary hardware (CPUs, GPUs, TPUs, IPUs, ...). +The Accelerator connects a Lightning Trainer to arbitrary hardware (CPUs, GPUs, TPUs, IPUs, MPS, ...). Currently there are accelerators for: - CPU - :doc:`GPU <../accelerators/gpu>` - :doc:`TPU <../accelerators/tpu>` - :doc:`IPU <../accelerators/ipu>` -- :doc:`HPU <../accelerators/hpu>` +- :doc:`HPU <../integrations/hpu/index>` +- :doc:`MPS <../accelerators/mps>` The Accelerator is part of the Strategy which manages communication across multiple devices (distributed communication). Whenever the Trainer, the loops or any other component in Lightning needs to talk to hardware, it calls into the Strategy and the Strategy calls into the Accelerator. -.. image:: https://pl-public-data.s3.amazonaws.com/docs/static/images/strategies/overview.jpeg +.. image:: ../_static/fetched-s3-assets/overview.jpeg :alt: Illustration of the Strategy as a composition of the Accelerator and several plugins We expose Accelerators and Strategies mainly for expert users who want to extend Lightning to work with new @@ -28,6 +29,8 @@ hardware and distributed training or clusters. Create a Custom Accelerator --------------------------- +.. warning:: This is an :ref:`experimental ` feature. + Here is how you create a new Accelerator. 
Let's pretend we want to integrate the fictional XPU accelerator and we have access to its hardware through a library ``xpulib``. @@ -38,7 +41,7 @@ Let's pretend we want to integrate the fictional XPU accelerator and we have acc class XPUAccelerator(Accelerator): - """Experimental support for XPU, optimized for large-scale machine learning.""" + """Support for a hypothetical XPU, optimized for large-scale machine learning.""" @staticmethod def parse_devices(devices: Any) -> Any: @@ -69,7 +72,7 @@ Finally, add the XPUAccelerator to the Trainer: .. code-block:: python - from pytorch_lightning import Trainer + from lightning.pytorch import Trainer accelerator = XPUAccelerator() trainer = Trainer(accelerator=accelerator, devices=2) @@ -83,7 +86,7 @@ Finally, add the XPUAccelerator to the Trainer: Registering Accelerators ------------------------ -If you wish to switch to a custom accelerator from the CLI without code changes, you can implement the :meth:`~pytorch_lightning.accelerators.accelerator.Accelerator.register_accelerators` class method to register your new accelerator under a shorthand name like so: +If you wish to switch to a custom accelerator from the CLI without code changes, you can implement the :meth:`~lightning.pytorch.accelerators.accelerator.Accelerator.register_accelerators` class method to register your new accelerator under a shorthand name like so: .. code-block:: python @@ -116,7 +119,7 @@ Or if you are using the Lightning CLI, for example: Accelerator API --------------- -.. currentmodule:: pytorch_lightning.accelerators +.. currentmodule:: lightning.pytorch.accelerators .. 
autosummary:: :nosignatures: @@ -124,7 +127,6 @@ Accelerator API Accelerator CPUAccelerator - GPUAccelerator - HPUAccelerator - IPUAccelerator - TPUAccelerator + CUDAAccelerator + MPSAccelerator + XLAAccelerator diff --git a/docs/source-pytorch/extensions/callbacks.rst b/docs/source-pytorch/extensions/callbacks.rst new file mode 100644 index 0000000..0e43c23 --- /dev/null +++ b/docs/source-pytorch/extensions/callbacks.rst @@ -0,0 +1,368 @@ +.. role:: hidden + :class: hidden-section + +.. _callbacks: + +######## +Callback +######## + +Callbacks allow you to add arbitrary self-contained programs to your training. +At specific points during the flow of execution (hooks), the Callback interface allows you to design programs that encapsulate a full set of functionality. +It de-couples functionality that does not need to be in the :doc:`lightning module <../common/lightning_module>` and can be shared across projects. + +Lightning has a callback system to execute them when needed. Callbacks should capture NON-ESSENTIAL +logic that is NOT required for your :doc:`lightning module <../common/lightning_module>` to run. + +A complete list of Callback hooks can be found in :class:`~lightning.pytorch.callbacks.callback.Callback`. + +An overall Lightning system should have: + +1. Trainer for all engineering +2. LightningModule for all research code. +3. Callbacks for non-essential code. + +| + +Example: + +.. testcode:: + + from lightning.pytorch.callbacks import Callback + + + class MyPrintingCallback(Callback): + def on_train_start(self, trainer, pl_module): + print("Training is starting") + + def on_train_end(self, trainer, pl_module): + print("Training is ending") + + + trainer = Trainer(callbacks=[MyPrintingCallback()]) + +We successfully extended functionality without polluting our super clean +:doc:`lightning module <../common/lightning_module>` research code. + +You can do pretty much anything with callbacks. 
+ +-------------- + +****************** +Built-in Callbacks +****************** +Lightning has a few built-in callbacks. + +.. note:: + For a richer collection of callbacks, check out our + `bolts library `_. + +.. currentmodule:: lightning.pytorch.callbacks + +.. autosummary:: + :nosignatures: + :template: classtemplate.rst + + BackboneFinetuning + BaseFinetuning + BasePredictionWriter + BatchSizeFinder + Callback + DeviceStatsMonitor + EarlyStopping + GradientAccumulationScheduler + LambdaCallback + LearningRateFinder + LearningRateMonitor + ModelCheckpoint + ModelPruning + ModelSummary + ProgressBar + RichModelSummary + RichProgressBar + StochasticWeightAveraging + Timer + TQDMProgressBar + +---------- + +.. include:: callbacks_state.rst + +---------- + + +************** +Best Practices +************** +The following are best practices when using/designing callbacks. + +1. Callbacks should be isolated in their functionality. +2. Your callback should not rely on the behavior of other callbacks in order to work properly. +3. Do not manually call methods from the callback. +4. Directly calling methods (eg. `on_validation_end`) is strongly discouraged. +5. Whenever possible, your callbacks should not depend on the order in which they are executed. + + +----------- + +.. include:: entry_points.rst + +----------- + +.. _callback_hooks: + +************ +Callback API +************ +Here is the full API of methods available in the Callback base class. + +The :class:`~lightning.pytorch.callbacks.Callback` class is the base for all the callbacks in Lightning just like the :class:`~lightning.pytorch.core.module.LightningModule` is the base for all models. +It defines a public interface that each callback implementation must follow, the key ones are: + +Properties +========== + +state_key +^^^^^^^^^ + +.. autoattribute:: lightning.pytorch.callbacks.Callback.state_key + :noindex: + + +Hooks +===== + +setup +^^^^^ + +.. 
automethod:: lightning.pytorch.callbacks.Callback.setup + :noindex: + +teardown +^^^^^^^^ + +.. automethod:: lightning.pytorch.callbacks.Callback.teardown + :noindex: + +on_fit_start +^^^^^^^^^^^^ + +.. automethod:: lightning.pytorch.callbacks.Callback.on_fit_start + :noindex: + +on_fit_end +^^^^^^^^^^ + +.. automethod:: lightning.pytorch.callbacks.Callback.on_fit_end + :noindex: + +on_sanity_check_start +^^^^^^^^^^^^^^^^^^^^^ + +.. automethod:: lightning.pytorch.callbacks.Callback.on_sanity_check_start + :noindex: + +on_sanity_check_end +^^^^^^^^^^^^^^^^^^^ + +.. automethod:: lightning.pytorch.callbacks.Callback.on_sanity_check_end + :noindex: + +on_train_batch_start +^^^^^^^^^^^^^^^^^^^^ + +.. automethod:: lightning.pytorch.callbacks.Callback.on_train_batch_start + :noindex: + +on_train_batch_end +^^^^^^^^^^^^^^^^^^ + +.. automethod:: lightning.pytorch.callbacks.Callback.on_train_batch_end + :noindex: + +on_train_epoch_start +^^^^^^^^^^^^^^^^^^^^ + +.. automethod:: lightning.pytorch.callbacks.Callback.on_train_epoch_start + :noindex: + +on_train_epoch_end +^^^^^^^^^^^^^^^^^^ + +.. automethod:: lightning.pytorch.callbacks.Callback.on_train_epoch_end + :noindex: + +on_validation_epoch_start +^^^^^^^^^^^^^^^^^^^^^^^^^ + +.. automethod:: lightning.pytorch.callbacks.Callback.on_validation_epoch_start + :noindex: + +on_validation_epoch_end +^^^^^^^^^^^^^^^^^^^^^^^ + +.. automethod:: lightning.pytorch.callbacks.Callback.on_validation_epoch_end + :noindex: + +on_test_epoch_start +^^^^^^^^^^^^^^^^^^^ + +.. automethod:: lightning.pytorch.callbacks.Callback.on_test_epoch_start + :noindex: + +on_test_epoch_end +^^^^^^^^^^^^^^^^^ + +.. automethod:: lightning.pytorch.callbacks.Callback.on_test_epoch_end + :noindex: + +on_predict_epoch_start +^^^^^^^^^^^^^^^^^^^^^^ + +.. automethod:: lightning.pytorch.callbacks.Callback.on_predict_epoch_start + :noindex: + +on_predict_epoch_end +^^^^^^^^^^^^^^^^^^^^ + +.. 
automethod:: lightning.pytorch.callbacks.Callback.on_predict_epoch_end + :noindex: + +on_validation_batch_start +^^^^^^^^^^^^^^^^^^^^^^^^^ + +.. automethod:: lightning.pytorch.callbacks.Callback.on_validation_batch_start + :noindex: + +on_validation_batch_end +^^^^^^^^^^^^^^^^^^^^^^^ + +.. automethod:: lightning.pytorch.callbacks.Callback.on_validation_batch_end + :noindex: + +on_test_batch_start +^^^^^^^^^^^^^^^^^^^ + +.. automethod:: lightning.pytorch.callbacks.Callback.on_test_batch_start + :noindex: + +on_test_batch_end +^^^^^^^^^^^^^^^^^ + +.. automethod:: lightning.pytorch.callbacks.Callback.on_test_batch_end + :noindex: + +on_predict_batch_start +^^^^^^^^^^^^^^^^^^^^^^ + +.. automethod:: lightning.pytorch.callbacks.Callback.on_predict_batch_start + :noindex: + +on_predict_batch_end +^^^^^^^^^^^^^^^^^^^^ + +.. automethod:: lightning.pytorch.callbacks.Callback.on_predict_batch_end + :noindex: + +on_train_start +^^^^^^^^^^^^^^ + +.. automethod:: lightning.pytorch.callbacks.Callback.on_train_start + :noindex: + +on_train_end +^^^^^^^^^^^^ + +.. automethod:: lightning.pytorch.callbacks.Callback.on_train_end + :noindex: + +on_validation_start +^^^^^^^^^^^^^^^^^^^ + +.. automethod:: lightning.pytorch.callbacks.Callback.on_validation_start + :noindex: + +on_validation_end +^^^^^^^^^^^^^^^^^ + +.. automethod:: lightning.pytorch.callbacks.Callback.on_validation_end + :noindex: + +on_test_start +^^^^^^^^^^^^^ + +.. automethod:: lightning.pytorch.callbacks.Callback.on_test_start + :noindex: + +on_test_end +^^^^^^^^^^^ + +.. automethod:: lightning.pytorch.callbacks.Callback.on_test_end + :noindex: + +on_predict_start +^^^^^^^^^^^^^^^^ + +.. automethod:: lightning.pytorch.callbacks.Callback.on_predict_start + :noindex: + +on_predict_end +^^^^^^^^^^^^^^ + +.. automethod:: lightning.pytorch.callbacks.Callback.on_predict_end + :noindex: + + +on_exception +^^^^^^^^^^^^ + +.. 
automethod:: lightning.pytorch.callbacks.Callback.on_exception + :noindex: + +state_dict +^^^^^^^^^^ + +.. automethod:: lightning.pytorch.callbacks.Callback.state_dict + :noindex: + +on_save_checkpoint +^^^^^^^^^^^^^^^^^^ + +.. automethod:: lightning.pytorch.callbacks.Callback.on_save_checkpoint + :noindex: + +load_state_dict +^^^^^^^^^^^^^^^ + +.. automethod:: lightning.pytorch.callbacks.Callback.load_state_dict + :noindex: + +on_load_checkpoint +^^^^^^^^^^^^^^^^^^ + +.. automethod:: lightning.pytorch.callbacks.Callback.on_load_checkpoint + :noindex: + +on_before_backward +^^^^^^^^^^^^^^^^^^ + +.. automethod:: lightning.pytorch.callbacks.Callback.on_before_backward + :noindex: + +on_after_backward +^^^^^^^^^^^^^^^^^ + +.. automethod:: lightning.pytorch.callbacks.Callback.on_after_backward + :noindex: + +on_before_optimizer_step +^^^^^^^^^^^^^^^^^^^^^^^^ + +.. automethod:: lightning.pytorch.callbacks.Callback.on_before_optimizer_step + :noindex: + +on_before_zero_grad +^^^^^^^^^^^^^^^^^^^ + +.. automethod:: lightning.pytorch.callbacks.Callback.on_before_zero_grad + :noindex: diff --git a/source/extensions/callbacks_state.rst b/docs/source-pytorch/extensions/callbacks_state.rst similarity index 84% rename from source/extensions/callbacks_state.rst rename to docs/source-pytorch/extensions/callbacks_state.rst index 0a104ca..c83f373 100644 --- a/source/extensions/callbacks_state.rst +++ b/docs/source-pytorch/extensions/callbacks_state.rst @@ -4,12 +4,12 @@ Save Callback state Some callbacks require internal state in order to function properly. You can optionally choose to persist your callback's state as part of model checkpoint files using -:meth:`~pytorch_lightning.callbacks.Callback.state_dict` and :meth:`~pytorch_lightning.callbacks.Callback.load_state_dict`. +:meth:`~lightning.pytorch.callbacks.Callback.state_dict` and :meth:`~lightning.pytorch.callbacks.Callback.load_state_dict`. Note that the returned state must be able to be pickled. 
When your callback is meant to be used only as a singleton callback then implementing the above two hooks is enough to persist state effectively. However, if passing multiple instances of the callback to the Trainer is supported, then -the callback must define a :attr:`~pytorch_lightning.callbacks.Callback.state_key` property in order for Lightning +the callback must define a :attr:`~lightning.pytorch.callbacks.Callback.state_key` property in order for Lightning to be able to distinguish the different states when loading the callback state. This concept is best illustrated by the following example. @@ -22,9 +22,9 @@ the following example. self.state = {"epochs": 0, "batches": 0} @property - def state_key(self): + def state_key(self) -> str: # note: we do not include `verbose` here on purpose - return self._generate_state_key(what=self.what) + return f"Counter[what={self.what}]" def on_train_epoch_end(self, *args, **kwargs): if self.what == "epochs": @@ -57,6 +57,6 @@ A Lightning checkpoint from this Trainer with the two stateful callbacks will in } } -The implementation of a :attr:`~pytorch_lightning.callbacks.Callback.state_key` is essential here. If it were missing, -Lightning would not be able to disambiguate the state for these two callbacks, and :attr:`~pytorch_lightning.callbacks.Callback.state_key` +The implementation of a :attr:`~lightning.pytorch.callbacks.Callback.state_key` is essential here. If it were missing, +Lightning would not be able to disambiguate the state for these two callbacks, and :attr:`~lightning.pytorch.callbacks.Callback.state_key` by default only defines the class name as the key, e.g., here ``Counter``. 
diff --git a/source/extensions/datamodules_state.rst b/docs/source-pytorch/extensions/datamodules_state.rst similarity index 100% rename from source/extensions/datamodules_state.rst rename to docs/source-pytorch/extensions/datamodules_state.rst diff --git a/docs/source-pytorch/extensions/entry_points.rst b/docs/source-pytorch/extensions/entry_points.rst new file mode 100644 index 0000000..bf1279a --- /dev/null +++ b/docs/source-pytorch/extensions/entry_points.rst @@ -0,0 +1,45 @@ +************ +Entry Points +************ + +Lightning supports registering Trainer callbacks directly through +`Entry Points `_. Entry points allow an arbitrary +package to include callbacks that the Lightning Trainer can automatically use, without you having to add them +to the Trainer manually. This is useful in production environments where it is common to provide specialized monitoring +and logging callbacks globally for every application. + +Here is a callback factory function that returns two special callbacks: + +.. code-block:: python + :caption: factories.py + + def my_custom_callbacks_factory(): + return [MyCallback1(), MyCallback2()] + +If we make this `factories.py` file into an installable package, we can define an **entry point** for this factory function. +Here is a minimal example of the `setup.py` file for the package `my-package`: + +.. code-block:: python + :caption: setup.py + + from setuptools import setup + + setup( + name="my-package", + version="0.0.1", + install_requires=["lightning"], + entry_points={ + "lightning.pytorch.callbacks_factory": [ + # The format here must be [any name]=[module path]:[function name] + "monitor_callbacks=factories:my_custom_callbacks_factory" + ] + }, + ) + +The group name for the entry points is ``lightning.pytorch.callbacks_factory`` and it contains a list of strings that +specify where to find the function within the package. 
+ +Now, if you `pip install -e .` this package, it will register the ``my_custom_callbacks_factory`` function and Lightning +will automatically call it to collect the callbacks whenever you run the Trainer! + +To unregister the factory, simply uninstall the package with `pip uninstall "my-package"`. diff --git a/docs/source-pytorch/extensions/logging.rst b/docs/source-pytorch/extensions/logging.rst new file mode 100644 index 0000000..a96e332 --- /dev/null +++ b/docs/source-pytorch/extensions/logging.rst @@ -0,0 +1,408 @@ +:orphan: + +.. testsetup:: * + + from lightning.pytorch import loggers as pl_loggers + +.. role:: hidden + :class: hidden-section + +.. _logging: + + +####### +Logging +####### + +***************** +Supported Loggers +***************** + +The following are loggers we support: + +.. currentmodule:: lightning.pytorch.loggers + +.. autosummary:: + :toctree: generated + :nosignatures: + :template: classtemplate.rst + + CometLogger + CSVLogger + MLFlowLogger + NeptuneLogger + TensorBoardLogger + WandbLogger + + +The above loggers will normally plot an additional chart (**global_step VS epoch**). Depending on the loggers you use, there might be some additional charts too. + +By default, Lightning uses ``TensorBoard`` logger under the hood, and stores the logs to a directory (by default in ``lightning_logs/``). + +.. testcode:: + + from lightning.pytorch import Trainer + + # Automatically logs to a directory (by default ``lightning_logs/``) + trainer = Trainer() + +To see your logs: + +.. code-block:: bash + + tensorboard --logdir=lightning_logs/ + +To visualize tensorboard in a jupyter notebook environment, run the following command in a jupyter cell: + +.. code-block:: bash + + %reload_ext tensorboard + %tensorboard --logdir=lightning_logs/ + +You can also pass a custom Logger to the :class:`~lightning.pytorch.trainer.trainer.Trainer`. + +.. 
testcode:: + :skipif: not _TENSORBOARD_AVAILABLE and not _TENSORBOARDX_AVAILABLE + + from lightning.pytorch import loggers as pl_loggers + + tb_logger = pl_loggers.TensorBoardLogger(save_dir="logs/") + trainer = Trainer(logger=tb_logger) + +Choose from any of the others such as MLflow, Comet, Neptune, WandB, etc. + +.. testcode:: + :skipif: not _COMET_AVAILABLE + + comet_logger = pl_loggers.CometLogger(save_dir="logs/") + trainer = Trainer(logger=comet_logger) + +To use multiple loggers, simply pass in a ``list`` or ``tuple`` of loggers. + +.. testcode:: + :skipif: (not _TENSORBOARD_AVAILABLE and not _TENSORBOARDX_AVAILABLE) or not _COMET_AVAILABLE + + tb_logger = pl_loggers.TensorBoardLogger(save_dir="logs/") + comet_logger = pl_loggers.CometLogger(save_dir="logs/") + trainer = Trainer(logger=[tb_logger, comet_logger]) + +.. note:: + + By default, Lightning logs every 50 steps. Use Trainer flags to :ref:`logging_frequency`. + +.. note:: + + By default, all loggers log to ``os.getcwd()``. You can change the logging path using + ``Trainer(default_root_dir="/your/path/to/save/checkpoints")`` without instantiating a logger. + +---------- + +****************************** +Logging from a LightningModule +****************************** + +Lightning offers automatic log functionalities for logging scalars, or manual logging for anything else. + +Automatic Logging +================= + +Use the :meth:`~lightning.pytorch.core.module.LightningModule.log` or :meth:`~lightning.pytorch.core.module.LightningModule.log_dict` +methods to log from anywhere in a :doc:`LightningModule <../common/lightning_module>` and :doc:`callbacks <../extensions/callbacks>`. + +.. code-block:: python + + def training_step(self, batch, batch_idx): + self.log("my_metric", x) + + + # or a dict to log all metrics at once with individual plots + def training_step(self, batch, batch_idx): + self.log_dict({"acc": acc, "recall": recall}) + +.. 
note:: + Everything explained below applies to both :meth:`~lightning.pytorch.core.module.LightningModule.log` or :meth:`~lightning.pytorch.core.module.LightningModule.log_dict` methods. + +Depending on where the :meth:`~lightning.pytorch.core.module.LightningModule.log` method is called, Lightning auto-determines +the correct logging mode for you. Of course you can override the default behavior by manually setting the +:meth:`~lightning.pytorch.core.module.LightningModule.log` parameters. + +.. code-block:: python + + def training_step(self, batch, batch_idx): + self.log("my_loss", loss, on_step=True, on_epoch=True, prog_bar=True, logger=True) + +The :meth:`~lightning.pytorch.core.module.LightningModule.log` method has a few options: + +* ``on_step``: Logs the metric at the current step. +* ``on_epoch``: Automatically accumulates and logs at the end of the epoch. +* ``prog_bar``: Logs to the progress bar (Default: ``False``). +* ``logger``: Logs to the logger like ``Tensorboard``, or any other custom logger passed to the :class:`~lightning.pytorch.trainer.trainer.Trainer` (Default: ``True``). +* ``reduce_fx``: Reduction function over step values for end of epoch. Uses :meth:`torch.mean` by default and is not applied when a :class:`torchmetrics.Metric` is logged. +* ``enable_graph``: If True, will not auto detach the graph. +* ``sync_dist``: If True, reduces the metric across devices. Use with care as this may lead to a significant communication overhead. +* ``sync_dist_group``: The DDP group to sync across. +* ``add_dataloader_idx``: If True, appends the index of the current dataloader to the name (when using multiple dataloaders). If False, user needs to give unique names for each dataloader to not mix the values. +* ``batch_size``: Current batch size used for accumulating logs logged with ``on_epoch=True``. This will be directly inferred from the loaded batch, but for some data structures you might need to explicitly provide it. 
+* ``rank_zero_only``: Whether the value will be logged only on rank 0. This will prevent synchronization which would produce a deadlock as not all processes would perform this log call. + +.. list-table:: Default behavior of logging in Callback or LightningModule + :widths: 50 25 25 + :header-rows: 1 + + * - Hook + - on_step + - on_epoch + * - on_train_start, on_train_epoch_start, on_train_epoch_end + - False + - True + * - on_before_backward, on_after_backward, on_before_optimizer_step, on_before_zero_grad + - True + - False + * - on_train_batch_start, on_train_batch_end, training_step + - True + - False + * - on_validation_start, on_validation_epoch_start, on_validation_epoch_end + - False + - True + * - on_validation_batch_start, on_validation_batch_end, validation_step + - False + - True + + +.. note:: + + While logging tensor metrics with ``on_epoch=True`` inside step-level hooks and using mean-reduction (default) to accumulate the metrics across the current epoch, Lightning tries to extract the + batch size from the current batch. If multiple possible batch sizes are found, a warning is logged and if it fails to extract the batch size from the current batch, which is possible if + the batch is a custom structure/collection, then an error is raised. To avoid this, you can specify the ``batch_size`` inside the ``self.log(... batch_size=batch_size)`` call. + + .. code-block:: python + + def training_step(self, batch, batch_idx): + # extracts the batch size from `batch` + self.log("train_loss", loss, on_epoch=True) + + + def validation_step(self, batch, batch_idx): + # uses `batch_size=10` + self.log("val_loss", loss, batch_size=10) + +.. note:: + + - The above config for ``validation`` applies for ``test`` hooks as well. + + - Setting ``on_epoch=True`` will cache all your logged values during the full training epoch and perform a + reduction in ``on_train_epoch_end``. We recommend using `TorchMetrics `_, when working with custom reduction. 
+ + - Setting both ``on_step=True`` and ``on_epoch=True`` will create two keys per metric you log with + suffix ``_step`` and ``_epoch`` respectively. You can refer to these keys e.g. in the `monitor` + argument of :class:`~lightning.pytorch.callbacks.model_checkpoint.ModelCheckpoint` or in the graphs plotted to the logger of your choice. + + +If your work requires to log in an unsupported method, please open an issue with a clear description of why it is blocking you. + + +Manual Logging Non-Scalar Artifacts +=================================== + +If you want to log anything that is not a scalar, like histograms, text, images, etc., you may need to use the logger object directly. + +.. code-block:: python + + def training_step(self): + ... + # the logger you used (in this case tensorboard) + tensorboard = self.logger.experiment + tensorboard.add_image() + tensorboard.add_histogram(...) + tensorboard.add_figure(...) + + +---------- + +******************** +Make a Custom Logger +******************** + +You can implement your own logger by writing a class that inherits from :class:`~lightning.pytorch.loggers.logger.Logger`. +Use the :func:`~lightning.pytorch.loggers.logger.rank_zero_experiment` and :func:`~lightning.pytorch.utilities.rank_zero.rank_zero_only` decorators to make sure that only the first process in DDP training creates the experiment and logs the data respectively. + +.. testcode:: + + from lightning.pytorch.loggers.logger import Logger, rank_zero_experiment + from lightning.pytorch.utilities import rank_zero_only + + + class MyLogger(Logger): + @property + def name(self): + return "MyLogger" + + @property + def version(self): + # Return the experiment version, int or str. 
+ return "0.1" + + @rank_zero_only + def log_hyperparams(self, params): + # params is an argparse.Namespace + # your code to record hyperparameters goes here + pass + + @rank_zero_only + def log_metrics(self, metrics, step): + # metrics is a dictionary of metric names and values + # your code to record metrics goes here + pass + + @rank_zero_only + def save(self): + # Optional. Any code necessary to save logger data goes here + pass + + @rank_zero_only + def finalize(self, status): + # Optional. Any code that needs to be run after training + # finishes goes here + pass + +If you write a logger that may be useful to others, please send +a pull request to add it to Lightning! + +---------- + +.. _logging_frequency: + + +************************* +Control Logging Frequency +************************* + +Logging frequency +================= + +It may slow down training to log on every single batch. By default, Lightning logs every 50 rows, or 50 training steps. +To change this behaviour, set the ``log_every_n_steps`` :class:`~lightning.pytorch.trainer.trainer.Trainer` flag. + +.. testcode:: + + k = 10 + trainer = Trainer(log_every_n_steps=k) + + +Log Writing Frequency +===================== + +Individual logger implementations determine their flushing frequency. For example, on the +:class:`~lightning.pytorch.loggers.csv_logs.CSVLogger` you can set the flag ``flush_logs_every_n_steps``. + +---------- + +************ +Progress Bar +************ + +You can add any metric to the progress bar using :meth:`~lightning.pytorch.core.module.LightningModule.log` +method, setting ``prog_bar=True``. + + +.. code-block:: python + + def training_step(self, batch, batch_idx): + self.log("my_loss", loss, prog_bar=True) + + +You could learn more about progress bars supported by Lightning :doc:`here <../common/progress_bar>`. 
+ +Modifying the Progress Bar +========================== + +The progress bar by default already includes the training loss and version number of the experiment +if you are using a logger. These defaults can be customized by overriding the +:meth:`~lightning.pytorch.callbacks.progress.progress_bar.ProgressBar.get_metrics` hook in your logger. + +.. code-block:: python + + from lightning.pytorch.callbacks.progress import TQDMProgressBar + + + class CustomProgressBar(TQDMProgressBar): + def get_metrics(self, *args, **kwargs): + # don't show the version number + items = super().get_metrics() + items.pop("v_num", None) + return items + + +---------- + + +************************* +Configure Console Logging +************************* + +Lightning logs useful information about the training process and user warnings to the console. +You can retrieve the Lightning console logger and change it to your liking. For example, adjust the logging level +or redirect output for certain modules to log files: + +.. testcode:: + + import logging + + # configure logging at the root level of Lightning + logging.getLogger("lightning.pytorch").setLevel(logging.ERROR) + + # configure logging on module level, redirect to file + logger = logging.getLogger("lightning.pytorch.core") + logger.addHandler(logging.FileHandler("core.log")) + +Read more about custom Python logging `here `_. + + +---------- + +*********************** +Logging Hyperparameters +*********************** + +When training a model, it is useful to know what hyperparams went into that model. +When Lightning creates a checkpoint, it stores a key ``"hyper_parameters"`` with the hyperparams. + +.. code-block:: python + + lightning_checkpoint = torch.load(filepath, map_location=lambda storage, loc: storage) + hyperparams = lightning_checkpoint["hyper_parameters"] + +Some loggers also allow logging the hyperparams used in the experiment. 
For instance, +when using the ``TensorBoardLogger``, all hyperparams will show +in the hparams tab at :meth:`torch.utils.tensorboard.writer.SummaryWriter.add_hparams`. + +.. note:: + If you want to track a metric in the tensorboard hparams tab, log scalars to the key ``hp_metric``. If tracking multiple metrics, initialize ``TensorBoardLogger`` with ``default_hp_metric=False`` and call ``log_hyperparams`` only once with your metric keys and initial values. Subsequent updates can simply be logged to the metric keys. Refer to the examples below for setting up proper hyperparams metrics tracking within the :doc:`LightningModule <../common/lightning_module>`. + + .. code-block:: python + + # Using default_hp_metric + def validation_step(self, batch, batch_idx): + self.log("hp_metric", some_scalar) + + + # Using custom or multiple metrics (default_hp_metric=False) + def on_train_start(self): + self.logger.log_hyperparams(self.hparams, {"hp/metric_1": 0, "hp/metric_2": 0}) + + + def validation_step(self, batch, batch_idx): + self.log("hp/metric_1", some_scalar_1) + self.log("hp/metric_2", some_scalar_2) + + In the example, using ``"hp/"`` as a prefix allows for the metrics to be grouped under "hp" in the tensorboard scalar tab where you can collapse them. + +----------- + +*************************** +Managing Remote Filesystems +*************************** + +Lightning supports saving logs to a variety of filesystems, including local filesystems and several cloud storage providers. + +Check out the :doc:`Remote Filesystems <../common/remote_fs>` doc for more info. 
diff --git a/source/extensions/plugins.rst b/docs/source-pytorch/extensions/plugins.rst similarity index 82% rename from source/extensions/plugins.rst rename to docs/source-pytorch/extensions/plugins.rst index 392a072..83d9f66 100644 --- a/source/extensions/plugins.rst +++ b/docs/source-pytorch/extensions/plugins.rst @@ -46,24 +46,19 @@ We provide precision plugins for you to benefit from numerical representations w The full list of built-in precision plugins is listed below. -.. currentmodule:: pytorch_lightning.plugins.precision +.. currentmodule:: lightning.pytorch.plugins.precision .. autosummary:: :nosignatures: :template: classtemplate.rst - ApexMixedPrecisionPlugin DeepSpeedPrecisionPlugin DoublePrecisionPlugin - FullyShardedNativeMixedPrecisionPlugin - HPUPrecisionPlugin - IPUPrecisionPlugin + FSDPMixedPrecisionPlugin MixedPrecisionPlugin - NativeMixedPrecisionPlugin PrecisionPlugin - ShardedNativeMixedPrecisionPlugin - TPUBf16PrecisionPlugin - TPUPrecisionPlugin + XLABf16PrecisionPlugin + XLAPrecisionPlugin More information regarding precision with Lightning can be found :ref:`here ` @@ -76,19 +71,19 @@ More information regarding precision with Lightning can be found :ref:`here
`. It can be controlled by passing different
+strategy with aliases (``"ddp"``, ``"ddp_spawn"``, ``"deepspeed"`` and so on) as well as a custom strategy to the ``strategy`` parameter for Trainer.
+
+The Strategy in PyTorch Lightning handles the following responsibilities:
+
+* Launch and tear down training processes (if applicable).
+* Set up communication between processes (NCCL, GLOO, MPI, and so on).
+* Provide a unified communication interface for reduction, broadcast, and so on.
+* Own the :class:`~lightning.pytorch.core.module.LightningModule`.
+* Handle/own optimizers and schedulers.
+
+
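+Strategy is a composition of one :doc:`Accelerator <../extensions/accelerator>`, one :ref:`Precision Plugin <extensions/plugins:Precision Plugins>`, a :ref:`CheckpointIO <extensions/plugins:CheckpointIO Plugins>`
+plugin and other optional plugins such as the :ref:`ClusterEnvironment <extensions/plugins:Cluster Environments>`.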
+
+.. image:: ../_static/fetched-s3-assets/overview.jpeg
+    :alt: Illustration of the Strategy as a composition of the Accelerator and several plugins
+
+We expose Strategies mainly for expert users who want to extend Lightning for new hardware support or new distributed backends (e.g. a backend not yet supported by `PyTorch <https://pytorch.org/docs/stable/distributed.html#backends>`_ itself).
+
+
+----
+
+*****************************
+Selecting a Built-in Strategy
+*****************************
+
+Built-in strategies can be selected in two ways.
+
+1. Pass the shorthand name to the ``strategy`` Trainer argument
+2. Import a Strategy from :mod:`lightning.pytorch.strategies`, instantiate it and pass it to the ``strategy`` Trainer argument
+
+The latter allows you to configure further options on the specific strategy.
+Here are some examples:
+
+.. code-block:: python
+
+    # Training with the DistributedDataParallel strategy on 4 GPUs
+    trainer = Trainer(strategy="ddp", accelerator="gpu", devices=4)
+
+    # Training with the DistributedDataParallel strategy on 4 GPUs, with options configured
+    trainer = Trainer(strategy=DDPStrategy(static_graph=True), accelerator="gpu", devices=4)
+
+    # Training with the DDP Spawn strategy using auto accelerator selection
+    trainer = Trainer(strategy="ddp_spawn", accelerator="auto", devices=4)
+
+    # Training with the DeepSpeed strategy on available GPUs
+    trainer = Trainer(strategy="deepspeed", accelerator="gpu", devices="auto")
+
+    # Training with the DDP strategy using 3 CPU processes
+    trainer = Trainer(strategy="ddp", accelerator="cpu", devices=3)
+
+    # Training with the DDP Spawn strategy on 8 TPU cores
+    trainer = Trainer(strategy="ddp_spawn", accelerator="tpu", devices=8)
+
+    # Training with the default IPU strategy on 8 IPUs
+    trainer = Trainer(accelerator="ipu", devices=8)
+
+The below table lists all relevant strategies available in Lightning with their corresponding short-hand name:
+
+.. list-table:: Strategy Classes and Nicknames
+   :widths: 20 20 20
+   :header-rows: 1
+
+   * - Name
+     - Class
+     - Description
+   * - fsdp
+     - :class:`~lightning.pytorch.strategies.FSDPStrategy`
+     - Strategy for Fully Sharded Data Parallel training. :ref:`Learn more. `
+   * - ddp
+     - :class:`~lightning.pytorch.strategies.DDPStrategy`
+     - Strategy for multi-process single-device training on one or multiple nodes. :ref:`Learn more. `
+   * - ddp_spawn
+     - :class:`~lightning.pytorch.strategies.DDPStrategy`
+     - Same as "ddp" but launches processes using :func:`torch.multiprocessing.spawn` method and joins processes after training finishes. :ref:`Learn more. `
+   * - deepspeed
+     - :class:`~lightning.pytorch.strategies.DeepSpeedStrategy`
+     - Provides capabilities to run training using the DeepSpeed library, with training optimizations for large billion parameter models. :ref:`Learn more. `
+   * - hpu_parallel
+     - ``HPUParallelStrategy``
+     - Strategy for distributed training on multiple HPU devices. :doc:`Learn more. <../integrations/hpu/index>`
+   * - hpu_single
+     - ``SingleHPUStrategy``
+     - Strategy for training on a single HPU device. :doc:`Learn more. <../integrations/hpu/index>`
+   * - ipu_strategy
+     - ``IPUStrategy``
+     - Strategy for training on IPU devices. :doc:`Learn more. <../accelerators/ipu>`
+   * - xla
+     - :class:`~lightning.pytorch.strategies.XLAStrategy`
+     - Strategy for training on multiple TPU devices using the :func:`torch_xla.distributed.xla_multiprocessing.spawn` method. :doc:`Learn more. <../accelerators/tpu>`
+   * - single_xla
+     - :class:`~lightning.pytorch.strategies.SingleXLAStrategy`
+     - Strategy for training on a single XLA device, like TPUs. :doc:`Learn more. <../accelerators/tpu>`
+
+----
+
+
+**********************
+Third-party Strategies
+**********************
+
+There are powerful third-party strategies that integrate well with Lightning but aren't maintained as part of the ``lightning`` package.
+
+.. list-table:: List of third-party strategy implementations
+   :widths: 20 20 20
+   :header-rows: 1
+
+   * - Name
+     - Package
+     - Description
+   * - ColossalAI
+     - `Lightning-AI/lightning-colossalai `_
+     - Colossal-AI provides a collection of parallel components for you. It aims to support you to write your distributed deep learning models just like how you write your model on your laptop. `Learn more. `__
+   * - Bagua
+     - `Lightning-AI/lightning-Bagua `_
+     - Bagua is a deep learning training acceleration framework for PyTorch, with advanced distributed training algorithms and system optimizations. `Learn more. `__
+   * - hivemind
+     - `Lightning-AI/lightning-hivemind `_
+     - Hivemind is a PyTorch library for decentralized deep learning across the Internet. Its intended usage is training one large model on hundreds of computers from different universities, companies, and volunteers. `Learn more. `__
+
+
+----
+
+
+************************
+Create a Custom Strategy
+************************
+
+Every strategy in Lightning is a subclass of one of the main base classes: :class:`~lightning.pytorch.strategies.Strategy`, :class:`~lightning.pytorch.strategies.SingleDeviceStrategy` or :class:`~lightning.pytorch.strategies.ParallelStrategy`.
+
+.. image:: ../_static/fetched-s3-assets/hierarchy.jpeg
+    :alt: Strategy base classes
+
+As an expert user, you may choose to extend either an existing built-in Strategy or create a completely new one by
+subclassing the base classes.
+
+.. code-block:: python
+
+    from lightning.pytorch.strategies import DDPStrategy
+
+
+    class CustomDDPStrategy(DDPStrategy):
+        def configure_ddp(self):
+            self.model = MyCustomDistributedDataParallel(
+                self.model,
+                device_ids=...,
+            )
+
+        def setup(self, trainer):
+            # you can access the accelerator and plugins directly
+            self.accelerator.setup()
+            self.precision_plugin.connect(...)
+
+
+The custom strategy can then be passed into the ``Trainer`` directly via the ``strategy`` parameter.
+
+.. code-block:: python
+
+    # custom strategy
+    trainer = Trainer(strategy=CustomDDPStrategy())
+
+
+Since the strategy also hosts the Accelerator and various plugins, you can customize all of them to work together as you like:
+
+.. code-block:: python
+
+    # custom strategy, with new accelerator and plugins
+    accelerator = MyAccelerator()
+    precision_plugin = MyPrecisionPlugin()
+    strategy = CustomDDPStrategy(accelerator=accelerator, precision_plugin=precision_plugin)
+    trainer = Trainer(strategy=strategy)
diff --git a/docs/source-pytorch/generated/CHANGELOG.md b/docs/source-pytorch/generated/CHANGELOG.md
new file mode 100644
index 0000000..0d01829
--- /dev/null
+++ b/docs/source-pytorch/generated/CHANGELOG.md
@@ -0,0 +1,7 @@
+# Changelog
+
+이 프로젝트의 모든 주요한 변경 사항은 이 파일에 문서화됩니다.
+하지만, 한국어 번역에서는 최신 버전을 반영하지 못할 수 있으므로, [원본 문서](https://lightning.ai/docs/pytorch/stable/generated/CHANGELOG.html)를 참고해주세요.
+
+> All notable changes to this project will be documented in this file.
+> However, the Korean site may not reflect the latest version, so please refer to the [original documentation](https://lightning.ai/docs/pytorch/stable/generated/CHANGELOG.html).
\ No newline at end of file
diff --git a/docs/source-pytorch/glossary/index.rst b/docs/source-pytorch/glossary/index.rst
new file mode 100644
index 0000000..94a042b
--- /dev/null
+++ b/docs/source-pytorch/glossary/index.rst
@@ -0,0 +1,331 @@
+
+.. toctree::
+   :maxdepth: 1
+   :hidden:
+
+   Accelerators <../extensions/accelerator>
+   Callback <../extensions/callbacks>
+   Checkpointing <../common/checkpointing>
+   Cluster <../clouds/cluster>
+   Cloud checkpoint <../common/checkpointing_advanced>
+   Console Logging <../common/console_logs>
+   Debugging <../debug/debugging>
+   Early stopping <../common/early_stopping>
+   Experiment manager (Logger) <../visualize/experiment_managers>
+   Finetuning <../advanced/finetuning>
+   GPU <../accelerators/gpu>
+   Half precision <../common/precision>
+   HPU <../integrations/hpu/index>
+   Inference <../deploy/production_intermediate>
+   IPU <../accelerators/ipu>
+   Lightning CLI <../cli/lightning_cli>
+   LightningDataModule <../data/datamodule>
+   LightningModule <../common/lightning_module>
+   Log <../visualize/loggers>
+   TPU <../accelerators/tpu>
+   Metrics <https://torchmetrics.readthedocs.io/en/stable/>
+   Model <../model/build_model.rst>
+   Model Parallel <../advanced/model_parallel>
+   Plugins <../extensions/plugins>
+   Progress bar <../common/progress_bar>
+   Production <../deploy/production_advanced>
+   Predict <../deploy/production_basic>
+   Pretrained models <../advanced/pretrained>
+   Profiler <../tuning/profiler>
+   Pruning and Quantization <../advanced/pruning_quantization>
+   Remote filesystem and FSSPEC <../common/remote_fs>
+   Strategy <../extensions/strategy>
+   Strategy registry <../advanced/strategy_registry>
+   Style guide <../starter/style_guide>
+   SWA <../advanced/training_tricks>
+   SLURM <../clouds/cluster_advanced>
+   Transfer learning <../advanced/transfer_learning>
+   Trainer <../common/trainer>
+   Torch distributed <../clouds/cluster_intermediate_2>
+
+########
+Glossary
+########
+
+.. raw:: html
+
+    
+
+ +.. displayitem:: + :header: Accelerators + :description: Accelerators connect the Trainer to hardware to train faster + :col_css: col-md-12 + :button_link: ../extensions/accelerator.html + :height: 100 + +.. displayitem:: + :header: Callback + :description: Add self-contained extra functionality during training execution + :col_css: col-md-12 + :button_link: ../extensions/callbacks.html + :height: 100 + +.. displayitem:: + :header: Checkpointing + :description: Save and load progress with checkpoints + :col_css: col-md-12 + :button_link: ../common/checkpointing.html + :height: 100 + +.. displayitem:: + :header: Cluster + :description: Run on your own group of servers + :col_css: col-md-12 + :button_link: ../clouds/cluster.html + :height: 100 + +.. displayitem:: + :header: Cloud checkpoint + :description: Save your models to cloud filesystems + :col_css: col-md-12 + :button_link: ../common/checkpointing_advanced.html + :height: 100 + +.. displayitem:: + :header: Console Logging + :description: Capture more visible logs + :col_css: col-md-12 + :button_link: ../common/console_logs.html + :height: 100 + +.. displayitem:: + :header: Debugging + :description: Fix errors in your code + :col_css: col-md-12 + :button_link: ../debug/debugging.html + :height: 100 + +.. displayitem:: + :header: Early stopping + :description: Stop the training when no improvement is observed + :col_css: col-md-12 + :button_link: ../common/early_stopping.html + :height: 100 + +.. displayitem:: + :header: Experiment manager (Logger) + :description: Tools for tracking and visualizing artifacts and logs + :col_css: col-md-12 + :button_link: ../visualize/experiment_managers.html + :height: 100 + +.. displayitem:: + :header: Finetuning + :description: Technique for training pretrained models + :col_css: col-md-12 + :button_link: ../advanced/finetuning.html + :height: 100 + +.. 
displayitem:: + :header: GPU + :description: Graphics Processing Unit for faster training + :col_css: col-md-12 + :button_link: ../accelerators/gpu.html + :height: 100 + +.. displayitem:: + :header: Half precision + :description: Using different numerical formats to save memory and run faster + :col_css: col-md-12 + :button_link: ../common/precision.html + :height: 100 + +.. displayitem:: + :header: HPU + :description: Habana Gaudi AI Processor Unit for faster training + :col_css: col-md-12 + :button_link: ../integrations/hpu/index.html + :height: 100 + +.. displayitem:: + :header: Inference + :description: Making predictions by applying a trained model to unlabeled examples + :col_css: col-md-12 + :button_link: ../deploy/production_intermediate.html + :height: 100 + +.. displayitem:: + :header: IPU + :description: Graphcore Intelligence Processing Unit for faster training + :col_css: col-md-12 + :button_link: ../accelerators/ipu.html + :height: 100 + +.. displayitem:: + :header: Lightning CLI + :description: A Command-line Interface (CLI) to interact with Lightning code via a terminal + :col_css: col-md-12 + :button_link: ../cli/lightning_cli.html + :height: 100 + +.. displayitem:: + :header: LightningDataModule + :description: A shareable, reusable class that encapsulates all the steps needed to process data + :col_css: col-md-12 + :button_link: ../data/datamodule.html + :height: 100 + +.. displayitem:: + :header: LightningModule + :description: A base class organizing your neural network module + :col_css: col-md-12 + :button_link: ../common/lightning_module.html + :height: 100 + +.. displayitem:: + :header: Log + :description: Outputs or results used for visualization and tracking + :col_css: col-md-12 + :button_link: ../visualize/loggers.html + :height: 100 + +.. 
displayitem:: + :header: Metrics + :description: A statistic used to measure performance or other objectives we want to optimize + :col_css: col-md-12 + :button_link: https://torchmetrics.readthedocs.io/en/stable/ + :height: 100 + +.. displayitem:: + :header: Model + :description: The set of parameters and structure for a system to make predictions + :col_css: col-md-12 + :button_link: ../model/build_model.html + :height: 100 + +.. displayitem:: + :header: Model Parallelism + :description: A way to scale training that splits a model between multiple devices. + :col_css: col-md-12 + :button_link: ../advanced/model_parallel.html + :height: 100 + +.. displayitem:: + :header: Plugins + :description: Custom trainer integrations such as custom precision, checkpointing or cluster environment implementation + :col_css: col-md-12 + :button_link: ../extensions/plugins.html + :height: 100 + +.. displayitem:: + :header: Progress bar + :description: Output printed to the terminal to visualize the progression of training + :col_css: col-md-12 + :button_link: ../common/progress_bar.html + :height: 100 + +.. displayitem:: + :header: Production + :description: Using ML models in real world systems + :col_css: col-md-12 + :button_link: ../deploy/production_advanced.html + :height: 100 + +.. displayitem:: + :header: Prediction + :description: Computing a model's output + :col_css: col-md-12 + :button_link: ../deploy/production_basic.html + :height: 100 + +.. displayitem:: + :header: Pretrained models + :description: Models that have already been trained for a particular task + :col_css: col-md-12 + :button_link: ../advanced/pretrained.html + :height: 100 + +.. displayitem:: + :header: Profiler + :description: Tool to identify bottlenecks and performance of different parts of a model + :col_css: col-md-12 + :button_link: ../tuning/profiler.html + :height: 100 + +.. 
displayitem:: + :header: Pruning + :description: A technique to eliminate some of the model weights to reduce the model size and decrease inference requirements + :col_css: col-md-12 + :button_link: ../advanced/pruning_quantization.html + :height: 100 + +.. displayitem:: + :header: Quantization + :description: A technique to accelerate the model inference speed and decrease the memory load while still maintaining the model accuracy + :col_css: col-md-12 + :button_link: ../advanced/post_training_quantization.html + :height: 100 + +.. displayitem:: + :header: Remote filesystem and FSSPEC + :description: Accessing files from cloud storage providers + :col_css: col-md-12 + :button_link: ../common/remote_fs.html + :height: 100 + +.. displayitem:: + :header: Strategy + :description: Ways the trainer controls the model distribution across training, evaluation, and prediction + :col_css: col-md-12 + :button_link: ../extensions/strategy.html + :height: 100 + +.. displayitem:: + :header: Strategy registry + :description: A class that holds information about training strategies and allows adding new custom strategies + :col_css: col-md-12 + :button_link: ../advanced/strategy_registry.html + :height: 100 + +.. displayitem:: + :header: Style guide + :description: Best practices to improve readability and reproducibility + :col_css: col-md-12 + :button_link: ../starter/style_guide.html + :height: 100 + +.. displayitem:: + :header: SWA + :description: Stochastic Weight Averaging (SWA) can make your models generalize better + :col_css: col-md-12 + :button_link: ../advanced/training_tricks.html#stochastic-weight-averaging + :height: 100 + +.. displayitem:: + :header: SLURM + :description: Simple Linux Utility for Resource Management, or simply Slurm, is a free and open-source job scheduler for Linux clusters + :col_css: col-md-12 + :button_link: ../clouds/cluster_advanced.html + :height: 100 + +.. 
displayitem:: + :header: Transfer learning + :description: Using pre-trained models to improve learning + :col_css: col-md-12 + :button_link: ../advanced/transfer_learning.html + :height: 100 + +.. displayitem:: + :header: Trainer + :description: The class that automates and customizes model training + :col_css: col-md-12 + :button_link: ../common/trainer.html + :height: 100 + +.. displayitem:: + :header: Torch distributed + :description: Setup for running on distributed environments + :col_css: col-md-12 + :button_link: ../clouds/cluster_intermediate_2.html + :height: 100 + +.. raw:: html + +
+
diff --git a/docs/source-pytorch/index.rst b/docs/source-pytorch/index.rst new file mode 100644 index 0000000..e2b6501 --- /dev/null +++ b/docs/source-pytorch/index.rst @@ -0,0 +1,200 @@ +⚡ PyTorch Lightning에 오신 것을 환영합니다! +======================================== + +.. twocolumns:: + :left: + .. image:: _static/fetched-s3-assets/mov.gif + :alt: Animation showing how to convert standard training code to Lightning + :right: + PyTorch Lightning(파이토치 라이트닝)은 대규모에서 성능을 포기하지 않으면서 최대한의 유연성을 필요로 하는 전문적인 AI 연구자들과 머신러닝 엔지니어들을 위한 딥러닝 프레임워크입니다. + Lightning(라이트닝)은 프로젝트가 생각으로부터 문서 / 제품화에 이르는 동안 함께 발전합니다. + +.. raw:: html + +
+
+
+
+ +.. raw:: html + +
+
+ + +.. raw:: html + +
+ + +Lightning 설치하기 +---------------------- + + +.. raw:: html + +
+
+ +Pip 사용자라면, + +.. code-block:: bash + + pip install lightning + +.. raw:: html + +
+
+ +Conda 사용자라면, + +.. code-block:: bash + + conda install lightning -c conda-forge + +.. raw:: html + +
+
+ +또는 `advanced install guide `_ 참조하세요. + +지원하는 PyTorch 버전은 :ref:`compatibility matrix ` 에서 확인할 수 있습니다. + +.. raw:: html + +
+ +처음이신가요? +----------- + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. customcalloutitem:: + :description: Learn the 7 key steps of a typical Lightning workflow. + :header: Lightning in 15 minutes + :button_link: starter/introduction.html + +.. customcalloutitem:: + :description: Learn how to benchmark PyTorch Lightning. + :header: Benchmarking + :button_link: benchmarking/benchmarks.html + +.. raw:: html + +
+
+ +.. End of callout item section + +.. raw:: html + +
+ +이미 Lightning 사용자라면? +----------------------- + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. customcalloutitem:: + :description: Learn Lightning in small bites at 4 levels of expertise: Introductory, intermediate, advanced and expert. + :header: Level Up! + :button_link: expertise_levels.html + +.. customcalloutitem:: + :description: Detailed description of the API of each package. Assumes you already have basic Lightning knowledge. + :header: API Reference + :button_link: api_references.html + +.. customcalloutitem:: + :description: From NLP, Computer vision to RL and meta learning - see how to use Lightning in ALL research areas. + :header: Hands-on Examples + :button_link: tutorials.html + +.. customcalloutitem:: + :description: Learn how to do everything from hyperparameter sweeps to cloud training to Pruning and Quantization with Lightning. + :header: Common Workflows + :button_link: common_usecases.html + +.. customcalloutitem:: + :description: Convert your current code to Lightning + :header: Convert code to PyTorch Lightning + :button_link: starter/converting.html + + +.. raw:: html + +
+
+ +.. End of callout item section + +.. raw:: html + +
+ +.. toctree:: + :maxdepth: 1 + :name: start + :caption: Home + + starter/introduction + Install + upgrade/migration_guide + + +.. toctree:: + :maxdepth: 2 + :name: levels + :caption: Level Up + + levels/core_skills + levels/intermediate + levels/advanced + levels/expert + +.. toctree:: + :maxdepth: 1 + :name: pl_docs + :caption: Core API + + common/lightning_module + common/trainer + +.. toctree:: + :maxdepth: 1 + :name: api + :caption: Optional API + + api_references + +.. toctree:: + :maxdepth: 1 + :name: More + :caption: More + + Community + Examples + Glossary + How to + + +.. raw:: html + +
+ +.. PyTorch-Lightning documentation master file, created by + sphinx-quickstart on Fri Nov 15 07:48:22 2019. + You can adapt this file completely to your liking, but it should at least + contain the root `toctree` directive. diff --git a/docs/source-pytorch/integrations/hpu/advanced.rst b/docs/source-pytorch/integrations/hpu/advanced.rst new file mode 100644 index 0000000..a3b34c4 --- /dev/null +++ b/docs/source-pytorch/integrations/hpu/advanced.rst @@ -0,0 +1,140 @@ +:orphan: + +.. _hpu_advanced: + +Accelerator: HPU Training +========================= +This document offers instructions to Gaudi chip users who want to use advanced strategies and profile HPUs. + +---- + +Using HPUProfiler +----------------- + +HPUProfiler is a Lightning implementation of PyTorch profiler for HPU. It aids in obtaining a profiling summary of PyTorch functions. +It subclasses PyTorch Lightning's `PyTorch profiler `_. + +Default Profiling +^^^^^^^^^^^^^^^^^^ +For auto profiling, create an ``HPUProfiler`` instance and pass it to the trainer. +At the end of ``trainer.fit()``, it will generate a JSON trace for the run. +In case ``accelerator=HPUAccelerator()`` is not used with ``HPUProfiler``, it will dump only CPU traces, similar to ``PyTorchProfiler``. + +.. code-block:: python + + from lightning import Trainer + from lightning_habana.pytorch.accelerator import HPUAccelerator + from lightning_habana.pytorch.profiler.profiler import HPUProfiler + + trainer = Trainer(accelerator=HPUAccelerator(), profiler=HPUProfiler()) + +Distributed Profiling +^^^^^^^^^^^^^^^^^^^^^^ + +To profile a distributed model, use ``HPUProfiler`` with the filename argument which will save a report per rank. + +.. 
code-block:: python + + from pytorch_lightning import Trainer + from lightning_habana.pytorch.accelerator import HPUAccelerator + from lightning_habana.pytorch.profiler.profiler import HPUProfiler + + profiler = HPUProfiler(filename="perf-logs") + trainer = Trainer(profiler=profiler, accelerator=HPUAccelerator()) + +Custom Profiling +^^^^^^^^^^^^^^^^^ + +To `profile custom actions of interest `_, +reference a profiler in the ``LightningModule``. + +.. code-block:: python + + from pytorch_lightning import Trainer + from lightning_habana.pytorch.accelerator import HPUAccelerator + from lightning_habana.pytorch.profiler.profiler import HPUProfiler + + # Reference profiler in LightningModule + class MyModel(LightningModule): + def __init__(self, profiler=None): + self.profiler = profiler + + # To profile in any part of your code, use the self.profiler.profile() function + def custom_processing_step_basic(self, data): + with self.profiler.profile("my_custom_action"): + print("do somthing") + return data + + # Alternatively, use self.profiler.start("my_custom_action") + # and self.profiler.stop("my_custom_action") functions + # to enclose the part of code to be profiled. + def custom_processing_step_granular(self, data): + self.profiler.start("my_custom_action") + print("do somthing") + self.profiler.stop("my_custom_action") + return data + + # Pass profiler instance to LightningModule + profiler = HPUProfiler() + model = MyModel(profiler) + trainer = Trainer(accelerator=HPUAccelerator(), profiler=profiler) + +For more details on Profiler, refer to `PyTorchProfiler `_ + +Visualizing Profiled Operations +^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + +Profiler dumps traces in JSON format. The traces can be visualized in 2 ways as described below. + +Using PyTorch TensorBoard Profiler +"""""""""""""""""""""""""""""""""" + +For further instructions see, https://github.com/pytorch/kineto/tree/master/tb_plugin. + +1. Install tensorboard + +.. 
code-block:: bash + + python -um pip install tensorboard torch-tb-profiler + +2. Start the TensorBoard server (default at port 6006) + +.. code-block:: bash + + tensorboard --logdir ./tensorboard --port 6006 + +3. Open the following URL in your browser: `http://localhost:6006/#profile`. + +Using Chrome +""""""""""""" + + 1. Open Chrome and paste this URL: `chrome://tracing/`. + 2. Once tracing opens, click on `Load` at the top-right and load one of the generated traces. + +Limitations +^^^^^^^^^^^^ + +- When using ``HPUProfiler``, wall clock time will not be representative of the true wall clock time. This is due to forcing profiled operations to be measured synchronously, when many HPU ops happen asynchronously. + It is recommended to use this Profiler to find bottlenecks/breakdowns, however for end to end wall clock time use the ``SimpleProfiler``. + +- ``HPUProfiler.summary()`` is not supported. + +- Passing the Profiler name as a string "hpu" to the trainer is not supported. + +---- + +Using DeepSpeed +------------------------ + +HPU supports advanced strategies like ``deepspeed``. By default, HPU training uses 32-bit precision. +To enable mixed precision, set the ``precision`` flag. + +.. code-block:: python + + from lightning.pytorch.plugins import DeepSpeedPrecisionPlugin + from lightning_habana.pytorch.accelerator import HPUAccelerator + from lightning_habana.pytorch.strategies import HPUDeepSpeedStrategy + + trainer = Trainer(devices=8, accelerator=HPUAccelerator(), strategy=HPUDeepSpeedStrategy(), plugins=[DeepSpeedPrecisionPlugin(precision="bf16-mixed")]) + +For further details on the supported DeepSpeed features and functionalities, refer to `Using Deepspeed with HPU `_. diff --git a/docs/source-pytorch/integrations/hpu/basic.rst b/docs/source-pytorch/integrations/hpu/basic.rst new file mode 100644 index 0000000..58f6c8d --- /dev/null +++ b/docs/source-pytorch/integrations/hpu/basic.rst @@ -0,0 +1,112 @@ +:orphan: + +.. 
_hpu_basics: + +Accelerator: HPU training +========================= +**Audience:** Users looking to save money and run large models faster using single or multiple Gaudi devices. + +---- + +What is an HPU? +--------------- + +`Habana® Gaudi® AI Processor (HPU) `__ training processors are built on a heterogeneous architecture with a cluster of fully programmable Tensor Processing Cores (TPC) along with its associated development tools and libraries, and a configurable Matrix Math engine. + +The TPC core is a VLIW SIMD processor with an instruction set and hardware tailored to serve training workloads efficiently. +The Gaudi memory architecture includes on-die SRAM and local memories in each TPC, and +Gaudi is the first DL training processor that has integrated RDMA over Converged Ethernet (RoCE v2) engines on-chip. + +On the software side, the PyTorch Habana bridge interfaces between the framework and SynapseAI software stack to enable the execution of deep learning models on the Habana Gaudi device. + +Gaudi offers a substantial price/performance advantage -- so you get to do more deep learning training while spending less. + +For more information, check out `Gaudi Architecture `__ and `Gaudi Developer Docs `__. + +---- + +Run on Gaudi +------------ + +To enable PyTorch Lightning to utilize the HPU accelerator, simply provide the ``accelerator=HPUAccelerator()`` parameter to the Trainer class. + +.. 
code-block:: python + + from lightning_habana.pytorch.accelerator import HPUAccelerator + + # run on as many Gaudi devices as available by default + trainer = Trainer(accelerator="auto", devices="auto", strategy="auto") + # equivalent to + trainer = Trainer() + + # run on one Gaudi device + trainer = Trainer(accelerator=HPUAccelerator(), devices=1) + # run on multiple Gaudi devices + trainer = Trainer(accelerator=HPUAccelerator(), devices=8) + # choose the number of devices automatically + trainer = Trainer(accelerator=HPUAccelerator(), devices="auto") + + +The ``devices=1`` parameter with HPUs enables the Habana accelerator for single card training. +It uses :class:`~lightning_habana.pytorch.strategies.SingleHPUStrategy`. + +The ``devices>1`` parameter with HPUs enables the Habana accelerator for distributed training. +It uses :class:`~lightning_habana.pytorch.strategies.HPUParallelStrategy` which is based on DDP +strategy with the addition of Habana's collective communication library (HCCL) to support scale-up within a node and +scale-out across multiple nodes. + +.. note:: + accelerator="auto" or accelerator="hpu" is not yet enabled with lightning>2.0.0 and lightning-habana. + However passing class object :class:`HPUAccelerator()` is supported. + +---- + +Scale-out on Gaudis +------------------- + +To train a Lightning model using multiple HPU nodes, set the ``num_nodes`` parameter with the available nodes in the ``Trainer`` class. + +.. code-block:: python + + from lightning_habana.pytorch.accelerator import HPUAccelerator + from lightning_habana.pytorch.strategies import HPUParallelStrategy + + hpus = 8 + parallel_hpus = [torch.device("hpu")] * hpus + trainer = Trainer(accelerator=HPUAccelerator(), devices=hpus, strategy=HPUParallelStrategy(parallel_devices=parallel_hpus), num_nodes=2) + +In addition to this, the following environment variables need to be set to establish communication across nodes. 
+ +- *MASTER_PORT* - required; has to be a free port on machine with NODE_RANK 0 +- *MASTER_ADDR* - required (except for NODE_RANK 0); address of NODE_RANK 0 node +- *WORLD_SIZE* - required; how many workers are in the cluster +- *NODE_RANK* - required; id of the node in the cluster + +The trainer needs to be instantiated on every node participating in the training. + +On Node 1: + +.. code-block:: bash + + MASTER_ADDR= MASTER_PORT= NODE_RANK=0 WORLD_SIZE=16 + python -m some_model_trainer.py (--arg1 ... train script args...) + +On Node 2: + +.. code-block:: bash + + MASTER_ADDR= MASTER_PORT= NODE_RANK=1 WORLD_SIZE=16 + python -m some_model_trainer.py (--arg1 ... train script args...) + +---- + +How to access HPUs +------------------ + +To use HPUs, you must have access to a system with HPU devices. + +AWS +^^^ +You can either use `Gaudi-based AWS EC2 DL1 instances `__ or `Supermicro X12 Gaudi server `__ to get access to HPUs. + +Check out the `PyTorch Model on AWS DL1 Instance Quick Start `__. diff --git a/docs/source-pytorch/integrations/hpu/index.rst b/docs/source-pytorch/integrations/hpu/index.rst new file mode 100644 index 0000000..2f8607d --- /dev/null +++ b/docs/source-pytorch/integrations/hpu/index.rst @@ -0,0 +1,40 @@ +.. _hpu: + +Accelerator: HPU training +========================= + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: Basic + :description: Learn the basics of single and multi-HPU core training. + :col_css: col-md-4 + :button_link: basic.html + :height: 150 + :tag: basic + +.. displayitem:: + :header: Intermediate + :description: Enable state-of-the-art scaling with advanced mixed-precision settings. + :col_css: col-md-4 + :button_link: intermediate.html + :height: 150 + :tag: intermediate + +.. displayitem:: + :header: Advanced + :description: Explore state-of-the-art scaling with additional advanced configurations. + :col_css: col-md-4 + :button_link: advanced.html + :height: 150 + :tag: advanced + +.. raw:: html + +
+
diff --git a/docs/source-pytorch/integrations/hpu/intermediate.rst b/docs/source-pytorch/integrations/hpu/intermediate.rst new file mode 100644 index 0000000..b5b1565 --- /dev/null +++ b/docs/source-pytorch/integrations/hpu/intermediate.rst @@ -0,0 +1,116 @@ +:orphan: + +.. _hpu_intermediate: + +Accelerator: HPU Training +========================= +This document offers instructions to Gaudi chip users who want to conserve memory and scale models using mixed-precision training. + +---- + +Enable Mixed Precision +---------------------- + +With Lightning, you can leverage mixed precision training on HPUs. By default, HPU training +uses 32-bit precision. To enable mixed precision, set the ``precision`` flag. + +.. code-block:: python + + from lightning_habana.pytorch.accelerator import HPUAccelerator + + trainer = Trainer(devices=1, accelerator=HPUAccelerator(), precision="bf16-mixed") + +---- + +Customize Mixed Precision +------------------------- + +Internally, :class:`~lightning_habana.pytorch.plugins.precision.HPUPrecisionPlugin` uses the Habana Mixed Precision (HMP) package to enable mixed precision training. + +You can execute the ops in FP32 or BF16 precision. The HMP package modifies the Python operators to add the appropriate cast operations for the arguments before execution. +With the default settings, you can easily enable mixed precision training with minimal code. + +In addition to the default settings in HMP, you can choose to override these defaults and provide your own BF16 and FP32 operator lists by passing them as parameters +to :class:`~lightning_habana.pytorch.plugins.precision.HPUPrecisionPlugin`. + +The following is an excerpt from an MNIST example implemented on a single HPU. + +.. 
code-block:: python + + import pytorch_lightning as pl + from lightning_habana.pytorch.accelerator import HPUAccelerator + from lightning_habana.pytorch.plugins.precision import HPUPrecisionPlugin + + # Initialize a trainer with HPU accelerator for HPU strategy for single device, + # with mixed precision using overridden HMP settings + trainer = pl.Trainer( + accelerator=HPUAccelerator(), + devices=1, + # Optional Habana mixed precision params to be set + # Check out `examples/pl_hpu/ops_bf16_mnist.txt` for the format + plugins=[ + HPUPrecisionPlugin( + precision="bf16-mixed", + opt_level="O1", + verbose=False, + bf16_file_path="ops_bf16_mnist.txt", + fp32_file_path="ops_fp32_mnist.txt", + ) + ], + ) + + # Init our model + model = LitClassifier() + # Init the data + dm = MNISTDataModule(batch_size=batch_size) + + # Train the model ⚡ + trainer.fit(model, datamodule=dm) + +For more details, please refer to `PyTorch Mixed Precision Training on Gaudi `__. + +---- + +Enabling DeviceStatsMonitor with HPUs +---------------------------------------- + +:class:`~pytorch_lightning.callbacks.device_stats_monitor.DeviceStatsMonitor` is a callback that automatically monitors and logs device stats during the training stage. +This callback can be passed for training with HPUs. It returns a map of the following metrics with their values in bytes of type uint64: + ++-------------------+---------------------------------------------+ +| Metric | Value | ++===================+=============================================+ +| Limit | Amount of total memory on HPU. | ++-------------------+---------------------------------------------+ +| InUse | Amount of allocated memory at any instance. | ++-------------------+---------------------------------------------+ +| MaxInUse | Amount of total active memory allocated. | ++-------------------+---------------------------------------------+ +| NumAllocs | Number of allocations. 
| ++-------------------+---------------------------------------------+ +| NumFrees | Number of freed chunks. | ++-------------------+---------------------------------------------+ +| ActiveAllocs | Number of active allocations. | ++-------------------+---------------------------------------------+ +| MaxAllocSize | Maximum allocated size. | ++-------------------+---------------------------------------------+ +| TotalSystemAllocs | Total number of system allocations. | ++-------------------+---------------------------------------------+ +| TotalSystemFrees | Total number of system frees. | ++-------------------+---------------------------------------------+ +| TotalActiveAllocs | Total number of active allocations. | ++-------------------+---------------------------------------------+ + + +The example below shows how ``DeviceStatsMonitor`` can be enabled. + +.. code-block:: python + + from pytorch_lightning import Trainer + from pytorch_lightning.callbacks import DeviceStatsMonitor + from lightning_habana.pytorch.accelerator import HPUAccelerator + + device_stats = DeviceStatsMonitor() + trainer = Trainer(accelerator=HPUAccelerator(), callbacks=[device_stats]) + +For more details, please refer to `Memory Stats APIs `__. diff --git a/docs/source-pytorch/integrations/strategies/bagua.rst b/docs/source-pytorch/integrations/strategies/bagua.rst new file mode 100644 index 0000000..60214f8 --- /dev/null +++ b/docs/source-pytorch/integrations/strategies/bagua.rst @@ -0,0 +1,53 @@ +:orphan: + +##### +Bagua +##### + +The `Bagua strategy `_ speeds up PyTorch training from a single node to large scale. +Bagua is a deep learning training acceleration framework for PyTorch, with advanced distributed training algorithms and system optimizations. +Bagua currently supports: + +- **Advanced Distributed Training Algorithms**: Users can extend the training on a single GPU to multi-GPUs (possibly across multiple machines) by simply adding a few lines of code (optionally in `elastic mode `_). 
One prominent feature of Bagua is to provide a flexible system abstraction that supports state-of-the-art system relaxation techniques of distributed training. So far, Bagua has integrated communication primitives including + + - Centralized Synchronous Communication (e.g. `Gradient AllReduce `_) + + - Decentralized Synchronous Communication (e.g. `Decentralized SGD `_) + + - Low Precision Communication (e.g. `ByteGrad `_) + + - Asynchronous Communication (e.g. `Async Model Average `_) +- `Cached Dataset `_: When samples in a dataset need tedious preprocessing, or reading the dataset itself is slow, they could become a major bottleneck of the whole training process. Bagua provides a cached dataset to speed up this process by caching data samples in memory, so that reading these samples after the first time can be much faster. +- `TCP Communication Acceleration (Bagua-Net) `_: Bagua-Net is a low-level communication acceleration feature provided by Bagua. It can greatly improve the throughput of AllReduce on TCP networks. You can enable Bagua-Net optimization on any distributed training job that uses NCCL to do GPU communication (this includes PyTorch-DDP, Horovod, DeepSpeed, and more). +- `Performance Autotuning `_: Bagua can automatically tune system parameters to achieve the highest throughput. +- `Generic Fused Optimizer `_: Bagua provides a generic fused optimizer, which improves the performance of optimizers by fusing the optimizer `.step()` operation on multiple layers. It can be applied to any PyTorch optimizer, in contrast to `NVIDIA Apex `_'s approach, where only some specific optimizers are implemented. 
+- `Load Balanced Data Loader `_: When the computational complexity of samples in the training data differs, for example in NLP and speech tasks, where each sample has a different length, distributed training throughput can be greatly improved by using Bagua's load balanced data loader, which distributes samples in such a way that each worker's workload is similar. + +You can install the Bagua integration by running + +.. code-block:: bash + + pip install lightning-bagua + +This will install both the `bagua `_ package as well as the ``BaguaStrategy`` for the Lightning Trainer: + +.. code-block:: python + + trainer = Trainer(strategy="bagua", accelerator="gpu", devices=...) + + +You can tune several settings by instantiating the strategy object and passing options in: + +.. code-block:: python + + from lightning_bagua import BaguaStrategy + + strategy = BaguaStrategy(algorithm="bytegrad") + trainer = Trainer(strategy=strategy, accelerator="gpu", devices=...) + + +.. note:: + + * Bagua is only supported on Linux systems with GPU(s). + +See `Bagua Tutorials `_ for more details on installation and advanced features. diff --git a/docs/source-pytorch/integrations/strategies/colossalai.rst b/docs/source-pytorch/integrations/strategies/colossalai.rst new file mode 100644 index 0000000..2165673 --- /dev/null +++ b/docs/source-pytorch/integrations/strategies/colossalai.rst @@ -0,0 +1,112 @@ +:orphan: + +########### +Colossal-AI +########### + +The `Colossal-AI strategy `_ implements ZeRO-DP with chunk-based memory management. +With this chunk mechanism, really large models can be trained with a small number of GPUs. +It supports larger trainable model size and batch size than usual heterogeneous training by reducing CUDA memory fragments and CPU memory consumption. +Also, it speeds up this kind of heterogeneous training by fully utilizing all kinds of resources. + +.. warning:: This is an :ref:`experimental ` feature. 
+ +When the chunk mechanism is enabled, a set of consecutive parameters is stored in a chunk, and then the chunk is sharded across different processes. +This can reduce communication and data transmission frequency and fully utilize communication and PCI-E bandwidth, which makes training faster. + +Unlike traditional implementations, which adopt static memory partition, we implemented a dynamic heterogeneous memory management system named Gemini. +During the first training step, the warmup phase will sample the maximum non-model data memory (memory usage except parameters, gradients, and optimizer states). +In later training, it will use the collected memory usage information to evict chunks dynamically. +Gemini allows you to fit much larger models with limited GPU memory. + +According to our benchmark results, we can train models with up to 24 billion parameters on 1 GPU. + +You can install the Colossal-AI integration by running + +.. code-block:: bash + + pip install lightning-colossalai + +This will install both the `colossalai `_ package as well as the ``ColossalAIStrategy`` for the Lightning Trainer: + +.. code-block:: python + + trainer = Trainer(strategy="colossalai", precision=16, devices=...) + + +You can tune several settings by instantiating the strategy object and passing options in: + +.. code-block:: python + + from lightning_colossalai import ColossalAIStrategy + + strategy = ColossalAIStrategy(...) + trainer = Trainer(strategy=strategy, precision=16, devices=...) + + +See a full example of a benchmark with a `GPT-2 model `_ of up to 24 billion parameters + +.. note:: + + * The only accelerator which ColossalAI supports is ``"gpu"``. But CPU resources will be used when the placement policy is set to "auto" or "cpu". + + * The only precision which ColossalAI allows is 16-bit mixed precision (FP16). + + * It only supports a single optimizer, which must be ``colossalai.nn.optimizer.CPUAdam`` or ``colossalai.nn.optimizer. + HybridAdam`` now. 
You can set ``adamw_mode`` to False to use normal Adam. Note that ``HybridAdam`` is highly optimized: it uses a fused CUDA kernel and a parallel CPU kernel. + It is recommended to use ``HybridAdam``, since it updates parameters on both the GPU and the CPU. + + * Your model must be created using the :meth:`~lightning.pytorch.core.module.LightningModule.configure_model` method. + + * ``ColossalAIStrategy`` doesn't support gradient accumulation as of now. + +.. _colossal_placement_policy: + +Model Definition +================ + +ColossalAI requires the layers of your model to be created in the special :meth:`~lightning.pytorch.core.module.LightningModule.configure_model` hook. +This allows the strategy to efficiently shard your model before materializing the weight tensors. + +.. code-block:: python + + class MyModel(LightningModule): + def __init__(self): + super().__init__() + # don't instantiate layers here + # move the creation of layers to `configure_model` + + def configure_model(self): + # create all your layers here + self.layers = nn.Sequential(...) + + +Placement Policy +================ + +Placement policies can help users fully exploit their GPU-CPU heterogeneous memory space for better training efficiency. +There are three options for the placement policy. +They are "cpu", "cuda" and "auto" respectively. + +When the placement policy is set to "cpu", all participating parameters will be offloaded into CPU memory immediately at the end of every auto-grad operation. +In this way, the "cpu" placement policy uses the least CUDA memory. +It is the best choice for users who want to exceptionally enlarge their model size or training batch size. + +When using the "cuda" option, all parameters are placed in CUDA memory and no CPU resources are used during training. +It is for users who have plenty of CUDA memory. + +The third option, "auto", enables Gemini. 
+It monitors the consumption of CUDA memory during the warmup phase and collects CUDA memory usage of all auto-grad operations. +In later training steps, Gemini automatically manages the data transmission between GPU and CPU according to collected CUDA memory usage information. +It is the fastest option when CUDA memory is sufficient. + +Here's an example of changing the placement policy to "cpu". + +.. code-block:: python + + from lightning_colossalai import ColossalAIStrategy + + model = MyModel() + my_strategy = ColossalAIStrategy(placement_policy="cpu") + trainer = Trainer(accelerator="gpu", devices=4, precision=16, strategy=my_strategy) + trainer.fit(model) diff --git a/docs/source-pytorch/integrations/strategies/hivemind.rst b/docs/source-pytorch/integrations/strategies/hivemind.rst new file mode 100644 index 0000000..32079b8 --- /dev/null +++ b/docs/source-pytorch/integrations/strategies/hivemind.rst @@ -0,0 +1,114 @@ +:orphan: + +################################################################ +Hivemind - training on unreliable mixed GPUs across the internet +################################################################ + +Collaborative Training tries to solve the need for top-tier multi-GPU servers by allowing you to train across unreliable machines, +such as local machines or even preemptible cloud compute across the internet. + +Under the hood, we use `Hivemind `__ which provides decentralized training across the internet. + +.. warning:: This is an :ref:`experimental ` feature. + + +To use Collaborative Training, you first need to install this extension. + +.. code-block:: bash + + pip install lightning-hivemind + +This will install both the `Hivemind `__ package as well as the ``HivemindStrategy`` for the Lightning Trainer. + +Reducing Communication By Overlapping Communication +^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + +We can reduce the impact of communication across all machines by overlapping communication with our training iterations. 
In short, we enable communication to happen +in the background of training. + +Overlap Gradient and State Averaging +"""""""""""""""""""""""""""""""""""" + +When the target batch size is reached, all processes that are included in the step send gradients and model states to each other. By enabling some flags through +the strategy, communication can happen in the background. This allows training to continue (with slightly outdated weights) but provides us the means +to overlap communication with computation. + +.. warning:: + Enabling overlapping communication means convergence will slightly be affected. + +.. note:: + Enabling these flags means that you must pass in a ``scheduler_fn`` to the ``HivemindStrategy`` instead of relying on a scheduler from ``configure_optimizers``. + The optimizer is re-created by Hivemind, and as a result, the scheduler has to be re-created. + +.. code-block:: python + + import torch + from functools import partial + from lightning import Trainer + from lightning_hivemind.strategy import HivemindStrategy + + trainer = Trainer( + strategy=HivemindStrategy( + target_batch_size=8192, + delay_state_averaging=True, + delay_grad_averaging=True, + delay_optimizer_step=True, + offload_optimizer=True, # required to delay averaging + scheduler_fn=partial(torch.optim.lr_scheduler.ExponentialLR, gamma=...), + ), + accelerator="gpu", + devices=1, + ) + + +Reducing GPU Memory requirements by re-using buffers & CPU offloading +^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + +We can also offload the optimizer state to the CPU whilst re-using gradient buffers to reduce the memory requirement for machines. + +Offloading Optimizer State to the CPU +""""""""""""""""""""""""""""""""""""" + +Offloading the Optimizer state to the CPU works the same as Deepspeed Zero-stage-2-offload, where we save GPU memory by keeping all optimizer states on the CPU. + +.. 
note:: + Enabling these flags means that you must pass in a ``scheduler_fn`` to the ``HivemindStrategy`` instead of relying on a scheduler from ``configure_optimizers``. + The optimizer is re-created by Hivemind, and as a result, the scheduler has to be re-created. + + We suggest enabling offloading and overlapping communication to hide the additional overhead from having to communicate with the CPU. + +.. code-block:: python + + import torch + from functools import partial + from lightning import Trainer + from lightning_hivemind.strategy import HivemindStrategy + + trainer = Trainer( + strategy=HivemindStrategy( + target_batch_size=8192, + offload_optimizer=True, + scheduler_fn=partial(torch.optim.lr_scheduler.ExponentialLR, gamma=...), + ), + accelerator="gpu", + devices=1, + ) + + +Re-using Gradient Buffers +""""""""""""""""""""""""" + +By default, Hivemind accumulates gradients in a separate buffer. This means additional GPU memory is required to store gradients. You can enable re-using the model parameter gradient buffers by passing ``reuse_grad_buffers=True`` to the ``HivemindStrategy``. + +.. warning:: + The ``HivemindStrategy`` will override ``zero_grad`` in your ``LightningModule`` to have no effect. This is because gradients are accumulated in the model + and Hivemind manages when they need to be cleared. + +.. code-block:: python + + from pytorch_lightning import Trainer + from lightning_hivemind.strategy import HivemindStrategy + + trainer = Trainer( + strategy=HivemindStrategy(target_batch_size=8192, reuse_grad_buffers=True), accelerator="gpu", devices=1 + ) diff --git a/docs/source-pytorch/levels/advanced.rst b/docs/source-pytorch/levels/advanced.rst new file mode 100644 index 0000000..f04f562 --- /dev/null +++ b/docs/source-pytorch/levels/advanced.rst @@ -0,0 +1,83 @@ + +############### +Advanced skills +############### + +Configure all aspects of Lightning for advanced usecases. + + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: Level 14: Customize configs to run in production + :description: Enable composable YAMLs + :col_css: col-md-6 + :button_link: advanced_level_15.html + :height: 150 + :tag: advanced + +.. displayitem:: + :header: Level 15: Customize the trainer + :description: Inject custom code into the trainer and modify the progress bar. + :col_css: col-md-6 + :button_link: advanced_level_16.html + :height: 150 + :tag: advanced + +.. displayitem:: + :header: Level 16: Own the training loop + :description: Learn all the ways of owning your raw PyTorch loops with Lightning. + :col_css: col-md-6 + :button_link: advanced_level_17.html + :height: 150 + :tag: advanced + +.. displayitem:: + :header: Level 17: Enable advanced checkpointing + :description: Enable composable or cloud based checkpoints. + :col_css: col-md-6 + :button_link: advanced_level_18.html + :height: 150 + :tag: advanced + +.. displayitem:: + :header: Level 18: Explore IPUs + :description: Explore Intelligence Processing Unit (IPU) for model scaling. + :col_css: col-md-6 + :button_link: advanced_level_19.html + :height: 150 + :tag: advanced + +.. displayitem:: + :header: Level 19: Explore HPUs + :description: Explore Habana Gaudi Processing Unit (HPU) for model scaling. + :col_css: col-md-6 + :button_link: advanced_level_20.html + :height: 150 + :tag: advanced + +.. displayitem:: + :header: Level 20: Master TPUs + :description: Master TPUs and run on cloud TPUs. + :col_css: col-md-6 + :button_link: advanced_level_21.html + :height: 150 + :tag: advanced + +.. displayitem:: + :header: Level 21: Reach 1 trillion parameters on GPUs + :description: Scale to 1 trillion params on GPUs. + :col_css: col-md-6 + :button_link: advanced_level_22.html + :height: 150 + :tag: advanced + +.. raw:: html + +
+
diff --git a/source/levels/advanced_level_15.rst b/docs/source-pytorch/levels/advanced_level_15.rst similarity index 94% rename from source/levels/advanced_level_15.rst rename to docs/source-pytorch/levels/advanced_level_15.rst index 761dbd3..fbbb4ef 100644 --- a/source/levels/advanced_level_15.rst +++ b/docs/source-pytorch/levels/advanced_level_15.rst @@ -1,7 +1,7 @@ :orphan: ################################################ -Level 15: Customize configs to run in production +Level 14: Customize configs to run in production ################################################ This level goes over advanced YAML use for running models in production. diff --git a/source/levels/advanced_level_16.rst b/docs/source-pytorch/levels/advanced_level_16.rst similarity index 87% rename from source/levels/advanced_level_16.rst rename to docs/source-pytorch/levels/advanced_level_16.rst index fd41df1..2e70c4b 100644 --- a/source/levels/advanced_level_16.rst +++ b/docs/source-pytorch/levels/advanced_level_16.rst @@ -1,10 +1,10 @@ :orphan: ############################### -Level 16: Customize the trainer +Level 15: Customize the trainer ############################### -In this level, you'll learn to modify the Trainer behavior. +In this level you'll learn to modify the behavior of the Trainer. ---- diff --git a/docs/source-pytorch/levels/advanced_level_17.rst b/docs/source-pytorch/levels/advanced_level_17.rst new file mode 100644 index 0000000..cc375dd --- /dev/null +++ b/docs/source-pytorch/levels/advanced_level_17.rst @@ -0,0 +1,37 @@ +:orphan: + +############################### +Level 16: Own the training loop +############################### + +Learn all the ways of owning your raw PyTorch loops with Lightning. + +---- + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: Enable manual optimization + :description: Gain control of the training loop with manual optimization and LightningModule methods. + :col_css: col-md-4 + :button_link: ../model/build_model_advanced.html + :height: 150 + :tag: advanced + +.. displayitem:: + :header: Use Lightning Fabric + :description: Write your own training loops using Lightning Fabric. + :col_css: col-md-4 + :button_link: https://lightning.ai/docs/fabric/stable/ + :height: 150 + :tag: advanced + +.. raw:: html + +
+
diff --git a/source/levels/advanced_level_18.rst b/docs/source-pytorch/levels/advanced_level_18.rst similarity index 87% rename from source/levels/advanced_level_18.rst rename to docs/source-pytorch/levels/advanced_level_18.rst index a7d7966..b34861d 100644 --- a/source/levels/advanced_level_18.rst +++ b/docs/source-pytorch/levels/advanced_level_18.rst @@ -1,10 +1,10 @@ :orphan: ####################################### -Level 18: Enable advanced checkpointing +Level 17: Enable advanced checkpointing ####################################### -This level shows you how to enable composable and/or cloud based checkpoints. +This level shows you how to enable composable and/or cloud-based checkpoints. ---- diff --git a/source/levels/advanced_level_19.rst b/docs/source-pytorch/levels/advanced_level_19.rst similarity index 97% rename from source/levels/advanced_level_19.rst rename to docs/source-pytorch/levels/advanced_level_19.rst index c7b6697..4265b03 100644 --- a/source/levels/advanced_level_19.rst +++ b/docs/source-pytorch/levels/advanced_level_19.rst @@ -1,7 +1,7 @@ :orphan: ###################### -Level 19: Explore IPUs +Level 18: Explore IPUs ###################### Explore Intelligence Processing Unit (IPU) for model scaling. diff --git a/source/levels/advanced_level_20.rst b/docs/source-pytorch/levels/advanced_level_20.rst similarity index 79% rename from source/levels/advanced_level_20.rst rename to docs/source-pytorch/levels/advanced_level_20.rst index 7e9d562..f17ebdf 100644 --- a/source/levels/advanced_level_20.rst +++ b/docs/source-pytorch/levels/advanced_level_20.rst @@ -4,7 +4,7 @@ Level 19: Explore HPUs ###################### -Explore Intelligence Processing Unit (IPU) for model scaling. +Explore Intel Habana Processing Unit (HPU) for model scaling. ---- @@ -19,7 +19,7 @@ Explore Intelligence Processing Unit (IPU) for model scaling. :header: Train models on HPUs :description: Learn the basics of single and multi-HPU core training. 
:col_css: col-md-6 - :button_link: ../accelerators/hpu_basic.html + :button_link: ../integrations/hpu/basic.html :height: 150 :tag: basic @@ -27,7 +27,7 @@ Explore Intelligence Processing Unit (IPU) for model scaling. :header: Optimize models training on HPUs :description: Enable state-of-the-art scaling with advanced mix-precision settings. :col_css: col-md-6 - :button_link: ../accelerators/hpu_intermediate.html + :button_link: ../integrations/hpu/intermediate.html :height: 150 :tag: intermediate diff --git a/source/levels/advanced_level_21.rst b/docs/source-pytorch/levels/advanced_level_21.rst similarity index 97% rename from source/levels/advanced_level_21.rst rename to docs/source-pytorch/levels/advanced_level_21.rst index 5252a1c..92358c0 100644 --- a/source/levels/advanced_level_21.rst +++ b/docs/source-pytorch/levels/advanced_level_21.rst @@ -1,7 +1,7 @@ :orphan: ##################### -Level 21: Master TPUs +Level 20: Master TPUs ##################### Master cloud TPU training with profiling and scaling techniques. diff --git a/source/levels/advanced_level_22.rst b/docs/source-pytorch/levels/advanced_level_22.rst similarity index 94% rename from source/levels/advanced_level_22.rst rename to docs/source-pytorch/levels/advanced_level_22.rst index a90a482..1e4dc39 100644 --- a/source/levels/advanced_level_22.rst +++ b/docs/source-pytorch/levels/advanced_level_22.rst @@ -1,7 +1,7 @@ :orphan: ############################################# -Level 22: Reach 1 trillion parameters on GPUs +Level 21: Reach 1 trillion parameters on GPUs ############################################# Scale to 1 trillion+ parameters with multiple distributed strategies. 
diff --git a/source/levels/basic_level_2.rst b/docs/source-pytorch/levels/basic_level_2.rst similarity index 100% rename from source/levels/basic_level_2.rst rename to docs/source-pytorch/levels/basic_level_2.rst diff --git a/source/levels/basic_level_5.rst b/docs/source-pytorch/levels/basic_level_5.rst similarity index 100% rename from source/levels/basic_level_5.rst rename to docs/source-pytorch/levels/basic_level_5.rst diff --git a/source/levels/core_level_3.rst b/docs/source-pytorch/levels/core_level_3.rst similarity index 100% rename from source/levels/core_level_3.rst rename to docs/source-pytorch/levels/core_level_3.rst diff --git a/source/levels/core_level_6.rst b/docs/source-pytorch/levels/core_level_6.rst similarity index 100% rename from source/levels/core_level_6.rst rename to docs/source-pytorch/levels/core_level_6.rst diff --git a/source/levels/core_skills.rst b/docs/source-pytorch/levels/core_skills.rst similarity index 95% rename from source/levels/core_skills.rst rename to docs/source-pytorch/levels/core_skills.rst index 19cab69..75c4002 100644 --- a/source/levels/core_skills.rst +++ b/docs/source-pytorch/levels/core_skills.rst @@ -4,10 +4,6 @@ Basic skills ############ Learn the basics of model development with Lightning. Researchers and machine learning engineers should start here. -.. join_slack:: - :align: left - ----- .. raw:: html @@ -27,7 +23,7 @@ Learn the basics of model development with Lightning. Researchers and machine le .. displayitem:: :header: Level 2: Add a validation and test set :description: Add validation and test sets to avoid over/underfitting. 
- :button_link: /levels/basic_level_2.html + :button_link: ../levels/basic_level_2.html :col_css: col-md-6 :height: 150 :tag: basic diff --git a/docs/source-pytorch/levels/expert.rst b/docs/source-pytorch/levels/expert.rst new file mode 100644 index 0000000..c734142 --- /dev/null +++ b/docs/source-pytorch/levels/expert.rst @@ -0,0 +1,51 @@ + +############# +Expert skills +############# + +Customize and extend Lightning for things like custom hardware or distributed strategies. + + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: Level 22: Extend the Lightning CLI + :description: Extend the functionality of the Lightning CLI. + :col_css: col-md-6 + :button_link: expert_level_23.html + :height: 150 + :tag: expert + +.. displayitem:: + :header: Level 23: Integrate a custom cluster + :description: Integrate a custom cluster into Lightning. + :col_css: col-md-6 + :button_link: expert_level_24.html + :height: 150 + :tag: expert + +.. displayitem:: + :header: Level 24: Make your own profiler + :description: Make your own profiler. + :col_css: col-md-6 + :button_link: ../tuning/profiler_expert.html + :height: 150 + :tag: expert + +.. displayitem:: + :header: Level 25: Add a new accelerator or Strategy + :description: Integrate a new accelerator or distributed strategy. + :col_css: col-md-6 + :button_link: expert_level_27.html + :height: 150 + :tag: expert + +.. raw:: html + +
+
diff --git a/source/levels/expert_level_23.rst b/docs/source-pytorch/levels/expert_level_23.rst similarity index 95% rename from source/levels/expert_level_23.rst rename to docs/source-pytorch/levels/expert_level_23.rst index 9b143a0..5d1ba67 100644 --- a/source/levels/expert_level_23.rst +++ b/docs/source-pytorch/levels/expert_level_23.rst @@ -1,7 +1,7 @@ :orphan: ################################## -Level 23: Extend the Lightning CLI +Level 22: Extend the Lightning CLI ################################## Extend the functionality of the Lightning CLI. diff --git a/docs/source-pytorch/levels/expert_level_24.rst b/docs/source-pytorch/levels/expert_level_24.rst new file mode 100644 index 0000000..54c544e --- /dev/null +++ b/docs/source-pytorch/levels/expert_level_24.rst @@ -0,0 +1,29 @@ +:orphan: + +#################################### +Level 23: Integrate a custom cluster +#################################### + +Integrate a custom cluster into Lightning. + +---- + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: Integrate your own cluster + :description: Learn how to integrate your own cluster + :col_css: col-md-6 + :button_link: ../clouds/cluster_expert.html + :height: 150 + :tag: expert + +.. raw:: html + +
+
diff --git a/source/levels/expert_level_27.rst b/docs/source-pytorch/levels/expert_level_27.rst similarity index 96% rename from source/levels/expert_level_27.rst rename to docs/source-pytorch/levels/expert_level_27.rst index c2d682b..9b06b10 100644 --- a/source/levels/expert_level_27.rst +++ b/docs/source-pytorch/levels/expert_level_27.rst @@ -1,7 +1,7 @@ :orphan: ########################################### -Level 27: Add a new accelerator or Strategy +Level 25: Add a new accelerator or Strategy ########################################### Integrate a new accelerator or distributed strategy. diff --git a/docs/source-pytorch/levels/intermediate.rst b/docs/source-pytorch/levels/intermediate.rst new file mode 100644 index 0000000..f7beb29 --- /dev/null +++ b/docs/source-pytorch/levels/intermediate.rst @@ -0,0 +1,77 @@ + +################### +Intermediate skills +################### + +Learn to scale up your models and enable collaborative model development at academic or industry research labs. + + +.. include:: ../links.rst + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: Level 7: Interactive cloud development + :description: Learn how to access GPUs and TPUs on the cloud. + :button_link: intermediate_level_7.html + :col_css: col-md-6 + :height: 150 + :tag: intermediate + +.. displayitem:: + :header: Level 8: Modularize your projects + :description: Create DataModules to enable dataset reusability. + :col_css: col-md-6 + :button_link: intermediate_level_9.html + :height: 150 + :tag: intermediate + +.. displayitem:: + :header: Level 9: Understand your model + :description: Use advanced visuals to find the best performing model. + :col_css: col-md-6 + :button_link: intermediate_level_10.html + :height: 150 + :tag: intermediate + +.. displayitem:: + :header: Level 10: Explore SOTA scaling techniques + :description: Explore SOTA techniques to help convergence, stability and scalability. + :col_css: col-md-6 + :button_link: intermediate_level_11.html + :height: 150 + :tag: intermediate + +.. displayitem:: + :header: Level 11: Deploy your models + :description: Learn how to deploy your models with optimizations like ONNX and torchscript. + :col_css: col-md-6 + :button_link: intermediate_level_12.html + :height: 150 + :tag: intermediate + +.. displayitem:: + :header: Level 12: Optimize training speed + :description: Use advanced profilers and mixed precision to train bigger models, faster. + :col_css: col-md-6 + :button_link: intermediate_level_13.html + :height: 150 + :tag: intermediate + +.. displayitem:: + :header: Level 13: Run on on-prem clusters + :description: Run on a custom on-prem cluster or SLURM cluster. + :col_css: col-md-6 + :button_link: intermediate_level_14.html + :height: 150 + :tag: intermediate + +.. raw:: html + +
+
diff --git a/source/levels/intermediate_level_10.rst b/docs/source-pytorch/levels/intermediate_level_10.rst similarity index 97% rename from source/levels/intermediate_level_10.rst rename to docs/source-pytorch/levels/intermediate_level_10.rst index d7f5dc5..1c9b646 100644 --- a/source/levels/intermediate_level_10.rst +++ b/docs/source-pytorch/levels/intermediate_level_10.rst @@ -1,7 +1,7 @@ :orphan: ############################### -Level 10: Understand your model +Level 9: Understand your model ############################### Find the best model using advanced visualizations for deeper insights. diff --git a/source/levels/intermediate_level_11.rst b/docs/source-pytorch/levels/intermediate_level_11.rst similarity index 95% rename from source/levels/intermediate_level_11.rst rename to docs/source-pytorch/levels/intermediate_level_11.rst index 4c7ed06..77dbbf9 100644 --- a/source/levels/intermediate_level_11.rst +++ b/docs/source-pytorch/levels/intermediate_level_11.rst @@ -1,7 +1,7 @@ :orphan: ######################################### -Level 11: Explore SOTA scaling techniques +Level 10: Explore SOTA scaling techniques ######################################### In this level you'll explore SOTA techniques to help convergence, stability and scalability. diff --git a/source/levels/intermediate_level_12.rst b/docs/source-pytorch/levels/intermediate_level_12.rst similarity index 97% rename from source/levels/intermediate_level_12.rst rename to docs/source-pytorch/levels/intermediate_level_12.rst index fe1c076..b929355 100644 --- a/source/levels/intermediate_level_12.rst +++ b/docs/source-pytorch/levels/intermediate_level_12.rst @@ -1,7 +1,7 @@ :orphan: ############################ -Level 12: Deploy your models +Level 11: Deploy your models ############################ In this level you'll learn a few options for deploying models into production. 
diff --git a/source/levels/intermediate_level_13.rst b/docs/source-pytorch/levels/intermediate_level_13.rst similarity index 96% rename from source/levels/intermediate_level_13.rst rename to docs/source-pytorch/levels/intermediate_level_13.rst index 38ac7aa..345e6d6 100644 --- a/source/levels/intermediate_level_13.rst +++ b/docs/source-pytorch/levels/intermediate_level_13.rst @@ -1,7 +1,7 @@ :orphan: ################################# -Level 13: Optimize training speed +Level 12: Optimize training speed ################################# In this level you'll use advanced profilers and mixed precision techniques to train bigger models faster. diff --git a/source/levels/intermediate_level_14.rst b/docs/source-pytorch/levels/intermediate_level_14.rst similarity index 91% rename from source/levels/intermediate_level_14.rst rename to docs/source-pytorch/levels/intermediate_level_14.rst index a779ede..b73cce2 100644 --- a/source/levels/intermediate_level_14.rst +++ b/docs/source-pytorch/levels/intermediate_level_14.rst @@ -1,10 +1,10 @@ :orphan: ################################# -Level 14: Run on on-prem clusters +Level 13: Run on on-prem clusters ################################# -In this level you'll learn to run on onprem clusters. +In this level you'll learn to run on on-prem clusters. ---- diff --git a/source/levels/intermediate_level_7.rst b/docs/source-pytorch/levels/intermediate_level_7.rst similarity index 79% rename from source/levels/intermediate_level_7.rst rename to docs/source-pytorch/levels/intermediate_level_7.rst index cc55fd7..ef4122d 100644 --- a/source/levels/intermediate_level_7.rst +++ b/docs/source-pytorch/levels/intermediate_level_7.rst @@ -21,14 +21,6 @@ Learn to develop models on cloud GPUs and TPUs. :height: 180 :tag: basic -.. displayitem:: - :header: Access a cloud machine with GPUs - :description: Learn how to get a cloud machine with single or multiple GPUs. 
- :col_css: col-md-3 - :button_link: ../clouds/session_basic.html - :height: 180 - :tag: basic - .. displayitem:: :header: GPU Training :description: Learn the basics on single and multi-GPU training. diff --git a/source/levels/intermediate_level_9.rst b/docs/source-pytorch/levels/intermediate_level_9.rst similarity index 96% rename from source/levels/intermediate_level_9.rst rename to docs/source-pytorch/levels/intermediate_level_9.rst index 8c537d7..b09db07 100644 --- a/source/levels/intermediate_level_9.rst +++ b/docs/source-pytorch/levels/intermediate_level_9.rst @@ -1,7 +1,7 @@ :orphan: ################################# -Level 9: Modularize your projects +Level 8: Modularize your projects ################################# This module teaches you how to setup complex projects that can be controlled via the CLI. diff --git a/source/links.rst b/docs/source-pytorch/links.rst similarity index 100% rename from source/links.rst rename to docs/source-pytorch/links.rst diff --git a/docs/source-pytorch/make.bat b/docs/source-pytorch/make.bat new file mode 100644 index 0000000..9b56514 --- /dev/null +++ b/docs/source-pytorch/make.bat @@ -0,0 +1,35 @@ +@ECHO OFF + +pushd %~dp0 + +REM Command file for Sphinx documentation + +if "%SPHINXBUILD%" == "" ( + set SPHINXBUILD=sphinx-build +) +set SOURCEDIR=. +set BUILDDIR=../build + +if "%1" == "" goto help + +%SPHINXBUILD% >NUL 2>NUL +if errorlevel 9009 ( + echo. + echo.The 'sphinx-build' command was not found. Make sure you have Sphinx + echo.installed, then set the SPHINXBUILD environment variable to point + echo.to the full path of the 'sphinx-build' executable. Alternatively you + echo.may add the Sphinx directory to PATH. + echo. 
+ echo.If you don't have Sphinx installed, grab it from + echo.http://sphinx-doc.org/ + exit /b 1 +) + +%SPHINXBUILD% -M %1 %SOURCEDIR% %BUILDDIR% %SPHINXOPTS% +goto end + +:help +%SPHINXBUILD% -M help %SOURCEDIR% %BUILDDIR% %SPHINXOPTS% + +:end +popd diff --git a/docs/source-pytorch/model/build_model.rst b/docs/source-pytorch/model/build_model.rst new file mode 100644 index 0000000..c480a90 --- /dev/null +++ b/docs/source-pytorch/model/build_model.rst @@ -0,0 +1,55 @@ +:orphan: + +############# +Build a Model +############# + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: 1: Train a model + :description: Build a model to learn the basic ideas of Lightning + :col_css: col-md-4 + :button_link: train_model_basic.html + :height: 150 + :tag: basic + +.. displayitem:: + :header: 2: Validate and test a model + :description: Add a validation and test data split to avoid overfitting. + :col_css: col-md-4 + :button_link: ../common/evaluation_basic.html + :height: 150 + :tag: basic + +.. displayitem:: + :header: 3: Supercharge training + :description: Enable state-of-the-art training techniques with the Trainer features. + :col_css: col-md-4 + :button_link: build_model_intermediate.html + :height: 150 + :tag: intermediate + +.. displayitem:: + :header: LightningModule API + :description: Dig into LightningModule API in depth + :col_css: col-md-4 + :button_link: ../common/lightning_module.html#lightningmodule-api + :height: 150 + +.. displayitem:: + :header: Trainer API + :description: Dig into Trainer API in depth + :col_css: col-md-4 + :button_link: ../common/trainer.html#trainer-class-api + :height: 150 + +.. raw:: html + +
+
diff --git a/source/model/build_model_advanced.rst b/docs/source-pytorch/model/build_model_advanced.rst similarity index 77% rename from source/model/build_model_advanced.rst rename to docs/source-pytorch/model/build_model_advanced.rst index 33be842..fb06cdf 100644 --- a/source/model/build_model_advanced.rst +++ b/docs/source-pytorch/model/build_model_advanced.rst @@ -8,7 +8,7 @@ Own your loop (advanced) Customize training loop *********************** -.. image:: https://pl-bolts-doc-images.s3.us-east-2.amazonaws.com/custom_loop.png +.. image:: ../_static/fetched-s3-assets/custom_loop.png :width: 600 :alt: Injecting custom code in a training loop @@ -17,7 +17,7 @@ Inject custom code anywhere in the Training loop using any of the 20+ methods (: .. testcode:: class LitModel(pl.LightningModule): - def backward(self, loss, optimizer, optimizer_idx): + def backward(self, loss): loss.backward() ---- diff --git a/source/model/build_model_intermediate.rst b/docs/source-pytorch/model/build_model_intermediate.rst similarity index 86% rename from source/model/build_model_intermediate.rst rename to docs/source-pytorch/model/build_model_intermediate.rst index 55f1247..1ecf1d4 100644 --- a/source/model/build_model_intermediate.rst +++ b/docs/source-pytorch/model/build_model_intermediate.rst @@ -35,10 +35,11 @@ Enable advanced training features using Trainer arguments. These are SOTA techni Extend the Trainer ****************** -.. raw:: html - - +.. video:: ../_static/fetched-s3-assets/cb.mp4 + :width: 600 + :autoplay: + :loop: + :muted: If you have multiple lines of code with similar functionalities, you can use *callbacks* to easily group them together and toggle all of those lines on or off at the same time. 
diff --git a/docs/source-pytorch/model/manual_optimization.rst b/docs/source-pytorch/model/manual_optimization.rst new file mode 100644 index 0000000..964f095 --- /dev/null +++ b/docs/source-pytorch/model/manual_optimization.rst @@ -0,0 +1,348 @@ +******************* +Manual Optimization +******************* + +For advanced research topics like reinforcement learning, sparse coding, or GAN research, it may be desirable to +manually manage the optimization process, especially when dealing with multiple optimizers at the same time. + +In this mode, Lightning will handle only accelerator, precision and strategy logic. +Users are responsible for ``optimizer.zero_grad()``, gradient accumulation, optimizer toggling, etc. + +To manually optimize, do the following: + +* Set ``self.automatic_optimization=False`` in your ``LightningModule``'s ``__init__``. +* Use the following functions and call them manually: + + * ``self.optimizers()`` to access your optimizers (one or multiple) + * ``optimizer.zero_grad()`` to clear the gradients from the previous training step + * ``self.manual_backward(loss)`` instead of ``loss.backward()`` + * ``optimizer.step()`` to update your model parameters + * ``self.toggle_optimizer()`` and ``self.untoggle_optimizer()`` if needed + +Here is a minimal example of manual optimization. + +.. testcode:: python + + from lightning.pytorch import LightningModule + + + class MyModel(LightningModule): + def __init__(self): + super().__init__() + # Important: This property activates manual optimization. + self.automatic_optimization = False + + def training_step(self, batch, batch_idx): + opt = self.optimizers() + opt.zero_grad() + loss = self.compute_loss(batch) + self.manual_backward(loss) + opt.step() + +.. tip:: + Be careful where you call ``optimizer.zero_grad()``, or your model won't converge. + It is good practice to call ``optimizer.zero_grad()`` before ``self.manual_backward(loss)``.
+ + +Access your Own Optimizer +========================= + +The provided ``optimizer`` is a :class:`~lightning.pytorch.core.optimizer.LightningOptimizer` object wrapping your own optimizer +configured in your :meth:`~lightning.pytorch.core.module.LightningModule.configure_optimizers`. You can access your own optimizer +with ``optimizer.optimizer``. However, if you use your own optimizer to perform a step, Lightning won't be able to +support accelerators, precision and profiling for you. + +.. testcode:: python + + class Model(LightningModule): + def __init__(self): + super().__init__() + self.automatic_optimization = False + ... + + def training_step(self, batch, batch_idx): + optimizer = self.optimizers() + + # `optimizer` is a `LightningOptimizer` wrapping the optimizer. + # To access it, do the following. + # However, it won't work on TPU, AMP, etc... + optimizer = optimizer.optimizer + ... + +Gradient Accumulation +===================== + +You can accumulate gradients over batches similarly to ``accumulate_grad_batches`` argument in +:ref:`Trainer ` for automatic optimization. To perform gradient accumulation with one optimizer +after every ``N`` steps, you can do as such. + +.. testcode:: python + + def __init__(self): + super().__init__() + self.automatic_optimization = False + + + def training_step(self, batch, batch_idx): + opt = self.optimizers() + + # scale losses by 1/N (for N batches of gradient accumulation) + loss = self.compute_loss(batch) / N + self.manual_backward(loss) + + # accumulate gradients of N batches + if (batch_idx + 1) % N == 0: + opt.step() + opt.zero_grad() + +Gradient Clipping +================= + +You can clip optimizer gradients during manual optimization similar to passing the ``gradient_clip_val`` and +``gradient_clip_algorithm`` argument in :ref:`Trainer ` during automatic optimization. +To perform gradient clipping with one optimizer with manual optimization, you can do as such. + +.. 
testcode:: python + + from lightning.pytorch import LightningModule + + + class SimpleModel(LightningModule): + def __init__(self): + super().__init__() + self.automatic_optimization = False + + def training_step(self, batch, batch_idx): + opt = self.optimizers() + + # compute loss + loss = self.compute_loss(batch) + + opt.zero_grad() + self.manual_backward(loss) + + # clip gradients + self.clip_gradients(opt, gradient_clip_val=0.5, gradient_clip_algorithm="norm") + + opt.step() + +.. warning:: + * Note that ``configure_gradient_clipping()`` won't be called in Manual Optimization. Instead, consider using ``self.clip_gradients()`` manually like in the example above. + + +Use Multiple Optimizers (like GANs) +=================================== + +Here is an example training a simple GAN with multiple optimizers using manual optimization. + +.. testcode:: python + + import torch + from torch import Tensor + from lightning.pytorch import LightningModule + + + class SimpleGAN(LightningModule): + def __init__(self): + super().__init__() + self.G = Generator() + self.D = Discriminator() + + # Important: This property activates manual optimization.
+ self.automatic_optimization = False + + def sample_z(self, n) -> Tensor: + sample = self._Z.sample((n,)) + return sample + + def sample_G(self, n) -> Tensor: + z = self.sample_z(n) + return self.G(z) + + def training_step(self, batch, batch_idx): + # Implementation follows the PyTorch tutorial: + # https://pytorch.org/tutorials/beginner/dcgan_faces_tutorial.html + g_opt, d_opt = self.optimizers() + + X, _ = batch + batch_size = X.shape[0] + + real_label = torch.ones((batch_size, 1), device=self.device) + fake_label = torch.zeros((batch_size, 1), device=self.device) + + g_X = self.sample_G(batch_size) + + ########################## + # Optimize Discriminator # + ########################## + d_x = self.D(X) + errD_real = self.criterion(d_x, real_label) + + d_z = self.D(g_X.detach()) + errD_fake = self.criterion(d_z, fake_label) + + errD = errD_real + errD_fake + + d_opt.zero_grad() + self.manual_backward(errD) + d_opt.step() + + ###################### + # Optimize Generator # + ###################### + d_z = self.D(g_X) + errG = self.criterion(d_z, real_label) + + g_opt.zero_grad() + self.manual_backward(errG) + g_opt.step() + + self.log_dict({"g_loss": errG, "d_loss": errD}, prog_bar=True) + + def configure_optimizers(self): + g_opt = torch.optim.Adam(self.G.parameters(), lr=1e-5) + d_opt = torch.optim.Adam(self.D.parameters(), lr=1e-5) + return g_opt, d_opt + + +Learning Rate Scheduling +======================== + +Every optimizer you use can be paired with any +`Learning Rate Scheduler `_. Please see the +documentation of :meth:`~lightning.pytorch.core.module.LightningModule.configure_optimizers` for all the available options + +You can call ``lr_scheduler.step()`` at arbitrary intervals. +Use ``self.lr_schedulers()`` in your :class:`~lightning.pytorch.core.module.LightningModule` to access any learning rate schedulers +defined in your :meth:`~lightning.pytorch.core.module.LightningModule.configure_optimizers`. + +.. 
warning:: + * ``lr_scheduler.step()`` can be called at arbitrary intervals by the user in case of manual optimization, or by Lightning if ``"interval"`` is defined in :meth:`~lightning.pytorch.core.module.LightningModule.configure_optimizers` in case of automatic optimization. + * Note that the ``lr_scheduler_config`` keys, such as ``"frequency"`` and ``"interval"``, will be ignored even if they are provided in + your :meth:`~lightning.pytorch.core.module.LightningModule.configure_optimizers` during manual optimization. + +Here is an example calling ``lr_scheduler.step()`` every step. + +.. testcode:: python + + # step every batch + def __init__(self): + super().__init__() + self.automatic_optimization = False + + + def training_step(self, batch, batch_idx): + # do forward, backward, and optimization + ... + + # single scheduler + sch = self.lr_schedulers() + sch.step() + + # multiple schedulers + sch1, sch2 = self.lr_schedulers() + sch1.step() + sch2.step() + +If you want to call ``lr_scheduler.step()`` every ``N`` steps/epochs, do the following. + +.. testcode:: python + + def __init__(self): + super().__init__() + self.automatic_optimization = False + + + def training_step(self, batch, batch_idx): + # do forward, backward, and optimization + ... + + sch = self.lr_schedulers() + + # step every N batches + if (batch_idx + 1) % N == 0: + sch.step() + + # step every N epochs + if self.trainer.is_last_batch and (self.trainer.current_epoch + 1) % N == 0: + sch.step() + +If you want to call schedulers that require a metric value after each epoch, consider doing the following: + +.. testcode:: + + def __init__(self): + super().__init__() + self.automatic_optimization = False + + + def on_train_epoch_end(self): + sch = self.lr_schedulers() + + # If the selected scheduler is a ReduceLROnPlateau scheduler. 
+ if isinstance(sch, torch.optim.lr_scheduler.ReduceLROnPlateau): + sch.step(self.trainer.callback_metrics["loss"]) + + +Optimizer Steps at Different Frequencies +======================================== + +In manual optimization, you are free to ``step()`` one optimizer more often than another one. +For example, here we step the optimizer for the *discriminator* weights twice as often as the optimizer for the *generator*. + +.. testcode:: python + + # Alternating schedule for optimizer steps (e.g. GANs) + def training_step(self, batch, batch_idx): + g_opt, d_opt = self.optimizers() + ... + + # update discriminator every other step + d_opt.zero_grad() + self.manual_backward(errD) + if (batch_idx + 1) % 2 == 0: + d_opt.step() + + ... + + # update generator every step + g_opt.zero_grad() + self.manual_backward(errG) + g_opt.step() + + +Use Closure for LBFGS-like Optimizers +===================================== + +It is a good practice to provide the optimizer with a closure function that performs a ``forward``, ``zero_grad`` and +``backward`` of your model. It is optional for most optimizers, but makes your code compatible if you switch to an +optimizer which requires a closure, such as :class:`~torch.optim.LBFGS`. + +See `the PyTorch docs `_ for more about the closure. + +Here is an example using a closure function. + +.. testcode:: python + + def __init__(self): + super().__init__() + self.automatic_optimization = False + + + def configure_optimizers(self): + return torch.optim.LBFGS(...) + + + def training_step(self, batch, batch_idx): + opt = self.optimizers() + + def closure(): + loss = self.compute_loss(batch) + opt.zero_grad() + self.manual_backward(loss) + return loss + + opt.step(closure=closure) + +.. warning:: + The :class:`~torch.optim.LBFGS` optimizer is not supported for AMP, IPUs, or DeepSpeed. 
diff --git a/docs/source-pytorch/model/own_your_loop.rst b/docs/source-pytorch/model/own_your_loop.rst new file mode 100644 index 0000000..ad0c889 --- /dev/null +++ b/docs/source-pytorch/model/own_your_loop.rst @@ -0,0 +1,25 @@ +:orphan: + +################################ +Use a pure PyTorch training loop +################################ + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: Enable manual optimization + :description: Gain control of the training loop with manual optimization and LightningModule methods. + :col_css: col-md-4 + :button_link: build_model_advanced.html + :height: 150 + :tag: advanced + +.. raw:: html + +
+
diff --git a/source/model/train_model_basic.rst b/docs/source-pytorch/model/train_model_basic.rst similarity index 91% rename from source/model/train_model_basic.rst rename to docs/source-pytorch/model/train_model_basic.rst index 24bdab8..028734e 100644 --- a/source/model/train_model_basic.rst +++ b/docs/source-pytorch/model/train_model_basic.rst @@ -20,8 +20,8 @@ Add the relevant imports at the top of the file import torch.nn.functional as F from torchvision import transforms from torchvision.datasets import MNIST - from torch.utils.data import DataLoader, random_split - import pytorch_lightning as pl + from torch.utils.data import DataLoader + import lightning.pytorch as pl ---- @@ -33,6 +33,7 @@ Define the PyTorch nn.Modules class Encoder(nn.Module): def __init__(self): + super().__init__() self.l1 = nn.Sequential(nn.Linear(28 * 28, 64), nn.ReLU(), nn.Linear(64, 3)) def forward(self, x): @@ -41,6 +42,7 @@ Define the PyTorch nn.Modules class Decoder(nn.Module): def __init__(self): + super().__init__() self.l1 = nn.Sequential(nn.Linear(3, 64), nn.ReLU(), nn.Linear(64, 28 * 28)) def forward(self, x): @@ -114,11 +116,11 @@ Under the hood, the Lightning Trainer runs the following training loop on your b .. code:: python - autoencoder = LitAutoEncoder(encoder, decoder) + autoencoder = LitAutoEncoder(Encoder(), Decoder()) optimizer = autoencoder.configure_optimizers() - for batch, batch_idx in enumerate(train_loader): - loss = autoencoder(batch, batch_idx) + for batch_idx, batch in enumerate(train_loader): + loss = autoencoder.training_step(batch, batch_idx) loss.backward() optimizer.step() diff --git a/docs/source-pytorch/notebooks.rst b/docs/source-pytorch/notebooks.rst new file mode 100644 index 0000000..1fcafec --- /dev/null +++ b/docs/source-pytorch/notebooks.rst @@ -0,0 +1,12 @@ +:orphan: + +PyTorch Lightning Tutorials +=========================== + +.. 
toctree:: + :maxdepth: 1 + :name: Notebooks + :caption: Notebooks + :glob: + + notebooks/**/* diff --git a/docs/source-pytorch/past_versions.rst b/docs/source-pytorch/past_versions.rst new file mode 100644 index 0000000..597e2c1 --- /dev/null +++ b/docs/source-pytorch/past_versions.rst @@ -0,0 +1,141 @@ +Past PyTorch Lightning versions +=============================== + +PyTorch Lightning :doc:`evolved over time `. Here's the history of versions with links to their respective docs. + +To help you keep up to speed, check the :doc:`Migration guide `. + +.. list-table:: Past versions + :widths: 5 50 30 15 + :header-rows: 1 + + * - Version + - Title + - Bug-fix versions + - Upgrade guide + + * - `1.9 `_ + - `Stability and additional improvements `_ + - `1.9.0 `_, + `1.9.1 `_, + `1.9.2 `_, + `1.9.3 `_, + `1.9.4 `_, + `1.9.5 `_ + - :doc:`from 1.9 to 2.0 ` + + * - `1.8 `_ + - `Colossal-AI Strategy, Commands and Secrets for Apps, FSDP Improvements and More! `_ + - `1.8.0 `_, + `1.8.1 `_, + `1.8.2 `_, + `1.8.3 `_, + `1.8.4 `_, + `1.8.5 `_, + `1.8.6 `_ + - :doc:`from 1.8 to 2.0 ` + + * - `1.7 `_ + - `Apple Silicon support, Native FSDP, Collaborative training, and multi-GPU support with Jupyter notebooks `_ + - `1.7.0 `_, + `1.7.1 `_, + `1.7.2 `_, + `1.7.3 `_, + `1.7.4 `_, + `1.7.5 `_, + `1.7.6 `_, + `1.7.7 `_ + - :doc:`from 1.7 to 2.0 ` + + * - `1.6 `_ + - `Support Intel's Habana Accelerator, New efficient DDP strategy (Bagua), Manual Fault-tolerance, Stability and Reliability `_ + - `1.6.0 `_, + `1.6.1 `_, + `1.6.2 `_, + `1.6.3 `_, + `1.6.4 `_, + `1.6.5 `_ + - :doc:`from 1.6 to 2.0 ` + + * - `1.5 `_ + - `LightningLite, Fault-Tolerant Training, Loop Customization, Lightning Tutorials, LightningCLI v2, RichProgressBar, CheckpointIO Plugin, and Trainer Strategy Flag `_ + - `1.5.0 `_, + `1.5.1 `_, + `1.5.2 `_, + `1.5.3 `_, + `1.5.4 `_, + `1.5.5 `_, + `1.5.6 `_, + `1.5.7 `_, + `1.5.8 `_, + `1.5.9 `_, + `1.5.10 `_ + - :doc:`from 1.5 to 2.0 ` + + * - `1.4 `_ + - `TPU Pod
Training, IPU Accelerator, DeepSpeed Infinity, Fully Sharded Data Parallel `_ + - `1.4.0 `_, + `1.4.1 `_, + `1.4.2 `_, + `1.4.3 `_, + `1.4.4 `_, + `1.4.5 `_, + `1.4.6 `_, + `1.4.7 `_, + `1.4.8 `_, + `1.4.9 `_ + - :doc:`from 1.4 to 2.0 ` + + * - `1.3 `_ + - `Lightning CLI, PyTorch Profiler, Improved Early Stopping `_ + - `1.3.0 `_, + `1.3.1 `_, + `1.3.2 `_, + `1.3.3 `_, + `1.3.4 `_, + `1.3.5 `_, + `1.3.6 `_, + `1.3.7 `_, + `1.3.8 `_ + - + + * - `1.2 `_ + - `Pruning & Quantization & SWA `_ + - `1.2.0 `_, + `1.2.1 `_, + `1.2.2 `_, + `1.2.3 `_, + `1.2.4 `_, + `1.2.5 `_, + `1.2.6 `_, + `1.2.7 `_, + `1.2.8 `_, + `1.2.9 `_, + `1.2.10 `_ + - + + * - `1.1 `_ + - `Model Parallelism Training and More Logging Options `_ + - `1.1.0 `_, + `1.1.1 `_, + `1.1.2 `_, + `1.1.3 `_, + `1.1.4 `_, + `1.1.5 `_, + `1.1.6 `_, + `1.1.7 `_, + `1.1.8 `_ + - + + * - `1.0 `_ + - `General availability `_ + - `1.0.0 `_, + `1.0.1 `_, + `1.0.2 `_, + `1.0.3 `_, + `1.0.4 `_, + `1.0.5 `_, + `1.0.6 `_, + `1.0.7 `_, + `1.0.8 `_ + - diff --git a/source/starter/converting.rst b/docs/source-pytorch/starter/converting.rst similarity index 92% rename from source/starter/converting.rst rename to docs/source-pytorch/starter/converting.rst index 9e664d6..1e0d179 100644 --- a/source/starter/converting.rst +++ b/docs/source-pytorch/starter/converting.rst @@ -8,15 +8,15 @@ PyTorch를 Lightning으로 구성하기 -------- -****************************** +******************************* 1. 연산 코드 가져오기 -****************************** +******************************* 일반적인 nn.Module 구조를 가져옵니다 .. testcode:: - import pytorch_lightning as pl + import lightning.pytorch as pl import torch import torch.nn as nn import torch.nn.functional as F @@ -37,9 +37,9 @@ PyTorch를 Lightning으로 구성하기 -------- -*************************** +******************************** 2. 학습 로직 구성하기 -*************************** +******************************** LightningModule의 training_step에 학습 데이터를 묶음(batch)으로 가져와 학습하는 과정을 구성합니다: .. 
testcode:: @@ -59,9 +59,9 @@ LightningModule의 training_step에 학습 데이터를 묶음(batch)으로 가 ---- -**************************************** -3. 옵티마이저와 LR스케줄러 이동하기 -**************************************** +************************************************** +3. Move Optimizer(s) and LR Scheduler(s) +************************************************** 옵티마이저(들)를 :meth:`~pytorch_lightning.core.lightning.LightningModule.configure_optimizers` 훅(hook)으로 이동합니다. .. testcode:: @@ -92,9 +92,9 @@ LightningModule의 training_step에 학습 데이터를 묶음(batch)으로 가 -------- -************************************ +***************************************** 5. (선택사항) 테스트 로직 구성하기 -************************************ +***************************************** 테스트(test) 루프가 필요하면, 테스트 데이터를 묶음(batch)으로 가져와 테스트하는 과정을 구성합니다: .. testcode:: @@ -127,8 +127,6 @@ LightningModule의 training_step에 학습 데이터를 묶음(batch)으로 가 7. .cuda() 또는 .to(device) 호출 제거하기 ****************************************** -:doc:`LightningModule <../common/lightning_module>` 은 어떠한 하드웨어에서도 자동으로 실행됩니다! - ``LightningModule.__init__`` 내에서 초기화된 :class:`~torch.nn.Module` 인스턴스들과 :class:`~torch.utils.data.DataLoader` 에서 가져온 데이터는 Lightning이 자동으로 해당 장치로 이동해서 실행하므로, 기존에 명시적으로 ``.cuda()`` 또는 ``.to(device)`` 을 호출하는 부분은 제거해도 됩니다. @@ -154,17 +152,16 @@ Hint: ``LightningModule.__init__`` 메소드 내에서 :class:`~torch.Tensor` -------- -************************* +****************************** 8. 기존 데이터 사용하기 -************************* +****************************** 일반적인 PyTorch DataLoader는 Lightning에서 동작합니다. 더 모듈화되고 확장 가능한 데이터셋들은 :doc:`LightningDataModule <../data/datamodule>` 를 참고하세요. - ---- -************ +********************** 더 알아두기 -************ +********************** 추가로, :meth:`~pytorch_lightning.trainer.trainer.Trainer.validate` 메소드를 사용하면 검증(validation) 루프만 실행할 수 있습니다. @@ -175,7 +172,6 @@ Hint: ``LightningModule.__init__`` 메소드 내에서 :class:`~torch.Tensor` .. note:: ``model.eval()`` 와 ``torch.no_grad()`` 는 검증 시에 자동으로 호출됩니다. 
- 테스트 루프(test loop)는 :meth:`~pytorch_lightning.trainer.trainer.Trainer.fit` 에서 사용되지 않으므로, 필요 시 명시적으로 :meth:`~pytorch_lightning.trainer.trainer.Trainer.test` 을 호출해야 합니다. diff --git a/docs/source-pytorch/starter/installation.rst b/docs/source-pytorch/starter/installation.rst new file mode 100644 index 0000000..4d34f87 --- /dev/null +++ b/docs/source-pytorch/starter/installation.rst @@ -0,0 +1,91 @@ +:orphan: + +.. _installation: + +############ +설치하기 +############ + +********************* +pip를 사용하여 설치 +********************* + +라이트닝(lightning)을 가상환경이나 conda 환경에서 pip로 설치할 수 있습니다 + +.. code-block:: bash + + python -m pip install lightning + +-------------- + +*********************** +Conda를 사용하여 설치 +*********************** + +만약 conda를 아직 설치하지 않았다면, `Conda 설치 가이드 `_ 를 참고하세요. +Lightning은 아래 명령어로 `conda `_ 를 사용하여 설치할 수 있습니다: + +.. code-block:: bash + + conda install lightning -c conda-forge + +`Conda 가상환경(Environments) `_ 을 사용할 수도 있습니다: + +.. code-block:: bash + + conda activate my_env + conda install lightning -c conda-forge + +---- + +GRPC 패키지를 가져오는 데 어려움이 있는 경우 `이 글 `_ 을 따라해보세요. + + + +---- + +********************** +소스 코드에서 설치 +********************** + +소스 코드로 최신 버전(nightly)을 설치합니다. 아직 배포되지 않은 버그 수정(bug fix)과 새롭게 출시할 기능들이 +포함되어 있습니다. 미검증·불안정 최신 기능(bleeding edge)이므로, 신중하게 사용하세요. + +.. code-block:: bash + + pip install https://github.com/Lightning-AI/lightning/archive/refs/heads/master.zip -U + +향후 공개될 개선 버전(patch release)를 소스 코드로부터 설치합니다. 개선 버전은 가장 최근의 주요 버전(major release)에 대한 버그 수정만 +포함되어 있습니다. + +.. code-block:: bash + + pip install https://github.com/Lightning-AI/lightning/archive/refs/heads/release/stable.zip -U + +---- + +******************************* +모델 개발에 최적화된 버전 설치 +******************************* +이미 Lightning으로 개발한 모델을 배포하기 위해 최소한의 의존성만을 필요로 하는 경우, 최적화된 `lightning[pytorch]` 패키지를 설치하세요: + +.. 
code-block:: bash + + pip install 'lightning[pytorch]' + +^^^^^^^^^^^^^^^^^^^^^^^^^^^ +PyTorch 버전 지정하기 +^^^^^^^^^^^^^^^^^^^^^^^^^^^ +특정한 PyTorch 버전을 사용하려면 `PyTorch 설치 페이지 `_ 를 참고하세요. + +---- + + +***************************************************** +ML 워크플로우에 최적화된 버전 설치하기 (lightning Apps) +***************************************************** +이미 Lightning으로 개발한 워크플로우를 배포하기 위해 최소한의 의존성만을 필요로 하는 경우, 최적화된 `lightning[apps]` 패키지를 설치하세요: + +.. code-block:: bash + + pip install lightning-app diff --git a/docs/source-pytorch/starter/introduction.rst b/docs/source-pytorch/starter/introduction.rst new file mode 100644 index 0000000..e6d5440 --- /dev/null +++ b/docs/source-pytorch/starter/introduction.rst @@ -0,0 +1,371 @@ +:orphan: + +####################### +Lightning in 15 minutes +####################### +**Required background:** None + +**Goal:** In this guide, we'll walk you through the 7 key steps of a typical Lightning workflow. + +PyTorch Lightning is the deep learning framework with "batteries included" for professional AI researchers and machine learning engineers who need maximal flexibility while super-charging performance at scale. + +Lightning organizes PyTorch code to remove boilerplate and unlock scalability. + +.. video:: ../_static/fetched-s3-assets/pl_readme_gif_2_0.mp4 + :width: 800 + :autoplay: + :loop: + :muted: + +By organizing PyTorch code, lightning enables: + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: Full flexibility + :description: Try any ideas using raw PyTorch without the boilerplate. + :col_css: col-md-3 + :image_center: ../_static/fetched-s3-assets/card_full_control.png + :height: 290 + +.. displayitem:: + :description: Decoupled research and engineering code enable reproducibility and better readability. + :header: Reproducible + Readable + :col_css: col-md-3 + :image_center: ../_static/fetched-s3-assets/card_no_boilerplate.png + :height: 290 + +.. displayitem:: + :description: Use multiple GPUs/TPUs/HPUs etc... without code changes. + :header: Simple multi-GPU training + :col_css: col-md-3 + :image_center: ../_static/fetched-s3-assets/card_hardware.png + :height: 290 + +.. displayitem:: + :description: We've done all the testing so you don't have to. + :header: Built-in testing + :col_css: col-md-3 + :image_center: ../_static/fetched-s3-assets/card_testing.png + :height: 290 + +.. raw:: html + +
+
+ +.. End of callout item section + +---- + +**************************** +1: Install PyTorch Lightning +**************************** +.. raw:: html + +
+
+ +For `pip `_ users + +.. code-block:: bash + + pip install lightning + +.. raw:: html + +
+
+ +For `conda `_ users + +.. code-block:: bash + + conda install lightning -c conda-forge + +.. raw:: html + +
+
+ +Or read the `advanced install guide `_ + +---- + +.. _new_project: + +*************************** +2: Define a LightningModule +*************************** + +A LightningModule enables your PyTorch nn.Modules to play together in complex ways inside the training_step (there are also optional validation_step and test_step methods). + +.. testcode:: + :skipif: not _TORCHVISION_AVAILABLE + + import os + from torch import optim, nn, utils, Tensor + from torchvision.datasets import MNIST + from torchvision.transforms import ToTensor + import lightning.pytorch as pl + + # define any number of nn.Modules (or use your current ones) + encoder = nn.Sequential(nn.Linear(28 * 28, 64), nn.ReLU(), nn.Linear(64, 3)) + decoder = nn.Sequential(nn.Linear(3, 64), nn.ReLU(), nn.Linear(64, 28 * 28)) + + + # define the LightningModule + class LitAutoEncoder(pl.LightningModule): + def __init__(self, encoder, decoder): + super().__init__() + self.encoder = encoder + self.decoder = decoder + + def training_step(self, batch, batch_idx): + # training_step defines the train loop. + # it is independent of forward + x, y = batch + x = x.view(x.size(0), -1) + z = self.encoder(x) + x_hat = self.decoder(z) + loss = nn.functional.mse_loss(x_hat, x) + # Logging to TensorBoard (if installed) by default + self.log("train_loss", loss) + return loss + + def configure_optimizers(self): + optimizer = optim.Adam(self.parameters(), lr=1e-3) + return optimizer + + + # init the autoencoder + autoencoder = LitAutoEncoder(encoder, decoder) + +---- + +******************* +3: Define a dataset +******************* + +Lightning supports ANY iterable (:class:`~torch.utils.data.DataLoader`, numpy, etc.) for the train/val/test/predict splits. + +.. 
code-block:: python + + # setup data + dataset = MNIST(os.getcwd(), download=True, transform=ToTensor()) + train_loader = utils.data.DataLoader(dataset) + +---- + +****************** +4: Train the model +****************** + +The Lightning :doc:`Trainer <../common/trainer>` "mixes" any :doc:`LightningModule <../common/lightning_module>` with any dataset and abstracts away all the engineering complexity needed for scale. + +.. code-block:: python + + # train the model (hint: here are some helpful Trainer arguments for rapid idea iteration) + trainer = pl.Trainer(limit_train_batches=100, max_epochs=1) + trainer.fit(model=autoencoder, train_dataloaders=train_loader) + +The Lightning :doc:`Trainer <../common/trainer>` automates `40+ tricks <../common/trainer.html#trainer-flags>`_ including: + +* Epoch and batch iteration +* ``optimizer.step()``, ``loss.backward()``, ``optimizer.zero_grad()`` calls +* Calling of ``model.eval()``, enabling/disabling grads during evaluation +* :doc:`Checkpoint Saving and Loading <../common/checkpointing>` +* Tensorboard (see :doc:`loggers <../visualize/loggers>` options) +* :doc:`Multi-GPU <../accelerators/gpu>` support +* :doc:`TPU <../accelerators/tpu>` +* :ref:`16-bit precision AMP ` support + +---- + + +**************** +5: Use the model +**************** +Once you've trained the model you can export to onnx, torchscript and put it into production or simply load the weights and run predictions. + +.. code:: python + + # load checkpoint + checkpoint = "./lightning_logs/version_0/checkpoints/epoch=0-step=100.ckpt" + autoencoder = LitAutoEncoder.load_from_checkpoint(checkpoint, encoder=encoder, decoder=decoder) + + # choose your trained nn.Module + encoder = autoencoder.encoder + encoder.eval() + + # embed 4 fake images! 
+ fake_image_batch = torch.rand(4, 28 * 28, device=autoencoder.device) + embeddings = encoder(fake_image_batch) + print("⚡" * 20, "\nPredictions (4 image embeddings):\n", embeddings, "\n", "⚡" * 20) + +---- + +********************* +6: Visualize training +********************* +If you have tensorboard installed, you can use it for visualizing experiments. + +Run this on your command line and open your browser to **http://localhost:6006/** + +.. code:: bash + + tensorboard --logdir . + +---- + +*********************** +7: Supercharge training +*********************** +Enable advanced training features using Trainer arguments. These are state-of-the-art techniques that are automatically integrated into your training loop without changes to your code. + +.. code:: + + # train on 4 GPUs + trainer = Trainer( + devices=4, + accelerator="gpu", + ) + + # train 1TB+ parameter models with Deepspeed/fsdp + trainer = Trainer( + devices=4, + accelerator="gpu", + strategy="deepspeed_stage_2", + precision=16 + ) + + # 20+ helpful flags for rapid idea iteration + trainer = Trainer( + max_epochs=10, + min_epochs=5, + overfit_batches=1 + ) + + # access the latest state of the art techniques + trainer = Trainer(callbacks=[StochasticWeightAveraging(...)]) + +---- + +******************** +Maximize flexibility +******************** +Lightning's core guiding principle is to always provide maximal flexibility **without ever hiding any of the PyTorch**. + +Lightning offers 5 *added* degrees of flexibility depending on your project's complexity. + +---- + +Customize training loop +======================= + +.. image:: ../_static/fetched-s3-assets/custom_loop.png + :width: 600 + :alt: Injecting custom code in a training loop + +Inject custom code anywhere in the training loop using any of the 20+ methods (:ref:`lightning_hooks`) available in the LightningModule. + +.. 
testcode:: + + class LitAutoEncoder(pl.LightningModule): + def backward(self, loss): + loss.backward() + +---- + +Extend the Trainer +================== + +.. video:: ../_static/fetched-s3-assets/cb.mp4 + :width: 600 + :autoplay: + :loop: + :muted: + +If you have multiple lines of code with similar functionalities, you can use callbacks to easily group them together and toggle all of those lines on or off at the same time. + +.. code:: + + trainer = Trainer(callbacks=[AWSCheckpoints()]) + +---- + +Use a raw PyTorch loop +====================== + +For certain types of work at the bleeding-edge of research, Lightning offers experts full control of optimization or the training loop in various ways. + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: Manual optimization + :description: Automated training loop, but you own the optimization steps. + :col_css: col-md-4 + :image_center: ../_static/fetched-s3-assets/manual_opt.png + :button_link: ../model/build_model_advanced.html#manual-optimization + :image_height: 220px + :height: 320 + +.. raw:: html + +
+
+ +.. End of callout item section + +---- + +********** +Next steps +********** +Depending on your use case, you might want to check one of these out next. + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: Level 2: Add a validation and test set + :description: Add validation and test sets to avoid over/underfitting. + :button_link: ../levels/basic_level_2.html + :col_css: col-md-3 + :height: 180 + :tag: basic + +.. displayitem:: + :header: See more examples + :description: See examples across computer vision, NLP, RL, etc... + :col_css: col-md-3 + :button_link: ../tutorials.html + :height: 180 + :tag: basic + +.. displayitem:: + :header: Deploy your model + :description: Learn how to predict or put your model into production + :col_css: col-md-3 + :button_link: ../deploy/production.html + :height: 180 + :tag: basic + +.. raw:: html + +
+
diff --git a/docs/source-pytorch/starter/style_guide.rst b/docs/source-pytorch/starter/style_guide.rst new file mode 100644 index 0000000..7bfc959 --- /dev/null +++ b/docs/source-pytorch/starter/style_guide.rst @@ -0,0 +1,223 @@ +########### +Style Guide +########### +The main goal of PyTorch Lightning is to improve readability and reproducibility. Imagine looking into any GitHub repo or a research project, +finding a :class:`~lightning.pytorch.core.module.LightningModule`, and knowing exactly where to look to find the things you care about. + +The goal of this style guide is to encourage Lightning code to be structured similarly. + +-------------- + +*************** +LightningModule +*************** + +These are best practices for structuring your :class:`~lightning.pytorch.core.module.LightningModule` class: + +Systems vs Models +================= + +.. figure:: ../_static/fetched-s3-assets/model_system.png + :width: 400 + +The main principle behind a LightningModule is that a full system should be self-contained. +In Lightning, we differentiate between a system and a model. + +A model is something like a resnet18, RNN, and so on. + +A system defines how a collection of models interact with each other with user-defined training/evaluation logic. Examples of this are: + +* GANs +* Seq2Seq +* BERT +* etc. + +A LightningModule can define both a system and a model: + +Here's a LightningModule that defines a system. This structure is what we recommend as a best practice. Keeping the model separate from the system improves +modularity, which eventually helps in better testing, reduces dependencies on the system and makes it easier to refactor. + +.. testcode:: + + class Encoder(nn.Module): + ... + + + class Decoder(nn.Module): + ... 
+ + + class AutoEncoder(nn.Module): + def __init__(self): + super().__init__() + self.encoder = Encoder() + self.decoder = Decoder() + + def forward(self, x): + return self.encoder(x) + + + class AutoEncoderSystem(LightningModule): + def __init__(self): + super().__init__() + self.auto_encoder = AutoEncoder() + + +For fast prototyping, it's often useful to define all the computations in a LightningModule. For reusability +and scalability, it might be better to pass in the relevant backbones. + +Here's a LightningModule that defines a model, although we do not recommend defining a model this way. + +.. testcode:: + + class LitModel(LightningModule): + def __init__(self): + super().__init__() + self.layer_1 = nn.Linear() + self.layer_2 = nn.Linear() + self.layer_3 = nn.Linear() + + +Self-contained +============== + +A Lightning module should be self-contained. To see how self-contained your model is, a good test is to ask +yourself this question: + +"Can someone drop this file into a Trainer without knowing anything about the internals?" + +For example, we couple the optimizer with a model because the majority of models require a specific optimizer with +a specific learning rate scheduler to work well. + +Init +==== +The first place where LightningModules tend to stop being self-contained is in the init. Try to define all the relevant +sensible defaults in the init so that the user doesn't have to guess. + +Here's an example where a user will have to go hunt through files to figure out how to init this LightningModule. + +.. testcode:: + + class LitModel(LightningModule): + def __init__(self, params): + self.lr = params.lr + self.coef_x = params.coef_x + +Models defined as such leave you with many questions, such as what is ``coef_x``? Is it a string? A float? What is the range? +Instead, be explicit in your init: + +.. testcode:: + + class LitModel(LightningModule): + def __init__(self, encoder: nn.Module, coef_x: float = 0.2, lr: float = 1e-3): + ... 
+ +Now the user doesn't have to guess. Instead, they know the value type, and the model has a sensible default where the +user can see the value immediately. + + +Method Order +============ +The only required methods in the LightningModule are: + +* init +* training_step +* configure_optimizers + +However, if you decide to implement the rest of the optional methods, the recommended order is: + +* model/system definition (init) +* if doing inference, define forward +* training hooks +* validation hooks +* test hooks +* predict hooks +* configure_optimizers +* any other hooks + +In practice, the code looks like this: + +.. code-block:: + + class LitModel(pl.LightningModule): + + def __init__(...): + + def forward(...): + + def training_step(...): + + def on_train_epoch_end(...): + + def validation_step(...): + + def on_validation_epoch_end(...): + + def test_step(...): + + def on_test_epoch_end(...): + + def configure_optimizers(...): + + def any_extra_hook(...): + + +Forward vs training_step +======================== + +We recommend using :meth:`~lightning.pytorch.core.module.LightningModule.forward` for inference/predictions and keeping +:meth:`~lightning.pytorch.core.module.LightningModule.training_step` independent. + +.. code-block:: python + + def forward(self, x): + embeddings = self.encoder(x) + return embeddings + + + def training_step(self, batch, batch_idx): + x, _ = batch + z = self.encoder(x) + pred = self.decoder(z) + ... + + +-------------- + +**** +Data +**** + +These are best practices for handling data. + +DataLoaders +=========== + +Lightning uses :class:`~torch.utils.data.DataLoader` to handle all the data flow through the system. Whenever you structure dataloaders, +make sure to tune the number of workers for maximum efficiency. 
+ + +DataModules +=========== + +The :class:`~lightning.pytorch.core.datamodule.LightningDataModule` is designed as a way of decoupling data-related +hooks from the :class:`~lightning.pytorch.core.module.LightningModule` so you can develop dataset-agnostic models. It makes it easy to hot swap different +datasets with your model, so you can test it and benchmark it across domains. It also makes sharing and reusing the exact data splits and transforms across projects possible. + +Check out the :ref:`data` document to understand data management within Lightning and its best practices. A datamodule also makes it easy to answer questions such as: + +* What dataset splits were used? +* How many samples does this dataset have overall and within each split? +* Which transforms were used? + +It's for this reason that we recommend you use datamodules. This is especially important when collaborating because +it will save your team a lot of time as well. + +All they need to do is drop a datamodule into the Trainer and not worry about what was done to the data. + +This is true for both academic and corporate settings where data cleaning and ad-hoc instructions slow down the progress +of iterating through ideas. 
+ +- Check out the live examples to get your hands dirty: +- `Introduction to PyTorch Lightning `_ +- `Introduction to DataModules `_ diff --git a/source/tuning/profiler.rst b/docs/source-pytorch/tuning/profiler.rst similarity index 100% rename from source/tuning/profiler.rst rename to docs/source-pytorch/tuning/profiler.rst diff --git a/source/tuning/profiler_advanced.rst b/docs/source-pytorch/tuning/profiler_advanced.rst similarity index 93% rename from source/tuning/profiler_advanced.rst rename to docs/source-pytorch/tuning/profiler_advanced.rst index ad2ab9e..63a0013 100644 --- a/source/tuning/profiler_advanced.rst +++ b/docs/source-pytorch/tuning/profiler_advanced.rst @@ -12,11 +12,11 @@ Find bottlenecks in your code (advanced) ************************ Profile cloud TPU models ************************ -To profile TPU models use the :class:`~pytorch_lightning.profiler.xla.XLAProfiler` +To profile TPU models use the :class:`~lightning.pytorch.profilers.xla.XLAProfiler` .. code-block:: python - from pytorch_lightning.profiler import XLAProfiler + from lightning.pytorch.profilers import XLAProfiler profiler = XLAProfiler(port=9001) trainer = Trainer(profiler=profiler) diff --git a/source/tuning/profiler_basic.rst b/docs/source-pytorch/tuning/profiler_basic.rst similarity index 88% rename from source/tuning/profiler_basic.rst rename to docs/source-pytorch/tuning/profiler_basic.rst index 899e657..d248cc6 100644 --- a/source/tuning/profiler_basic.rst +++ b/docs/source-pytorch/tuning/profiler_basic.rst @@ -59,7 +59,6 @@ The simple profiler measures all the standard methods used in the training loop - on_after_backward - optimizer_step - on_train_batch_end -- training_step_end - on_training_end - etc... 
@@ -68,7 +67,7 @@ The simple profiler measures all the standard methods used in the training loop ************************************** Profile the time within every function ************************************** -To profile the time within every function, use the :class:`~pytorch_lightning.profiler.advanced.AdvancedProfiler` built on top of Python's `cProfiler `_. +To profile the time within every function, use the :class:`~lightning.pytorch.profilers.advanced.AdvancedProfiler` built on top of Python's `cProfiler `_. .. code-block:: python @@ -101,7 +100,7 @@ If the profiler report becomes too long, you can stream the report to a file: .. code-block:: python - from pytorch_lightning.profiler import AdvancedProfiler + from lightning.pytorch.profilers import AdvancedProfiler profiler = AdvancedProfiler(dirpath=".", filename="perf_logs") trainer = Trainer(profiler=profiler) @@ -112,10 +111,13 @@ If the profiler report becomes too long, you can stream the report to a file: Measure accelerator usage ************************* Another helpful technique to detect bottlenecks is to ensure that you're using the full capacity of your accelerator (GPU/TPU/IPU/HPU). -This can be measured with the :class:`~pytorch_lightning.callbacks.device_stats_monitor.DeviceStatsMonitor`: +This can be measured with the :class:`~lightning.pytorch.callbacks.device_stats_monitor.DeviceStatsMonitor`: .. testcode:: - from pytorch_lightning.callbacks import DeviceStatsMonitor + from lightning.pytorch.callbacks import DeviceStatsMonitor trainer = Trainer(callbacks=[DeviceStatsMonitor()]) + +CPU metrics will be tracked by default on the CPU accelerator. To enable it for other accelerators set ``DeviceStatsMonitor(cpu_stats=True)``. To disable logging +CPU metrics, you can specify ``DeviceStatsMonitor(cpu_stats=False)``. 
diff --git a/source/tuning/profiler_expert.rst b/docs/source-pytorch/tuning/profiler_expert.rst similarity index 90% rename from source/tuning/profiler_expert.rst rename to docs/source-pytorch/tuning/profiler_expert.rst index 64ff784..a64c0fa 100644 --- a/source/tuning/profiler_expert.rst +++ b/docs/source-pytorch/tuning/profiler_expert.rst @@ -12,12 +12,12 @@ Find bottlenecks in your code (expert) *********************** Build your own profiler *********************** -To build your own profiler, subclass :class:`~pytorch_lightning.profiler.base.Profiler` +To build your own profiler, subclass :class:`~lightning.pytorch.profilers.profiler.Profiler` and override some of its methods. Here is a simple example that profiles the first occurrence and total calls of each action: .. code-block:: python - from pytorch_lightning.profiler import Profiler + from lightning.pytorch.profilers import Profiler from collections import defaultdict import time @@ -69,7 +69,7 @@ To profile a specific action of interest, reference a profiler in the LightningM .. code-block:: python - from pytorch_lightning.profiler import SimpleProfiler, PassThroughProfiler + from lightning.pytorch.profilers import SimpleProfiler, PassThroughProfiler class MyModel(LightningModule): @@ -90,7 +90,7 @@ Here's the full code: .. 
code-block:: python - from pytorch_lightning.profiler import SimpleProfiler, PassThroughProfiler + from lightning.pytorch.profilers import SimpleProfiler, PassThroughProfiler class MyModel(LightningModule): diff --git a/source/tuning/profiler_intermediate.rst b/docs/source-pytorch/tuning/profiler_intermediate.rst similarity index 92% rename from source/tuning/profiler_intermediate.rst rename to docs/source-pytorch/tuning/profiler_intermediate.rst index d2b64b5..802bfc5 100644 --- a/source/tuning/profiler_intermediate.rst +++ b/docs/source-pytorch/tuning/profiler_intermediate.rst @@ -12,11 +12,11 @@ Find bottlenecks in your code (intermediate) ************************** Profile pytorch operations ************************** -To understand the cost of each PyTorch operation, use the :class:`~pytorch_lightning.profiler.pytorch.PyTorchProfiler` built on top of the `PyTorch profiler `__. +To understand the cost of each PyTorch operation, use the :class:`~lightning.pytorch.profilers.pytorch.PyTorchProfiler` built on top of the `PyTorch profiler `__. .. code-block:: python - from pytorch_lightning.profiler import PyTorchProfiler + from lightning.pytorch.profilers import PyTorchProfiler profiler = PyTorchProfiler() trainer = Trainer(profiler=profiler) @@ -65,11 +65,11 @@ The profiler will generate an output like this: *************************** Profile a distributed model *************************** -To profile a distributed model, use the :class:`~pytorch_lightning.profiler.pytorch.PyTorchProfiler` with the *filename* argument which will save a report per rank. +To profile a distributed model, use the :class:`~lightning.pytorch.profilers.pytorch.PyTorchProfiler` with the *filename* argument which will save a report per rank. .. 
code-block:: python - from pytorch_lightning.profiler import PyTorchProfiler + from lightning.pytorch.profilers import PyTorchProfiler profiler = PyTorchProfiler(filename="perf-logs") trainer = Trainer(profiler=profiler) @@ -138,9 +138,8 @@ With two ranks, it will generate a report like so: --------------------- --------------- --------------- --------------- --------------- --------------- Self CPU time total: 1.681ms -This profiler will record ``training_step``, ``backward``, ``validation_step``, ``test_step``, and ``predict_step`` by default. -The output below shows the profiling for the action ``training_step``. The user can provide ``PyTorchProfiler(record_functions={...})`` -to extend the scope of profiled functions. +This profiler will record ``training_step``, ``validation_step``, ``test_step``, and ``predict_step``. +The output above shows the profiling for the action ``training_step``. .. note:: When using the PyTorch Profiler, wall clock time will not not be representative of the true wall clock time. @@ -153,11 +152,11 @@ to extend the scope of profiled functions. ***************************** Visualize profiled operations ***************************** -To visualize the profiled operations, enable **emit_nvtx** in the :class:`~pytorch_lightning.profiler.pytorch.PyTorchProfiler`. +To visualize the profiled operations, enable **emit_nvtx** in the :class:`~lightning.pytorch.profilers.pytorch.PyTorchProfiler`. .. 
code-block:: python - from pytorch_lightning.profiler import PyTorchProfiler + from lightning.pytorch.profilers import PyTorchProfiler profiler = PyTorchProfiler(emit_nvtx=True) trainer = Trainer(profiler=profiler) diff --git a/source/tutorials.rst b/docs/source-pytorch/tutorials.rst similarity index 88% rename from source/tutorials.rst rename to docs/source-pytorch/tutorials.rst index 67b1abb..1d69b07 100644 --- a/source/tutorials.rst +++ b/docs/source-pytorch/tutorials.rst @@ -1,5 +1,3 @@ -:orphan: - PyTorch Lightning Tutorials =========================== diff --git a/docs/source-pytorch/upgrade/from_1_4.rst b/docs/source-pytorch/upgrade/from_1_4.rst new file mode 100644 index 0000000..d0117be --- /dev/null +++ b/docs/source-pytorch/upgrade/from_1_4.rst @@ -0,0 +1,34 @@ +:orphan: + +Upgrade from 1.4 to the 2.0 +########################### + +Regular User +************ + +.. include:: sections/1_4_regular.rst +.. include:: sections/1_5_regular.rst +.. include:: sections/1_6_regular.rst +.. include:: sections/1_7_regular.rst +.. include:: sections/1_8_regular.rst +.. include:: sections/1_9_regular.rst + +Advanced User +************* + +.. include:: sections/1_4_advanced.rst +.. include:: sections/1_5_advanced.rst +.. include:: sections/1_6_advanced.rst +.. include:: sections/1_7_advanced.rst +.. include:: sections/1_8_advanced.rst +.. include:: sections/1_9_advanced.rst + +Developer +********* + +.. include:: sections/1_4_devel.rst +.. include:: sections/1_5_devel.rst +.. include:: sections/1_6_devel.rst +.. include:: sections/1_7_devel.rst +.. include:: sections/1_8_devel.rst +.. include:: sections/1_9_devel.rst diff --git a/docs/source-pytorch/upgrade/from_1_5.rst b/docs/source-pytorch/upgrade/from_1_5.rst new file mode 100644 index 0000000..16d13e6 --- /dev/null +++ b/docs/source-pytorch/upgrade/from_1_5.rst @@ -0,0 +1,31 @@ +:orphan: + +Upgrade from 1.5 to the 2.0 +########################### + +Regular User +************ + +.. 
include:: sections/1_5_regular.rst +.. include:: sections/1_6_regular.rst +.. include:: sections/1_7_regular.rst +.. include:: sections/1_8_regular.rst +.. include:: sections/1_9_regular.rst + +Advanced User +************* + +.. include:: sections/1_5_advanced.rst +.. include:: sections/1_6_advanced.rst +.. include:: sections/1_7_advanced.rst +.. include:: sections/1_8_advanced.rst +.. include:: sections/1_9_advanced.rst + +Developer +********* + +.. include:: sections/1_5_devel.rst +.. include:: sections/1_6_devel.rst +.. include:: sections/1_7_devel.rst +.. include:: sections/1_8_devel.rst +.. include:: sections/1_9_devel.rst diff --git a/docs/source-pytorch/upgrade/from_1_6.rst b/docs/source-pytorch/upgrade/from_1_6.rst new file mode 100644 index 0000000..c0d5155 --- /dev/null +++ b/docs/source-pytorch/upgrade/from_1_6.rst @@ -0,0 +1,28 @@ +:orphan: + +Upgrade from 1.6 to the 2.0 +########################### + +Regular User +************ + +.. include:: sections/1_6_regular.rst +.. include:: sections/1_7_regular.rst +.. include:: sections/1_8_regular.rst +.. include:: sections/1_9_regular.rst + +Advanced User +************* + +.. include:: sections/1_6_advanced.rst +.. include:: sections/1_7_advanced.rst +.. include:: sections/1_8_advanced.rst +.. include:: sections/1_9_advanced.rst + +Developer +********* + +.. include:: sections/1_6_devel.rst +.. include:: sections/1_7_devel.rst +.. include:: sections/1_8_devel.rst +.. include:: sections/1_9_devel.rst diff --git a/docs/source-pytorch/upgrade/from_1_7.rst b/docs/source-pytorch/upgrade/from_1_7.rst new file mode 100644 index 0000000..b1413b9 --- /dev/null +++ b/docs/source-pytorch/upgrade/from_1_7.rst @@ -0,0 +1,25 @@ +:orphan: + +Upgrade from 1.7 to the 2.0 +########################### + +Regular User +************ + +.. include:: sections/1_7_regular.rst +.. include:: sections/1_8_regular.rst +.. include:: sections/1_9_regular.rst + +Advanced User +************* + +.. include:: sections/1_7_advanced.rst +.. 
include:: sections/1_8_advanced.rst +.. include:: sections/1_9_advanced.rst + +Developer +********* + +.. include:: sections/1_7_devel.rst +.. include:: sections/1_8_devel.rst +.. include:: sections/1_9_devel.rst diff --git a/docs/source-pytorch/upgrade/from_1_8.rst b/docs/source-pytorch/upgrade/from_1_8.rst new file mode 100644 index 0000000..c844d3f --- /dev/null +++ b/docs/source-pytorch/upgrade/from_1_8.rst @@ -0,0 +1,22 @@ +:orphan: + +Upgrade from 1.8 to the 2.0 +########################### + +Regular User +************ + +.. include:: sections/1_8_regular.rst +.. include:: sections/1_9_regular.rst + +Advanced User +************* + +.. include:: sections/1_8_advanced.rst +.. include:: sections/1_9_advanced.rst + +Developer +********* + +.. include:: sections/1_8_devel.rst +.. include:: sections/1_9_devel.rst diff --git a/docs/source-pytorch/upgrade/from_1_9.rst b/docs/source-pytorch/upgrade/from_1_9.rst new file mode 100644 index 0000000..e1233d9 --- /dev/null +++ b/docs/source-pytorch/upgrade/from_1_9.rst @@ -0,0 +1,16 @@ +:orphan: + +Regular User +************ + +.. include:: sections/1_9_regular.rst + +Advanced User +************* + +.. include:: sections/1_9_advanced.rst + +Developer +********* + +.. include:: sections/1_9_devel.rst diff --git a/docs/source-pytorch/upgrade/migration_guide.rst b/docs/source-pytorch/upgrade/migration_guide.rst new file mode 100644 index 0000000..8e2d451 --- /dev/null +++ b/docs/source-pytorch/upgrade/migration_guide.rst @@ -0,0 +1,63 @@ +Guide how to upgrade to the 2.0 version +####################################### + +The following section will guide you through updating to the 2.0 release. + +Particular versions +******************* + + + +.. raw:: html + +
+
+ +.. Add callout items below this line + +.. displayitem:: + :header: 1.9.x + :description: Upgrade from 1.9.x series to the 2.0. + :col_css: col-md-12 + :button_link: from_1_9.html + :height: 100 + +.. displayitem:: + :header: 1.8.x + :description: Upgrade from 1.8.x series to the 2.0. + :col_css: col-md-12 + :button_link: from_1_8.html + :height: 100 + +.. displayitem:: + :header: 1.7.x + :description: Upgrade from 1.7.x series to the 2.0. + :col_css: col-md-12 + :button_link: from_1_7.html + :height: 100 + +.. displayitem:: + :header: 1.6.x + :description: Upgrade from 1.6.x series to the 2.0. + :col_css: col-md-12 + :button_link: from_1_6.html + :height: 100 + +.. displayitem:: + :header: 1.5.x + :description: Upgrade from 1.5.x series to the 2.0. + :col_css: col-md-12 + :button_link: from_1_5.html + :height: 100 + +.. displayitem:: + :header: 1.4.x + :description: Upgrade from 1.4.x series to the 2.0. + :col_css: col-md-12 + :button_link: from_1_4.html + :height: 100 + +.. raw:: html + +
+
diff --git a/docs/source-pytorch/upgrade/sections/1_4_advanced.rst b/docs/source-pytorch/upgrade/sections/1_4_advanced.rst new file mode 100644 index 0000000..b43a316 --- /dev/null +++ b/docs/source-pytorch/upgrade/sections/1_4_advanced.rst @@ -0,0 +1,43 @@ +.. list-table:: adv. user 1.4 + :widths: 40 40 20 + :header-rows: 1 + + * - If + - Then + - Ref + + * - called ``ModelCheckpoint.save_function`` + - now call ``Trainer.save_checkpoint`` + - `PR7201`_ + + * - accessed the ``Trainer.running_sanity_check`` property + - now access the ``Trainer.sanity_checking`` property + - `PR4945`_ + + * - used ``LightningModule.grad_norm`` + - now use the ``pl.utilities.grad_norm`` utility function instead + - `PR7292`_ + + * - used ``TrainerTrainingTricksMixin.detect_nan_tensors`` + - now use ``pl.utilities.grads.grad_norm`` + - `PR6834`_ + + * - used ``TrainerTrainingTricksMixin.print_nan_gradients`` + - now use ``pl.utilities.finite_checks.print_nan_gradients`` + - `PR6834`_ + + * - relied on ``TrainerLoggingMixin.metrics_to_scalars`` + - now use ``pl.utilities.metrics.metrics_to_scalars`` + - `PR7180`_ + + * - selected the i-th GPU with ``Trainer(gpus="i,j")`` + - now this will set the number of GPUs, just like passing ``Trainer(devices=i)``; you can still select the specific GPU by setting the ``CUDA_VISIBLE_DEVICES=i,j`` environment variable + - `PR6388`_ + + +.. _pr7201: https://github.com/Lightning-AI/lightning/pull/7201 +.. _pr4945: https://github.com/Lightning-AI/lightning/pull/4945 +.. _pr7292: https://github.com/Lightning-AI/lightning/pull/7292 +.. _pr6834: https://github.com/Lightning-AI/lightning/pull/6834 +.. _pr7180: https://github.com/Lightning-AI/lightning/pull/7180 +..
_pr6388: https://github.com/Lightning-AI/lightning/pull/6388 diff --git a/docs/source-pytorch/upgrade/sections/1_4_devel.rst b/docs/source-pytorch/upgrade/sections/1_4_devel.rst new file mode 100644 index 0000000..e69de29 diff --git a/docs/source-pytorch/upgrade/sections/1_4_regular.rst b/docs/source-pytorch/upgrade/sections/1_4_regular.rst new file mode 100644 index 0000000..866bef5 --- /dev/null +++ b/docs/source-pytorch/upgrade/sections/1_4_regular.rst @@ -0,0 +1,59 @@ +.. list-table:: reg. user 1.4 + :widths: 40 40 20 + :header-rows: 1 + + * - If + - Then + - Ref + + * - relied on the ``outputs`` in your ``LightningModule.on_train_epoch_end`` or ``Callback.on_train_epoch_end`` hooks + - rely on either ``on_train_epoch_end`` or set outputs as attributes in your ``LightningModule`` instances and access them from the hook + - `PR7339`_ + + * - accessed ``Trainer.truncated_bptt_steps`` + - switch to manual optimization + - `PR7323`_ + + * - called ``LightningModule.write_predictions`` and ``LightningModule.write_predictions_dict`` + - rely on ``predict_step`` and ``Trainer.predict`` + callbacks to write out predictions + - `PR7066`_ + + * - passed the ``period`` argument to the ``ModelCheckpoint`` callback + - pass the ``every_n_epochs`` argument to the ``ModelCheckpoint`` callback + - `PR6146`_ + + * - passed the ``output_filename`` argument to ``Profiler`` + - now pass ``dirpath`` and ``filename``, that is ``Profiler(dirpath=..., filename=...)`` + - `PR6621`_ + + * - passed the ``profiled_functions`` argument in ``PyTorchProfiler`` + - now pass the ``record_functions`` argument + - `PR6349`_ + + * - relied on the ``@auto_move_data`` decorator to use the ``LightningModule`` outside of the ``Trainer`` for inference + - use ``Trainer.predict`` + - `PR6993`_ + + * - implemented ``on_load_checkpoint`` with a ``checkpoint`` only argument, as in ``Callback.on_load_checkpoint(checkpoint)`` + - now update the signature to include ``pl_module`` and ``trainer``, as in
``Callback.on_load_checkpoint(trainer, pl_module, checkpoint)`` + - `PR7253`_ + + * - relied on ``pl.metrics`` + - now import separate package ``torchmetrics`` + - `torchmetrics`_ + + * - accessed ``datamodule`` attribute of ``LightningModule``, that is ``model.datamodule`` + - now access ``Trainer.datamodule``, that is ``model.trainer.datamodule`` + - `PR7168`_ + + +.. _torchmetrics: https://torchmetrics.readthedocs.io/en/stable +.. _pr7339: https://github.com/Lightning-AI/lightning/pull/7339 +.. _pr7323: https://github.com/Lightning-AI/lightning/pull/7323 +.. _pr7066: https://github.com/Lightning-AI/lightning/pull/7066 +.. _pr6146: https://github.com/Lightning-AI/lightning/pull/6146 +.. _pr6621: https://github.com/Lightning-AI/lightning/pull/6621 +.. _pr6349: https://github.com/Lightning-AI/lightning/pull/6349 +.. _pr6993: https://github.com/Lightning-AI/lightning/pull/6993 +.. _pr7253: https://github.com/Lightning-AI/lightning/pull/7253 +.. _pr7168: https://github.com/Lightning-AI/lightning/pull/7168 diff --git a/docs/source-pytorch/upgrade/sections/1_5_advanced.rst b/docs/source-pytorch/upgrade/sections/1_5_advanced.rst new file mode 100644 index 0000000..22ba000 --- /dev/null +++ b/docs/source-pytorch/upgrade/sections/1_5_advanced.rst @@ -0,0 +1,75 @@ +.. list-table:: adv. user 1.5 + :widths: 40 40 20 + :header-rows: 1 + + * - If + - Then + - Ref + + * - used ``self.log(sync_dist_op=...)`` + - use ``self.log(reduce_fx=...)`` instead. 
Passing ``"mean"`` will still work, but it also takes a callable + - `PR7891`_ + + * - used the argument ``model`` from ``pytorch_lightning.utilities.model_helper.is_overridden`` + - use ``instance`` instead + - `PR7918`_ + + * - returned values from ``training_step`` that had ``.grad`` defined (e.g., a loss) and expected ``.detach()`` to be called for you + - call ``.detach()`` manually + - `PR7994`_ + + * - imported ``pl.utilities.distributed.rank_zero_warn`` + - import ``pl.utilities.rank_zero.rank_zero_warn`` + - + + * - relied on ``DataModule.has_prepared_data`` attribute + - manage data lifecycle in custom methods + - `PR7657`_ + + * - relied on ``DataModule.has_setup_fit`` attribute + - manage data lifecycle in custom methods + - `PR7657`_ + + * - relied on ``DataModule.has_setup_validate`` attribute + - manage data lifecycle in custom methods + - `PR7657`_ + + * - relied on ``DataModule.has_setup_test`` attribute + - manage data lifecycle in custom methods + - `PR7657`_ + + * - relied on ``DataModule.has_setup_predict`` attribute + - manage data lifecycle in custom methods + - `PR7657`_ + + * - relied on ``DataModule.has_teardown_fit`` attribute + - manage data lifecycle in custom methods + - `PR7657`_ + + * - relied on ``DataModule.has_teardown_validate`` attribute + - manage data lifecycle in custom methods + - `PR7657`_ + + * - relied on ``DataModule.has_teardown_test`` attribute + - manage data lifecycle in custom methods + - `PR7657`_ + + * - relied on ``DataModule.has_teardown_predict`` attribute + - manage data lifecycle in custom methods + - `PR7657`_ + + * - used ``DDPPlugin.task_idx`` + - use ``DDPStrategy.local_rank`` + - `PR8203`_ + + * - used ``Trainer.disable_validation`` + - use the condition ``not Trainer.enable_validation`` + - `PR8291`_ + + +.. _pr7891: https://github.com/Lightning-AI/lightning/pull/7891 +.. _pr7918: https://github.com/Lightning-AI/lightning/pull/7918 +..
_pr7994: https://github.com/Lightning-AI/lightning/pull/7994 +.. _pr7657: https://github.com/Lightning-AI/lightning/pull/7657 +.. _pr8203: https://github.com/Lightning-AI/lightning/pull/8203 +.. _pr8291: https://github.com/Lightning-AI/lightning/pull/8291 diff --git a/docs/source-pytorch/upgrade/sections/1_5_devel.rst b/docs/source-pytorch/upgrade/sections/1_5_devel.rst new file mode 100644 index 0000000..dcaefe4 --- /dev/null +++ b/docs/source-pytorch/upgrade/sections/1_5_devel.rst @@ -0,0 +1,30 @@ +.. list-table:: devel 1.5 + :widths: 40 40 20 + :header-rows: 1 + + * - If + - Then + - Ref + + + * - called ``CheckpointConnector.hpc_load()`` + - just call ``CheckpointConnector.restore()`` + - `PR7652`_ + + * - used ``TrainerModelHooksMixin`` + - now rely on the corresponding utility functions in ``pytorch_lightning.utilities.signature_utils`` + - `PR7422`_ + + * - assigned the ``Trainer.train_loop`` property + - now assign the equivalent ``Trainer.fit_loop`` property + - `PR8025`_ + + * - accessed ``LightningModule.loaded_optimizer_states_dict`` + - the property has been removed + - `PR8229`_ + + +.. _pr7652: https://github.com/Lightning-AI/lightning/pull/7652 +.. _pr7422: https://github.com/Lightning-AI/lightning/pull/7422 +.. _pr8025: https://github.com/Lightning-AI/lightning/pull/8025 +.. _pr8229: https://github.com/Lightning-AI/lightning/pull/8229 diff --git a/docs/source-pytorch/upgrade/sections/1_5_regular.rst b/docs/source-pytorch/upgrade/sections/1_5_regular.rst new file mode 100644 index 0000000..994cfae --- /dev/null +++ b/docs/source-pytorch/upgrade/sections/1_5_regular.rst @@ -0,0 +1,47 @@ +.. list-table:: reg. 
user 1.5 + :widths: 40 40 20 + :header-rows: 1 + + * - If + - Then + - Ref + + * - used ``trainer.fit(train_dataloaders=...)`` + - use ``trainer.fit(dataloaders=...)`` + - `PR7431`_ + + * - used ``trainer.validate(val_dataloaders=...)`` + - use ``trainer.validate(dataloaders=...)`` + - `PR7431`_ + + * - passed ``num_nodes`` to ``DDPPlugin`` and ``DDPSpawnPlugin`` + - remove them since these parameters are now passed from the ``Trainer`` + - `PR7026`_ + + * - passed ``sync_batchnorm`` to ``DDPPlugin`` and ``DDPSpawnPlugin`` + - remove them since these parameters are now passed from the ``Trainer`` + - `PR7026`_ + + * - didn’t provide a ``monitor`` argument to the ``EarlyStopping`` callback and just relied on the default value + - pass ``monitor`` as it is now a required argument + - `PR7907`_ + + * - used ``every_n_val_epochs`` in ``ModelCheckpoint`` + - change the argument to ``every_n_epochs`` + - `PR8383`_ + + * - used Trainer’s flag ``reload_dataloaders_every_epoch`` + - pass ``reload_dataloaders_every_n_epochs`` + - `PR5043`_ + + * - used Trainer’s flag ``distributed_backend`` + - use ``strategy`` + - `PR8575`_ + + +.. _pr7431: https://github.com/Lightning-AI/lightning/pull/7431 +.. _pr7026: https://github.com/Lightning-AI/lightning/pull/7026 +.. _pr7907: https://github.com/Lightning-AI/lightning/pull/7907 +.. _pr8383: https://github.com/Lightning-AI/lightning/pull/8383 +.. _pr5043: https://github.com/Lightning-AI/lightning/pull/5043 +.. _pr8575: https://github.com/Lightning-AI/lightning/pull/8575 diff --git a/docs/source-pytorch/upgrade/sections/1_6_advanced.rst b/docs/source-pytorch/upgrade/sections/1_6_advanced.rst new file mode 100644 index 0000000..c17be4a --- /dev/null +++ b/docs/source-pytorch/upgrade/sections/1_6_advanced.rst @@ -0,0 +1,61 @@ +.. list-table:: adv.
user 1.6 + :widths: 40 40 20 + :header-rows: 1 + + * - If + - Then + - Ref + + * - passed ``prepare_data_per_node`` to the ``Trainer`` + - set it as a property of ``DataHooks``, accessible in the ``LightningModule`` and ``LightningDataModule`` instead + - `PR8958`_ + + * - used ``process_position`` flag + - specify your ``ProgressBar`` callback and set it as ``process_position`` directly + - `PR9222`_ + + * - used distributed training attributes ``add_to_queue`` and ``get_from_queue`` in ``LightningModule`` + - use the same methods in ``DDPStrategy(start_method='spawn')`` + - `PR9118`_ + + * - called ``LightningModule.get_progress_bar_dict`` + - use the utility function ``pl.callbacks.progress.base.get_standard_metrics(module.trainer)`` + - `PR9118`_ + + * - used ``LightningModule.on_post_move_to_device`` + - remove it as parameters tying happens automatically without the need of implementing your own logic + - `PR9525`_ + + * - relied on ``Trainer.progress_bar_dict`` + - use ``ProgressBarBase.get_metrics`` + - `PR9118`_ + + * - used ``LightningDistributed`` + - rely on the logic in ``DDPStrategy(start_method='...')`` + - `PR9691`_ + + * - used the Accelerator collective API ``Accelerator.barrier``, ``Accelerator.broadcast``, and ``Accelerator.all_gather`` + - call ``Strategy`` collectives API directly, without going through ``Accelerator`` + - `PR9677`_ + + * - used ``pytorch_lightning.core.decorators.parameter_validation`` + - rely on automatic parameters tying with ``pytorch_lightning.utilities.params_tying.set_shared_parameters`` + - `PR9525`_ + + * - used ``LearningRateMonitor.lr_sch_names`` + - access them using ``LearningRateMonitor.lrs.keys()`` which will return the names of all the optimizers, even those without a scheduler. + - `PR10066`_ + + * - implemented ``DataModule`` ``train_transforms``, ``val_transforms``, ``test_transforms``, ``size``, ``dims`` + - switch to ``LightningDataModule`` + - `PR8851`_ + + +..
_pr8958: https://github.com/Lightning-AI/lightning/pull/8958 +.. _pr9222: https://github.com/Lightning-AI/lightning/pull/9222 +.. _pr9118: https://github.com/Lightning-AI/lightning/pull/9118 +.. _pr9525: https://github.com/Lightning-AI/lightning/pull/9525 +.. _pr9691: https://github.com/Lightning-AI/lightning/pull/9691 +.. _pr9677: https://github.com/Lightning-AI/lightning/pull/9677 +.. _pr10066: https://github.com/Lightning-AI/lightning/pull/10066 +.. _pr8851: https://github.com/Lightning-AI/lightning/pull/8851 diff --git a/docs/source-pytorch/upgrade/sections/1_6_devel.rst b/docs/source-pytorch/upgrade/sections/1_6_devel.rst new file mode 100644 index 0000000..9369de0 --- /dev/null +++ b/docs/source-pytorch/upgrade/sections/1_6_devel.rst @@ -0,0 +1,37 @@ +.. list-table:: devel 1.6 + :widths: 40 40 20 + :header-rows: 1 + + * - If + - Then + - Ref + + * - called ``LightningLoggerBase.close`` + - switch to ``LightningLoggerBase.finalize``. + - `PR9422`_ + + * - called ``LoggerCollection.close`` + - switch to ``LoggerCollection.finalize``. + - `PR9422`_ + + * - used ``AcceleratorConnector.is_slurm_managing_tasks`` attribute + - it is now set as protected and discouraged from direct use + - `PR10101`_ + + * - used ``AcceleratorConnector.configure_slurm_ddp`` attributes + - it is now set as protected and discouraged from direct use + - `PR10101`_ + + * - used ``ClusterEnvironment.creates_children()`` method + - change it to ``ClusterEnvironment.creates_processes_externally`` which is a property now. + - `PR10106`_ + + * - called ``PrecisionPlugin.master_params()`` + - update it to ``PrecisionPlugin.main_params()`` + - `PR10105`_ + + +.. _pr9422: https://github.com/Lightning-AI/lightning/pull/9422 +.. _pr10101: https://github.com/Lightning-AI/lightning/pull/10101 +.. _pr10105: https://github.com/Lightning-AI/lightning/pull/10105 +..
_pr10106: https://github.com/Lightning-AI/lightning/pull/10106 diff --git a/docs/source-pytorch/upgrade/sections/1_6_regular.rst b/docs/source-pytorch/upgrade/sections/1_6_regular.rst new file mode 100644 index 0000000..e016084 --- /dev/null +++ b/docs/source-pytorch/upgrade/sections/1_6_regular.rst @@ -0,0 +1,105 @@ +.. list-table:: reg. user 1.6 + :widths: 40 40 20 + :header-rows: 1 + + * - If + - Then + - Ref + + * - used Trainer’s flag ``terminate_on_nan`` + - set ``detect_anomaly`` instead, which enables detecting anomalies in the autograd engine + - `PR9175`_ + + * - used Trainer’s flag ``weights_summary`` + - pass a ``ModelSummary`` callback with ``max_depth`` instead + - `PR9699`_ + + * - used Trainer’s flag ``checkpoint_callback`` + - set ``enable_checkpointing``. If you set ``enable_checkpointing=True``, it configures a default ``ModelCheckpoint`` callback if none is provided ``lightning_pytorch.trainer.trainer.Trainer.callbacks.ModelCheckpoint`` + - `PR9754`_ + + * - used Trainer’s flag ``stochastic_weight_avg`` + - add the ``StochasticWeightAveraging`` callback directly to the list of callbacks, so for example, ``Trainer(..., callbacks=[StochasticWeightAveraging(), ...])`` + - `PR8989`_ + + * - used Trainer’s flag ``flush_logs_every_n_steps`` + - pass it to the logger init if it is supported for the particular logger + - `PR9366`_ + + * - used Trainer’s flag ``max_steps`` to the ``Trainer``, ``max_steps=None`` won't have any effect + - turn off the limit by passing ``Trainer(max_steps=-1)`` which is the default + - `PR9460`_ + + * - used Trainer’s flag ``resume_from_checkpoint="..."`` + - pass the same path to the fit function instead, ``trainer.fit(ckpt_path="...")`` + - `PR9693`_ + + * - used Trainer’s flag ``log_gpu_memory``, ``gpu_metrics`` + - use the ``DeviceStatsMonitor`` callback instead + - `PR9921`_ + + * - used Trainer’s flag ``progress_bar_refresh_rate`` + - set the ``ProgressBar`` callback and set ``refresh_rate`` there, or pass 
``enable_progress_bar=False`` to disable the progress bar + - `PR9616`_ + + * - called ``LightningModule.summarize()`` + - use the utility function ``pl.utilities.model_summary.summarize(model)`` + - `PR8513`_ + + * - used the ``LightningModule.model_size`` property + - use the utility function ``pl.utilities.memory.get_model_size_mb(model)`` + - `PR8495`_ + + * - relied on the ``on_train_dataloader()`` hooks in ``LightningModule`` and ``LightningDataModule`` + - use ``train_dataloader`` + - `PR9098`_ + + * - relied on the ``on_val_dataloader()`` hooks in ``LightningModule`` and ``LightningDataModule`` + - use ``val_dataloader`` + - `PR9098`_ + + * - relied on the ``on_test_dataloader()`` hooks in ``LightningModule`` and ``LightningDataModule`` + - use ``test_dataloader`` + - `PR9098`_ + + * - relied on the ``on_predict_dataloader()`` hooks in ``LightningModule`` and ``LightningDataModule`` + - use ``predict_dataloader`` + - `PR9098`_ + + * - implemented the ``on_keyboard_interrupt`` callback hook + - implement the ``on_exception`` hook, and specify the exception type + - `PR9260`_ + + * - relied on the ``TestTubeLogger`` + - Use another logger like ``TensorBoardLogger`` + - `PR9065`_ + + * - used the basic progress bar ``ProgressBar`` callback + - use the ``TQDMProgressBar`` callback instead with the same arguments + - `PR10134`_ + + * - were using ``GPUStatsMonitor`` callbacks + - use ``DeviceStatsMonitor`` callback instead + - `PR9924`_ + + * - were using ``XLAStatsMonitor`` callbacks + - use ``DeviceStatsMonitor`` callback instead + - `PR9924`_ + + +.. _pr9175: https://github.com/Lightning-AI/lightning/pull/9175 +.. _pr9699: https://github.com/Lightning-AI/lightning/pull/9699 +.. _pr9754: https://github.com/Lightning-AI/lightning/pull/9754 +.. _pr8989: https://github.com/Lightning-AI/lightning/pull/8989 +.. _pr9366: https://github.com/Lightning-AI/lightning/pull/9366 +.. _pr9460: https://github.com/Lightning-AI/lightning/pull/9460 +.. 
_pr9693: https://github.com/Lightning-AI/lightning/pull/9693 +.. _pr9921: https://github.com/Lightning-AI/lightning/pull/9921 +.. _pr9616: https://github.com/Lightning-AI/lightning/pull/9616 +.. _pr8513: https://github.com/Lightning-AI/lightning/pull/8513 +.. _pr8495: https://github.com/Lightning-AI/lightning/pull/8495 +.. _pr9098: https://github.com/Lightning-AI/lightning/pull/9098 +.. _pr9260: https://github.com/Lightning-AI/lightning/pull/9260 +.. _pr9065: https://github.com/Lightning-AI/lightning/pull/9065 +.. _pr10134: https://github.com/Lightning-AI/lightning/pull/10134 +.. _pr9924: https://github.com/Lightning-AI/lightning/pull/9924 diff --git a/docs/source-pytorch/upgrade/sections/1_7_advanced.rst b/docs/source-pytorch/upgrade/sections/1_7_advanced.rst new file mode 100644 index 0000000..8b92044 --- /dev/null +++ b/docs/source-pytorch/upgrade/sections/1_7_advanced.rst @@ -0,0 +1,139 @@ +.. list-table:: adv. user 1.7 + :widths: 40 40 20 + :header-rows: 1 + + * - If + - Then + - Ref + + * - used ``DDP2Strategy`` + - switch to ``DDPStrategy`` + - `PR14026`_ + + * - used ``Trainer.training_type_plugin`` property + - now use ``Trainer.strategy`` and update the references + - `PR11141`_ + + * - used any ``TrainingTypePlugins`` + - rename them to ``Strategy`` + - `PR11120`_ + + * - used ``DistributedType`` + - rely on protected ``_StrategyType`` + - `PR10505`_ + + * - used ``DeviceType`` + - rely on protected ``_AcceleratorType`` + - `PR10503`_ + + * - used ``pl.utilities.meta`` functions + - switch to built-in https://github.com/pytorch/torchdistx support + - `PR13868`_ + + * - have implemented ``Callback.on_configure_sharded_model`` hook + - move your implementation to ``Callback.setup`` + - `PR14834`_ + + * - have implemented the ``Callback.on_before_accelerator_backend_setup`` hook + - move your implementation to ``Callback.setup`` + - `PR14834`_ + + * - have implemented the ``Callback.on_batch_start`` hook + - move your implementation to
``Callback.on_train_batch_start`` + - `PR14834`_ + + * - have implemented the ``Callback.on_batch_end`` hook + - move your implementation to ``Callback.on_train_batch_end`` + - `PR14834`_ + + * - have implemented the ``Callback.on_epoch_start`` hook + - move your implementation to ``Callback.on_train_epoch_start`` , to ``Callback.on_validation_epoch_start`` , to ``Callback.on_test_epoch_start`` + - `PR14834`_ + + * - have implemented the ``Callback.on_pretrain_routine_{start,end}`` hook + - move your implementation to ``Callback.on_fit_start`` + - `PR14834`_ + + * - used ``Callback.on_init_start`` hook + - use ``Callback.on_train_start`` instead + - `PR10940`_ + + * - used ``Callback.on_init_end`` hook + - use ``Callback.on_train_start`` instead + - `PR10940`_ + + * - used Trainer’s attribute ``Trainer.num_processes`` + - it was replaced by ``Trainer.num_devices`` + - `PR12388`_ + + * - used Trainer’s attribute ``Trainer.gpus`` + - it was replaced by ``Trainer.num_devices`` + - `PR12436`_ + + * - used Trainer’s attribute ``Trainer.num_gpus`` + - use ``Trainer.num_devices`` instead + - `PR12384`_ + + * - used Trainer’s attribute ``Trainer.ipus`` + - use ``Trainer.num_devices`` instead + - `PR12386`_ + + * - used Trainer’s attribute ``Trainer.tpu_cores`` + - use ``Trainer.num_devices`` instead + - `PR12437`_ + + * - used ``Trainer.num_processes`` attribute + - switch to using ``Trainer.num_devices`` + - `PR12388`_ + + * - used ``LightningIPUModule`` + - it was removed + - `PR14830`_ + + * - logged with ``LightningLoggerBase.agg_and_log_metrics`` + - switch to ``LightningLoggerBase.log_metrics`` + - `PR11832`_ + + * - used ``agg_key_funcs`` parameter from ``LightningLoggerBase`` + - log metrics explicitly + - `PR11871`_ + + * - used ``agg_default_func`` parameters in ``LightningLoggerBase`` + - log metrics explicitly + - `PR11871`_ + + * - used ``Trainer.validated_ckpt_path`` attribute + - rely on generic read-only property ``Trainer.ckpt_path`` which is set when 
checkpoints are loaded via ``Trainer.validate(ckpt_path=...)`` + - `PR11696`_ + + * - used ``Trainer.tested_ckpt_path`` attribute + - rely on generic read-only property ``Trainer.ckpt_path`` which is set when checkpoints are loaded via ``Trainer.test(ckpt_path=...)`` + - `PR11696`_ + + * - used ``Trainer.predicted_ckpt_path`` attribute + - rely on generic read-only property ``Trainer.ckpt_path``, which is set when checkpoints are loaded via ``Trainer.predict(ckpt_path=...)`` + - `PR11696`_ + + * - relied on the returned dictionary from ``Callback.on_save_checkpoint`` + - call ``Callback.state_dict`` directly instead + - `PR11887`_ + + +.. _pr14026: https://github.com/Lightning-AI/lightning/pull/14026 +.. _pr11141: https://github.com/Lightning-AI/lightning/pull/11141 +.. _pr11120: https://github.com/Lightning-AI/lightning/pull/11120 +.. _pr10505: https://github.com/Lightning-AI/lightning/pull/10505 +.. _pr10503: https://github.com/Lightning-AI/lightning/pull/10503 +.. _pr13868: https://github.com/Lightning-AI/lightning/pull/13868 +.. _pr14834: https://github.com/Lightning-AI/lightning/pull/14834 +.. _pr10940: https://github.com/Lightning-AI/lightning/pull/10940 +.. _pr12388: https://github.com/Lightning-AI/lightning/pull/12388 +.. _pr12436: https://github.com/Lightning-AI/lightning/pull/12436 +.. _pr12384: https://github.com/Lightning-AI/lightning/pull/12384 +.. _pr12386: https://github.com/Lightning-AI/lightning/pull/12386 +.. _pr12437: https://github.com/Lightning-AI/lightning/pull/12437 +.. _pr14830: https://github.com/Lightning-AI/lightning/pull/14830 +.. _pr11832: https://github.com/Lightning-AI/lightning/pull/11832 +.. _pr11871: https://github.com/Lightning-AI/lightning/pull/11871 +.. _pr11696: https://github.com/Lightning-AI/lightning/pull/11696 +.. 
_pr11887: https://github.com/Lightning-AI/lightning/pull/11887 diff --git a/docs/source-pytorch/upgrade/sections/1_7_devel.rst b/docs/source-pytorch/upgrade/sections/1_7_devel.rst new file mode 100644 index 0000000..11fab55 --- /dev/null +++ b/docs/source-pytorch/upgrade/sections/1_7_devel.rst @@ -0,0 +1,145 @@ +.. list-table:: devel 1.7 + :widths: 40 40 20 + :header-rows: 1 + + * - If + - Then + - Ref + + * - Removed the legacy ``Trainer.get_deprecated_arg_names()`` + - + - `PR14415`_ + + * - used the generic method ``Trainer.run_stage`` + - switch to a specific one depending on your purpose ``Trainer.{fit,validate,test,predict}``. + - `PR11000`_ + + * - used ``rank_zero_only`` from ``pl.utilities.distributed`` + - import it from ``pl.utilities.rank_zero`` + - `PR11747`_ + + * - used ``rank_zero_debug`` from ``pl.utilities.distributed`` + - import it from ``pl.utilities.rank_zero`` + - `PR11747`_ + + * - used ``rank_zero_info`` from ``pl.utilities.distributed`` + - import it from ``pl.utilities.rank_zero`` + - `PR11747`_ + + * - used ``rank_zero_warn`` from ``pl.utilities.warnings`` + - import it from ``pl.utilities.rank_zero`` + - `PR11747`_ + + * - used ``rank_zero_deprecation`` from ``pl.utilities.warnings`` + - import it from ``pl.utilities.rank_zero`` + - `PR11747`_ + + * - used ``LightningDeprecationWarning`` from ``pl.utilities.warnings`` + - import it from ``pl.utilities.rank_zero`` + - `PR11747`_ + + * - used ``LightningDeprecationWarning`` from ``pl.utilities.warnings`` + - import it from ``pl.utilities.rank_zero`` + - `PR11747`_ + + * - used ``Trainer.data_parallel_device_ids`` attribute + - switch it to ``Trainer.device_ids`` + - `PR12072`_ + + * - derived from ``TrainerCallbackHookMixin`` + - use Trainer base class + - `PR14401`_ + + * - used base class ``pytorch_lightning.profiler.BaseProfiler`` + - switch to use ``pytorch_lightning.profiler.Profiler`` instead + - `PR12150`_ + + * - set distributed backend via the environment variable 
``PL_TORCH_DISTRIBUTED_BACKEND`` + - use ``process_group_backend`` in the strategy constructor + - `PR11745`_ + + * - used ``PrecisionPlugin.on_load_checkpoint`` hooks + - switch to ``PrecisionPlugin.load_state_dict`` + - `PR11978`_ + + * - used ``PrecisionPlugin.on_save_checkpoint`` hooks + - switch to ``PrecisionPlugin.state_dict`` + - `PR11978`_ + + * - used ``Trainer.root_gpu`` attribute + - use ``Trainer.strategy.root_device.index`` when GPU is used + - `PR12262`_ + + * - used ``Trainer.use_amp`` attribute + - rely on Torch native AMP + - `PR12312`_ + + * - used ``LightningModule.use_amp`` attribute + - rely on Torch native AMP + - `PR12315`_ + + * - used Trainer’s attribute ``Trainer.verbose_evaluate`` + - rely on loop constructor ``EvaluationLoop(verbose=...)`` + - `PR10931`_ + + * - used Trainer’s attribute ``Trainer.should_rank_save_checkpoint`` + - it was removed + - `PR11068`_ + + * - derived from ``TrainerOptimizersMixin`` + - rely on ``core/optimizer.py`` + - `PR11155`_ + + * - derived from ``TrainerDataLoadingMixin`` + - rely on methods from ``Trainer`` and ``DataConnector`` + - `PR11282`_ + + * - used Trainer’s attribute ``Trainer.lightning_optimizers`` + - switch to the ``Strategy`` and its attributes. + - `PR11444`_ + + * - used ``Trainer.call_hook`` + - it was set as a protected method ``Trainer._call_callback_hooks``, ``Trainer._call_lightning_module_hook``, ``Trainer._call_ttp_hook``, ``Trainer._call_accelerator_hook`` and shall not be used. + - `PR10979`_ + + * - used Profiler’s attribute ``SimpleProfiler.profile_iterable`` + - it was removed + - `PR12102`_ + + * - used Profiler’s attribute ``AdvancedProfiler.profile_iterable`` + - it was removed + - `PR12102`_ + + * - used the ``device_stats_monitor.prefix_metric_keys`` + - + - `PR11254`_ + + * - used ``on_train_batch_end(outputs, ...)`` with a 2d list with sizes (n_optimizers, tbptt_steps) + - change it to (tbptt_steps, n_optimizers). 
You can update your code by adding the following parameter to your hook signature: ``on_train_batch_end(outputs, ..., new_format=True)``. + - `PR12182`_ + + * - used ``training_epoch_end(outputs)`` with a 3d list with sizes (n_optimizers, n_batches, tbptt_steps) + - change it to (n_batches, tbptt_steps, n_optimizers). You can update your code by adding the following parameter to your hook signature: ``training_epoch_end(outputs, new_format=True)``. + - `PR12182`_ + + +.. _pr14415: https://github.com/Lightning-AI/lightning/pull/14415 +.. _pr11000: https://github.com/Lightning-AI/lightning/pull/11000 +.. _pr11747: https://github.com/Lightning-AI/lightning/pull/11747 +.. _pr12072: https://github.com/Lightning-AI/lightning/pull/12072 +.. _pr14401: https://github.com/Lightning-AI/lightning/pull/14401 +.. _pr12150: https://github.com/Lightning-AI/lightning/pull/12150 +.. _pr11745: https://github.com/Lightning-AI/lightning/pull/11745 +.. _pr11978: https://github.com/Lightning-AI/lightning/pull/11978 +.. _pr12262: https://github.com/Lightning-AI/lightning/pull/12262 +.. _pr12312: https://github.com/Lightning-AI/lightning/pull/12312 +.. _pr12315: https://github.com/Lightning-AI/lightning/pull/12315 +.. _pr10931: https://github.com/Lightning-AI/lightning/pull/10931 +.. _pr11068: https://github.com/Lightning-AI/lightning/pull/11068 +.. _pr11155: https://github.com/Lightning-AI/lightning/pull/11155 +.. _pr11282: https://github.com/Lightning-AI/lightning/pull/11282 +.. _pr11444: https://github.com/Lightning-AI/lightning/pull/11444 +.. _pr10979: https://github.com/Lightning-AI/lightning/pull/10979 +.. _pr12102: https://github.com/Lightning-AI/lightning/pull/12102 +.. _pr11254: https://github.com/Lightning-AI/lightning/pull/11254 +.. 
_pr12182: https://github.com/Lightning-AI/lightning/pull/12182 diff --git a/docs/source-pytorch/upgrade/sections/1_7_regular.rst b/docs/source-pytorch/upgrade/sections/1_7_regular.rst new file mode 100644 index 0000000..acfb741 --- /dev/null +++ b/docs/source-pytorch/upgrade/sections/1_7_regular.rst @@ -0,0 +1,51 @@ +.. list-table:: reg. user 1.7 + :widths: 40 40 20 + :header-rows: 1 + + * - If + - Then + - Ref + + * - have wrapped your loggers with ``LoggerCollection`` + - directly pass a list of loggers to the Trainer and access the list via the ``trainer.loggers`` attribute. + - `PR12147`_ + + * - used ``Trainer.lr_schedulers`` + - access ``trainer.lr_scheduler_configs`` instead, which contains dataclasses instead of dictionaries. + - `PR11443`_ + + * - used ``neptune-client`` API in the ``NeptuneLogger`` + - upgrade to the latest API + - `PR14727`_ + + * - used ``LightningDataModule.on_save`` hook + - use ``LightningDataModule.on_save_checkpoint`` instead + - `PR11887`_ + + * - used ``LightningDataModule.on_load_checkpoint`` hook + - use ``LightningDataModule.on_load_checkpoint`` hook instead + - `PR11887`_ + + * - used ``LightningModule.on_hpc_load`` hook + - switch to general purpose hook ``LightningModule.on_load_checkpoint`` + - `PR14315`_ + + * - used ``LightningModule.on_hpc_save`` hook + - switch to general purpose hook ``LightningModule.on_save_checkpoint`` + - `PR14315`_ + + * - used Trainer’s flag ``weights_save_path`` + - use directly ``dirpath`` argument in the ``ModelCheckpoint`` callback. + - `PR14424`_ + + * - used Trainer’s property ``Trainer.weights_save_path`` is dropped + - + - `PR14424`_ + + +.. _pr12147: https://github.com/Lightning-AI/lightning/pull/12147 +.. _pr11443: https://github.com/Lightning-AI/lightning/pull/11443 +.. _pr14727: https://github.com/Lightning-AI/lightning/pull/14727 +.. _pr11887: https://github.com/Lightning-AI/lightning/pull/11887 +.. _pr14315: https://github.com/Lightning-AI/lightning/pull/14315 +.. 
_pr14424: https://github.com/Lightning-AI/lightning/pull/14424 diff --git a/docs/source-pytorch/upgrade/sections/1_8_advanced.rst b/docs/source-pytorch/upgrade/sections/1_8_advanced.rst new file mode 100644 index 0000000..2d4a45e --- /dev/null +++ b/docs/source-pytorch/upgrade/sections/1_8_advanced.rst @@ -0,0 +1,52 @@ +.. list-table:: adv. user 1.8 + :widths: 40 40 20 + :header-rows: 1 + + * - If + - Then + - Ref + + * - imported ``pl.callbacks.base`` + - import ``pl.callbacks.callback`` + - `PR13031`_ + + * - imported ``pl.loops.base`` + - import ``pl.loops.loop`` instead + - `PR13043`_ + + * - imported ``pl.utilities.cli`` + - import ``pl.cli`` instead + - `PR13767`_ + + * - imported profiler classes from ``pl.profiler.*`` + - import ``pl.profilers`` instead + - `PR12308`_ + + * - used ``pl.accelerators.GPUAccelerator`` + - use ``pl.accelerators.CUDAAccelerator`` + - `PR13636`_ + + * - used ``LightningDeepSpeedModule`` + - use ``strategy="deepspeed"`` or ``strategy=DeepSpeedStrategy(...)`` + - :class:`~lightning.pytorch.strategies.DeepSpeedStrategy` + + * - used the ``with init_meta_context()`` context manager from ``import pl.utilities.meta`` + - switch to ``deepspeed-zero-stage-3`` + - :ref:`deepspeed-zero-stage-3` + + * - used the Lightning Hydra multi-run integration + - removed support for it as it caused issues with processes hanging + - `PR15689`_ + + * - used ``pl.utilities.memory.get_gpu_memory_map`` + - use ``pl.accelerators.cuda.get_nvidia_gpu_stats`` + - `PR9921`_ + + +.. _pr13031: https://github.com/Lightning-AI/lightning/pull/13031 +.. _pr13043: https://github.com/Lightning-AI/lightning/pull/13043 +.. _pr13767: https://github.com/Lightning-AI/lightning/pull/13767 +.. _pr12308: https://github.com/Lightning-AI/lightning/pull/12308 +.. _pr13636: https://github.com/Lightning-AI/lightning/pull/13636 +.. _pr15689: https://github.com/Lightning-AI/lightning/pull/15689 +.. 
_pr9921: https://github.com/Lightning-AI/lightning/pull/9921 diff --git a/docs/source-pytorch/upgrade/sections/1_8_devel.rst b/docs/source-pytorch/upgrade/sections/1_8_devel.rst new file mode 100644 index 0000000..8c69736 --- /dev/null +++ b/docs/source-pytorch/upgrade/sections/1_8_devel.rst @@ -0,0 +1,24 @@ +.. list-table:: devel 1.8 + :widths: 40 40 20 + :header-rows: 1 + + * - If + - Then + - Ref + + * - derived from ``pytorch_lightning.loggers.base.LightningLoggerBase`` + - derive from ``pytorch_lightning.loggers.logger.Logger`` + - `PR12014`_ + + * - derived from ``pytorch_lightning.profiler.base.BaseProfiler`` + - derive from ``pytorch_lightning.profilers.profiler.Profiler`` + - `PR12150`_ + + * - derived from ``pytorch_lightning.profiler.base.AbstractProfiler`` + - derive from ``pytorch_lightning.profilers.profiler.Profiler`` + - `PR12106`_ + + +.. _pr12014: https://github.com/Lightning-AI/lightning/pull/12014 +.. _pr12150: https://github.com/Lightning-AI/lightning/pull/12150 +.. _pr12106: https://github.com/Lightning-AI/lightning/pull/12106 diff --git a/docs/source-pytorch/upgrade/sections/1_8_regular.rst b/docs/source-pytorch/upgrade/sections/1_8_regular.rst new file mode 100644 index 0000000..5f4fac2 --- /dev/null +++ b/docs/source-pytorch/upgrade/sections/1_8_regular.rst @@ -0,0 +1,24 @@ +.. list-table:: reg. user 1.8 + :widths: 40 40 20 + :header-rows: 1 + + * - If + - Then + - Ref + + * - used ``seed_everything_default=None`` in ``LightningCLI`` + - set ``seed_everything_default=False`` instead + - `PR12804`_ + + * - used ``Trainer.reset_train_val_dataloaders()`` + - call ``Trainer.reset_train_dataloaders()`` and ``Trainer.reset_val_dataloaders()`` separately + - `PR12184`_ + + * - imported ``pl.core.lightning`` + - import ``pl.core.module`` instead + - `PR12740`_ + + +.. _pr12804: https://github.com/Lightning-AI/lightning/pull/12804 +.. _pr12184: https://github.com/Lightning-AI/lightning/pull/12184 +.. 
_pr12740: https://github.com/Lightning-AI/lightning/pull/12740 diff --git a/docs/source-pytorch/upgrade/sections/1_9_advanced.rst b/docs/source-pytorch/upgrade/sections/1_9_advanced.rst new file mode 100644 index 0000000..f9ef1b8 --- /dev/null +++ b/docs/source-pytorch/upgrade/sections/1_9_advanced.rst @@ -0,0 +1,285 @@ +.. list-table:: adv. user 1.9 + :widths: 40 40 20 + :header-rows: 1 + + * - If + - Then + - Ref + + * - used the ``pl.lite`` module + - switch to ``lightning_fabric`` + - `PR15953`_ + + * - used Trainer’s flag ``strategy='dp'`` + - use DDP with ``strategy='ddp'`` or DeepSpeed instead + - `PR16748`_ + + * - implemented ``LightningModule.training_epoch_end`` hooks + - port your logic to ``LightningModule.on_train_epoch_end`` hook + - `PR16520`_ + + * - implemented ``LightningModule.validation_epoch_end`` hook + - port your logic to ``LightningModule.on_validation_epoch_end`` hook + - `PR16520`_ + + * - implemented ``LightningModule.test_epoch_end`` hooks + - port your logic to ``LightningModule.on_test_epoch_end`` hook + - `PR16520`_ + + * - used Trainer’s flag ``multiple_trainloader_mode`` + - switch to ``CombinedLoader(..., mode=...)`` and set mode directly now + - `PR16800`_ + + * - used Trainer’s flag ``move_metrics_to_cpu`` + - implement particular offload logic in your custom metric or turn it on in ``torchmetrics`` + - `PR16358`_ + + * - used Trainer’s flag ``track_grad_norm`` + - overwrite ``on_before_optimizer_step`` hook and pass the argument directly and ``LightningModule.log_grad_norm()`` hook + - `PR16745`_ `PR16745`_ + + * - used Trainer’s flag ``replace_sampler_ddp`` + - use ``use_distributed_sampler``; the sampler gets created not only for the DDP strategies + - + + * - relied on the ``on_tpu`` argument in ``LightningModule.optimizer_step`` hook + - switch to manual optimization + - `PR16537`_ :doc:`Manual Optimization <../../model/manual_optimization>` + + * - relied on the ``using_lbfgs`` argument in 
``LightningModule.optimizer_step`` hook + - switch to manual optimization + - `PR16538`_ :doc:`Manual Optimization <../../model/manual_optimization>` + + * - were using ``nvidia/apex`` in any form + - switch to PyTorch native mixed precision ``torch.amp`` instead + - `PR16039`_ :doc:`Precision <../../common/precision>` + + * - used Trainer’s flag ``using_native_amp`` + - use PyTorch native mixed precision + - `PR16039`_ :doc:`Precision <../../common/precision>` + + * - used Trainer’s flag ``amp_backend`` + - use PyTorch native mixed precision + - `PR16039`_ :doc:`Precision <../../common/precision>` + + * - used Trainer’s flag ``amp_level`` + - use PyTorch native mixed precision + - `PR16039`_ :doc:`Precision <../../common/precision>` + + * - used Trainer’s attribute ``using_native_amp`` + - use PyTorch native mixed precision + - `PR16039`_ :doc:`Precision <../../common/precision>` + + * - used Trainer’s attribute ``amp_backend`` + - use PyTorch native mixed precision + - `PR16039`_ :doc:`Precision <../../common/precision>` + + * - used Trainer’s attribute ``amp_level`` + - use PyTorch native mixed precision + - `PR16039`_ :doc:`Precision <../../common/precision>` + + * - use the ``FairScale`` integration + - consider using PyTorch's native FSDP implementation or outsourced implementation into own project + - `lightning-Fairscale`_ + + * - used ``pl.overrides.fairscale.LightningShardedDataParallel`` + - use native FSDP instead + - `PR16400`_ :doc:`FSDP <../../accelerators/gpu_expert>` + + * - used ``pl.plugins.precision.fully_sharded_native_amp.FullyShardedNativeMixedPrecisionPlugin`` + - use native FSDP instead + - `PR16400`_ :doc:`FSDP <../../accelerators/gpu_expert>` + + * - used ``pl.plugins.precision.sharded_native_amp.ShardedNativeMixedPrecisionPlugin`` + - use native FSDP instead + - `PR16400`_ :doc:`FSDP <../../accelerators/gpu_expert>` + + * - used ``pl.strategies.fully_sharded.DDPFullyShardedStrategy`` + - use native FSDP instead + - `PR16400`_ :doc:`FSDP 
<../../accelerators/gpu_expert>` + + * - used ``pl.strategies.sharded.DDPShardedStrategy`` + - use native FSDP instead + - `PR16400`_ :doc:`FSDP <../../accelerators/gpu_expert>` + + * - used ``pl.strategies.sharded_spawn.DDPSpawnShardedStrategy`` + - use native FSDP instead + - `PR16400`_ :doc:`FSDP <../../accelerators/gpu_expert>` + + * - used ``save_config_overwrite`` parameters in ``LightningCLI`` + - pass this option and via dictionary of ``save_config_kwargs`` parameter + - `PR14998`_ + + * - used ``save_config_multifile`` parameters in ``LightningCLI`` + - pass this option and via dictionary of ``save_config_kwargs`` parameter + - `PR14998`_ + + * - have customized loops ``Loop.replace()`` + - implement your training loop with Fabric. + - `PR14998`_ `Fabric`_ + + * - have customized loops ``Loop.run()`` + - implement your training loop with Fabric. + - `PR14998`_ `Fabric`_ + + * - have customized loops ``Loop.connect()`` + - implement your training loop with Fabric. + - `PR14998`_ `Fabric`_ + + * - used the Trainer’s ``trainer.fit_loop`` property + - implement your training loop with Fabric + - `PR14998`_ `Fabric`_ + + * - used the Trainer’s ``trainer.validate_loop`` property + - implement your training loop with Fabric + - `PR14998`_ `Fabric`_ + + * - used the Trainer’s ``trainer.test_loop`` property + - implement your training loop with Fabric + - `PR14998`_ `Fabric`_ + + * - used the Trainer’s ``trainer.predict_loop`` property + - implement your training loop with Fabric + - `PR14998`_ `Fabric`_ + + * - used the ``Trainer.loop`` and fetching classes + - being marked as protected + - + + * - used ``opt_idx`` argument in ``BaseFinetuning.finetune_function`` + - use manual optimization + - `PR16539`_ + + * - used ``opt_idx`` argument in ``Callback.on_before_optimizer_step`` + - use manual optimization + - `PR16539`_ :doc:`Manual Optimization <../../model/manual_optimization>` + + * - used ``optimizer_idx`` as an optional argument in 
``LightningModule.training_step`` + - use manual optimization + - `PR16539`_ :doc:`Manual Optimization <../../model/manual_optimization>` + + * - used ``optimizer_idx`` argument in ``LightningModule.on_before_optimizer_step`` + - use manual optimization + - `PR16539`_ :doc:`Manual Optimization <../../model/manual_optimization>` + + * - used ``optimizer_idx`` argument in ``LightningModule.configure_gradient_clipping`` + - use manual optimization + - `PR16539`_ :doc:`Manual Optimization <../../model/manual_optimization>` + + * - used ``optimizer_idx`` argument in ``LightningModule.optimizer_step`` + - use manual optimization + - `PR16539`_ :doc:`Manual Optimization <../../model/manual_optimization>` + + * - used ``optimizer_idx`` argument in ``LightningModule.optimizer_zero_grad`` + - use manual optimization + - `PR16539`_ :doc:`Manual Optimization <../../model/manual_optimization>` + + * - used ``optimizer_idx`` argument in ``LightningModule.lr_scheduler_step`` + - use manual optimization + - `PR16539`_ :doc:`Manual Optimization <../../model/manual_optimization>` + + * - declared optimizer frequencies in the dictionary returned from ``LightningModule.configure_optimizers`` + - use manual optimization + - `PR16539`_ :doc:`Manual Optimization <../../model/manual_optimization>` + + * - used ``optimizer`` argument in ``LightningModule.backward`` + - use manual optimization + - `PR16539`_ :doc:`Manual Optimization <../../model/manual_optimization>` + + * - used ``optimizer_idx`` argument in ``LightningModule.backward`` + - use manual optimization + - `PR16539`_ :doc:`Manual Optimization <../../model/manual_optimization>` + + * - used ``optimizer_idx`` argument in ``PrecisionPlugin.optimizer_step`` + - use manual optimization + - `PR16539`_ :doc:`Manual Optimization <../../model/manual_optimization>` + + * - used ``optimizer_idx`` argument in ``PrecisionPlugin.backward`` + - use manual optimization + - `PR16539`_ :doc:`Manual Optimization 
<../../model/manual_optimization>` + + * - used ``optimizer_idx`` argument in ``PrecisionPlugin.optimizer_step`` + - use manual optimization + - `PR16539`_ :doc:`Manual Optimization <../../model/manual_optimization>` + + * - used ``optimizer_idx`` argument in ``Strategy.backward`` + - use manual optimization + - `PR16539`_ :doc:`Manual Optimization <../../model/manual_optimization>` + + * - used ``optimizer_idx`` argument in ``Strategy.optimizer_step`` + - use manual optimization + - `PR16539`_ :doc:`Manual Optimization <../../model/manual_optimization>` + + * - used Trainer’s ``Trainer.optimizer_frequencies`` attribute + - use manual optimization + - :doc:`Manual Optimization <../../model/manual_optimization>` + + * - used ``PL_INTER_BATCH_PARALLELISM`` environment flag + - + - `PR16355`_ + + * - used training integration with Horovod + - install standalone package/project + - `lightning-Horovod`_ + + * - used training integration with ColossalAI + - install standalone package/project + - `lightning-ColossalAI`_ + + * - used ``QuantizationAwareTraining`` callback + - use Torch’s Quantization directly + - `PR16750`_ + + * - had any logic except reducing the DP outputs in ``LightningModule.training_step_end`` hook + - port it to ``LightningModule.on_train_batch_end`` hook + - `PR16791`_ + + * - had any logic except reducing the DP outputs in ``LightningModule.validation_step_end`` hook + - port it to ``LightningModule.on_validation_batch_end`` hook + - `PR16791`_ + + * - had any logic except reducing the DP outputs in ``LightningModule.test_step_end`` hook + - port it to ``LightningModule.on_test_batch_end`` hook + - `PR16791`_ + + * - used ``pl.strategies.DDPSpawnStrategy`` + - switch to general ``DDPStrategy(start_method='spawn')`` with proper starting method + - `PR16809`_ + + * - used the automatic addition of a moving average of the ``training_step`` loss in the progress bar + - use ``self.log("loss", ..., prog_bar=True)`` instead. 
+ - `PR16192`_ + + * - rely on the ``outputs`` argument from the ``on_predict_epoch_end`` hook + - access them via ``trainer.predict_loop.predictions`` + - `PR16655`_ + + * - need to pass a dictionary to ``self.log()`` + - pass them independently. + - `PR16389`_ + + +.. _Fabric: https://lightning.ai/docs/fabric/ +.. _lightning-Horovod: https://github.com/Lightning-AI/lightning-Horovod +.. _lightning-ColossalAI: https://lightning.ai/docs/pytorch/latest/integrations/strategies/colossalai.html +.. _lightning-Fairscale: https://github.com/Lightning-Sandbox/lightning-Fairscale + +.. _pr15953: https://github.com/Lightning-AI/lightning/pull/15953 +.. _pr16748: https://github.com/Lightning-AI/lightning/pull/16748 +.. _pr16520: https://github.com/Lightning-AI/lightning/pull/16520 +.. _pr16800: https://github.com/Lightning-AI/lightning/pull/16800 +.. _pr16358: https://github.com/Lightning-AI/lightning/pull/16358 +.. _pr16745: https://github.com/Lightning-AI/lightning/pull/16745 +.. _pr16537: https://github.com/Lightning-AI/lightning/pull/16537 +.. _pr16538: https://github.com/Lightning-AI/lightning/pull/16538 +.. _pr16039: https://github.com/Lightning-AI/lightning/pull/16039 +.. _pr16400: https://github.com/Lightning-AI/lightning/pull/16400 +.. _pr14998: https://github.com/Lightning-AI/lightning/pull/14998 +.. _pr16539: https://github.com/Lightning-AI/lightning/pull/16539 +.. _pr16355: https://github.com/Lightning-AI/lightning/pull/16355 +.. _pr16750: https://github.com/Lightning-AI/lightning/pull/16750 +.. _pr16791: https://github.com/Lightning-AI/lightning/pull/16791 +.. _pr16809: https://github.com/Lightning-AI/lightning/pull/16809 +.. _pr16192: https://github.com/Lightning-AI/lightning/pull/16192 +.. _pr16655: https://github.com/Lightning-AI/lightning/pull/16655 +.. 
_pr16389: https://github.com/Lightning-AI/lightning/pull/16389 diff --git a/docs/source-pytorch/upgrade/sections/1_9_devel.rst b/docs/source-pytorch/upgrade/sections/1_9_devel.rst new file mode 100644 index 0000000..c7179cb --- /dev/null +++ b/docs/source-pytorch/upgrade/sections/1_9_devel.rst @@ -0,0 +1,307 @@ +.. list-table:: devel 1.9 + :widths: 40 40 20 + :header-rows: 1 + + * - If + - Then + - Ref + + * - passed the ``pl_module`` argument to distributed module wrappers + - pass the (required) ``forward_module`` argument + - `PR16386`_ + + * - used ``DataParallel`` and the ``LightningParallelModule`` wrapper + - use DDP or DeepSpeed instead + - `PR16748`_ :doc:`DDP <../../accelerators/gpu_expert>` + + * - used ``pl_module`` argument from the distributed module wrappers + - use DDP or DeepSpeed instead + - `PR16386`_ :doc:`DDP <../../accelerators/gpu_expert>` + + * - called ``pl.overrides.base.unwrap_lightning_module`` function + - use DDP or DeepSpeed instead + - `PR16386`_ :doc:`DDP <../../accelerators/gpu_expert>` + + * - used or derived from ``pl.overrides.distributed.LightningDistributedModule`` class + - use DDP instead + - `PR16386`_ :doc:`DDP <../../accelerators/gpu_expert>` + + * - used the ``pl.plugins.ApexMixedPrecisionPlugin`` plugin + - use PyTorch native mixed precision + - `PR16039`_ + + * - used the ``pl.plugins.NativeMixedPrecisionPlugin`` plugin + - switch to the ``pl.plugins.MixedPrecisionPlugin`` plugin + - `PR16039`_ + + * - used the ``fit_loop.min_steps`` setters + - implement your training loop with Fabric + - `PR16803`_ + + * - used the ``fit_loop.max_steps`` setters + - implement your training loop with Fabric + - `PR16803`_ + + * - used the ``data_parallel`` attribute in ``Trainer`` + - check the same using ``isinstance(trainer.strategy, ParallelStrategy)`` + - `PR16703`_ + + * - used any function from ``pl.utilities.xla_device`` + - switch to ``pl.accelerators.XLAAccelerator.is_available()`` + - `PR14514`_ `PR14550`_ + + * - imported 
functions from ``pl.utilities.device_parser.*`` + - import them from ``lightning_fabric.utilities.device_parser.*`` + - `PR14492`_ `PR14753`_ + + * - imported functions from ``pl.utilities.cloud_io.*`` + - import them from ``lightning_fabric.utilities.cloud_io.*`` + - `PR14515`_ + + * - imported functions from ``pl.utilities.apply_func.*`` + - import them from ``lightning_utilities.core.apply_func.*`` + - `PR14516`_ `PR14537`_ + + * - used any code from ``pl.core.mixins`` + - use the base classes + - `PR16424`_ + + * - used any code from ``pl.utilities.distributed`` + - rely on Pytorch's native functions + - `PR16390`_ + + * - used any code from ``pl.utilities.data`` + - it was removed + - `PR16440`_ + + * - used any code from ``pl.utilities.optimizer`` + - it was removed + - `PR16439`_ + + * - used any code from ``pl.utilities.seed`` + - it was removed + - `PR16422`_ + + * - were using truncated backpropagation through time (TBPTT) with ``LightningModule.truncated_bptt_steps`` + - use manual optimization + - `PR16172`_ :doc:`Manual Optimization <../../model/manual_optimization>` + + * - were using truncated backpropagation through time (TBPTT) with ``LightningModule.tbptt_split_batch`` + - use manual optimization + - `PR16172`_ :doc:`Manual Optimization <../../model/manual_optimization>` + + * - were using truncated backpropagation through time (TBPTT) and passing ``hidden`` to ``LightningModule.training_step`` + - use manual optimization + - `PR16172`_ :doc:`Manual Optimization <../../model/manual_optimization>` + + * - used ``pl.utilities.finite_checks.print_nan_gradients`` function + - it was removed + - + + * - used ``pl.utilities.finite_checks.detect_nan_parameters`` function + - it was removed + - + + * - used ``pl.utilities.parsing.flatten_dict`` function + - it was removed + - + + * - used ``pl.utilities.metrics.metrics_to_scalars`` function + - it was removed + - + + * - used ``pl.utilities.memory.get_model_size_mb`` function + - it was removed + - + + * 
- used ``pl.strategies.utils.on_colab_kaggle`` function + - it was removed + - `PR16437`_ + + * - used ``LightningDataModule.add_argparse_args()`` method + - switch to using ``LightningCLI`` + - `PR16708`_ + + * - used ``LightningDataModule.parse_argparser()`` method + - switch to using ``LightningCLI`` + - `PR16708`_ + + * - used ``LightningDataModule.from_argparse_args()`` method + - switch to using ``LightningCLI`` + - `PR16708`_ + + * - used ``LightningDataModule.get_init_arguments_and_types()`` method + - switch to using ``LightningCLI`` + - `PR16708`_ + + * - used ``Trainer.default_attributes()`` method + - switch to using ``LightningCLI`` + - `PR16708`_ + + * - used ``Trainer.from_argparse_args()`` method + - switch to using ``LightningCLI`` + - `PR16708`_ + + * - used ``Trainer.parse_argparser()`` method + - switch to using ``LightningCLI`` + - `PR16708`_ + + * - used ``Trainer.match_env_arguments()`` method + - switch to using ``LightningCLI`` + - `PR16708`_ + + * - used ``Trainer.add_argparse_args()`` method + - switch to using ``LightningCLI`` + - `PR16708`_ + + * - used ``pl.utilities.argparse.from_argparse_args()`` function + - switch to using ``LightningCLI`` + - `PR16708`_ + + * - used ``pl.utilities.argparse.parse_argparser()`` function + - switch to using ``LightningCLI`` + - `PR16708`_ + + * - used ``pl.utilities.argparse.parse_env_variables()`` function + - switch to using ``LightningCLI`` + - `PR16708`_ + + * - used ``get_init_arguments_and_types()`` function + - switch to using ``LightningCLI`` + - `PR16708`_ + + * - used ``pl.utilities.argparse.add_argparse_args()`` function + - switch to using ``LightningCLI`` + - `PR16708`_ + + * - used ``pl.utilities.parsing.str_to_bool()`` function + - switch to using ``LightningCLI`` + - `PR16708`_ + + * - used ``pl.utilities.parsing.str_to_bool_or_int()`` function + - switch to using ``LightningCLI`` + - `PR16708`_ + + * - used ``pl.utilities.parsing.str_to_bool_or_str()`` function + - switch to using 
``LightningCLI`` + - `PR16708`_ + + * - derived from ``pl.utilities.distributed.AllGatherGrad`` class + - switch to PyTorch native equivalent + - `PR15364`_ + + * - used ``PL_RECONCILE_PROCESS=1`` env. variable + - customize your logger + - `PR16204`_ + + * - if you derived from mixin’s method ``pl.core.saving.ModelIO.load_from_checkpoint`` + - rely on ``pl.core.module.LightningModule`` + - `PR16999`_ + + * - used ``Accelerator.setup_environment`` method + - switch to ``Accelerator.setup_device`` + - `PR16436`_ + + * - used ``PL_FAULT_TOLERANT_TRAINING`` env. variable + - implement your own logic with Fabric + - `PR16516`_ `PR16533`_ + + * - used or derived from public ``pl.overrides.distributed.IndexBatchSamplerWrapper`` class + - it is set as protected + - `PR16826`_ + + * - used the ``DataLoaderLoop`` class + - use manual optimization + - `PR16726`_ :doc:`Manual Optimization <../../model/manual_optimization>` + + * - used the ``EvaluationEpochLoop`` class + - use manual optimization + - `PR16726`_ :doc:`Manual Optimization <../../model/manual_optimization>` + + * - used the ``PredictionEpochLoop`` class + - use manual optimization + - `PR16726`_ :doc:`Manual Optimization <../../model/manual_optimization>` + + * - used ``trainer.reset_*_dataloader()`` methods + - use ``Loop.setup_data()`` for the top-level loops + - `PR16726`_ + + * - used ``LightningModule.precision`` attribute + - rely on Trainer precision attribute + - `PR16203`_ + + * - used ``Trainer.model`` setter + - you shall pass the ``model`` in fit/test/predict method + - `PR16462`_ + + * - relied on ``pl.utilities.supporters.CombinedLoaderIterator`` class + - pass dataloaders directly + - `PR16714`_ + + * - relied on ``pl.utilities.supporters.CombinedLoaderIterator`` class + - pass dataloaders directly + - `PR16714`_ + + * - accessed ``ProgressBarBase.train_batch_idx`` property + - rely on Trainer internal loops’ properties + - `PR16760`_ + + * - accessed ``ProgressBarBase.val_batch_idx`` property + - rely
on Trainer internal loops’ properties + - `PR16760`_ + + * - accessed ``ProgressBarBase.test_batch_idx`` property + - rely on Trainer internal loops’ properties + - `PR16760`_ + + * - accessed ``ProgressBarBase.predict_batch_idx`` property + - rely on Trainer internal loops’ properties + - `PR16760`_ + + * - used ``Trainer.prediction_writer_callbacks`` property + - rely on precision plugin + - `PR16759`_ + + * - used ``PrecisionPlugin.dispatch`` + - it was removed + - `PR16618`_ + + * - used ``Strategy.dispatch`` + - it was removed + - `PR16618`_ + + +.. _pr16386: https://github.com/Lightning-AI/lightning/pull/16386 +.. _pr16748: https://github.com/Lightning-AI/lightning/pull/16748 +.. _pr16039: https://github.com/Lightning-AI/lightning/pull/16039 +.. _pr16803: https://github.com/Lightning-AI/lightning/pull/16803 +.. _pr16703: https://github.com/Lightning-AI/lightning/pull/16703 +.. _pr14514: https://github.com/Lightning-AI/lightning/pull/14514 +.. _pr14550: https://github.com/Lightning-AI/lightning/pull/14550 +.. _pr14492: https://github.com/Lightning-AI/lightning/pull/14492 +.. _pr14753: https://github.com/Lightning-AI/lightning/pull/14753 +.. _pr14515: https://github.com/Lightning-AI/lightning/pull/14515 +.. _pr14516: https://github.com/Lightning-AI/lightning/pull/14516 +.. _pr14537: https://github.com/Lightning-AI/lightning/pull/14537 +.. _pr16424: https://github.com/Lightning-AI/lightning/pull/16424 +.. _pr16390: https://github.com/Lightning-AI/lightning/pull/16390 +.. _pr16440: https://github.com/Lightning-AI/lightning/pull/16440 +.. _pr16439: https://github.com/Lightning-AI/lightning/pull/16439 +.. _pr16422: https://github.com/Lightning-AI/lightning/pull/16422 +.. _pr16172: https://github.com/Lightning-AI/lightning/pull/16172 +.. _pr16437: https://github.com/Lightning-AI/lightning/pull/16437 +.. _pr16708: https://github.com/Lightning-AI/lightning/pull/16708 +.. _pr15364: https://github.com/Lightning-AI/lightning/pull/15364 +.. 
_pr16204: https://github.com/Lightning-AI/lightning/pull/16204 +.. _pr16999: https://github.com/Lightning-AI/lightning/pull/16999 +.. _pr16436: https://github.com/Lightning-AI/lightning/pull/16436 +.. _pr16516: https://github.com/Lightning-AI/lightning/pull/16516 +.. _pr16533: https://github.com/Lightning-AI/lightning/pull/16533 +.. _pr16826: https://github.com/Lightning-AI/lightning/pull/16826 +.. _pr16726: https://github.com/Lightning-AI/lightning/pull/16726 +.. _pr16203: https://github.com/Lightning-AI/lightning/pull/16203 +.. _pr16462: https://github.com/Lightning-AI/lightning/pull/16462 +.. _pr16714: https://github.com/Lightning-AI/lightning/pull/16714 +.. _pr16760: https://github.com/Lightning-AI/lightning/pull/16760 +.. _pr16759: https://github.com/Lightning-AI/lightning/pull/16759 +.. _pr16618: https://github.com/Lightning-AI/lightning/pull/16618 diff --git a/docs/source-pytorch/upgrade/sections/1_9_regular.rst b/docs/source-pytorch/upgrade/sections/1_9_regular.rst new file mode 100644 index 0000000..0aa0108 --- /dev/null +++ b/docs/source-pytorch/upgrade/sections/1_9_regular.rst @@ -0,0 +1,75 @@ +.. list-table:: reg. 
user 1.9 + :widths: 40 40 20 + :header-rows: 1 + + * - If + - Then + - Ref + + * - used Python 3.7 + - upgrade to Python 3.8 or higher + - `PR16579`_ + + * - used PyTorch 1.10 + - upgrade to PyTorch 1.11 or higher + - `PR16492`_ + + * - used Trainer’s flag ``gpus`` + - use ``devices`` with the same number + - `PR16171`_ + + * - used Trainer’s flag ``tpu_cores`` + - use ``devices`` with the same number + - `PR16171`_ + + * - used Trainer’s flag ``ipus`` + - use ``devices`` with the same number + - `PR16171`_ + + * - used Trainer’s flag ``num_processes`` + - use ``devices`` with the same number + - `PR16171`_ + + * - used Trainer’s flag ``resume_from_checkpoint`` + - pass the path to the ``Trainer.fit(ckpt_path="...")`` method + - `PR10061`_ + + * - used Trainer’s flag ``auto_select_gpus`` + - use ``devices="auto"`` + - `PR16184`_ + + * - called the ``pl.tuner.auto_gpu_select.pick_single_gpu`` function + - use Trainer’s flag ``devices="auto"`` + - `PR16184`_ + + * - called the ``pl.tuner.auto_gpu_select.pick_multiple_gpus`` function + - use Trainer’s flag ``devices="auto"`` + - `PR16184`_ + + * - used Trainer’s flag ``accumulate_grad_batches`` with a scheduling dictionary value + - use the ``GradientAccumulationScheduler`` callback and configure it + - `PR16729`_ + + * - imported profilers from ``pl.profiler`` + - import from ``pl.profilers`` + - `PR16359`_ + + * - used ``Tuner`` as part of ``Trainer`` in any form + - move to a standalone ``Tuner`` object or use particular callbacks ``LearningRateFinder`` and ``BatchSizeFinder`` + - :ref:`batch_size_finder` :ref:`learning_rate_finder` + + * - used Trainer’s flag ``auto_scale_batch_size`` + - use the ``BatchSizeFinder`` callback instead; the ``Trainer.tune()`` method was removed + - + + * - used Trainer’s flag ``auto_lr_find`` + - use the ``LearningRateFinder`` callback instead; the ``Trainer.tune()`` method was removed + - + +.. _pr16579: https://github.com/Lightning-AI/lightning/pull/16579 +..
_pr16492: https://github.com/Lightning-AI/lightning/pull/16492 +.. _pr10061: https://github.com/Lightning-AI/lightning/pull/10061 +.. _pr16171: https://github.com/Lightning-AI/lightning/pull/16171 +.. _pr16184: https://github.com/Lightning-AI/lightning/pull/16184 +.. _pr16729: https://github.com/Lightning-AI/lightning/pull/16729 +.. _pr16359: https://github.com/Lightning-AI/lightning/pull/16359 diff --git a/docs/source-pytorch/versioning.rst b/docs/source-pytorch/versioning.rst new file mode 100644 index 0000000..0b8a801 --- /dev/null +++ b/docs/source-pytorch/versioning.rst @@ -0,0 +1,155 @@ +.. _versioning: + +Versioning Policy +################# + +PyTorch Lightning follows its own versioning policy which differs from `semantic versioning (SemVer) `_. + +Versioning +********** + +A Lightning release number is in the format of ``MAJOR.MINOR.PATCH``. + +- A patch release contains only bug fixes. Since it introduces no breaking changes, we recommend users always update the package to the latest version within the minor version whenever possible. +- A minor release may contain backwards-incompatible changes **with deprecations** (unlike SemVer), such as API changes and removals, as well as new features and bugfixes since last release. +- A major release may contain backwards-incompatible changes **without deprecations**, as well as new features, and bugfixes since last release. + +With every release, we publish a changelog where we list additions, removals, deprecations, changed functionality and fixes. + +The ``lightning.app`` package is an exception to this rule, as it may contain any change with or without deprecations in any of the releases. + +API Stability +************* + +In Lightning, all public APIs are considered stable unless explicitly marked as experimental in their documentation or docstrings. 
+Modules, functions, classes, and methods that are protected (have a leading underscore, see https://peps.python.org/pep-0008/ for more information) may be changed or removed at any time. + +Stable API +---------- + +Everything not specifically labelled as experimental is stable. + +For stable APIs, all of the following are true: + +- The API is not expected to change. +- If anything does change, we show a deprecation warning before applying the breaking change following the policy described in the "API Evolution" section below. + +Experimental API +---------------- + +Experimental APIs are labelled as experimental in their documentation or docstrings. +For experimental features, any of the following may be true: + +- The feature uses dependencies that are under active development and may change outside our control. +- The API may change without notice in future versions. +- The performance of the feature has not been verified. +- The feature has not been battle tested by the core team in production scenarios. +- The feature is under active development. + +While we may still issue deprecation warnings for experimental API changes, this is not guaranteed. +Therefore, it is important to be cautious when using experimental features and be prepared to modify your code if the +API changes in a future release. In this case, you might want to pin your dependencies to avoid unexpected issues. + +API Evolution +************* + +Lightning's development is driven by research and best practices in a rapidly developing field of AI and machine learning. Change is inevitable and when it happens, the Lightning team is committed to minimizing user friction and maximizing ease of transition from one version to the next. We take backwards compatibility and reproducibility very seriously. + +For API removal, renaming or other forms of backwards-incompatible changes, the procedure is: + +#. A deprecation process is initiated at a minor version ``MAJOR.MINOR.PATCH`` (e.g. 
``1.5.0``), producing a deprecation warning at runtime and removing it from the documentation. +#. The deprecated API remains unchanged during the deprecation phase for two minor versions or the next major update, whichever comes first. +#. The breaking change is done in version ``MAJOR.(MINOR+2).0`` (e.g. ``1.7.0``), or ``(MAJOR+1).0.0`` (e.g. ``2.0.0``), whichever comes first. +#. From that version onward, the deprecation warning gets converted into a helpful error, which will remain until the next major release. + +This policy is not strict. Shorter or longer deprecation cycles may apply to some cases. +For example, in the past DDP2 was removed without a deprecation process because the feature was broken and unusable beyond fixing as discussed in `#12584 `_. +Also, `#10410 `_ is an example of a case where a longer deprecation cycle was applied. We deprecated the accelerator arguments, such as ``Trainer(gpus=...)``, in 1.7; however, because the APIs were so core that they would impact almost all use cases, we decided not to introduce the breaking change until 2.0. + +Compatibility matrix +******************** + +PyTorch Lightning follows `NEP 29 `_ which PyTorch also follows (`#74203 `_). +The table below indicates the coverage of tested versions in our CI. Versions outside the ranges may unofficially work in some cases. + +..
list-table:: + :header-rows: 1 + + * - ``lightning.pytorch`` + - ``pytorch_lightning`` + - ``lightning.fabric`` + - ``torch`` + - ``torchmetrics`` + - Python + * - 2.0 + - 2.0 + - 2.0 (GA) + - ≥1.11, ≤2.0 + - ≥0.7.0 + - ≥3.8, ≤3.10 + * - 1.9 + - 1.9 + - 1.9 (experimental) + - ≥1.10, ≤1.13 + - ≥0.7.0 + - ≥3.7, ≤3.10 + * - 1.8** + - 1.8 + - n/a*** + - ≥1.10, ≤1.13 + - ≥0.7.0 + - ≥3.7, ≤3.10 + * - n/a + - 1.7 + - n/a*** + - ≥1.9, ≤1.12 + - ≥0.7.0 + - ≥3.7, ≤3.10 + * - n/a + - 1.6 + - n/a*** + - ≥1.8, ≤1.11 + - ≥0.4.1 + - ≥3.7, ≤3.9 + * - n/a + - 1.5 + - n/a*** + - ≥1.7, ≤1.10 + - ≥0.4.1 + - ≥3.6, ≤3.9 + * - n/a + - 1.4 + - n/a + - ≥1.6, ≤1.9 + - ≥0.4.0 + - ≥3.6, ≤3.9 + * - n/a + - 1.3 + - n/a + - ≥1.4, ≤1.8 + - ≥0.2.0 + - ≥3.6, ≤3.9 + * - n/a + - 1.2 + - n/a + - ≥1.4, ≤1.8 + - n/a* + - ≥3.6, ≤3.8 + * - n/a + - 1.1 + - n/a + - ≥1.3, ≤1.8 + - n/a* + - ≥3.6, ≤3.8 + * - n/a + - 1.0 + - n/a + - ≥1.3, ≤1.7 + - n/a* + - ≥3.6, ≤3.8 + +\* ``torchmetrics`` was part of ``pytorch_lightning`` at the time and was decoupled to a separate package in v1.3. + +\*\* The joint ``lightning`` package was first published in version 1.8 + +\*\*\* Fabric is the evolution of ``LightningLite`` which was released inside ``pytorch_lightning`` 1.5 and was decoupled to a separate package in v1.9 diff --git a/source/visualize/experiment_managers.rst b/docs/source-pytorch/visualize/experiment_managers.rst similarity index 91% rename from source/visualize/experiment_managers.rst rename to docs/source-pytorch/visualize/experiment_managers.rst index 30fada9..e40b741 100644 --- a/source/visualize/experiment_managers.rst +++ b/docs/source-pytorch/visualize/experiment_managers.rst @@ -5,7 +5,7 @@ To track other artifacts, such as histograms or model topology graphs first sele .. 
code-block:: python - from pytorch_lightning import loggers as pl_loggers + from lightning.pytorch import loggers as pl_loggers tensorboard = pl_loggers.TensorBoardLogger() trainer = Trainer(logger=tensorboard) diff --git a/source/visualize/loggers.rst b/docs/source-pytorch/visualize/loggers.rst similarity index 100% rename from source/visualize/loggers.rst rename to docs/source-pytorch/visualize/loggers.rst diff --git a/source/visualize/logging_advanced.rst b/docs/source-pytorch/visualize/logging_advanced.rst similarity index 87% rename from source/visualize/logging_advanced.rst rename to docs/source-pytorch/visualize/logging_advanced.rst index ca11e39..fd9153b 100644 --- a/source/visualize/logging_advanced.rst +++ b/docs/source-pytorch/visualize/logging_advanced.rst @@ -12,11 +12,11 @@ Track and Visualize Experiments (advanced) **************************** Change progress bar defaults **************************** -To change the default values (ie: version number) shown in the progress bar, override the :meth:`~pytorch_lightning.callbacks.progress.base.ProgressBarBase.get_metrics` method in your logger. +To change the default values (ie: version number) shown in the progress bar, override the :meth:`~lightning.pytorch.callbacks.progress.progress_bar.ProgressBar.get_metrics` method in your logger. .. code-block:: python - from pytorch_lightning.callbacks.progress import Tqdm + from lightning.pytorch.callbacks.progress import Tqdm class CustomProgressBar(Tqdm): @@ -37,7 +37,7 @@ Modify logging frequency ======================== Logging a metric on every single batch can slow down training. By default, Lightning logs every 50 rows, or 50 training steps. -To change this behaviour, set the *log_every_n_steps* :class:`~pytorch_lightning.trainer.trainer.Trainer` flag. +To change this behaviour, set the *log_every_n_steps* :class:`~lightning.pytorch.trainer.trainer.Trainer` flag. .. 
testcode:: @@ -49,20 +49,19 @@ To change this behaviour, set the *log_every_n_steps* :class:`~pytorch_lightning Modify flushing frequency ========================= -Metrics are kept in memory for N steps to improve training efficiency. Every N steps, metrics flush to disk. To change the frequency of this flushing, use the *flush_logs_every_n_steps* Trainer argument. +Some loggers keep logged metrics in memory for N steps and only periodically flush them to disk to improve training efficiency. +Every logger handles this a bit differently. For example, here is how to fine-tune flushing for the TensorBoard logger: .. code-block:: python - # faster training, high memory - Trainer(flush_logs_every_n_steps=500) + # Default used by TensorBoard: Write to disk after 10 logging events or every two minutes + logger = TensorBoardLogger(..., max_queue=10, flush_secs=120) - # slower training, low memory - Trainer(flush_logs_every_n_steps=500) + # Faster training, more memory used + logger = TensorBoardLogger(..., max_queue=100) -The higher *flush_logs_every_n_steps* is, the faster the model will train but the memory will build up until the next flush. -The smaller *flush_logs_every_n_steps* is, the slower the model will train but memory will be kept to a minimum. - -TODO: chart + # Slower training, less memory used + logger = TensorBoardLogger(..., max_queue=1) ---- @@ -114,7 +113,7 @@ logger ====== **Default:** True -Send logs to the logger like ``Tensorboard``, or any other custom logger passed to the :class:`~pytorch_lightning.trainer.trainer.Trainer` (Default: ``True``). +Send logs to the logger like ``Tensorboard``, or any other custom logger passed to the :class:`~lightning.pytorch.trainer.trainer.Trainer` (Default: ``True``). .. code-block:: python @@ -211,11 +210,11 @@ reduce_fx ========= **Default:** :meth:`torch.mean` -Reduction function over step values for end of epoch. Uses :meth:`torch.mean` by default. +Reduction function over step values for end of epoch. 
Uses :meth:`torch.mean` by default and is not applied when a :class:`torchmetrics.Metric` is logged. .. code-block:: python - self.log(reduce_fx=torch.mean) + self.log(..., reduce_fx=torch.mean) ---- @@ -315,7 +314,7 @@ To save logs to a remote filesystem, prepend a protocol like "s3:/" to the root_ .. code-block:: python - from pytorch_lightning.loggers import TensorBoardLogger + from lightning.pytorch.loggers import TensorBoardLogger logger = TensorBoardLogger(save_dir="s3://my_bucket/logs/") @@ -356,10 +355,10 @@ In LightningModule * - Method - on_step - on_epoch - * - on_after_backward, on_before_backward, on_before_optimizer_step, on_before_zero_grad, training_step, training_step_end + * - on_after_backward, on_before_backward, on_before_optimizer_step, optimizer_step, configure_gradient_clipping, on_before_zero_grad, training_step - True - False - * - training_epoch_end, test_epoch_end, test_step, test_step_end, validation_epoch_end, validation_step, validation_step_end + * - test_step, validation_step - False - True diff --git a/source/visualize/logging_basic.rst b/docs/source-pytorch/visualize/logging_basic.rst similarity index 76% rename from source/visualize/logging_basic.rst rename to docs/source-pytorch/visualize/logging_basic.rst index 8732305..61de5a9 100644 --- a/source/visualize/logging_basic.rst +++ b/docs/source-pytorch/visualize/logging_basic.rst @@ -29,8 +29,8 @@ To track a metric, simply use the *self.log* method available inside the *Lightn class LitModel(pl.LightningModule): def training_step(self, batch, batch_idx): - value = self.global_step - self.log("some_value", self.global_step) + value = ... + self.log("some_value", value) To log multiple metrics at once, use *self.log_dict* @@ -50,7 +50,7 @@ To view metrics in the commandline progress bar, set the *prog_bar* argument to .. 
code-block:: python - self.log(prog_bar=True) + self.log(..., prog_bar=True) TODO: need progress bar here @@ -58,13 +58,13 @@ TODO: need progress bar here View in the browser =================== -To view metrics in the browser you need to use an *experiment manager* with these capabilities. By Default, Lightning uses Tensorboard which is free and opensource. +To view metrics in the browser you need to use an *experiment manager* with these capabilities. -Tensorboard is already enabled by default +By Default, Lightning uses Tensorboard (if available) and a simple CSV logger otherwise. .. code-block:: python - # every trainer already has tensorboard enabled by default + # every trainer already has tensorboard enabled by default (if the dependency is available) trainer = Trainer() To launch the tensorboard dashboard run the following command on the commandline. @@ -100,39 +100,14 @@ When you call self.log inside the *validation_step* and *test_step*, Lightning a TODO: show single point plotted -If you don't want to average, add your own function in the *reduce_fx* argument. +If you don't want to average you can also choose from ``{min,max,sum}`` by passing the *reduce_fx* argument. .. code-block:: python # default function - self.log(reduce_fx=torch.mean) + self.log(..., reduce_fx="mean") ----- - -************ -Track images -************ -If your *experiment manager* supports image visualization, simply *log* the image with *self.log* - -.. code-block:: python - - # (32 batch samples, 3 channels, 32 width, 32 height) - image = torch.Tensor(32, 3, 28, 28) - self.log("an_image", image) - ----- - -********** -Track text -********** -If your *experiment manager* supports text visualization, simply *log* the text with *self.log* - -.. code-block:: python - - text = "hello world" - self.log("some_text", text) - -# TODO: show screenshot +For other reductions, we recommend logging a :class:`torchmetrics.Metric` instance instead. 
---- diff --git a/source/visualize/logging_expert.rst b/docs/source-pytorch/visualize/logging_expert.rst similarity index 77% rename from source/visualize/logging_expert.rst rename to docs/source-pytorch/visualize/logging_expert.rst index 3b44ee9..febb662 100644 --- a/source/visualize/logging_expert.rst +++ b/docs/source-pytorch/visualize/logging_expert.rst @@ -19,11 +19,11 @@ If you'd like to change the way the progress bar displays information you can us Use the TQDMProgressBar ======================= -To use the TQDMProgressBar pass it into the *callbacks* :class:`~pytorch_lightning.trainer.trainer.Trainer` argument. +To use the TQDMProgressBar pass it into the *callbacks* :class:`~lightning.pytorch.trainer.trainer.Trainer` argument. .. code-block:: python - from pytorch_lightning.callbacks import TQDMProgressBar + from lightning.pytorch.callbacks import TQDMProgressBar trainer = Trainer(callbacks=[TQDMProgressBar()]) @@ -37,11 +37,11 @@ The RichProgressBar can add custom colors and beautiful formatting for your prog pip install rich -Then pass the callback into the callbacks :class:`~pytorch_lightning.trainer.trainer.Trainer` argument: +Then pass the callback into the callbacks :class:`~lightning.pytorch.trainer.trainer.Trainer` argument: .. code-block:: python - from pytorch_lightning.callbacks import RichProgressBar + from lightning.pytorch.callbacks import RichProgressBar trainer = Trainer(callbacks=[RichProgressBar()]) @@ -49,8 +49,8 @@ The rich progress bar can also have custom themes .. code-block:: python - from pytorch_lightning.callbacks import RichProgressBar - from pytorch_lightning.callbacks.progress.rich_progress import RichProgressBarTheme + from lightning.pytorch.callbacks import RichProgressBar + from lightning.pytorch.callbacks.progress.rich_progress import RichProgressBarTheme # create your own theme! 
theme = RichProgressBarTheme(description="green_yellow", progress_bar="green1") @@ -64,11 +64,11 @@ The rich progress bar can also have custom themes ************************ Customize a progress bar ************************ -To customize either the :class:`~pytorch_lightning.callbacks.TQDMProgressBar` or the :class:`~pytorch_lightning.callbacks.RichProgressBar`, subclass it and override any of its methods. +To customize either the :class:`~lightning.pytorch.callbacks.TQDMProgressBar` or the :class:`~lightning.pytorch.callbacks.RichProgressBar`, subclass it and override any of its methods. .. code-block:: python - from pytorch_lightning.callbacks import TQDMProgressBar + from lightning.pytorch.callbacks import TQDMProgressBar class LitProgressBar(TQDMProgressBar): @@ -82,14 +82,14 @@ To customize either the :class:`~pytorch_lightning.callbacks.TQDMProgressBar` o *************************** Build your own progress bar *************************** -To build your own progress bar, subclass :class:`~pytorch_lightning.callbacks.ProgressBarBase` +To build your own progress bar, subclass :class:`~lightning.pytorch.callbacks.ProgressBar` .. code-block:: python - from pytorch_lightning.callbacks import ProgressBarBase + from lightning.pytorch.callbacks import ProgressBar - class LitProgressBar(ProgressBarBase): + class LitProgressBar(ProgressBar): def __init__(self): super().__init__() # don't forget this :) self.enable = True @@ -112,11 +112,11 @@ To build your own progress bar, subclass :class:`~pytorch_lightning.callbacks.Pr ******************************* Integrate an experiment manager ******************************* -To create an integration between a custom logger and Lightning, subclass :class:`~pytorch_lightning.loggers.base.LightningLoggerBase` +To create an integration between a custom logger and Lightning, subclass :class:`~lightning.pytorch.loggers.logger.Logger` ..
code-block:: python - from pytorch_lightning.loggers import Logger + from lightning.pytorch.loggers import Logger class LitLogger(Logger): diff --git a/source/visualize/logging_intermediate.rst b/docs/source-pytorch/visualize/logging_intermediate.rst similarity index 81% rename from source/visualize/logging_intermediate.rst rename to docs/source-pytorch/visualize/logging_intermediate.rst index 1b0dd6b..24c3760 100644 --- a/source/visualize/logging_intermediate.rst +++ b/docs/source-pytorch/visualize/logging_intermediate.rst @@ -14,9 +14,9 @@ To track other artifacts, such as histograms or model topology graphs first sele .. code-block:: python - from pytorch_lightning import loggers as pl_loggers + from lightning.pytorch import loggers as pl_loggers - tensorboard = pl_loggers.TensorBoardLogger() + tensorboard = pl_loggers.TensorBoardLogger(save_dir="") trainer = Trainer(logger=tensorboard) then access the logger's API directly @@ -35,17 +35,6 @@ then access the logger's API directly ---- -**************************************** -Track multiple metrics in the same chart -**************************************** -If your logger supports plotting multiple metrics on the same chart, pass in a dictionary to *self.log*. - -.. code-block:: python - - self.log("performance", {"acc": acc, "recall": recall}) - ----- - ********************* Track hyperparameters ********************* diff --git a/docs/source-pytorch/visualize/supported_exp_managers.rst b/docs/source-pytorch/visualize/supported_exp_managers.rst new file mode 100644 index 0000000..49ab10c --- /dev/null +++ b/docs/source-pytorch/visualize/supported_exp_managers.rst @@ -0,0 +1,204 @@ +Comet.ml +======== +To use `Comet.ml `_ first install the comet package: + +.. code-block:: bash + + pip install comet-ml + +Configure the logger and pass it to the :class:`~lightning.pytorch.trainer.trainer.Trainer`: + +.. 
testcode:: + :skipif: not _COMET_AVAILABLE + + from lightning.pytorch.loggers import CometLogger + + comet_logger = CometLogger(api_key="YOUR_COMET_API_KEY") + trainer = Trainer(logger=comet_logger) + +Access the comet logger from any function (except the LightningModule *init*) to use its API for tracking advanced artifacts + +.. code-block:: python + + class LitModel(LightningModule): + def any_lightning_module_function_or_hook(self): + comet = self.logger.experiment + fake_images = torch.Tensor(32, 3, 28, 28) + comet.add_image("generated_images", fake_images, 0) + +Here's the full documentation for the :class:`~lightning.pytorch.loggers.CometLogger`. + +---- + +MLflow +====== +To use `MLflow `_ first install the MLflow package: + +.. code-block:: bash + + pip install mlflow + +Configure the logger and pass it to the :class:`~lightning.pytorch.trainer.trainer.Trainer`: + +.. testcode:: + :skipif: not _MLFLOW_AVAILABLE + + from lightning.pytorch.loggers import MLFlowLogger + + mlf_logger = MLFlowLogger(experiment_name="lightning_logs", tracking_uri="file:./ml-runs") + trainer = Trainer(logger=mlf_logger) + +Access the mlflow logger from any function (except the LightningModule *init*) to use its API for tracking advanced artifacts + +.. code-block:: python + + class LitModel(LightningModule): + def any_lightning_module_function_or_hook(self): + mlf_logger = self.logger.experiment + fake_images = torch.Tensor(32, 3, 28, 28) + mlf_logger.add_image("generated_images", fake_images, 0) + +Here's the full documentation for the :class:`~lightning.pytorch.loggers.MLFlowLogger`. + +---- + +Neptune.ai +========== +To use `Neptune.ai `_ first install the neptune package: + +.. code-block:: bash + + pip install neptune + +or with conda: + +.. code-block:: bash + + conda install -c conda-forge neptune + +Configure the logger and pass it to the :class:`~lightning.pytorch.trainer.trainer.Trainer`: + +.. 
testcode:: + :skipif: not _NEPTUNE_AVAILABLE + + import neptune + from lightning.pytorch.loggers import NeptuneLogger + + neptune_logger = NeptuneLogger( + api_key=neptune.ANONYMOUS_API_TOKEN, # replace with your own + project="common/pytorch-lightning-integration", # format "" + ) + trainer = Trainer(logger=neptune_logger) + +Access the neptune logger from any function (except the LightningModule *init*) to use its API for tracking advanced artifacts + +.. code-block:: python + + class LitModel(LightningModule): + def any_lightning_module_function_or_hook(self): + neptune_logger = self.logger.experiment["your/metadata/structure"] + neptune_logger.append(metadata) + +Here's the full documentation for the :class:`~lightning.pytorch.loggers.NeptuneLogger`. + +---- + +Tensorboard +=========== +`TensorBoard `_ can be installed with: + +.. code-block:: bash + + pip install tensorboard + +Configure the logger and pass it to the :class:`~lightning.pytorch.trainer.trainer.Trainer`: + +.. code-block:: python + + from lightning.pytorch.loggers import TensorBoardLogger + + logger = TensorBoardLogger() + trainer = Trainer(logger=logger) + +Access the tensorboard logger from any function (except the LightningModule *init*) to use its API for tracking advanced artifacts + +.. code-block:: python + + class LitModel(LightningModule): + def any_lightning_module_function_or_hook(self): + tensorboard_logger = self.logger.experiment + fake_images = torch.Tensor(32, 3, 28, 28) + tensorboard_logger.add_image("generated_images", fake_images, 0) + +Here's the full documentation for the :class:`~lightning.pytorch.loggers.TensorBoardLogger`. + +---- + +Weights and Biases +================== +To use `Weights and Biases `_ (wandb) first install the wandb package: + +.. code-block:: bash + + pip install wandb + +Configure the logger and pass it to the :class:`~lightning.pytorch.trainer.trainer.Trainer`: + +.. 
testcode:: + :skipif: not _WANDB_AVAILABLE + + from lightning.pytorch.loggers import WandbLogger + + wandb_logger = WandbLogger(project="MNIST", log_model="all") + trainer = Trainer(logger=wandb_logger) + + # log gradients and model topology + wandb_logger.watch(model) + +Access the wandb logger from any function (except the LightningModule *init*) to use its API for tracking advanced artifacts + +.. code-block:: python + + class MyModule(LightningModule): + def any_lightning_module_function_or_hook(self): + wandb_logger = self.logger.experiment + fake_images = torch.Tensor(32, 3, 28, 28) + + # Option 1 + wandb_logger.log({"generated_images": [wandb.Image(fake_images, caption="...")]}) + + # Option 2 for specifically logging images + wandb_logger.log_image(key="generated_images", images=[fake_images]) + +Here's the full documentation for the :class:`~lightning.pytorch.loggers.WandbLogger`. +`Demo in Google Colab `__ with hyperparameter search and model logging. + +---- + +Use multiple exp managers +========================= +To use multiple experiment managers at the same time, pass a list to the *logger* :class:`~lightning.pytorch.trainer.trainer.Trainer` argument. + +.. testcode:: + :skipif: (not _TENSORBOARD_AVAILABLE and not _TENSORBOARDX_AVAILABLE) or not _WANDB_AVAILABLE + + from lightning.pytorch.loggers import TensorBoardLogger, WandbLogger + + logger1 = TensorBoardLogger() + logger2 = WandbLogger() + trainer = Trainer(logger=[logger1, logger2]) + + +Access all loggers from any function (except the LightningModule *init*) to use their APIs for tracking advanced artifacts + +.. 
code-block:: python + + class MyModule(LightningModule): + def any_lightning_module_function_or_hook(self): + tensorboard_logger = self.loggers.experiment[0] + wandb_logger = self.loggers.experiment[1] + + fake_images = torch.Tensor(32, 3, 28, 28) + + tensorboard_logger.add_image("generated_images", fake_images, 0) + wandb_logger.add_image("generated_images", fake_images, 0) diff --git a/docs/starter/converting.html b/docs/starter/converting.html deleted file mode 100644 index 0581990..0000000 --- a/docs/starter/converting.html +++ /dev/null @@ -1,877 +0,0 @@ - - - - - - - - - - - - - - How to Organize PyTorch Into Lightning — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • How to Organize PyTorch Into Lightning
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

How to Organize PyTorch Into Lightning

-

To enable your code to work with Lightning, perform the following to organize PyTorch into Lightning.

-
-
-

1. Keep your Computational Code

-

Keep your regular nn.Module architecture

-
import pytorch_lightning as pl
-import torch
-import torch.nn as nn
-import torch.nn.functional as F
-
-
-class LitModel(nn.Module):
-    def __init__(self):
-        super().__init__()
-        self.layer_1 = nn.Linear(28 * 28, 128)
-        self.layer_2 = nn.Linear(128, 10)
-
-    def forward(self, x):
-        x = x.view(x.size(0), -1)
-        x = self.layer_1(x)
-        x = F.relu(x)
-        x = self.layer_2(x)
-        return x
-
-
-
-
-
-

2. Configure Training Logic

-

In the training_step of the LightningModule configure how your training routine behaves with a batch of training data:

-
class LitModel(pl.LightningModule):
-    def __init__(self, encoder):
-        super().__init__()
-        self.encoder = encoder
-
-    def training_step(self, batch, batch_idx):
-        x, y = batch
-        y_hat = self.encoder(x)
-        loss = F.cross_entropy(y_hat, y)
-        return loss
-
-
-
-

Note

-

If you need to fully own the training loop for complicated legacy projects, check out Own your loop.

-
-
-
-
-

3. Move Optimizer(s) and LR Scheduler(s)

-

Move your optimizers to the configure_optimizers() hook.

-
class LitModel(pl.LightningModule):
-    def configure_optimizers(self):
-        optimizer = torch.optim.Adam(self.encoder.parameters(), lr=1e-3)
-        lr_scheduler = torch.optim.lr_scheduler.StepLR(optimizer, step_size=1)
-        return [optimizer], [lr_scheduler]
-
-
-
-
-
-

4. Organize Validation Logic (optional)

-

If you need a validation loop, configure how your validation routine behaves with a batch of validation data:

-
class LitModel(pl.LightningModule):
-    def validation_step(self, batch, batch_idx):
-        x, y = batch
-        y_hat = self.encoder(x)
-        val_loss = F.cross_entropy(y_hat, y)
-        self.log("val_loss", val_loss)
-
-
-
-

Tip

-

trainer.validate() loads the best checkpoint automatically by default if checkpointing was enabled during fitting.

-
-
-
-
-

5. Organize Testing Logic (optional)

-

If you need a test loop, configure how your testing routine behaves with a batch of test data:

-
class LitModel(pl.LightningModule):
-    def test_step(self, batch, batch_idx):
-        x, y = batch
-        y_hat = self.encoder(x)
-        test_loss = F.cross_entropy(y_hat, y)
-        self.log("test_loss", test_loss)
-
-
-
-
-
-

6. Configure Prediction Logic (optional)

-

If you need a prediction loop, configure how your prediction routine behaves with a batch of test data:

-
class LitModel(LightningModule):
-    def predict_step(self, batch, batch_idx):
-        x, y = batch
-        pred = self.encoder(x)
-        return pred
-
-
-
-
-
-

7. Remove any .cuda() or .to(device) Calls

-

Your LightningModule can automatically run on any hardware!

-

If you have any explicit calls to .cuda() or .to(device), you can remove them since Lightning makes sure that the data coming from DataLoader -and all the Module instances initialized inside LightningModule.__init__ are moved to the respective devices automatically. -If you still need to access the current device, you can use self.device anywhere in your LightningModule except in the __init__ and setup methods.

-
class LitModel(LightningModule):
-    def training_step(self, batch, batch_idx):
-        z = torch.randn(4, 5, device=self.device)
-        ...
-
-
-

Hint: If you are initializing a Tensor within the LightningModule.__init__ method and want it to be moved to the device automatically you should call -register_buffer() to register it as a buffer.

-
class LitModel(LightningModule):
-    def __init__(self):
-        super().__init__()
-        self.register_buffer("running_mean", torch.zeros(num_features))
-
-
-
-
-
-

8. Use your own data

-

Regular PyTorch DataLoaders work with Lightning. For more modular and scalable datasets, check out LightningDataModule.

-
-
-
-

Good to know

-

Additionally, you can run only the validation loop using the validate() method.

-
model = LitModel()
-trainer.validate(model)
-
-
-
-

Note

-

model.eval() and torch.no_grad() are called automatically for validation.

-
-

The test loop isn’t used within fit(), therefore, you would need to explicitly call test().

-
model = LitModel()
-trainer.test(model)
-
-
-
-

Note

-

model.eval() and torch.no_grad() are called automatically for testing.

-
-
-

Tip

-

trainer.test() loads the best checkpoint automatically by default if checkpointing is enabled.

-
-

The predict loop will not be used until you call predict().

-
model = LitModel()
-trainer.predict(model)
-
-
-
-

Note

-

model.eval() and torch.no_grad() are called automatically for prediction.

-
-
-

Tip

-

trainer.predict() loads the best checkpoint automatically by default if checkpointing is enabled.

-
-
-
- - -
- -
-
- - - - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/starter/installation.html b/docs/starter/installation.html deleted file mode 100644 index 908f4b9..0000000 --- a/docs/starter/installation.html +++ /dev/null @@ -1,738 +0,0 @@ - - - - - - - - - - - - - - Installation — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- - - - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Installation

-
-
-

Installation with pip

-

If you want, install any supported version of PyTorch from the PyTorch Installation Page. -Now you can install Lightning with pip using the following command:

-
pip install pytorch-lightning
-
-
-
-
-
-

Installation with Conda

-

If you don’t have conda installed, follow the Conda Installation Guide. -Lightning can be installed with conda using the following command:

-
conda install pytorch-lightning -c conda-forge
-
-
-

You can also use Conda Environments:

-
conda activate my_env
-conda install pytorch-lightning -c conda-forge
-
-
-
-
-
-

Installation from Source

-

Install nightly from the source. Note that it contains all the bug fixes and newly released features that -are not published yet. This is the bleeding edge, so use it at your own discretion.

-
pip install https://github.com/PyTorchLightning/pytorch-lightning/archive/master.zip
-
-
-

Install future patch releases from the source. Note that the patch release contains only the bug fixes for the recent major release.

-
pip install https://github.com/PyTorchLightning/pytorch-lightning/archive/refs/heads/release/1.5.x.zip
-
-
-
-
-
-

Lightning Coverage

-

PyTorch Lightning is maintained and tested on different Python and PyTorch versions.

-

Check out the CI Coverage for more info.

-

It is rigorously tested across multiple GPUs, TPUs, CPUs and IPUs. GPU tests run on two NVIDIA P100. TPU tests run on Google GKE TPUv2/3. -TPU py3.7 means we support Colab and Kaggle env. IPU tests run on MK1 IPU boxes.

-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/starter/introduction.html b/docs/starter/introduction.html deleted file mode 100644 index 1b6c6c8..0000000 --- a/docs/starter/introduction.html +++ /dev/null @@ -1,1038 +0,0 @@ - - - - - - - - - - - - - - Lightning 15분 만에 배워보기 — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Lightning 15분 만에 배워보기
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Lightning 15분 만에 배워보기

-

필요한 배경지식: 없음

-

목표: 이 문서에서는 일반적인 Lightning 워크플로우의 주요한 7단계를 안내합니다.

-

PyTorch Lightning(파이토치 라이트닝)은 대규모로 엄청 빠른 성능을 요구하면서 최대한의 유연성을 필요로 하는 -전문적인 AI 연구자들과 머신러닝 엔지니어들을 위한 “배터리가 포함된(batteries included)” 딥러닝 프레임워크입니다.

-

-

Lightning(라이트닝)은 반복적으로 사용하는 코드(boilerplate)를 제거하고 확장성(scalability)을 확보하도록 PyTorch 코드를 재구성합니다.

-
-

-
-

PyTorch 코드를 재구성함으로써, Lightning에서는 이런 것들이 가능해집니다:

-
-

- -
-
-

완전한 유연성

-

반복되는 코드 없이 PyTorch를 그대로 사용하여 아이디어를 구현합니다.

-
- - -

-

- -
-
-

재현성 + 가독성

-

연구용 코드와 엔지니어링 코드를 분리하여 재현성을 갖추고 더 나은 가독성을 제공합니다.

-
- - -

-

- -
-
-

간단한 다중 GPU 학습

-

코드 변경 없이 여러개의 GPU/TPU/HPU 등을 사용합니다.

-
- - -

-

- -
-
-

테스트 완료

-

이미 모든 테스트를 완료하여 직접 테스트 할 필요없습니다.

-
- - -

-
-

-
-

1: PyTorch Lightning 설치하기

-
-

pip 사용자라면,

-
pip install pytorch-lightning
-
-
-
-

conda 사용자라면,

-
conda install pytorch-lightning -c conda-forge
-
-
-
-

또는 advanced install guide 를 참조하세요.

-
-
-
-

2: LightningModule 정의하기

-

LightningModule을 사용하여 PyTorch nn.Module이 training_step (뿐만 아니라 validation_step이나 test_step) 내에서 복잡한 방식으로 함께 동작할 수 있도록 합니다.

-
import os
-from torch import optim, nn, utils, Tensor
-from tests.helpers.datasets import MNIST
-import pytorch_lightning as pl
-
-# 원하는만큼의 nn.Module (또는 기존 모델)을 정의합니다.
-encoder = nn.Sequential(nn.Linear(28 * 28, 64), nn.ReLU(), nn.Linear(64, 3))
-decoder = nn.Sequential(nn.Linear(3, 64), nn.ReLU(), nn.Linear(64, 28 * 28))
-
-# LightningModule을 정의합니다.
-class LitAutoEncoder(pl.LightningModule):
-    def __init__(self, encoder, decoder):
-        super().__init__()
-        self.encoder = encoder
-        self.decoder = decoder
-
-    def training_step(self, batch, batch_idx):
-        # training_step defines the train loop.
-        # it is independent of forward
-        x, y = batch
-        x = x.view(x.size(0), -1)
-        z = self.encoder(x)
-        x_hat = self.decoder(z)
-        loss = nn.functional.mse_loss(x_hat, x)
-        # Logging to TensorBoard by default
-        self.log("train_loss", loss)
-        return loss
-
-    def configure_optimizers(self):
-        optimizer = optim.Adam(self.parameters(), lr=1e-3)
-        return optimizer
-
-
-# 오토인코더(autoencoder)를 초기화합니다.
-autoencoder = LitAutoEncoder(encoder, decoder)
-
-
-
-
-
-

3: 데이터셋 정의하기

-

Lightning은 어떠한 순회 가능한 객체(iterable; DataLoader, numpy 등…)도 학습/검증/테스트/예측용으로 나누어 사용할 수 있습니다.

-
# 데이터를 설정합니다.
-dataset = MNIST(os.getcwd(), download=True)
-train_loader = utils.data.DataLoader(dataset)
-
-
-
-
-
-

4: 모델 학습하기

-

Lightning Trainer 는 모든 LightningModule 과 데이터셋을 “함께(mix)” 학습할 수 있으며, -확장에 필요한 모든 엔지니어링적 복잡성들을 추상화(abstract)합니다.

-
# 모델을 학습합니다 (힌트: 빠른 아이디어 반복에 도움이 되는 Trainer의 인자들을 참고하세요)
-trainer = pl.Trainer(limit_train_batches=100, max_epochs=1)
-trainer.fit(model=autoencoder, train_dataloaders=train_loader)
-
-
-

Lightning Trainer 는 아래 예시들을 포함하여 40종류 이상의 기법들 을 자동화합니다:

- -
-
-
-

5: 모델 사용하기

-

모델을 학습한 뒤에는 ONNX, TorchScript로 내보내기(export)하여 상용 환경에 포함하거나 단순히 가중치를 불러오고 예측을 실행할 수 있습니다.

-
# 체크포인트(checkpoint)를 불러옵니다.
-checkpoint = "./lightning_logs/version_0/checkpoints/epoch=0-step=100.ckpt"
-autoencoder = LitAutoEncoder.load_from_checkpoint(checkpoint, encoder=encoder, decoder=decoder)
-
-# 학습한 nn.Module을 선택합니다.
-encoder = autoencoder.encoder
-encoder.eval()
-
-# 4개의 가짜 이미지로 예측(embed)합니다!
-fake_image_batch = Tensor(4, 28 * 28)
-embeddings = encoder(fake_image_batch)
-print("⚡" * 20, "\nPredictions (4 image embeddings):\n", embeddings, "\n", "⚡" * 20)
-
-
-
-
-
-

6: 학습 시각화하기

-

Lightning에는 많은 배터리가 포함되어 있습니다. 실험을 시각화하는데 사용하는 텐서보드(Tensorboard)도 유용한 도구 중 하나입니다.

-

명령줄(commandline)에서 아래를 실행하고 브라우저에서 http://localhost:6006/ 을 열어보세요.

-
tensorboard --logdir .
-
-
-
-
-
-

7: 엄청 빠르게 학습하기

-

Trainer에 인자(argument)를 사용하여 고급 학습 기능을 사용할 수 있습니다. 이는 다른 코드를 변경하지 않으면서 학습 단계(train loop)에 자동으로 통합할 수 있도록 하는 최신(state-of-the-art)의 기술입니다.

-
# 4개의 GPU에서 학습
-trainer = Trainer(
-    devices=4,
-    accelerator="gpu",
- )
-
-# Deepspeed/FSDP를 사용하여 1TB 이상의 매개변수를 갖는 모델 학습
-trainer = Trainer(
-    devices=4,
-    accelerator="gpu",
-    strategy="deepspeed_stage_2",
-    precision=16
- )
-
-# 빠른 아이디어 반복을 위한 20개 이상의 유용한 플래그(flag)
-trainer = Trainer(
-    max_epochs=10,
-    min_epochs=5,
-    overfit_batches=1
- )
-
-# 최신 기술을 사용
-trainer = Trainer(callbacks=[StochasticWeightAveraging(...)])
-
-
-
-
-
-

유연성 극대화하기

-

Lightning의 핵심 원칙은 PyTorch의 어떠한 부분도 숨기지 않으면서 언제나 최대한의 유연성을 제공하는 것입니다.

-

Lightning은 프로젝트의 복잡도에 따라 추가적인 5단계의 유연성을 제공합니다.

-
-
-

학습 단계(loop) 사용자 정의하기

-Injecting custom code in a training loop -

LightningModule에서 사용할 수 있는 20개 이상의 메소드 (Hooks) 중 일부를 사용하여 훈련 단계 어디에든 사용자 정의 코드를 삽입할 수 있습니다.

-
class LitAutoEncoder(pl.LightningModule):
-    def backward(self, loss, optimizer, optimizer_idx):
-        loss.backward()
-
-
-
-
-
-

Trainer 확장하기

-

유사한 기능을 하는 여러줄의 코드가 있는 경우, 콜백(callback)을 사용하여 손쉽게 그룹으로 묶어서 해당하는 코드들을 동시에 켜거나 끌 수 있습니다.

-
trainer = Trainer(callbacks=[AWSCheckpoints()])
-
-
-
-
-
-

PyTorch 자체의 반복(loop) 사용하기

-

최첨단 연구 시 특정 유형의 작업들을 위해, Lightning은 전문가들이 다양한 방식으로 학습 단계를 완전히 제어할 수 있는 기능을 제공합니다.

-
-
-
-
-

다음 단계

-

사용 사례에 따라, 아래 내용들 중 하나를 다음 단계로 살펴보세요.

-
-
- - -
- -
-
- - - - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/starter/lightning_lite.html b/docs/starter/lightning_lite.html deleted file mode 100644 index 3eed1ab..0000000 --- a/docs/starter/lightning_lite.html +++ /dev/null @@ -1,1340 +0,0 @@ - - - - - - - - - - - - - - LightningLite (Stepping Stone to Lightning) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • LightningLite (Stepping Stone to Lightning)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

LightningLite (Stepping Stone to Lightning)

-

LightningLite enables pure PyTorch users to scale their existing code -on any kind of device while retaining full control over their own loops and optimization logic.

-Animation showing how to convert your PyTorch code to LightningLite. -
-

-
-

LightningLite is the right tool for you if you match one of the two following descriptions:

-
    -
  • I want to quickly scale my existing code to multiple devices with minimal code changes.

  • -
  • I would like to convert my existing code to the Lightning API, but a full transition to Lightning might be too complex. I am looking for a stepping stone to ensure reproducibility during the transition.

  • -
-
-

Warning

-

LightningLite is currently a beta feature. Its API is subject to change based on your feedback.

-
-
-
-

Learn by example

-
-

My Existing PyTorch Code

-

The run function contains a custom training loop used to train MyModel on MyDataset for num_epochs epochs.

-
import torch
-from torch import nn
-from torch.utils.data import DataLoader, Dataset
-
-
-class MyModel(nn.Module):
-    ...
-
-
-class MyDataset(Dataset):
-    ...
-
-
-def run(args):
-    device = "cuda" if torch.cuda.is_available() else "cpu"
-
-    model = MyModel(...).to(device)
-    optimizer = torch.optim.SGD(model.parameters(), ...)
-
-    dataloader = DataLoader(MyDataset(...), ...)
-
-    model.train()
-    for epoch in range(args.num_epochs):
-        for batch in dataloader:
-            batch = batch.to(device)
-            optimizer.zero_grad()
-            loss = model(batch)
-            loss.backward()
-            optimizer.step()
-
-
-run(args)
-
-
-
-
-
-

Convert to LightningLite

-

Here are five required steps to convert to LightningLite.

-
    -
  1. Subclass LightningLite and override its run() method.

  2. -
  3. Move the body of your existing run function into the LightningLite run method.

  4. -
  5. Remove all .to(...), .cuda() etc calls since LightningLite will take care of it.

  6. -
  7. Apply setup() over each model and optimizers pair and setup_dataloaders() on all your dataloaders and replace loss.backward() by self.backward(loss).

  8. -
  9. Instantiate your LightningLite subclass and call its run() method.

  10. -
-
-

-
-
import torch
-from torch import nn
-from torch.utils.data import DataLoader, Dataset
-from pytorch_lightning.lite import LightningLite
-
-
-class MyModel(nn.Module):
-    ...
-
-
-class MyDataset(Dataset):
-    ...
-
-
-class Lite(LightningLite):
-    def run(self, args):
-
-        model = MyModel(...)
-        optimizer = torch.optim.SGD(model.parameters(), ...)
-        model, optimizer = self.setup(model, optimizer)  # Scale your model / optimizers
-
-        dataloader = DataLoader(MyDataset(...), ...)
-        dataloader = self.setup_dataloaders(dataloader)  # Scale your dataloaders
-
-        model.train()
-        for epoch in range(args.num_epochs):
-            for batch in dataloader:
-                optimizer.zero_grad()
-                loss = model(batch)
-                self.backward(loss)  # instead of loss.backward()
-                optimizer.step()
-
-
-Lite(...).run(args)
-
-
-

That’s all. You can now train on any kind of device and scale your training. Check out this full MNIST training example with LightningLite.

-

LightningLite takes care of device management, so you don’t have to. -You should remove any device-specific logic within your code.

-

Here is how to train on eight GPUs with torch.bfloat16 precision:

-
Lite(strategy="ddp", devices=8, accelerator="gpu", precision="bf16").run(10)
-
-
-

Here is how to use DeepSpeed Zero3 with eight GPUs and precision 16:

-
Lite(strategy="deepspeed", devices=8, accelerator="gpu", precision=16).run(10)
-
-
-

LightningLite can also figure it out automatically for you!

-
Lite(devices="auto", accelerator="auto", precision=16).run(10)
-
-
-

You can also easily use distributed collectives if required. -Here is an example while running on 256 GPUs (eight GPUs times 32 nodes).

-
class Lite(LightningLite):
-    def run(self):
-
-        # Transfer and concatenate tensors across processes
-        self.all_gather(...)
-
-        # Transfer an object from one process to all the others
-        self.broadcast(..., src=...)
-
-        # The total number of processes running across all devices and nodes.
-        self.world_size
-
-        # The global index of the current process across all devices and nodes.
-        self.global_rank
-
-        # The index of the current process among the processes running on the local node.
-        self.local_rank
-
-        # The index of the current node.
-        self.node_rank
-
-        # Whether this global rank is rank zero.
-        if self.is_global_zero:
-            # do something on rank 0
-            ...
-
-        # Wait for all processes to enter this call.
-        self.barrier()
-
-
-Lite(strategy="ddp", devices=8, num_nodes=32, accelerator="gpu").run()
-
-
-

If you require custom data or model device placement, you can deactivate -LightningLite automatic placement by doing -self.setup_dataloaders(..., move_to_device=False) for the data and -self.setup(..., move_to_device=False) for the model. -Furthermore, you can access the current device from self.device or -rely on to_device() -utility to move an object to the current device.

-
-

Note

-

We recommend instantiating the models within the run() method as large models would cause an out-of-memory error otherwise.

-
-
-

Tip

-

If you have hundreds or thousands of lines within your run() function -and you are feeling unsure about them, then that is the correct feeling. -In 2019, our LightningModule was getting larger -and we got the same feeling, so we started to organize our code for simplicity, interoperability and standardization. -This is definitely a good sign that you should consider refactoring your code and / or switching to -LightningModule ultimately.

-
-
-
-
-

Distributed Training Pitfalls

-

The LightningLite provides you with the tools to scale your training, -but there are several major challenges ahead of you now:

- ---- - - - - - - - - - - - - - - - - - - - - -

Processes divergence

This happens when processes execute a different section of the code due to different if/else conditions, race conditions on existing files and so on, resulting in hanging.

Cross processes reduction

Miscalculated metrics or gradients due to errors in their reduction.

Large sharded models

Instantiation, materialization and state management of large models.

Rank 0 only actions

Logging, profiling, and so on.

Checkpointing / Early stopping / Callbacks / Logging

Ability to customize your training behavior easily and make it stateful.

Fault-tolerant training

Ability to resume from a failure as if it never happened.

-

If you are facing one of those challenges, then you are already meeting the limit of LightningLite. -We recommend that you convert to Lightning, so you never have to worry about those.

-
-
-
-

Convert to Lightning

-

LightningLite is a stepping stone to transition fully to the Lightning API and benefit -from its hundreds of features.

-

You can see our LightningLite class as a -future LightningModule, and slowly refactor your code into its API. -Below, the training_step(), forward(), -configure_optimizers(), train_dataloader() methods -are implemented.

-
class Lite(LightningLite):
-
-    # 1. This would become the LightningModule `__init__` function.
-    def run(self, args):
-        self.args = args
-
-        self.model = MyModel(...)
-
-        self.fit()  # This would be automated by the Lightning Trainer.
-
-    # 2. This can be fully removed as Lightning creates its own fitting loop,
-    # and sets up the model, optimizer, dataloader, etc for you.
-    def fit(self):
-        # setup everything
-        optimizer = self.configure_optimizers()
-        self.model, optimizer = self.setup(self.model, optimizer)
-        dataloader = self.setup_dataloaders(self.train_dataloader())
-
-        # start fitting
-        self.model.train()
-        for epoch in range(num_epochs):
-            for batch in enumerate(dataloader):
-                optimizer.zero_grad()
-                loss = self.training_step(batch, batch_idx)
-                self.backward(loss)
-                optimizer.step()
-
-    # 3. This stays here as it belongs to the LightningModule.
-    def forward(self, x):
-        return self.model(x)
-
-    def training_step(self, batch, batch_idx):
-        return self.forward(batch)
-
-    def configure_optimizers(self):
-        return torch.optim.SGD(self.model.parameters(), ...)
-
-    # 4. [Optionally] This can stay here or be extracted to the LightningDataModule to enable higher composability.
-    def train_dataloader(self):
-        return DataLoader(MyDataset(...), ...)
-
-
-Lite(...).run(args)
-
-
-

Finally, change the run() into a -__init__() and drop the fit call from inside.

-
from pytorch_lightning import LightningDataModule, LightningModule, Trainer
-
-
-class LightningModel(LightningModule):
-    def __init__(self, args):
-        super().__init__()
-        self.model = MyModel(...)
-
-    def forward(self, x):
-        return self.model(x)
-
-    def training_step(self, batch, batch_idx):
-        loss = self(batch)
-        self.log("train_loss", loss)
-        return loss
-
-    def configure_optimizers(self):
-        return torch.optim.SGD(self.model.parameters(), lr=0.001)
-
-
-class BoringDataModule(LightningDataModule):
-    def train_dataloader(self):
-        return DataLoader(MyDataset(...), ...)
-
-
-trainer = Trainer(max_epochs=10)
-trainer.fit(LightningModel(), datamodule=BoringDataModule())
-
-
-

You have successfully converted to PyTorch Lightning, and can now benefit from its hundreds of features!

-
-
-
-
-

Lightning Lite Flags

-

Lite is specialized in accelerated distributed training and inference. It offers you convenient ways to configure -your device and communication strategy and to switch seamlessly from one to the other. The terminology and usage are -identical to Lightning, which means minimum effort for you to convert when you decide to do so.

-
-

accelerator

-

Choose one of "cpu", "gpu", "tpu", "auto" (IPU support is coming soon).

-
# CPU accelerator
-lite = Lite(accelerator="cpu")
-
-# Running with GPU Accelerator using 2 GPUs
-lite = Lite(devices=2, accelerator="gpu")
-
-# Running with TPU Accelerator using 8 tpu cores
-lite = Lite(devices=8, accelerator="tpu")
-
-# Running with GPU Accelerator using the DistributedDataParallel strategy
-lite = Lite(devices=4, accelerator="gpu", strategy="ddp")
-
-
-

The "auto" option recognizes the machine you are on and selects the available accelerator.

-
# If your machine has GPUs, it will use the GPU Accelerator
-lite = Lite(devices=2, accelerator="auto")
-
-
-
-
-

strategy

-

Choose a training strategy: "dp", "ddp", "ddp_spawn", "tpu_spawn", "deepspeed", "ddp_sharded", or "ddp_sharded_spawn".

-
# Running with the DistributedDataParallel strategy on 4 GPUs
-lite = Lite(strategy="ddp", accelerator="gpu", devices=4)
-
-# Running with the DDP Spawn strategy using 4 cpu processes
-lite = Lite(strategy="ddp_spawn", accelerator="cpu", devices=4)
-
-
-

Additionally, you can pass in your custom strategy by configuring additional parameters.

-
from pytorch_lightning.strategies import DeepSpeedStrategy
-
-lite = Lite(strategy=DeepSpeedStrategy(stage=2), accelerator="gpu", devices=2)
-
-
-

Support for Horovod and Fully Sharded training strategies is coming soon.

-
-
-

devices

-

Configure the devices to run on. Can be of type:

-
    -
  • int: the number of devices (e.g., GPUs) to train on

  • -
  • list of int: which device index (e.g., GPU ID) to train on (0-indexed)

  • -
  • str: a string representation of one of the above

  • -
-
# default used by Lite, i.e., use the CPU
-lite = Lite(devices=None)
-
-# equivalent
-lite = Lite(devices=0)
-
-# int: run on two GPUs
-lite = Lite(devices=2, accelerator="gpu")
-
-# list: run on GPUs 1, 4 (by bus ordering)
-lite = Lite(devices=[1, 4], accelerator="gpu")
-lite = Lite(devices="1, 4", accelerator="gpu")  # equivalent
-
-# -1: run on all GPUs
-lite = Lite(devices=-1, accelerator="gpu")
-lite = Lite(devices="-1", accelerator="gpu")  # equivalent
-
-
-
-
-

gpus

-
-

Warning

-

gpus=x has been deprecated in v1.7 and will be removed in v2.0. -Please use accelerator='gpu' and devices=x instead.

-
-

Shorthand for setting devices=X and accelerator="gpu".

-
# Run on two GPUs
-lite = Lite(accelerator="gpu", devices=2)
-
-# Equivalent
-lite = Lite(devices=2, accelerator="gpu")
-
-
-
-
-

tpu_cores

-
-

Warning

-

tpu_cores=x has been deprecated in v1.7 and will be removed in v2.0. -Please use accelerator='tpu' and devices=x instead.

-
-

Shorthand for devices=X and accelerator="tpu".

-
# Run on eight TPUs
-lite = Lite(accelerator="tpu", devices=8)
-
-# Equivalent
-lite = Lite(devices=8, accelerator="tpu")
-
-
-
-
-

num_nodes

-

Number of cluster nodes for distributed operation.

-
# Default used by Lite
-lite = Lite(num_nodes=1)
-
-# Run on 8 nodes
-lite = Lite(num_nodes=8)
-
-
-

Learn more about distributed multi-node training on clusters here.

-
-
-

precision

-

Lightning Lite supports double precision (64), full precision (32), or half precision (16) operation (including bfloat16). -Half precision, or mixed precision, is the combined use of 32 and 16-bit floating points to reduce the memory footprint during model training. -This can result in improved performance, achieving significant speedups on modern GPUs.

-
# Default used by the Lite
-lite = Lite(precision=32, devices=1)
-
-# 16-bit (mixed) precision
-lite = Lite(precision=16, devices=1)
-
-# 16-bit bfloat precision
-lite = Lite(precision="bf16", devices=1)
-
-# 64-bit (double) precision
-lite = Lite(precision=64, devices=1)
-
-
-
-
-

plugins

-

Plugins allow you to connect arbitrary backends, precision libraries, clusters etc. For example: -To define your own behavior, subclass the relevant class and pass it in. Here’s an example linking up your own -ClusterEnvironment.

-
from pytorch_lightning.plugins.environments import ClusterEnvironment
-
-
-class MyCluster(ClusterEnvironment):
-    @property
-    def main_address(self):
-        return your_main_address
-
-    @property
-    def main_port(self):
-        return your_main_port
-
-    def world_size(self):
-        return the_world_size
-
-
-lite = Lite(plugins=[MyCluster()], ...)
-
-
-
-
-
-
-

Lightning Lite Methods

-
-

run

-

The run method serves two purposes:

-
    -
  1. Override this method from the LightningLite class and put your -training (or inference) code inside.

  2. -
  3. Launch the training procedure by calling the run method. Lite will take care of setting up the distributed backend.

  4. -
-

You can optionally pass arguments to the run method. For example, the hyperparameters or a backbone for the model.

-
from pytorch_lightning.lite import LightningLite
-
-
-class Lite(LightningLite):
-
-    # Input arguments are optional; put whatever you need
-    def run(self, learning_rate, num_layers):
-        """Here goes your training loop"""
-
-
-lite = Lite(accelerator="gpu", devices=2)
-lite.run(learning_rate=0.01, num_layers=12)
-
-
-
-
-

setup

-

Set up a model and corresponding optimizer(s). If you need to set up multiple models, call setup() on each of them. -Moves the model and optimizer to the correct device automatically.

-
model = nn.Linear(32, 64)
-optimizer = torch.optim.SGD(model.parameters(), lr=0.001)
-
-# Set up model and optimizer for accelerated training
-model, optimizer = self.setup(model, optimizer)
-
-# If you don't want Lite to set the device
-model, optimizer = self.setup(model, optimizer, move_to_device=False)
-
-
-

The setup method also prepares the model for the selected precision choice so that operations during forward() get -cast automatically.

-
-
-

setup_dataloaders

-

Set up one or multiple dataloaders for accelerated operation. If you are running a distributed strategy (e.g., DDP), Lite -replaces the sampler automatically for you. In addition, the dataloader will be configured to move the returned -data tensors to the correct device automatically.

-
train_data = torch.utils.data.DataLoader(train_dataset, ...)
-test_data = torch.utils.data.DataLoader(test_dataset, ...)
-
-train_data, test_data = self.setup_dataloaders(train_data, test_data)
-
-# If you don't want Lite to move the data to the device
-train_data, test_data = self.setup_dataloaders(train_data, test_data, move_to_device=False)
-
-# If you don't want Lite to replace the sampler in the context of distributed training
-train_data, test_data = self.setup_dataloaders(train_data, test_data, replace_sampler=False)
-
-
-
-
-

backward

-

This replaces any occurrences of loss.backward() and makes your code accelerator and precision agnostic.

-
output = model(input)
-loss = loss_fn(output, target)
-
-# loss.backward()
-self.backward(loss)
-
-
-
-
-

to_device

-

Use to_device() to move models, tensors or collections of tensors to -the current device. By default setup() and -setup_dataloaders() already move the model and data to the correct -device, so calling this method is only necessary for manual operation when needed.

-
data = torch.load("dataset.pt")
-data = self.to_device(data)
-
-
-
-
-

seed_everything

-

Make your code reproducible by calling this method at the beginning of your run.

-
# Instead of `torch.manual_seed(...)`, call:
-self.seed_everything(1234)
-
-
-

This covers PyTorch, NumPy and Python random number generators. In addition, Lite takes care of properly initializing -the seed of dataloader worker processes (can be turned off by passing workers=False).

-
-
-

autocast

-

Let the precision backend autocast the block of code under this context manager. This is optional and already done by -Lite for the model’s forward method (once the model was setup()). -You need this only if you wish to autocast more operations outside the ones in model forward:

-
model, optimizer = self.setup(model, optimizer)
-
-# Lite handles precision automatically for the model
-output = model(inputs)
-
-with self.autocast():  # optional
-    loss = loss_function(output, target)
-
-self.backward(loss)
-...
-
-
-
-
-

print

-

Print to the console via the built-in print function, but only on the main process. -This avoids excessive printing and logs when running on multiple devices/nodes.

-
# Print only on the main process
-self.print(f"{epoch}/{num_epochs}| Train Epoch Loss: {loss}")
-
-
-
-
-

save

-

Save contents to a checkpoint. Replaces all occurrences of torch.save(...) in your code. Lite will take care of -handling the saving part correctly, no matter if you are running a single device, multi-devices or multi-nodes.

-
# Instead of `torch.save(...)`, call:
-self.save(model.state_dict(), "path/to/checkpoint.ckpt")
-
-
-
-
-

load

-

Load checkpoint contents from a file. Replaces all occurrences of torch.load(...) in your code. Lite will take care of -handling the loading part correctly, no matter if you are running a single device, multi-device, or multi-node.

-
# Instead of `torch.load(...)`, call:
-self.load("path/to/checkpoint.ckpt")
-
-
-
-
-

barrier

-

Call this if you want all processes to wait and synchronize. Once all processes have entered this call, -execution continues. Useful for example when you want to download data on one process and make all others wait until -the data is written to disk.

-
# Download data only on one process
-if self.global_rank == 0:
-    download_data("http://...")
-
-# Wait until all processes meet up here
-self.barrier()
-
-# All processes are allowed to read the data now
-
-
-
-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/starter/style_guide.html b/docs/starter/style_guide.html deleted file mode 100644 index bcc555d..0000000 --- a/docs/starter/style_guide.html +++ /dev/null @@ -1,908 +0,0 @@ - - - - - - - - - - - - - - 스타일 가이드 — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • 스타일 가이드
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

스타일 가이드

-

파이토치 라이트닝(PyTorch Lightning)의 주요한 목표는 가독성과 재현성을 개선하는 것입니다. GitHub 저장소나 연구 프로젝트에서 -LightningModule을 발견했을 때, 관심 있는 부분을 찾으려면 어디를 봐야 할지 정확히 알고 있다고 상상해보세요.

-

이 스타일 가이드의 목표는 Lightning의 코드가 유사하게 구성되도록 권장하는데 있습니다.

-
-
-

LightningModule

-

These are best practices for structuring your LightningModule class:

-
-

Systems vs Models

-
-https://pl-bolts-doc-images.s3.us-east-2.amazonaws.com/pl_docs/model_system.png -
-

The main principle behind a LightningModule is that a full system should be self-contained. -In Lightning, we differentiate between a system and a model.

-

A model is something like a resnet18, RNN, and so on.

-

A system defines how a collection of models interact with each other with user-defined training/evaluation logic. Examples of this are:

-
    -
  • GANs

  • -
  • Seq2Seq

  • -
  • BERT

  • -
  • etc.

  • -
-

A LightningModule can define both a system and a model:

-

Here’s a LightningModule that defines a system. This structure is what we recommend as a best practice. Keeping the model separate from the system improves -modularity, which eventually helps in better testing, reduces dependencies on the system and makes it easier to refactor.

-
class Encoder(nn.Module):
-    ...
-
-
-class Decoder(nn.Module):
-    ...
-
-
-class AutoEncoder(nn.Module):
-    def __init__(self):
-        super().__init__()
-        self.encoder = Encoder()
-        self.decoder = Decoder()
-
-    def forward(self, x):
-        return self.encoder(x)
-
-
-class AutoEncoderSystem(LightningModule):
-    def __init__(self):
-        super().__init__()
-        self.auto_encoder = AutoEncoder()
-
-
-

For fast prototyping, it’s often useful to define all the computations in a LightningModule. For reusability -and scalability, it might be better to pass in the relevant backbones.

-

Here’s a LightningModule that defines a model. However, we do not recommend defining a model as in this example.

-
class LitModel(LightningModule):
-    def __init__(self):
-        super().__init__()
-        self.layer_1 = nn.Linear()
-        self.layer_2 = nn.Linear()
-        self.layer_3 = nn.Linear()
-
-
-
-
-

Self-contained

-

A Lightning module should be self-contained. To see how self-contained your model is, a good test is to ask -yourself this question:

-

“Can someone drop this file into a Trainer without knowing anything about the internals?”

-

For example, we couple the optimizer with a model because the majority of models require a specific optimizer with -a specific learning rate scheduler to work well.

-
-
-

Init

-

The first place where LightningModules tend to stop being self-contained is in the init. Try to define all the relevant -sensible defaults in the init so that the user doesn’t have to guess.

-

Here’s an example where a user will have to go hunt through files to figure out how to init this LightningModule.

-
class LitModel(LightningModule):
-    def __init__(self, params):
-        self.lr = params.lr
-        self.coef_x = params.coef_x
-
-
-

Models defined as such leave you with many questions, such as what is coef_x? Is it a string? A float? What is the range? -Instead, be explicit in your init

-
class LitModel(LightningModule):
-    def __init__(self, encoder: nn.Module, coef_x: float = 0.2, lr: float = 1e-3):
-        ...
-
-
-

Now the user doesn’t have to guess. Instead, they know the value type, and the model has a sensible default where the -user can see the value immediately.

-
-
-

Method Order

-

The only required methods in the LightningModule are:

-
    -
  • init

  • -
  • training_step

  • -
  • configure_optimizers

  • -
-

However, if you decide to implement the rest of the optional methods, the recommended order is:

-
    -
  • model/system definition (init)

  • -
  • if doing inference, define forward

  • -
  • training hooks

  • -
  • validation hooks

  • -
  • test hooks

  • -
  • predict hooks

  • -
  • configure_optimizers

  • -
  • any other hooks

  • -
-

In practice, the code looks like this:

-
class LitModel(pl.LightningModule):
-
-    def __init__(...):
-
-    def forward(...):
-
-    def training_step(...):
-
-    def training_step_end(...):
-
-    def training_epoch_end(...):
-
-    def validation_step(...):
-
-    def validation_step_end(...):
-
-    def validation_epoch_end(...):
-
-    def test_step(...):
-
-    def test_step_end(...):
-
-    def test_epoch_end(...):
-
-    def configure_optimizers(...):
-
-    def any_extra_hook(...):
-
-
-
-
-

Forward vs training_step

-

We recommend using forward() for inference/predictions and keeping -training_step() independent.

-
def forward(self, x):
-    embeddings = self.encoder(x)
-    return embeddings
-
-
-def training_step(self, batch, batch_idx):
-    x, _ = batch
-    z = self.encoder(x)
-    pred = self.decoder(z)
-    ...
-
-
-
-
-
-
-

Data

-

These are best practices for handling data.

-
-

DataLoaders

-

Lightning uses DataLoader to handle all the data flow through the system. Whenever you structure dataloaders, -make sure to tune the number of workers for maximum efficiency.

-
-

Warning

-

Make sure not to use Trainer(strategy="ddp_spawn") with num_workers>0 in the DataLoader or you will bottleneck your code.

-
-
-
-

DataModules

-

The LightningDataModule is designed as a way of decoupling data-related -hooks from the LightningModule so you can develop dataset agnostic models. It makes it easy to hot swap different -datasets with your model, so you can test it and benchmark it across domains. It also makes sharing and reusing the exact data splits and transforms across projects possible.

-

Check out the Managing Data document to understand data management within Lightning and its best practices. When data handling is not kept in one place, it is often hard to answer questions such as:

-
    -
  • What dataset splits were used?

  • -
  • How many samples does this dataset have overall and within each split?

  • -
  • Which transforms were used?

  • -
-

It’s for this reason that we recommend you use datamodules. This is especially important when collaborating because -it will save your team a lot of time as well.

-

All they need to do is drop a datamodule into the Trainer and not worry about what was done to the data.

-

This is true for both academic and corporate settings where data cleaning and ad-hoc instructions slow down the progress -of iterating through ideas.

- -
-
-
- - -
- -
-
- - - - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/tuning/profiler.html b/docs/tuning/profiler.html deleted file mode 100644 index 1bb3f0b..0000000 --- a/docs/tuning/profiler.html +++ /dev/null @@ -1,741 +0,0 @@ - - - - - - - - - - - - - - Find bottlenecks in your code — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Find bottlenecks in your code
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
- - -
-
- - - - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/tuning/profiler_advanced.html b/docs/tuning/profiler_advanced.html deleted file mode 100644 index 13cf507..0000000 --- a/docs/tuning/profiler_advanced.html +++ /dev/null @@ -1,754 +0,0 @@ - - - - - - - - - - - - - - Find bottlenecks in your code (advanced) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Find bottlenecks in your code (advanced)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Find bottlenecks in your code (advanced)

-

Audience: Users who want to profile their TPU models to find bottlenecks and improve performance.

-
-
-

Profile cloud TPU models

-

To profile TPU models use the XLAProfiler

-
from pytorch_lightning.profiler import XLAProfiler
-
-profiler = XLAProfiler(port=9001)
-trainer = Trainer(profiler=profiler)
-
-
-
-
-
-

Capture profiling logs in Tensorboard

-

To capture profile logs in Tensorboard, follow these instructions:

-
-
-

0: Set up the required installs

-

Use this guide to help you with the Cloud TPU required installations.

-
-
-
-

1: Start Tensorboard

-

Start the TensorBoard server:

-
tensorboard --logdir ./tensorboard --port 9001
-
-
-

Now open the following URL in your browser:

-
http://localhost:9001/#profile
-
-
-
-
-
-

2: Capture the profile

-

Once the code you want to profile is running:

-
    -
  1. Click on the CAPTURE PROFILE button.

  2. -
  3. Enter localhost:9001 (default port for XLA Profiler) as the Profile Service URL.

  4. -
  5. Enter the number of milliseconds for the profiling duration

  6. -
  7. Click CAPTURE

  8. -
-
-
-
-

3: Don’t stop your code

-

Make sure the code is running while you are trying to capture the traces. It will lead to better performance insights if the profiling duration is longer than the step time.

-
-
-
-

4: View the profiling logs

-

Once the capture is finished, the page will refresh and you can browse through the insights using the Tools dropdown at the top left

-
-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/tuning/profiler_basic.html b/docs/tuning/profiler_basic.html deleted file mode 100644 index 835cbfd..0000000 --- a/docs/tuning/profiler_basic.html +++ /dev/null @@ -1,789 +0,0 @@ - - - - - - - - - - - - - - Find bottlenecks in your code (basic) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Find bottlenecks in your code (basic)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Find bottlenecks in your code (basic)

-

Audience: Users who want to learn the basics of removing bottlenecks from their code

-
-
-

Why do I need profiling?

-

Profiling helps you find bottlenecks in your code by capturing analytics such as how long a function takes or how much memory is used.

-
-
-
-

Find training loop bottlenecks

-

The most basic profile measures all the key methods across Callbacks, DataModules and the LightningModule in the training loop.

-
trainer = Trainer(profiler="simple")
-
-
-

Once the .fit() function has completed, you’ll see an output like this:

-
FIT Profiler Report
-
------------------------------------------------------------------------------------------------
-|  Action                                          |  Mean duration (s)     |  Total time (s) |
------------------------------------------------------------------------------------------------
-|  [LightningModule]BoringModel.prepare_data       |  10.0001               |  20.00          |
-|  run_training_epoch                              |  6.1558                |  6.1558         |
-|  run_training_batch                              |  0.0022506             |  0.015754       |
-|  [LightningModule]BoringModel.optimizer_step     |  0.0017477             |  0.012234       |
-|  [LightningModule]BoringModel.val_dataloader     |  0.00024388            |  0.00024388     |
-|  on_train_batch_start                            |  0.00014637            |  0.0010246      |
-|  [LightningModule]BoringModel.teardown           |  2.15e-06              |  2.15e-06       |
-|  [LightningModule]BoringModel.on_train_start     |  1.644e-06             |  1.644e-06      |
-|  [LightningModule]BoringModel.on_train_end       |  1.516e-06             |  1.516e-06      |
-|  [LightningModule]BoringModel.on_fit_end         |  1.426e-06             |  1.426e-06      |
-|  [LightningModule]BoringModel.setup              |  1.403e-06             |  1.403e-06      |
-|  [LightningModule]BoringModel.on_fit_start       |  1.226e-06             |  1.226e-06      |
------------------------------------------------------------------------------------------------
-
-
-

In this report we can see that the slowest function is prepare_data. Now you can figure out why data preparation is slowing down your training.

-

The simple profiler measures all the standard methods used in the training loop automatically, including:

-
    -
  • on_train_epoch_start

  • -
  • on_train_epoch_end

  • -
  • on_train_batch_start

  • -
  • model_backward

  • -
  • on_after_backward

  • -
  • optimizer_step

  • -
  • on_train_batch_end

  • -
  • training_step_end

  • -
  • on_training_end

  • -
  • etc…

  • -
-
-
-
-

Profile the time within every function

-

To profile the time within every function, use the AdvancedProfiler built on top of Python’s cProfile.

-
trainer = Trainer(profiler="advanced")
-
-
-

Once the .fit() function has completed, you’ll see an output like this:

-
Profiler Report
-
-Profile stats for: get_train_batch
-        4869394 function calls (4863767 primitive calls) in 18.893 seconds
-Ordered by: cumulative time
-List reduced from 76 to 10 due to restriction <10>
-ncalls  tottime  percall  cumtime  percall filename:lineno(function)
-3752/1876    0.011    0.000   18.887    0.010 {built-in method builtins.next}
-    1876     0.008    0.000   18.877    0.010 dataloader.py:344(__next__)
-    1876     0.074    0.000   18.869    0.010 dataloader.py:383(_next_data)
-    1875     0.012    0.000   18.721    0.010 fetch.py:42(fetch)
-    1875     0.084    0.000   18.290    0.010 fetch.py:44(<listcomp>)
-    60000    1.759    0.000   18.206    0.000 mnist.py:80(__getitem__)
-    60000    0.267    0.000   13.022    0.000 transforms.py:68(__call__)
-    60000    0.182    0.000    7.020    0.000 transforms.py:93(__call__)
-    60000    1.651    0.000    6.839    0.000 functional.py:42(to_tensor)
-    60000    0.260    0.000    5.734    0.000 transforms.py:167(__call__)
-
-
-

If the profiler report becomes too long, you can stream the report to a file:

-
from pytorch_lightning.profiler import AdvancedProfiler
-
-profiler = AdvancedProfiler(dirpath=".", filename="perf_logs")
-trainer = Trainer(profiler=profiler)
-
-
-
-
-
-

Measure accelerator usage

-

Another helpful technique to detect bottlenecks is to ensure that you’re using the full capacity of your accelerator (GPU/TPU/IPU/HPU). -This can be measured with the DeviceStatsMonitor:

-
from pytorch_lightning.callbacks import DeviceStatsMonitor
-
-trainer = Trainer(callbacks=[DeviceStatsMonitor()])
-
-
-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/tuning/profiler_expert.html b/docs/tuning/profiler_expert.html deleted file mode 100644 index 49b19e5..0000000 --- a/docs/tuning/profiler_expert.html +++ /dev/null @@ -1,782 +0,0 @@ - - - - - - - - - - - - - - Find bottlenecks in your code (expert) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Find bottlenecks in your code (expert)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Find bottlenecks in your code (expert)

-

Audience: Users who want to build their own profilers.

-
-
-

Build your own profiler

-

To build your own profiler, subclass Profiler -and override some of its methods. Here is a simple example that profiles the first occurrence and total calls of each action:

-
from pytorch_lightning.profiler import Profiler
-from collections import defaultdict
-import time
-
-
-class ActionCountProfiler(Profiler):
-    def __init__(self, dirpath=None, filename=None):
-        super().__init__(dirpath=dirpath, filename=filename)
-        self._action_count = defaultdict(int)
-        self._action_first_occurrence = {}
-
-    def start(self, action_name):
-        if action_name not in self._action_first_occurrence:
-            self._action_first_occurrence[action_name] = time.strftime("%m/%d/%Y, %H:%M:%S")
-
-    def stop(self, action_name):
-        self._action_count[action_name] += 1
-
-    def summary(self):
-        res = f"\nProfile Summary: \n"
-        max_len = max(len(x) for x in self._action_count)
-
-        for action_name in self._action_count:
-            # generate summary for actions called more than once
-            if self._action_count[action_name] > 1:
-                res += (
-                    f"{action_name:<{max_len}s} \t "
-                    + f"{self._action_first_occurrence[action_name]} \t "
-                    + f"{self._action_count[action_name]} \n"
-                )
-
-        return res
-
-    def teardown(self, stage):
-        self._action_count = {}
-        self._action_first_occurrence = {}
-        super().teardown(stage=stage)
-
-
-
trainer = Trainer(profiler=ActionCountProfiler())
-trainer.fit(...)
-
-
-
-
-
-

Profile custom actions of interest

-

To profile a specific action of interest, reference a profiler in the LightningModule.

-
from pytorch_lightning.profiler import SimpleProfiler, PassThroughProfiler
-
-
-class MyModel(LightningModule):
-    def __init__(self, profiler=None):
-        self.profiler = profiler or PassThroughProfiler()
-
-
-

To profile in any part of your code, use the self.profiler.profile() function

-
class MyModel(LightningModule):
-    def custom_processing_step(self, data):
-        with self.profiler.profile("my_custom_action"):
-            ...
-        return data
-
-
-

Here’s the full code:

-
from pytorch_lightning.profiler import SimpleProfiler, PassThroughProfiler
-
-
-class MyModel(LightningModule):
-    def __init__(self, profiler=None):
-        self.profiler = profiler or PassThroughProfiler()
-
-    def custom_processing_step(self, data):
-        with self.profiler.profile("my_custom_action"):
-            ...
-        return data
-
-
-profiler = SimpleProfiler()
-model = MyModel(profiler)
-trainer = Trainer(profiler=profiler, max_epochs=1)
-
-
-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/tuning/profiler_intermediate.html b/docs/tuning/profiler_intermediate.html deleted file mode 100644 index 9c09f2e..0000000 --- a/docs/tuning/profiler_intermediate.html +++ /dev/null @@ -1,848 +0,0 @@ - - - - - - - - - - - - - - Find bottlenecks in your code (intermediate) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Find bottlenecks in your code (intermediate)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Find bottlenecks in your code (intermediate)

-

Audience: Users who want to see more granular profiling information

-
-
-

Profile pytorch operations

-

To understand the cost of each PyTorch operation, use the PyTorchProfiler built on top of the PyTorch profiler.

-
from pytorch_lightning.profiler import PyTorchProfiler
-
-profiler = PyTorchProfiler()
-trainer = Trainer(profiler=profiler)
-
-
-

The profiler will generate an output like this:

-
Profiler Report
-
-Profile stats for: training_step
----------------------  ---------------  ---------------  ---------------  ---------------  ---------------
-Name                   Self CPU total %  Self CPU total   CPU total %      CPU total        CPU time avg
----------------------  ---------------  ---------------  ---------------  ---------------  ---------------
-t                      62.10%           1.044ms          62.77%           1.055ms          1.055ms
-addmm                  32.32%           543.135us        32.69%           549.362us        549.362us
-mse_loss               1.35%            22.657us         3.58%            60.105us         60.105us
-mean                   0.22%            3.694us          2.05%            34.523us         34.523us
-div_                   0.64%            10.756us         1.90%            32.001us         16.000us
-ones_like              0.21%            3.461us          0.81%            13.669us         13.669us
-sum_out                0.45%            7.638us          0.74%            12.432us         12.432us
-transpose              0.23%            3.786us          0.68%            11.393us         11.393us
-as_strided             0.60%            10.060us         0.60%            10.060us         3.353us
-to                     0.18%            3.059us          0.44%            7.464us          7.464us
-empty_like             0.14%            2.387us          0.41%            6.859us          6.859us
-empty_strided          0.38%            6.351us          0.38%            6.351us          3.175us
-fill_                  0.28%            4.782us          0.33%            5.566us          2.783us
-expand                 0.20%            3.336us          0.28%            4.743us          4.743us
-empty                  0.27%            4.456us          0.27%            4.456us          2.228us
-copy_                  0.15%            2.526us          0.15%            2.526us          2.526us
-broadcast_tensors      0.15%            2.492us          0.15%            2.492us          2.492us
-size                   0.06%            0.967us          0.06%            0.967us          0.484us
-is_complex             0.06%            0.961us          0.06%            0.961us          0.481us
-stride                 0.03%            0.517us          0.03%            0.517us          0.517us
----------------------  ---------------  ---------------  ---------------  ---------------  ---------------
-Self CPU time total: 1.681ms
-
-
-
-

Note

-

When using the PyTorch Profiler, wall clock time will not be representative of the true wall clock time. -This is due to forcing profiled operations to be measured synchronously, when many CUDA ops happen asynchronously. -It is recommended to use this Profiler to find bottlenecks/breakdowns; however, for end-to-end wall clock time, use -the SimpleProfiler.

-
-
-
-
-

Profile a distributed model

-

To profile a distributed model, use the PyTorchProfiler with the filename argument which will save a report per rank.

-
from pytorch_lightning.profiler import PyTorchProfiler
-
-profiler = PyTorchProfiler(filename="perf-logs")
-trainer = Trainer(profiler=profiler)
-
-
-

With two ranks, it will generate a report like so:

-
Profiler Report: rank 0
-
-Profile stats for: training_step
----------------------  ---------------  ---------------  ---------------  ---------------  ---------------
-Name                   Self CPU total %  Self CPU total   CPU total %      CPU total        CPU time avg
----------------------  ---------------  ---------------  ---------------  ---------------  ---------------
-t                      62.10%           1.044ms          62.77%           1.055ms          1.055ms
-addmm                  32.32%           543.135us        32.69%           549.362us        549.362us
-mse_loss               1.35%            22.657us         3.58%            60.105us         60.105us
-mean                   0.22%            3.694us          2.05%            34.523us         34.523us
-div_                   0.64%            10.756us         1.90%            32.001us         16.000us
-ones_like              0.21%            3.461us          0.81%            13.669us         13.669us
-sum_out                0.45%            7.638us          0.74%            12.432us         12.432us
-transpose              0.23%            3.786us          0.68%            11.393us         11.393us
-as_strided             0.60%            10.060us         0.60%            10.060us         3.353us
-to                     0.18%            3.059us          0.44%            7.464us          7.464us
-empty_like             0.14%            2.387us          0.41%            6.859us          6.859us
-empty_strided          0.38%            6.351us          0.38%            6.351us          3.175us
-fill_                  0.28%            4.782us          0.33%            5.566us          2.783us
-expand                 0.20%            3.336us          0.28%            4.743us          4.743us
-empty                  0.27%            4.456us          0.27%            4.456us          2.228us
-copy_                  0.15%            2.526us          0.15%            2.526us          2.526us
-broadcast_tensors      0.15%            2.492us          0.15%            2.492us          2.492us
-size                   0.06%            0.967us          0.06%            0.967us          0.484us
-is_complex             0.06%            0.961us          0.06%            0.961us          0.481us
-stride                 0.03%            0.517us          0.03%            0.517us          0.517us
----------------------  ---------------  ---------------  ---------------  ---------------  ---------------
-Self CPU time total: 1.681ms
-
-
-
Profiler Report: rank 1
-
-Profile stats for: training_step
----------------------  ---------------  ---------------  ---------------  ---------------  ---------------
-Name                   Self CPU total %  Self CPU total   CPU total %      CPU total        CPU time avg
----------------------  ---------------  ---------------  ---------------  ---------------  ---------------
-t                      42.10%           1.044ms          62.77%           1.055ms          1.055ms
-addmm                  32.32%           543.135us        32.69%           549.362us        549.362us
-mse_loss               1.35%            22.657us         3.58%            60.105us         60.105us
-mean                   0.22%            3.694us          2.05%            34.523us         34.523us
-div_                   0.64%            10.756us         1.90%            32.001us         16.000us
-ones_like              0.21%            3.461us          0.81%            13.669us         13.669us
-sum_out                0.45%            7.638us          0.74%            12.432us         12.432us
-transpose              0.23%            3.786us          0.68%            11.393us         11.393us
-as_strided             0.60%            10.060us         0.60%            10.060us         3.353us
-to                     0.18%            3.059us          0.44%            7.464us          7.464us
-empty_like             0.14%            2.387us          0.41%            6.859us          6.859us
-empty_strided          0.38%            6.351us          0.38%            6.351us          3.175us
-fill_                  0.28%            4.782us          0.33%            5.566us          2.783us
-expand                 0.20%            3.336us          0.28%            4.743us          4.743us
-empty                  0.27%            4.456us          0.27%            4.456us          2.228us
-copy_                  0.15%            2.526us          0.15%            2.526us          2.526us
-broadcast_tensors      0.15%            2.492us          0.15%            2.492us          2.492us
-size                   0.06%            0.967us          0.06%            0.967us          0.484us
-is_complex             0.06%            0.961us          0.06%            0.961us          0.481us
-stride                 0.03%            0.517us          0.03%            0.517us          0.517us
----------------------  ---------------  ---------------  ---------------  ---------------  ---------------
-Self CPU time total: 1.681ms
-
-
-

This profiler will record training_step, backward, validation_step, test_step, and predict_step by default. -The output below shows the profiling for the action training_step. The user can provide PyTorchProfiler(record_functions={...}) -to extend the scope of profiled functions.

-
-

Note

-

When using the PyTorch Profiler, wall clock time will not be representative of the true wall clock time. -This is due to forcing profiled operations to be measured synchronously, when many CUDA ops happen asynchronously. -It is recommended to use this Profiler to find bottlenecks/breakdowns; however, for end-to-end wall clock time use -the SimpleProfiler.

-
-
-
-
-

Visualize profiled operations

-

To visualize the profiled operations, enable emit_nvtx in the PyTorchProfiler.

-
from pytorch_lightning.profiler import PyTorchProfiler
-
-profiler = PyTorchProfiler(emit_nvtx=True)
-trainer = Trainer(profiler=profiler)
-
-
-

Then run as follows:

-
nvprof --profile-from-start off -o trace_name.prof -- <regular command here>
-
-
-

To visualize the profiled operation, you can either use nvvp:

-
nvvp trace_name.prof
-
-
-

or python:

-
python -c 'import torch; print(torch.autograd.profiler.load_nvprof("trace_name.prof"))'
-
-
-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/visualize/experiment_managers.html b/docs/visualize/experiment_managers.html deleted file mode 100644 index 37ad539..0000000 --- a/docs/visualize/experiment_managers.html +++ /dev/null @@ -1,881 +0,0 @@ - - - - - - - - - - - - - - Manage Experiments — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Manage Experiments
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Manage Experiments

-

To track other artifacts, such as histograms or model topology graphs first select one of the many experiment managers (loggers) supported by Lightning

-
from pytorch_lightning import loggers as pl_loggers
-
-tensorboard = pl_loggers.TensorBoardLogger()
-trainer = Trainer(logger=tensorboard)
-
-
-

then access the logger’s API directly

-
def training_step(self):
-    tensorboard = self.logger.experiment
-    tensorboard.add_image()
-    tensorboard.add_histogram(...)
-    tensorboard.add_figure(...)
-
-
-
-
-

Comet.ml

-

To use Comet.ml first install the comet package:

-
pip install comet-ml
-
-
-

Configure the logger and pass it to the Trainer:

-
from pytorch_lightning.loggers import CometLogger
-
-comet_logger = CometLogger(api_key="YOUR_COMET_API_KEY")
-trainer = Trainer(logger=comet_logger)
-
-
-

Access the comet logger from any function (except the LightningModule init) to use its API for tracking advanced artifacts

-
class LitModel(LightningModule):
-    def any_lightning_module_function_or_hook(self):
-        comet = self.logger.experiment
-        fake_images = torch.Tensor(32, 3, 28, 28)
-        comet.add_image("generated_images", fake_images, 0)
-
-
-

Here’s the full documentation for the CometLogger.

-
-
-
-

MLflow

-

To use MLflow first install the MLflow package:

-
pip install mlflow
-
-
-

Configure the logger and pass it to the Trainer:

-
from pytorch_lightning.loggers import MLFlowLogger
-
-mlf_logger = MLFlowLogger(experiment_name="lightning_logs", tracking_uri="file:./ml-runs")
-trainer = Trainer(logger=mlf_logger)
-
-
-

Access the MLflow logger from any function (except the LightningModule init) to use its API for tracking advanced artifacts

-
class LitModel(LightningModule):
-    def any_lightning_module_function_or_hook(self):
-        mlf_logger = self.logger.experiment
-        fake_images = torch.Tensor(32, 3, 28, 28)
-        mlf_logger.add_image("generated_images", fake_images, 0)
-
-
-

Here’s the full documentation for the MLFlowLogger.

-
-
-
-

Neptune.ai

-

To use Neptune.ai first install the neptune package:

-
pip install neptune-client
-
-
-

or with conda:

-
conda install -c conda-forge neptune-client
-
-
-

Configure the logger and pass it to the Trainer:

-
from pytorch_lightning.loggers import NeptuneLogger
-
-neptune_logger = NeptuneLogger(
-    api_key="ANONYMOUS",  # replace with your own
-    project="common/pytorch-lightning-integration",  # format "<WORKSPACE/PROJECT>"
-)
-trainer = Trainer(logger=neptune_logger)
-
-
-

Access the neptune logger from any function (except the LightningModule init) to use its API for tracking advanced artifacts

-
class LitModel(LightningModule):
-    def any_lightning_module_function_or_hook(self):
-        neptune_logger = self.logger.experiment["your/metadata/structure"]
-        neptune_logger.log(metadata)
-
-
-

Here’s the full documentation for the NeptuneLogger.

-
-
-
-

Tensorboard

-

TensorBoard already comes installed with Lightning. If you removed it, install the following package.

-
pip install tensorboard
-
-
-

Configure the logger and pass it to the Trainer:

-
from pytorch_lightning.loggers import TensorBoardLogger
-
-logger = TensorBoardLogger()
-trainer = Trainer(logger=logger)
-
-
-

Access the tensorboard logger from any function (except the LightningModule init) to use its API for tracking advanced artifacts

-
class LitModel(LightningModule):
-    def any_lightning_module_function_or_hook(self):
-        tensorboard_logger = self.logger.experiment
-        fake_images = torch.Tensor(32, 3, 28, 28)
-        tensorboard_logger.add_image("generated_images", fake_images, 0)
-
-
-

Here’s the full documentation for the TensorBoardLogger.

-
-
-
-

Weights and Biases

-

To use Weights and Biases (wandb) first install the wandb package:

-
pip install wandb
-
-
-

Configure the logger and pass it to the Trainer:

-
from pytorch_lightning.loggers import WandbLogger
-
-wandb_logger = WandbLogger(project="MNIST", log_model="all")
-trainer = Trainer(logger=wandb_logger)
-
-# log gradients and model topology
-wandb_logger.watch(model)
-
-
-

Access the wandb logger from any function (except the LightningModule init) to use its API for tracking advanced artifacts

-
class MyModule(LightningModule):
-    def any_lightning_module_function_or_hook(self):
-        wandb_logger = self.logger.experiment
-        fake_images = torch.Tensor(32, 3, 28, 28)
-
-        # Option 1
-        wandb_logger.log({"generated_images": [wandb.Image(fake_images, caption="...")]})
-
-        # Option 2 for specifically logging images
-        wandb_logger.log_image(key="generated_images", images=[fake_images])
-
-
-

Here’s the full documentation for the WandbLogger. -Demo in Google Colab with hyperparameter search and model logging.

-
-
-
-

Use multiple exp managers

-

To use multiple experiment managers at the same time, pass a list to the logger Trainer argument.

-
from pytorch_lightning.loggers import TensorBoardLogger, WandbLogger
-
-logger1 = TensorBoardLogger()
-logger2 = WandbLogger()
-trainer = Trainer(logger=[logger1, logger2])
-
-
-

Access all loggers from any function (except the LightningModule init) to use their APIs for tracking advanced artifacts

-
class MyModule(LightningModule):
-    def any_lightning_module_function_or_hook(self):
-        tensorboard_logger = self.logger.experiment[0]
-        wandb_logger = self.logger.experiment[1]
-
-        fake_images = torch.Tensor(32, 3, 28, 28)
-
-        tensorboard_logger.add_image("generated_images", fake_images, 0)
-        wandb_logger.add_image("generated_images", fake_images, 0)
-
-
-
-
- - -
- -
-
- - - - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/visualize/loggers.html b/docs/visualize/loggers.html deleted file mode 100644 index 5fa0bc1..0000000 --- a/docs/visualize/loggers.html +++ /dev/null @@ -1,751 +0,0 @@ - - - - - - - - - - - - - - Track and Visualize Experiments — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Track and Visualize Experiments
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
- - - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/visualize/logging_advanced.html b/docs/visualize/logging_advanced.html deleted file mode 100644 index d6800b2..0000000 --- a/docs/visualize/logging_advanced.html +++ /dev/null @@ -1,1044 +0,0 @@ - - - - - - - - - - - - - - Track and Visualize Experiments (advanced) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Track and Visualize Experiments (advanced)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Track and Visualize Experiments (advanced)

-

Audience: Users who want to do advanced speed optimizations by customizing the logging behavior.

-
-
-

Change progress bar defaults

-

To change the default values (e.g., the version number) shown in the progress bar, override the get_metrics() method of your progress bar.

-
from pytorch_lightning.callbacks.progress import Tqdm
-
-
-class CustomProgressBar(Tqdm):
-    def get_metrics(self, *args, **kwargs):
-        # don't show the version number
-        items = super().get_metrics()
-        items.pop("v_num", None)
-        return items
-
-
-
-
-
-

Customize tracking to speed up model

-
-

Modify logging frequency

-

Logging a metric on every single batch can slow down training. By default, Lightning logs every 50 rows, or 50 training steps. -To change this behaviour, set the log_every_n_steps Trainer flag.

-
k = 10
-trainer = Trainer(log_every_n_steps=k)
-
-
-
-
-
-

Modify flushing frequency

-

Metrics are kept in memory for N steps to improve training efficiency. Every N steps, metrics flush to disk. To change the frequency of this flushing, use the flush_logs_every_n_steps Trainer argument.

-
# faster training, high memory
-Trainer(flush_logs_every_n_steps=500)
-
-# slower training, low memory
-Trainer(flush_logs_every_n_steps=10)
-
-
-

The higher flush_logs_every_n_steps is, the faster the model will train but the memory will build up until the next flush. -The smaller flush_logs_every_n_steps is, the slower the model will train but memory will be kept to a minimum.

-

TODO: chart

-
-
-
-
-

Customize self.log

-

The LightningModule self.log method offers many configurations to customize its behavior.

-
-
-

add_dataloader_idx

-

Default: True

-

If True, appends the index of the current dataloader to the name (when using multiple dataloaders). If False, user needs to give unique names for each dataloader to not mix the values.

-
self.log(add_dataloader_idx=True)
-
-
-
-
-
-

batch_size

-

Default: None

-

Current batch size used for accumulating logs logged with on_epoch=True. This will be directly inferred from the loaded batch, but for some data structures you might need to explicitly provide it.

-
self.log(batch_size=32)
-
-
-
-
-
-

enable_graph

-

Default: True

-

If True, will not auto detach the graph.

-
self.log(enable_graph=True)
-
-
-
-
-
-

logger

-

Default: True

-

Send logs to the logger like Tensorboard, or any other custom logger passed to the Trainer (Default: True).

-
self.log(logger=True)
-
-
-
-
-
-

on_epoch

-

Default: It varies

-

If this is True, that specific self.log call accumulates and reduces all metrics to the end of the epoch.

-
self.log(on_epoch=True)
-
-
-

The default value depends on which function this is called in

-
def training_step(self, batch, batch_idx):
-    # Default: False
-    self.log(on_epoch=False)
-
-
-def validation_step(self, batch, batch_idx):
-    # Default: True
-    self.log(on_epoch=True)
-
-
-def test_step(self, batch, batch_idx):
-    # Default: True
-    self.log(on_epoch=True)
-
-
-
-
-
-

on_step

-

Default: It varies

-

If this is True, that specific self.log call will NOT accumulate metrics. Instead it will generate a timeseries across steps.

-
self.log(on_step=True)
-
-
-

The default value depends on which function this is called in

-
def training_step(self, batch, batch_idx):
-    # Default: True
-    self.log(on_step=True)
-
-
-def validation_step(self, batch, batch_idx):
-    # Default: False
-    self.log(on_step=False)
-
-
-def test_step(self, batch, batch_idx):
-    # Default: False
-    self.log(on_step=False)
-
-
-
-
-
-

prog_bar

-

Default: False

-

If set to True, logs will be sent to the progress bar.

-
self.log(prog_bar=True)
-
-
-
-
-
-

rank_zero_only

-

Default: True

-

Whether the value will be logged only on rank 0. This will prevent synchronization which would produce a deadlock as not all processes would perform this log call.

-
self.log(rank_zero_only=True)
-
-
-
-
-
-

reduce_fx

-

Default: torch.mean()

-

Reduction function over step values for end of epoch. Uses torch.mean() by default.

-
self.log(reduce_fx=torch.mean)
-
-
-
-
-
-

sync_dist

-

Default: False

-

If True, reduces the metric across devices. Use with care as this may lead to a significant communication overhead.

-
self.log(sync_dist=False)
-
-
-
-
-
-

sync_dist_group

-

Default: None

-

The DDP group to sync across.

-
import torch.distributed as dist
-
-group = dist.init_process_group("nccl", rank=self.global_rank, world_size=self.world_size)
-self.log(sync_dist_group=group)
-
-
-
-
-
-
-

Enable metrics for distributed training

-

For certain types of metrics that need complex aggregation, we recommend building your metric using torchmetrics, which ensures that all the complexities of metric aggregation in distributed environments are handled.

-

First, implement your metric:

-
import torch
-import torchmetrics
-
-
-class MyAccuracy(Metric):
-    def __init__(self, dist_sync_on_step=False):
-        # call `self.add_state`for every internal state that is needed for the metrics computations
-        # dist_reduce_fx indicates the function that should be used to reduce
-        # state from multiple processes
-        super().__init__(dist_sync_on_step=dist_sync_on_step)
-
-        self.add_state("correct", default=torch.tensor(0), dist_reduce_fx="sum")
-        self.add_state("total", default=torch.tensor(0), dist_reduce_fx="sum")
-
-    def update(self, preds: torch.Tensor, target: torch.Tensor):
-        # update metric states
-        preds, target = self._input_format(preds, target)
-        assert preds.shape == target.shape
-
-        self.correct += torch.sum(preds == target)
-        self.total += target.numel()
-
-    def compute(self):
-        # compute final result
-        return self.correct.float() / self.total
-
-
-

To use the metric inside Lightning, 1) initialize it in the init, 2) compute the metric, 3) pass it into self.log

-
class LitModel(LightningModule):
-    def __init__(self):
-        # 1. initialize the metric
-        self.accuracy = MyAccuracy()
-
-    def training_step(self, batch, batch_idx):
-        x, y = batch
-        preds = self(x)
-
-        # 2. compute the metric
-        self.accuracy(preds, y)
-
-        # 3. log it
-        self.log("train_acc_step", self.accuracy)
-
-
-
-
-
-

Log to a custom cloud filesystem

-

Lightning is integrated with the major remote file systems including local filesystems and several cloud storage providers such as -S3 on AWS, GCS on Google Cloud, -or ADL on Azure.

-

PyTorch Lightning uses fsspec internally to handle all filesystem operations.

-

To save logs to a remote filesystem, prepend a protocol like “s3://” to the root_dir used for writing and reading model data.

-
from pytorch_lightning.loggers import TensorBoardLogger
-
-logger = TensorBoardLogger(save_dir="s3://my_bucket/logs/")
-
-trainer = Trainer(logger=logger)
-trainer.fit(model)
-
-
-
-
-
-

Track both step and epoch metrics

-

To track the timeseries over steps (on_step) as well as the accumulated epoch metric (on_epoch), set both to True

-
self.log(on_step=True, on_epoch=True)
-
-
-

Setting both to True will generate two graphs with _step for the timeseries over steps and _epoch for the epoch metric.

-

# TODO: show images of both

-
-
-
-

Understand self.log automatic behavior

-

This table shows the default values of on_step and on_epoch depending on the LightningModule or Callback method.

-
-
-

In LightningModule

- - ----- - - - - - - - - - - - - - - - - -
Default behavior of logging in LightningModule

Method

on_step

on_epoch

on_after_backward, on_before_backward, on_before_optimizer_step, on_before_zero_grad, training_step, training_step_end

True

False

training_epoch_end, test_epoch_end, test_step, test_step_end, validation_epoch_end, validation_step, validation_step_end

False

True

-
-
-
-

In Callback

- - ----- - - - - - - - - - - - - - - - - -
Default behavior of logging in Callback

Method

on_step

on_epoch

on_after_backward, on_before_backward, on_before_optimizer_step, on_before_zero_grad, on_train_batch_start, on_train_batch_end

True

False

on_train_epoch_start, on_train_epoch_end, on_train_start, on_validation_batch_start, on_validation_batch_end, on_validation_start, on_validation_epoch_start, on_validation_epoch_end

False

True

-
-

Note

-

To add logging to an unsupported method, please open an issue with a clear description of why it is blocking you.

-
-
-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/visualize/logging_basic.html b/docs/visualize/logging_basic.html deleted file mode 100644 index de65446..0000000 --- a/docs/visualize/logging_basic.html +++ /dev/null @@ -1,800 +0,0 @@ - - - - - - - - - - - - - - Track and Visualize Experiments (basic) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Track and Visualize Experiments (basic)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Track and Visualize Experiments (basic)

-

Audience: Users who want to visualize and monitor their model development

-
-
-

Why do I need to track metrics?

-

In model development, we track values of interest such as the validation_loss to visualize the learning process for our models. Model development is like driving a car without windows; charts and logs provide the windows to know where to drive the car.

-

With Lightning, you can visualize virtually anything you can think of: numbers, text, images, audio. Your creativity and imagination are the only limiting factor.

-
-
-
-

Track metrics

-

Metric visualization is the most basic but powerful way of understanding how your model is doing throughout the model development process.

-

To track a metric, simply use the self.log method available inside the LightningModule

-
class LitModel(pl.LightningModule):
-    def training_step(self, batch, batch_idx):
-        value = self.global_step
-        self.log("some_value", self.global_step)
-
-
-

To log multiple metrics at once, use self.log_dict

-
values = {"loss": loss, "acc": acc, "metric_n": metric_n}  # add more items if needed
-self.log_dict(values)
-
-
-

TODO: show plot of metric changing over time

-
-
-

View in the commandline

-

To view metrics in the commandline progress bar, set the prog_bar argument to True.

-
self.log(prog_bar=True)
-
-
-

TODO: need progress bar here

-
-
-
-

View in the browser

-

To view metrics in the browser you need to use an experiment manager with these capabilities. By default, Lightning uses TensorBoard, which is free and open source.

-

Tensorboard is already enabled by default

-
# every trainer already has tensorboard enabled by default
-trainer = Trainer()
-
-
-

To launch the tensorboard dashboard run the following command on the commandline.

-
tensorboard --logdir=lightning_logs/
-
-
-

If you’re using a notebook environment such as colab or kaggle or jupyter, launch Tensorboard with this command

-
%reload_ext tensorboard
-%tensorboard --logdir=lightning_logs/
-
-
-
-
-
-

Accumulate a metric

-

When self.log is called inside the training_step, it generates a timeseries showing how the metric behaves over time.

-

TODO: show chart

-

However, for the validation and test sets we are not generally interested in plotting the metric values per batch of data. Instead, we want to compute a summary statistic (such as average, min or max) across the full split of data.

-

When you call self.log inside the validation_step and test_step, Lightning automatically accumulates the metric and averages it once it’s gone through the whole split (epoch).

-
def validation_step(self, batch, batch_idx):
-    value = batch_idx + 1
-    self.log("average_value", value)
-
-
-

TODO: show single point plotted

-

If you don’t want to average, add your own function in the reduce_fx argument.

-
# default function
-self.log(reduce_fx=torch.mean)
-
-
-
-
-
-
-

Track images

-

If your experiment manager supports image visualization, simply log the image with self.log

-
# (32 batch samples, 3 channels, 28 width, 28 height)
-image = torch.Tensor(32, 3, 28, 28)
-self.log("an_image", image)
-
-
-
-
-
-

Track text

-

If your experiment manager supports text visualization, simply log the text with self.log

-
text = "hello world"
-self.log("some_text", text)
-
-
-

# TODO: show screenshot

-
-
-
-

Configure the saving directory

-

By default, anything that is logged is saved to the current working directory. To use a different directory, set the default_root_dir argument in the Trainer.

-
Trainer(default_root_dir="/your/custom/path")
-
-
-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/visualize/logging_expert.html b/docs/visualize/logging_expert.html deleted file mode 100644 index 8a6c436..0000000 --- a/docs/visualize/logging_expert.html +++ /dev/null @@ -1,806 +0,0 @@ - - - - - - - - - - - - - - Track and Visualize Experiments (expert) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Track and Visualize Experiments (expert)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Track and Visualize Experiments (expert)

-

Audience: Users who want to make their own progress bars or integrate new experiment managers.

-
-
-

Change the progress bar

-

If you’d like to change the way the progress bar displays information, you can use one of our built-in progress bars or build your own.

-
-
-

Use the TQDMProgressBar

-

To use the TQDMProgressBar pass it into the callbacks Trainer argument.

-
from pytorch_lightning.callbacks import TQDMProgressBar
-
-trainer = Trainer(callbacks=[TQDMProgressBar()])
-
-
-
-
-
-

Use the RichProgressBar

-

The RichProgressBar can add custom colors and beautiful formatting for your progress bars. First, install the rich library (https://github.com/Textualize/rich)

-
pip install rich
-
-
-

Then pass the callback into the callbacks Trainer argument:

-
from pytorch_lightning.callbacks import RichProgressBar
-
-trainer = Trainer(callbacks=[RichProgressBar()])
-
-
-

The rich progress bar can also have custom themes

-
from pytorch_lightning.callbacks import RichProgressBar
-from pytorch_lightning.callbacks.progress.rich_progress import RichProgressBarTheme
-
-# create your own theme!
-theme = RichProgressBarTheme(description="green_yellow", progress_bar="green1")
-
-# init as normal
-progress_bar = RichProgressBar(theme=theme)
-trainer = Trainer(callbacks=progress_bar)
-
-
-
-
-
-
-

Customize a progress bar

-

To customize either the TQDMProgressBar or the RichProgressBar, subclass it and override any of its methods.

-
from pytorch_lightning.callbacks import TQDMProgressBar
-
-
-class LitProgressBar(TQDMProgressBar):
-    def init_validation_tqdm(self):
-        bar = super().init_validation_tqdm()
-        bar.set_description("running validation...")
-        return bar
-
-
-
-
-
-

Build your own progress bar

-

To build your own progress bar, subclass ProgressBarBase

-
from pytorch_lightning.callbacks import ProgressBarBase
-
-
-class LitProgressBar(ProgressBarBase):
-    def __init__(self):
-        super().__init__()  # don't forget this :)
-        self.enable = True
-
-    def disable(self):
-        self.enable = False
-
-    def on_train_batch_end(self, trainer, pl_module, outputs, batch_idx):
-        super().on_train_batch_end(trainer, pl_module, outputs, batch_idx)  # don't forget this :)
-        percent = (self.train_batch_idx / self.total_train_batches) * 100
-        sys.stdout.flush()
-        sys.stdout.write(f"{percent:.01f} percent complete \r")
-
-
-bar = LitProgressBar()
-trainer = Trainer(callbacks=[bar])
-
-
-
-
-
-

Integrate an experiment manager

-

To create an integration between a custom logger and Lightning, subclass Logger

-
from pytorch_lightning.loggers import Logger
-
-
-class LitLogger(Logger):
-    @property
-    def name(self) -> str:
-        return "my-experiment"
-
-    @property
-    def version(self):
-        return "version_0"
-
-    def log_metrics(self, metrics, step=None):
-        print("my logged metrics", metrics)
-
-    def log_hyperparams(self, params, *args, **kwargs):
-        print("my logged hyperparameters", params)
-
-
-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/visualize/logging_intermediate.html b/docs/visualize/logging_intermediate.html deleted file mode 100644 index 5f8e554..0000000 --- a/docs/visualize/logging_intermediate.html +++ /dev/null @@ -1,926 +0,0 @@ - - - - - - - - - - - - - - Track and Visualize Experiments (intermediate) — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- -
    - -
  • - - - Docs - - > -
  • - - -
  • Track and Visualize Experiments (intermediate)
  • - - -
  • - - - - - -
  • - -
- - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Track and Visualize Experiments (intermediate)

-

Audience: Users who want to track more complex outputs and use third-party experiment managers.

-
-
-

Track audio and other artifacts

-

To track other artifacts, such as histograms or model topology graphs first select one of the many loggers supported by Lightning

-
from pytorch_lightning import loggers as pl_loggers
-
-tensorboard = pl_loggers.TensorBoardLogger()
-trainer = Trainer(logger=tensorboard)
-
-
-

then access the logger’s API directly

-
def training_step(self):
-    tensorboard = self.logger.experiment
-    tensorboard.add_image()
-    tensorboard.add_histogram(...)
-    tensorboard.add_figure(...)
-
-
-
-
-

Comet.ml

-

To use Comet.ml first install the comet package:

-
pip install comet-ml
-
-
-

Configure the logger and pass it to the Trainer:

-
from pytorch_lightning.loggers import CometLogger
-
-comet_logger = CometLogger(api_key="YOUR_COMET_API_KEY")
-trainer = Trainer(logger=comet_logger)
-
-
-

Access the comet logger from any function (except the LightningModule init) to use its API for tracking advanced artifacts

-
class LitModel(LightningModule):
-    def any_lightning_module_function_or_hook(self):
-        comet = self.logger.experiment
-        fake_images = torch.Tensor(32, 3, 28, 28)
-        comet.add_image("generated_images", fake_images, 0)
-
-
-

Here’s the full documentation for the CometLogger.

-
-
-
-

MLflow

-

To use MLflow first install the MLflow package:

-
pip install mlflow
-
-
-

Configure the logger and pass it to the Trainer:

-
from pytorch_lightning.loggers import MLFlowLogger
-
-mlf_logger = MLFlowLogger(experiment_name="lightning_logs", tracking_uri="file:./ml-runs")
-trainer = Trainer(logger=mlf_logger)
-
-
-

Access the MLflow logger from any function (except the LightningModule init) to use its API for tracking advanced artifacts

-
class LitModel(LightningModule):
-    def any_lightning_module_function_or_hook(self):
-        mlf_logger = self.logger.experiment
-        fake_images = torch.Tensor(32, 3, 28, 28)
-        mlf_logger.add_image("generated_images", fake_images, 0)
-
-
-

Here’s the full documentation for the MLFlowLogger.

-
-
-
-

Neptune.ai

-

To use Neptune.ai first install the neptune package:

-
pip install neptune-client
-
-
-

or with conda:

-
conda install -c conda-forge neptune-client
-
-
-

Configure the logger and pass it to the Trainer:

-
from pytorch_lightning.loggers import NeptuneLogger
-
-neptune_logger = NeptuneLogger(
-    api_key="ANONYMOUS",  # replace with your own
-    project="common/pytorch-lightning-integration",  # format "<WORKSPACE/PROJECT>"
-)
-trainer = Trainer(logger=neptune_logger)
-
-
-

Access the neptune logger from any function (except the LightningModule init) to use its API for tracking advanced artifacts

-
class LitModel(LightningModule):
-    def any_lightning_module_function_or_hook(self):
-        neptune_logger = self.logger.experiment["your/metadata/structure"]
-        neptune_logger.log(metadata)
-
-
-

Here’s the full documentation for the NeptuneLogger.

-
-
-
-

Tensorboard

-

TensorBoard already comes installed with Lightning. If you have removed it, install the following package.

-
pip install tensorboard
-
-
-

Configure the logger and pass it to the Trainer:

-
from pytorch_lightning.loggers import TensorBoardLogger
-
-logger = TensorBoardLogger()
-trainer = Trainer(logger=logger)
-
-
-

Access the tensorboard logger from any function (except the LightningModule init) to use its API for tracking advanced artifacts

-
class LitModel(LightningModule):
-    def any_lightning_module_function_or_hook(self):
-        tensorboard_logger = self.logger.experiment
-        fake_images = torch.Tensor(32, 3, 28, 28)
-        tensorboard_logger.add_image("generated_images", fake_images, 0)
-
-
-

Here’s the full documentation for the TensorBoardLogger.

-
-
-
-

Weights and Biases

-

To use Weights and Biases (wandb) first install the wandb package:

-
pip install wandb
-
-
-

Configure the logger and pass it to the Trainer:

-
from pytorch_lightning.loggers import WandbLogger
-
-wandb_logger = WandbLogger(project="MNIST", log_model="all")
-trainer = Trainer(logger=wandb_logger)
-
-# log gradients and model topology
-wandb_logger.watch(model)
-
-
-

Access the wandb logger from any function (except the LightningModule init) to use its API for tracking advanced artifacts

-
class MyModule(LightningModule):
-    def any_lightning_module_function_or_hook(self):
-        wandb_logger = self.logger.experiment
-        fake_images = torch.Tensor(32, 3, 28, 28)
-
-        # Option 1
-        wandb_logger.log({"generated_images": [wandb.Image(fake_images, caption="...")]})
-
-        # Option 2 for specifically logging images
-        wandb_logger.log_image(key="generated_images", images=[fake_images])
-
-
-

Here’s the full documentation for the WandbLogger. -Demo in Google Colab with hyperparameter search and model logging.

-
-
-
-

Use multiple exp managers

-

To use multiple experiment managers at the same time, pass a list to the logger Trainer argument.

-
from pytorch_lightning.loggers import TensorBoardLogger, WandbLogger
-
-logger1 = TensorBoardLogger()
-logger2 = WandbLogger()
-trainer = Trainer(logger=[logger1, logger2])
-
-
-

Access all loggers from any function (except the LightningModule init) to use their APIs for tracking advanced artifacts

-
class MyModule(LightningModule):
-    def any_lightning_module_function_or_hook(self):
-        tensorboard_logger = self.logger.experiment[0]
-        wandb_logger = self.logger.experiment[1]
-
-        fake_images = torch.Tensor(32, 3, 28, 28)
-
-        tensorboard_logger.add_image("generated_images", fake_images, 0)
-        wandb_logger.add_image("generated_images", fake_images, 0)
-
-
-
-
-
-
-

Track multiple metrics in the same chart

-

If your logger supports plotting multiple metrics on the same chart, pass in a dictionary to self.log.

-
self.log("performance", {"acc": acc, "recall": recall})
-
-
-
-
-
-

Track hyperparameters

-

To track hyperparameters, first call save_hyperparameters from the LightningModule init:

-
class MyLightningModule(LightningModule):
-    def __init__(self, learning_rate, another_parameter, *args, **kwargs):
-        super().__init__()
-        self.save_hyperparameters()
-
-
-

If your logger supports tracked hyperparameters, the hyperparameters will automatically show up on the logger dashboard.

-

TODO: show tracked hyperparameters.

-
-
-
-

Track model topology

-

Multiple loggers support visualizing the model topology. Here’s an example that tracks the model topology using Tensorboard.

-
def any_lightning_module_function_or_hook(self):
-    tensorboard_logger = self.logger.experiment
-
-    prototype_array = torch.Tensor(32, 1, 28, 27)
-    tensorboard_logger.log_graph(model=self, input_array=prototype_array)
-
-
-

TODO: show tensorboard topology.

-
-
- - -
- -
-
- - - - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/docs/visualize/supported_exp_managers.html b/docs/visualize/supported_exp_managers.html deleted file mode 100644 index daab22f..0000000 --- a/docs/visualize/supported_exp_managers.html +++ /dev/null @@ -1,848 +0,0 @@ - - - - - - - - - - - - - - Comet.ml — PyTorch Lightning 1.7.0dev documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- - - - - -
-
-
- - - - - - - - - - - -
-
-
- - - - - - - - - - - - - - - - -
- - - - -
-
- -
- Shortcuts -
-
- -
-
- - - -
- -
-
- -
-

Comet.ml

-

To use Comet.ml first install the comet package:

-
pip install comet-ml
-
-
-

Configure the logger and pass it to the Trainer:

-
from pytorch_lightning.loggers import CometLogger
-
-comet_logger = CometLogger(api_key="YOUR_COMET_API_KEY")
-trainer = Trainer(logger=comet_logger)
-
-
-

Access the comet logger from any function (except the LightningModule init) to use its API for tracking advanced artifacts

-
class LitModel(LightningModule):
-    def any_lightning_module_function_or_hook(self):
-        comet = self.logger.experiment
-        fake_images = torch.Tensor(32, 3, 28, 28)
-        comet.add_image("generated_images", fake_images, 0)
-
-
-

Here’s the full documentation for the CometLogger.

-
-
-
-

MLflow

-

To use MLflow first install the MLflow package:

-
pip install mlflow
-
-
-

Configure the logger and pass it to the Trainer:

-
from pytorch_lightning.loggers import MLFlowLogger
-
-mlf_logger = MLFlowLogger(experiment_name="lightning_logs", tracking_uri="file:./ml-runs")
-trainer = Trainer(logger=mlf_logger)
-
-
-

Access the MLflow logger from any function (except the LightningModule init) to use its API for tracking advanced artifacts

-
class LitModel(LightningModule):
-    def any_lightning_module_function_or_hook(self):
-        mlf_logger = self.logger.experiment
-        fake_images = torch.Tensor(32, 3, 28, 28)
-        mlf_logger.add_image("generated_images", fake_images, 0)
-
-
-

Here’s the full documentation for the MLFlowLogger.

-
-
-
-

Neptune.ai

-

To use Neptune.ai first install the neptune package:

-
pip install neptune-client
-
-
-

or with conda:

-
conda install -c conda-forge neptune-client
-
-
-

Configure the logger and pass it to the Trainer:

-
from pytorch_lightning.loggers import NeptuneLogger
-
-neptune_logger = NeptuneLogger(
-    api_key="ANONYMOUS",  # replace with your own
-    project="common/pytorch-lightning-integration",  # format "<WORKSPACE/PROJECT>"
-)
-trainer = Trainer(logger=neptune_logger)
-
-
-

Access the neptune logger from any function (except the LightningModule init) to use its API for tracking advanced artifacts

-
class LitModel(LightningModule):
-    def any_lightning_module_function_or_hook(self):
-        neptune_logger = self.logger.experiment["your/metadata/structure"]
-        neptune_logger.log(metadata)
-
-
-

Here’s the full documentation for the NeptuneLogger.

-
-
-
-

Tensorboard

-

TensorBoard already comes installed with Lightning. If you have removed it, install the following package.

-
pip install tensorboard
-
-
-

Configure the logger and pass it to the Trainer:

-
from pytorch_lightning.loggers import TensorBoardLogger
-
-logger = TensorBoardLogger()
-trainer = Trainer(logger=logger)
-
-
-

Access the tensorboard logger from any function (except the LightningModule init) to use its API for tracking advanced artifacts

-
class LitModel(LightningModule):
-    def any_lightning_module_function_or_hook(self):
-        tensorboard_logger = self.logger.experiment
-        fake_images = torch.Tensor(32, 3, 28, 28)
-        tensorboard_logger.add_image("generated_images", fake_images, 0)
-
-
-

Here’s the full documentation for the TensorBoardLogger.

-
-
-
-

Weights and Biases

-

To use Weights and Biases (wandb) first install the wandb package:

-
pip install wandb
-
-
-

Configure the logger and pass it to the Trainer:

-
from pytorch_lightning.loggers import WandbLogger
-
-wandb_logger = WandbLogger(project="MNIST", log_model="all")
-trainer = Trainer(logger=wandb_logger)
-
-# log gradients and model topology
-wandb_logger.watch(model)
-
-
-

Access the wandb logger from any function (except the LightningModule init) to use its API for tracking advanced artifacts

-
class MyModule(LightningModule):
-    def any_lightning_module_function_or_hook(self):
-        wandb_logger = self.logger.experiment
-        fake_images = torch.Tensor(32, 3, 28, 28)
-
-        # Option 1
-        wandb_logger.log({"generated_images": [wandb.Image(fake_images, caption="...")]})
-
-        # Option 2 for specifically logging images
-        wandb_logger.log_image(key="generated_images", images=[fake_images])
-
-
-

Here’s the full documentation for the WandbLogger. -Demo in Google Colab with hyperparameter search and model logging.

-
-
-
-

Use multiple exp managers

-

To use multiple experiment managers at the same time, pass a list to the logger Trainer argument.

-
from pytorch_lightning.loggers import TensorBoardLogger, WandbLogger
-
-logger1 = TensorBoardLogger()
-logger2 = WandbLogger()
-trainer = Trainer(logger=[logger1, logger2])
-
-
-

Access all loggers from any function (except the LightningModule init) to use their APIs for tracking advanced artifacts

-
class MyModule(LightningModule):
-    def any_lightning_module_function_or_hook(self):
-        tensorboard_logger = self.logger.experiment[0]
-        wandb_logger = self.logger.experiment[1]
-
-        fake_images = torch.Tensor(32, 3, 28, 28)
-
-        tensorboard_logger.add_image("generated_images", fake_images, 0)
-        wandb_logger.add_image("generated_images", fake_images, 0)
-
-
-
- - -
- -
-
- - - - -
- - - -
-

- © Copyright Copyright (c) 2018-2022, William Falcon et al... - -

-
- -
- Built with Sphinx using a theme provided by Read the Docs. -
- - -
- -
-
- - -
-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-
-
- -
-
-
- - - - - - - - - -
-
-
-
- - -
-
-
- - -
- - - - - - - - - \ No newline at end of file diff --git a/examples/README.md b/examples/README.md new file mode 100644 index 0000000..243e172 --- /dev/null +++ b/examples/README.md @@ -0,0 +1,37 @@ +# Examples + +Our most robust examples showing all sorts of implementations +can be found in our sister library [Lightning Bolts](https://lightning.ai/docs/pytorch/latest/ecosystem/bolts.html). + +______________________________________________________________________ + +*Note that some examples may rely on new features that are only available in the development branch and may be incompatible with any releases.* +*If you see any errors, you might want to consider switching to a version tag you would like to run examples with.* +*For example, if you're using `pytorch-lightning==1.6.4` in your environment and seeing issues, run examples of the tag [1.6.4](https://github.com/Lightning-AI/lightning/tree/1.6.4/pl_examples).* + +______________________________________________________________________ + +## Lightning Fabric Examples + +We show how to accelerate your PyTorch code with [Lightning Fabric](https://lightning.ai/docs/fabric) with minimal code changes. +You stay in full control of the training loop. + +- [MNIST: Vanilla PyTorch vs. Fabric](fabric/image_classifier/README.md) +- [DCGAN: Vanilla PyTorch vs. Fabric](fabric/dcgan/README.md) + +______________________________________________________________________ + +## Lightning Trainer Examples + +In this folder, we have 2 simple examples that showcase the power of the Lightning Trainer. + +- [Image Classifier](pytorch/basics/backbone_image_classifier.py) (trains arbitrary datasets with arbitrary backbones). +- [Autoencoder](pytorch/basics/autoencoder.py) + +______________________________________________________________________ + +## Domain Examples + +This folder contains older examples. 
You should instead use the examples +in [Lightning Bolts](https://lightning.ai/docs/pytorch/latest/ecosystem/bolts.html) +for advanced use cases. diff --git a/examples/app/argparse/app.py b/examples/app/argparse/app.py new file mode 100644 index 0000000..794e2fc --- /dev/null +++ b/examples/app/argparse/app.py @@ -0,0 +1,28 @@ +import argparse + +import lightning as L + + +class Work(L.LightningWork): + def __init__(self, cloud_compute): + super().__init__(cloud_compute=cloud_compute) + + def run(self): + pass + + +class Flow(L.LightningFlow): + def __init__(self, cloud_compute): + super().__init__() + self.work = Work(cloud_compute) + + def run(self): + assert self.work.cloud_compute.name == "gpu", self.work.cloud_compute.name + self.stop() + + +if __name__ == "__main__": + parser = argparse.ArgumentParser() + parser.add_argument("--use_gpu", action="store_true", default=False, help="Whether to use GPU in the cloud") + hparams = parser.parse_args() + app = L.LightningApp(Flow(L.CloudCompute("gpu" if hparams.use_gpu else "cpu"))) diff --git a/examples/app/boring/.gitignore b/examples/app/boring/.gitignore new file mode 100644 index 0000000..9401870 --- /dev/null +++ b/examples/app/boring/.gitignore @@ -0,0 +1,10 @@ +lightning_logs +*.pt +.storage/ +.shared/ +data +*.ckpt +redis-stable +node_modules +*.rdb +boring_file.txt diff --git a/examples/app/boring/app.py b/examples/app/boring/app.py new file mode 100644 index 0000000..bf77786 --- /dev/null +++ b/examples/app/boring/app.py @@ -0,0 +1,61 @@ +import os + +import lightning as L +from lightning.app.components import TracerPythonScript +from lightning.app.storage import Path + +FILE_CONTENT = """ +Hello there! +This tab is currently an IFrame of the FastAPI Server running in `DestinationFileAndServeWork`. +Also, the content of this file was created in `SourceFileWork` and then transferred to `DestinationFileAndServeWork`. +Are you already 🤯 ? Stick with us, this is only the beginning. Lightning is 🚀. 
+""" + + +class SourceFileWork(L.LightningWork): + def __init__(self, cloud_compute: L.CloudCompute = L.CloudCompute(), **kwargs): + super().__init__(parallel=True, **kwargs, cloud_compute=cloud_compute) + self.boring_path = None + + def run(self): + # This should be used as a REFERENCE to the file. + self.boring_path = "lit://boring_file.txt" + with open(self.boring_path, "w", encoding="utf-8") as f: + f.write(FILE_CONTENT) + + +class DestinationFileAndServeWork(TracerPythonScript): + def run(self, path: Path): + assert path.exists() + self.script_args += [f"--filepath={path}", f"--host={self.host}", f"--port={self.port}"] + super().run() + + +class BoringApp(L.LightningFlow): + def __init__(self): + super().__init__() + self.source_work = SourceFileWork() + self.dest_work = DestinationFileAndServeWork( + script_path=os.path.join(os.path.dirname(__file__), "scripts/serve.py"), + port=1111, + parallel=False, # runs until killed. + cloud_compute=L.CloudCompute(), + raise_exception=True, + ) + + @property + def ready(self) -> bool: + return self.dest_work.is_running + + def run(self): + self.source_work.run() + if self.source_work.has_succeeded: + # the flow passes the file from one work to another. + self.dest_work.run(self.source_work.boring_path) + self.stop("Boring App End") + + def configure_layout(self): + return {"name": "Boring Tab", "content": self.dest_work.url + "/file"} + + +app = L.LightningApp(BoringApp()) diff --git a/examples/app/boring/app_dynamic.py b/examples/app/boring/app_dynamic.py new file mode 100644 index 0000000..ea66cc2 --- /dev/null +++ b/examples/app/boring/app_dynamic.py @@ -0,0 +1,72 @@ +import os + +import lightning as L +from lightning.app.components import TracerPythonScript +from lightning.app.storage import Path +from lightning.app.structures import Dict + +FILE_CONTENT = """ +Hello there! +This tab is currently an IFrame of the FastAPI Server running in `DestinationFileAndServeWork`. 
+Also, the content of this file was created in `SourceFileWork` and then transferred to `DestinationFileAndServeWork`. +Are you already 🤯 ? Stick with us, this is only the beginning. Lightning is 🚀. +""" + + +class SourceFileWork(L.LightningWork): + def __init__(self, cloud_compute: L.CloudCompute = L.CloudCompute(), **kwargs): + super().__init__(parallel=True, **kwargs, cloud_compute=cloud_compute) + self.boring_path = None + + def run(self): + # This should be used as a REFERENCE to the file. + self.boring_path = "lit://boring_file.txt" + with open(self.boring_path, "w") as f: + f.write(FILE_CONTENT) + + +class DestinationFileAndServeWork(TracerPythonScript): + def run(self, path: Path): + assert path.exists() + self.script_args += [f"--filepath={path}", f"--host={self.host}", f"--port={self.port}"] + super().run() + + +class BoringApp(L.LightningFlow): + def __init__(self): + super().__init__() + self.dict = Dict() + + @property + def ready(self) -> bool: + if "dst_w" in self.dict: + return self.dict["dst_w"].url != "" + return False + + def run(self): + # create dynamically the source_work at runtime + if "src_w" not in self.dict: + self.dict["src_w"] = SourceFileWork() + + self.dict["src_w"].run() + + if self.dict["src_w"].has_succeeded: + # create dynamically the dst_w at runtime + if "dst_w" not in self.dict: + self.dict["dst_w"] = DestinationFileAndServeWork( + script_path=os.path.join(os.path.dirname(__file__), "scripts/serve.py"), + port=1111, + parallel=False, # runs until killed. + cloud_compute=L.CloudCompute(), + raise_exception=True, + ) + + # the flow passes the file from one work to another. 
+ self.dict["dst_w"].run(self.dict["src_w"].boring_path) + self.stop("Boring App End") + + def configure_layout(self): + return {"name": "Boring Tab", "content": self.dict["dst_w"].url + "/file" if "dst_w" in self.dict else ""} + + +app = L.LightningApp(BoringApp(), log_level="debug") diff --git a/examples/app/boring/scripts/__init__.py b/examples/app/boring/scripts/__init__.py new file mode 100644 index 0000000..e69de29 diff --git a/examples/app/boring/scripts/serve.py b/examples/app/boring/scripts/serve.py new file mode 100644 index 0000000..dedd601 --- /dev/null +++ b/examples/app/boring/scripts/serve.py @@ -0,0 +1,29 @@ +import argparse +import os + +import uvicorn +from fastapi import FastAPI +from fastapi.requests import Request +from fastapi.responses import HTMLResponse + +if __name__ == "__main__": + parser = argparse.ArgumentParser("Server Parser") + parser.add_argument("--filepath", type=str, help="Where to find the `filepath`") + parser.add_argument("--host", type=str, default="0.0.0.0", help="Server host`") + parser.add_argument("--port", type=int, default="8888", help="Server port`") + hparams = parser.parse_args() + + fastapi_service = FastAPI() + + if not os.path.exists(str(hparams.filepath)): + content = ["The file wasn't transferred"] + else: + with open(hparams.filepath) as fo: + content = fo.readlines() # read the file received from SourceWork. + + @fastapi_service.get("/file") + async def get_file_content(request: Request, response_class=HTMLResponse): + lines = "\n".join(["

" + line + "

" for line in content]) + return HTMLResponse(f"
    {lines}
") + + uvicorn.run(app=fastapi_service, host=hparams.host, port=hparams.port) diff --git a/examples/app/commands_and_api/.lightningignore b/examples/app/commands_and_api/.lightningignore new file mode 100644 index 0000000..f7275bb --- /dev/null +++ b/examples/app/commands_and_api/.lightningignore @@ -0,0 +1 @@ +venv/ diff --git a/examples/app/commands_and_api/app.py b/examples/app/commands_and_api/app.py new file mode 100644 index 0000000..a661663 --- /dev/null +++ b/examples/app/commands_and_api/app.py @@ -0,0 +1,53 @@ +from command import CustomCommand, CustomConfig + +from lightning import LightningFlow +from lightning.app.api import Get, Post +from lightning.app.core.app import LightningApp + + +async def handler(): + print("Has been called") + return "Hello World !" + + +class ChildFlow(LightningFlow): + def nested_command(self, name: str): + """A nested command.""" + print(f"Hello {name}") + + def configure_commands(self): + return [{"nested_command": self.nested_command}] + + +class FlowCommands(LightningFlow): + def __init__(self): + super().__init__() + self.names = [] + self.child_flow = ChildFlow() + + def run(self): + if self.names: + print(self.names) + + def command_without_client(self, name: str): + """A command without a client.""" + self.names.append(name) + + def command_with_client(self, config: CustomConfig): + self.names.append(config.name) + + def configure_commands(self): + commands = [ + {"command_without_client": self.command_without_client}, + {"command_with_client": CustomCommand(self.command_with_client)}, + ] + return commands + self.child_flow.configure_commands() + + def configure_api(self): + return [ + Post("/user/command_without_client", self.command_without_client), + Get("/pure_function", handler), + ] + + +app = LightningApp(FlowCommands(), log_level="debug") diff --git a/examples/app/commands_and_api/command.py b/examples/app/commands_and_api/command.py new file mode 100644 index 0000000..96d3f67 --- /dev/null +++ 
b/examples/app/commands_and_api/command.py @@ -0,0 +1,19 @@ +from argparse import ArgumentParser + +from pydantic import BaseModel + +from lightning.app.utilities.commands import ClientCommand + + +class CustomConfig(BaseModel): + name: str + + +class CustomCommand(ClientCommand): + description = "A command with a client." + + def run(self): + parser = ArgumentParser() + parser.add_argument("--name", type=str) + args = parser.parse_args() + self.invoke_handler(config=CustomConfig(name=args.name)) diff --git a/examples/app/components/python/__init__.py b/examples/app/components/python/__init__.py new file mode 100644 index 0000000..e69de29 diff --git a/examples/app/components/python/app.py b/examples/app/components/python/app.py new file mode 100644 index 0000000..467caa2 --- /dev/null +++ b/examples/app/components/python/app.py @@ -0,0 +1,24 @@ +import os +from pathlib import Path + +import lightning as L +from examples.components.python.component_tracer import PLTracerPythonScript + + +class RootFlow(L.LightningFlow): + def __init__(self): + super().__init__() + script_path = Path(__file__).parent / "pl_script.py" + self.tracer_python_script = PLTracerPythonScript(script_path) + + def run(self): + assert os.getenv("GLOBAL_RANK", "0") == "0" + if not self.tracer_python_script.has_started: + self.tracer_python_script.run() + if self.tracer_python_script.has_succeeded: + self.stop("tracer script succeed") + if self.tracer_python_script.has_failed: + self.stop("tracer script failed") + + +app = L.LightningApp(RootFlow()) diff --git a/examples/app/components/python/component_popen.py b/examples/app/components/python/component_popen.py new file mode 100644 index 0000000..bc70b9f --- /dev/null +++ b/examples/app/components/python/component_popen.py @@ -0,0 +1,7 @@ +from pathlib import Path + +from lightning.app.components import PopenPythonScript + +if __name__ == "__main__": + comp = PopenPythonScript(Path(__file__).parent / "pl_script.py") + comp.run() diff --git 
a/examples/app/components/python/component_tracer.py b/examples/app/components/python/component_tracer.py new file mode 100644 index 0000000..27ff653 --- /dev/null +++ b/examples/app/components/python/component_tracer.py @@ -0,0 +1,52 @@ +from lightning.app.components import TracerPythonScript +from lightning.app.storage import Path +from lightning.app.utilities.tracer import Tracer +from lightning.pytorch import Trainer + + +class PLTracerPythonScript(TracerPythonScript): + """This component can be used for ANY PyTorch Lightning script to track its progress and extract its best model + path.""" + + def __init__(self, *args, **kwargs): + super().__init__(*args, **kwargs) + # Define the component state. + self.global_step = None + self.best_model_path = None + + def configure_tracer(self) -> Tracer: + from lightning.pytorch.callbacks import Callback + + class MyInjectedCallback(Callback): + def __init__(self, lightning_work): + self.lightning_work = lightning_work + + def on_train_start(self, trainer, pl_module) -> None: + print("This code doesn't belong to the script but was injected.") + print("Even the Lightning Work is available and state transfer works !") + print(self.lightning_work) + + def on_batch_train_end(self, trainer, *_) -> None: + # On every batch end, collects some information. + # This is communicated automatically to the rest of the app, + # so you can track your training in real time in the Lightning App UI. + self.lightning_work.global_step = trainer.global_step + best_model_path = trainer.checkpoint_callback.best_model_path + if best_model_path: + self.lightning_work.best_model_path = Path(best_model_path) + + # This hook would be called every time + # before a Trainer `__init__` method is called. 
+ + def trainer_pre_fn(trainer, *args, **kwargs): + kwargs["callbacks"] = kwargs.get("callbacks", []) + [MyInjectedCallback(self)] + return {}, args, kwargs + + tracer = super().configure_tracer() + tracer.add_traced(Trainer, "__init__", pre_fn=trainer_pre_fn) + return tracer + + +if __name__ == "__main__": + comp = PLTracerPythonScript(Path(__file__).parent / "pl_script.py") + res = comp.run() diff --git a/examples/app/components/python/pl_script.py b/examples/app/components/python/pl_script.py new file mode 100644 index 0000000..75538da --- /dev/null +++ b/examples/app/components/python/pl_script.py @@ -0,0 +1,10 @@ +from lightning.pytorch import Trainer +from lightning.pytorch.demos.boring_classes import BoringModel + +if __name__ == "__main__": + model = BoringModel() + trainer = Trainer(max_epochs=1, accelerator="cpu", devices=2, strategy="ddp") + trainer.fit(model) + trainer.validate(model) + trainer.test(model) + trainer.predict(model) diff --git a/examples/app/components/serve/gradio/app.py b/examples/app/components/serve/gradio/app.py new file mode 100644 index 0000000..eef7000 --- /dev/null +++ b/examples/app/components/serve/gradio/app.py @@ -0,0 +1,52 @@ +from functools import partial + +import gradio as gr +import requests +import torch +from PIL import Image + +import lightning as L +from lightning.app.components import ServeGradio + + +# Credit to @akhaliq for his inspiring work. 
+# Find his original code there: https://huggingface.co/spaces/akhaliq/AnimeGANv2/blob/main/app.py +class AnimeGANv2UI(ServeGradio): + inputs = gr.inputs.Image(type="pil") + outputs = gr.outputs.Image(type="pil") + elon = "https://upload.wikimedia.org/wikipedia/commons/thumb/3/34/Elon_Musk_Royal_Society_%28crop2%29.jpg/330px-Elon_Musk_Royal_Society_%28crop2%29.jpg" + img = Image.open(requests.get(elon, stream=True).raw) + img.save("elon.jpg") + examples = [["elon.jpg"]] + + def __init__(self): + super().__init__() + self.ready = False + + def predict(self, img): + return self.model(img=img) + + def build_model(self): + repo = "AK391/animegan2-pytorch:main" + model = torch.hub.load(repo, "generator", device="cpu") + face2paint = torch.hub.load(repo, "face2paint", size=512, device="cpu") + self.ready = True + return partial(face2paint, model=model) + + +class RootFlow(L.LightningFlow): + def __init__(self): + super().__init__() + self.demo = AnimeGANv2UI() + + def run(self): + self.demo.run() + + def configure_layout(self): + tabs = [] + if self.demo.ready: + tabs.append({"name": "Home", "content": self.demo}) + return tabs + + +app = L.LightningApp(RootFlow()) diff --git a/examples/app/components/serve/gradio/beyonce.jpg b/examples/app/components/serve/gradio/beyonce.jpg new file mode 100644 index 0000000..68b6084 Binary files /dev/null and b/examples/app/components/serve/gradio/beyonce.jpg differ diff --git a/examples/app/components/serve/gradio/requirements.txt b/examples/app/components/serve/gradio/requirements.txt new file mode 100644 index 0000000..25acedd --- /dev/null +++ b/examples/app/components/serve/gradio/requirements.txt @@ -0,0 +1 @@ +gradio diff --git a/examples/app/dag/.gitignore b/examples/app/dag/.gitignore new file mode 100644 index 0000000..fcb9fa9 --- /dev/null +++ b/examples/app/dag/.gitignore @@ -0,0 +1,6 @@ +df_data +df_target +X_train +X_test +y_train +y_test diff --git a/examples/app/dag/.lightningignore b/examples/app/dag/.lightningignore 
new file mode 100644 index 0000000..78ae490 --- /dev/null +++ b/examples/app/dag/.lightningignore @@ -0,0 +1,8 @@ +*df_data* +*df_target* +*X_train* +*X_test* +*y_train* +*y_test* +*.shared* +*.storage* diff --git a/examples/app/dag/app.py b/examples/app/dag/app.py new file mode 100644 index 0000000..f344242 --- /dev/null +++ b/examples/app/dag/app.py @@ -0,0 +1,131 @@ +import os +from importlib import import_module + +import numpy as np +import pandas as pd +from sklearn import datasets +from sklearn.metrics import mean_squared_error + +import lightning as L +from lightning.app.components import TracerPythonScript +from lightning.app.storage import Payload +from lightning.app.structures import Dict, List + + +def get_path(path): + return os.path.join(os.path.dirname(__file__), path) + + +class GetDataWork(L.LightningWork): + """This component is responsible to download some data and store them with a PayLoad.""" + + def __init__(self): + super().__init__() + self.df_data = None + self.df_target = None + + def run(self): + print("Starting data collection...") + data = datasets.fetch_california_housing(data_home=get_path("data")) + self.df_data = Payload(pd.DataFrame(data["data"], columns=data["feature_names"])) + self.df_target = Payload(pd.DataFrame(data["target"], columns=["MedHouseVal"])) + print("Finished data collection.") + + +class ModelWork(L.LightningWork): + """This component is receiving some data and train a sklearn model.""" + + def __init__(self, model_path: str, parallel: bool): + super().__init__(parallel=parallel) + self.model_path, self.model_name = model_path.split(".") + self.test_rmse = None + + def run(self, X_train: Payload, X_test: Payload, y_train: Payload, y_test: Payload): + print(f"Starting training and evaluating {self.model_name}...") + module = import_module(f"sklearn.{self.model_path}") + model = getattr(module, self.model_name)() + model.fit(X_train.value, y_train.value.ravel()) + y_test_prediction = model.predict(X_test.value) + 
self.test_rmse = np.sqrt(mean_squared_error(y_test.value, y_test_prediction)) + print(f"Finished training and evaluating {self.model_name}.") + + +class DAG(L.LightningFlow): + """This component is a DAG.""" + + def __init__(self, models_paths: list): + super().__init__() + # Step 1: Create a work to get the data. + self.data_collector = GetDataWork() + + # Step 2: Create a tracer component. This is used to execute python script + # and collect any outputs from its globals as Payloads. + self.processing = TracerPythonScript( + get_path("processing.py"), + outputs=["X_train", "X_test", "y_train", "y_test"], + ) + + # Step 3: Create the work to train the models_paths in parallel. + self.dict = Dict( + **{model_path.split(".")[-1]: ModelWork(model_path, parallel=True) for model_path in models_paths} + ) + + # Step 4: Some element to track components progress. + self.has_completed = False + self.metrics = {} + + def run(self): + # Step 1 and 2: Download and process the data. + self.data_collector.run() + self.processing.run( + df_data=self.data_collector.df_data, + df_target=self.data_collector.df_target, + ) + + # Step 3: Launch n models training in parallel. + for model, work in self.dict.items(): + work.run( + X_train=self.processing.X_train, + X_test=self.processing.X_test, + y_train=self.processing.y_train, + y_test=self.processing.y_test, + ) + if work.test_rmse: # Use the state to control when to collect and stop. + self.metrics[model] = work.test_rmse + work.stop() # Stop the model work to reduce cost + + # Step 4: Print the score of each model when they are all finished. 
class ScheduledDAG(L.LightningFlow):
    """Flow that keeps spawning new DAG flows on a cron schedule and drives them to completion."""

    def __init__(self, dag_cls, **dag_kwargs):
        super().__init__()
        # Every DAG launched so far, finished or not.
        self.dags = List()
        # Class used to build each new DAG, and the keyword arguments it receives.
        self._dag_cls = dag_cls
        self.dag_kwargs = dag_kwargs

    def run(self):
        """Example of scheduling an infinite number of DAG runs continuously."""
        # Step 1: Every minute, create and launch a new DAG.
        is_due = self.schedule("* * * * *")
        if is_due:
            print("Launching a new DAG")
            fresh_dag = self._dag_cls(**self.dag_kwargs)
            self.dags.append(fresh_dag)

        # Step 2: Keep running every DAG that has not reported completion yet.
        for dag in self.dags:
            if dag.has_completed:
                continue
            dag.run()
class Work_2(L.LightningWork):
    """Work that fetches ``a.txt`` from a drive and prints its first line."""

    def __init__(self):
        super().__init__()

    def run(self, drive: Drive):
        """List the drive, pull ``a.txt`` to the local filesystem and print its first line."""
        filename = "a.txt"

        drive_content = drive.list(".")
        print(drive_content)  # Prints ["a.txt"]

        exists_before = os.path.exists(filename)
        print(exists_before)  # Prints False

        # Transfer the file from this drive to the local filesystem.
        drive.get(filename)

        exists_after = os.path.exists(filename)
        print(exists_after)  # Prints True

        with open(filename) as handle:
            lines = handle.readlines()
        print(lines[0])  # Prints Hello World !
As an example, in the famous [scikit-learn](https://scikit-learn.org/stable/) library,
hyperparameters are passed as arguments to the constructor of
the estimator classes, such as `C` or `kernel` for the
[Support Vector Classifier](https://scikit-learn.org/stable/modules/classes.html?highlight=svm#module-sklearn.svm), etc.
class RootHPOFlow(L.LightningFlow):
    """Root flow running an Optuna study in batches of works and feeding results to a HiPlot UI.

    Args:
        script_path: Path of the training script handed to every ``ObjectiveWork``.
        data_dir: Data directory handed to every ``ObjectiveWork``.
        total_trials: Trial count at which the flow stops itself.
        simultaneous_trials: Number of trials added each time the current batch is done.
    """

    def __init__(self, script_path, data_dir, total_trials, simultaneous_trials):
        super().__init__()
        self.script_path = script_path
        self.data_dir = data_dir
        self.total_trials = total_trials
        self.simultaneous_trials = simultaneous_trials
        # Upper bound (exclusive) of the trial indices that may currently run.
        self.num_trials = simultaneous_trials
        self._study = optuna.create_study()
        self.ws = Dict()
        self.hi_plot = HiPlotFlow()

    def run(self):
        """Create, start and harvest the objective works of the current batch."""
        # NOTE(review): this stops as soon as ``num_trials`` reaches ``total_trials``,
        # i.e. before the works of the last batch are created - confirm this is intended.
        if self.num_trials >= self.total_trials:
            self.stop()

        has_told_study = []

        for trial_idx in range(self.num_trials):
            work_name = f"objective_work_{trial_idx}"
            if work_name not in self.ws:
                self.ws[work_name] = ObjectiveWork(
                    script_path=self.script_path,
                    data_dir=self.data_dir,
                    cloud_compute=L.CloudCompute("cpu"),
                )
            work = self.ws[work_name]

            if not work.has_started:
                trial = self._study.ask(ObjectiveWork.distributions())
                work.run(trial_id=trial._trial_id, **trial.params)

            # Compare against None explicitly: the metric is a negated accuracy, so a
            # score of zero is ``-0.0`` and falsy. A truthiness test would never report
            # such a trial and the flow would wait for it forever.
            if work.metric is not None and not work.has_told_study:
                self.hi_plot.data.append({"x": -1 * work.metric, **work.params})
                self._study.tell(work.trial_id, work.metric)
                work.has_told_study = True

            has_told_study.append(work.has_told_study)

        # Open the next batch only once every work so far has reported to the study.
        if all(has_told_study):
            self.num_trials += self.simultaneous_trials
class HiPlotFlow(L.LightningFlow):
    """Flow holding the experiment records that the Streamlit/HiPlot frontend displays."""

    def __init__(self):
        super().__init__()
        # Records shown in the UI; filled by whoever owns this flow.
        self.data = []

    def run(self):
        """Nothing to execute: this flow only exposes state and a layout."""
        return None

    def configure_layout(self):
        """Return the Streamlit frontend rendering this flow's state."""
        frontend = StreamlitFrontend(render_fn=render_fn)
        return frontend
class ObjectiveWork(TracerPythonScript):
    """Run the training script for one trial and expose its score as ``metric``.

    Args:
        script_path: Path of the script to execute.
        data_dir: Directory containing ``train``, ``test`` and ``ground_truth.csv``.
        cloud_compute: Compute configuration forwarded to ``TracerPythonScript``.
    """

    def __init__(self, script_path: str, data_dir: str, cloud_compute: Optional[L.CloudCompute]):
        timestamp = datetime.now().strftime("%H:%M:%S")
        # ``mkdtemp`` returns a directory that stays on disk. The previous
        # ``TemporaryDirectory().name`` returned the path of a directory that is
        # removed again as soon as the unreferenced object is finalised.
        tmpdir = tempfile.mkdtemp()
        submission_path = os.path.join(tmpdir, f"{timestamp}.csv")
        best_model_path = os.path.join(tmpdir, f"{timestamp}.model.pt")
        super().__init__(
            script_path,
            script_args=[
                f"--train_data_path={data_dir}/train",
                f"--test_data_path={data_dir}/test",
                f"--submission_path={submission_path}",
                f"--best_model_path={best_model_path}",
            ],
            cloud_compute=cloud_compute,
        )
        self.data_dir = data_dir
        self.best_model_path = best_model_path
        self.submission_path = submission_path
        # Filled in by ``run`` / ``compute_metric``.
        self.metric = None
        self.trial_id = None
        self.params = None
        self.has_told_study = False

    def run(self, trial_id: int, **params):
        """Execute the script with ``params`` as extra CLI flags, then compute the metric."""
        self.trial_id = trial_id
        self.params = params
        self.script_args.extend([f"--{k}={v}" for k, v in params.items()])
        # The directory chosen in ``__init__`` may not exist where this work runs,
        # so make sure the script can write its outputs.
        os.makedirs(os.path.dirname(self.submission_path), exist_ok=True)
        super().run()
        self.compute_metric()

    def _to_labels(self, path: str):
        """Load the ``label`` column of the CSV at ``path`` as a tensor."""
        return torch.from_numpy(pd.read_csv(path).label.values)

    def compute_metric(self):
        """Store the negated binary accuracy of the submission against the ground truth."""
        self.metric = -1 * float(
            Accuracy(task="binary")(
                self._to_labels(self.submission_path),
                self._to_labels(f"{self.data_dir}/ground_truth.csv"),
            )
        )

    @staticmethod
    def distributions():
        """Return the Optuna search space used for every trial."""
        return {
            "backbone": CategoricalDistribution(["resnet18", "resnet34"]),
            "learning_rate": LogUniformDistribution(0.0001, 0.1),
        }
def download_data(url: str, path: str = "data/", verbose: bool = False) -> None:
    """Download the archive at ``url`` into ``path`` (unless already there) and extract it.

    The archive is stored as ``path/<last URL segment>``. When that file already
    exists no request is made, so a cached archive can be re-extracted offline.

    # Code taken from: https://gist.github.com/ruxi/5d6803c116ec1130d484a4ab8c00c603
    # __author__ = "github.com/ruxi"
    # __license__ = "MIT"

    Usage:
        download_file('http://web4host.net/5MB.zip')

    Args:
        url: Location of the archive; ``"NEED_TO_BE_CREATED"`` is rejected.
        path: Directory receiving both the archive and its extracted content.
        verbose: Print the reported file size and chunk count while downloading.

    Raises:
        NotImplementedError: If ``url`` is the ``"NEED_TO_BE_CREATED"`` placeholder.
        requests.HTTPError: If the server answers with an error status.
        PermissionError: If a tar member cannot be extracted.
    """
    if url == "NEED_TO_BE_CREATED":
        raise NotImplementedError

    os.makedirs(path, exist_ok=True)
    local_filename = os.path.join(path, url.split("/")[-1])
    chunk_size = 1024

    if not os.path.exists(local_filename):
        # Stream into a side file and rename at the end, so an interrupted download
        # is never mistaken for a complete, cached archive on the next call.
        partial_filename = f"{local_filename}.part"
        # NOTE(review): ``verify=False`` disables TLS certificate validation; it is
        # kept for backward compatibility but should be dropped if possible.
        with requests.get(url, stream=True, verify=False) as r:
            # Fail loudly instead of saving an HTTP error page as the archive.
            r.raise_for_status()
            file_size = int(r.headers.get("Content-Length", 0))
            num_bars = file_size // chunk_size
            if verbose:
                print({"file_size": file_size})
                print({"num_bars": num_bars})
            with open(partial_filename, "wb") as fp:
                for chunk in r.iter_content(chunk_size=chunk_size):
                    fp.write(chunk)  # type: ignore
        os.replace(partial_filename, local_filename)

    def extract_tarfile(file_path: str, extract_path: str, mode: str):
        # NOTE(review): members are extracted without path sanitising; only use
        # this with trusted archives.
        if os.path.exists(file_path):
            with tarfile.open(file_path, mode=mode) as tar_ref:
                for member in tar_ref.getmembers():
                    try:
                        tar_ref.extract(member, path=extract_path, set_attrs=False)
                    except PermissionError as err:
                        raise PermissionError(f"Could not extract tar file {file_path}") from err

    if ".zip" in local_filename:
        if os.path.exists(local_filename):
            with zipfile.ZipFile(local_filename, "r") as zip_ref:
                zip_ref.extractall(path)
    elif local_filename.endswith((".tar.gz", ".tgz")):
        extract_tarfile(local_filename, path, "r:gz")
    elif local_filename.endswith((".tar.bz2", ".tbz")):
        extract_tarfile(local_filename, path, "r:bz2")
def render_fn(get_state: Callable) -> Callable:
    """Build the JustPy page factory for the counter UI.

    Args:
        get_state: Callable returning the app state; its ``counter`` attribute is
            incremented on every button click.

    Returns:
        A zero-argument function that creates and returns the Quasar page.
    """
    import justpy as jp

    def webpage():
        page = jp.QuasarPage(dark=True)
        layout = jp.Div(classes="q-pa-md q-gutter-sm", a=page)
        counter_label = jp.QBtn(color="primary", text="Counter: 0")

        async def on_click(*_):
            # Bump the shared counter and mirror the new value in the label.
            app_state = get_state()
            app_state.counter += 1
            counter_label.text = f"Counter: {app_state.counter}"

        trigger = jp.QBtn(color="primary", text="Click Me!", click=on_click)

        # The clickable button comes first, the read-only counter second.
        for widget in (trigger, counter_label):
            layout.add(widget)

        return page

    return webpage
class Root(L.LightningFlow):
    """Top-level flow exposing three tabs: a nested flow UI, a flow with sub-tabs, and a URL."""

    def __init__(self):
        super().__init__()
        self.c1 = C1()
        self.c2 = C2()

    def run(self):
        """Keep the app up for ten seconds, then stop it."""
        sleep(10)
        self.stop("Layout End")

    def configure_layout(self):
        """Return one tab description (``name`` / ``content``) per entry."""
        tab_names = ("one", "two", "three")
        tab_contents = (self.c1.c11, self.c2, "https://lightning.ai")
        return [{"name": name, "content": content} for name, content in zip(tab_names, tab_contents)]
Lightning makes multi-node training simple by providing a straightforward interface to orchestrate compute and data.
class AnyDistributedComponent(L.LightningWork):
    """Placeholder work showing the arguments a multi-node work receives."""

    def run(
        self,
        main_address: str,
        main_port: int,
        num_nodes: int,
        node_rank: int,
    ):
        """Print the connection details passed in; replace with real distributed code."""
        message = f"ADD YOUR DISTRIBUTED CODE: {main_address} {main_port} {num_nodes} {node_rank}."
        print(message)
class FabricPyTorchDistributed(L.LightningWork):
    """Work training a tiny MLP with Fabric using the DDP strategy."""

    def run(self):
        """Build the model, wrap it with Fabric and run 1000 optimisation steps."""
        # 1. Prepare the model
        layers = [
            torch.nn.Linear(1, 1),
            torch.nn.ReLU(),
            torch.nn.Linear(1, 1),
        ]
        model = torch.nn.Sequential(*layers)

        # 2. Create Fabric.
        fabric = Fabric(strategy="ddp", precision="16-mixed")
        sgd = torch.optim.SGD(model.parameters(), lr=0.01)
        model, optimizer = fabric.setup(model, sgd)
        criterion = torch.nn.MSELoss()

        # 3. Train the model for 1000 steps.
        num_steps = 1000
        for step in range(num_steps):
            model.zero_grad()
            inputs = torch.tensor([0.8]).to(fabric.device)
            expected = torch.tensor([1.0]).to(fabric.device)
            loss = criterion(model(inputs), expected)
            print(f"global_rank: {fabric.global_rank} step: {step} loss: {loss}")
            fabric.backward(loss)
            optimizer.step()
def distributed_train(local_rank: int, main_address: str, main_port: int, num_nodes: int, node_rank: int, nprocs: int):
    """Train a small linear model with DistributedDataParallel in one spawned process.

    Args:
        local_rank: Index of this process on its node (supplied by ``spawn``).
        main_address: Address of the rank-0 node used for the TCP rendezvous.
        main_port: Port of the rank-0 node used for the TCP rendezvous.
        num_nodes: Number of participating nodes.
        node_rank: Index of this node.
        nprocs: Number of processes per node.
    """
    # 1. SET UP DISTRIBUTED ENVIRONMENT
    global_rank = local_rank + node_rank * nprocs
    world_size = num_nodes * nprocs
    use_cuda = torch.cuda.is_available()

    if torch.distributed.is_available() and not torch.distributed.is_initialized():
        torch.distributed.init_process_group(
            "nccl" if use_cuda else "gloo",
            rank=global_rank,
            world_size=world_size,
            init_method=f"tcp://{main_address}:{main_port}",
        )

    # 2. PREPARE DISTRIBUTED MODEL
    device = torch.device(f"cuda:{local_rank}") if use_cuda else torch.device("cpu")
    # The module must already live on its target device when it is wrapped:
    # DDP rejects ``device_ids`` for a module whose parameters are still on the CPU.
    model = torch.nn.Linear(32, 2).to(device)
    model = DistributedDataParallel(model, device_ids=[local_rank] if use_cuda else None)

    # 3. SETUP LOSS AND OPTIMIZER
    criterion = torch.nn.MSELoss()
    optimizer = torch.optim.SGD(model.parameters(), lr=0.01)

    # 4. TRAIN THE MODEL FOR 50 STEPS
    for step in range(50):
        model.zero_grad()
        x = torch.randn(64, 32).to(device)
        output = model(x)
        loss = criterion(output, torch.ones_like(output))
        print(f"global_rank: {global_rank} step: {step} loss: {loss}")
        loss.backward()
        optimizer.step()

    # 5. VERIFY ALL COPIES OF THE MODEL HAVE THE SAME WEIGHTS AT END OF TRAINING
    weight = model.module.weight.clone()
    torch.distributed.all_reduce(weight)
    # Summing and dividing by ``world_size`` is not bit-exact for every world size,
    # so compare with a tolerance instead of exact equality.
    assert torch.allclose(model.module.weight, weight / world_size)

    print("Multi Node Distributed Training Done!")
class PickleChecker(L.LightningWork):
    """Work that decides whether an "image" payload is a pickle."""

    def run(self, pickle_image: bytes):
        """Return ``True`` or ``False`` for the two known payloads and raise for anything else."""
        content = self.parse_image(pickle_image)
        known_payloads = (
            (b"it is a pickle", True),
            (b"it is not a pickle", False),
        )
        for expected, verdict in known_payloads:
            if content == expected:
                return verdict
        raise Exception("Couldn't parse the image")

    @staticmethod
    def parse_image(image_str: bytes):
        """Placeholder parser: hands the payload back unchanged."""
        return image_str
class PyTorchServer(PythonServer):
    """Serve class predictions from a pretrained torchvision ResNet-18."""

    def setup(self):
        """Load the pretrained model and place it on the GPU when one is available."""
        self._model = torchvision.models.resnet18(pretrained=True)
        self._device = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")
        self._model.to(self._device)
        # Inference only: without eval() the batch-norm layers would normalise with the statistics
        # of the single request image and keep updating their running averages.
        self._model.eval()

    def predict(self, request):
        """Decode the base64 image in ``request.image`` and return the index of the highest-scoring class."""
        image = base64.b64decode(request.image.encode("utf-8"))
        # Normalize below is configured for three channels, so force RGB (greyscale / RGBA uploads would fail).
        image = Image.open(io.BytesIO(image)).convert("RGB")
        transforms = torchvision.transforms.Compose(
            [
                torchvision.transforms.Resize(224),
                torchvision.transforms.ToTensor(),
                torchvision.transforms.Normalize([0.485, 0.456, 0.406], [0.229, 0.224, 0.225]),
            ]
        )
        image = transforms(image)
        image = image.to(self._device)
        # No gradients are needed for serving; skipping autograd saves memory on every request.
        with torch.no_grad():
            prediction = self._model(image.unsqueeze(0))
        return {"prediction": prediction.argmax().item()}
class MyAutoScaler(L.app.components.AutoScaler):
    """Auto-scaler that sizes the replica pool from the number of pending requests per work."""

    def scale(self, replicas: int, metrics: dict) -> int:
        """Return the desired number of replicas.

        Args:
            replicas: Number of replicas currently counted as running.
            metrics: Mapping that must provide ``"pending_requests"`` and ``"pending_works"``.

        Returns:
            ``replicas + 1`` when the load per work reaches ``self.max_batch_size``, one replica less
            (never below zero) when it drops under a quarter of that, otherwise ``replicas``.
        """
        pending_requests = metrics["pending_requests"]
        active_or_pending_works = replicas + metrics["pending_works"]

        # nothing is running or starting: spin up one work only if there is something to serve
        if active_or_pending_works == 0:
            return 1 if pending_requests > 0 else 0

        pending_requests_per_running_or_pending_work = pending_requests / active_or_pending_works

        # scale out if the number of pending requests exceeds max batch size.
        max_requests_per_work = self.max_batch_size
        if pending_requests_per_running_or_pending_work >= max_requests_per_work:
            return replicas + 1

        # scale in if the number of pending requests is below 25% of max_requests_per_work
        min_requests_per_work = max_requests_per_work * 0.25
        if pending_requests_per_running_or_pending_work < min_requests_per_work:
            # `replicas` can be 0 while works are still pending; never ask for a negative count
            return max(replicas - 1, 0)

        return replicas
class HelloWorld(LightningFlow):
    """Root flow that prints the UI's message each time the UI flags a print request."""

    def __init__(self):
        super().__init__()
        self.counter = 0
        self.streamlit_ui = StreamlitUI()

    def run(self):
        """Run the UI flow, then print once and clear the flag if a print was requested."""
        ui = self.streamlit_ui
        ui.run()
        if not ui.should_print:
            return
        print(f"{self.counter}: {ui.message_to_print}")
        self.counter += 1
        # acknowledge the request so the message is printed only once per request
        ui.should_print = False

    def configure_layout(self):
        """Expose the Streamlit flow as the single tab of the app."""
        tab = {"name": "StreamLitUI", "content": self.streamlit_ui}
        return [tab]
class V0App(L.LightningFlow):
    """Flow-only demo app driving two ``Word`` flows and counting its own iterations."""

    def __init__(self):
        super().__init__()
        self.aas = Word("a")
        self.bbs = Word("b")
        self.counter = 0

    def run(self):
        """Print the current state, advance both words, then pause for two seconds."""
        timestamp = datetime.now().strftime("%H:%M:%S")
        print({"time": timestamp, "a": self.aas.repeats, "b": self.bbs.repeats})

        for word in (self.aas, self.bbs):
            word.run()

        sleep(2.0)
        self.counter += 1

    def configure_layout(self):
        """Return one tab per word flow plus a tab pointing at an external TensorBoard page."""
        return [
            {"name": "Tab_1", "content": self.aas},
            {"name": "Tab_2", "content": self.bbs},
            {"name": "Tab_3", "content": "https://tensorboard.dev/experiment/8m1aX0gcQ7aEmH0J7kbBtg/#scalars"},
        ]
= requests.post("http://127.0.0.1:7501/state", json={"stage": "stopping"}, headers=headers) +print(res) diff --git a/examples/app/v0/requirements.txt b/examples/app/v0/requirements.txt new file mode 100644 index 0000000..edfce78 --- /dev/null +++ b/examples/app/v0/requirements.txt @@ -0,0 +1 @@ +py diff --git a/examples/app/v0/ui/a/index.html b/examples/app/v0/ui/a/index.html new file mode 100644 index 0000000..6ddb9a5 --- /dev/null +++ b/examples/app/v0/ui/a/index.html @@ -0,0 +1 @@ +
Hello from component A
diff --git a/examples/app/v0/ui/b/index.html b/examples/app/v0/ui/b/index.html new file mode 100644 index 0000000..3bfd9e2 --- /dev/null +++ b/examples/app/v0/ui/b/index.html @@ -0,0 +1 @@ +
Hello from component B
class Flow(LightningFlow):
    """Flow that runs several ``Work`` instances, one of them on an explicitly chosen machine."""

    def __init__(self):
        super().__init__()
        # In the Cloud: All the works defined without passing explicitly a CloudCompute object
        # are running on the default machine.
        # This would apply to `work_a`, `work_b` and the dynamically created `work_d`.

        self.work_a = Work()
        self.work_b = Work()

        self.work_c = Work(cloud_compute=CloudCompute(name="cpu-small"))

    def run(self):
        """Create ``work_d`` on the first call, then run every work attached to this flow."""
        if not hasattr(self, "work_d"):
            self.work_d = Work()

        for work in self.works():
            work.run()

    def configure_layout(self):
        """Return one tab per work, named after the work."""
        return [{"name": w.name, "content": w} for w in self.works()]
def configure_optimizers(self):
    """Build the SGD optimizer and a step-decay schedule for it.

    Returns:
        A pair of one-element lists: the optimizer and its ``LambdaLR`` scheduler.
    """

    def step_decay(epoch):
        # multiply the base learning rate by 0.1 for every 30 completed epochs
        return 0.1 ** (epoch // 30)

    sgd = optim.SGD(
        self.parameters(),
        lr=self.lr,
        momentum=self.momentum,
        weight_decay=self.weight_decay,
    )
    decay_schedule = lr_scheduler.LambdaLR(sgd, step_decay)
    return [sgd], [decay_schedule]
class S3LightningImagenetDataset(L.LightningDataset):
    """ImageNet-style dataset read through the ``s3`` backend of ``L.LightningDataset``."""

    def __init__(
        self,
        data_source: str,
        split: Literal["train", "val"],
        transforms: Optional[Callable] = None,
        path_to_index_file: Optional[str] = None,
    ):
        """Select the files of one split and remember the class names.

        Args:
            data_source: Location of the data, forwarded to the base class.
            split: Name of the split; a file is kept when this string occurs anywhere in its path.
            transforms: Optional callable applied to every loaded image.
            path_to_index_file: Optional index file location, forwarded to the base class.
        """
        from torchvision.models._meta import _IMAGENET_CATEGORIES

        super().__init__(data_source=data_source, backend="s3", path_to_index_file=path_to_index_file)

        # only get files for the split (``self.files`` is expected to be populated by the base class)
        self.files = tuple(x for x in self.files if split in x)

        # get unique classes
        self.classes = _IMAGENET_CATEGORIES

        self.transforms = transforms

    def load_sample(self, file_path, stream):
        """Load one image and its class index.

        The class name is taken from the name of the directory containing ``file_path``
        (underscores replaced by spaces) and looked up in ``self.classes``.

        Returns:
            ``(image, class_index)``, or ``None`` when the sample could not be loaded; the failure
            is printed together with its traceback.
        """
        from PIL import Image

        try:
            # Force three channels up front so grey scale (and RGBA) images work with or without transforms
            img = Image.open(stream).convert("RGB")

            if self.transforms is not None:
                img = self.transforms(img)

            curr_cls = os.path.basename(os.path.dirname(file_path)).replace("_", " ")
            cls_idx = self.classes.index(curr_cls)
            return img, cls_idx
        except Exception:
            # best effort: report the broken sample instead of aborting the whole run
            print(file_path, traceback.format_exc())
            return None
"imagenet/imagenet-index.txt" + + # ------------------- + # Step 3: Train + # ------------------- + + print("Instantiate Model") + model = ImageNetLightningModel( + weights=None, + data_path=data_path, + index_file_path=index_file_path, + batch_size=args.batchsize, + workers=args.workers, + ) + trainer = L.Trainer() + + print("Train Model") + if args.evaluate: + trainer.test(model) + else: + trainer.fit(model) diff --git a/examples/fabric/build_your_own_trainer/README.md b/examples/fabric/build_your_own_trainer/README.md new file mode 100644 index 0000000..b795ad3 --- /dev/null +++ b/examples/fabric/build_your_own_trainer/README.md @@ -0,0 +1,27 @@ +## Build Your Own Trainer (BYOT) + +This example demonstrates how easy it is to build a fully customizable trainer for your `LightningModule` using `Fabric`. +It is built upon `lightning.fabric` for hardware and training orchestration and consists of two files: + +- trainer.py contains the actual `MyCustomTrainer` implementation +- run.py contains a script utilizing this trainer for training a very simple MNIST module. 
class MNISTModule(L.LightningModule):
    """Small convolutional classifier with ten output classes."""

    def __init__(self) -> None:
        super().__init__()
        feature_layers = [
            torch.nn.Conv2d(in_channels=1, out_channels=16, kernel_size=5, stride=1, padding=2),
            torch.nn.ReLU(),
            torch.nn.MaxPool2d(kernel_size=2),
            torch.nn.Conv2d(in_channels=16, out_channels=32, kernel_size=5, stride=1, padding=2),
            torch.nn.ReLU(),
            torch.nn.MaxPool2d(kernel_size=2),
        ]
        # fully connected layer, output 10 classes
        classifier_layers = [torch.nn.Flatten(), torch.nn.Linear(32 * 7 * 7, 10)]
        self.model = torch.nn.Sequential(*feature_layers, *classifier_layers)
        self.loss_fn = torch.nn.CrossEntropyLoss()

    def forward(self, x: torch.Tensor):
        """Return the class logits for ``x``."""
        return self.model(x)

    def training_step(self, batch, batch_idx: int):
        """Compute cross-entropy loss and top-1 accuracy for one ``(inputs, targets)`` batch."""
        inputs, targets = batch
        logits = self(inputs)
        predictions = logits.argmax(-1)
        return {
            "loss": self.loss_fn(logits, targets),
            "accuracy": accuracy(predictions, targets, num_classes=10, task="multiclass", top_k=1),
        }

    def configure_optimizers(self):
        """Return an Adam optimizer and a plateau scheduler configuration monitoring ``val_accuracy``."""
        adam = torch.optim.Adam(self.parameters(), lr=1e-4)
        plateau = torch.optim.lr_scheduler.ReduceLROnPlateau(adam, mode="max", verbose=True)
        scheduler_cfg = {
            "scheduler": plateau,
            "monitor": "val_accuracy",
            "interval": "epoch",
            "frequency": 1,
        }
        return adam, scheduler_cfg

    def validation_step(self, *args, **kwargs):
        """Validation computes exactly the same quantities as training."""
        return self.training_step(*args, **kwargs)
"auto", + strategy: Union[str, Strategy] = "auto", + devices: Union[List[int], str, int] = "auto", + precision: Union[str, int] = "32-true", + plugins: Optional[Union[str, Any]] = None, + callbacks: Optional[Union[List[Any], Any]] = None, + loggers: Optional[Union[Logger, List[Logger]]] = None, + max_epochs: Optional[int] = 1000, + max_steps: Optional[int] = None, + grad_accum_steps: int = 1, + limit_train_batches: Union[int, float] = float("inf"), + limit_val_batches: Union[int, float] = float("inf"), + validation_frequency: int = 1, + use_distributed_sampler: bool = True, + checkpoint_dir: str = "./checkpoints", + checkpoint_frequency: int = 1, + ) -> None: + """Exemplary Trainer with Fabric. This is a very simple trainer focused on readablity but with reduced + featureset. As a trainer with more included features, we recommend using the + :class:`lightning.pytorch.Trainer`. + + Args: + accelerator: The hardware to run on. Possible choices are: + ``"cpu"``, ``"cuda"``, ``"mps"``, ``"gpu"``, ``"tpu"``, ``"auto"``. + strategy: Strategy for how to run across multiple devices. Possible choices are: + ``"dp"``, ``"ddp"``, ``"ddp_spawn"``, ``"deepspeed"``, ``"fsdp"``. + devices: Number of devices to train on (``int``), + which GPUs to train on (``list`` or ``str``), or ``"auto"``. + The value applies per node. + precision: Double precision (``"64"``), full precision (``"32"``), half precision AMP (``"16-mixed"``), + or bfloat16 precision AMP (``"bf16-mixed"``). + plugins: One or several custom plugins + callbacks: A single callback or a list of callbacks. 
The following hooks are supported: + - on_train_epoch_start + - on train_epoch_end + - on_train_batch_start + - on_train_batch_end + - on_before_backward + - on_after_backward + - on_before_zero_grad + - on_before_optimizer_step + - on_validation_model_eval + - on_validation_model_train + - on_validation_epoch_start + - on_validation_epoch_end + - on_validation_batch_start + - on_validation_batch_end + + loggers: A single logger or a list of loggers. See :meth:`~lightning.fabric.fabric.Fabric.log` for more + information. + + max_epochs: The maximum number of epochs to train + max_steps: The maximum number of (optimizer) steps to train + grad_accum_steps: How many batches to process before each optimizer step + limit_train_batches: Limits the number of train batches per epoch + If greater than number of batches in the dataloader, this has no effect. + limit_val_batches: Limits the number of validation batches per epoch. + If greater than number of batches in the dataloader, this has no effect. + validation_frequency: How many epochs to run before each validation epoch. + use_distributed_sampler: Wraps the sampler of each dataloader with a respective distributed-aware sampler + in case of distributed training. + checkpoint_dir: Directory to store checkpoints to. + checkpoint_frequency: How many epochs to run before each checkpoint is written. + + Warning: + callbacks written for the lightning trainer (especially making assumptions on the trainer), won't work! 
def fit(
    self,
    model: L.LightningModule,
    train_loader: torch.utils.data.DataLoader,
    val_loader: Optional[torch.utils.data.DataLoader],
    ckpt_path: Optional[str] = None,
):
    """The main entrypoint of the trainer, triggering the actual training.

    Args:
        model: the LightningModule to train.
            Can have the same hooks as :attr:`callbacks` (see :meth:`MyCustomTrainer.__init__`).
        train_loader: the training dataloader. Has to be an iterable returning batches.
        val_loader: the validation dataloader. Has to be an iterable returning batches.
            If ``None``, no validation will run.
        ckpt_path: Directory with previous checkpoints to resume training from.
            If specified (and an existing directory), the latest checkpoint within it is loaded.

    Raises:
        NotImplementedError: If the configured strategy is FSDP.
    """
    self.fabric.launch()

    # setup dataloaders
    train_loader = self.fabric.setup_dataloaders(train_loader, use_distributed_sampler=self.use_distributed_sampler)
    if val_loader is not None:
        val_loader = self.fabric.setup_dataloaders(val_loader, use_distributed_sampler=self.use_distributed_sampler)

    # setup model and optimizer
    if isinstance(self.fabric.strategy, L.fabric.strategies.fsdp.FSDPStrategy):
        # currently, there is no way to support fsdp with model.configure_optimizers in fabric
        # as it would require fabric to hold a reference to the model, which we don't want to.
        raise NotImplementedError("BYOT currently does not support FSDP")

    optimizer, scheduler_cfg = self._parse_optimizers_schedulers(model.configure_optimizers())
    assert optimizer is not None
    model, optimizer = self.fabric.setup(model, optimizer)

    # assemble state (current epoch and global step will be added in save)
    state = {"model": model, "optim": optimizer, "scheduler": scheduler_cfg}

    # load last checkpoint if available
    if ckpt_path is not None and os.path.isdir(ckpt_path):
        # resume from the directory the caller asked for, not from the directory new checkpoints go to
        latest_checkpoint_path = self.get_latest_checkpoint(ckpt_path)
        if latest_checkpoint_path is not None:
            self.load(state, latest_checkpoint_path)

    # check if we even need to train here
    if self.max_epochs is not None and self.current_epoch >= self.max_epochs:
        self.should_stop = True

    while not self.should_stop:
        self.train_loop(
            model, optimizer, train_loader, limit_batches=self.limit_train_batches, scheduler_cfg=scheduler_cfg
        )

        if self.should_validate:
            self.val_loop(model, val_loader, limit_batches=self.limit_val_batches)

        self.step_scheduler(model, scheduler_cfg, level="epoch", current_value=self.current_epoch)

        self.current_epoch += 1

        # stopping condition on epoch level
        if self.max_epochs is not None and self.current_epoch >= self.max_epochs:
            self.should_stop = True

        self.save(state)

    # reset for next fit call
    self.should_stop = False
def train_loop(
    self,
    model: L.LightningModule,
    optimizer: torch.optim.Optimizer,
    train_loader: torch.utils.data.DataLoader,
    limit_batches: Union[int, float] = float("inf"),
    scheduler_cfg: Optional[Mapping[str, Union[L.fabric.utilities.types.LRScheduler, bool, str, int]]] = None,
):
    """The training loop running a single training epoch.

    Args:
        model: the LightningModule to train
        optimizer: the optimizer, optimizing the LightningModule.
        train_loader: The dataloader yielding the training batches.
        limit_batches: Limits the batches during this training epoch.
            If greater than the number of batches in the ``train_loader``, this has no effect.
        scheduler_cfg: The learning rate scheduler configuration.
            Have a look at :meth:`lightning.pytorch.LightningModule.configure_optimizers` for supported values.
    """
    self.fabric.call("on_train_epoch_start")
    num_batches = min(len(train_loader), limit_batches)
    iterable = self.progbar_wrapper(train_loader, total=num_batches, desc=f"Epoch {self.current_epoch}")

    for batch_idx, batch in enumerate(iterable):
        # end epoch if stopping training completely or max batches for this epoch reached
        if self.should_stop or batch_idx >= limit_batches:
            break

        self.fabric.call("on_train_batch_start", batch, batch_idx)

        # check if optimizer should step in gradient accumulation.
        # This has to be derived from the batch index: `global_step` only advances when the optimizer
        # steps, so testing it would stall forever after the first step whenever grad_accum_steps > 1.
        # The last batch of the epoch also steps, so a partial window is not carried into the next epoch.
        is_window_complete = (batch_idx + 1) % self.grad_accum_steps == 0
        is_last_batch = batch_idx + 1 == num_batches
        should_optim_step = is_window_complete or is_last_batch
        if should_optim_step:
            # currently only supports a single optimizer
            self.fabric.call("on_before_optimizer_step", optimizer, 0)

            # optimizer step runs train step internally through closure
            optimizer.step(partial(self.training_step, model=model, batch=batch, batch_idx=batch_idx))
            self.fabric.call("on_before_zero_grad", optimizer)

            optimizer.zero_grad()

        else:
            # gradient accumulation -> no optimizer step
            self.training_step(model=model, batch=batch, batch_idx=batch_idx)

        self.fabric.call("on_train_batch_end", self._current_train_return, batch, batch_idx)

        # this guard ensures, we only step the scheduler once per global step
        if should_optim_step:
            self.step_scheduler(model, scheduler_cfg, level="step", current_value=self.global_step)

        # add output values to progress bar
        self._format_iterable(iterable, self._current_train_return, "train")

        # only increase global step if optimizer stepped
        self.global_step += int(should_optim_step)

        # stopping criterion on step level
        if self.max_steps is not None and self.global_step >= self.max_steps:
            self.should_stop = True
            break

    self.fabric.call("on_train_epoch_end")
+ ) + return + + self.fabric.call("on_validation_model_eval") # calls `model.eval()` + + torch.set_grad_enabled(False) + + self.fabric.call("on_validation_epoch_start") + + iterable = self.progbar_wrapper(val_loader, total=min(len(val_loader), limit_batches), desc="Validation") + + for batch_idx, batch in enumerate(iterable): + # end epoch if stopping training completely or max batches for this epoch reached + if self.should_stop or batch_idx >= limit_batches: + break + + self.fabric.call("on_validation_batch_start", batch, batch_idx) + + out = model.validation_step(batch, batch_idx) + # avoid gradients in stored/accumulated values -> prevents potential OOM + out = apply_to_collection(out, torch.Tensor, lambda x: x.detach()) + + self.fabric.call("on_validation_batch_end", out, batch, batch_idx) + self._current_val_return = out + + self._format_iterable(iterable, self._current_val_return, "val") + + self.fabric.call("on_validation_epoch_end") + + self.fabric.call("on_validation_model_train") + torch.set_grad_enabled(True) + + def training_step(self, model: L.LightningModule, batch: Any, batch_idx: int) -> torch.Tensor: + """A single training step, running forward and backward. The optimizer step is called separately, as this + is given as a closure to the optimizer step. 
def step_scheduler(
    self,
    model: L.LightningModule,
    scheduler_cfg: Optional[Mapping[str, Union[L.fabric.utilities.types.LRScheduler, bool, str, int]]],
    level: Literal["step", "epoch"],
    current_value: int,
) -> None:
    """Steps the learning rate scheduler if necessary.

    Args:
        model: The LightningModule to train
        scheduler_cfg: The learning rate scheduler configuration.
            Have a look at :meth:`lightning.pytorch.LightningModule.configure_optimizers` for supported values.
        level: whether we are trying to step on epoch- or step-level
        current_value: Holds the current_epoch if ``level==epoch``, else holds the ``global_step``

    Raises:
        KeyError: If ``scheduler_cfg["monitor"]`` is not among the values returned by the last
            training/validation step (prefixed with ``train_`` / ``val_``).
    """
    # no scheduler
    if scheduler_cfg is None:
        return

    # wrong interval (step vs. epoch)
    if scheduler_cfg["interval"] != level:
        return

    # right interval, but wrong step wrt frequency
    if current_value % cast(int, scheduler_cfg["frequency"]) != 0:
        return

    # assemble potential monitored values; ``None`` maps to ``None`` so that an
    # unmonitored scheduler is stepped without a metric
    possible_monitor_vals = {None: None}
    if isinstance(self._current_train_return, torch.Tensor):
        # ``dict.update`` takes a single mapping, not a (key, value) pair
        possible_monitor_vals.update({"train_loss": self._current_train_return})
    elif isinstance(self._current_train_return, Mapping):
        possible_monitor_vals.update({"train_" + k: v for k, v in self._current_train_return.items()})

    if isinstance(self._current_val_return, torch.Tensor):
        possible_monitor_vals.update({"val_loss": self._current_val_return})
    elif isinstance(self._current_val_return, Mapping):
        possible_monitor_vals.update({"val_" + k: v for k, v in self._current_val_return.items()})

    try:
        monitor = possible_monitor_vals[cast(Optional[str], scheduler_cfg["monitor"])]
    except KeyError as ex:
        possible_keys = list(possible_monitor_vals.keys())
        raise KeyError(
            f"monitor {scheduler_cfg['monitor']} is invalid. Possible values are {possible_keys}."
        ) from ex

    # rely on model hook for actual step
    model.lr_scheduler_step(scheduler_cfg["scheduler"], monitor)
def _parse_optimizers_schedulers(
    self, configure_optim_output
) -> Tuple[
    Optional[L.fabric.utilities.types.Optimizable],
    Optional[Mapping[str, Union[L.fabric.utilities.types.LRScheduler, bool, str, int]]],
]:
    """Recursively parses the output of :meth:`lightning.pytorch.LightningModule.configure_optimizers`.

    Args:
        configure_optim_output: The output of ``configure_optimizers``.
            For supported values, please refer to :meth:`lightning.pytorch.LightningModule.configure_optimizers`.

    Returns:
        A ``(optimizer, scheduler_config)`` tuple. Either entry is ``None`` when the input does not
        contain it; ``(None, None)`` is returned for inputs that match none of the handled shapes.

    Raises:
        NotImplementedError: If a list/tuple made up only of optimizers does not contain exactly one.
    """
    _lr_sched_defaults = {"interval": "epoch", "frequency": 1, "monitor": "val_loss"}

    # single optimizer
    if isinstance(configure_optim_output, L.fabric.utilities.types.Optimizable):
        return configure_optim_output, None

    # single lr scheduler
    if isinstance(configure_optim_output, L.fabric.utilities.types.LRScheduler):
        # ``dict.update`` returns ``None``; merge into a new dict so the config is actually returned
        return None, {**_lr_sched_defaults, "scheduler": configure_optim_output}

    # single lr scheduler config
    if isinstance(configure_optim_output, Mapping):
        _lr_sched_defaults.update(configure_optim_output)
        return None, _lr_sched_defaults

    # list or tuple
    if isinstance(configure_optim_output, (list, tuple)):
        if all(isinstance(_opt_cand, L.fabric.utilities.types.Optimizable) for _opt_cand in configure_optim_output):
            # single optimizer in list: return the optimizer itself (it is not subscriptable)
            if len(configure_optim_output) == 1:
                return configure_optim_output[0], None

            raise NotImplementedError("BYOT only supports a single optimizer")

        if all(
            isinstance(_lr_cand, (L.fabric.utilities.types.LRScheduler, Mapping))
            for _lr_cand in configure_optim_output
        ):
            # single scheduler in list
            if len(configure_optim_output) == 1:
                return None, self._parse_optimizers_schedulers(configure_optim_output[0])[1]

        # optimizer and lr scheduler
        elif len(configure_optim_output) == 2:
            opt_cands, lr_cands = (
                self._parse_optimizers_schedulers(configure_optim_output[0])[0],
                self._parse_optimizers_schedulers(configure_optim_output[1])[1],
            )
            return opt_cands, lr_cands

    return None, None
+ """ + if isinstance(prog_bar, tqdm) and candidates is not None: + postfix_str = "" + float_candidates = apply_to_collection(candidates, torch.Tensor, lambda x: x.item()) + if isinstance(candidates, torch.Tensor): + postfix_str += f" {prefix}_loss: {float_candidates:.3f}" + elif isinstance(candidates, Mapping): + for k, v in float_candidates.items(): + postfix_str += f" {prefix}_{k}: {v:.3f}" + + if postfix_str: + prog_bar.set_postfix_str(postfix_str) diff --git a/examples/fabric/dcgan/README.md b/examples/fabric/dcgan/README.md new file mode 100644 index 0000000..669e282 --- /dev/null +++ b/examples/fabric/dcgan/README.md @@ -0,0 +1,45 @@ +## DCGAN + +This is an example of a GAN (Generative Adversarial Network) that learns to generate realistic images of faces. +We show two code versions: +The first one is implemented in raw PyTorch, but isn't easy to scale. +The second one is using [Lightning Fabric](https://lightning.ai/docs/fabric) to accelerate and scale the model. + +Tip: You can easily inspect the difference between the two files with: + +```bash +sdiff train_torch.py train_fabric.py +``` + +| Real | Generated | +| :------------------------------------------------------------------------------------------------------------------: | :----------------------------------------------------------------------------------------------------------------: | +| ![sample-data](https://user-images.githubusercontent.com/5495193/206484557-2e9e3810-a9c8-4ae0-bc6e-126866fef4f0.png) | ![fake-7914](https://user-images.githubusercontent.com/5495193/206484621-5dc4a9a6-c782-4c71-8e80-27580cdcc7e6.png) | + +### Run + +**Raw PyTorch:** + +```bash +python train_torch.py +``` + +**Accelerated using Lightning Fabric:** + +```bash +python train_fabric.py +``` + +Generated images get saved to the _outputs_ folder. + +### Notes + +The CelebA dataset is hosted through a Google Drive link by the authors, but the downloads are limited. 
+You may get a message saying that the daily quota was reached. In this case, +[manually download the data](https://drive.google.com/drive/folders/0B7EVK8r0v71pWEZsZE9oNnFzTm8?resourcekey=0-5BR16BdXnb8hVj6CNHKzLg) +through your browser. + +### References + +- [DCGAN Tutorial](https://pytorch.org/tutorials/beginner/dcgan_faces_tutorial.html) +- [Unsupervised Representation Learning with Deep Convolutional Generative Adversarial Networks](https://arxiv.org/abs/1511.06434) +- [Large-scale CelebFaces Attributes (CelebA) Dataset](https://mmlab.ie.cuhk.edu.hk/projects/CelebA.html) diff --git a/examples/fabric/dcgan/train_fabric.py b/examples/fabric/dcgan/train_fabric.py new file mode 100644 index 0000000..2eb3998 --- /dev/null +++ b/examples/fabric/dcgan/train_fabric.py @@ -0,0 +1,268 @@ +""" +DCGAN - Accelerated with Lightning Fabric + +Code adapted from the official PyTorch DCGAN tutorial: +https://pytorch.org/tutorials/beginner/dcgan_faces_tutorial.html +""" +import os +import time +from pathlib import Path + +import torch +import torch.nn as nn +import torch.nn.parallel +import torch.optim as optim +import torch.utils.data +import torchvision.transforms as transforms +import torchvision.utils +from torchvision.datasets import CelebA + +from lightning.fabric import Fabric, seed_everything + +# Root directory for dataset +dataroot = "data/" +# Number of workers for dataloader +workers = os.cpu_count() +# Batch size during training +batch_size = 128 +# Spatial size of training images +image_size = 64 +# Number of channels in the training images +nc = 3 +# Size of z latent vector (i.e. 
size of generator input) +nz = 100 +# Size of feature maps in generator +ngf = 64 +# Size of feature maps in discriminator +ndf = 64 +# Number of training epochs +num_epochs = 5 +# Learning rate for optimizers +lr = 0.0002 +# Beta1 hyperparameter for Adam optimizers +beta1 = 0.5 +# Number of GPUs to use +num_gpus = 1 + + +def main(): + # Set random seed for reproducibility + seed_everything(999) + + fabric = Fabric(accelerator="auto", devices=1) + fabric.launch() + + dataset = CelebA( + root=dataroot, + split="all", + download=True, + transform=transforms.Compose( + [ + transforms.Resize(image_size), + transforms.CenterCrop(image_size), + transforms.ToTensor(), + transforms.Normalize((0.5, 0.5, 0.5), (0.5, 0.5, 0.5)), + ] + ), + ) + + # Create the dataloader + dataloader = torch.utils.data.DataLoader(dataset, batch_size=batch_size, shuffle=True, num_workers=workers) + + output_dir = Path("outputs-fabric", time.strftime("%Y%m%d-%H%M%S")) + output_dir.mkdir(parents=True, exist_ok=True) + + # Plot some training images + real_batch = next(iter(dataloader)) + torchvision.utils.save_image( + real_batch[0][:64], + output_dir / "sample-data.png", + padding=2, + normalize=True, + ) + + # Create the generator + generator = Generator() + + # Apply the weights_init function to randomly initialize all weights + generator.apply(weights_init) + + # Create the Discriminator + discriminator = Discriminator() + + # Apply the weights_init function to randomly initialize all weights + discriminator.apply(weights_init) + + # Initialize BCELoss function + criterion = nn.BCELoss() + + # Create batch of latent vectors that we will use to visualize + # the progression of the generator + fixed_noise = torch.randn(64, nz, 1, 1, device=fabric.device) + + # Establish convention for real and fake labels during training + real_label = 1.0 + fake_label = 0.0 + + # Set up Adam optimizers for both G and D + optimizer_d = optim.Adam(discriminator.parameters(), lr=lr, betas=(beta1, 0.999)) + 
optimizer_g = optim.Adam(generator.parameters(), lr=lr, betas=(beta1, 0.999)) + + discriminator, optimizer_d = fabric.setup(discriminator, optimizer_d) + generator, optimizer_g = fabric.setup(generator, optimizer_g) + dataloader = fabric.setup_dataloaders(dataloader) + + # Lists to keep track of progress + losses_g = [] + losses_d = [] + iteration = 0 + + # Training loop + for epoch in range(num_epochs): + for i, data in enumerate(dataloader, 0): + # (1) Update D network: maximize log(D(x)) + log(1 - D(G(z))) + # (a) Train with all-real batch + discriminator.zero_grad() + real = data[0] + b_size = real.size(0) + label = torch.full((b_size,), real_label, dtype=torch.float, device=fabric.device) + # Forward pass real batch through D + output = discriminator(real).view(-1) + # Calculate loss on all-real batch + err_d_real = criterion(output, label) + # Calculate gradients for D in backward pass + fabric.backward(err_d_real) + d_x = output.mean().item() + + # (b) Train with all-fake batch + # Generate batch of latent vectors + noise = torch.randn(b_size, nz, 1, 1, device=fabric.device) + # Generate fake image batch with G + fake = generator(noise) + label.fill_(fake_label) + # Classify all fake batch with D + output = discriminator(fake.detach()).view(-1) + # Calculate D's loss on the all-fake batch + err_d_fake = criterion(output, label) + # Calculate the gradients for this batch, accumulated (summed) with previous gradients + fabric.backward(err_d_fake) + d_g_z1 = output.mean().item() + # Compute error of D as sum over the fake and the real batches + err_d = err_d_real + err_d_fake + # Update D + optimizer_d.step() + + # (2) Update G network: maximize log(D(G(z))) + generator.zero_grad() + label.fill_(real_label) # fake labels are real for generator cost + # Since we just updated D, perform another forward pass of all-fake batch through D + output = discriminator(fake).view(-1) + # Calculate G's loss based on this output + err_g = criterion(output, label) + # 
def weights_init(m):
    """Custom weights initialization called on netG and netD.

    Dispatches on the module's class name: names containing ``"Conv"`` get weights drawn from
    N(0.0, 0.02); names containing ``"BatchNorm"`` get weights drawn from N(1.0, 0.02) and a
    zero bias. Every other module is left untouched.
    """
    layer_kind = type(m).__name__
    if "Conv" in layer_kind:
        nn.init.normal_(m.weight.data, 0.0, 0.02)
        return
    if "BatchNorm" in layer_kind:
        nn.init.normal_(m.weight.data, 1.0, 0.02)
        nn.init.constant_(m.bias.data, 0)
class Discriminator(nn.Module):
    """Convolutional discriminator built as a single ``nn.Sequential`` stored in ``self.main``.

    Channel widths are taken from the module-level ``nc`` (input channels) and ``ndf``
    (base feature-map size) settings.
    """

    def __init__(self):
        super().__init__()
        # input is (nc) x 64 x 64; the first stage has no batch norm
        layers = [
            nn.Conv2d(nc, ndf, 4, 2, 1, bias=False),
            nn.LeakyReLU(0.2, inplace=True),
        ]
        # three strided stages, each doubling the channel count:
        # (ndf) x 32 x 32 -> (ndf*2) x 16 x 16 -> (ndf*4) x 8 x 8 -> (ndf*8) x 4 x 4
        for mult in (1, 2, 4):
            out_channels = ndf * mult * 2
            layers += [
                nn.Conv2d(ndf * mult, out_channels, 4, 2, 1, bias=False),
                nn.BatchNorm2d(out_channels),
                nn.LeakyReLU(0.2, inplace=True),
            ]
        # final 4x4 convolution down to one value per sample, squashed by a sigmoid
        layers += [
            nn.Conv2d(ndf * 8, 1, 4, 1, 0, bias=False),
            nn.Sigmoid(),
        ]
        self.main = nn.Sequential(*layers)

    def forward(self, input):
        """Run ``input`` through the sequential stack and return its output."""
        return self.main(input)
size of generator input) +nz = 100 +# Size of feature maps in generator +ngf = 64 +# Size of feature maps in discriminator +ndf = 64 +# Number of training epochs +num_epochs = 5 +# Learning rate for optimizers +lr = 0.0002 +# Beta1 hyperparameter for Adam optimizers +beta1 = 0.5 +# Number of GPUs to use +num_gpus = 1 + + +def main(): + # Set random seed for reproducibility + seed = 999 + print("Random Seed: ", seed) + random.seed(seed) + torch.manual_seed(seed) + + dataset = CelebA( + root=dataroot, + split="all", + download=True, + transform=transforms.Compose( + [ + transforms.Resize(image_size), + transforms.CenterCrop(image_size), + transforms.ToTensor(), + transforms.Normalize((0.5, 0.5, 0.5), (0.5, 0.5, 0.5)), + ] + ), + ) + + # Create the dataloader + dataloader = torch.utils.data.DataLoader(dataset, batch_size=batch_size, shuffle=True, num_workers=workers) + + # Decide which device we want to run on + device = torch.device("cuda:0" if (torch.cuda.is_available() and num_gpus > 0) else "cpu") + + output_dir = Path("outputs-torch", time.strftime("%Y%m%d-%H%M%S")) + output_dir.mkdir(parents=True, exist_ok=True) + + # Plot some training images + real_batch = next(iter(dataloader)) + torchvision.utils.save_image( + real_batch[0][:64], + output_dir / "sample-data.png", + padding=2, + normalize=True, + ) + + # Create the generator + generator = Generator().to(device) + + # Handle multi-gpu if desired + if (device.type == "cuda") and (num_gpus > 1): + generator = nn.DataParallel(generator, list(range(num_gpus))) + + # Apply the weights_init function to randomly initialize all weights + generator.apply(weights_init) + + # Create the Discriminator + discriminator = Discriminator().to(device) + + # Handle multi-gpu if desired + if (device.type == "cuda") and (num_gpus > 1): + discriminator = nn.DataParallel(discriminator, list(range(num_gpus))) + + # Apply the weights_init function to randomly initialize all weights + discriminator.apply(weights_init) + + # Initialize 
BCELoss function + criterion = nn.BCELoss() + + # Create batch of latent vectors that we will use to visualize + # the progression of the generator + fixed_noise = torch.randn(64, nz, 1, 1, device=device) + + # Establish convention for real and fake labels during training + real_label = 1.0 + fake_label = 0.0 + + # Set up Adam optimizers for both G and D + optimizer_d = optim.Adam(discriminator.parameters(), lr=lr, betas=(beta1, 0.999)) + optimizer_g = optim.Adam(generator.parameters(), lr=lr, betas=(beta1, 0.999)) + + # Lists to keep track of progress + losses_g = [] + losses_d = [] + iteration = 0 + + # Training loop + for epoch in range(num_epochs): + for i, data in enumerate(dataloader, 0): + # (1) Update D network: maximize log(D(x)) + log(1 - D(G(z))) + # (a) Train with all-real batch + discriminator.zero_grad() + real_cpu = data[0].to(device) + b_size = real_cpu.size(0) + label = torch.full((b_size,), real_label, dtype=torch.float, device=device) + # Forward pass real batch through D + output = discriminator(real_cpu).view(-1) + # Calculate loss on all-real batch + err_d_real = criterion(output, label) + # Calculate gradients for D in backward pass + err_d_real.backward() + d_x = output.mean().item() + + # (b) Train with all-fake batch + # Generate batch of latent vectors + noise = torch.randn(b_size, nz, 1, 1, device=device) + # Generate fake image batch with G + fake = generator(noise) + label.fill_(fake_label) + # Classify all fake batch with D + output = discriminator(fake.detach()).view(-1) + # Calculate D's loss on the all-fake batch + err_d_fake = criterion(output, label) + # Calculate the gradients for this batch, accumulated (summed) with previous gradients + err_d_fake.backward() + d_g_z1 = output.mean().item() + # Compute error of D as sum over the fake and the real batches + err_d = err_d_real + err_d_fake + # Update D + optimizer_d.step() + + # (2) Update G network: maximize log(D(G(z))) + generator.zero_grad() + label.fill_(real_label) # fake 
def weights_init(m):
    """Custom weights initialization called on netG and netD.

    Modules whose class name contains ``"Conv"`` have their weights re-drawn from N(0.0, 0.02).
    Modules whose class name contains ``"BatchNorm"`` have their weights re-drawn from
    N(1.0, 0.02) and their bias set to zero. Any other module is not modified.
    """
    name = type(m).__name__
    is_conv = "Conv" in name
    is_batchnorm = "BatchNorm" in name

    if is_conv:
        nn.init.normal_(m.weight.data, 0.0, 0.02)
    elif is_batchnorm:
        nn.init.normal_(m.weight.data, 1.0, 0.02)
        nn.init.constant_(m.bias.data, 0)
class Discriminator(nn.Module):
    """Convolutional discriminator whose layers live in one ``nn.Sequential`` (``self.main``).

    The module-level ``nc`` and ``ndf`` settings give the input channel count and the base
    feature-map size.
    """

    def __init__(self):
        super().__init__()
        widths = [ndf, ndf * 2, ndf * 4, ndf * 8]

        # input is (nc) x 64 x 64
        stack = [nn.Conv2d(nc, widths[0], 4, 2, 1, bias=False), nn.LeakyReLU(0.2, inplace=True)]
        # state sizes after each stage below:
        # (ndf*2) x 16 x 16, (ndf*4) x 8 x 8, (ndf*8) x 4 x 4
        for c_in, c_out in zip(widths[:-1], widths[1:]):
            stack.append(nn.Conv2d(c_in, c_out, 4, 2, 1, bias=False))
            stack.append(nn.BatchNorm2d(c_out))
            stack.append(nn.LeakyReLU(0.2, inplace=True))
        # collapse the remaining 4 x 4 map to a single sigmoid output
        stack.append(nn.Conv2d(widths[-1], 1, 4, 1, 0, bias=False))
        stack.append(nn.Sigmoid())

        self.main = nn.Sequential(*stack)

    def forward(self, input):
        """Return the output of the sequential stack applied to ``input``."""
        return self.main(input)
+ +```bash +# CPU +python train_torch.py +``` + +______________________________________________________________________ + +#### 2. Image Classifier with Lightning Fabric + +This script shows you how to scale the pure PyTorch code to enable GPU and multi-GPU training using [Lightning Fabric](https://lightning.ai/docs/fabric). + +```bash +# CPU +lightning run model train_fabric.py + +# GPU (CUDA or M1 Mac) +lightning run model train_fabric.py --accelerator=gpu + +# Multiple GPUs +lightning run model train_fabric.py --accelerator=gpu --devices=4 +``` diff --git a/examples/fabric/image_classifier/train_fabric.py b/examples/fabric/image_classifier/train_fabric.py new file mode 100644 index 0000000..5f4d931 --- /dev/null +++ b/examples/fabric/image_classifier/train_fabric.py @@ -0,0 +1,192 @@ +# Copyright The Lightning AI team. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. +"""Here are 4 easy steps to use Fabric in your PyTorch code. + +1. Create the Lightning Fabric object at the beginning of your script. + +2. Remove all ``.to`` and ``.cuda`` calls since Fabric will take care of it. + +3. Apply ``setup`` over each model and optimizers pair, ``setup_dataloaders`` on all your dataloaders, +and replace ``loss.backward()`` with ``self.backward(loss)``. + +4. Run the script from the terminal using ``lightning run model path/to/train.py`` + +Accelerate your training loop by setting the ``--accelerator``, ``--strategy``, ``--devices`` options directly from +the command line. 
class Net(nn.Module):
    """Small CNN classifier: two 3x3 convolutions, max pooling, dropout and two linear layers.

    ``fc1`` expects 9216 flattened features (64 channels x 12 x 12), which is what the
    convolution/pooling stack produces for a 1 x 28 x 28 input. The forward pass returns
    log-probabilities over 10 classes.
    """

    def __init__(self) -> None:
        super().__init__()
        # feature extractor
        self.conv1 = nn.Conv2d(1, 32, 3, 1)
        self.conv2 = nn.Conv2d(32, 64, 3, 1)
        # regularization
        self.dropout1 = nn.Dropout(0.25)
        self.dropout2 = nn.Dropout(0.5)
        # classifier head
        self.fc1 = nn.Linear(9216, 128)
        self.fc2 = nn.Linear(128, 10)

    def forward(self, x):
        """Return ``log_softmax`` class scores of shape ``(batch, 10)`` for the batch ``x``."""
        features = F.relu(self.conv1(x))
        features = F.relu(self.conv2(features))
        features = self.dropout1(F.max_pool2d(features, 2))

        hidden = F.relu(self.fc1(torch.flatten(features, 1)))
        logits = self.fc2(self.dropout2(hidden))
        return F.log_softmax(logits, dim=1)
+ + transform = T.Compose([T.ToTensor(), T.Normalize((0.1307,), (0.3081,))]) + + # Let rank 0 download the data first, then everyone will load MNIST + with fabric.rank_zero_first(): + train_dataset = MNIST(DATASETS_PATH, download=fabric.is_global_zero, train=True, transform=transform) + test_dataset = MNIST(DATASETS_PATH, download=fabric.is_global_zero, train=False, transform=transform) + + train_loader = torch.utils.data.DataLoader( + train_dataset, + batch_size=hparams.batch_size, + ) + test_loader = torch.utils.data.DataLoader(test_dataset, batch_size=hparams.batch_size) + + # don't forget to call `setup_dataloaders` to prepare for dataloaders for distributed training. + train_loader, test_loader = fabric.setup_dataloaders(train_loader, test_loader) + + model = Net() # remove call to .to(device) + optimizer = optim.Adadelta(model.parameters(), lr=hparams.lr) + + # don't forget to call `setup` to prepare for model / optimizer for distributed training. + # the model is moved automatically to the right device. 
+ model, optimizer = fabric.setup(model, optimizer) + + scheduler = StepLR(optimizer, step_size=1, gamma=hparams.gamma) + + # use torchmetrics instead of manually computing the accuracy + test_acc = Accuracy(task="multiclass", num_classes=10).to(fabric.device) + + # EPOCH LOOP + for epoch in range(1, hparams.epochs + 1): + # TRAINING LOOP + model.train() + for batch_idx, (data, target) in enumerate(train_loader): + # NOTE: no need to call `.to(device)` on the data, target + optimizer.zero_grad() + output = model(data) + loss = F.nll_loss(output, target) + fabric.backward(loss) # instead of loss.backward() + + optimizer.step() + if (batch_idx == 0) or ((batch_idx + 1) % hparams.log_interval == 0): + print( + "Train Epoch: {} [{}/{} ({:.0f}%)]\tLoss: {:.6f}".format( + epoch, + batch_idx * len(data), + len(train_loader.dataset), + 100.0 * batch_idx / len(train_loader), + loss.item(), + ) + ) + if hparams.dry_run: + break + + scheduler.step() + + # TESTING LOOP + model.eval() + test_loss = 0 + with torch.no_grad(): + for data, target in test_loader: + # NOTE: no need to call `.to(device)` on the data, target + output = model(data) + test_loss += F.nll_loss(output, target, reduction="sum").item() + + # WITHOUT TorchMetrics + # pred = output.argmax(dim=1, keepdim=True) # get the index of the max log-probability + # correct += pred.eq(target.view_as(pred)).sum().item() + + # WITH TorchMetrics + test_acc(output, target) + + if hparams.dry_run: + break + + # all_gather is used to aggregated the value across processes + test_loss = fabric.all_gather(test_loss).sum() / len(test_loader.dataset) + + print(f"\nTest set: Average loss: {test_loss:.4f}, Accuracy: ({100 * test_acc.compute():.0f}%)\n") + test_acc.reset() + + if hparams.dry_run: + break + + # When using distributed training, use `fabric.save` + # to ensure the current process is allowed to save a checkpoint + if hparams.save_model: + fabric.save(model.state_dict(), "mnist_cnn.pt") + + +if __name__ == "__main__": + # 
Arguments can be passed in through the CLI as normal and will be parsed here + # Example: + # lightning run model image_classifier.py accelerator=cuda --epochs=3 + parser = argparse.ArgumentParser(description="Fabric MNIST Example") + parser.add_argument( + "--batch-size", type=int, default=64, metavar="N", help="input batch size for training (default: 64)" + ) + parser.add_argument("--epochs", type=int, default=14, metavar="N", help="number of epochs to train (default: 14)") + parser.add_argument("--lr", type=float, default=1.0, metavar="LR", help="learning rate (default: 1.0)") + parser.add_argument("--gamma", type=float, default=0.7, metavar="M", help="Learning rate step gamma (default: 0.7)") + parser.add_argument("--dry-run", action="store_true", default=False, help="quickly check a single pass") + parser.add_argument("--seed", type=int, default=1, metavar="S", help="random seed (default: 1)") + parser.add_argument( + "--log-interval", + type=int, + default=10, + metavar="N", + help="how many batches to wait before logging training status", + ) + parser.add_argument("--save-model", action="store_true", default=False, help="For Saving the current Model") + hparams = parser.parse_args() + + run(hparams) diff --git a/examples/fabric/image_classifier/train_torch.py b/examples/fabric/image_classifier/train_torch.py new file mode 100644 index 0000000..e2bfd75 --- /dev/null +++ b/examples/fabric/image_classifier/train_torch.py @@ -0,0 +1,152 @@ +# Copyright The Lightning AI team. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 
# Root folder for the MNIST files: a "Datasets" directory three levels above this script.
DATASETS_PATH = path.join(path.dirname(__file__), "..", "..", "..", "Datasets")


# Credit to the PyTorch team.
# Adapted from https://github.com/pytorch/examples/blob/master/mnist/main.py
class Net(nn.Module):
    """Two conv layers and two linear layers mapping a 1-channel image to 10 log-probabilities."""

    def __init__(self) -> None:
        super().__init__()
        # Layers are declared in the order they are applied in ``forward``.
        self.conv1 = nn.Conv2d(1, 32, 3, 1)
        self.conv2 = nn.Conv2d(32, 64, 3, 1)
        self.dropout1 = nn.Dropout(0.25)
        self.dropout2 = nn.Dropout(0.5)
        self.fc1 = nn.Linear(9216, 128)
        self.fc2 = nn.Linear(128, 10)

    def forward(self, x):
        """Return ``log_softmax`` scores over dim 1 for the batch ``x``."""
        activations = F.relu(self.conv2(F.relu(self.conv1(x))))
        pooled = self.dropout1(F.max_pool2d(activations, 2))
        hidden = F.relu(self.fc1(torch.flatten(pooled, 1)))
        logits = self.fc2(self.dropout2(hidden))
        return F.log_softmax(logits, dim=1)


def run(hparams):
    """Train and evaluate ``Net`` on MNIST in plain PyTorch on a single device.

    ``hparams`` is the parsed CLI namespace. This function reads ``seed``, ``batch_size``,
    ``lr``, ``gamma``, ``epochs``, ``log_interval``, ``dry_run`` and ``save_model`` from it.
    """
    torch.manual_seed(hparams.seed)

    # Use CUDA whenever it is available, otherwise stay on the CPU.
    device = torch.device("cuda") if torch.cuda.is_available() else torch.device("cpu")

    preprocess = T.Compose([T.ToTensor(), T.Normalize((0.1307,), (0.3081,))])
    train_set = MNIST(DATASETS_PATH, train=True, download=True, transform=preprocess)
    test_set = MNIST(DATASETS_PATH, train=False, transform=preprocess)

    make_loader = torch.utils.data.DataLoader
    train_loader = make_loader(train_set, batch_size=hparams.batch_size)
    test_loader = make_loader(test_set, batch_size=hparams.batch_size)

    model = Net().to(device)
    optimizer = optim.Adadelta(model.parameters(), lr=hparams.lr)
    scheduler = StepLR(optimizer, step_size=1, gamma=hparams.gamma)

    for epoch in range(1, hparams.epochs + 1):
        # ---- training ----
        model.train()
        for batch_idx, (data, target) in enumerate(train_loader):
            data = data.to(device)
            target = target.to(device)

            optimizer.zero_grad()
            loss = F.nll_loss(model(data), target)
            loss.backward()
            optimizer.step()

            is_log_step = batch_idx == 0 or (batch_idx + 1) % hparams.log_interval == 0
            if not is_log_step:
                continue

            samples_seen = batch_idx * len(data)
            percent_done = 100.0 * batch_idx / len(train_loader)
            print(
                "Train Epoch: {} [{}/{} ({:.0f}%)]\tLoss: {:.6f}".format(
                    epoch, samples_seen, len(train_loader.dataset), percent_done, loss.item()
                )
            )
            # A dry run stops right after the first logged batch.
            if hparams.dry_run:
                break
        scheduler.step()

        # ---- evaluation ----
        model.eval()
        test_loss = 0
        correct = 0
        with torch.no_grad():
            for data, target in test_loader:
                data = data.to(device)
                target = target.to(device)
                output = model(data)
                # accumulate the summed (not averaged) batch loss
                test_loss += F.nll_loss(output, target, reduction="sum").item()
                # index of the largest log-probability is the predicted class
                predicted = output.argmax(dim=1, keepdim=True)
                correct += predicted.eq(target.view_as(predicted)).sum().item()
                if hparams.dry_run:
                    break

        num_test_samples = len(test_loader.dataset)
        test_loss /= num_test_samples

        print(
            "\nTest set: Average loss: {:.4f}, Accuracy: {}/{} ({:.0f}%)\n".format(
                test_loss, correct, num_test_samples, 100.0 * correct / num_test_samples
            )
        )

        if hparams.dry_run:
            break

    if hparams.save_model:
        torch.save(model.state_dict(), "mnist_cnn.pt")


def main():
    """Parse the command-line options and hand them to ``run``."""
    cli = argparse.ArgumentParser(description="PyTorch MNIST Example")
    cli.add_argument(
        "--batch-size", type=int, default=64, metavar="N", help="input batch size for training (default: 64)"
    )
    cli.add_argument("--epochs", type=int, default=14, metavar="N", help="number of epochs to train (default: 14)")
    cli.add_argument("--lr", type=float, default=1.0, metavar="LR", help="learning rate (default: 1.0)")
    cli.add_argument("--gamma", type=float, default=0.7, metavar="M", help="Learning rate step gamma (default: 0.7)")
    cli.add_argument("--dry-run", action="store_true", default=False, help="quickly check a single pass")
    cli.add_argument("--seed", type=int, default=1, metavar="S", help="random seed (default: 1)")
    cli.add_argument(
        "--log-interval",
        type=int,
        default=10,
        metavar="N",
        help="how many batches to wait before logging training status",
    )
    cli.add_argument("--save-model", action="store_true", default=False, help="For Saving the current Model")
    run(cli.parse_args())


if __name__ == "__main__":
    main()
+ +```bash +# CPU +lightning run model train_fabric.py + +# GPU (CUDA or M1 Mac) +lightning run model train_fabric.py --accelerator=gpu + +# Multiple GPUs +lightning run model train_fabric.py --accelerator=gpu --devices=4 +``` + +### References + +- [KFold Model Selection](https://scikit-learn.org/stable/modules/generated/sklearn.model_selection.KFold.html) +- [K-Fold Cross Validation by Sebastian Raschka](https://sebastianraschka.com/blog/2016/model-evaluation-selection-part3.html#introduction-to-k-fold-cross-validation) +- [Cross Validation Wiki](https://en.wikipedia.org/wiki/Cross-validation_(statistics)) diff --git a/examples/fabric/kfold_cv/train_fabric.py b/examples/fabric/kfold_cv/train_fabric.py new file mode 100644 index 0000000..ffaa11f --- /dev/null +++ b/examples/fabric/kfold_cv/train_fabric.py @@ -0,0 +1,194 @@ +# Copyright The Lightning AI team. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License.
# Root folder for the MNIST files: a "Datasets" directory three levels above this script.
DATASETS_PATH = path.join(path.dirname(__file__), "..", "..", "..", "Datasets")


class Net(nn.Module):
    """Small convolutional classifier producing 10 log-probabilities per input image."""

    def __init__(self) -> None:
        super().__init__()
        self.conv1 = nn.Conv2d(1, 32, 3, 1)
        self.conv2 = nn.Conv2d(32, 64, 3, 1)
        self.dropout1 = nn.Dropout(0.25)
        self.dropout2 = nn.Dropout(0.5)
        self.fc1 = nn.Linear(9216, 128)
        self.fc2 = nn.Linear(128, 10)

    def forward(self, x):
        """Return ``log_softmax`` scores over dim 1 for the batch ``x``."""
        x = self.conv1(x)
        x = F.relu(x)
        x = self.conv2(x)
        x = F.relu(x)
        x = F.max_pool2d(x, 2)
        x = self.dropout1(x)
        x = torch.flatten(x, 1)
        x = self.fc1(x)
        x = F.relu(x)
        x = self.dropout2(x)
        x = self.fc2(x)
        return F.log_softmax(x, dim=1)


def train_dataloader(model, data_loader, optimizer, fabric, epoch, hparams, fold):
    """Train ``model`` for one pass over ``data_loader``, logging every ``hparams.log_interval`` batches.

    ``fold`` is part of the signature but is not used in the body. With ``hparams.dry_run`` set,
    training stops after the first batch.
    """
    model.train()
    for batch_idx, (data, target) in enumerate(data_loader):
        # NOTE: `run` passes loaders through `fabric.setup_dataloaders`, so no `.to(device)` is needed
        optimizer.zero_grad()
        output = model(data)
        loss = F.nll_loss(output, target)
        fabric.backward(loss)  # instead of loss.backward()

        optimizer.step()
        if (batch_idx == 0) or ((batch_idx + 1) % hparams.log_interval == 0):
            # NOTE: the total shown is the length of the loader's full dataset, not of the sampled fold.
            print(
                "Train Epoch: {} [{}/{} ({:.0f}%)]\tLoss: {:.6f}".format(
                    epoch,
                    batch_idx * len(data),
                    len(data_loader.dataset),
                    100.0 * batch_idx / len(data_loader),
                    loss.item(),
                )
            )

        if hparams.dry_run:
            break


def validate_dataloader(model, data_loader, fabric, hparams, fold, acc_metric):
    """Evaluate ``model`` on ``data_loader`` and return the accuracy in percent.

    The average loss is printed together with the accuracy. It is normalised by the number of
    samples actually evaluated: the loader draws a fold subset through its sampler, so
    ``len(data_loader.dataset)`` (the full dataset) would understate the loss.
    """
    model.eval()
    loss = 0
    num_samples = 0
    with torch.no_grad():
        for data, target in data_loader:
            # NOTE: `run` passes loaders through `fabric.setup_dataloaders`, so no `.to(device)` is needed
            output = model(data)
            loss += F.nll_loss(output, target, reduction="sum").item()
            num_samples += target.size(0)

            # Accuracy with torchmetrics
            acc_metric.update(output, target)

            if hparams.dry_run:
                break

    # all_gather aggregates both the summed loss and the sample count across processes
    loss = fabric.all_gather(loss).sum() / fabric.all_gather(num_samples).sum()

    # compute acc
    acc = acc_metric.compute() * 100

    print(f"\nFor fold: {fold} Validation set: Average loss: {loss:.4f}, Accuracy: ({acc:.0f}%)\n")
    return acc


def run(hparams):
    """Run k-fold cross validation of ``Net`` on the MNIST training split with Lightning Fabric.

    One model/optimizer pair is kept per fold. Every epoch trains and validates each fold and
    prints the accuracy averaged over the folds. ``hparams`` is the parsed CLI namespace; this
    function reads ``seed``, ``folds``, ``lr``, ``epochs``, ``batch_size``, ``dry_run`` and
    ``save_model`` from it.
    """
    # Accelerator, strategy, devices etc. are provided on the command line.
    # See all options: `lightning run model --help`
    fabric = Fabric()

    seed_everything(hparams.seed)  # instead of torch.manual_seed(...)

    transform = T.Compose([T.ToTensor(), T.Normalize((0.1307,), (0.3081,))])

    # Let rank 0 download the data first, then everyone will load MNIST.
    # Without `download=` nothing is fetched and loading presumably fails on a fresh checkout.
    with fabric.rank_zero_first():
        dataset = MNIST(DATASETS_PATH, download=fabric.is_global_zero, train=True, transform=transform)

    # Loop over different folds (shuffle = False by default so reproducible)
    folds = hparams.folds
    kfold = model_selection.KFold(n_splits=folds)

    # initialize n_splits models and optimizers
    models = [Net() for _ in range(kfold.n_splits)]
    optimizers = [optim.Adadelta(model.parameters(), lr=hparams.lr) for model in models]

    # fabric setup for models and optimizers
    for i in range(kfold.n_splits):
        models[i], optimizers[i] = fabric.setup(models[i], optimizers[i])

    # Accuracy using torchmetrics
    acc_metric = Accuracy(task="multiclass", num_classes=10).to(fabric.device)

    # loop over epochs
    for epoch in range(1, hparams.epochs + 1):
        # loop over folds
        epoch_acc = 0
        for fold, (train_ids, val_ids) in enumerate(kfold.split(dataset)):
            print(f"Working on fold {fold}")

            # initialize dataloaders based on folds
            batch_size = hparams.batch_size
            train_loader = DataLoader(dataset, batch_size=batch_size, sampler=SubsetRandomSampler(train_ids))
            val_loader = DataLoader(dataset, batch_size=batch_size, sampler=SubsetRandomSampler(val_ids))

            # Let Fabric wrap the loaders so batches arrive on the same device as the model;
            # the training/validation loops never call `.to(device)` themselves.
            train_loader, val_loader = fabric.setup_dataloaders(train_loader, val_loader)

            # get model and optimizer for the current fold
            model, optimizer = models[fold], optimizers[fold]

            # train and validate
            train_dataloader(model, train_loader, optimizer, fabric, epoch, hparams, fold)
            epoch_acc += validate_dataloader(model, val_loader, fabric, hparams, fold, acc_metric)
            acc_metric.reset()

        # log epoch metrics
        print(f"Epoch {epoch} - Average acc: {epoch_acc / kfold.n_splits}")

        if hparams.dry_run:
            break

    # When using distributed training, use `fabric.save`
    # to ensure the current process is allowed to save a checkpoint.
    # The last fold's model is saved; indexing `models` also works when no epoch ran.
    if hparams.save_model:
        fabric.save(models[-1].state_dict(), "mnist_cnn.pt")
def main():
    """Train the demo ``Transformer`` on ``WikiText2`` with Lightning Fabric."""
    L.seed_everything(42)

    fabric = L.Fabric()

    # Data: only the train and validation loaders are used by this script.
    corpus = WikiText2()
    train_dataloader, val_dataloader, _ = get_dataloaders(corpus)

    # Model and optimizer
    net = Transformer(vocab_size=corpus.vocab_size)
    sgd = torch.optim.SGD(net.parameters(), lr=0.1)

    net, sgd = fabric.setup(net, sgd)
    train_dataloader, val_dataloader = fabric.setup_dataloaders(train_dataloader, val_dataloader)
    train(fabric, net, sgd, train_dataloader, val_dataloader)


def train(fabric, model, optimizer, train_dataloader, val_dataloader, max_epochs=20):
    """Alternate one training epoch and one validation pass, ``max_epochs`` times."""
    for epoch in range(max_epochs):
        train_epoch(fabric, model, optimizer, train_dataloader, epoch)
        val_loss = validate(fabric, model, val_dataloader)
        fabric.print(f"val loss {val_loss.item():.4f}")


def train_epoch(fabric, model, optimizer, train_dataloader, epoch):
    """Run one optimisation pass over ``train_dataloader``, printing the loss every 200 batches."""
    for batch_idx, (tokens, target) in enumerate(train_dataloader):
        prediction = model(tokens, target)
        loss = F.nll_loss(prediction, target.view(-1))
        fabric.backward(loss)
        fabric.clip_gradients(model, optimizer, clip_val=0.25)
        optimizer.step()
        optimizer.zero_grad()

        if batch_idx % 200:
            continue
        fabric.print(f"epoch: {epoch} - iteration: {batch_idx} - loss {loss.item():.4f}")


@torch.no_grad()
def validate(fabric, model, val_dataloader):
    """Return the mean of the per-batch NLL losses over ``val_dataloader``.

    The model is put in eval mode for the pass and switched back to train mode before returning.
    """
    fabric.print("Validating ...")
    model.eval()
    batch_losses = torch.zeros(len(val_dataloader))
    for k, (tokens, target) in enumerate(val_dataloader):
        prediction = model(tokens, target)
        batch_losses[k] = F.nll_loss(prediction, target.view(-1)).item()
    model.train()
    return batch_losses.mean()


def get_dataloaders(dataset):
    """Split ``dataset`` into train/val/test parts and wrap each one in a ``DataLoader``.

    Validation and test get 2000 samples each and the remainder goes to training. All loaders
    use batches of 20; only the training loader shuffles.
    """
    total = len(dataset)
    train_part, val_part, test_part = random_split(dataset, [total - 4000, 2000, 2000])
    loaders = (
        DataLoader(train_part, batch_size=20, shuffle=True),
        DataLoader(val_part, batch_size=20, shuffle=False),
        DataLoader(test_part, batch_size=20, shuffle=False),
    )
    return loaders


if __name__ == "__main__":
    main()
the +[Omniglot dataset](https://paperswithcode.com/dataset/omniglot-1) of handwritten characters from different alphabets. + +The goal of meta-learning in this context is to learn a 'meta'-model trained on many different tasks, such that it can quickly adapt to a new task when trained with very few samples (few-shot learning). +If you are new to meta-learning, have a look at this short [introduction video](https://www.youtube.com/watch?v=ItPEBdD6VMk). + +We show two code versions: +The first one is implemented in raw PyTorch, but it contains quite a bit of boilerplate code for distributed training. +The second one is using [Lightning Fabric](https://lightning.ai/docs/fabric) to accelerate and scale the model. + +Tip: You can easily inspect the difference between the two files with: + +```bash +sdiff train_torch.py train_fabric.py +``` + +### Requirements + +```bash +pip install lightning learn2learn cherry-rl 'gym<=0.22' +``` + +### Run + +**Raw PyTorch:** + +```bash +torchrun --nproc_per_node=2 --standalone train_torch.py +``` + +**Accelerated using Lightning Fabric:** + +```bash +lightning run model train_fabric.py --devices 2 --strategy ddp --accelerator cpu +``` + +### References + +- [MAML explained in 7 minutes](https://www.youtube.com/watch?v=ItPEBdD6VMk) +- [Learn2Learn Resources](http://learn2learn.net/examples/vision/#maml) +- [MAML Paper](https://arxiv.org/abs/1703.03400) diff --git a/examples/fabric/meta_learning/train_fabric.py b/examples/fabric/meta_learning/train_fabric.py new file mode 100644 index 0000000..d0806fa --- /dev/null +++ b/examples/fabric/meta_learning/train_fabric.py @@ -0,0 +1,163 @@ +""" +MAML - Accelerated with Lightning Fabric + +Adapted from https://github.com/learnables/learn2learn/blob/master/examples/vision/distributed_maml.py +Original code author: Séb Arnold - learnables.net +Based on the paper: https://arxiv.org/abs/1703.03400 + +Requirements: +- lightning>=1.9.0 +- learn2learn +- cherry-rl +- gym<=0.22 + +Run it with: + 
def accuracy(predictions, targets):
    """Return the fraction of rows of ``predictions`` whose argmax over dim 1 equals ``targets``."""
    predicted_labels = predictions.argmax(dim=1).view(targets.shape)
    num_correct = (predicted_labels == targets).sum().float()
    return num_correct / targets.size(0)


def fast_adapt(batch, learner, loss, adaptation_steps, shots, ways):
    """Adapt ``learner`` on part of a task batch and score it on the remainder.

    Returns ``(valid_error, valid_accuracy)`` computed on the evaluation part.
    """
    data, labels = batch

    # Positions 0, 2, 4, ... (``shots * ways`` of them) form the adaptation set;
    # every other position belongs to the evaluation set.
    is_adaptation = torch.zeros(data.size(0), dtype=bool)
    is_adaptation[torch.arange(shots * ways) * 2] = True
    is_evaluation = ~is_adaptation

    adaptation_data = data[is_adaptation]
    adaptation_labels = labels[is_adaptation]
    evaluation_data = data[is_evaluation]
    evaluation_labels = labels[is_evaluation]

    # Adapt the learner on the adaptation set
    for _ in range(adaptation_steps):
        learner.adapt(loss(learner(adaptation_data), adaptation_labels))

    # Score the adapted learner on the evaluation set
    predictions = learner(evaluation_data)
    return loss(predictions, evaluation_labels), accuracy(predictions, evaluation_labels)


def main(
    ways=5,
    shots=5,
    meta_lr=0.003,
    fast_lr=0.5,
    meta_batch_size=32,
    adaptation_steps=1,
    num_iterations=60000,
    seed=42,
):
    """Meta-train a MAML learner on Omniglot with Lightning Fabric, then report meta-test metrics.

    ``meta_batch_size`` is the number of tasks per iteration across all processes; each process
    handles ``meta_batch_size // fabric.world_size`` of them.
    """
    # Fabric reads its configuration from the command line, see `lightning run model --help`
    fabric = Fabric()

    tasks_per_rank = meta_batch_size // fabric.world_size
    seed_everything(seed + fabric.global_rank)  # a different seed on every rank

    # Tasksets come from the learn2learn benchmark interface.
    # 'mini-imagenet' works too, but must be downloaded manually due to ImageNet's license.
    tasksets = l2l.vision.benchmarks.get_tasksets(
        "omniglot",
        train_ways=ways,
        train_samples=2 * shots,
        test_ways=ways,
        test_samples=2 * shots,
        num_tasks=20000,
        root="data",
    )

    # Model (alternative: l2l.vision.models.MiniImagenetCNN(ways))
    model = fabric.to_device(l2l.vision.models.OmniglotFC(28**2, ways))
    maml = l2l.algorithms.MAML(model, lr=fast_lr, first_order=False)
    base_optimizer = torch.optim.Adam(maml.parameters(), meta_lr)
    optimizer = cherry.optim.Distributed(maml.parameters(), opt=base_optimizer, sync=1)

    # `fabric.setup(model, optimizer)` is not used here; the cherry optimizer handles the syncing.
    optimizer.sync_parameters()
    loss = torch.nn.CrossEntropyLoss(reduction="mean")

    def adapt_on_sample(taskset):
        """Clone the meta-learner, draw one task from ``taskset`` and run ``fast_adapt`` on it."""
        learner = maml.clone()
        batch = fabric.to_device(taskset.sample())
        return fast_adapt(batch, learner, loss, adaptation_steps, shots, ways)

    grad_scale = 1.0 / tasks_per_rank

    for iteration in range(num_iterations):
        optimizer.zero_grad()
        train_error_sum = 0.0
        train_accuracy_sum = 0.0
        valid_error_sum = 0.0
        valid_accuracy_sum = 0.0
        for _ in range(tasks_per_rank):
            # Meta-training loss: gradients accumulate over the tasks of this iteration
            task_error, task_accuracy = adapt_on_sample(tasksets.train)
            fabric.backward(task_error)
            train_error_sum += task_error.item()
            train_accuracy_sum += task_accuracy.item()

            # Meta-validation loss: metrics only, no backward pass
            task_error, task_accuracy = adapt_on_sample(tasksets.validation)
            valid_error_sum += task_error.item()
            valid_accuracy_sum += task_accuracy.item()

        # Print some metrics
        fabric.print("\n")
        fabric.print("Iteration", iteration)
        fabric.print("Meta Train Error", train_error_sum / tasks_per_rank)
        fabric.print("Meta Train Accuracy", train_accuracy_sum / tasks_per_rank)
        fabric.print("Meta Valid Error", valid_error_sum / tasks_per_rank)
        fabric.print("Meta Valid Accuracy", valid_accuracy_sum / tasks_per_rank)

        # Average the accumulated gradients and optimize
        for param in maml.parameters():
            param.grad.data.mul_(grad_scale)
        optimizer.step()  # averages gradients across all workers

    # Meta-testing after the last iteration
    test_error_sum = 0.0
    test_accuracy_sum = 0.0
    for _ in range(tasks_per_rank):
        task_error, task_accuracy = adapt_on_sample(tasksets.test)
        test_error_sum += task_error.item()
        test_accuracy_sum += task_accuracy.item()
    fabric.print("Meta Test Error", test_error_sum / tasks_per_rank)
    fabric.print("Meta Test Accuracy", test_accuracy_sum / tasks_per_rank)


if __name__ == "__main__":
    main()
def accuracy(predictions, targets):
    """Return the fraction of rows of ``predictions`` whose argmax over dim 1 equals ``targets``."""
    predictions = predictions.argmax(dim=1).view(targets.shape)
    return (predictions == targets).sum().float() / targets.size(0)


def fast_adapt(batch, learner, loss, adaptation_steps, shots, ways, device):
    """Adapt ``learner`` on part of a task batch and score it on the remainder.

    The batch is moved to ``device`` first. Returns ``(valid_error, valid_accuracy)`` computed
    on the evaluation part.
    """
    data, labels = batch
    data, labels = data.to(device), labels.to(device)

    # Separate data into adaptation/evaluation sets: positions 0, 2, 4, ... (``shots * ways``
    # of them) are used for adaptation, all remaining positions for evaluation.
    adaptation_indices = torch.zeros(data.size(0), dtype=bool)
    adaptation_indices[torch.arange(shots * ways) * 2] = True
    evaluation_indices = ~adaptation_indices
    adaptation_data, adaptation_labels = data[adaptation_indices], labels[adaptation_indices]
    evaluation_data, evaluation_labels = data[evaluation_indices], labels[evaluation_indices]

    # Adapt the model
    for _ in range(adaptation_steps):
        train_error = loss(learner(adaptation_data), adaptation_labels)
        learner.adapt(train_error)

    # Evaluate the adapted model
    predictions = learner(evaluation_data)
    valid_error = loss(predictions, evaluation_labels)
    valid_accuracy = accuracy(predictions, evaluation_labels)
    return valid_error, valid_accuracy


def main(
    ways=5,
    shots=5,
    meta_lr=0.003,
    fast_lr=0.5,
    meta_batch_size=32,
    adaptation_steps=1,
    num_iterations=60000,
    cuda=True,
    seed=42,
):
    """Meta-train a MAML learner on Omniglot with raw ``torch.distributed``, then report test metrics.

    Reads ``LOCAL_RANK`` and ``WORLD_SIZE`` from the environment, as set by ``torchrun``.
    ``meta_batch_size`` is the number of tasks per iteration across all processes; each process
    handles ``meta_batch_size // world_size`` of them. Metrics are printed by rank 0 only.
    """
    local_rank = int(os.environ["LOCAL_RANK"])
    world_size = int(os.environ["WORLD_SIZE"])
    # NOTE(review): the rendezvous address is pinned to localhost and LOCAL_RANK is used as the
    # process rank, so this looks limited to single-node runs - confirm before using multi-node.
    os.environ["MASTER_ADDR"] = "127.0.0.1"
    os.environ["MASTER_PORT"] = "12345"
    dist.init_process_group("gloo", rank=local_rank, world_size=world_size)
    rank = dist.get_rank()

    meta_batch_size = meta_batch_size // world_size
    seed = seed + rank  # a different seed on every rank

    random.seed(seed)
    torch.manual_seed(seed)
    device = torch.device("cpu")
    if cuda and torch.cuda.device_count():
        torch.cuda.manual_seed(seed)
        # Ranks are spread over the visible GPUs round-robin.
        device_id = rank % torch.cuda.device_count()
        device = torch.device("cuda:" + str(device_id))

    # Create Tasksets using the benchmark interface
    tasksets = l2l.vision.benchmarks.get_tasksets(
        # 'mini-imagenet' works too, but you need to download it manually due to license restrictions of ImageNet
        "omniglot",
        train_ways=ways,
        train_samples=2 * shots,
        test_ways=ways,
        test_samples=2 * shots,
        num_tasks=20000,
        root="data",
    )

    # Create model (alternative: l2l.vision.models.MiniImagenetCNN(ways))
    model = l2l.vision.models.OmniglotFC(28**2, ways)
    model.to(device)
    maml = l2l.algorithms.MAML(model, lr=fast_lr, first_order=False)
    optimizer = torch.optim.Adam(maml.parameters(), meta_lr)
    optimizer = cherry.optim.Distributed(maml.parameters(), opt=optimizer, sync=1)
    optimizer.sync_parameters()
    loss = torch.nn.CrossEntropyLoss(reduction="mean")

    for iteration in range(num_iterations):
        optimizer.zero_grad()
        meta_train_error = 0.0
        meta_train_accuracy = 0.0
        meta_valid_error = 0.0
        meta_valid_accuracy = 0.0
        for _ in range(meta_batch_size):
            # Compute meta-training loss; gradients accumulate over the tasks of this iteration
            learner = maml.clone()
            batch = tasksets.train.sample()
            evaluation_error, evaluation_accuracy = fast_adapt(
                batch,
                learner,
                loss,
                adaptation_steps,
                shots,
                ways,
                device,
            )
            evaluation_error.backward()
            meta_train_error += evaluation_error.item()
            meta_train_accuracy += evaluation_accuracy.item()

            # Compute meta-validation loss (metrics only, no backward pass)
            learner = maml.clone()
            batch = tasksets.validation.sample()
            evaluation_error, evaluation_accuracy = fast_adapt(
                batch,
                learner,
                loss,
                adaptation_steps,
                shots,
                ways,
                device,
            )
            meta_valid_error += evaluation_error.item()
            meta_valid_accuracy += evaluation_accuracy.item()

        # Print some metrics
        if rank == 0:
            print("\n")
            print("Iteration", iteration)
            print("Meta Train Error", meta_train_error / meta_batch_size)
            print("Meta Train Accuracy", meta_train_accuracy / meta_batch_size)
            print("Meta Valid Error", meta_valid_error / meta_batch_size)
            print("Meta Valid Accuracy", meta_valid_accuracy / meta_batch_size)

        # Average the accumulated gradients and optimize
        for p in maml.parameters():
            p.grad.data.mul_(1.0 / meta_batch_size)
        optimizer.step()  # averages gradients across all workers

    meta_test_error = 0.0
    meta_test_accuracy = 0.0
    for _ in range(meta_batch_size):
        # Compute meta-testing loss
        learner = maml.clone()
        batch = tasksets.test.sample()
        evaluation_error, evaluation_accuracy = fast_adapt(
            batch,
            learner,
            loss,
            adaptation_steps,
            shots,
            ways,
            device,
        )
        meta_test_error += evaluation_error.item()
        meta_test_accuracy += evaluation_accuracy.item()

    # Report from rank 0 only, like the per-iteration metrics above; otherwise every
    # process prints its own copy of the final lines.
    if rank == 0:
        print("Meta Test Error", meta_test_error / meta_batch_size)
        print("Meta Test Accuracy", meta_test_accuracy / meta_batch_size)


if __name__ == "__main__":
    main()

+ +

+ +PPO is one of such algorithms, which alternates between sampling data through interaction with the environment, and optimizing a +“surrogate” objective function using stochastic gradient ascent. + +## Requirements + +Install requirements by running + +```bash +pip install -r requirements.txt +``` + +## Example 1 - Environment coupled with the agent + +In this example we present two code versions: the first one is implemented in raw PyTorch, but it contains quite a bit of boilerplate code for distributed training. The second one is using Lightning Fabric to accelerate and scale the model. + +The main architecture is the following: + +

+ +

+ +where `N+1` processes (labelled *rank-0*, ..., *rank-N* in the figure above) will be spawned by Fabric/PyTorch, each of them running `M+1` independent copies of the environment (*Env-0*, ..., *Env-M*). Every rank has its own copy of the agent, represented by a [LightningModule](https://lightning.ai/docs/pytorch/stable/common/lightning_module.html)/[Pytorch Module](https://pytorch.org/docs/stable/generated/torch.nn.Module.html), which will be updated through distributed training. + +### Raw PyTorch: + +```bash +torchrun --nproc_per_node=2 --standalone train_torch.py +``` + +### Lightning Fabric: + +```bash +lightning run model --accelerator=cpu --strategy=ddp --devices=2 train_fabric.py +``` + +### Visualizing logs + +You can visualize training and test logs by running: + +```bash +tensorboard --logdir logs +``` + +Under the `logs` folder you should find two folders: + +- `logs/torch_logs` +- `logs/fabric_logs` + +If you have run the experiment with the `--capture-video` you should find the `train_videos` and `test_videos` folders under the specific experiment folder. + +## Results + +The following video shows a trained agent on the [LunarLander-v2 environment](https://gymnasium.farama.org/environments/box2d/lunar_lander/). + +

+ +

+ +The agent was trained with the following: + +```bash +lightning run model \ + --accelerator=cpu \ + --strategy=ddp \ + --devices=2 \ + train_fabric.py \ + --capture-video \ + --env-id LunarLander-v2 \ + --total-timesteps 500000 \ + --ortho-init \ + --num-envs 2 \ + --num-steps 2048 \ + --seed 1 +``` + +## Example 2 - Environment decoupled from the agent + +In this example we have gone even further leveraging the flexibility offered by [Fabric](https://lightning.ai/docs/fabric). +The architecture is depicted in the following figure: + +

+ +

+ +where, differently from the previous example, we have completely decoupled the environment from the agents: the *rank-0* process will be regarded as the *Player*, which runs `M+1` independent copies of the environment (*Env-0*, ..., *Env-M*); the *rank-1*, ..., *rank-N* are the *Trainers*, which contain the agent to be optimized. Player and Trainer share data through [collectives](https://lightning.ai/docs/fabric/stable/api/generated/lightning.fabric.plugins.collectives.TorchCollective.html#lightning.fabric.plugins.collectives.TorchCollective) and thanks to Fabric's flexibility we can run Player and Trainers on different devices. +So for example: + +```bash +lightning run model --devices=3 train_fabric_decoupled.py --num-envs 4 +``` + +will spawn 3 processes, one is the Player and the others the Trainers, with the Player running 4 independent environments, where every process runs on the CPU; + +```bash +lightning run model --devices=3 train_fabric_decoupled.py --num-envs 4 --cuda +``` + +will instead run only the Trainers on the GPU. +If one wants to run both the Player and the Trainers on the GPU, then both the flags `--cuda` and `--player-on-gpu` must be provided: + +```bash +lightning run model --devices=3 train_fabric_decoupled.py --num-envs 4 --cuda --player-on-gpu +``` + +> **Warning** +> +> With this second example, there is no need for the user to provide the `accelerator` and the `strategy` to the `lightning run model` script. + +## Number of updates, environment steps and share data + +In every one of the examples above, one has that: + +- The number of total updates will be given by `args.total_timesteps / args.num_steps` +- `args.num_steps` is the number of environment interactions before the agent training step, i.e. the agent gathers `args.num_steps` experiences and uses them to update itself during the training step +- `args.share_data` controls how the data is shared between processes. 
In particular: + - In the first example, **if `args.share_data` is set** then every process will have access to the data gathered by all the other processes, effectively calling the [all_gather](https://pytorch.org/docs/stable/distributed.html#torch.distributed.all_gather) distributed function. In this way, during the training step, the agents can employ the standard [PyTorch distributed training recipe](https://pytorch.org/docs/stable/generated/torch.nn.parallel.DistributedDataParallel.html#torch.nn.parallel.DistributedDataParallel), where one can assume that before the training starts every process sees the same data, and trains the model on a disjoint subset (from process to process) of it. Otherwise, **if `args.share_data` is not set** (the default), then every process will update the model with its own local data + - In the second example, when **`args.share_data` is set** then one has the same behaviour of the first example. Instead, when **`args.share_data` is not set** then the player scatters an almost-equal-sized subset of the collected experiences to the trainers, effectively calling the [scatter](https://pytorch.org/docs/stable/distributed.html#torch.distributed.scatter) distributed function diff --git a/examples/fabric/reinforcement_learning/requirements.txt b/examples/fabric/reinforcement_learning/requirements.txt new file mode 100644 index 0000000..83bfd42 --- /dev/null +++ b/examples/fabric/reinforcement_learning/requirements.txt @@ -0,0 +1,5 @@ +gymnasium[box2d]>=0.27.1 +moviepy +lightning>=1.9.0 +torchmetrics +tensorboard diff --git a/examples/fabric/reinforcement_learning/rl/__init__.py b/examples/fabric/reinforcement_learning/rl/__init__.py new file mode 100644 index 0000000..e69de29 diff --git a/examples/fabric/reinforcement_learning/rl/agent.py b/examples/fabric/reinforcement_learning/rl/agent.py new file mode 100644 index 0000000..6f34265 --- /dev/null +++ b/examples/fabric/reinforcement_learning/rl/agent.py @@ -0,0 +1,248 @@ +import math 
def _resolve_activation(act_fun: str) -> torch.nn.Module:
    """Map an activation name (``relu`` or ``tanh``, case-insensitive) to a module instance."""
    name = act_fun.lower()
    if name == "relu":
        return torch.nn.ReLU()
    if name == "tanh":
        return torch.nn.Tanh()
    raise ValueError("Unrecognized activation function: `act_fun` must be either `relu` or `tanh`")


def _build_mlp(
    in_features: int, out_features: int, activation: torch.nn.Module, out_std: float, ortho_init: bool
) -> torch.nn.Sequential:
    """Build the ``in_features -> 64 -> 64 -> out_features`` network used for both actor and critic."""
    return torch.nn.Sequential(
        layer_init(torch.nn.Linear(in_features, 64), ortho_init=ortho_init),
        activation,
        layer_init(torch.nn.Linear(64, 64), ortho_init=ortho_init),
        activation,
        layer_init(torch.nn.Linear(64, out_features), std=out_std, ortho_init=ortho_init),
    )


def _estimate_gae(
    rewards: Tensor,
    values: Tensor,
    dones: Tensor,
    next_value: Tensor,
    next_done: Tensor,
    num_steps: int,
    gamma: float,
    gae_lambda: float,
) -> Tuple[Tensor, Tensor]:
    """Walk the rollout backwards and return ``(returns, advantages)`` computed with GAE."""
    advantages = torch.zeros_like(rewards)
    lastgaelam = 0
    for t in reversed(range(num_steps)):
        if t == num_steps - 1:
            # The last step bootstraps from the value of the observation that follows the rollout
            nextnonterminal = torch.logical_not(next_done)
            nextvalues = next_value
        else:
            nextnonterminal = torch.logical_not(dones[t + 1])
            nextvalues = values[t + 1]
        delta = rewards[t] + gamma * nextvalues * nextnonterminal - values[t]
        advantages[t] = lastgaelam = delta + gamma * gae_lambda * nextnonterminal * lastgaelam
    returns = advantages + values
    return returns, advantages


class PPOAgent(torch.nn.Module):
    """Actor-critic PPO agent for discrete action spaces, implemented as a plain ``torch.nn.Module``."""

    def __init__(self, envs: gym.vector.SyncVectorEnv, act_fun: str = "relu", ortho_init: bool = False) -> None:
        """Build the critic (one output) and the actor (``envs.single_action_space.n`` outputs).

        Raises:
            ValueError: if ``act_fun`` is neither ``relu`` nor ``tanh``.
        """
        super().__init__()
        activation = _resolve_activation(act_fun)
        in_features = math.prod(envs.single_observation_space.shape)
        self.critic = _build_mlp(in_features, 1, activation, 1.0, ortho_init)
        self.actor = _build_mlp(in_features, envs.single_action_space.n, activation, 0.01, ortho_init)

    def get_action(self, x: Tensor, action: Tensor = None) -> Tuple[Tensor, Tensor, Tensor]:
        """Return ``(action, log_prob, entropy)``; an action is sampled when ``action`` is ``None``."""
        logits = self.actor(x)
        distribution = Categorical(logits=logits)
        if action is None:
            action = distribution.sample()
        return action, distribution.log_prob(action), distribution.entropy()

    def get_greedy_action(self, x: Tensor) -> Tensor:
        """Return the index of the most probable action under the actor."""
        logits = self.actor(x)
        probs = F.softmax(logits, dim=-1)
        return torch.argmax(probs, dim=-1)

    def get_value(self, x: Tensor) -> Tensor:
        """Return the critic output for ``x``."""
        return self.critic(x)

    def get_action_and_value(self, x: Tensor, action: Tensor = None) -> Tuple[Tensor, Tensor, Tensor, Tensor]:
        """Return ``(action, log_prob, entropy, value)`` for ``x``."""
        action, log_prob, entropy = self.get_action(x, action)
        value = self.get_value(x)
        return action, log_prob, entropy, value

    def forward(self, x: Tensor, action: Tensor = None) -> Tuple[Tensor, Tensor, Tensor, Tensor]:
        """Alias of :meth:`get_action_and_value`."""
        return self.get_action_and_value(x, action)

    @torch.no_grad()
    def estimate_returns_and_advantages(
        self,
        rewards: Tensor,
        values: Tensor,
        dones: Tensor,
        next_obs: Tensor,
        next_done: Tensor,
        num_steps: int,
        gamma: float,
        gae_lambda: float,
    ) -> Tuple[Tensor, Tensor]:
        """Return ``(returns, advantages)`` for a rollout of ``num_steps`` steps, without tracking gradients.

        The critic value of ``next_obs`` (reshaped to ``(1, -1)``) bootstraps the last step.
        """
        next_value = self.get_value(next_obs).reshape(1, -1)
        return _estimate_gae(rewards, values, dones, next_value, next_done, num_steps, gamma, gae_lambda)


class PPOLightningAgent(LightningModule):
    """Actor-critic PPO agent for discrete action spaces that also owns its loss, metrics and optimizer."""

    def __init__(
        self,
        envs: gym.vector.SyncVectorEnv,
        act_fun: str = "relu",
        ortho_init: bool = False,
        vf_coef: float = 1.0,
        ent_coef: float = 0.0,
        clip_coef: float = 0.2,
        clip_vloss: bool = False,
        normalize_advantages: bool = False,
        **torchmetrics_kwargs,
    ):
        """Build the networks and the three loss-averaging metrics.

        ``torchmetrics_kwargs`` are forwarded to every ``MeanMetric``.

        Raises:
            ValueError: if ``act_fun`` is neither ``relu`` nor ``tanh``.
        """
        super().__init__()
        activation = _resolve_activation(act_fun)
        self.vf_coef = vf_coef
        self.ent_coef = ent_coef
        self.clip_coef = clip_coef
        self.clip_vloss = clip_vloss
        self.normalize_advantages = normalize_advantages
        in_features = math.prod(envs.single_observation_space.shape)
        self.critic = _build_mlp(in_features, 1, activation, 1.0, ortho_init)
        self.actor = _build_mlp(in_features, envs.single_action_space.n, activation, 0.01, ortho_init)
        self.avg_pg_loss = MeanMetric(**torchmetrics_kwargs)
        self.avg_value_loss = MeanMetric(**torchmetrics_kwargs)
        self.avg_ent_loss = MeanMetric(**torchmetrics_kwargs)

    def get_action(self, x: Tensor, action: Tensor = None) -> Tuple[Tensor, Tensor, Tensor]:
        """Return ``(action, log_prob, entropy)``; an action is sampled when ``action`` is ``None``."""
        logits = self.actor(x)
        distribution = Categorical(logits=logits)
        if action is None:
            action = distribution.sample()
        return action, distribution.log_prob(action), distribution.entropy()

    def get_greedy_action(self, x: Tensor) -> Tensor:
        """Return the index of the most probable action under the actor."""
        logits = self.actor(x)
        probs = F.softmax(logits, dim=-1)
        return torch.argmax(probs, dim=-1)

    def get_value(self, x: Tensor) -> Tensor:
        """Return the critic output for ``x``."""
        return self.critic(x)

    def get_action_and_value(self, x: Tensor, action: Tensor = None) -> Tuple[Tensor, Tensor, Tensor, Tensor]:
        """Return ``(action, log_prob, entropy, value)`` for ``x``."""
        action, log_prob, entropy = self.get_action(x, action)
        value = self.get_value(x)
        return action, log_prob, entropy, value

    def forward(self, x: Tensor, action: Tensor = None) -> Tuple[Tensor, Tensor, Tensor, Tensor]:
        """Alias of :meth:`get_action_and_value`."""
        return self.get_action_and_value(x, action)

    @torch.no_grad()
    def estimate_returns_and_advantages(
        self,
        rewards: Tensor,
        values: Tensor,
        dones: Tensor,
        next_obs: Tensor,
        next_done: Tensor,
        num_steps: int,
        gamma: float,
        gae_lambda: float,
    ) -> Tuple[Tensor, Tensor]:
        """Return ``(returns, advantages)`` for a rollout of ``num_steps`` steps, without tracking gradients.

        The critic value of ``next_obs`` (reshaped to ``(1, -1)``) bootstraps the last step.
        """
        next_value = self.get_value(next_obs).reshape(1, -1)
        return _estimate_gae(rewards, values, dones, next_value, next_done, num_steps, gamma, gae_lambda)

    def training_step(self, batch: Dict[str, Tensor]):
        """Compute the PPO loss on one mini-batch and update the running loss metrics.

        ``batch`` must provide the keys ``obs``, ``actions``, ``logprobs``, ``advantages``, ``values`` and
        ``returns``. Returns the sum of the policy, entropy and value losses.
        """
        # Get actions and values given the current observations
        _, newlogprob, entropy, newvalue = self(batch["obs"], batch["actions"].long())
        ratio = (newlogprob - batch["logprobs"]).exp()

        # Policy loss
        advantages = batch["advantages"]
        if self.normalize_advantages:
            advantages = (advantages - advantages.mean()) / (advantages.std() + 1e-8)

        # Use the (possibly normalized) local copy: passing `batch["advantages"]` here would silently
        # discard the normalization requested through `normalize_advantages`.
        pg_loss = policy_loss(advantages, ratio, self.clip_coef)

        # Value loss
        v_loss = value_loss(
            newvalue,
            batch["values"],
            batch["returns"],
            self.clip_coef,
            self.clip_vloss,
            self.vf_coef,
        )

        # Entropy loss
        ent_loss = entropy_loss(entropy, self.ent_coef)

        # Update metrics
        self.avg_pg_loss(pg_loss)
        self.avg_value_loss(v_loss)
        self.avg_ent_loss(ent_loss)

        # Overall loss
        return pg_loss + ent_loss + v_loss

    def on_train_epoch_end(self, global_step: int) -> None:
        """Log the averaged losses at ``global_step`` and reset the metrics."""
        # Log metrics and reset their internal state
        self.logger.log_metrics(
            {
                "Loss/policy_loss": self.avg_pg_loss.compute(),
                "Loss/value_loss": self.avg_value_loss.compute(),
                "Loss/entropy_loss": self.avg_ent_loss.compute(),
            },
            global_step,
        )
        self.reset_metrics()

    def reset_metrics(self):
        """Reset the three loss metrics."""
        self.avg_pg_loss.reset()
        self.avg_value_loss.reset()
        self.avg_ent_loss.reset()

    def configure_optimizers(self, lr: float):
        """Return an Adam optimizer over all parameters with learning rate ``lr`` and ``eps=1e-4``."""
        return torch.optim.Adam(self.parameters(), lr=lr, eps=1e-4)
def policy_loss(advantages: torch.Tensor, ratio: torch.Tensor, clip_coef: float) -> torch.Tensor:
    """Return the clipped surrogate policy loss: the mean of the element-wise max of the two terms."""
    pg_loss1 = -advantages * ratio
    pg_loss2 = -advantages * torch.clamp(ratio, 1 - clip_coef, 1 + clip_coef)
    return torch.max(pg_loss1, pg_loss2).mean()


def value_loss(
    new_values: Tensor,
    old_values: Tensor,
    returns: Tensor,
    clip_coef: float,
    clip_vloss: bool,
    vf_coef: float,
) -> Tensor:
    """Return ``vf_coef`` times the MSE between the value predictions and ``returns``.

    ``new_values`` is flattened first. With ``clip_vloss`` the prediction is ``old_values`` plus the change
    clamped to ``[-clip_coef, clip_coef]``.
    """
    new_values = new_values.view(-1)
    if not clip_vloss:
        values_pred = new_values
    else:
        values_pred = old_values + torch.clamp(new_values - old_values, -clip_coef, clip_coef)
    return vf_coef * F.mse_loss(values_pred, returns)


def entropy_loss(entropy: Tensor, ent_coef: float) -> Tensor:
    """Return the negated mean entropy scaled by ``ent_coef``."""
    return -entropy.mean() * ent_coef


def _add_bool_flag(parser: argparse.ArgumentParser, name: str, default: bool, help: str) -> None:
    """Register a boolean option usable as a bare flag (``--x``) or with an explicit value (``--x false``)."""
    parser.add_argument(
        name,
        type=lambda x: bool(strtobool(x)),
        default=default,
        nargs="?",
        const=True,
        help=help,
    )


def parse_args():
    """Parse the command-line options shared by the PPO example scripts and return the namespace."""
    parser = argparse.ArgumentParser()
    parser.add_argument("--exp-name", type=str, default="default", help="the name of this experiment")

    # PyTorch arguments
    parser.add_argument("--seed", type=int, default=42, help="seed of the experiment")
    _add_bool_flag(
        parser,
        "--cuda",
        False,
        "If toggled, GPU training will be used. "
        "This affects also the distributed backend used (NCCL (gpu) vs GLOO (cpu))",
    )
    _add_bool_flag(
        parser,
        "--player-on-gpu",
        False,
        "If toggled, player will run on GPU (used only by `train_fabric_decoupled.py` script). "
        "This affects also the distributed backend used (NCCL (gpu) vs GLOO (cpu))",
    )
    # The training scripts assign this value directly to `torch.backends.cudnn.deterministic`
    _add_bool_flag(
        parser,
        "--torch-deterministic",
        True,
        "value assigned to `torch.backends.cudnn.deterministic` (enabled by default)",
    )

    # Distributed arguments
    parser.add_argument("--num-envs", type=int, default=2, help="the number of parallel game environments")
    _add_bool_flag(parser, "--share-data", False, "Toggle sharing data between processes")
    parser.add_argument("--per-rank-batch-size", type=int, default=64, help="the batch size for each rank")

    # Environment arguments
    parser.add_argument("--env-id", type=str, default="CartPole-v1", help="the id of the environment")
    parser.add_argument(
        "--num-steps", type=int, default=128, help="the number of steps to run in each environment per policy rollout"
    )
    _add_bool_flag(
        parser,
        "--capture-video",
        False,
        "whether to capture videos of the agent performances (check out the `train_videos`/`test_videos` folders)",
    )

    # PPO arguments
    parser.add_argument("--total-timesteps", type=int, default=2**16, help="total timesteps of the experiments")
    parser.add_argument("--learning-rate", type=float, default=1e-3, help="the learning rate of the optimizer")
    _add_bool_flag(parser, "--anneal-lr", False, "Toggle learning rate annealing for policy and value networks")
    parser.add_argument("--gamma", type=float, default=0.99, help="the discount factor gamma")
    parser.add_argument(
        "--gae-lambda", type=float, default=0.95, help="the lambda for the general advantage estimation"
    )
    parser.add_argument("--update-epochs", type=int, default=10, help="the K epochs to update the policy")
    parser.add_argument(
        "--activation-function",
        type=str,
        default="relu",
        choices=["relu", "tanh"],
        help="The activation function of the model",
    )
    _add_bool_flag(parser, "--ortho-init", False, "Toggles the orthogonal initialization of the model")
    _add_bool_flag(parser, "--normalize-advantages", False, "Toggles advantages normalization")
    parser.add_argument("--clip-coef", type=float, default=0.2, help="the surrogate clipping coefficient")
    _add_bool_flag(
        parser,
        "--clip-vloss",
        False,
        "Toggles whether or not to use a clipped loss for the value function, as per the paper.",
    )
    parser.add_argument("--ent-coef", type=float, default=0.0, help="coefficient of the entropy")
    parser.add_argument("--vf-coef", type=float, default=1.0, help="coefficient of the value function")
    parser.add_argument("--max-grad-norm", type=float, default=0.5, help="the maximum norm for the gradient clipping")
    return parser.parse_args()


def layer_init(
    layer: torch.nn.Module,
    std: float = math.sqrt(2),
    bias_const: float = 0.0,
    ortho_init: bool = True,
):
    """Optionally re-initialize ``layer`` in place and return it.

    With ``ortho_init`` the weight gets an orthogonal init with gain ``std`` and the bias is filled with
    ``bias_const``; otherwise the layer is returned untouched.
    """
    if ortho_init:
        torch.nn.init.orthogonal_(layer.weight, std)
        torch.nn.init.constant_(layer.bias, bias_const)
    return layer


def linear_annealing(optimizer: torch.optim.Optimizer, update: int, num_updates: int, initial_lr: float):
    """Set every param group's ``lr`` to ``initial_lr * (1 - (update - 1) / num_updates)``."""
    frac = 1.0 - (update - 1.0) / num_updates
    lrnow = frac * initial_lr
    for pg in optimizer.param_groups:
        pg["lr"] = lrnow


def make_env(env_id: str, seed: int, idx: int, capture_video: bool, run_name: Optional[str] = None, prefix: str = ""):
    """Return a zero-argument factory that creates the environment ``env_id``.

    The environment is wrapped with ``RecordEpisodeStatistics``. Videos are recorded under
    ``<run_name>/<prefix>_videos`` (``videos`` without a prefix) only when ``capture_video`` is set,
    ``idx`` is 0 and ``run_name`` is given. Action and observation spaces are seeded with ``seed``.
    """

    def thunk():
        env = gym.make(env_id, render_mode="rgb_array")
        env = gym.wrappers.RecordEpisodeStatistics(env)
        if capture_video and idx == 0 and run_name is not None:
            env = gym.wrappers.RecordVideo(
                env, os.path.join(run_name, prefix + "_videos" if prefix else "videos"), disable_logger=True
            )
        env.action_space.seed(seed)
        env.observation_space.seed(seed)
        return env

    return thunk


@torch.no_grad()
def test(
    agent: Union["PPOLightningAgent", "PPOAgent"],
    device: torch.device,
    logger: "SummaryWriter",
    args: argparse.Namespace,
):
    """Play one greedy episode and log its cumulative reward as ``Test/cumulative_reward`` at step 0."""
    env = make_env(args.env_id, args.seed, 0, args.capture_video, logger.log_dir, "test")()
    try:
        done = False
        cumulative_rew = 0
        next_obs = torch.tensor(env.reset(seed=args.seed)[0], device=device)
        while not done:
            # Act greedily through the environment
            action = agent.get_greedy_action(next_obs)

            # Single environment step
            next_obs, reward, done, truncated, _ = env.step(action.cpu().numpy())
            done = done or truncated
            cumulative_rew += reward
            next_obs = torch.tensor(next_obs, device=device)
        logger.add_scalar("Test/cumulative_reward", cumulative_rew, 0)
    finally:
        # Always release the environment, even when stepping or logging raises
        env.close()


# This is an evaluation helper, not a test case: keep pytest from collecting it wherever it is imported.
test.__test__ = False
def train(
    fabric: Fabric,
    agent: PPOLightningAgent,
    optimizer: torch.optim.Optimizer,
    data: Dict[str, Tensor],
    global_step: int,
    args: argparse.Namespace,
):
    """Run ``args.update_epochs`` optimisation epochs over ``data`` in mini-batches.

    Args:
        fabric: Fabric instance used for the backward pass and gradient clipping.
        agent: agent providing ``training_step`` and ``on_train_epoch_end``.
        optimizer: optimizer stepped after every mini-batch.
        data: tensors indexed along their first dimension; ``data["obs"]`` defines the number of samples.
        global_step: step forwarded to ``agent.on_train_epoch_end`` after each epoch.
        args: reads ``share_data``, ``seed``, ``per_rank_batch_size``, ``update_epochs`` and ``max_grad_norm``.
    """
    indexes = list(range(data["obs"].shape[0]))
    if args.share_data:
        # Every rank holds the same gathered data: split the indices across ranks
        sampler = DistributedSampler(
            indexes, num_replicas=fabric.world_size, rank=fabric.global_rank, shuffle=True, seed=args.seed
        )
    else:
        # Each rank only holds its own data: shuffle locally
        sampler = RandomSampler(indexes)
    sampler = BatchSampler(sampler, batch_size=args.per_rank_batch_size, drop_last=False)

    for epoch in range(args.update_epochs):
        if args.share_data:
            # `sampler.sampler` is the wrapped DistributedSampler; update its epoch before iterating
            sampler.sampler.set_epoch(epoch)
        for batch_idxes in sampler:
            loss = agent.training_step({k: v[batch_idxes] for k, v in data.items()})
            optimizer.zero_grad(set_to_none=True)
            fabric.backward(loss)
            fabric.clip_gradients(agent, optimizer, max_norm=args.max_grad_norm)
            optimizer.step()
        agent.on_train_epoch_end(global_step)


def main(args: argparse.Namespace):
    """Train a ``PPOLightningAgent`` with Fabric, then run ``test`` on the global-zero rank.

    Each update collects ``args.num_steps`` steps from ``args.num_envs`` environments per rank, estimates
    returns and advantages, optionally gathers the rollouts from all ranks (``args.share_data``) and calls
    ``train``.
    """
    run_name = f"{args.env_id}_{args.exp_name}_{args.seed}_{int(time.time())}"
    logger = TensorBoardLogger(
        root_dir=os.path.join("logs", "fabric_logs", datetime.today().strftime("%Y-%m-%d_%H-%M-%S")), name=run_name
    )

    # Initialize Fabric
    fabric = Fabric(loggers=logger)
    rank = fabric.global_rank
    world_size = fabric.world_size
    device = fabric.device
    fabric.seed_everything(args.seed)
    torch.backends.cudnn.deterministic = args.torch_deterministic

    # Log hyperparameters
    fabric.logger.experiment.add_text(
        "hyperparameters",
        "|param|value|\n|-|-|\n%s" % ("\n".join([f"|{key}|{value}|" for key, value in vars(args).items()])),
    )

    # Environment setup: every environment gets its own seed, offset by rank and environment index
    envs = gym.vector.SyncVectorEnv(
        [
            make_env(
                args.env_id, args.seed + rank * args.num_envs + i, rank, args.capture_video, logger.log_dir, "train"
            )
            for i in range(args.num_envs)
        ]
    )
    assert isinstance(envs.single_action_space, gym.spaces.Discrete), "only discrete action space is supported"

    # Define the agent and the optimizer and setup them with Fabric
    agent: PPOLightningAgent = PPOLightningAgent(
        envs,
        act_fun=args.activation_function,
        vf_coef=args.vf_coef,
        ent_coef=args.ent_coef,
        clip_coef=args.clip_coef,
        clip_vloss=args.clip_vloss,
        ortho_init=args.ortho_init,
        normalize_advantages=args.normalize_advantages,
    )
    optimizer = agent.configure_optimizers(args.learning_rate)
    agent, optimizer = fabric.setup(agent, optimizer)

    # Player metrics
    rew_avg = torchmetrics.MeanMetric().to(device)
    ep_len_avg = torchmetrics.MeanMetric().to(device)

    # Local data: rollout buffers with leading dimensions (num_steps, num_envs)
    obs = torch.zeros((args.num_steps, args.num_envs) + envs.single_observation_space.shape, device=device)
    actions = torch.zeros((args.num_steps, args.num_envs) + envs.single_action_space.shape, device=device)
    logprobs = torch.zeros((args.num_steps, args.num_envs), device=device)
    rewards = torch.zeros((args.num_steps, args.num_envs), device=device)
    dones = torch.zeros((args.num_steps, args.num_envs), device=device)
    values = torch.zeros((args.num_steps, args.num_envs), device=device)

    # Global variables
    global_step = 0
    start_time = time.time()
    # Environment steps collected by all ranks during one rollout
    single_global_rollout = int(args.num_envs * args.num_steps * world_size)
    num_updates = args.total_timesteps // single_global_rollout

    # Get the first environment observation and start the optimization
    next_obs = torch.tensor(envs.reset(seed=args.seed)[0], device=device)
    next_done = torch.zeros(args.num_envs, device=device)
    for update in range(1, num_updates + 1):
        # Learning rate annealing
        if args.anneal_lr:
            linear_annealing(optimizer, update, num_updates, args.learning_rate)
        fabric.log("Info/learning_rate", optimizer.param_groups[0]["lr"], global_step)

        for step in range(0, args.num_steps):
            # `global_step` counts the environment steps taken by all ranks
            global_step += args.num_envs * world_size
            obs[step] = next_obs
            dones[step] = next_done

            # Sample an action given the observation received by the environment
            with torch.no_grad():
                action, logprob, _, value = agent.get_action_and_value(next_obs)
                values[step] = value.flatten()
            actions[step] = action
            logprobs[step] = logprob

            # Single environment step; a truncated episode is treated as done
            next_obs, reward, done, truncated, info = envs.step(action.cpu().numpy())
            done = torch.logical_or(torch.tensor(done), torch.tensor(truncated))
            rewards[step] = torch.tensor(reward, device=device).view(-1)
            next_obs, next_done = torch.tensor(next_obs, device=device), done.to(device)

            if "final_info" in info:
                for i, agent_final_info in enumerate(info["final_info"]):
                    if agent_final_info is not None and "episode" in agent_final_info:
                        fabric.print(
                            f"Rank-0: global_step={global_step}, reward_env_{i}={agent_final_info['episode']['r'][0]}"
                        )
                        rew_avg(agent_final_info["episode"]["r"][0])
                        ep_len_avg(agent_final_info["episode"]["l"][0])

        # Sync the metrics; NaN results are skipped
        rew_avg_reduced = rew_avg.compute()
        if not rew_avg_reduced.isnan():
            fabric.log("Rewards/rew_avg", rew_avg_reduced, global_step)
        ep_len_avg_reduced = ep_len_avg.compute()
        if not ep_len_avg_reduced.isnan():
            fabric.log("Game/ep_len_avg", ep_len_avg_reduced, global_step)
        rew_avg.reset()
        ep_len_avg.reset()

        # Estimate returns with GAE (https://arxiv.org/abs/1506.02438)
        returns, advantages = agent.estimate_returns_and_advantages(
            rewards, values, dones, next_obs, next_done, args.num_steps, args.gamma, args.gae_lambda
        )

        # Flatten the batch: merge the (num_steps, num_envs) dimensions into one
        local_data = {
            "obs": obs.reshape((-1,) + envs.single_observation_space.shape),
            "logprobs": logprobs.reshape(-1),
            "actions": actions.reshape((-1,) + envs.single_action_space.shape),
            "advantages": advantages.reshape(-1),
            "returns": returns.reshape(-1),
            "values": values.reshape(-1),
        }

        if args.share_data:
            # Gather all the tensors from all the world and reshape them
            gathered_data = fabric.all_gather(local_data)
            for k, v in gathered_data.items():
                if k == "obs":
                    gathered_data[k] = v.reshape((-1,) + envs.single_observation_space.shape)
                elif k == "actions":
                    gathered_data[k] = v.reshape((-1,) + envs.single_action_space.shape)
                else:
                    gathered_data[k] = v.reshape(-1)
        else:
            gathered_data = local_data

        # Train the agent
        train(fabric, agent, optimizer, gathered_data, global_step, args)
        fabric.log("Time/step_per_second", int(global_step / (time.time() - start_time)), global_step)

    envs.close()
    if fabric.is_global_zero:
        # `agent.module` is the agent wrapped by `fabric.setup` above
        test(agent.module, device, fabric.logger.experiment, args)


if __name__ == "__main__":
    args = parse_args()
    main(args)
@torch.no_grad()
def player(args, world_collective: TorchCollective, player_trainer_collective: TorchCollective):
    """Collect environment rollouts and hand them over to the trainer processes.

    ``main`` runs this function on global rank 0. For every update it steps the vectorized environment
    ``args.num_steps`` times, estimates returns and advantages, sends the flattened batch to the trainers
    (broadcast when ``args.share_data`` is set, scattered in chunks otherwise) and then waits for rank 1 to
    send back the training metrics and the updated, flattened parameters.

    Args:
        args: Parsed command-line namespace.
        world_collective: Collective over all processes, used to send the collected data.
        player_trainer_collective: Collective over ranks 0 and 1, used to receive metrics and weights.

    Raises:
        RuntimeError: If data is not shared and there are more trainers than collected samples.
    """
    run_name = f"{args.env_id}_{args.exp_name}_{args.seed}"
    logger = TensorBoardLogger(
        root_dir=os.path.join("logs", "fabric_decoupled_logs", datetime.today().strftime("%Y-%m-%d_%H-%M-%S")),
        name=run_name,
    )
    log_dir = logger.log_dir

    # Initialize Fabric object
    fabric = Fabric(loggers=logger, accelerator="cuda" if args.player_on_gpu else "cpu")
    device = fabric.device
    fabric.seed_everything(args.seed)
    torch.backends.cudnn.deterministic = args.torch_deterministic

    # Log hyperparameters
    logger.experiment.add_text(
        "hyperparameters",
        "|param|value|\n|-|-|\n%s" % ("\n".join([f"|{key}|{value}|" for key, value in vars(args).items()])),
    )

    # Environment setup
    envs = gym.vector.SyncVectorEnv(
        [make_env(args.env_id, args.seed + i, 0, args.capture_video, log_dir, "train") for i in range(args.num_envs)]
    )
    assert isinstance(envs.single_action_space, gym.spaces.Discrete), "only discrete action space is supported"

    # Define the agent
    agent: PPOLightningAgent = PPOLightningAgent(
        envs,
        act_fun=args.activation_function,
        vf_coef=args.vf_coef,
        ent_coef=args.ent_coef,
        clip_coef=args.clip_coef,
        clip_vloss=args.clip_vloss,
        ortho_init=args.ortho_init,
        normalize_advantages=args.normalize_advantages,
    ).to(device)
    # Receive buffer with the same size as the agent's parameters flattened into one vector
    flattened_parameters = torch.empty_like(
        torch.nn.utils.convert_parameters.parameters_to_vector(agent.parameters()), device=device
    )

    # Receive the first weights from the rank-1, a.k.a. the first of the trainers
    # In this way we are sure that before the first iteration everyone starts with the same parameters
    player_trainer_collective.broadcast(flattened_parameters, src=1)
    torch.nn.utils.convert_parameters.vector_to_parameters(flattened_parameters, agent.parameters())

    # Player metrics
    rew_avg = MeanMetric(sync_on_compute=False).to(device)
    ep_len_avg = MeanMetric(sync_on_compute=False).to(device)

    # Local data
    obs = torch.zeros((args.num_steps, args.num_envs) + envs.single_observation_space.shape).to(device)
    actions = torch.zeros((args.num_steps, args.num_envs) + envs.single_action_space.shape).to(device)
    logprobs = torch.zeros((args.num_steps, args.num_envs)).to(device)
    rewards = torch.zeros((args.num_steps, args.num_envs)).to(device)
    dones = torch.zeros((args.num_steps, args.num_envs)).to(device)
    values = torch.zeros((args.num_steps, args.num_envs)).to(device)

    # Global variables
    global_step = 0
    start_time = time.time()
    single_global_step = int(args.num_envs * args.num_steps)
    num_updates = args.total_timesteps // single_global_step
    if not args.share_data:
        if single_global_step < world_collective.world_size - 1:
            raise RuntimeError(
                "The number of trainers ({}) is greater than the available collected data ({}). ".format(
                    world_collective.world_size - 1, single_global_step
                )
                + "Consider to lower the number of trainers at least to the size of available collected data"
            )
        # Number of samples each trainer receives when the batch is scattered
        chunks_sizes = [
            len(chunk)
            for chunk in torch.tensor_split(torch.arange(single_global_step), world_collective.world_size - 1)
        ]

    # Broadcast num_updates to all the world
    update_t = torch.tensor([num_updates], device=device, dtype=torch.float32)
    world_collective.broadcast(update_t, src=0)

    # Get the first environment observation and start the optimization
    next_obs = torch.tensor(envs.reset(seed=args.seed)[0], device=device)
    next_done = torch.zeros(args.num_envs).to(device)
    for _ in range(1, num_updates + 1):
        for step in range(0, args.num_steps):
            global_step += args.num_envs
            obs[step] = next_obs
            dones[step] = next_done

            # Sample an action given the observation received by the environment
            action, logprob, _, value = agent.get_action_and_value(next_obs)
            values[step] = value.flatten()
            actions[step] = action
            logprobs[step] = logprob

            # Single environment step
            next_obs, reward, done, truncated, info = envs.step(action.cpu().numpy())
            done = torch.logical_or(torch.tensor(done), torch.tensor(truncated))
            rewards[step] = torch.tensor(reward, device=device).view(-1)
            next_obs, next_done = torch.tensor(next_obs, device=device), done.to(device)

            if "final_info" in info:
                for i, agent_final_info in enumerate(info["final_info"]):
                    if agent_final_info is not None and "episode" in agent_final_info:
                        fabric.print(
                            f"Rank-0: global_step={global_step}, reward_env_{i}={agent_final_info['episode']['r'][0]}"
                        )
                        rew_avg(agent_final_info["episode"]["r"][0])
                        ep_len_avg(agent_final_info["episode"]["l"][0])

        # Sync the metrics
        rew_avg_reduced = rew_avg.compute()
        if not rew_avg_reduced.isnan():
            fabric.log("Rewards/rew_avg", rew_avg_reduced, global_step)
        ep_len_avg_reduced = ep_len_avg.compute()
        if not ep_len_avg_reduced.isnan():
            fabric.log("Game/ep_len_avg", ep_len_avg_reduced, global_step)
        rew_avg.reset()
        ep_len_avg.reset()

        # Estimate returns with GAE (https://arxiv.org/abs/1506.02438)
        returns, advantages = agent.estimate_returns_and_advantages(
            rewards, values, dones, next_obs, next_done, args.num_steps, args.gamma, args.gae_lambda
        )

        # Flatten the batch
        local_data = {
            "obs": obs.reshape((-1,) + envs.single_observation_space.shape),
            "logprobs": logprobs.reshape(-1),
            "actions": actions.reshape((-1,) + envs.single_action_space.shape),
            "advantages": advantages.reshape(-1),
            "returns": returns.reshape(-1),
            "values": values.reshape(-1),
        }
        if not args.player_on_gpu and args.cuda:
            # ``Tensor.pin_memory()`` returns a new tensor: store it back, otherwise the call has no effect
            # NOTE(review): the batch is sent below through object collectives; confirm that the pinned
            # allocation is what the trainers actually benefit from
            local_data = {k: v.pin_memory() for k, v in local_data.items()}

        # Send data to the training agents
        if args.share_data:
            world_collective.broadcast_object_list([local_data], src=0)
        else:
            # Split data in an even way, when possible
            perm = torch.randperm(single_global_step, device=device)
            chunks = [{} for _ in range(world_collective.world_size - 1)]
            for k, v in local_data.items():
                chunked_local_data = v[perm].split(chunks_sizes)
                for i in range(len(chunks)):
                    chunks[i][k] = chunked_local_data[i]

            # The leading ``None`` is the (unused) slot of the player itself
            world_collective.scatter_object_list([None], [None] + chunks, src=0)

        # Gather metrics from the trainers to be plotted
        metrics = [None]
        player_trainer_collective.broadcast_object_list(metrics, src=1)

        # Wait the trainers to finish
        player_trainer_collective.broadcast(flattened_parameters, src=1)

        # Convert back the parameters
        torch.nn.utils.convert_parameters.vector_to_parameters(flattened_parameters, agent.parameters())

        fabric.log_dict(metrics[0], global_step)
        fabric.log_dict({"Time/step_per_second": int(global_step / (time.time() - start_time))}, global_step)

    # Tell the trainers to stop: they return as soon as they receive ``-1`` instead of a batch
    if args.share_data:
        world_collective.broadcast_object_list([-1], src=0)
    else:
        world_collective.scatter_object_list([None], [None] + [-1] * (world_collective.world_size - 1), src=0)
    envs.close()
    test(agent, device, fabric.logger.experiment, args)


def trainer(
    args,
    world_collective: TorchCollective,
    player_trainer_collective: TorchCollective,
    optimization_pg: CollectibleGroup,
):
    """Optimize the agent on the data received from the player until the stop signal arrives.

    ``main`` runs this function on every global rank other than 0. Each iteration receives a batch from
    rank 0, runs ``args.update_epochs`` epochs of mini-batch updates and, on global rank 1, sends the
    metrics and the flattened updated parameters back to the player. The function returns when the
    received object is ``-1``.

    Args:
        args: Parsed command-line namespace.
        world_collective: Collective over all processes, used to receive the collected data.
        player_trainer_collective: Collective over ranks 0 and 1, used to send metrics and weights.
        optimization_pg: Process group passed to ``DDPStrategy`` and to the agent.
    """
    global_rank = world_collective.rank
    # Rank and world size as seen among the trainers only (the player is excluded)
    group_rank = global_rank - 1
    group_world_size = world_collective.world_size - 1

    # Initialize Fabric
    fabric = Fabric(strategy=DDPStrategy(process_group=optimization_pg), accelerator="cuda" if args.cuda else "cpu")
    device = fabric.device
    fabric.seed_everything(args.seed)
    torch.backends.cudnn.deterministic = args.torch_deterministic

    # Environment setup
    envs = gym.vector.SyncVectorEnv([make_env(args.env_id, 0, 0, False, None)])
    assert isinstance(envs.single_action_space, gym.spaces.Discrete), "only discrete action space is supported"

    # Define the agent and the optimizer and setup them with Fabric
    agent: PPOLightningAgent = PPOLightningAgent(
        envs,
        act_fun=args.activation_function,
        vf_coef=args.vf_coef,
        ent_coef=args.ent_coef,
        clip_coef=args.clip_coef,
        clip_vloss=args.clip_vloss,
        ortho_init=args.ortho_init,
        normalize_advantages=args.normalize_advantages,
        process_group=optimization_pg,
    )
    optimizer = agent.configure_optimizers(args.learning_rate)
    agent, optimizer = fabric.setup(agent, optimizer)

    # Send weights to rank-0, a.k.a. the player
    if global_rank == 1:
        player_trainer_collective.broadcast(
            torch.nn.utils.convert_parameters.parameters_to_vector(agent.parameters()), src=1
        )

    # Receive maximum number of updates from the player
    update = 0
    num_updates = torch.zeros(1, device=device)
    world_collective.broadcast(num_updates, src=0)
    num_updates = num_updates.item()

    # Start training
    while True:
        # Wait for data
        data = [None]
        if args.share_data:
            world_collective.broadcast_object_list(data, src=0)
        else:
            world_collective.scatter_object_list(data, [None for _ in range(world_collective.world_size)], src=0)
        data = data[0]
        if data == -1:
            return

        # Metrics dict to be sent to the player
        if group_rank == 0:
            metrics = {}

        # Learning rate annealing
        if args.anneal_lr:
            linear_annealing(optimizer, update, num_updates, args.learning_rate)
        if group_rank == 0:
            metrics["Info/learning_rate"] = optimizer.param_groups[0]["lr"]
        update += 1

        indexes = list(range(data["obs"].shape[0]))
        if args.share_data:
            # Every trainer holds the full batch: each one samples its own shard of the indexes
            sampler = DistributedSampler(
                indexes, num_replicas=group_world_size, rank=group_rank, shuffle=True, seed=args.seed, drop_last=False
            )
        else:
            sampler = RandomSampler(indexes)
        sampler = BatchSampler(sampler, batch_size=args.per_rank_batch_size, drop_last=False)

        # The Join context is needed because there can be the possibility
        # that some ranks receive less data
        with Join([agent._forward_module]) if not args.share_data else nullcontext():
            for epoch in range(args.update_epochs):
                if args.share_data:
                    sampler.sampler.set_epoch(epoch)
                for batch_idxes in sampler:
                    loss = agent.training_step({k: v[batch_idxes].to(device) for k, v in data.items()})
                    optimizer.zero_grad(set_to_none=True)
                    fabric.backward(loss)
                    fabric.clip_gradients(agent, optimizer, max_norm=args.max_grad_norm)
                    optimizer.step()

        # Sync metrics
        avg_pg_loss = agent.avg_pg_loss.compute()
        avg_value_loss = agent.avg_value_loss.compute()
        avg_ent_loss = agent.avg_ent_loss.compute()
        agent.reset_metrics()

        # Send updated weights to the player
        # (global rank 1 is the trainer with ``group_rank == 0``, i.e. the one that created ``metrics``)
        if global_rank == 1:
            metrics["Loss/policy_loss"] = avg_pg_loss
            metrics["Loss/value_loss"] = avg_value_loss
            metrics["Loss/entropy_loss"] = avg_ent_loss
            player_trainer_collective.broadcast_object_list(
                [metrics], src=1
            )  # Broadcast metrics: fake send with object list between rank-0 and rank-1
            player_trainer_collective.broadcast(
                torch.nn.utils.convert_parameters.parameters_to_vector(agent.parameters()), src=1
            )


def main(args: argparse.Namespace):
    """Create the process groups and dispatch to ``player`` (rank 0) or ``trainer`` (all other ranks)."""
    world_collective = TorchCollective()
    player_trainer_collective = TorchCollective()
    world_collective.setup(backend="nccl" if args.player_on_gpu and args.cuda else "gloo")

    # Create a global group, assigning it to the collective: used by the player to exchange
    # collected experiences with the trainers
    world_collective.create_group()
    global_rank = world_collective.rank

    # Create a group between rank-0 (player) and rank-1 (trainer), assigning it to the collective:
    # used by rank-1 to send metrics to be tracked by the rank-0 at the end of a training episode
    player_trainer_collective.create_group(ranks=[0, 1])

    # Create a new group, without assigning it to the collective: in this way the trainers can
    # still communicate with the player through the global group, but they can optimize the agent
    # between themselves
    optimization_pg = world_collective.new_group(ranks=list(range(1, world_collective.world_size)))
    if global_rank == 0:
        player(args, world_collective, player_trainer_collective)
    else:
        trainer(args, world_collective, player_trainer_collective, optimization_pg)


if __name__ == "__main__":
    args = parse_args()
    main(args)
def train(
    agent: PPOAgent,
    optimizer: torch.optim.Optimizer,
    data: Dict[str, Tensor],
    logger: SummaryWriter,
    global_step: int,
    args: argparse.Namespace,
):
    """Run ``args.update_epochs`` epochs of PPO mini-batch updates on ``data``.

    Args:
        agent: The (DDP-wrapped) agent; called as ``agent(obs, actions)``.
        optimizer: Optimizer over the agent parameters.
        data: Flattened rollout tensors keyed by ``obs``, ``actions``, ``logprobs``, ``advantages``,
            ``returns`` and ``values``.
        logger: TensorBoard writer, or ``None`` on the ranks that do not log.
        global_step: Step under which the losses are logged.
        args: Parsed command-line namespace.
    """
    indexes = list(range(data["obs"].shape[0]))
    if args.share_data:
        sampler = DistributedSampler(
            indexes,
            num_replicas=distributed.get_world_size(),
            rank=distributed.get_rank(),
            shuffle=True,
            seed=args.seed,
        )
    else:
        sampler = RandomSampler(indexes)
    sampler = BatchSampler(sampler, batch_size=args.per_rank_batch_size, drop_last=False)
    # Running sums of [policy, value, entropy] losses
    per_epoch_losses = torch.tensor([0.0, 0.0, 0.0], device=data["obs"].device)
    # Cast the actions once instead of converting the whole tensor again for every mini-batch
    long_actions = data["actions"].long()
    for epoch in range(args.update_epochs):
        if args.share_data:
            sampler.sampler.set_epoch(epoch)
        for batch_idxes in sampler:
            _, newlogprob, entropy, newvalue = agent(data["obs"][batch_idxes], long_actions[batch_idxes])
            logratio = newlogprob - data["logprobs"][batch_idxes]
            ratio = logratio.exp()

            advantages = data["advantages"][batch_idxes]
            if args.normalize_advantages:
                advantages = (advantages - advantages.mean()) / (advantages.std() + 1e-8)

            # Policy loss
            pg_loss = policy_loss(advantages, ratio, args.clip_coef)
            per_epoch_losses[0] += pg_loss.detach()

            # Value loss
            v_loss = value_loss(
                newvalue,
                data["values"][batch_idxes],
                data["returns"][batch_idxes],
                args.clip_coef,
                args.clip_vloss,
                args.vf_coef,
            )
            per_epoch_losses[1] += v_loss.detach()

            # Entropy loss
            ent_loss = entropy_loss(entropy, args.ent_coef)
            per_epoch_losses[2] += ent_loss.detach()

            # Overall loss
            loss = pg_loss + ent_loss + v_loss

            optimizer.zero_grad(set_to_none=True)
            loss.backward()
            nn.utils.clip_grad_norm_(agent.parameters(), args.max_grad_norm)
            optimizer.step()

        # Log
        # NOTE(review): placed at epoch level because the accumulator is divided by the number of batches
        # of a single epoch and zeroed right after; confirm against the original indentation
        distributed.reduce(per_epoch_losses, dst=0)
        if logger is not None:
            per_epoch_losses = per_epoch_losses / (len(sampler) * distributed.get_world_size())
            logger.add_scalar("Loss/policy_loss", per_epoch_losses[0], global_step)
            logger.add_scalar("Loss/value_loss", per_epoch_losses[1], global_step)
            logger.add_scalar("Loss/entropy_loss", per_epoch_losses[2], global_step)
        per_epoch_losses.fill_(0)


def main(args: argparse.Namespace):
    """Train a PPO agent with plain ``torch.distributed`` + ``DistributedDataParallel``.

    Reads ``LOCAL_RANK``, ``RANK`` and ``WORLD_SIZE`` from the environment, so it has to be started by a
    launcher that sets them (the module docstring uses ``torchrun``). Only global rank 0 owns a
    ``SummaryWriter``, prints episode results and runs the final ``test``.
    """
    # Init distributed environment
    is_cuda_available = torch.cuda.is_available() and args.cuda
    backend = "nccl" if is_cuda_available else "gloo"
    local_rank = int(os.environ["LOCAL_RANK"])
    global_rank = int(os.environ["RANK"])
    world_size = int(os.environ["WORLD_SIZE"])
    if is_cuda_available:
        torch.cuda.set_device(local_rank)
    device = torch.device(f"cuda:{local_rank}" if is_cuda_available else "cpu")
    distributed.init_process_group(backend=backend)

    # Seed everything
    random.seed(args.seed)
    torch.manual_seed(args.seed)
    torch.cuda.manual_seed_all(args.seed)
    torch.backends.cudnn.deterministic = args.torch_deterministic

    # Logger
    log_dir = None
    logger = None
    run_name = f"{args.env_id}_{args.exp_name}_{args.seed}_{int(time.time())}"
    if global_rank == 0:
        log_dir = os.path.join("logs", "torch_logs", datetime.today().strftime("%Y-%m-%d_%H-%M-%S"), run_name)
        logger = SummaryWriter(log_dir=log_dir)

    # Log hyperparameters
    if global_rank == 0:
        logger.add_text(
            "hyperparameters",
            "|param|value|\n|-|-|\n%s" % ("\n".join([f"|{key}|{value}|" for key, value in vars(args).items()])),
        )

    # Environment setup
    envs = gym.vector.SyncVectorEnv(
        [
            make_env(
                args.env_id,
                # Distinct seed for every environment of every rank
                args.seed + global_rank * args.num_envs + i,
                global_rank,
                args.capture_video,
                # ``log_dir`` is the writer's directory on rank 0 and ``None`` everywhere else
                log_dir,
                "train",
            )
            for i in range(args.num_envs)
        ]
    )
    assert isinstance(envs.single_action_space, gym.spaces.Discrete), "only discrete action space is supported"

    # Define the agent and the optimizer and setup them with DistributedDataParallel
    agent: PPOAgent = PPOAgent(envs, act_fun=args.activation_function, ortho_init=args.ortho_init).to(device)
    agent = DistributedDataParallel(
        agent,
        device_ids=[local_rank] if is_cuda_available else None,
        output_device=local_rank if is_cuda_available else None,
    )
    optimizer = optim.Adam(agent.parameters(), lr=args.learning_rate, eps=1e-4)

    # Local data
    obs = torch.zeros((args.num_steps, args.num_envs) + envs.single_observation_space.shape, device=device)
    actions = torch.zeros((args.num_steps, args.num_envs) + envs.single_action_space.shape, device=device)
    logprobs = torch.zeros((args.num_steps, args.num_envs), device=device)
    rewards = torch.zeros((args.num_steps, args.num_envs), device=device)
    dones = torch.zeros((args.num_steps, args.num_envs), device=device)
    values = torch.zeros((args.num_steps, args.num_envs), device=device)
    local_rew = 0.0
    local_ep_len = 0.0
    local_num_episodes = 0.0

    # Global variables
    global_step = 0
    start_time = time.time()
    single_global_step = int(args.num_envs * args.num_steps * world_size)
    num_updates = args.total_timesteps // single_global_step

    # Get the first environment observation and start the optimization
    next_obs = torch.tensor(envs.reset(seed=args.seed)[0], device=device)
    next_done = torch.zeros(args.num_envs, device=device)
    for update in range(1, num_updates + 1):
        # Learning rate annealing
        if args.anneal_lr:
            linear_annealing(optimizer, update, num_updates, args.learning_rate)
        if global_rank == 0:
            logger.add_scalar("Info/learning_rate", optimizer.param_groups[0]["lr"], global_step)

        for step in range(0, args.num_steps):
            global_step += args.num_envs * world_size
            obs[step] = next_obs
            dones[step] = next_done

            # Sample an action given the observation received by the environment
            with torch.no_grad():
                action, logprob, _, value = agent(next_obs)
                values[step] = value.flatten()
            actions[step] = action
            logprobs[step] = logprob

            # Single environment step
            next_obs, reward, done, truncated, info = envs.step(action.cpu().numpy())
            done = torch.logical_or(torch.tensor(done), torch.tensor(truncated))
            rewards[step] = torch.tensor(reward, device=device).view(-1)
            next_obs, next_done = torch.tensor(next_obs, device=device), done.to(device)

            if "final_info" in info:
                for i, agent_final_info in enumerate(info["final_info"]):
                    if agent_final_info is not None and "episode" in agent_final_info:
                        if global_rank == 0:
                            print(
                                f"Rank-0: global_step={global_step}, "
                                f"reward_env_{i}={agent_final_info['episode']['r'][0]}"
                            )
                        local_num_episodes += 1
                        local_rew += agent_final_info["episode"]["r"][0]
                        local_ep_len += agent_final_info["episode"]["l"][0]

        # Sync the metrics
        global_stats = torch.tensor([local_rew, local_ep_len, local_num_episodes], device=device, dtype=torch.float32)
        distributed.reduce(global_stats, dst=0)
        # Skip logging when no episode finished during this update (avoids a division by zero)
        if global_rank == 0 and global_stats[2] != 0.0:
            logger.add_scalar("Rewards/rew_avg", global_stats[0] / global_stats[2], global_step)
            logger.add_scalar("Game/ep_len_avg", global_stats[1] / global_stats[2], global_step)

        # Reset metrics
        local_rew = 0
        local_ep_len = 0
        local_num_episodes = 0

        # Estimate returns with GAE (https://arxiv.org/abs/1506.02438)
        returns, advantages = agent.module.estimate_returns_and_advantages(
            rewards, values, dones, next_obs, next_done, args.num_steps, args.gamma, args.gae_lambda
        )

        # Flatten the batch
        local_data = {
            "obs": obs.reshape((-1,) + envs.single_observation_space.shape),
            "logprobs": logprobs.reshape(-1),
            "actions": actions.reshape((-1,) + envs.single_action_space.shape),
            "advantages": advantages.reshape(-1),
            "returns": returns.reshape(-1),
            "values": values.reshape(-1),
        }

        if args.share_data:
            # Gather all the tensors from all the world, concat and reshape them
            gathered_data = [None for _ in range(world_size)]
            distributed.all_gather_object(gathered_data, local_data)
            processed_gathered_data = gathered_data[0]
            for i in range(1, len(gathered_data)):
                for k in processed_gathered_data:
                    processed_gathered_data[k] = torch.cat(
                        (processed_gathered_data[k].to(device), gathered_data[i][k].to(device)), dim=0
                    )
        else:
            processed_gathered_data = local_data

        # Train the agent
        train(agent, optimizer, processed_gathered_data, logger, global_step, args)
        if global_rank == 0:
            logger.add_scalar("Time/step_per_second", int(global_step / (time.time() - start_time)), global_step)

    envs.close()
    if global_rank == 0:
        test(agent.module, device, logger, args)


if __name__ == "__main__":
    args = parse_args()
    main(args)
+ +```bash +# CPU +python autoencoder.py + +# GPUs (any number) +python autoencoder.py --trainer.accelerator 'gpu' --trainer.devices 2 + +# Distributed Data Parallel (DDP) +python autoencoder.py --trainer.accelerator 'gpu' --trainer.devices 2 --trainer.strategy 'ddp' +``` + +______________________________________________________________________ + +### Backbone Image Classifier + +This script shows you how to implement a `LightningModule` as a system. +A system describes a `LightningModule` which takes a single `torch.nn.Module` which makes exporting to production simpler. + +```bash +# CPU +python backbone_image_classifier.py + +# GPUs (any number) +python backbone_image_classifier.py --trainer.accelerator 'gpu' --trainer.devices 2 + +# Distributed Data Parallel (DDP) +python backbone_image_classifier.py --trainer.accelerator 'gpu' --trainer.devices 2 --trainer.strategy 'ddp' +``` + +______________________________________________________________________ + +### Transformers + +This example contains a simple training loop for next-word prediction with a [Transformer model](https://arxiv.org/abs/1706.03762) on a subset of the [WikiText2](https://www.salesforce.com/products/einstein/ai-research/the-wikitext-dependency-language-modeling-dataset/) dataset. + +```bash +python transformer.py +``` + +______________________________________________________________________ + +### PyTorch Profiler + +This script shows you how to activate the [PyTorch Profiler](https://github.com/pytorch/kineto) with Lightning. + +```bash +python profiler_example.py +``` diff --git a/examples/pytorch/basics/autoencoder.py b/examples/pytorch/basics/autoencoder.py new file mode 100644 index 0000000..006397f --- /dev/null +++ b/examples/pytorch/basics/autoencoder.py @@ -0,0 +1,192 @@ +# Copyright The Lightning AI team. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. 
class ImageSampler(callbacks.Callback):
    """Callback that saves a grid of reconstructed validation images at the end of every training epoch."""

    def __init__(
        self,
        num_samples: int = 3,
        nrow: int = 8,
        padding: int = 2,
        normalize: bool = True,
        norm_range: Optional[Tuple[int, int]] = None,
        scale_each: bool = False,
        pad_value: int = 0,
    ) -> None:
        """
        Args:
            num_samples: Number of images displayed in the grid. Default: ``3``.
            nrow: Number of images displayed in each row of the grid.
                The final grid size is ``(B / nrow, nrow)``. Default: ``8``.
            padding: Amount of padding. Default: ``2``.
            normalize: If ``True``, shift the image to the range (0, 1),
                by the min and max values specified by ``norm_range``. Default: ``True``.
            norm_range: Tuple (min, max) where min and max are numbers,
                then these numbers are used to normalize the image. By default, min and max
                are computed from the tensor.
            scale_each: If ``True``, scale each image in the batch of
                images separately rather than the (min, max) over all images. Default: ``False``.
            pad_value: Value for the padded pixels. Default: ``0``.

        Raises:
            ModuleNotFoundError: If ``torchvision`` is not installed.
        """
        if not _TORCHVISION_AVAILABLE:  # pragma: no cover
            raise ModuleNotFoundError("You want to use `torchvision` which is not installed yet.")

        super().__init__()
        self.num_samples = num_samples
        self.nrow = nrow
        self.padding = padding
        self.normalize = normalize
        self.norm_range = norm_range
        self.scale_each = scale_each
        self.pad_value = pad_value

    def _to_grid(self, images):
        """Arrange ``images`` into a single grid image using the options given to the constructor."""
        return torchvision.utils.make_grid(
            tensor=images,
            nrow=self.nrow,
            padding=self.padding,
            normalize=self.normalize,
            value_range=self.norm_range,
            scale_each=self.scale_each,
            pad_value=self.pad_value,
        )

    @rank_zero_only
    def on_train_epoch_end(self, trainer: Trainer, pl_module: LightningModule) -> None:
        """Reconstruct the first ``num_samples`` validation images and save them as PNG grids."""
        if not _TORCHVISION_AVAILABLE:
            return

        images, _ = next(iter(DataLoader(trainer.datamodule.mnist_val, batch_size=self.num_samples)))
        images_flattened = images.view(images.size(0), -1)

        # generate images
        # Remember the current mode and restore it even if the forward pass raises, instead of
        # unconditionally forcing the module into training mode
        was_training = pl_module.training
        with torch.no_grad():
            pl_module.eval()
            try:
                images_generated = pl_module(images_flattened.to(pl_module.device))
            finally:
                pl_module.train(was_training)

        # The original images do not change between epochs: save them only once
        if trainer.current_epoch == 0:
            save_image(self._to_grid(images), f"grid_ori_{trainer.current_epoch}.png")
        save_image(self._to_grid(images_generated.reshape(images.shape)), f"grid_generated_{trainer.current_epoch}.png")


class LitAutoEncoder(LightningModule):
    """
    >>> LitAutoEncoder()  # doctest: +ELLIPSIS +NORMALIZE_WHITESPACE
    LitAutoEncoder(
      (encoder): ...
      (decoder): ...
    )
    """

    def __init__(self, hidden_dim: int = 64, learning_rate=10e-3):
        super().__init__()
        self.save_hyperparameters()
        # 28 * 28 flattened pixels -> hidden_dim -> 3-dimensional code, and back
        self.encoder = nn.Sequential(nn.Linear(28 * 28, hidden_dim), nn.ReLU(), nn.Linear(hidden_dim, 3))
        self.decoder = nn.Sequential(nn.Linear(3, hidden_dim), nn.ReLU(), nn.Linear(hidden_dim, 28 * 28))

    def forward(self, x):
        """Encode ``x`` and return its reconstruction."""
        z = self.encoder(x)
        return self.decoder(z)

    def training_step(self, batch, batch_idx):
        return self._common_step(batch, batch_idx, "train")

    def validation_step(self, batch, batch_idx):
        self._common_step(batch, batch_idx, "val")

    def test_step(self, batch, batch_idx):
        self._common_step(batch, batch_idx, "test")

    def predict_step(self, batch, batch_idx, dataloader_idx=None):
        x = self._prepare_batch(batch)
        return self(x)

    def configure_optimizers(self):
        return torch.optim.Adam(self.parameters(), lr=self.hparams.learning_rate)

    def _prepare_batch(self, batch):
        """Drop the labels and flatten every image to a vector."""
        x, _ = batch
        return x.view(x.size(0), -1)

    def _common_step(self, batch, batch_idx, stage: str):
        """Compute the reconstruction MSE and log it as ``{stage}_loss``."""
        x = self._prepare_batch(batch)
        loss = F.mse_loss(x, self(x))
        self.log(f"{stage}_loss", loss, on_step=True)
        return loss


class MyDataModule(LightningDataModule):
    """MNIST data module with a 55000/5000 train/validation split of the training set."""

    def __init__(self, batch_size: int = 32):
        super().__init__()
        dataset = MNIST(DATASETS_PATH, train=True, download=True, transform=transforms.ToTensor())
        self.mnist_test = MNIST(DATASETS_PATH, train=False, download=True, transform=transforms.ToTensor())
        self.mnist_train, self.mnist_val = random_split(dataset, [55000, 5000])
        self.batch_size = batch_size

    def train_dataloader(self):
        return DataLoader(self.mnist_train, batch_size=self.batch_size)

    def val_dataloader(self):
        return DataLoader(self.mnist_val, batch_size=self.batch_size)

    def test_dataloader(self):
        return DataLoader(self.mnist_test, batch_size=self.batch_size)

    def predict_dataloader(self):
        return DataLoader(self.mnist_test, batch_size=self.batch_size)


def cli_main():
    """Build the CLI without auto-running it, then fit, test and predict with the best checkpoint."""
    cli = LightningCLI(
        LitAutoEncoder,
        MyDataModule,
        seed_everything_default=1234,
        run=False,  # used to de-activate automatic fitting.
        trainer_defaults={"callbacks": ImageSampler(), "max_epochs": 10},
        save_config_kwargs={"overwrite": True},
    )
    cli.trainer.fit(cli.model, datamodule=cli.datamodule)
    cli.trainer.test(ckpt_path="best", datamodule=cli.datamodule)
    predictions = cli.trainer.predict(ckpt_path="best", datamodule=cli.datamodule)
    print(predictions[0])


if __name__ == "__main__":
    cli_lightning_logo()
    cli_main()
class Backbone(torch.nn.Module):
    """
    >>> Backbone()  # doctest: +ELLIPSIS +NORMALIZE_WHITESPACE
    Backbone(
      (l1): Linear(...)
      (l2): Linear(...)
    )
    """

    def __init__(self, hidden_dim=128):
        super().__init__()
        # 28 * 28 flattened pixels -> hidden_dim -> 10 outputs
        self.l1 = torch.nn.Linear(28 * 28, hidden_dim)
        self.l2 = torch.nn.Linear(hidden_dim, 10)

    def forward(self, x):
        # Flatten everything but the batch dimension, then apply both layers, each followed by a ReLU
        flat = x.view(x.size(0), -1)
        hidden = torch.relu(self.l1(flat))
        return torch.relu(self.l2(hidden))


class LitClassifier(LightningModule):
    """
    >>> LitClassifier(Backbone())  # doctest: +ELLIPSIS +NORMALIZE_WHITESPACE
    LitClassifier(
      (backbone): ...
    )
    """

    def __init__(self, backbone: Optional[Backbone] = None, learning_rate: float = 0.0001):
        super().__init__()
        self.save_hyperparameters(ignore=["backbone"])
        # Fall back to a default backbone when none is given
        self.backbone = Backbone() if backbone is None else backbone

    def forward(self, x):
        # use forward for inference/predictions
        return self.backbone(x)

    def _cross_entropy(self, batch):
        # Shared by the train/validation/test steps: cross-entropy between predictions and targets
        inputs, targets = batch
        return F.cross_entropy(self(inputs), targets)

    def training_step(self, batch, batch_idx):
        train_loss = self._cross_entropy(batch)
        self.log("train_loss", train_loss, on_epoch=True)
        return train_loss

    def validation_step(self, batch, batch_idx):
        self.log("valid_loss", self._cross_entropy(batch), on_step=True)

    def test_step(self, batch, batch_idx):
        self.log("test_loss", self._cross_entropy(batch))

    def predict_step(self, batch, batch_idx, dataloader_idx=None):
        # The batch must unpack into exactly (inputs, targets); the targets are not used
        inputs, _ = batch
        return self(inputs)

    def configure_optimizers(self):
        # self.hparams available because we called self.save_hyperparameters()
        lr = self.hparams.learning_rate
        return torch.optim.Adam(self.parameters(), lr=lr)


class MyDataModule(LightningDataModule):
    # MNIST data module: the training set is split 55000/5000 into train/validation subsets

    def __init__(self, batch_size: int = 32):
        super().__init__()
        to_tensor = transforms.ToTensor()
        full_train = MNIST(DATASETS_PATH, train=True, download=True, transform=to_tensor)
        self.mnist_test = MNIST(DATASETS_PATH, train=False, download=True, transform=transforms.ToTensor())
        self.mnist_train, self.mnist_val = random_split(full_train, [55000, 5000])
        self.batch_size = batch_size

    def _loader(self, dataset):
        # Every split uses the same batch size and default loader options
        return DataLoader(dataset, batch_size=self.batch_size)

    def train_dataloader(self):
        return self._loader(self.mnist_train)

    def val_dataloader(self):
        return self._loader(self.mnist_val)

    def test_dataloader(self):
        return self._loader(self.mnist_test)

    def predict_dataloader(self):
        return self._loader(self.mnist_test)


def cli_main():
    # Build the CLI without auto-running it, then fit, test and predict with the best checkpoint
    cli = LightningCLI(
        LitClassifier,
        MyDataModule,
        seed_everything_default=1234,
        save_config_kwargs={"overwrite": True},
        run=False,
    )
    runner, datamodule = cli.trainer, cli.datamodule
    runner.fit(cli.model, datamodule=datamodule)
    runner.test(ckpt_path="best", datamodule=datamodule)
    predictions = runner.predict(ckpt_path="best", datamodule=datamodule)
    print(predictions[0])


if __name__ == "__main__":
    cli_lightning_logo()
    cli_main()
tensorboard --logdir={FOLDER} +""" + +from os import path + +import torch +import torchvision +import torchvision.transforms as T + +from lightning.pytorch import cli_lightning_logo, LightningDataModule, LightningModule +from lightning.pytorch.cli import LightningCLI +from lightning.pytorch.profilers.pytorch import PyTorchProfiler +from lightning.pytorch.utilities.model_helpers import get_torchvision_model + +DATASETS_PATH = path.join(path.dirname(__file__), "..", "..", "Datasets") + + +class ModelToProfile(LightningModule): + def __init__(self, name: str = "resnet18", automatic_optimization: bool = True): + super().__init__() + self.model = get_torchvision_model(name, weights="DEFAULT") + self.criterion = torch.nn.CrossEntropyLoss() + self.automatic_optimization = automatic_optimization + self.training_step = ( + self.automatic_optimization_training_step + if automatic_optimization + else self.manual_optimization_training_step + ) + + def automatic_optimization_training_step(self, batch, batch_idx): + inputs, labels = batch + outputs = self.model(inputs) + loss = self.criterion(outputs, labels) + self.log("train_loss", loss) + return loss + + def manual_optimization_training_step(self, batch, batch_idx): + opt = self.optimizers() + opt.zero_grad() + inputs, labels = batch + outputs = self.model(inputs) + loss = self.criterion(outputs, labels) + self.log("train_loss", loss) + self.manual_backward(loss) + opt.step() + + def validation_step(self, batch, batch_idx): + inputs, labels = batch + outputs = self.model(inputs) + loss = self.criterion(outputs, labels) + self.log("val_loss", loss) + + def predict_step(self, batch, batch_idx, dataloader_idx: int = None): + inputs = batch[0] + return self.model(inputs) + + def configure_optimizers(self): + return torch.optim.SGD(self.parameters(), lr=0.001, momentum=0.9) + + +class CIFAR10DataModule(LightningDataModule): + transform = T.Compose([T.Resize(256), T.CenterCrop(224), T.ToTensor()]) + + def train_dataloader(self, 
*args, **kwargs): + trainset = torchvision.datasets.CIFAR10(root=DATASETS_PATH, train=True, download=True, transform=self.transform) + return torch.utils.data.DataLoader(trainset, batch_size=2, shuffle=True, num_workers=0) + + def val_dataloader(self, *args, **kwargs): + valset = torchvision.datasets.CIFAR10(root=DATASETS_PATH, train=False, download=True, transform=self.transform) + return torch.utils.data.DataLoader(valset, batch_size=2, shuffle=True, num_workers=0) + + +def cli_main(): + cli = LightningCLI( + ModelToProfile, + CIFAR10DataModule, + save_config_kwargs={"overwrite": True}, + trainer_defaults={ + "profiler": PyTorchProfiler(), + "max_epochs": 1, + "limit_train_batches": 15, + "limit_val_batches": 15, + "accelerator": "gpu", + }, + run=False, + ) + cli.trainer.fit(cli.model, datamodule=cli.datamodule) + + +if __name__ == "__main__": + cli_lightning_logo() + cli_main() diff --git a/examples/pytorch/basics/transformer.py b/examples/pytorch/basics/transformer.py new file mode 100644 index 0000000..dbd990d --- /dev/null +++ b/examples/pytorch/basics/transformer.py @@ -0,0 +1,62 @@ +import torch +import torch.nn.functional as F +from torch.utils.data import DataLoader, random_split + +import lightning as L +from lightning.pytorch.demos import Transformer, WikiText2 + + +class LanguageModel(L.LightningModule): + def __init__(self, vocab_size): + super().__init__() + self.model = Transformer(vocab_size=vocab_size) + + def training_step(self, batch, batch_idx): + input, target = batch + output = self.model(input, target) + loss = F.nll_loss(output, target.view(-1)) + self.log("train_loss", loss, prog_bar=True) + return loss + + def validation_step(self, batch, batch_idx): + input, target = batch + output = self.model(input, target) + loss = F.nll_loss(output, target.view(-1)) + self.log("val_loss", loss, prog_bar=True) + return loss + + def test_step(self, batch, batch_idx): + input, target = batch + output = self.model(input, target) + loss = 
F.nll_loss(output, target.view(-1)) + self.log("test_loss", loss, prog_bar=True) + return loss + + def configure_optimizers(self): + return torch.optim.SGD(self.parameters(), lr=0.1) + + +def main(): + L.seed_everything(42) + + # Data + dataset = WikiText2() + + # Split data in to train, val, test + n = len(dataset) + train_dataset, val_dataset, test_dataset = random_split(dataset, [n - 4000, 2000, 2000]) + train_dataloader = DataLoader(train_dataset, batch_size=20, shuffle=True) + val_dataloader = DataLoader(val_dataset, batch_size=20, shuffle=False) + test_dataloader = DataLoader(test_dataset, batch_size=20, shuffle=False) + + # Model + model = LanguageModel(vocab_size=dataset.vocab_size) + + # Trainer + trainer = L.Trainer(gradient_clip_val=0.25, max_epochs=20) + trainer.fit(model, train_dataloader, val_dataloader) + trainer.test(model, test_dataloader) + + +if __name__ == "__main__": + main() diff --git a/examples/pytorch/bug_report/bug_report_model.ipynb b/examples/pytorch/bug_report/bug_report_model.ipynb new file mode 100644 index 0000000..dababd0 --- /dev/null +++ b/examples/pytorch/bug_report/bug_report_model.ipynb @@ -0,0 +1,267 @@ +{ + "nbformat": 4, + "nbformat_minor": 0, + "metadata": { + "accelerator": "GPU", + "colab": { + "name": "bug_report_model.ipynb", + "provenance": [], + "collapsed_sections": [] + }, + "kernelspec": { + "display_name": "Python 3 (ipykernel)", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.9.7" + } + }, + "cells": [ + { + "cell_type": "markdown", + "metadata": { + "id": "rR4_BAUYs3Mb" + }, + "source": [ + "![image.png]()" + ] + }, + { + "cell_type": "markdown", + "metadata": { + "id": "i7XbLCXGkll9" + }, + "source": [ + "# The Boring Model\n", + "Replicate a bug you experience, using 
this model.\n", + "\n", + "[Remember! we're always available for support on Slack](https://www.pytorchlightning.ai/community)" + ] + }, + { + "cell_type": "markdown", + "metadata": { + "id": "2LODD6w9ixlT" + }, + "source": [ + "---\n", + "## Setup env" + ] + }, + { + "cell_type": "code", + "metadata": { + "id": "zK7-Gg69kMnG" + }, + "source": [ + "%%capture\n", + "! pip install -qU pytorch-lightning" + ], + "execution_count": null, + "outputs": [] + }, + { + "cell_type": "markdown", + "metadata": { + "id": "WvuSN5jEbY8P" + }, + "source": [ + "---\n", + "## Deps" + ] + }, + { + "cell_type": "code", + "metadata": { + "id": "w4_TYnt_keJi" + }, + "source": [ + "import os\n", + "\n", + "import torch\n", + "from torch.utils.data import DataLoader, Dataset\n", + "\n", + "from pytorch_lightning import LightningModule, Trainer" + ], + "execution_count": null, + "outputs": [] + }, + { + "cell_type": "markdown", + "metadata": { + "id": "XrJDukwPtUnS" + }, + "source": [ + "---\n", + "## Data\n", + "Random data is best for debugging. 
If you need special tensor shapes or batch compositions or dataloaders, modify as needed" + ] + }, + { + "cell_type": "code", + "metadata": { + "id": "hvgTiaZpkvwS" + }, + "source": [ + "class RandomDataset(Dataset):\n", + " def __init__(self, size, num_samples):\n", + " self.len = num_samples\n", + " self.data = torch.randn(num_samples, size)\n", + "\n", + " def __getitem__(self, index):\n", + " return self.data[index]\n", + "\n", + " def __len__(self):\n", + " return self.len" + ], + "execution_count": null, + "outputs": [] + }, + { + "cell_type": "code", + "metadata": { + "id": "sxVlWjGhl02D" + }, + "source": [ + "num_samples = 10000" + ], + "execution_count": null, + "outputs": [] + }, + { + "cell_type": "code", + "metadata": { + "id": "V7ELesz1kVQo" + }, + "source": [ + "class BoringModel(LightningModule):\n", + " def __init__(self):\n", + " super().__init__()\n", + " self.layer = torch.nn.Linear(32, 2)\n", + "\n", + " def forward(self, x):\n", + " return self.layer(x)\n", + "\n", + " def training_step(self, batch, batch_idx):\n", + " loss = self(batch).sum()\n", + " self.log(\"train_loss\", loss)\n", + " return {\"loss\": loss}\n", + "\n", + " def validation_step(self, batch, batch_idx):\n", + " loss = self(batch).sum()\n", + " self.log(\"valid_loss\", loss)\n", + "\n", + " def test_step(self, batch, batch_idx):\n", + " loss = self(batch).sum()\n", + " self.log(\"test_loss\", loss)\n", + "\n", + " def configure_optimizers(self):\n", + " return torch.optim.SGD(self.layer.parameters(), lr=0.1)" + ], + "execution_count": null, + "outputs": [] + }, + { + "cell_type": "markdown", + "metadata": { + "id": "ubvW3LGSupmt" + }, + "source": [ + "---\n", + "## Define the test" + ] + }, + { + "cell_type": "code", + "metadata": { + "id": "4Dk6Ykv8lI7X" + }, + "source": [ + "def run():\n", + " train_data = DataLoader(RandomDataset(32, 64), batch_size=2)\n", + " val_data = DataLoader(RandomDataset(32, 64), batch_size=2)\n", + " test_data = DataLoader(RandomDataset(32, 64), 
batch_size=2)\n", + "\n", + " model = BoringModel()\n", + " trainer = Trainer(\n", + " default_root_dir=os.getcwd(),\n", + " limit_train_batches=1,\n", + " limit_val_batches=1,\n", + " limit_test_batches=1,\n", + " num_sanity_val_steps=0,\n", + " max_epochs=1,\n", + " enable_model_summary=False,\n", + " )\n", + " trainer.fit(model, train_dataloaders=train_data, val_dataloaders=val_data)\n", + " trainer.test(model, dataloaders=test_data)" + ], + "execution_count": null, + "outputs": [] + }, + { + "cell_type": "markdown", + "metadata": { + "id": "4dPfTZVgmgxz" + }, + "source": [ + "---\n", + "## Run Test" + ] + }, + { + "cell_type": "code", + "metadata": { + "id": "AAtq1hwSmjKe" + }, + "source": [ + "run()" + ], + "execution_count": null, + "outputs": [] + }, + { + "cell_type": "markdown", + "metadata": { + "id": "Flyi--SpvsJN" + }, + "source": [ + "---\n", + "## Environment\n", + "Run this to get the environment details" + ] + }, + { + "cell_type": "code", + "metadata": { + "id": "0-yvGFRoaDSi" + }, + "source": [ + "%%capture\n", + "! wget https://raw.githubusercontent.com/Lightning-AI/lightning/master/requirements/collect_env_details.py" + ], + "execution_count": null, + "outputs": [] + }, + { + "cell_type": "code", + "metadata": { + "id": "quj4LUDgmFvj" + }, + "source": [ + "! 
python collect_env_details.py" + ], + "execution_count": null, + "outputs": [] + } + ] +} diff --git a/examples/pytorch/bug_report/bug_report_model.py b/examples/pytorch/bug_report/bug_report_model.py new file mode 100644 index 0000000..551ea21 --- /dev/null +++ b/examples/pytorch/bug_report/bug_report_model.py @@ -0,0 +1,66 @@ +import os + +import torch +from torch.utils.data import DataLoader, Dataset + +from lightning.pytorch import LightningModule, Trainer + + +class RandomDataset(Dataset): + def __init__(self, size, length): + self.len = length + self.data = torch.randn(length, size) + + def __getitem__(self, index): + return self.data[index] + + def __len__(self): + return self.len + + +class BoringModel(LightningModule): + def __init__(self): + super().__init__() + self.layer = torch.nn.Linear(32, 2) + + def forward(self, x): + return self.layer(x) + + def training_step(self, batch, batch_idx): + loss = self(batch).sum() + self.log("train_loss", loss) + return {"loss": loss} + + def validation_step(self, batch, batch_idx): + loss = self(batch).sum() + self.log("valid_loss", loss) + + def test_step(self, batch, batch_idx): + loss = self(batch).sum() + self.log("test_loss", loss) + + def configure_optimizers(self): + return torch.optim.SGD(self.layer.parameters(), lr=0.1) + + +def run(): + train_data = DataLoader(RandomDataset(32, 64), batch_size=2) + val_data = DataLoader(RandomDataset(32, 64), batch_size=2) + test_data = DataLoader(RandomDataset(32, 64), batch_size=2) + + model = BoringModel() + trainer = Trainer( + default_root_dir=os.getcwd(), + limit_train_batches=1, + limit_val_batches=1, + limit_test_batches=1, + num_sanity_val_steps=0, + max_epochs=1, + enable_model_summary=False, + ) + trainer.fit(model, train_dataloaders=train_data, val_dataloaders=val_data) + trainer.test(model, dataloaders=test_data) + + +if __name__ == "__main__": + run() diff --git a/examples/pytorch/domain_templates/computer_vision_fine_tuning.py 
b/examples/pytorch/domain_templates/computer_vision_fine_tuning.py new file mode 100644 index 0000000..c7e492e --- /dev/null +++ b/examples/pytorch/domain_templates/computer_vision_fine_tuning.py @@ -0,0 +1,286 @@ +# Copyright The Lightning AI team. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. +"""Computer vision example on Transfer Learning. This computer vision example illustrates how one could fine-tune a +pre-trained network (by default, a ResNet50 is used) using pytorch-lightning. For the sake of this example, the +'cats and dogs dataset' (~60MB, see `DATA_URL` below) is used and the proposed network (denoted by `TransferLearningModel`, +see below) is trained for 15 epochs. + +The training consists of three stages. + +From epoch 0 to 4, the feature extractor (the pre-trained network) is frozen except +maybe for the BatchNorm layers (depending on whether `train_bn = True`). The BatchNorm +layers (if `train_bn = True`) and the parameters of the classifier are trained as a +single parameter group with lr = 1e-2. + +From epoch 5 to 9, the last two layer groups of the pre-trained network are unfrozen +and added to the optimizer as a new parameter group with lr = 1e-4 (while lr = 1e-3 +for the first parameter group in the optimizer). + +Eventually, from epoch 10, all the remaining layer groups of the pre-trained network +are unfrozen and added to the optimizer as a third parameter group. 
From epoch 10, +the parameters of the pre-trained network are trained with lr = 1e-5 while those of +the classifier are trained with lr = 1e-4. + +Note: + See: https://pytorch.org/tutorials/beginner/transfer_learning_tutorial.html + +To run: + python computer_vision_fine_tuning.py fit +""" + +import logging +from pathlib import Path +from typing import Union + +import torch +import torch.nn.functional as F +from torch import nn, optim +from torch.optim.lr_scheduler import MultiStepLR +from torch.optim.optimizer import Optimizer +from torch.utils.data import DataLoader +from torchmetrics import Accuracy +from torchvision import transforms +from torchvision.datasets import ImageFolder +from torchvision.datasets.utils import download_and_extract_archive + +from lightning.pytorch import cli_lightning_logo, LightningDataModule, LightningModule +from lightning.pytorch.callbacks.finetuning import BaseFinetuning +from lightning.pytorch.cli import LightningCLI +from lightning.pytorch.utilities import rank_zero_info +from lightning.pytorch.utilities.model_helpers import get_torchvision_model + +log = logging.getLogger(__name__) +DATA_URL = "https://storage.googleapis.com/mledu-datasets/cats_and_dogs_filtered.zip" + +# --- Finetuning Callback --- + + +class MilestonesFinetuning(BaseFinetuning): + def __init__(self, milestones: tuple = (5, 10), train_bn: bool = False): + super().__init__() + self.milestones = milestones + self.train_bn = train_bn + + def freeze_before_training(self, pl_module: LightningModule): + self.freeze(modules=pl_module.feature_extractor, train_bn=self.train_bn) + + def finetune_function(self, pl_module: LightningModule, epoch: int, optimizer: Optimizer): + if epoch == self.milestones[0]: + # unfreeze 5 last layers + self.unfreeze_and_add_param_group( + modules=pl_module.feature_extractor[-5:], optimizer=optimizer, train_bn=self.train_bn + ) + + elif epoch == self.milestones[1]: + # unfreeze remaining layers + self.unfreeze_and_add_param_group( + 
modules=pl_module.feature_extractor[:-5], optimizer=optimizer, train_bn=self.train_bn + ) + + +class CatDogImageDataModule(LightningDataModule): + def __init__(self, dl_path: Union[str, Path] = "data", num_workers: int = 0, batch_size: int = 8): + """CatDogImageDataModule. + + Args: + dl_path: root directory where to download the data + num_workers: number of CPU workers + batch_size: number of sample in a batch + """ + super().__init__() + + self._dl_path = dl_path + self._num_workers = num_workers + self._batch_size = batch_size + + def prepare_data(self): + """Download images and prepare images datasets.""" + download_and_extract_archive(url=DATA_URL, download_root=self._dl_path, remove_finished=True) + + @property + def data_path(self): + return Path(self._dl_path).joinpath("cats_and_dogs_filtered") + + @property + def normalize_transform(self): + return transforms.Normalize(mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225]) + + @property + def train_transform(self): + return transforms.Compose( + [ + transforms.Resize((224, 224)), + transforms.RandomHorizontalFlip(), + transforms.ToTensor(), + self.normalize_transform, + ] + ) + + @property + def valid_transform(self): + return transforms.Compose([transforms.Resize((224, 224)), transforms.ToTensor(), self.normalize_transform]) + + def create_dataset(self, root, transform): + return ImageFolder(root=root, transform=transform) + + def __dataloader(self, train: bool): + """Train/validation loaders.""" + if train: + dataset = self.create_dataset(self.data_path.joinpath("train"), self.train_transform) + else: + dataset = self.create_dataset(self.data_path.joinpath("validation"), self.valid_transform) + return DataLoader(dataset=dataset, batch_size=self._batch_size, num_workers=self._num_workers, shuffle=train) + + def train_dataloader(self): + log.info("Training data loaded.") + return self.__dataloader(train=True) + + def val_dataloader(self): + log.info("Validation data loaded.") + return 
self.__dataloader(train=False) + + +# --- PyTorch Lightning module --- + + +class TransferLearningModel(LightningModule): + def __init__( + self, + backbone: str = "resnet50", + train_bn: bool = False, + milestones: tuple = (2, 4), + batch_size: int = 32, + lr: float = 1e-3, + lr_scheduler_gamma: float = 1e-1, + num_workers: int = 6, + **kwargs, + ) -> None: + """TransferLearningModel. + + Args: + backbone: Name (as in ``torchvision.models``) of the feature extractor + train_bn: Whether the BatchNorm layers should be trainable + milestones: List of two epochs milestones + lr: Initial learning rate + lr_scheduler_gamma: Factor by which the learning rate is reduced at each milestone + """ + super().__init__() + self.backbone = backbone + self.train_bn = train_bn + self.milestones = milestones + self.batch_size = batch_size + self.lr = lr + self.lr_scheduler_gamma = lr_scheduler_gamma + self.num_workers = num_workers + + self.__build_model() + + self.train_acc = Accuracy(task="binary") + self.valid_acc = Accuracy(task="binary") + self.save_hyperparameters() + + def __build_model(self): + """Define model layers & loss.""" + # 1. Load pre-trained network: + backbone = get_torchvision_model(self.backbone, weights="DEFAULT") + + _layers = list(backbone.children())[:-1] + self.feature_extractor = nn.Sequential(*_layers) + + # 2. Classifier: + _fc_layers = [nn.Linear(2048, 256), nn.ReLU(), nn.Linear(256, 32), nn.Linear(32, 1)] + self.fc = nn.Sequential(*_fc_layers) + + # 3. Loss: + self.loss_func = F.binary_cross_entropy_with_logits + + def forward(self, x): + """Forward pass. + + Returns logits. + """ + # 1. Feature extraction: + x = self.feature_extractor(x) + x = x.squeeze(-1).squeeze(-1) + + # 2. Classifier (returns logits): + x = self.fc(x) + + return x + + def loss(self, logits, labels): + return self.loss_func(input=logits, target=labels) + + def training_step(self, batch, batch_idx): + # 1. 
Forward pass: + x, y = batch + y_logits = self.forward(x) + y_scores = torch.sigmoid(y_logits) + y_true = y.view((-1, 1)).type_as(x) + + # 2. Compute loss + train_loss = self.loss(y_logits, y_true) + + # 3. Compute accuracy: + self.log("train_acc", self.train_acc(y_scores, y_true.int()), prog_bar=True) + + return train_loss + + def validation_step(self, batch, batch_idx): + # 1. Forward pass: + x, y = batch + y_logits = self.forward(x) + y_scores = torch.sigmoid(y_logits) + y_true = y.view((-1, 1)).type_as(x) + + # 2. Compute loss + self.log("val_loss", self.loss(y_logits, y_true), prog_bar=True) + + # 3. Compute accuracy: + self.log("val_acc", self.valid_acc(y_scores, y_true.int()), prog_bar=True) + + def configure_optimizers(self): + parameters = list(self.parameters()) + trainable_parameters = list(filter(lambda p: p.requires_grad, parameters)) + rank_zero_info( + f"The model will start training with only {len(trainable_parameters)} " + f"trainable parameters out of {len(parameters)}." 
+ ) + optimizer = optim.Adam(trainable_parameters, lr=self.lr) + scheduler = MultiStepLR(optimizer, milestones=self.milestones, gamma=self.lr_scheduler_gamma) + return [optimizer], [scheduler] + + +class MyLightningCLI(LightningCLI): + def add_arguments_to_parser(self, parser): + parser.add_lightning_class_args(MilestonesFinetuning, "finetuning") + parser.link_arguments("data.batch_size", "model.batch_size") + parser.link_arguments("finetuning.milestones", "model.milestones") + parser.link_arguments("finetuning.train_bn", "model.train_bn") + parser.set_defaults( + { + "trainer.max_epochs": 15, + "trainer.enable_model_summary": False, + "trainer.num_sanity_val_steps": 0, + } + ) + + +def cli_main(): + MyLightningCLI(TransferLearningModel, CatDogImageDataModule, seed_everything_default=1234) + + +if __name__ == "__main__": + cli_lightning_logo() + cli_main() diff --git a/examples/pytorch/domain_templates/generative_adversarial_net.py b/examples/pytorch/domain_templates/generative_adversarial_net.py new file mode 100644 index 0000000..7837f6a --- /dev/null +++ b/examples/pytorch/domain_templates/generative_adversarial_net.py @@ -0,0 +1,233 @@ +# Copyright The Lightning AI team. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. +"""To run this template just do: python generative_adversarial_net.py. 
+ +After a few epochs, launch TensorBoard to see the images being generated at every batch: + +tensorboard --logdir default +""" +from argparse import ArgumentParser, Namespace + +import numpy as np +import torch +import torch.nn as nn +import torch.nn.functional as F + +from lightning.pytorch import cli_lightning_logo +from lightning.pytorch.core import LightningModule +from lightning.pytorch.demos.mnist_datamodule import MNISTDataModule +from lightning.pytorch.trainer import Trainer +from lightning.pytorch.utilities.imports import _TORCHVISION_AVAILABLE + +if _TORCHVISION_AVAILABLE: + import torchvision + + +class Generator(nn.Module): + """ + >>> Generator(img_shape=(1, 8, 8)) # doctest: +ELLIPSIS +NORMALIZE_WHITESPACE + Generator( + (model): Sequential(...) + ) + """ + + def __init__(self, latent_dim: int = 100, img_shape: tuple = (1, 28, 28)): + super().__init__() + self.img_shape = img_shape + + def block(in_feat, out_feat, normalize=True): + layers = [nn.Linear(in_feat, out_feat)] + if normalize: + layers.append(nn.BatchNorm1d(out_feat, 0.8)) + layers.append(nn.LeakyReLU(0.2, inplace=True)) + return layers + + self.model = nn.Sequential( + *block(latent_dim, 128, normalize=False), + *block(128, 256), + *block(256, 512), + *block(512, 1024), + nn.Linear(1024, int(np.prod(img_shape))), + nn.Tanh(), + ) + + def forward(self, z): + img = self.model(z) + img = img.view(img.size(0), *self.img_shape) + return img + + +class Discriminator(nn.Module): + """ + >>> Discriminator(img_shape=(1, 28, 28)) # doctest: +ELLIPSIS +NORMALIZE_WHITESPACE + Discriminator( + (model): Sequential(...) 
+ ) + """ + + def __init__(self, img_shape): + super().__init__() + + self.model = nn.Sequential( + nn.Linear(int(np.prod(img_shape)), 512), + nn.LeakyReLU(0.2, inplace=True), + nn.Linear(512, 256), + nn.LeakyReLU(0.2, inplace=True), + nn.Linear(256, 1), + ) + + def forward(self, img): + img_flat = img.view(img.size(0), -1) + return self.model(img_flat) + + +class GAN(LightningModule): + """ + >>> GAN(img_shape=(1, 8, 8)) # doctest: +ELLIPSIS +NORMALIZE_WHITESPACE + GAN( + (generator): Generator( + (model): Sequential(...) + ) + (discriminator): Discriminator( + (model): Sequential(...) + ) + ) + """ + + def __init__( + self, + img_shape: tuple = (1, 28, 28), + lr: float = 0.0002, + b1: float = 0.5, + b2: float = 0.999, + latent_dim: int = 100, + ): + super().__init__() + self.save_hyperparameters() + self.automatic_optimization = False + + # networks + self.generator = Generator(latent_dim=self.hparams.latent_dim, img_shape=img_shape) + self.discriminator = Discriminator(img_shape=img_shape) + + self.validation_z = torch.randn(8, self.hparams.latent_dim) + + self.example_input_array = torch.zeros(2, self.hparams.latent_dim) + + def forward(self, z): + return self.generator(z) + + @staticmethod + def adversarial_loss(y_hat, y): + return F.binary_cross_entropy_with_logits(y_hat, y) + + def training_step(self, batch): + imgs, _ = batch + + opt_g, opt_d = self.optimizers() + + # sample noise + z = torch.randn(imgs.shape[0], self.hparams.latent_dim) + z = z.type_as(imgs) + + # Train generator + # ground truth result (ie: all fake) + # put on GPU because we created this tensor inside training_loop + valid = torch.ones(imgs.size(0), 1) + valid = valid.type_as(imgs) + + self.toggle_optimizer(opt_g) + # adversarial loss is binary cross-entropy + g_loss = self.adversarial_loss(self.discriminator(self(z)), valid) + opt_g.zero_grad() + self.manual_backward(g_loss) + opt_g.step() + self.untoggle_optimizer(opt_g) + + # Train discriminator + # Measure discriminator's ability to 
classify real from generated samples + # how well can it label as real? + valid = torch.ones(imgs.size(0), 1) + valid = valid.type_as(imgs) + + self.toggle_optimizer(opt_d) + real_loss = self.adversarial_loss(self.discriminator(imgs), valid) + + # how well can it label as fake? + fake = torch.zeros(imgs.size(0), 1) + fake = fake.type_as(imgs) + + fake_loss = self.adversarial_loss(self.discriminator(self(z).detach()), fake) + + # discriminator loss is the average of these + d_loss = (real_loss + fake_loss) / 2 + + opt_d.zero_grad() + self.manual_backward(d_loss) + opt_d.step() + self.untoggle_optimizer(opt_d) + + self.log_dict({"d_loss": d_loss, "g_loss": g_loss}) + + def configure_optimizers(self): + lr = self.hparams.lr + b1 = self.hparams.b1 + b2 = self.hparams.b2 + + opt_g = torch.optim.Adam(self.generator.parameters(), lr=lr, betas=(b1, b2)) + opt_d = torch.optim.Adam(self.discriminator.parameters(), lr=lr, betas=(b1, b2)) + return opt_g, opt_d + + def on_train_epoch_end(self): + z = self.validation_z.type_as(self.generator.model[0].weight) + + # log sampled images + sample_imgs = self(z) + grid = torchvision.utils.make_grid(sample_imgs) + for logger in self.loggers: + logger.experiment.add_image("generated_images", grid, self.current_epoch) + + +def main(args: Namespace) -> None: + # ------------------------ + # 1 INIT LIGHTNING MODEL + # ------------------------ + model = GAN(lr=args.lr, b1=args.b1, b2=args.b2, latent_dim=args.latent_dim) + + # ------------------------ + # 2 INIT TRAINER + # ------------------------ + # If use distributed training PyTorch recommends to use DistributedDataParallel. 
+ # See: https://pytorch.org/docs/stable/nn.html#torch.nn.DataParallel + dm = MNISTDataModule() + trainer = Trainer(accelerator="gpu", devices=1) + + # ------------------------ + # 3 START TRAINING + # ------------------------ + trainer.fit(model, dm) + + +if __name__ == "__main__": + cli_lightning_logo() + parser = ArgumentParser() + + # Hyperparameters + parser.add_argument("--lr", type=float, default=0.0002, help="adam: learning rate") + parser.add_argument("--b1", type=float, default=0.5, help="adam: decay of first order momentum of gradient") + parser.add_argument("--b2", type=float, default=0.999, help="adam: decay of second order momentum of gradient") + parser.add_argument("--latent_dim", type=int, default=100, help="dimensionality of the latent space") + args = parser.parse_args() + + main(args) diff --git a/examples/pytorch/domain_templates/imagenet.py b/examples/pytorch/domain_templates/imagenet.py new file mode 100644 index 0000000..0d7275f --- /dev/null +++ b/examples/pytorch/domain_templates/imagenet.py @@ -0,0 +1,195 @@ +# Copyright The Lightning AI team. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. +"""This example is largely adapted from https://github.com/pytorch/examples/blob/master/imagenet/main.py. + +Before you can run this example, you will need to download the ImageNet dataset manually from the +`official website `_ and place it into a folder `path/to/imagenet`. + +Train on ImageNet with default parameters: + +.. 
code-block:: bash + + python imagenet.py fit --model.data_path /path/to/imagenet + +or show all options you can change: + +.. code-block:: bash + + python imagenet.py --help + python imagenet.py fit --help +""" +import os +from typing import Optional + +import torch +import torch.nn.functional as F +import torch.nn.parallel +import torch.optim as optim +import torch.optim.lr_scheduler as lr_scheduler +import torch.utils.data +import torch.utils.data.distributed +import torchvision.datasets as datasets +import torchvision.transforms as transforms +from torch.utils.data import Dataset +from torchmetrics import Accuracy + +from lightning.pytorch import LightningModule +from lightning.pytorch.callbacks import ModelCheckpoint, TQDMProgressBar +from lightning.pytorch.cli import LightningCLI +from lightning.pytorch.strategies import ParallelStrategy +from lightning.pytorch.utilities.model_helpers import get_torchvision_model + + +class ImageNetLightningModel(LightningModule): + """ + >>> ImageNetLightningModel(data_path='missing') # doctest: +ELLIPSIS +NORMALIZE_WHITESPACE + ImageNetLightningModel( + (model): ResNet(...) 
+ ) + """ + + def __init__( + self, + data_path: str, + arch: str = "resnet18", + weights: Optional[str] = None, + lr: float = 0.1, + momentum: float = 0.9, + weight_decay: float = 1e-4, + batch_size: int = 256, + workers: int = 4, + ): + super().__init__() + self.arch = arch + self.weights = weights + self.lr = lr + self.momentum = momentum + self.weight_decay = weight_decay + self.data_path = data_path + self.batch_size = batch_size + self.workers = workers + self.model = get_torchvision_model(self.arch, weights=self.weights) + self.train_dataset: Optional[Dataset] = None + self.eval_dataset: Optional[Dataset] = None + # ToDo: this number of classes hall be parsed when the dataset is loaded from folder + self.train_acc1 = Accuracy(task="multiclass", num_classes=1000, top_k=1) + self.train_acc5 = Accuracy(task="multiclass", num_classes=1000, top_k=5) + self.eval_acc1 = Accuracy(task="multiclass", num_classes=1000, top_k=1) + self.eval_acc5 = Accuracy(task="multiclass", num_classes=1000, top_k=5) + + def forward(self, x): + return self.model(x) + + def training_step(self, batch, batch_idx): + images, target = batch + output = self.model(images) + loss_train = F.cross_entropy(output, target) + self.log("train_loss", loss_train) + # update metrics + self.train_acc1(output, target) + self.train_acc5(output, target) + self.log("train_acc1", self.train_acc1, prog_bar=True) + self.log("train_acc5", self.train_acc5, prog_bar=True) + return loss_train + + def eval_step(self, batch, batch_idx, prefix: str): + images, target = batch + output = self.model(images) + loss_val = F.cross_entropy(output, target) + self.log(f"{prefix}_loss", loss_val) + # update metrics + self.eval_acc1(output, target) + self.eval_acc5(output, target) + self.log(f"{prefix}_acc1", self.eval_acc1, prog_bar=True) + self.log(f"{prefix}_acc5", self.eval_acc5, prog_bar=True) + return loss_val + + def validation_step(self, batch, batch_idx): + return self.eval_step(batch, batch_idx, "val") + + def 
test_step(self, batch, batch_idx): + return self.eval_step(batch, batch_idx, "test") + + def configure_optimizers(self): + optimizer = optim.SGD(self.parameters(), lr=self.lr, momentum=self.momentum, weight_decay=self.weight_decay) + scheduler = lr_scheduler.LambdaLR(optimizer, lambda epoch: 0.1 ** (epoch // 30)) + return [optimizer], [scheduler] + + def setup(self, stage: str): + if isinstance(self.trainer.strategy, ParallelStrategy): + # When using a single GPU per process and per `DistributedDataParallel`, we need to divide the batch size + # ourselves based on the total number of GPUs we have + num_processes = max(1, self.trainer.strategy.num_processes) + self.batch_size = int(self.batch_size / num_processes) + self.workers = int(self.workers / num_processes) + + if stage == "fit": + normalize = transforms.Normalize(mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225]) + train_dir = os.path.join(self.data_path, "train") + self.train_dataset = datasets.ImageFolder( + train_dir, + transforms.Compose( + [ + transforms.RandomResizedCrop(224), + transforms.RandomHorizontalFlip(), + transforms.ToTensor(), + normalize, + ] + ), + ) + # all stages will use the eval dataset + normalize = transforms.Normalize(mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225]) + val_dir = os.path.join(self.data_path, "val") + self.eval_dataset = datasets.ImageFolder( + val_dir, + transforms.Compose([transforms.Resize(256), transforms.CenterCrop(224), transforms.ToTensor(), normalize]), + ) + + def train_dataloader(self): + return torch.utils.data.DataLoader( + dataset=self.train_dataset, + batch_size=self.batch_size, + shuffle=True, + num_workers=self.workers, + pin_memory=True, + ) + + def val_dataloader(self): + return torch.utils.data.DataLoader( + self.eval_dataset, batch_size=self.batch_size, num_workers=self.workers, pin_memory=True + ) + + def test_dataloader(self): + return self.val_dataloader() + + +if __name__ == "__main__": + LightningCLI( + ImageNetLightningModel, + 
trainer_defaults={ + "max_epochs": 90, + "accelerator": "auto", + "devices": 1, + "logger": False, + "benchmark": True, + "callbacks": [ + # the PyTorch example refreshes every 10 batches + TQDMProgressBar(refresh_rate=10), + # save when the validation top1 accuracy improves + ModelCheckpoint(monitor="val_acc1", mode="max"), + ], + }, + seed_everything_default=42, + save_config_kwargs={"overwrite": True}, + ) diff --git a/examples/pytorch/domain_templates/reinforce_learn_Qnet.py b/examples/pytorch/domain_templates/reinforce_learn_Qnet.py new file mode 100644 index 0000000..0f3e455 --- /dev/null +++ b/examples/pytorch/domain_templates/reinforce_learn_Qnet.py @@ -0,0 +1,395 @@ +# Copyright The Lightning AI team. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. +"""Deep Reinforcement Learning: Deep Q-network (DQN) + +The template illustrates using Lightning for Reinforcement Learning. The example builds a basic DQN using the +classic CartPole environment. + +To run the template, just run: +`python reinforce_learn_Qnet.py` + +After ~1500 steps, you will see the total_reward hitting the max score of 475+. 
# Named tuple for storing experience steps gathered in training
Experience = namedtuple("Experience", field_names=["state", "action", "reward", "done", "new_state"])


class ReplayBuffer:
    """Replay Buffer for storing past experiences allowing the agent to learn from them.

    The buffer is a bounded ``deque``: once ``capacity`` items are stored, appending a new experience drops the
    oldest one.

    >>> ReplayBuffer(5)  # doctest: +ELLIPSIS
    <...reinforce_learn_Qnet.ReplayBuffer object at ...>
    """

    def __init__(self, capacity: int) -> None:
        """
        Args:
            capacity: size of the buffer
        """
        self.buffer = deque(maxlen=capacity)

    def __len__(self) -> int:
        """Return the number of experiences currently stored."""
        return len(self.buffer)

    def append(self, experience: Experience) -> None:
        """Add experience to the buffer.

        Args:
            experience: tuple (state, action, reward, done, new_state)
        """
        self.buffer.append(experience)

    def sample(self, batch_size: int) -> Tuple:
        """Draw ``batch_size`` distinct experiences uniformly at random.

        Args:
            batch_size: number of experiences to draw; must not exceed ``len(self)`` because sampling is done
                without replacement

        Returns:
            tuple of arrays ``(states, actions, rewards, dones, next_states)``; rewards are ``float32`` and
            dones are boolean
        """
        indices = np.random.choice(len(self.buffer), batch_size, replace=False)
        states, actions, rewards, dones, next_states = zip(*(self.buffer[idx] for idx in indices))

        return (
            np.array(states),
            np.array(actions),
            np.array(rewards, dtype=np.float32),
            # `np.bool` was only an alias of the builtin and has been removed from NumPy; use `bool` directly
            np.array(dones, dtype=bool),
            np.array(next_states),
        )
class DQNLightning(LightningModule):
    """Basic DQN Model.

    >>> DQNLightning(env="CartPole-v1")  # doctest: +ELLIPSIS +NORMALIZE_WHITESPACE
    DQNLightning(
      (net): DQN(
        (net): Sequential(...)
      )
      (target_net): DQN(
        (net): Sequential(...)
      )
    )
    """

    def __init__(
        self,
        env: str,
        replay_size: int = 200,
        warm_start_steps: int = 200,
        gamma: float = 0.99,
        eps_start: float = 1.0,
        eps_end: float = 0.01,
        eps_last_frame: int = 200,
        sync_rate: int = 10,
        lr: float = 1e-2,
        episode_length: int = 50,
        batch_size: int = 4,
        **kwargs,
    ) -> None:
        """
        Args:
            env: gym environment tag
            replay_size: capacity of the replay buffer
            warm_start_steps: number of random steps used to fill the buffer before training
            gamma: discount factor
            eps_start: starting value of epsilon
            eps_end: final value of epsilon
            eps_last_frame: step at which epsilon stops decaying
            sync_rate: number of steps between copies of the online weights into the target network
            lr: learning rate
            episode_length: number of experiences sampled from the buffer per dataset iteration
            batch_size: size of the batches
        """
        super().__init__(**kwargs)
        self.replay_size = replay_size
        self.warm_start_steps = warm_start_steps
        self.gamma = gamma
        self.eps_start = eps_start
        self.eps_end = eps_end
        self.eps_last_frame = eps_last_frame
        self.sync_rate = sync_rate
        self.lr = lr
        self.episode_length = episode_length
        self.batch_size = batch_size

        self.env = gym.make(env)
        obs_size = self.env.observation_space.shape[0]
        n_actions = self.env.action_space.n

        self.net = DQN(obs_size, n_actions)
        self.target_net = DQN(obs_size, n_actions)

        self.buffer = ReplayBuffer(self.replay_size)
        self.agent = Agent(self.env, self.buffer)
        self.total_reward = 0
        self.episode_reward = 0
        self.populate(self.warm_start_steps)

    def populate(self, steps: int = 1000) -> None:
        """Carries out several random steps through the environment to initially fill up the replay buffer with
        experiences.

        Args:
            steps: number of random steps to populate the buffer with
        """
        for _ in range(steps):
            # epsilon=1.0 makes every action random
            self.agent.play_step(self.net, epsilon=1.0)

    def forward(self, x: torch.Tensor) -> torch.Tensor:
        """Passes in a state `x` through the network and gets the `q_values` of each action as an output.

        Args:
            x: environment state

        Returns:
            q values
        """
        return self.net(x)

    def dqn_mse_loss(self, batch: Tuple[torch.Tensor, torch.Tensor]) -> torch.Tensor:
        """Calculates the mse loss using a mini batch from the replay buffer.

        Args:
            batch: current mini batch of replay data

        Returns:
            loss
        """
        states, actions, rewards, dones, next_states = batch

        # Q-value of the action that was actually taken in each state
        state_action_values = self.net(states).gather(1, actions.unsqueeze(-1)).squeeze(-1)

        with torch.no_grad():
            next_state_values = self.target_net(next_states).max(1)[0]
            # finished episodes have no future return
            next_state_values[dones] = 0.0
            next_state_values = next_state_values.detach()

        expected_state_action_values = next_state_values * self.gamma + rewards

        return nn.MSELoss()(state_action_values, expected_state_action_values)

    def training_step(self, batch: Tuple[torch.Tensor, torch.Tensor], nb_batch) -> OrderedDict:
        """Carries out a single step through the environment to update the replay buffer. Then calculates loss
        based on the minibatch received.

        Args:
            batch: current mini batch of replay data
            nb_batch: batch number

        Returns:
            Dictionary holding the training loss under the ``"loss"`` key
        """
        device = self.get_device(batch)
        epsilon = max(self.eps_end, self.eps_start - (self.global_step + 1) / self.eps_last_frame)

        # step through environment with agent
        reward, done = self.agent.play_step(self.net, epsilon, device)
        self.episode_reward += reward

        # calculates training loss
        loss = self.dqn_mse_loss(batch)

        if done:
            self.total_reward = self.episode_reward
            self.episode_reward = 0

        # Hard sync: copy the online weights into the target network every `sync_rate` steps
        if self.global_step % self.sync_rate == 0:
            self.target_net.load_state_dict(self.net.state_dict())

        # Metrics have to go through the logging API; "log"/"progress_bar" keys in the returned dictionary
        # are not picked up by the logger or the progress bar.
        self.log_dict(
            {
                "total_reward": float(self.total_reward),
                "reward": float(reward),
                "steps": float(self.global_step),
            },
            prog_bar=True,
        )

        return OrderedDict({"loss": loss})

    def configure_optimizers(self) -> List[Optimizer]:
        """Initialize Adam optimizer."""
        optimizer = optim.Adam(self.net.parameters(), lr=self.lr)
        return [optimizer]

    def __dataloader(self) -> DataLoader:
        """Initialize the Replay Buffer dataset used for retrieving experiences."""
        dataset = RLDataset(self.buffer, self.episode_length)
        return DataLoader(dataset=dataset, batch_size=self.batch_size, sampler=None)

    def train_dataloader(self) -> DataLoader:
        """Get train loader."""
        return self.__dataloader()

    def get_device(self, batch) -> str:
        """Retrieve device currently being used by minibatch."""
        return batch[0].device.index if self.on_gpu else "cpu"
def create_mlp(input_shape: Tuple[int], n_actions: int, hidden_size: int = 128):
    """Build a small fully connected network with two hidden ReLU layers.

    Args:
        input_shape: observation shape; only its first entry is used as the input width
        n_actions: width of the output layer
        hidden_size: width of both hidden layers

    Returns:
        ``nn.Sequential`` made of Linear -> ReLU -> Linear -> ReLU -> Linear
    """
    in_features = input_shape[0]
    layers = [
        nn.Linear(in_features, hidden_size),
        nn.ReLU(),
        nn.Linear(hidden_size, hidden_size),
        nn.ReLU(),
        nn.Linear(hidden_size, n_actions),
    ]
    return nn.Sequential(*layers)
class ActorContinuous(nn.Module):
    """Policy network, for continuous action spaces, which returns a distribution and an action given an
    observation."""

    def __init__(self, actor_net, act_dim):
        """
        Args:
            actor_net: network mapping observations to the mean of the action distribution
            act_dim: number of action dimensions; one learnable log standard deviation is kept per dimension
        """
        super().__init__()
        self.actor_net = actor_net
        # state-independent log std, initialised to -0.5 for every action dimension
        log_std = -0.5 * torch.ones(act_dim, dtype=torch.float)
        self.log_std = nn.Parameter(log_std)

    def forward(self, states):
        """Build the action distribution for ``states`` and sample from it.

        Returns:
            tuple ``(pi, actions)`` with the ``Normal`` distribution and one sampled action per state
        """
        mu = self.actor_net(states)
        std = torch.exp(self.log_std)
        pi = Normal(loc=mu, scale=std)
        actions = pi.sample()

        return pi, actions

    def get_log_prob(self, pi: Normal, actions: torch.Tensor):
        """Takes in a distribution and actions and returns log prob of actions under the distribution.

        Args:
            pi: torch distribution
            actions: actions taken by distribution

        Returns:
            log probability of the action under pi
        """
        # per-dimension log probabilities are summed over the last (action) dimension
        return pi.log_prob(actions).sum(dim=-1)
class PPOLightning(LightningModule):
    """PyTorch Lightning implementation of PPO.

    Example:
        model = PPOLightning("CartPole-v0")
    Train:
        trainer = Trainer()
        trainer.fit(model)
    """

    def __init__(
        self,
        env: str,
        gamma: float = 0.99,
        lam: float = 0.95,
        lr_actor: float = 3e-4,
        lr_critic: float = 1e-3,
        max_episode_len: int = 200,
        batch_size: int = 512,
        steps_per_epoch: int = 2048,
        nb_optim_iters: int = 4,
        clip_ratio: float = 0.2,
        **kwargs,
    ) -> None:
        """
        Args:
            env: gym environment tag
            gamma: discount factor
            lam: advantage discount factor (lambda in the paper)
            lr_actor: learning rate of actor network
            lr_critic: learning rate of critic network
            max_episode_len: maximum number interactions (actions) in an episode
            batch_size:  batch_size when training network- can simulate number of policy updates performed per epoch
            steps_per_epoch: how many action-state pairs to rollout for trajectory collection per epoch
            nb_optim_iters: how many steps of gradient descent to perform on each batch
            clip_ratio: hyperparameter for clipping in the policy objective
        """
        super().__init__()

        # Hyperparameters
        self.lr_actor = lr_actor
        self.lr_critic = lr_critic
        self.steps_per_epoch = steps_per_epoch
        self.nb_optim_iters = nb_optim_iters
        self.batch_size = batch_size
        self.gamma = gamma
        self.lam = lam
        self.max_episode_len = max_episode_len
        self.clip_ratio = clip_ratio
        self.save_hyperparameters()

        # actor and critic are stepped by hand in `training_step`
        self.automatic_optimization = False

        self.env = gym.make(env)
        # value network
        self.critic = create_mlp(self.env.observation_space.shape, 1)
        # policy network (agent)
        if isinstance(self.env.action_space, gym.spaces.box.Box):
            act_dim = self.env.action_space.shape[0]
            actor_mlp = create_mlp(self.env.observation_space.shape, act_dim)
            self.actor = ActorContinuous(actor_mlp, act_dim)
        elif isinstance(self.env.action_space, gym.spaces.discrete.Discrete):
            actor_mlp = create_mlp(self.env.observation_space.shape, self.env.action_space.n)
            self.actor = ActorCategorical(actor_mlp)
        else:
            raise NotImplementedError(
                "Env action space should be of type Box (continuous) or Discrete (categorical)."
                f" Got type: {type(self.env.action_space)}"
            )

        # rollout storage for the current epoch
        self.batch_states = []
        self.batch_actions = []
        self.batch_adv = []
        self.batch_qvals = []
        self.batch_logp = []

        # per-episode storage, reset whenever an episode ends or is cut off
        self.ep_rewards = []
        self.ep_values = []
        self.epoch_rewards = []

        self.episode_step = 0
        self.avg_ep_reward = 0
        self.avg_ep_len = 0
        self.avg_reward = 0

        self.state = torch.FloatTensor(self.env.reset())

    def forward(self, x: torch.Tensor) -> Tuple[torch.Tensor, torch.Tensor, torch.Tensor]:
        """Passes in a state x through the network and returns the policy and a sampled action.

        Args:
            x: environment state

        Returns:
            Tuple of policy, action and the critic's value estimate
        """
        pi, action = self.actor(x)
        value = self.critic(x)

        return pi, action, value

    def discount_rewards(self, rewards: List[float], discount: float) -> List[float]:
        """Calculate the discounted rewards of all rewards in list.

        Args:
            rewards: list of rewards/advantages
            discount: factor applied to the running sum at every step back in time

        Returns:
            list of discounted rewards/advantages; empty when ``rewards`` is empty
        """
        cumul_reward = []
        sum_r = 0.0

        # walk backwards so each entry accumulates everything that follows it
        for r in reversed(rewards):
            sum_r = (sum_r * discount) + r
            cumul_reward.append(sum_r)

        cumul_reward.reverse()
        return cumul_reward

    def calc_advantage(self, rewards: List[float], values: List[float], last_value: float) -> List[float]:
        """Calculate the advantage given rewards, state values, and the last value of episode.

        Args:
            rewards: list of episode rewards
            values: list of state values from critic
            last_value: value of last state of episode

        Returns:
            list of advantages
        """
        rews = rewards + [last_value]
        vals = values + [last_value]
        # GAE
        delta = [rews[i] + self.gamma * vals[i + 1] - vals[i] for i in range(len(rews) - 1)]
        return self.discount_rewards(delta, self.gamma * self.lam)

    def generate_trajectory_samples(self) -> Iterator[Tuple]:
        """
        Contains the logic for generating trajectory data to train policy and value network
        Yield:
           Tuple of tensors/values for state, action, log prob, qval and advantage of a single step
        """
        for step in range(self.steps_per_epoch):
            self.state = self.state.to(device=self.device)

            with torch.no_grad():
                pi, action, value = self(self.state)
                log_prob = self.actor.get_log_prob(pi, action)

            next_state, reward, done, _ = self.env.step(action.cpu().numpy())

            self.episode_step += 1

            self.batch_states.append(self.state)
            self.batch_actions.append(action)
            self.batch_logp.append(log_prob)

            self.ep_rewards.append(reward)
            self.ep_values.append(value.item())

            self.state = torch.FloatTensor(next_state)

            epoch_end = step == (self.steps_per_epoch - 1)
            terminal = len(self.ep_rewards) == self.max_episode_len

            if epoch_end or done or terminal:
                # if trajectory ends abruptly, bootstrap value of next state
                if (terminal or epoch_end) and not done:
                    self.state = self.state.to(device=self.device)
                    with torch.no_grad():
                        _, _, value = self(self.state)
                        last_value = value.item()
                        steps_before_cutoff = self.episode_step
                else:
                    last_value = 0
                    steps_before_cutoff = 0

                # discounted cumulative reward
                self.batch_qvals += self.discount_rewards(self.ep_rewards + [last_value], self.gamma)[:-1]
                # advantage
                self.batch_adv += self.calc_advantage(self.ep_rewards, self.ep_values, last_value)
                # logs
                self.epoch_rewards.append(sum(self.ep_rewards))
                # reset params
                self.ep_rewards = []
                self.ep_values = []
                self.episode_step = 0
                self.state = torch.FloatTensor(self.env.reset())

            if epoch_end:
                train_data = zip(
                    self.batch_states, self.batch_actions, self.batch_logp, self.batch_qvals, self.batch_adv
                )

                for state, action, logp_old, qval, adv in train_data:
                    yield state, action, logp_old, qval, adv

                self.batch_states.clear()
                self.batch_actions.clear()
                self.batch_adv.clear()
                self.batch_logp.clear()
                self.batch_qvals.clear()

                # logging
                self.avg_reward = sum(self.epoch_rewards) / self.steps_per_epoch

                # if epoch ended abruptly, exclude last cut-short episode to prevent stats skewness
                epoch_rewards = self.epoch_rewards
                if not done:
                    if len(epoch_rewards) > 1:
                        epoch_rewards = epoch_rewards[:-1]
                    else:
                        # the cut-short episode is the only one collected this epoch: keep it (and count all
                        # of its steps) so the averages below never divide by zero
                        steps_before_cutoff = 0

                total_epoch_reward = sum(epoch_rewards)
                nb_episodes = len(epoch_rewards)

                self.avg_ep_reward = total_epoch_reward / nb_episodes
                self.avg_ep_len = (self.steps_per_epoch - steps_before_cutoff) / nb_episodes

                self.epoch_rewards.clear()

    def actor_loss(self, state, action, logp_old, qval, adv) -> torch.Tensor:
        """Clipped surrogate policy loss: negative mean of min(ratio * adv, clipped ratio * adv)."""
        pi, _ = self.actor(state)
        logp = self.actor.get_log_prob(pi, action)
        ratio = torch.exp(logp - logp_old)
        clip_adv = torch.clamp(ratio, 1 - self.clip_ratio, 1 + self.clip_ratio) * adv
        return -(torch.min(ratio * adv, clip_adv)).mean()

    def critic_loss(self, state, action, logp_old, qval, adv) -> torch.Tensor:
        """Mean squared difference between ``qval`` and the critic's output for ``state``."""
        value = self.critic(state)
        return (qval - value).pow(2).mean()

    def training_step(self, batch: Tuple[torch.Tensor, torch.Tensor]):
        """Carries out a single update to actor and critic network from a batch of replay buffer.

        Args:
            batch: batch of replay buffer/trajectory data
        """
        state, action, old_logp, qval, adv = batch

        # normalize advantages; the epsilon keeps the division finite when all advantages are equal
        adv = (adv - adv.mean()) / (adv.std() + 1e-8)

        self.log("avg_ep_len", self.avg_ep_len, prog_bar=True, on_step=False, on_epoch=True)
        self.log("avg_ep_reward", self.avg_ep_reward, prog_bar=True, on_step=False, on_epoch=True)
        self.log("avg_reward", self.avg_reward, prog_bar=True, on_step=False, on_epoch=True)

        optimizer_actor, optimizer_critic = self.optimizers()

        loss_actor = self.actor_loss(state, action, old_logp, qval, adv)
        self.manual_backward(loss_actor)
        optimizer_actor.step()
        optimizer_actor.zero_grad()

        loss_critic = self.critic_loss(state, action, old_logp, qval, adv)
        self.manual_backward(loss_critic)
        optimizer_critic.step()
        optimizer_critic.zero_grad()

        self.log("loss_critic", loss_critic, on_step=False, on_epoch=True, prog_bar=False, logger=True)
        self.log("loss_actor", loss_actor, on_step=False, on_epoch=True, prog_bar=True, logger=True)

    def configure_optimizers(self) -> Tuple[Optimizer, Optimizer]:
        """Initialize one Adam optimizer for the actor and one for the critic."""
        optimizer_actor = torch.optim.Adam(self.actor.parameters(), lr=self.lr_actor)
        optimizer_critic = torch.optim.Adam(self.critic.parameters(), lr=self.lr_critic)
        return optimizer_actor, optimizer_critic

    def optimizer_step(self, *args, **kwargs):
        """Run 'nb_optim_iters' number of iterations of gradient descent on actor and critic for each data
        sample."""
        # NOTE(review): `automatic_optimization` is disabled in `__init__` and the optimizers are stepped by hand
        # in `training_step`; this hook presumably is not invoked in that mode, which would leave
        # `nb_optim_iters` without effect - confirm against the Lightning manual-optimization docs.
        for _ in range(self.nb_optim_iters):
            super().optimizer_step(*args, **kwargs)

    def _dataloader(self) -> DataLoader:
        """Initialize the Replay Buffer dataset used for retrieving experiences."""
        dataset = ExperienceSourceDataset(self.generate_trajectory_samples)
        return DataLoader(dataset=dataset, batch_size=self.batch_size)

    def train_dataloader(self) -> DataLoader:
        """Get train loader."""
        return self._dataloader()
def main(args) -> None:
    """Build the PPO model from the parsed command-line arguments and train it on a single CPU device."""
    model = PPOLightning(**vars(args))
    trainer = Trainer(accelerator="cpu", devices=1, val_check_interval=100)
    trainer.fit(model)


if __name__ == "__main__":
    cli_lightning_logo()
    seed_everything(0)

    parser = argparse.ArgumentParser()
    parser.add_argument("--env", type=str, default="CartPole-v0")
    parser.add_argument("--gamma", type=float, default=0.99, help="discount factor")
    parser.add_argument("--lam", type=float, default=0.95, help="advantage discount factor")
    parser.add_argument("--lr_actor", type=float, default=3e-4, help="learning rate of actor network")
    parser.add_argument("--lr_critic", type=float, default=1e-3, help="learning rate of critic network")
    # the help text previously described a replay buffer, which this option has nothing to do with
    parser.add_argument(
        "--max_episode_len",
        type=int,
        default=1000,
        help="maximum number of interactions (actions) in an episode",
    )
    parser.add_argument("--batch_size", type=int, default=512, help="batch_size when training network")
    parser.add_argument(
        "--steps_per_epoch",
        type=int,
        default=2048,
        help="how many action-state pairs to rollout for trajectory collection per epoch",
    )
    parser.add_argument(
        "--nb_optim_iters", type=int, default=4, help="how many steps of gradient descent to perform on each batch"
    )
    parser.add_argument(
        "--clip_ratio", type=float, default=0.2, help="hyperparameter for clipping in the policy objective"
    )
    args = parser.parse_args()

    main(args)
DEFAULT_VOID_LABELS = (0, 1, 2, 3, 4, 5, 6, 9, 10, 14, 15, 16, 18, 29, 30, -1)
DEFAULT_VALID_LABELS = (7, 8, 11, 12, 13, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 31, 32, 33)


def _create_synth_kitti_dataset(path_dir: str, image_dims: tuple = (1024, 512)):
    """Create a synthetic dataset of blank images, just to simulate that the dataset has already been downloaded.

    Args:
        path_dir: root folder; the images and masks are written below ``KITTI.IMAGE_PATH`` and ``KITTI.MASK_PATH``.
        image_dims: ``(width, height)`` of the generated images and masks.
    """
    path_dir_images = os.path.join(path_dir, KITTI.IMAGE_PATH)
    path_dir_masks = os.path.join(path_dir, KITTI.MASK_PATH)
    for p_dir in (path_dir_images, path_dir_masks):
        os.makedirs(p_dir, exist_ok=True)
    for i in range(3):
        # image and mask share the same file name so that they can be paired up by the dataset
        path_img = os.path.join(path_dir_images, f"dummy_kitti_{i}.png")
        Image.new("RGB", image_dims).save(path_img)
        path_mask = os.path.join(path_dir_masks, f"dummy_kitti_{i}.png")
        Image.new("L", image_dims).save(path_mask)


class KITTI(Dataset):
    """Class for KITTI Semantic Segmentation Benchmark dataset.

    Dataset link - http://www.cvlibs.net/datasets/kitti/eval_semseg.php?benchmark=semantics2015

    There are 34 classes in the given labels. However, not all of them are useful for training
    (like railings on highways, road dividers, etc.).
    So, these useless classes (the pixel values of these classes) are stored in the `void_labels`.
    The useful classes are stored in the `valid_labels`.

    The `encode_segmap` function sets all pixels with any of the `void_labels` (or with an unknown label)
    to `ignore_index` (250 by default). It also sets all of the valid pixels to the appropriate value
    between 0 and `len(valid_labels) - 1`, so it can be used properly by the loss function when comparing
    with the output.

    The `get_filenames` function retrieves the filenames of all images in the given `path` and
    returns them as a sorted list, so that images and masks with matching names end up at matching indices.

    In the `__getitem__` function, images and masks are resized to the given `img_size`, masks are
    encoded using `encode_segmap`, and given `transform` (if any) are applied to the image only
    (mask does not usually require transforms, but they can be implemented in a similar way).
    """

    IMAGE_PATH = os.path.join("training", "image_2")
    MASK_PATH = os.path.join("training", "semantic")

    def __init__(
        self,
        data_path: str,
        split: str,
        img_size: tuple = (1242, 376),
        void_labels: list = DEFAULT_VOID_LABELS,
        valid_labels: list = DEFAULT_VALID_LABELS,
        transform=None,
    ):
        """
        Args:
            data_path: root folder that contains the ``IMAGE_PATH`` and ``MASK_PATH`` sub-folders
            split: ``"train"`` selects the 80% training part, any other value selects the held-out 20%
            img_size: ``(width, height)`` every image and mask is resized to
            void_labels: raw label ids that are ignored during training
            valid_labels: raw label ids that are used for training
            transform: optional callable applied to the image (not to the mask)
        """
        self.img_size = img_size
        self.void_labels = void_labels
        self.valid_labels = valid_labels
        self.ignore_index = 250
        self.class_map = dict(zip(self.valid_labels, range(len(self.valid_labels))))
        self.transform = transform

        self.split = split
        self.data_path = data_path
        self.img_path = os.path.join(self.data_path, self.IMAGE_PATH)
        self.mask_path = os.path.join(self.data_path, self.MASK_PATH)
        self.img_list = self.get_filenames(self.img_path)
        self.mask_list = self.get_filenames(self.mask_path)

        # Split between train and valid set (80/20)
        random_inst = random.Random(12345)  # for repeatability
        n_items = len(self.img_list)
        idxs = random_inst.sample(range(n_items), n_items // 5)
        if self.split == "train":
            held_out = set(idxs)  # constant-time membership tests
            idxs = [idx for idx in range(n_items) if idx not in held_out]
        self.img_list = [self.img_list[i] for i in idxs]
        self.mask_list = [self.mask_list[i] for i in idxs]

    def __len__(self):
        return len(self.img_list)

    def __getitem__(self, idx):
        img = Image.open(self.img_list[idx])
        img = img.resize(self.img_size)
        img = np.array(img)

        mask = Image.open(self.mask_list[idx]).convert("L")
        # label ids are categorical: nearest-neighbour resampling keeps them intact, whereas an
        # interpolating filter would blend neighbouring ids into labels that do not exist in the mask
        mask = mask.resize(self.img_size, resample=Image.NEAREST)
        mask = np.array(mask)
        mask = self.encode_segmap(mask)

        if self.transform:
            img = self.transform(img)

        return img, mask

    def encode_segmap(self, mask):
        """Replace the raw label ids in ``mask`` with training ids (in place) and return ``mask``.

        Pixels holding one of the ``valid_labels`` get their class index from ``class_map``; pixels holding one
        of the ``void_labels`` or any other value are set to ``ignore_index`` so they won't be considered for
        training.
        """
        # build the result from the untouched input so that an already remapped pixel is never remapped again
        encoded = np.full_like(mask, self.ignore_index)
        for validc in self.valid_labels:
            encoded[mask == validc] = self.class_map[validc]
        # void labels take precedence over valid ones
        encoded[np.isin(mask, self.void_labels)] = self.ignore_index
        mask[...] = encoded
        return mask

    def get_filenames(self, path):
        """Returns a sorted list of the paths of all entries inside given `path`.

        Sorting makes the order deterministic (``os.listdir`` gives no ordering guarantee), which is required
        for the image list and the mask list to line up index by index.
        """
        return sorted(os.path.join(path, filename) for filename in os.listdir(path))
class UNet(nn.Module):
    """Architecture based on U-Net: Convolutional Networks for Biomedical Image Segmentation.

    Link - https://arxiv.org/abs/1505.04597

    >>> UNet(num_classes=2, num_layers=3)  # doctest: +ELLIPSIS +NORMALIZE_WHITESPACE
    UNet(
      (layers): ModuleList(
        (0): DoubleConv(...)
        (1): Down(...)
        (2): Down(...)
        (3): Up(...)
        (4): Up(...)
        (5): Conv2d(64, 2, kernel_size=(1, 1), stride=(1, 1))
      )
    )
    """

    def __init__(self, num_classes: int = 19, num_layers: int = 5, features_start: int = 64, bilinear: bool = False):
        """
        Args:
            num_classes: Number of output classes required (default 19 for KITTI dataset)
            num_layers: Number of layers in each side of U-net
            features_start: Number of features in first layer
            bilinear: Whether to use bilinear interpolation or transposed convolutions for upsampling.

        Raises:
            ValueError: If ``num_layers`` is smaller than 1.
        """
        if num_layers < 1:
            # fail early: with fewer than one layer ``forward`` would slice the layer list incorrectly
            raise ValueError(f"num_layers = {num_layers}, expected: num_layers > 0")

        super().__init__()
        self.num_layers = num_layers

        layers = [DoubleConv(3, features_start)]

        # contracting path: every step doubles the number of features
        feats = features_start
        for _ in range(num_layers - 1):
            layers.append(Down(feats, feats * 2))
            feats *= 2

        # expanding path: every step halves the number of features again
        for _ in range(num_layers - 1):
            layers.append(Up(feats, feats // 2, bilinear))
            feats //= 2

        layers.append(nn.Conv2d(feats, num_classes, kernel_size=1))

        self.layers = nn.ModuleList(layers)

    def forward(self, x):
        xi = [self.layers[0](x)]
        # Down path
        for layer in self.layers[1 : self.num_layers]:
            xi.append(layer(xi[-1]))
        # Up path: the i-th Up layer is fed the running output and the matching contracting-path output
        for i, layer in enumerate(self.layers[self.num_layers : -1]):
            xi[-1] = layer(xi[-1], xi[-2 - i])
        return self.layers[-1](xi[-1])


class DoubleConv(nn.Module):
    """Double Convolution and BN and ReLU (3x3 conv -> BN -> ReLU) ** 2.

    >>> DoubleConv(4, 4)  # doctest: +ELLIPSIS +NORMALIZE_WHITESPACE
    DoubleConv(
      (net): Sequential(...)
    )
    """

    def __init__(self, in_ch: int, out_ch: int):
        super().__init__()
        self.net = nn.Sequential(
            nn.Conv2d(in_ch, out_ch, kernel_size=3, padding=1),
            nn.BatchNorm2d(out_ch),
            nn.ReLU(inplace=True),
            nn.Conv2d(out_ch, out_ch, kernel_size=3, padding=1),
            nn.BatchNorm2d(out_ch),
            nn.ReLU(inplace=True),
        )

    def forward(self, x):
        return self.net(x)


class Down(nn.Module):
    """Combination of MaxPool2d and DoubleConv in series.

    >>> Down(4, 8)  # doctest: +ELLIPSIS +NORMALIZE_WHITESPACE
    Down(
      (net): Sequential(
        (0): MaxPool2d(kernel_size=2, stride=2, padding=0, dilation=1, ceil_mode=False)
        (1): DoubleConv(
          (net): Sequential(...)
        )
      )
    )
    """

    def __init__(self, in_ch: int, out_ch: int):
        super().__init__()
        self.net = nn.Sequential(nn.MaxPool2d(kernel_size=2, stride=2), DoubleConv(in_ch, out_ch))

    def forward(self, x):
        return self.net(x)


class Up(nn.Module):
    """Upsampling (by either bilinear interpolation or transpose convolutions) followed by concatenation of feature
    map from contracting path, followed by double 3x3 convolution.

    >>> Up(8, 4)  # doctest: +ELLIPSIS +NORMALIZE_WHITESPACE
    Up(
      (upsample): ConvTranspose2d(8, 4, kernel_size=(2, 2), stride=(2, 2))
      (conv): DoubleConv(
        (net): Sequential(...)
      )
    )
    """

    def __init__(self, in_ch: int, out_ch: int, bilinear: bool = False):
        super().__init__()
        # both variants double the spatial size and halve the number of channels
        if bilinear:
            self.upsample = nn.Sequential(
                nn.Upsample(scale_factor=2, mode="bilinear", align_corners=True),
                nn.Conv2d(in_ch, in_ch // 2, kernel_size=1),
            )
        else:
            self.upsample = nn.ConvTranspose2d(in_ch, in_ch // 2, kernel_size=2, stride=2)

        self.conv = DoubleConv(in_ch, out_ch)

    def forward(self, x1, x2):
        x1 = self.upsample(x1)

        # Pad x1 to the size of x2
        diff_h = x2.shape[2] - x1.shape[2]
        diff_w = x2.shape[3] - x1.shape[3]

        x1 = F.pad(x1, [diff_w // 2, diff_w - diff_w // 2, diff_h // 2, diff_h - diff_h // 2])

        # Concatenate along the channels axis
        x = torch.cat([x2, x1], dim=1)
        return self.conv(x)
class SegModel(LightningModule):
    """Semantic Segmentation Module.

    This is a basic semantic segmentation module implemented with Lightning.
    It uses CrossEntropyLoss as the default loss function. May be replaced with
    other loss functions as required.
    It is specific to KITTI dataset i.e. dataloaders are for KITTI
    and Normalize transform uses the mean and standard deviation of this dataset.
    It uses the UNet model defined in this module as an example.

    Adam optimizer is used along with Cosine Annealing learning rate scheduler.

    >>> dataset_path = os.path.join(".", "Kitti")
    >>> _create_synth_kitti_dataset(dataset_path, image_dims=(1024, 512))
    >>> SegModel(dataset_path)  # doctest: +ELLIPSIS +NORMALIZE_WHITESPACE
    SegModel(
      (net): UNet(
        (layers): ModuleList(
          (0): DoubleConv(...)
          (1): Down(...)
          (2): Down(...)
          (3): Up(...)
          (4): Up(...)
          (5): Conv2d(64, 19, kernel_size=(1, 1), stride=(1, 1))
        )
      )
    )
    """

    def __init__(
        self,
        data_path: str,
        batch_size: int = 4,
        lr: float = 1e-3,
        num_layers: int = 3,
        features_start: int = 64,
        bilinear: bool = False,
        **kwargs,
    ):
        """
        Args:
            data_path: root folder of the KITTI dataset
            batch_size: batch size used by the train and validation dataloaders
            lr: learning rate of the Adam optimizer
            num_layers: forwarded to ``UNet``
            features_start: forwarded to ``UNet``
            bilinear: forwarded to ``UNet``
            **kwargs: forwarded to the ``LightningModule`` constructor
        """
        super().__init__(**kwargs)
        self.data_path = data_path
        self.batch_size = batch_size
        self.lr = lr
        self.num_layers = num_layers
        self.features_start = features_start
        self.bilinear = bilinear

        self.net = UNet(
            num_classes=19, num_layers=self.num_layers, features_start=self.features_start, bilinear=self.bilinear
        )
        self.transform = transforms.Compose(
            [
                transforms.ToTensor(),
                transforms.Normalize(
                    mean=[0.35675976, 0.37380189, 0.3764753], std=[0.32064945, 0.32098866, 0.32325324]
                ),
            ]
        )
        self.trainset = KITTI(self.data_path, split="train", transform=self.transform)
        self.validset = KITTI(self.data_path, split="valid", transform=self.transform)

    def forward(self, x):
        return self.net(x)

    def training_step(self, batch, batch_nb):
        """Compute the cross-entropy loss of one training batch, log it and return it."""
        img, mask = batch
        img = img.float()
        mask = mask.long()
        out = self(img)
        loss = F.cross_entropy(out, mask, ignore_index=250)
        # log explicitly instead of returning the legacy ``log``/``progress_bar`` dictionary entries
        self.log("train_loss", loss, prog_bar=True)
        return loss

    def validation_step(self, batch, batch_idx):
        """Compute and log the cross-entropy loss of one validation batch."""
        img, mask = batch
        img = img.float()
        mask = mask.long()
        out = self(img)
        val_loss = F.cross_entropy(out, mask, ignore_index=250)
        self.log("val_loss", val_loss, prog_bar=True)

    def configure_optimizers(self):
        """Return the Adam optimizer and its cosine-annealing learning rate scheduler."""
        # the learning rate is stored as ``self.lr`` in ``__init__``
        opt = torch.optim.Adam(self.net.parameters(), lr=self.lr)
        sch = torch.optim.lr_scheduler.CosineAnnealingLR(opt, T_max=10)
        return [opt], [sch]

    def train_dataloader(self):
        return DataLoader(self.trainset, batch_size=self.batch_size, shuffle=True)

    def val_dataloader(self):
        return DataLoader(self.validset, batch_size=self.batch_size, shuffle=False)


def main(hparams: Namespace):
    """Build the segmentation model from the parsed arguments and train it with a default ``Trainer``."""
    # ------------------------
    # 1 INIT LIGHTNING MODEL
    # ------------------------
    model = SegModel(**vars(hparams))

    # ------------------------
    # 2 INIT TRAINER
    # ------------------------
    trainer = Trainer()

    # ------------------------
    # 3 START TRAINING
    # ------------------------
    trainer.fit(model)


if __name__ == "__main__":
    cli_lightning_logo()

    parser = ArgumentParser()
    # the model cannot be built without a dataset location, so fail with a clear message when it is missing
    parser.add_argument("--data_path", type=str, required=True, help="path where dataset is stored")
    parser.add_argument("--batch_size", type=int, default=16, help="size of the batches")
    parser.add_argument("--lr", type=float, default=0.001, help="adam: learning rate")
    parser.add_argument("--num_layers", type=int, default=5, help="number of layers on u-net")
    # a channel count has to be an integer
    parser.add_argument("--features_start", type=int, default=64, help="number of features in first layer")
    parser.add_argument(
        "--bilinear", action="store_true", default=False, help="whether to use bilinear interpolation or transposed"
    )
    hparams = parser.parse_args()

    main(hparams)
class LitClassifier(LightningModule):
    """MNIST classifier made of a single linear layer followed by a ReLU."""

    def __init__(self):
        super().__init__()
        self.l1 = torch.nn.Linear(28 * 28, 10)

    def forward(self, x):
        """Flatten every sample of the batch and return the ReLU-activated output of the linear layer."""
        flattened = x.view(x.size(0), -1)
        return torch.relu(self.l1(flattened))

    def training_step(self, batch, batch_idx):
        """Return the cross-entropy loss of the batch."""
        inputs, targets = batch
        return F.cross_entropy(self(inputs), targets)

    def validation_step(self, batch, batch_idx):
        """Log the accuracy of the batch as ``val_acc``."""
        inputs, targets = batch
        outputs = self(inputs)
        self.log("val_acc", self.accuracy(outputs, targets))

    def test_step(self, batch, batch_idx):
        """Log the accuracy of the batch as ``test_acc``."""
        inputs, targets = batch
        outputs = self(inputs)
        self.log("test_acc", self.accuracy(outputs, targets))

    @staticmethod
    def accuracy(logits, y):
        """Return the fraction of samples whose highest-scoring class equals the target."""
        predictions = torch.argmax(logits, -1)
        hits = torch.eq(predictions, y).to(torch.float32)
        return torch.sum(hits) / len(y)

    def configure_optimizers(self):
        """Return an Adam optimizer over all parameters with a learning rate of 0.02."""
        return torch.optim.Adam(self.parameters(), lr=0.02)
datamodule=cli.datamodule) diff --git a/examples/pytorch/hpu/ops_bf16_mnist.txt b/examples/pytorch/hpu/ops_bf16_mnist.txt new file mode 100644 index 0000000..53ec99c --- /dev/null +++ b/examples/pytorch/hpu/ops_bf16_mnist.txt @@ -0,0 +1,2 @@ +linear +relu diff --git a/examples/pytorch/hpu/ops_fp32_mnist.txt b/examples/pytorch/hpu/ops_fp32_mnist.txt new file mode 100644 index 0000000..4509b7e --- /dev/null +++ b/examples/pytorch/hpu/ops_fp32_mnist.txt @@ -0,0 +1 @@ +cross_entropy diff --git a/examples/pytorch/ipu/mnist_sample.py b/examples/pytorch/ipu/mnist_sample.py new file mode 100644 index 0000000..8cef121 --- /dev/null +++ b/examples/pytorch/ipu/mnist_sample.py @@ -0,0 +1,84 @@ +# Copyright The Lightning AI team. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. 
class LitClassifier(LightningModule):
    """Two-layer MNIST classifier that aggregates its validation/test accuracy at the end of each epoch."""

    def __init__(self, hidden_dim: int = 128, learning_rate: float = 0.0001):
        """
        Args:
            hidden_dim: number of units of the hidden linear layer
            learning_rate: learning rate of the Adam optimizer
        """
        super().__init__()
        self.save_hyperparameters()

        self.l1 = torch.nn.Linear(28 * 28, self.hparams.hidden_dim)
        self.l2 = torch.nn.Linear(self.hparams.hidden_dim, 10)

        # per-batch accuracies collected by the step methods and reduced in the epoch-end hooks
        self.val_outputs = []
        self.test_outputs = []

    def forward(self, x):
        x = x.view(x.size(0), -1)
        x = torch.relu(self.l1(x))
        x = torch.relu(self.l2(x))
        return x

    def training_step(self, batch, batch_idx):
        x, y = batch
        y_hat = self(x)
        return F.cross_entropy(y_hat, y)

    def validation_step(self, batch, batch_idx):
        x, y = batch
        logits = self(x)
        acc = self.accuracy(logits, y)
        self.val_outputs.append(acc)
        return acc

    def test_step(self, batch, batch_idx):
        x, y = batch
        logits = self(x)
        acc = self.accuracy(logits, y)
        self.test_outputs.append(acc)
        return acc

    def accuracy(self, logits, y):
        # currently IPU poptorch doesn't implicit convert bools to tensor
        # hence we use an explicit calculation for accuracy here. Once fixed in poptorch
        # we can use the accuracy metric.
        return torch.sum(torch.eq(torch.argmax(logits, -1), y).to(torch.float32)) / len(y)

    def on_validation_epoch_end(self) -> None:
        # since the training step/validation step and test step are run on the IPU device
        # we must log the average accuracy outside the step functions.
        self.log("val_acc", torch.stack(self.val_outputs).mean(), prog_bar=True)
        self.val_outputs.clear()

    def on_test_epoch_end(self) -> None:
        self.log("test_acc", torch.stack(self.test_outputs).mean())
        self.test_outputs.clear()

    def configure_optimizers(self):
        return torch.optim.Adam(self.parameters(), lr=self.hparams.learning_rate)


if __name__ == "__main__":
    dm = MNISTDataModule(batch_size=32)
    model = LitClassifier()
    trainer = Trainer(max_epochs=2, accelerator="ipu", devices=8)

    trainer.fit(model, datamodule=dm)
    trainer.test(model, datamodule=dm)
class CIFAR10DataModule(LightningDataModule):
    """Provide CIFAR10 train/validation dataloaders, resized and center-cropped to 224x224."""

    transform = T.Compose([T.Resize(256), T.CenterCrop(224), T.ToTensor()])

    def train_dataloader(self, *args, **kwargs):
        trainset = torchvision.datasets.CIFAR10(root=DATASETS_PATH, train=True, download=True, transform=self.transform)
        return torch.utils.data.DataLoader(trainset, batch_size=2, shuffle=True, num_workers=0)

    def val_dataloader(self, *args, **kwargs):
        valset = torchvision.datasets.CIFAR10(root=DATASETS_PATH, train=False, download=True, transform=self.transform)
        # keep the validation order fixed so that the validation loss is comparable between runs
        return torch.utils.data.DataLoader(valset, batch_size=2, shuffle=False, num_workers=0)


@dataclass(unsafe_hash=True)
class Image:
    """Deserializer turning a base64-encoded image into a batched tensor."""

    # target size; the image is only resized when both values are set
    height: Optional[int] = None
    width: Optional[int] = None
    extension: str = "JPEG"
    mode: str = "RGB"
    channel_first: bool = False

    def deserialize(self, data: str) -> torch.Tensor:
        """Decode the base64 string ``data`` into an image and return it as a tensor with a leading batch
        dimension."""
        # extra padding is appended before decoding -- presumably so that inputs whose trailing "="
        # characters were stripped still decode
        encoded_with_padding = (data + "===").encode("UTF-8")
        img = base64.b64decode(encoded_with_padding)
        buffer = BytesIO(img)
        img = PILImage.open(buffer, mode="r")
        if self.height and self.width:
            img = img.resize((self.width, self.height))
        arr = np.array(img)
        return T.ToTensor()(arr).unsqueeze(0)


class Top1:
    """Serializer returning the index of the most probable class."""

    def serialize(self, tensor: torch.Tensor) -> int:
        """Return the flat index of the largest softmax probability in ``tensor``."""
        # the class dimension is passed explicitly; relying on the implicit dimension is deprecated
        return torch.nn.functional.softmax(tensor, dim=-1).argmax().item()


class ProductionReadyModel(LitModule, ServableModule):
    """``LitModule`` extended with the hooks required to serve it."""

    def configure_payload(self):
        """Build an example request body from the first training sample."""
        # 1: Access the train dataloader and load a single sample.
        image, _ = self.trainer.train_dataloader.dataset[0]

        # 2: Convert the image into a PIL Image to bytes and encode it with base64
        pil_image = T.ToPILImage()(image)
        buffered = BytesIO()
        pil_image.save(buffered, format="JPEG")
        img_str = base64.b64encode(buffered.getvalue()).decode("UTF-8")

        return {"body": {"x": img_str}}

    def configure_serialization(self):
        """Return the input deserializers and the output serializers, keyed by field name."""
        return {"x": Image(224, 224).deserialize}, {"output": Top1().serialize}

    def serve_step(self, x: torch.Tensor) -> Dict[str, torch.Tensor]:
        """Run the model on the deserialized input."""
        return {"output": self.model(x)}

    def configure_response(self):
        """Return the response expected for the example payload."""
        return {"output": 7}


def cli_main():
    """Fit ``ProductionReadyModel`` on CIFAR10 for a few batches on CPU with the servable validator enabled."""
    cli = LightningCLI(
        ProductionReadyModel,
        CIFAR10DataModule,
        seed_everything_default=42,
        save_config_kwargs={"overwrite": True},
        run=False,
        trainer_defaults={
            "accelerator": "cpu",
            "callbacks": [ServableModuleValidator()],
            "max_epochs": 1,
            "limit_train_batches": 5,
            "limit_val_batches": 5,
        },
    )
    cli.trainer.fit(cli.model, cli.datamodule)


if __name__ == "__main__":
    cli_lightning_logo()
    cli_main()
+set -ex + +export PYTHONPATH="${PYTHONPATH}:$(pwd)" +dir_path=$(dirname "${BASH_SOURCE[0]}") + +args="--epochs=1" +python -m lightning_fabric.cli "${dir_path}/fabric/image_classifier/train_fabric.py" ${args} "$@" diff --git a/examples/run_pl_examples.sh b/examples/run_pl_examples.sh new file mode 100644 index 0000000..0d5410d --- /dev/null +++ b/examples/run_pl_examples.sh @@ -0,0 +1,36 @@ +#!/bin/bash +# Copyright The Lightning AI team. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. +set -ex + +export PYTHONPATH="${PYTHONPATH}:$(pwd)" +dir_path=$(dirname "${BASH_SOURCE[0]}") +args=" + --data.batch_size=32 + --trainer.max_epochs=1 + --trainer.limit_train_batches=2 + --trainer.limit_val_batches=2 + --trainer.limit_test_batches=2 + --trainer.limit_predict_batches=2 + --optimizer=Adam +" + +python "${dir_path}/pytorch/basics/backbone_image_classifier.py" ${args} "$@" +python "${dir_path}/pytorch/basics/autoencoder.py" ${args} "$@" + + +# test that a user can manually launch individual processes +args="--trainer.devices 2 --trainer.strategy ddp --trainer.max_epochs=1 --trainer.limit_train_batches=1 --trainer.limit_val_batches=1 --trainer.limit_test_batches=1" +MASTER_ADDR="localhost" MASTER_PORT=1234 LOCAL_RANK=1 python "${dir_path}/pytorch/basics/autoencoder.py" ${args} & +MASTER_ADDR="localhost" MASTER_PORT=1234 LOCAL_RANK=0 python "${dir_path}/pytorch/basics/autoencoder.py" ${args} diff --git a/requirements.txt b/requirements.txt index 52c1fc7..4cdb001 100644 --- 
a/requirements.txt +++ b/requirements.txt @@ -1,24 +1,7 @@ -# docs requirements -# from pytorch-lightning/requirements/docs.txt -sphinx>=4.0,<5.0 -myst-parser>=0.15,<0.17 -nbsphinx>=0.8.5 -ipython[notebook] -pandoc>=1.0 -docutils>=0.16 -sphinxcontrib-fulltoc>=1.0 -sphinxcontrib-mockautodoc -sphinx-autodoc-typehints>=1.11,<1.15 # v1.15 failing on master (#11405) -sphinx-paramlinks>=0.5.1 -sphinx-togglebutton>=0.2 -sphinx-copybutton>=0.3 -typing-extensions # already in `requirements.txt` but the docs CI job does not install it -jinja2>=3.0.0,<3.1.0 +# instead of install from source, use the pre-built wheel +lightning -# -r ../_notebooks/.actions/requirements.txt - -# switch sphinx theme to PyTorchKorea's -pt-lightning-sphinx-theme @ https://github.com/PyTorchKorea/lightning_sphinx_theme/archive/master.zip - -# PyTorch Lightning -pytorch-lightning==1.6.4 +# the default package dependencies +-r ./requirements/app/base.txt +-r ./requirements/pytorch/base.txt +-r ./requirements/pytorch/docs.txt \ No newline at end of file diff --git a/requirements/README.md b/requirements/README.md new file mode 100644 index 0000000..5b408f3 --- /dev/null +++ b/requirements/README.md @@ -0,0 +1,12 @@ +# Project Requirements + +This root requirements folder branches into sub-folders depending on the python package. +Within the folder, we have grouped requirements files/lists per focus, which shall closely match the package extras. +So, for example, when you install PL as `pip install pytorch-lightning[extra]`, this list is stored in `requirements/pytorch/extra.txt`. + +## CI/CD upper bounds + +For CI stability, we have set upper bounds (the latest version) for all package versions, so with any sudden release, we won't put our development on fire. +The continuous updating of these upper bounds is managed by dependabot. +Note that these upper bounds are lifted when installing a package from the source or as a package. 
+If you want to preserve/enforce restrictions on the latest compatible version, add "strict" as an in-line comment. diff --git a/requirements/_integrations/accelerators.txt b/requirements/_integrations/accelerators.txt new file mode 100644 index 0000000..cfdb7d6 --- /dev/null +++ b/requirements/_integrations/accelerators.txt @@ -0,0 +1,3 @@ +# validation HPU connectors +lightning-habana >=0.1.0 +lightning-graphcore >=0.1.0.rc3 diff --git a/requirements/_integrations/strategies.txt b/requirements/_integrations/strategies.txt new file mode 100644 index 0000000..3227549 --- /dev/null +++ b/requirements/_integrations/strategies.txt @@ -0,0 +1,5 @@ +# NOTE: the upper bound for the package version is only set for CI stability, and it is dropped while installing this package +# in case you want to preserve/enforce restrictions on the latest compatible version, add "strict" as an in-line comment + +lightning-colossalai >=0.1.0 +lightning-bagua >=0.1.0 diff --git a/requirements/app/base.txt b/requirements/app/base.txt new file mode 100644 index 0000000..edeb5ad --- /dev/null +++ b/requirements/app/base.txt @@ -0,0 +1,30 @@ +lightning-cloud >=0.5.37 +packaging +typing-extensions >=4.0.0, <=4.7.1 +deepdiff >=5.7.0, <6.3.2 +starsessions >=1.2.1, <2.0 # strict +fsspec >=2022.5.0, <=2023.6.0 +croniter >=1.3.0, <1.5.0 # strict; TODO: for now until we find something more robust. 
+traitlets >=5.3.0, <5.10.0 +arrow >=1.2.0, <1.2.4 +lightning-utilities >=0.8.0, <0.10.0 +beautifulsoup4 >=4.8.0, <4.12.3 +inquirer >=2.10.0, <=3.1.3 +psutil <5.9.5 +click <=8.1.3 +python-multipart>=0.0.5, <=0.0.6 +backoff >=2.2.1, <2.3.0 + +fastapi >=0.92.0, <0.100.0 +starlette # https://fastapi.tiangolo.com/deployment/versions/#about-starlette +pydantic >=1.7.4, <2.1.0 # strict # https://fastapi.tiangolo.com/deployment/versions/#about-pydantic + +dateutils <=0.6.12 +Jinja2 <=3.1.2 +PyYAML <=6.0 +requests <2.31.1 +rich >=12.3.0, <=13.4.2 +urllib3 <=2.0.2 +uvicorn <=0.22.0 +websocket-client <1.6.2 +websockets <=11.0.3 diff --git a/requirements/app/cloud.txt b/requirements/app/cloud.txt new file mode 100644 index 0000000..d7a9d2a --- /dev/null +++ b/requirements/app/cloud.txt @@ -0,0 +1,4 @@ +redis >=4.0.1, <=4.6.0 +docker >=5.0.0, <6.1.4 +s3fs >=2022.5.0, <2023.6.1 +# setuptools==59.5.0 diff --git a/requirements/app/components.txt b/requirements/app/components.txt new file mode 100644 index 0000000..b821f7a --- /dev/null +++ b/requirements/app/components.txt @@ -0,0 +1,5 @@ +# deps required by components in the lightning app repository (src/lightning/app/components) +lightning_api_access >=0.0.3 # serve +aiohttp >=3.8.0, <=3.8.4 # auto_scaler +lightning-fabric >=1.9.0 # multinode +pytorch-lightning >=1.9.0 # multinode diff --git a/requirements/app/docs.txt b/requirements/app/docs.txt new file mode 100644 index 0000000..4f5c18a --- /dev/null +++ b/requirements/app/docs.txt @@ -0,0 +1,5 @@ +-r ../docs.txt + +# lai-sphinx-theme is not installable +# refer: https://github.com/Lightning-AI/lightning/issues/16158 +# lai-sphinx-theme diff --git a/requirements/app/test.txt b/requirements/app/test.txt new file mode 100644 index 0000000..f9cd551 --- /dev/null +++ b/requirements/app/test.txt @@ -0,0 +1,16 @@ +coverage ==7.2.7 +pytest ==7.3.1 +pytest-timeout ==2.1.0 +pytest-cov ==4.0.0 +pytest-doctestplus >=0.9.0 +pytest-asyncio ==0.21.0 +# pytest-random-order ==1.1.0 
+pytest-rerunfailures <=11.1.2 + +playwright ==1.35.0 +httpx ==0.24.1 +trio <0.22.0 # strict https://github.com/python-trio/trio/pull/2213 +pympler +psutil <=5.9.5 +setuptools <67.7.0 +requests-mock <=1.10.0 diff --git a/requirements/app/ui.txt b/requirements/app/ui.txt new file mode 100644 index 0000000..6ba6bbc --- /dev/null +++ b/requirements/app/ui.txt @@ -0,0 +1,2 @@ +streamlit >=1.13.0, <1.22.1 +panel >=1.0.0, <=1.1.1 diff --git a/requirements/base.txt b/requirements/base.txt new file mode 100644 index 0000000..fe77f77 --- /dev/null +++ b/requirements/base.txt @@ -0,0 +1,36 @@ +Jinja2<4.0 +PyYAML<7.0 +PyYAML<7.0,>=5.4 +arrow<2.0,>=1.2.0 +backoff<3.0,>=2.2.1 +beautifulsoup4<5.0,>=4.8.0 +click<9.0 +croniter<1.5.0,>=1.3.0 # strict +dateutils<1.0 +deepdiff<7.0,>=5.7.0 +fastapi<1.0,>=0.92.0 +fsspec<2024.0,>=2022.5.0 +fsspec[http]<2024.0,>2021.06.0 +inquirer<4.0,>=2.10.0 +lightning-cloud>=0.5.37 +lightning-utilities<1.0,>=0.8.0 +numpy<2.0,>=1.17.2 +packaging +packaging<24.0,>=20.0 +psutil<6.0 +pydantic<2.1.0,>=1.7.4 # strict +python-multipart<1.0,>=0.0.5 +requests<3.0 +rich<14.0,>=12.3.0 +starlette +starsessions<2.0,>=1.2.1 # strict +torch<3.0,>=1.11.0 +torchmetrics<2.0,>=0.7.0 +tqdm<5.0,>=4.57.0 +traitlets<6.0,>=5.3.0 +typing-extensions<5.0,>=4.0.0 +urllib3<3.0 +uvicorn<1.0 +websocket-client<2.0 +websockets<12.0 + diff --git a/requirements/collect_env_details.py b/requirements/collect_env_details.py new file mode 100644 index 0000000..3dd2b8d --- /dev/null +++ b/requirements/collect_env_details.py @@ -0,0 +1,87 @@ +# Copyright The Lightning AI team. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. 
+# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. +"""Diagnose your system and show basic information. + +This server mainly to get detail info for better bug reporting. +""" + +import os +import platform +import sys + +import pkg_resources +import torch + +sys.path += [os.path.abspath(".."), os.path.abspath("")] + + +LEVEL_OFFSET = "\t" +KEY_PADDING = 20 + + +def info_system() -> dict: + return { + "OS": platform.system(), + "architecture": platform.architecture(), + "version": platform.version(), + "release": platform.release(), + "processor": platform.processor(), + "python": platform.python_version(), + } + + +def info_cuda() -> dict: + return { + "GPU": [torch.cuda.get_device_name(i) for i in range(torch.cuda.device_count())] or None, + "available": torch.cuda.is_available(), + "version": torch.version.cuda, + } + + +def info_packages() -> dict: + """Get name and version of all installed packages.""" + packages = {} + for dist in pkg_resources.working_set: + package = dist.as_requirement() + packages[package.key] = package.specs[0][1] + return packages + + +def nice_print(details: dict, level: int = 0) -> list: + lines = [] + for k in sorted(details): + key = f"* {k}:" if level == 0 else f"- {k}:" + if isinstance(details[k], dict): + lines += [level * LEVEL_OFFSET + key] + lines += nice_print(details[k], level + 1) + elif isinstance(details[k], (set, list, tuple)): + lines += [level * LEVEL_OFFSET + key] + lines += [(level + 1) * LEVEL_OFFSET + "- " + v for v in details[k]] + else: + template = "{:%is} {}" % KEY_PADDING + key_val = template.format(key, details[k]) + lines += [(level * LEVEL_OFFSET) + 
key_val] + return lines + + +def main() -> None: + details = {"System": info_system(), "CUDA": info_cuda(), "Packages": info_packages()} + details["Lightning"] = {k: v for k, v in details["Packages"].items() if "torch" in k or "lightning" in k} + lines = nice_print(details) + text = os.linesep.join(lines) + print(f"
<details>\n  <summary>Current environment</summary>\n\n{text}\n\n</details>
") + + +if __name__ == "__main__": + main() diff --git a/requirements/data/cloud.txt b/requirements/data/cloud.txt new file mode 100644 index 0000000..950fb4b --- /dev/null +++ b/requirements/data/cloud.txt @@ -0,0 +1,5 @@ +# NOTE: the upper bound for the package version is only set for CI stability, and it is dropped while installing this package +# in case you want to preserve/enforce restrictions on the latest compatible version, add "strict" as an in-line comment + +fsspec[http] >2021.06.0, <2023.5.0 +s3fs >=2022.5.0, <=2023.6.0 diff --git a/requirements/data/data.txt b/requirements/data/data.txt new file mode 100644 index 0000000..4fa81bd --- /dev/null +++ b/requirements/data/data.txt @@ -0,0 +1,8 @@ +# NOTE: the upper bound for the package version is only set for CI stability, and it is dropped while installing this package +# in case you want to preserve/enforce restrictions on the latest compatible version, add "strict" as an in-line comment + +lightning-utilities >=0.8.0, <0.10.0 +# to be able to include also 0.6 and preserve `>` needed for CI min version bypass +torchdata >0.5.9, <0.7.0 +# to be able to include also PL 2.0 and preserve `>` needed for CI min version bypass +torch >0.14.0, <2.1.0 diff --git a/requirements/data/examples.txt b/requirements/data/examples.txt new file mode 100644 index 0000000..4daff66 --- /dev/null +++ b/requirements/data/examples.txt @@ -0,0 +1,3 @@ +Pillow >= 9.5.0 +# min version to match torch >= 2.0.1 +torchvision >=0.15.2, <=0.16 diff --git a/requirements/data/test.txt b/requirements/data/test.txt new file mode 100644 index 0000000..55459ea --- /dev/null +++ b/requirements/data/test.txt @@ -0,0 +1,5 @@ +coverage ==7.2.7 +pytest ==7.3.1 +pytest-cov ==4.0.0 +pytest-rerunfailures ==10.3 +pytest-random-order ==1.1.0 diff --git a/requirements/docs.txt b/requirements/docs.txt new file mode 100644 index 0000000..b4bd535 --- /dev/null +++ b/requirements/docs.txt @@ -0,0 +1,19 @@ +sphinx >=4.0, <5.0 +myst-parser >=0.18.1, <1.0.0 
+nbsphinx >=0.8.5, <=0.8.9 +pandoc >=1.0, <=2.3 +docutils >=0.16, <0.21 +sphinxcontrib-fulltoc >=1.0, <=1.2.0 +sphinxcontrib-mockautodoc +sphinx-autobuild +sphinx-autodoc-typehints >=1.16 +sphinx-paramlinks >=0.5.1, <=0.5.4 +sphinx-togglebutton >=0.2, <=0.3.2 +sphinx-copybutton >=0.3, <=0.5.2 +sphinx-multiproject +sphinx-toolbox ==3.4.0 +sphinx-rtd-dark-mode +sphinxcontrib-video ==0.2.0 +jinja2 <3.2.0 + +lightning-utilities >=0.9.0 diff --git a/requirements/fabric/base.txt b/requirements/fabric/base.txt new file mode 100644 index 0000000..6f479b8 --- /dev/null +++ b/requirements/fabric/base.txt @@ -0,0 +1,9 @@ +# NOTE: the upper bound for the package version is only set for CI stability, and it is dropped while installing this package +# in case you want to preserve/enforce restrictions on the latest compatible version, add "strict" as an in-line comment + +numpy >=1.17.2, <1.25.1 +torch >=1.11.0, <2.1.0 +fsspec[http]>2021.06.0, <2023.5.0 +packaging >=20.0, <=23.0 +typing-extensions >=4.0.0, <=4.7.1 +lightning-utilities >=0.8.0, <0.10.0 diff --git a/requirements/fabric/docs.txt b/requirements/fabric/docs.txt new file mode 100644 index 0000000..3d55fb8 --- /dev/null +++ b/requirements/fabric/docs.txt @@ -0,0 +1,5 @@ +-r ../docs.txt + +# pt-lightning-sphinx-theme @ https://github.com/Lightning-AI/lightning_sphinx_theme/archive/master.zip +pt-lightning-sphinx-theme @ https://github.com/PyTorchKorea/lightning_sphinx_theme/archive/master.zip +tensorboard diff --git a/requirements/fabric/examples.txt b/requirements/fabric/examples.txt new file mode 100644 index 0000000..b609512 --- /dev/null +++ b/requirements/fabric/examples.txt @@ -0,0 +1,5 @@ +# NOTE: the upper bound for the package version is only set for CI stability, and it is dropped while installing this package +# in case you want to preserve/enforce restrictions on the latest compatible version, add "strict" as an in-line comment +torchvision >=0.12.0, <=0.15.2 +torchmetrics >=0.10.0, <0.12.0 
+lightning-utilities >=0.8.0, <0.10.0 diff --git a/requirements/fabric/strategies.txt b/requirements/fabric/strategies.txt new file mode 100644 index 0000000..dba2b79 --- /dev/null +++ b/requirements/fabric/strategies.txt @@ -0,0 +1,3 @@ +# NOTE: the upper bound for the package version is only set for CI stability, and it is dropped while installing this package +# in case you want to preserve/enforce restrictions on the latest compatible version, add "strict" as an in-line comment +deepspeed >=0.8.2, <=0.9.3; platform_system != "Windows" diff --git a/requirements/fabric/test.txt b/requirements/fabric/test.txt new file mode 100644 index 0000000..a26e7e0 --- /dev/null +++ b/requirements/fabric/test.txt @@ -0,0 +1,8 @@ +coverage ==7.2.7 +pytest ==7.3.1 +pytest-cov ==4.0.0 +pytest-rerunfailures ==10.3 +pytest-random-order ==1.1.0 +click ==8.1.3 +tensorboardX >=2.2, <=2.6.1 # min version is set by torch.onnx missing attribute +torchmetrics >=0.7.0, <1.1.0 # needed for using fixed compare_version diff --git a/requirements/pytorch/base.txt b/requirements/pytorch/base.txt new file mode 100644 index 0000000..6f685aa --- /dev/null +++ b/requirements/pytorch/base.txt @@ -0,0 +1,12 @@ +# NOTE: the upper bound for the package version is only set for CI stability, and it is dropped while installing this package +# in case you want to preserve/enforce restrictions on the latest compatible version, add "strict" as an in-line comment + +numpy >=1.17.2, <1.25.1 +torch >=1.11.0, <2.1.0 +tqdm >=4.57.0, <4.66.0 +PyYAML >=5.4, <=6.0 +fsspec[http] >2021.06.0, <2023.5.0 +torchmetrics >=0.7.0, <1.1.0 # needed for using fixed compare_version +packaging >=20.0, <=23.0 +typing-extensions >=4.0.0, <=4.7.1 +lightning-utilities >=0.8.0, <0.10.0 diff --git a/requirements/pytorch/check-avail-extras.py b/requirements/pytorch/check-avail-extras.py new file mode 100644 index 0000000..3ab8d28 --- /dev/null +++ b/requirements/pytorch/check-avail-extras.py @@ -0,0 +1,6 @@ +if __name__ == "__main__": + 
import hydra # noqa: F401 + import jsonargparse # noqa: F401 + import matplotlib # noqa: F401 + import omegaconf # noqa: F401 + import rich # noqa: F401 diff --git a/requirements/pytorch/docs.txt b/requirements/pytorch/docs.txt new file mode 100644 index 0000000..ff76cdc --- /dev/null +++ b/requirements/pytorch/docs.txt @@ -0,0 +1,11 @@ +-r ../docs.txt + +# ipython[notebook] <8.7.0 +ipython[notebook]==8.10 +# setuptools<58.0 # workaround for `error in ipython setup command: use_2to3 is invalid.` +setuptools==65.5.1 + +# pt-lightning-sphinx-theme @ https://github.com/Lightning-AI/lightning_sphinx_theme/archive/master.zip +pt-lightning-sphinx-theme@https://github.com/PyTorchKorea/lightning_sphinx_theme/archive/master.zip + +-r ../../_notebooks/.actions/requires.txt diff --git a/requirements/pytorch/examples.txt b/requirements/pytorch/examples.txt new file mode 100644 index 0000000..65ed18b --- /dev/null +++ b/requirements/pytorch/examples.txt @@ -0,0 +1,7 @@ +# NOTE: the upper bound for the package version is only set for CI stability, and it is dropped while installing this package +# in case you want to preserve/enforce restrictions on the latest compatible version, add "strict" as an in-line comment +torchvision >=0.12.0, <=0.15.2 +gym[classic_control] >=0.17.0, <0.26.3 +ipython[all] <8.14.1 +torchmetrics >=0.10.0, <0.12.0 +lightning-utilities >=0.7.0, <0.10.0 diff --git a/requirements/pytorch/extra.txt b/requirements/pytorch/extra.txt new file mode 100644 index 0000000..414d9bf --- /dev/null +++ b/requirements/pytorch/extra.txt @@ -0,0 +1,10 @@ +# NOTE: the upper bound for the package version is only set for CI stability, and it is dropped while installing this package +# in case you want to preserve/enforce restrictions on the latest compatible version, add "strict" as an in-line comment + +# extended list of package dependencies to reach full functionality +matplotlib>3.1, <3.6.2 +omegaconf >=2.0.5, <2.4.0 +hydra-core >=1.0.5, <1.4.0 +jsonargparse[signatures] 
>=4.18.0, <4.23.0 +rich >=12.3.0, <=13.4.2 +tensorboardX >=2.2, <=2.6.1 # min version is set by torch.onnx missing attribute diff --git a/requirements/pytorch/loggers.info b/requirements/pytorch/loggers.info new file mode 100644 index 0000000..ad8c6a8 --- /dev/null +++ b/requirements/pytorch/loggers.info @@ -0,0 +1,6 @@ +# all supported loggers. this list is here as a reference, but they are not installed in CI +neptune +comet-ml +mlflow >=1.0.0 +wandb >=0.12.0 +tensorboard >=2.9.1 diff --git a/requirements/pytorch/strategies.txt b/requirements/pytorch/strategies.txt new file mode 100644 index 0000000..dba2b79 --- /dev/null +++ b/requirements/pytorch/strategies.txt @@ -0,0 +1,3 @@ +# NOTE: the upper bound for the package version is only set for CI stability, and it is dropped while installing this package +# in case you want to preserve/enforce restrictions on the latest compatible version, add "strict" as an in-line comment +deepspeed >=0.8.2, <=0.9.3; platform_system != "Windows" diff --git a/requirements/pytorch/test.txt b/requirements/pytorch/test.txt new file mode 100644 index 0000000..12ce033 --- /dev/null +++ b/requirements/pytorch/test.txt @@ -0,0 +1,19 @@ +coverage ==7.2.7 +pytest ==7.3.1 +pytest-cov ==4.0.0 +pytest-forked ==1.4.0 +pytest-rerunfailures ==10.3 +pytest-random-order ==1.1.0 + +# needed in tests +cloudpickle >=1.3, <2.3.0 +scikit-learn >0.22.1, <1.3.1 +onnx <1.15.0 +onnxruntime <1.16.0 +psutil <5.9.5 # for `DeviceStatsMonitor` +pandas >1.0, <2.0.3 # needed in benchmarks +fastapi <0.100.0 # for `ServableModuleValidator` +uvicorn <0.22.1 # for `ServableModuleValidator` + +tensorboard >=2.9.1, <2.14.0 # for `TensorBoardLogger` +protobuf <=3.20.1 # strict # an extra is updating protobuf, this pin prevents TensorBoard failure diff --git a/requirements/typing.txt b/requirements/typing.txt new file mode 100644 index 0000000..ba7adf0 --- /dev/null +++ b/requirements/typing.txt @@ -0,0 +1,20 @@ +mypy==1.4.1 +torch==2.0.1 + +types-Markdown +types-PyYAML 
+types-bleach +types-cachetools +types-croniter +types-paramiko +types-protobuf +types-python-dateutil +types-redis +types-requests +types-setuptools +types-six +types-tabulate +types-toml +types-tzlocal +types-ujson +types-decorator diff --git a/setup.py b/setup.py new file mode 100755 index 0000000..043308e --- /dev/null +++ b/setup.py @@ -0,0 +1,170 @@ +#!/usr/bin/env python +# Copyright The Lightning AI team. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. +"""This is the main and only one setup entry point for installing each package as stand-alone as well as joint +installation for all packages. + +There are four main scenarios considered for installing this project: + +1. Using PyPI registry when you can install `pytorch-lightning`, `lightning-app`, etc. or `lightning` for all. + +2. Installation from source code after cloning repository. + In such case we recommend to use command `pip install .` or `pip install -e .` for development version + (development ver. do not copy python files to your pip file system, just create links, so you can edit here) + In case you want to install just one package you need to export env. variable before calling `pip` + + - for `pytorch-lightning` use `export PACKAGE_NAME=pytorch ; pip install .` + - for `lightning-fabric` use `export PACKAGE_NAME=fabric ; pip install .` + - for `lightning-app` use `export PACKAGE_NAME=app ; pip install .` + +3. 
Building packages as sdist or binary wheel and installing or publishing to PyPI afterwards; use the command + `python setup.py sdist` or `python setup.py bdist_wheel` accordingly. + In case you want to build just a particular package you want to set an environment variable: + `PACKAGE_NAME=lightning|pytorch|app|fabric python setup.py sdist|bdist_wheel` + +4. Automated releasing with GitHub action is a natural extension of 3) and is composed of three consecutive steps: + a) determine which packages shall be released based on version increment in `__version__.py` and eventually + compared against PyPI registry + b) with a parameterization build desired packages into the standard `dist/` folder + c) validate packages and publish to PyPI +""" +import contextlib +import glob +import logging +import os +import tempfile +from importlib.util import module_from_spec, spec_from_file_location +from types import ModuleType +from typing import Generator, Mapping, Optional + +import setuptools +import setuptools.command.egg_info + +_PACKAGE_NAME = os.environ.get("PACKAGE_NAME") +_PACKAGE_MAPPING = { + "lightning": "lightning", + "pytorch": "pytorch_lightning", + "app": "lightning_app", + "fabric": "lightning_fabric", +} +# https://packaging.python.org/guides/single-sourcing-package-version/ +# http://blog.ionelmc.ro/2014/05/25/python-packaging/ +_PATH_ROOT = os.path.dirname(__file__) +_PATH_SRC = os.path.join(_PATH_ROOT, "src") +_PATH_REQUIRE = os.path.join(_PATH_ROOT, "requirements") +_FREEZE_REQUIREMENTS = os.environ.get("FREEZE_REQUIREMENTS", "0").lower() in ("1", "true") + + +def _load_py_module(name: str, location: str) -> ModuleType: + spec = spec_from_file_location(name, location) + assert spec, f"Failed to load module {name} from {location}" + py = module_from_spec(spec) + assert spec.loader, f"ModuleSpec.loader is None for {name} from {location}" + spec.loader.exec_module(py) + return py + + +def _named_temporary_file(directory: Optional[str] = None) -> str: + # 
`tempfile.NamedTemporaryFile` has issues in Windows + # https://github.com/deepchem/deepchem/issues/707#issuecomment-556002823 + if directory is None: + directory = tempfile.gettempdir() + return os.path.join(directory, os.urandom(24).hex()) + + +@contextlib.contextmanager +def _set_manifest_path(manifest_dir: str, aggregate: bool = False, mapping: Mapping = _PACKAGE_MAPPING) -> Generator: + if aggregate: + # aggregate all MANIFEST.in contents into a single temporary file + manifest_path = _named_temporary_file(manifest_dir) + lines = [] + # load manifest and aggregated all manifests + for pkg in mapping.values(): + pkg_manifest = os.path.join(_PATH_SRC, pkg, "MANIFEST.in") + if os.path.isfile(pkg_manifest): + with open(pkg_manifest) as fh: + lines.extend(fh.readlines()) + # convert lightning_foo to lightning/foo + for new, old in mapping.items(): + if old == "lightning": + continue # avoid `lightning` -> `lightning/lightning` + lines = [ln.replace(old, f"lightning/{new}") for ln in lines] + lines = sorted(set(filter(lambda ln: not ln.strip().startswith("#"), lines))) + logging.debug(f"aggregated manifest consists of: {lines}") + with open(manifest_path, mode="w") as fp: + fp.writelines(lines) + else: + manifest_path = os.path.join(manifest_dir, "MANIFEST.in") + assert os.path.exists(manifest_path) + # avoid error: setup script specifies an absolute path + manifest_path = os.path.relpath(manifest_path, _PATH_ROOT) + logging.info("Set manifest path to", manifest_path) + setuptools.command.egg_info.manifest_maker.template = manifest_path + yield + # cleanup + setuptools.command.egg_info.manifest_maker.template = "MANIFEST.in" + if aggregate: + os.remove(manifest_path) + + +if __name__ == "__main__": + assistant = _load_py_module(name="assistant", location=os.path.join(_PATH_ROOT, ".actions", "assistant.py")) + + if os.path.isdir(_PATH_SRC): + # copy the version information to all packages + assistant.distribute_version(_PATH_SRC) + print(f"Requested package: 
'{_PACKAGE_NAME}'") # requires `-v` to appear + + local_pkgs = [ + os.path.basename(p) + for p in glob.glob(os.path.join(_PATH_SRC, "*")) + if os.path.isdir(p) and not p.endswith(".egg-info") + ] + print(f"Local package candidates: {local_pkgs}") + is_source_install = len(local_pkgs) > 2 + print(f"Installing from source: {is_source_install}") + if is_source_install: + if _PACKAGE_NAME is not None and _PACKAGE_NAME not in _PACKAGE_MAPPING: + raise ValueError( + f"Unexpected package name: {_PACKAGE_NAME}. Possible choices are: {list(_PACKAGE_MAPPING)}" + ) + package_to_install = _PACKAGE_MAPPING.get(_PACKAGE_NAME, "lightning") + if package_to_install == "lightning": + # merge all requirements files + assistant._load_aggregate_requirements(_PATH_REQUIRE, _FREEZE_REQUIREMENTS) + else: + # replace imports and copy the code + assistant.create_mirror_package(_PATH_SRC, _PACKAGE_MAPPING) + else: + assert len(local_pkgs) > 0 + # PL as a package is distributed together with Fabric, so in such case there are more than one candidate + package_to_install = "pytorch_lightning" if "pytorch_lightning" in local_pkgs else local_pkgs[0] + print(f"Installing package: {package_to_install}") + + # going to install with `setuptools.setup` + pkg_path = os.path.join(_PATH_SRC, package_to_install) + pkg_setup = os.path.join(pkg_path, "__setup__.py") + if not os.path.exists(pkg_setup): + raise RuntimeError(f"Something's wrong, no package was installed. 
Package name: {_PACKAGE_NAME}") + setup_module = _load_py_module(name=f"{package_to_install}_setup", location=pkg_setup) + setup_args = setup_module._setup_args() + is_main_pkg = package_to_install == "lightning" + print(f"Installing as the main package: {is_main_pkg}") + if is_source_install: + # we are installing from source, set the correct manifest path + with _set_manifest_path(pkg_path, aggregate=is_main_pkg): + setuptools.setup(**setup_args) + else: + setuptools.setup(**setup_args) + print("Finished setup configuration.") diff --git a/source/_static/images/accelerator/ipus/profiler.png b/source/_static/images/accelerator/ipus/profiler.png deleted file mode 100644 index cbed276..0000000 Binary files a/source/_static/images/accelerator/ipus/profiler.png and /dev/null differ diff --git a/source/_static/images/benchmarks/figure-parity-times.png b/source/_static/images/benchmarks/figure-parity-times.png deleted file mode 100644 index 2e8c589..0000000 Binary files a/source/_static/images/benchmarks/figure-parity-times.png and /dev/null differ diff --git a/source/_static/images/course_UvA-DL/01-introduction-to-pytorch.jpg b/source/_static/images/course_UvA-DL/01-introduction-to-pytorch.jpg deleted file mode 100644 index a56ca66..0000000 Binary files a/source/_static/images/course_UvA-DL/01-introduction-to-pytorch.jpg and /dev/null differ diff --git a/source/_static/images/course_UvA-DL/02-activation-functions.jpg b/source/_static/images/course_UvA-DL/02-activation-functions.jpg deleted file mode 100644 index 1b21f50..0000000 Binary files a/source/_static/images/course_UvA-DL/02-activation-functions.jpg and /dev/null differ diff --git a/source/_static/images/course_UvA-DL/03-initialization-and-optimization.jpg b/source/_static/images/course_UvA-DL/03-initialization-and-optimization.jpg deleted file mode 100644 index e8d42d4..0000000 Binary files a/source/_static/images/course_UvA-DL/03-initialization-and-optimization.jpg and /dev/null differ diff --git 
a/source/_static/images/course_UvA-DL/04-inception-resnet-densenet.jpg b/source/_static/images/course_UvA-DL/04-inception-resnet-densenet.jpg deleted file mode 100644 index a7e0205..0000000 Binary files a/source/_static/images/course_UvA-DL/04-inception-resnet-densenet.jpg and /dev/null differ diff --git a/source/_static/images/course_UvA-DL/05-transformers-and-MH-attention.jpg b/source/_static/images/course_UvA-DL/05-transformers-and-MH-attention.jpg deleted file mode 100644 index e644f9a..0000000 Binary files a/source/_static/images/course_UvA-DL/05-transformers-and-MH-attention.jpg and /dev/null differ diff --git a/source/_static/images/course_UvA-DL/06-graph-neural-networks.jpg b/source/_static/images/course_UvA-DL/06-graph-neural-networks.jpg deleted file mode 100644 index 0cda6bd..0000000 Binary files a/source/_static/images/course_UvA-DL/06-graph-neural-networks.jpg and /dev/null differ diff --git a/source/_static/images/course_UvA-DL/07-deep-energy-based-generative-models.jpg b/source/_static/images/course_UvA-DL/07-deep-energy-based-generative-models.jpg deleted file mode 100644 index 32cd948..0000000 Binary files a/source/_static/images/course_UvA-DL/07-deep-energy-based-generative-models.jpg and /dev/null differ diff --git a/source/_static/images/course_UvA-DL/08-deep-autoencoders.jpg b/source/_static/images/course_UvA-DL/08-deep-autoencoders.jpg deleted file mode 100644 index 1b07169..0000000 Binary files a/source/_static/images/course_UvA-DL/08-deep-autoencoders.jpg and /dev/null differ diff --git a/source/_static/images/course_UvA-DL/09-normalizing-flows.jpg b/source/_static/images/course_UvA-DL/09-normalizing-flows.jpg deleted file mode 100644 index 9654f8a..0000000 Binary files a/source/_static/images/course_UvA-DL/09-normalizing-flows.jpg and /dev/null differ diff --git a/source/_static/images/course_UvA-DL/10-autoregressive-image-modeling.jpg b/source/_static/images/course_UvA-DL/10-autoregressive-image-modeling.jpg deleted file mode 100644 index 
1ad5d61..0000000 Binary files a/source/_static/images/course_UvA-DL/10-autoregressive-image-modeling.jpg and /dev/null differ diff --git a/source/_static/images/course_UvA-DL/11-vision-transformer.jpg b/source/_static/images/course_UvA-DL/11-vision-transformer.jpg deleted file mode 100644 index c129c4b..0000000 Binary files a/source/_static/images/course_UvA-DL/11-vision-transformer.jpg and /dev/null differ diff --git a/source/_static/images/course_UvA-DL/12-meta-learning.jpg b/source/_static/images/course_UvA-DL/12-meta-learning.jpg deleted file mode 100644 index 4f8f6d9..0000000 Binary files a/source/_static/images/course_UvA-DL/12-meta-learning.jpg and /dev/null differ diff --git a/source/_static/images/course_UvA-DL/13-contrastive-learning.jpg b/source/_static/images/course_UvA-DL/13-contrastive-learning.jpg deleted file mode 100644 index 6e05cce..0000000 Binary files a/source/_static/images/course_UvA-DL/13-contrastive-learning.jpg and /dev/null differ diff --git a/source/_static/images/general/PTL101_youtube_thumbnail.jpg b/source/_static/images/general/PTL101_youtube_thumbnail.jpg deleted file mode 100644 index a09dc43..0000000 Binary files a/source/_static/images/general/PTL101_youtube_thumbnail.jpg and /dev/null differ diff --git a/source/_static/images/general/fast_2.gif b/source/_static/images/general/fast_2.gif deleted file mode 100644 index 77c6f85..0000000 Binary files a/source/_static/images/general/fast_2.gif and /dev/null differ diff --git a/source/_static/images/general/pl_overview.gif b/source/_static/images/general/pl_overview.gif deleted file mode 100644 index 1aa6419..0000000 Binary files a/source/_static/images/general/pl_overview.gif and /dev/null differ diff --git a/source/_static/images/general/pl_overview_flat.jpg b/source/_static/images/general/pl_overview_flat.jpg deleted file mode 100644 index c7c6480..0000000 Binary files a/source/_static/images/general/pl_overview_flat.jpg and /dev/null differ diff --git 
a/source/_static/images/general/pl_quick_start_full_compressed.gif b/source/_static/images/general/pl_quick_start_full_compressed.gif deleted file mode 100644 index f7136d0..0000000 Binary files a/source/_static/images/general/pl_quick_start_full_compressed.gif and /dev/null differ diff --git a/source/_static/images/general/tf_loss.jpg b/source/_static/images/general/tf_loss.jpg deleted file mode 100644 index 869947f..0000000 Binary files a/source/_static/images/general/tf_loss.jpg and /dev/null differ diff --git a/source/_static/images/general/tf_tags.jpg b/source/_static/images/general/tf_tags.jpg deleted file mode 100644 index 40918ec..0000000 Binary files a/source/_static/images/general/tf_tags.jpg and /dev/null differ diff --git a/source/_static/images/general/tutorial_cover.jpg b/source/_static/images/general/tutorial_cover.jpg deleted file mode 100644 index 1c0e7f3..0000000 Binary files a/source/_static/images/general/tutorial_cover.jpg and /dev/null differ diff --git a/source/_static/images/icon.svg b/source/_static/images/icon.svg deleted file mode 100644 index 481762a..0000000 --- a/source/_static/images/icon.svg +++ /dev/null @@ -1,3 +0,0 @@ - - - diff --git a/source/_static/images/lightning_examples/augmentation_kornia.svg b/source/_static/images/lightning_examples/augmentation_kornia.svg deleted file mode 100644 index 481762a..0000000 --- a/source/_static/images/lightning_examples/augmentation_kornia.svg +++ /dev/null @@ -1,3 +0,0 @@ - - - diff --git a/source/_static/images/lightning_lite/lite.gif b/source/_static/images/lightning_lite/lite.gif deleted file mode 100644 index 8413b2d..0000000 Binary files a/source/_static/images/lightning_lite/lite.gif and /dev/null differ diff --git a/source/_static/images/lightning_module/pt_to_pl.png b/source/_static/images/lightning_module/pt_to_pl.png deleted file mode 100644 index 5135ec2..0000000 Binary files a/source/_static/images/lightning_module/pt_to_pl.png and /dev/null differ diff --git 
a/source/_static/images/lightning_module/pt_trainer.png b/source/_static/images/lightning_module/pt_trainer.png deleted file mode 100644 index f465d43..0000000 Binary files a/source/_static/images/lightning_module/pt_trainer.png and /dev/null differ diff --git a/source/_static/images/logo.png b/source/_static/images/logo.png deleted file mode 100644 index 331f201..0000000 Binary files a/source/_static/images/logo.png and /dev/null differ diff --git a/source/_static/images/logo.svg b/source/_static/images/logo.svg deleted file mode 100644 index dca54b3..0000000 --- a/source/_static/images/logo.svg +++ /dev/null @@ -1,70 +0,0 @@ - - - - - - - - image/svg+xml - - - - - - - - - - - - diff --git a/source/_static/images/logo_light.svg b/source/_static/images/logo_light.svg deleted file mode 100644 index 4695557..0000000 --- a/source/_static/images/logo_light.svg +++ /dev/null @@ -1,70 +0,0 @@ - - - - - - - - image/svg+xml - - - - - - - - - - - - diff --git a/source/_static/images/mnist_imgs/mnist_cpu_bar.png b/source/_static/images/mnist_imgs/mnist_cpu_bar.png deleted file mode 100644 index fa896ea..0000000 Binary files a/source/_static/images/mnist_imgs/mnist_cpu_bar.png and /dev/null differ diff --git a/source/_static/images/mnist_imgs/mnist_gpu.png b/source/_static/images/mnist_imgs/mnist_gpu.png deleted file mode 100644 index 75021ce..0000000 Binary files a/source/_static/images/mnist_imgs/mnist_gpu.png and /dev/null differ diff --git a/source/_static/images/mnist_imgs/mnist_tb.png b/source/_static/images/mnist_imgs/mnist_tb.png deleted file mode 100644 index a8cf719..0000000 Binary files a/source/_static/images/mnist_imgs/mnist_tb.png and /dev/null differ diff --git a/source/_static/images/mnist_imgs/pt_to_pl.jpg b/source/_static/images/mnist_imgs/pt_to_pl.jpg deleted file mode 100644 index 4bad788..0000000 Binary files a/source/_static/images/mnist_imgs/pt_to_pl.jpg and /dev/null differ diff --git a/source/_static/images/mnist_imgs/restart_runtime.png 
b/source/_static/images/mnist_imgs/restart_runtime.png deleted file mode 100644 index 84ccae4..0000000 Binary files a/source/_static/images/mnist_imgs/restart_runtime.png and /dev/null differ diff --git a/source/_static/images/mnist_imgs/runtime_tpu.png b/source/_static/images/mnist_imgs/runtime_tpu.png deleted file mode 100644 index 9dc069a..0000000 Binary files a/source/_static/images/mnist_imgs/runtime_tpu.png and /dev/null differ diff --git a/source/_static/images/mnist_imgs/tpu_fast.png b/source/_static/images/mnist_imgs/tpu_fast.png deleted file mode 100644 index 08d9f9a..0000000 Binary files a/source/_static/images/mnist_imgs/tpu_fast.png and /dev/null differ diff --git a/source/_static/images/mnist_imgs/tpu_start.png b/source/_static/images/mnist_imgs/tpu_start.png deleted file mode 100644 index 3474f68..0000000 Binary files a/source/_static/images/mnist_imgs/tpu_start.png and /dev/null differ diff --git a/source/_static/images/trainer/lr_finder.png b/source/_static/images/trainer/lr_finder.png deleted file mode 100644 index bd1667b..0000000 Binary files a/source/_static/images/trainer/lr_finder.png and /dev/null differ diff --git a/source/_templates/classtemplate.rst b/source/_templates/classtemplate.rst deleted file mode 100644 index 398a0ec..0000000 --- a/source/_templates/classtemplate.rst +++ /dev/null @@ -1,14 +0,0 @@ -.. role:: hidden - :class: hidden-section -.. currentmodule:: {{ module }} - - -{{ name | underline }} - -.. autoclass:: {{ name }} - :members: - - -.. 
- autogenerated from source/_templates/classtemplate.rst - note it does not have :inherited-members: diff --git a/source/_templates/theme_variables.jinja b/source/_templates/theme_variables.jinja deleted file mode 100644 index 5073b7a..0000000 --- a/source/_templates/theme_variables.jinja +++ /dev/null @@ -1,20 +0,0 @@ -{%- set external_urls = { - 'github': 'https://github.com/PyTorchLightning/pytorch-lightning', - 'github_issues': 'https://github.com/PyTorchLightning/pytorch-lightning/issues', - 'contributing': 'https://github.com/PyTorchLightning/pytorch-lightning/blob/master/CONTRIBUTING.md', - 'governance': 'https://pytorch-lightning.readthedocs.io/en/latest/governance.html', - 'docs': 'https://pytorch-lightning.rtfd.io/en/latest', - 'twitter': 'https://twitter.com/PyTorchLightnin', - 'discuss': 'https://www.pytorchlightning.ai/community', - 'tutorials': 'https://pytorch-lightning.readthedocs.io/en/latest/#tutorials', - 'previous_pytorch_versions': 'https://pytorch-lightning.rtfd.io/en/latest/', - 'home': 'https://pytorch-lightning.rtfd.io/en/latest/', - 'get_started': 'https://pytorch-lightning.readthedocs.io/en/latest/starter/introduction.html', - 'features': 'https://pytorch-lightning.rtfd.io/en/latest/', - 'blog': 'https://www.pytorchlightning.ai/blog', - 'resources': 'https://pytorch-lightning.readthedocs.io/en/latest/#community-examples', - 'support': 'https://pytorch-lightning.rtfd.io/en/latest/', - 'community': 'https://www.pytorchlightning.ai/community', - 'forums': 'https://github.com/PyTorchLightning/pytorch-lightning/discussions', -} --%} diff --git a/source/accelerators/gpu_advanced.rst b/source/accelerators/gpu_advanced.rst deleted file mode 100644 index eadeb03..0000000 --- a/source/accelerators/gpu_advanced.rst +++ /dev/null @@ -1,16 +0,0 @@ -:orphan: - -.. _gpu_advanced: - -GPU training (Advanced) -======================= -**Audience:** Users looking to scale massive models (ie: 1 Trillion parameters). 
- ----- - -For experts pushing the state-of-the-art in model development, Lightning offers various techniques to enable Trillion+ parameter-scale models. - ----- - -.. - .. include:: ../advanced/model_parallel.rst diff --git a/source/accelerators/gpu_basic.rst b/source/accelerators/gpu_basic.rst deleted file mode 100644 index 43be718..0000000 --- a/source/accelerators/gpu_basic.rst +++ /dev/null @@ -1,97 +0,0 @@ -:orphan: - -.. _gpu_basic: - -GPU training (Basic) -==================== -**Audience:** Users looking to save money and run large models faster using single or multiple - ----- - -What is a GPU? --------------- -A Graphics Processing Unit (GPU), is a specialized hardware accelerator designed to speed up mathematical computations used in gaming and deep learning. - ----- - -Train on 1 GPU --------------- - -Make sure you're running on a machine with at least one GPU. There's no need to specify any NVIDIA flags -as Lightning will do it for you. - -.. testcode:: - :skipif: torch.cuda.device_count() < 1 - - trainer = Trainer(accelerator="gpu", devices=1) - ----------------- - - -.. _multi_gpu: - -Train on multiple GPUs ----------------------- - -To use multiple GPUs, set the number of devices in the Trainer or the index of the GPUs. - -.. code:: - - trainer = Trainer(accelerator="gpu", devices=4) - -Choosing GPU devices -^^^^^^^^^^^^^^^^^^^^ - -You can select the GPU devices using ranges, a list of indices or a string containing -a comma separated list of GPU ids: - -.. testsetup:: - - k = 1 - -.. 
testcode:: - :skipif: torch.cuda.device_count() < 2 - - # DEFAULT (int) specifies how many GPUs to use per node - Trainer(accelerator="gpu", devices=k) - - # Above is equivalent to - Trainer(accelerator="gpu", devices=list(range(k))) - - # Specify which GPUs to use (don't use when running on cluster) - Trainer(accelerator="gpu", devices=[0, 1]) - - # Equivalent using a string - Trainer(accelerator="gpu", devices="0, 1") - - # To use all available GPUs put -1 or '-1' - # equivalent to list(range(torch.cuda.device_count())) - Trainer(accelerator="gpu", devices=-1) - -The table below lists examples of possible input formats and how they are interpreted by Lightning. - -+------------------+-----------+---------------------+---------------------------------+ -| `devices` | Type | Parsed | Meaning | -+==================+===========+=====================+=================================+ -| 3 | int | [0, 1, 2] | first 3 GPUs | -+------------------+-----------+---------------------+---------------------------------+ -| -1 | int | [0, 1, 2, ...] | all available GPUs | -+------------------+-----------+---------------------+---------------------------------+ -| [0] | list | [0] | GPU 0 | -+------------------+-----------+---------------------+---------------------------------+ -| [1, 3] | list | [1, 3] | GPUs 1 and 3 | -+------------------+-----------+---------------------+---------------------------------+ -| "3" | str | [0, 1, 2] | first 3 GPUs | -+------------------+-----------+---------------------+---------------------------------+ -| "1, 3" | str | [1, 3] | GPUs 1 and 3 | -+------------------+-----------+---------------------+---------------------------------+ -| "-1" | str | [0, 1, 2, ...] | all available GPUs | -+------------------+-----------+---------------------+---------------------------------+ - -.. 
note:: - - When specifying number of ``devices`` as an integer ``devices=k``, setting the trainer flag - ``auto_select_gpus=True`` will automatically help you find ``k`` GPUs that are not - occupied by other processes. This is especially useful when GPUs are configured - to be in "exclusive mode", such that only one process at a time can access them. - For more details see the :doc:`trainer guide <../common/trainer>`. diff --git a/source/accelerators/gpu_faq.rst b/source/accelerators/gpu_faq.rst deleted file mode 100644 index c697b2c..0000000 --- a/source/accelerators/gpu_faq.rst +++ /dev/null @@ -1,97 +0,0 @@ -:orphan: - -.. _gpu_faq: - -GPU training (FAQ) -================== - -****************************************************************** -How should I adjust the learning rate when using multiple devices? -****************************************************************** - -When using distributed training make sure to modify your learning rate according to your effective -batch size. - -Let's say you have a batch size of 7 in your dataloader. - -.. testcode:: - - class LitModel(LightningModule): - def train_dataloader(self): - return Dataset(..., batch_size=7) - -In DDP, DDP_SPAWN, Deepspeed, DDP_SHARDED, or Horovod your effective batch size will be 7 * devices * num_nodes. - -.. 
code-block:: python - - # effective batch size = 7 * 8 - Trainer(accelerator="gpu", devices=8, strategy="ddp") - Trainer(accelerator="gpu", devices=8, strategy="ddp_spawn") - Trainer(accelerator="gpu", devices=8, strategy="ddp_sharded") - Trainer(accelerator="gpu", devices=8, strategy="horovod") - - # effective batch size = 7 * 8 * 10 - Trainer(accelerator="gpu", devices=8, num_nodes=10, strategy="ddp") - Trainer(accelerator="gpu", devices=8, num_nodes=10, strategy="ddp_spawn") - Trainer(accelerator="gpu", devices=8, num_nodes=10, strategy="ddp_sharded") - Trainer(accelerator="gpu", devices=8, num_nodes=10, strategy="horovod") - -In DDP2 or DP, your effective batch size will be 7 * num_nodes. -The reason is that the full batch is visible to all GPUs on the node when using DDP2. - -.. code-block:: python - - # effective batch size = 7 - Trainer(accelerator="gpu", devices=8, strategy="ddp2") - Trainer(accelerator="gpu", devices=8, strategy="dp") - - # effective batch size = 7 * 10 - Trainer(accelerator="gpu", devices=8, num_nodes=10, strategy="ddp2") - Trainer(accelerator="gpu", devices=8, strategy="dp") - - -.. note:: Huge batch sizes are actually really bad for convergence. Check out: - `Accurate, Large Minibatch SGD: Training ImageNet in 1 Hour `_ - ----- - -********************************************************* -How do I use multiple GPUs on Jupyter or Colab notebooks? -********************************************************* - -To use multiple GPUs on notebooks, use the *DP* mode. - -.. code-block:: python - - Trainer(accelerator="gpu", devices=4, strategy="dp") - -If you want to use other models, please launch your training via the command-shell. - -.. note:: Learn how to :ref:`access a cloud machine with multiple GPUs ` in this guide. - ----- - -***************************************************** -I'm getting errors related to Pickling. What do I do? 
-***************************************************** - -Pickle is Python's mechanism for serializing and unserializing data. A majority of distributed modes require that your code is fully pickle compliant. If you run into an issue with pickling try the following to figure out the issue - -.. code-block:: python - - import pickle - - model = YourModel() - pickle.dumps(model) - -If you `ddp` your code doesn't need to be pickled. - -.. code-block:: python - - Trainer(accelerator="gpu", devices=4, strategy="ddp") - -If you use `ddp_spawn` the pickling requirement remains. This is a limitation of Python. - -.. code-block:: python - - Trainer(accelerator="gpu", devices=4, strategy="ddp_spawn") diff --git a/source/accelerators/gpu_intermediate.rst b/source/accelerators/gpu_intermediate.rst deleted file mode 100644 index c4d9ad8..0000000 --- a/source/accelerators/gpu_intermediate.rst +++ /dev/null @@ -1,533 +0,0 @@ -:orphan: - -.. _gpu_intermediate: - -GPU training (Intermediate) -=========================== -**Audience:** Users looking to train across machines or experiment with different scaling techniques. - ----- - -Distributed Training strategies -------------------------------- -Lightning supports multiple ways of doing distributed training. - -.. raw:: html - - - -| - -- Data Parallel (``strategy='dp'``) (multiple-gpus, 1 machine) -- DistributedDataParallel (``strategy='ddp'``) (multiple-gpus across many machines (python script based)). -- DistributedDataParallel (``strategy='ddp_spawn'``) (multiple-gpus across many machines (spawn based)). -- DistributedDataParallel 2 (``strategy='ddp2'``) (DP in a machine, DDP across machines). -- Horovod (``strategy='horovod'``) (multi-machine, multi-gpu, configured at runtime) -- Bagua (``strategy='bagua'``) (multiple-gpus across many machines with advanced training algorithms) - -.. note:: - If you request multiple GPUs or nodes without setting a mode, DDP Spawn will be automatically used. 
- -For a deeper understanding of what Lightning is doing, feel free to read this -`guide `_. - - -Data Parallel -^^^^^^^^^^^^^ -:class:`~torch.nn.DataParallel` (DP) splits a batch across k GPUs. -That is, if you have a batch of 32 and use DP with 2 GPUs, each GPU will process 16 samples, -after which the root node will aggregate the results. - -.. warning:: DP use is discouraged by PyTorch and Lightning. State is not maintained on the replicas created by the - :class:`~torch.nn.DataParallel` wrapper and you may see errors or misbehavior if you assign state to the module - in the ``forward()`` or ``*_step()`` methods. For the same reason we cannot fully support - :doc:`Manual Optimization <../model/manual_optimization>` with DP. Use DDP which is more stable and at least 3x faster. - -.. warning:: DP only supports scattering and gathering primitive collections of tensors like lists, dicts, etc. - Therefore the :meth:`~pytorch_lightning.core.hooks.ModelHooks.transfer_batch_to_device` hook does not apply in - this mode and if you have overridden it, it will not be called. - -.. testcode:: - :skipif: torch.cuda.device_count() < 2 - - # train on 2 GPUs (using DP mode) - trainer = Trainer(accelerator="gpu", devices=2, strategy="dp") - -Distributed Data Parallel -^^^^^^^^^^^^^^^^^^^^^^^^^ -:class:`~torch.nn.parallel.DistributedDataParallel` (DDP) works as follows: - -1. Each GPU across each node gets its own process. - -2. Each GPU gets visibility into a subset of the overall dataset. It will only ever see that subset. - -3. Each process inits the model. - -4. Each process performs a full forward and backward pass in parallel. - -5. The gradients are synced and averaged across all processes. - -6. Each process updates its optimizer. - -.. 
code-block:: python - - # train on 8 GPUs (same machine (ie: node)) - trainer = Trainer(accelerator="gpu", devices=8, strategy="ddp") - - # train on 32 GPUs (4 nodes) - trainer = Trainer(accelerator="gpu", devices=8, strategy="ddp", num_nodes=4) - -This Lightning implementation of DDP calls your script under the hood multiple times with the correct environment -variables: - -.. code-block:: bash - - # example for 3 GPUs DDP - MASTER_ADDR=localhost MASTER_PORT=random() WORLD_SIZE=3 NODE_RANK=0 LOCAL_RANK=0 python my_file.py --accelerator 'gpu' --devices 3 --etc - MASTER_ADDR=localhost MASTER_PORT=random() WORLD_SIZE=3 NODE_RANK=1 LOCAL_RANK=0 python my_file.py --accelerator 'gpu' --devices 3 --etc - MASTER_ADDR=localhost MASTER_PORT=random() WORLD_SIZE=3 NODE_RANK=2 LOCAL_RANK=0 python my_file.py --accelerator 'gpu' --devices 3 --etc - -We use DDP this way because `ddp_spawn` has a few limitations (due to Python and PyTorch): - -1. Since `.spawn()` trains the model in subprocesses, the model on the main process does not get updated. -2. Dataloader(num_workers=N), where N is large, bottlenecks training with DDP... ie: it will be VERY slow or won't work at all. This is a PyTorch limitation. -3. Forces everything to be picklable. - -There are cases in which it is NOT possible to use DDP. Examples are: - -- Jupyter Notebook, Google COLAB, Kaggle, etc. -- You have a nested script without a root package - -In these situations you should use `dp` or `ddp_spawn` instead. - -Distributed Data Parallel 2 -^^^^^^^^^^^^^^^^^^^^^^^^^^^ -In certain cases, it's advantageous to use all batches on the same machine instead of a subset. -For instance, you might want to compute a NCE loss where it pays to have more negative samples. - -In this case, we can use DDP2 which behaves like DP in a machine and DDP across nodes. DDP2 does the following: - -1. Copies a subset of the data to each node. - -2. Inits a model on each node. - -3. Runs a forward and backward pass using DP. - -4. 
Syncs gradients across nodes. - -5. Applies the optimizer updates. - -.. code-block:: python - - # train on 32 GPUs (4 nodes) - trainer = Trainer(accelerator="gpu", devices=8, strategy="ddp2", num_nodes=4) - -Distributed Data Parallel Spawn -^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ -`ddp_spawn` is exactly like `ddp` except that it uses .spawn to start the training processes. - -.. warning:: It is STRONGLY recommended to use `DDP` for speed and performance. - -.. code-block:: python - - mp.spawn(self.ddp_train, nprocs=self.num_processes, args=(model,)) - -If your script does not support being called from the command line (ie: it is nested without a root -project module) you can use the following method: - -.. code-block:: python - - # train on 8 GPUs (same machine (ie: node)) - trainer = Trainer(accelerator="gpu", devices=8, strategy="ddp_spawn") - -We STRONGLY discourage this use because it has limitations (due to Python and PyTorch): - -1. The model you pass in will not update. Please save a checkpoint and restore from there. -2. Set Dataloader(num_workers=0) or it will bottleneck training. - -`ddp` is MUCH faster than `ddp_spawn`. We recommend you - -1. Install a top-level module for your project using setup.py - -.. code-block:: python - - # setup.py - #!/usr/bin/env python - - from setuptools import setup, find_packages - - setup( - name="src", - version="0.0.1", - description="Describe Your Cool Project", - author="", - author_email="", - url="https://github.com/YourSeed", # REPLACE WITH YOUR OWN GITHUB PROJECT LINK - install_requires=["pytorch-lightning"], - packages=find_packages(), - ) - -2. Setup your project like so: - -.. code-block:: bash - - /project - /src - some_file.py - /or_a_folder - setup.py - -3. Install as a root-level package - -.. code-block:: bash - - cd /project - pip install -e . - -You can then call your scripts anywhere - -.. 
code-block:: bash - - cd /project/src - python some_file.py --accelerator 'gpu' --devices 8 --strategy 'ddp' - - -Horovod -^^^^^^^ -`Horovod `_ allows the same training script to be used for single-GPU, -multi-GPU, and multi-node training. - -Like Distributed Data Parallel, every process in Horovod operates on a single GPU with a fixed -subset of the data. Gradients are averaged across all GPUs in parallel during the backward pass, -then synchronously applied before beginning the next step. - -The number of worker processes is configured by a driver application (`horovodrun` or `mpirun`). In -the training script, Horovod will detect the number of workers from the environment, and automatically -scale the learning rate to compensate for the increased total batch size. - -Horovod can be configured in the training script to run with any number of GPUs / processes as follows: - -.. code-block:: python - - # train Horovod on GPU (number of GPUs / machines provided on command-line) - trainer = Trainer(strategy="horovod", accelerator="gpu", devices=1) - - # train Horovod on CPU (number of processes / machines provided on command-line) - trainer = Trainer(strategy="horovod") - -When starting the training job, the driver application will then be used to specify the total -number of worker processes: - -.. code-block:: bash - - # run training with 4 GPUs on a single machine - horovodrun -np 4 python train.py - - # run training with 8 GPUs on two machines (4 GPUs each) - horovodrun -np 8 -H hostname1:4,hostname2:4 python train.py - -See the official `Horovod documentation `_ for details -on installation and performance tuning. - - -Bagua -^^^^^ -`Bagua `_ is a deep learning training acceleration framework which supports -multiple advanced distributed training algorithms including: - -- `Gradient AllReduce `_ for centralized synchronous communication, where gradients are averaged among all workers. 
-- `Decentralized SGD `_ for decentralized synchronous communication, where each worker exchanges data with one or a few specific workers. -- `ByteGrad `_ and `QAdam `_ for low precision communication, where data is compressed into low precision before communication. -- `Asynchronous Model Average `_ for asynchronous communication, where workers are not required to be synchronized in the same iteration in a lock-step style. - -By default, Bagua uses *Gradient AllReduce* algorithm, which is also the algorithm implemented in Distributed Data Parallel and Horovod, -but Bagua can usually produce a higher training throughput due to its backend written in Rust. - -.. code-block:: python - - # train on 4 GPUs (using Bagua mode) - trainer = Trainer(strategy="bagua", accelerator="gpu", devices=4) - - -By specifying the ``algorithm`` in the ``BaguaStrategy``, you can select more advanced training algorithms featured by Bagua: - - -.. code-block:: python - - # train on 4 GPUs, using Bagua Gradient AllReduce algorithm - trainer = Trainer( - strategy=BaguaStrategy(algorithm="gradient_allreduce"), - accelerator="gpu", - devices=4, - ) - - # train on 4 GPUs, using Bagua ByteGrad algorithm - trainer = Trainer( - strategy=BaguaStrategy(algorithm="bytegrad"), - accelerator="gpu", - devices=4, - ) - - # train on 4 GPUs, using Bagua Decentralized SGD - trainer = Trainer( - strategy=BaguaStrategy(algorithm="decentralized"), - accelerator="gpu", - devices=4, - ) - - # train on 4 GPUs, using Bagua Low Precision Decentralized SGD - trainer = Trainer( - strategy=BaguaStrategy(algorithm="low_precision_decentralized"), - accelerator="gpu", - devices=4, - ) - - # train on 4 GPUs, using Asynchronous Model Average algorithm, with a synchronization interval of 100ms - trainer = Trainer( - strategy=BaguaStrategy(algorithm="async", sync_interval_ms=100), - accelerator="gpu", - devices=4, - ) - -To use *QAdam*, we need to initialize -`QAdamOptimizer `_ first: - -.. 
code-block:: python - - from pytorch_lightning.strategies import BaguaStrategy - from bagua.torch_api.algorithms.q_adam import QAdamOptimizer - - - class MyModel(pl.LightningModule): - ... - - def configure_optimizers(self): - # initialize QAdam Optimizer - return QAdamOptimizer(self.parameters(), lr=0.05, warmup_steps=100) - - - model = MyModel() - trainer = Trainer( - accelerator="gpu", - devices=4, - strategy=BaguaStrategy(algorithm="qadam"), - ) - trainer.fit(model) - -Bagua relies on its own `launcher `_ to schedule jobs. -Below, find examples using ``bagua.distributed.launch`` which follows ``torch.distributed.launch`` API: - -.. code-block:: bash - - # start training with 8 GPUs on a single node - python -m bagua.distributed.launch --nproc_per_node=8 train.py - -If the ssh service is available with passwordless login on each node, you can launch the distributed job on a -single node with ``baguarun`` which has a similar syntax as ``mpirun``. When starting the job, ``baguarun`` will -automatically spawn new processes on each of your training nodes provided by the ``--host_list`` option, and each node in it -is described as an IP address followed by an SSH port. - -.. code-block:: bash - - # Run on node1 (or node2) to start training on two nodes (node1 and node2), 8 GPUs per node - baguarun --host_list hostname1:ssh_port1,hostname2:ssh_port2 --nproc_per_node=8 --master_port=port1 train.py - - -.. note:: You can also start training in the same way as Distributed Data Parallel. However, system optimizations like - `Bagua-Net `_ and - `Performance autotuning `_ can only be enabled through bagua - launcher. It is worth noting that with ``Bagua-Net``, Distributed Data Parallel can also achieve - better performance without modifying the training script. - - -See `Bagua Tutorials `_ for more details on installation and advanced features. - - -DP/DDP2 caveats -^^^^^^^^^^^^^^^ -In DP and DDP2 each GPU within a machine sees a portion of a batch. 
-DP and ddp2 roughly do the following: - -.. testcode:: - - def distributed_forward(batch, model): - batch = torch.Tensor(32, 8) - gpu_0_batch = batch[:8] - gpu_1_batch = batch[8:16] - gpu_2_batch = batch[16:24] - gpu_3_batch = batch[24:] - - y_0 = model_copy_gpu_0(gpu_0_batch) - y_1 = model_copy_gpu_1(gpu_1_batch) - y_2 = model_copy_gpu_2(gpu_2_batch) - y_3 = model_copy_gpu_3(gpu_3_batch) - - return [y_0, y_1, y_2, y_3] - -So, when Lightning calls any of the `training_step`, `validation_step`, `test_step` -you will only be operating on one of those pieces. - -.. testcode:: - - # the batch here is a portion of the FULL batch - def training_step(self, batch, batch_idx): - y_0 = batch - -For most metrics, this doesn't really matter. However, if you want -to add something to your computational graph (like softmax) -using all batch parts you can use the `training_step_end` step. - -.. testcode:: - - def training_step_end(self, outputs): - # only use when on dp - outputs = torch.cat(outputs, dim=1) - softmax = softmax(outputs, dim=1) - out = softmax.mean() - return out - -In pseudocode, the full sequence is: - -.. code-block:: python - - # get data - batch = next(dataloader) - - # copy model and data to each gpu - batch_splits = split_batch(batch, num_gpus) - models = copy_model_to_gpus(model) - - # in parallel, operate on each batch chunk - all_results = [] - for gpu_num in gpus: - batch_split = batch_splits[gpu_num] - gpu_model = models[gpu_num] - out = gpu_model(batch_split) - all_results.append(out) - - # use the full batch for something like softmax - full_out = model.training_step_end(all_results) - -To illustrate why this is needed, let's look at DataParallel - -.. 
testcode:: - - def training_step(self, batch, batch_idx): - x, y = batch - y_hat = self(batch) - - # on dp or ddp2 if we did softmax now it would be wrong - # because batch is actually a piece of the full batch - return y_hat - - - def training_step_end(self, step_output): - # step_output has outputs of each part of the batch - - # do softmax here - outputs = torch.cat(outputs, dim=1) - softmax = softmax(outputs, dim=1) - out = softmax.mean() - - return out - -If `training_step_end` is defined it will be called regardless of TPU, DP, DDP, etc... which means -it will behave the same regardless of the backend. - -Validation and test step have the same option when using DP. - -.. testcode:: - - def validation_step_end(self, step_output): - ... - - - def test_step_end(self, step_output): - ... - - -Distributed and 16-bit precision -^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ - -Due to an issue with Apex and DataParallel (PyTorch and NVIDIA issue), Lightning does -not allow 16-bit and DP training. We tried to get this to work, but it's an issue on their end. - -Below are the possible configurations we support. 
- -+-------+---------+-----+-----+--------+-----------------------------------------------------------------------+ -| 1 GPU | 1+ GPUs | DP | DDP | 16-bit | command | -+=======+=========+=====+=====+========+=======================================================================+ -| Y | | | | | `Trainer(accelerator="gpu", devices=1)` | -+-------+---------+-----+-----+--------+-----------------------------------------------------------------------+ -| Y | | | | Y | `Trainer(accelerator="gpu", devices=1, precision=16)` | -+-------+---------+-----+-----+--------+-----------------------------------------------------------------------+ -| | Y | Y | | | `Trainer(accelerator="gpu", devices=k, strategy='dp')` | -+-------+---------+-----+-----+--------+-----------------------------------------------------------------------+ -| | Y | | Y | | `Trainer(accelerator="gpu", devices=k, strategy='ddp')` | -+-------+---------+-----+-----+--------+-----------------------------------------------------------------------+ -| | Y | | Y | Y | `Trainer(accelerator="gpu", devices=k, strategy='ddp', precision=16)` | -+-------+---------+-----+-----+--------+-----------------------------------------------------------------------+ - - -Implement Your Own Distributed (DDP) training -^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ -If you need your own way to init PyTorch DDP you can override :meth:`pytorch_lightning.strategies.ddp.DDPStrategy.init_dist_connection`. - -If you also need to use your own DDP implementation, override :meth:`pytorch_lightning.strategies.ddp.DDPStrategy.configure_ddp`. - ----------- - -Torch Distributed Elastic -------------------------- -Lightning supports the use of Torch Distributed Elastic to enable fault-tolerant and elastic distributed job scheduling. To use it, specify the 'ddp' or 'ddp2' backend and the number of GPUs you want to use in the trainer. - -.. 
code-block:: python - - Trainer(accelerator="gpu", devices=8, strategy="ddp") - -To launch a fault-tolerant job, run the following on all nodes. - -.. code-block:: bash - - python -m torch.distributed.run - --nnodes=NUM_NODES - --nproc_per_node=TRAINERS_PER_NODE - --rdzv_id=JOB_ID - --rdzv_backend=c10d - --rdzv_endpoint=HOST_NODE_ADDR - YOUR_LIGHTNING_TRAINING_SCRIPT.py (--arg1 ... train script args...) - -To launch an elastic job, run the following on at least ``MIN_SIZE`` nodes and at most ``MAX_SIZE`` nodes. - -.. code-block:: bash - - python -m torch.distributed.run - --nnodes=MIN_SIZE:MAX_SIZE - --nproc_per_node=TRAINERS_PER_NODE - --rdzv_id=JOB_ID - --rdzv_backend=c10d - --rdzv_endpoint=HOST_NODE_ADDR - YOUR_LIGHTNING_TRAINING_SCRIPT.py (--arg1 ... train script args...) - -See the official `Torch Distributed Elastic documentation `_ for details -on installation and more use cases. - -Optimize multi-machine communication ------------------------------------- - -By default, Lightning will select the ``nccl`` backend over ``gloo`` when running on GPUs. -Find more information about PyTorch's supported backends `here `__. - -Lightning allows explicitly specifying the backend via the `process_group_backend` constructor argument on the relevant Strategy classes. By default, Lightning will select the appropriate process group backend based on the hardware used. - -.. code-block:: python - - from pytorch_lightning.strategies import DDPStrategy - - # Explicitly specify the process group backend if you choose to - ddp = DDPStrategy(process_group_backend="nccl") - - # Configure the strategy on the Trainer - trainer = Trainer(strategy=ddp, accelerator="gpu", devices=8) diff --git a/source/accelerators/hpu.rst b/source/accelerators/hpu.rst deleted file mode 100644 index 13eeab8..0000000 --- a/source/accelerators/hpu.rst +++ /dev/null @@ -1,40 +0,0 @@ -.. _hpu: - -Accelerator: HPU training -========================= - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Prepare your code (Optional) - :description: Prepare your code to run on any hardware - :col_css: col-md-4 - :button_link: accelerator_prepare.html - :height: 150 - :tag: basic - -.. displayitem:: - :header: Basic - :description: Learn the basics of single and multi-HPU core training. - :col_css: col-md-4 - :button_link: hpu_basic.html - :height: 150 - :tag: basic - -.. displayitem:: - :header: Intermediate - :description: Enable state-of-the-art scaling with advanced mix-precision settings. - :col_css: col-md-4 - :button_link: hpu_intermediate.html - :height: 150 - :tag: intermediate - -.. raw:: html - -
-
diff --git a/source/accelerators/hpu_basic.rst b/source/accelerators/hpu_basic.rst deleted file mode 100644 index e07e153..0000000 --- a/source/accelerators/hpu_basic.rst +++ /dev/null @@ -1,83 +0,0 @@ -:orphan: - -.. _hpu_basics: - -Accelerator: HPU training -========================= -**Audience:** Users looking to save money and run large models faster using single or multiple Gaudi devices. - ----- - -What is an HPU? ---------------- - -`Habana® Gaudi® AI Processor (HPU) `__ training processors are built on a heterogeneous architecture with a cluster of fully programmable Tensor Processing Cores (TPC) along with its associated development tools and libraries, and a configurable Matrix Math engine. - -The TPC core is a VLIW SIMD processor with an instruction set and hardware tailored to serve training workloads efficiently. -The Gaudi memory architecture includes on-die SRAM and local memories in each TPC and, -Gaudi is the first DL training processor that has integrated RDMA over Converged Ethernet (RoCE v2) engines on-chip. - -On the software side, the PyTorch Habana bridge interfaces between the framework and SynapseAI software stack to enable the execution of deep learning models on the Habana Gaudi device. - -Gaudi offers a substantial price/performance advantage -- so you get to do more deep learning training while spending less. - -For more information, check out `Gaudi Architecture `__ and `Gaudi Developer Docs `__. - ----- - -Run on 1 Gaudi --------------- - -To enable PyTorch Lightning to utilize the HPU accelerator, simply provide ``accelerator="hpu"`` parameter to the Trainer class. - -.. code-block:: python - - trainer = Trainer(accelerator="hpu", devices=1) - ----- - -Run on multiple Gaudis ----------------------- -The ``devices=8`` and ``accelerator="hpu"`` parameters to the Trainer class enables the Habana accelerator for distributed training with 8 Gaudis. 
-It uses :class:`~pytorch_lightning.strategies.hpu_parallel.HPUParallelStrategy` internally which is based on DDP strategy with the addition of Habana's collective communication library (HCCL) to support scale-up within a node and scale-out across multiple nodes. - -.. code-block:: python - - trainer = Trainer(devices=8, accelerator="hpu") - ----- - -Select Gaudis automatically ---------------------------- - -Lightning can automatically detect the number of Gaudi devices to run on. This setting is enabled by default if the devices argument is missing. - -.. code-block:: python - - # equivalent - trainer = Trainer(accelerator="hpu") - trainer = Trainer(accelerator="hpu", devices="auto") - ----- - -How to access HPUs ------------------- - -To use HPUs, you must have access to a system with HPU devices. - -AWS -^^^ -You can either use `Gaudi-based AWS EC2 DL1 instances `__ or `Supermicro X12 Gaudi server `__ to get access to HPUs. - -Check out the `Get Started Guide with AWS and Habana `__. - ----- - -.. _known-limitations_hpu: - -Known limitations ------------------ - -* Multiple optimizers are not supported. -* `Habana dataloader `__ is not supported. -* :class:`~pytorch_lightning.callbacks.device_stats_monitor.DeviceStatsMonitor` is not supported. diff --git a/source/accelerators/hpu_intermediate.rst b/source/accelerators/hpu_intermediate.rst deleted file mode 100644 index 65dca85..0000000 --- a/source/accelerators/hpu_intermediate.rst +++ /dev/null @@ -1,68 +0,0 @@ -:orphan: - -.. _hpu_intermediate: - -Accelerator: HPU training -========================= -**Audience:** Gaudi chip users looking to save memory and scale models with mixed-precision training. - ----- - -Enable Mixed Precision ----------------------- - -Lightning also allows mixed precision training with HPUs. -By default, HPU training will use 32-bit precision. To enable mixed precision, set the ``precision`` flag. - -.. 
code-block:: python - - trainer = Trainer(devices=1, accelerator="hpu", precision=16) - ----- - -Customize Mixed Precision -------------------------- - -Internally, :class:`~pytorch_lightning.plugins.precision.hpu.HPUPrecisionPlugin` uses the Habana Mixed Precision (HMP) package to enable mixed precision training. - -You can execute the ops in FP32 or BF16 precision. The HMP package modifies the Python operators to add the appropriate cast operations for the arguments before execution. -The default settings let users enable mixed precision training easily with minimal code. - -In addition to the default settings in HMP, users also have the option of overriding these defaults and providing their -BF16 and FP32 operator lists by passing them as parameters to :class:`~pytorch_lightning.plugins.precision.hpu.HPUPrecisionPlugin`. - -The below snippet shows an example model using MNIST with a single Habana Gaudi device and making use of HMP by overriding the default parameters. -This enables advanced users to provide their own BF16 and FP32 operator list instead of using the HMP defaults. - -.. code-block:: python - - import pytorch_lightning as pl - from pytorch_lightning.plugins import HPUPrecisionPlugin - - # Initialize a trainer with HPU accelerator for HPU strategy for single device, - # with mixed precision using overridden HMP settings - trainer = pl.Trainer( - accelerator="hpu", - devices=1, - # Optional Habana mixed precision params to be set - # Checkout `pl_examples/hpu_examples/simple_mnist/ops_bf16_mnist.txt` for the format - plugins=[ - HPUPrecisionPlugin( - precision=16, - opt_level="O1", - verbose=False, - bf16_file_path="ops_bf16_mnist.txt", - fp32_file_path="ops_fp32_mnist.txt", - ) - ], - ) - - # Init our model - model = LitClassifier() - # Init the data - dm = MNISTDataModule(batch_size=batch_size) - - # Train the model ⚡ - trainer.fit(model, datamodule=dm) - -For more details, please refer to `PyTorch Mixed Precision Training on Gaudi `__. 
diff --git a/source/accelerators/ipu_basic.rst b/source/accelerators/ipu_basic.rst deleted file mode 100644 index 492c7bf..0000000 --- a/source/accelerators/ipu_basic.rst +++ /dev/null @@ -1,68 +0,0 @@ -:orphan: - -.. _ipu_basic: - -Accelerator: IPU training -========================= -**Audience:** Users looking to save money and run large models faster using single or multiple IPU devices. - ----- - -What is an IPU? ---------------- - -The Graphcore `Intelligence Processing Unit (IPU) `__, built for Artificial Intelligence and Machine Learning, consists of many individual cores, called *tiles*, allowing highly parallel computation. Due to the high bandwidth between tiles, IPUs facilitate machine learning loads where parallelization is essential. Because computation is heavily parallelized, - -IPUs operate in a different way to conventional accelerators such as CPU/GPUs. IPUs do not require large batch sizes for maximum parallelization, can provide optimizations across the compiled graph and rely on model parallelism to fully utilize tiles for larger models. - -IPUs are used to build IPU-PODs, rack-based systems of IPU-Machines for larger workloads. See the `IPU Architecture `__ for more information. - -See the `Graphcore Glossary `__ for the definitions of other IPU-specific terminology. - -.. note:: - IPU support is experimental and a work in progress (see :ref:`known-limitations`). If you run into any problems, please leave an issue. - ----- - -Run on 1 IPU ------------- -To use a single IPU, set the accelerator and devices argument. - -.. code-block:: python - - trainer = pl.Trainer(accelerator="ipu", devices=1) - ----- - -Run on multiple IPUs --------------------- -To use multiple IPUs set the devices to a number that is a power of 2 (i.e: 2, 4, 8, 16, ...) - -.. code-block:: python - - trainer = pl.Trainer(accelerator="ipu", devices=8) - ----- - -How to access IPUs ------------------- - -To use IPUs you must have access to a system with IPU devices. 
To get access see `get started `__. - -You must ensure that the IPU system has enabled the PopART and Poplar packages from the SDK. Instructions are in the Get Started guide for your IPU system, on the Graphcore `documents portal `__. - ----- - -.. _known-limitations: - -Known limitations ------------------ - -Currently there are some known limitations that are being addressed in the near future to make the experience seamless when moving from different devices. - -Please see the `MNIST example `__ which displays most of the limitations and how to overcome them till they are resolved. - -* ``self.log`` is not supported in the ``training_step``, ``validation_step``, ``test_step`` or ``predict_step``. This is due to the step function being traced and sent to the IPU devices. We're actively working on fixing this -* Multiple optimizers are not supported. ``training_step`` only supports returning one loss from the ``training_step`` function as a result -* Since the step functions are traced, branching logic or any form of primitive values are traced into constants. Be mindful as this could lead to errors in your custom code -* Clipping gradients is not supported diff --git a/source/accelerators/tpu_advanced.rst b/source/accelerators/tpu_advanced.rst deleted file mode 100644 index 0aa490e..0000000 --- a/source/accelerators/tpu_advanced.rst +++ /dev/null @@ -1,68 +0,0 @@ -:orphan: - -TPU training (Advanced) -======================= -**Audience:** Users looking to apply advanced performance techniques to TPU training. - ----- - -Weight Sharing/Tying --------------------- -Weight Tying/Sharing is a technique where in the module weights are shared among two or more layers. -This is a common method to reduce memory consumption and is utilized in many State of the Art -architectures today. - -PyTorch XLA requires these weights to be tied/shared after moving the model -to the TPU device. 
To support this requirement Lightning provides a model hook which is -called after the model is moved to the device. Any weights that need to be tied should -be tied in the `on_post_move_to_device` model hook. This will ensure that the weights -among the modules are shared and not copied. - -PyTorch Lightning has an inbuilt check which verifies that the model parameter lengths -match once the model is moved to the device. If the lengths do not match, Lightning -throws a warning message. - -Example: - -.. code-block:: python - - from pytorch_lightning.core.lightning import LightningModule - from torch import nn - from pytorch_lightning.trainer.trainer import Trainer - - - class WeightSharingModule(LightningModule): - def __init__(self): - super().__init__() - self.layer_1 = nn.Linear(32, 10, bias=False) - self.layer_2 = nn.Linear(10, 32, bias=False) - self.layer_3 = nn.Linear(32, 10, bias=False) - # TPU shared weights are copied independently - # on the XLA device and this line won't have any effect. - # However, it works fine for CPU and GPU. - self.layer_3.weight = self.layer_1.weight - - def forward(self, x): - x = self.layer_1(x) - x = self.layer_2(x) - x = self.layer_3(x) - return x - - def on_post_move_to_device(self): - # Weights shared after the model has been moved to TPU Device - self.layer_3.weight = self.layer_1.weight - - - model = WeightSharingModule() - trainer = Trainer(max_epochs=1, accelerator="tpu", devices=8) - -See `XLA Documentation `_ - ----- - -XLA ---- -XLA is the library that interfaces PyTorch with the TPUs. -For more information check out `XLA `_. - -Guide for `troubleshooting XLA `_ diff --git a/source/accelerators/tpu_basic.rst b/source/accelerators/tpu_basic.rst deleted file mode 100644 index af7c45f..0000000 --- a/source/accelerators/tpu_basic.rst +++ /dev/null @@ -1,255 +0,0 @@ -:orphan: - -TPU training (Basic) -==================== -**Audience:** Users looking to train on single or multiple TPU cores. - ----- - -.. 
raw:: html - - - -| - -Lightning supports running on TPUs. At this moment, TPUs are available -on Google Cloud (GCP), Google Colab and Kaggle Environments. For more information on TPUs -`watch this video `_. - ----------------- - -What is a TPU? --------------- -Tensor Processing Unit (TPU) is an AI accelerator application-specific integrated circuit (ASIC) developed by Google specifically for neural networks. - -A TPU has 8 cores where each core is optimized for 128x128 matrix multiplies. In general, a single TPU is about as fast as 5 V100 GPUs! - -A TPU pod hosts many TPUs on it. Currently, TPU v3 Pod has up to 2048 TPU cores and 32 TiB of memory! -You can request a full pod from Google cloud or a "slice" which gives you -some subset of those 2048 cores. - ----- - -Run on 1 TPU core ------------------ -Enable the following Trainer arguments to run on 1 TPU. - -.. code:: - - trainer = Trainer(accelerator="tpu", devices=1) - ----- - -Run on multiple TPU cores -------------------------- -For multiple TPU cores, change the value of the devices flag. - -.. code:: - - trainer = Trainer(accelerator="tpu", devices=8) - ----- - -Run on a specific TPU core --------------------------- - -To run on a specific core, specify the index of the TPU core. - -.. code-block:: python - - trainer = pl.Trainer(accelerator="tpu", devices=[5]) - -This example runs on the 5th core, not on five cores. - ----- - -How to access TPUs ------------------- -To access TPUs, there are three main ways. - -Google Colab -^^^^^^^^^^^^ -Colab is like a jupyter notebook with a free GPU or TPU -hosted on GCP. - -To get a TPU on colab, follow these steps: - -1. Go to `https://colab.research.google.com/ `_. - -2. Click "new notebook" (bottom right of pop-up). - -3. Click runtime > change runtime settings. Select Python 3, and hardware accelerator "TPU". - This will give you a TPU with 8 cores. - -4. Next, insert this code into the first cell and execute. 
- This will install the xla library that interfaces between PyTorch and the TPU. - - .. code-block:: - - !pip install cloud-tpu-client==0.10 https://storage.googleapis.com/tpu-pytorch/wheels/torch_xla-1.9-cp37-cp37m-linux_x86_64.whl - -5. Once the above is done, install PyTorch Lightning. - - .. code-block:: - - !pip install pytorch-lightning - -6. Then set up your LightningModule as normal. - -Google Cloud (GCP) -^^^^^^^^^^^^^^^^^^ -? - -Kaggle -^^^^^^ -For starting Kaggle projects with TPUs, refer to this `kernel `_. - ----- - -Optimize Performance --------------------- - -The TPU was designed for specific workloads and operations to carry out large volumes of matrix multiplication, -convolution operations and other commonly used ops in applied deep learning. -The specialization makes it a strong choice for NLP tasks, sequential convolutional networks, and under low precision operation. -There are cases in which training on TPUs is slower when compared with GPUs, for possible reasons listed: - -- Too small batch size. -- Explicit evaluation of tensors during training, e.g. ``tensor.item()`` -- Tensor shapes (e.g. model inputs) change often during training. -- Limited resources when using TPU's with PyTorch `Link `_ -- XLA Graph compilation during the initial steps `Reference `_ -- Some tensor ops are not fully supported on TPU, or not supported at all. These operations will be performed on CPU (context switch). -- PyTorch integration is still experimental. Some performance bottlenecks may simply be the result of unfinished implementation. - -The official PyTorch XLA `performance guide `_ -has more detailed information on how PyTorch code can be optimized for TPU. In particular, the -`metrics report `_ allows -one to identify operations that lead to context switching. - ----- - -FAQ ---- - -**XLA configuration is missing** - -.. 
code-block:: - - File "/usr/local/lib/python3.8/dist-packages/torch_xla/core/xla_model.py", line 18, in - _DEVICES = xu.LazyProperty(lambda: torch_xla._XLAC._xla_get_devices()) - RuntimeError: tensorflow/compiler/xla/xla_client/computation_client.cc:273 : Missing XLA configuration - Traceback (most recent call last): - ... - File "/home/kaushikbokka/pytorch-lightning/pytorch_lightning/utilities/device_parser.py", line 125, in parse_tpu_cores - raise MisconfigurationException('No TPU devices were found.') - pytorch_lightning.utilities.exceptions.MisconfigurationException: No TPU devices were found. - -This means the system is missing XLA configuration. You would need to set up XRT TPU device configuration. - -For TPUVM architecture, you could set it in your terminal by: - -.. code-block:: bash - - export XRT_TPU_CONFIG="localservice;0;localhost:51011" - -And for the old TPU + 2VM architecture, you could set it by: - -.. code-block:: bash - - export TPU_IP_ADDRESS=10.39.209.42 # You could get the IP Address in the GCP TPUs section - export XRT_TPU_CONFIG="tpu_worker;0;$TPU_IP_ADDRESS:8470" - ----- - -**How to clear up the programs using TPUs in the background** - -.. code-block:: bash - - lsof -w /lib/libtpu.so | grep "python" | awk '{print $2}' | xargs -r kill -9 - -Sometimes, there can still be old programs running on the TPUs, which would make the TPUs unavailable to use. You could use the above command in the terminal to kill the running processes. - ----- - -**Replication issue** - -.. 
code-block:: - - File "/usr/local/lib/python3.6/dist-packages/torch_xla/core/xla_model.py", line 200, in set_replication - replication_devices = xla_replication_devices(devices) - File "/usr/local/lib/python3.6/dist-packages/torch_xla/core/xla_model.py", line 187, in xla_replication_devices - .format(len(local_devices), len(kind_devices))) - RuntimeError: Cannot replicate if number of devices (1) is different from 8 - -This error is raised when the XLA device is called outside the spawn process. Internally in `TPUSpawn` Strategy for training on multiple tpu cores, we use XLA's `xmp.spawn`. -Don't use ``xm.xla_device()`` while working on Lightning + TPUs! - ----- - -**Unsupported datatype transfer to TPU** - -.. code-block:: - - File "/usr/local/lib/python3.8/dist-packages/torch_xla/utils/utils.py", line 205, in _for_each_instance_rewrite - v = _for_each_instance_rewrite(result.__dict__[k], select_fn, fn, rwmap) - File "/usr/local/lib/python3.8/dist-packages/torch_xla/utils/utils.py", line 206, in _for_each_instance_rewrite - result.__dict__[k] = v - TypeError: 'mappingproxy' object does not support item assignment - -PyTorch XLA only supports Tensor objects for CPU to TPU data transfer. Might cause issues if the User is trying to send some non-tensor objects through the DataLoader or during saving states. - ----- - -**Using `tpu_spawn_debug` Strategy alias** - -.. code-block:: python - - import pytorch_lightning as pl - - my_model = MyLightningModule() - trainer = pl.Trainer(accelerator="tpu", devices=8, strategy="tpu_spawn_debug") - trainer.fit(my_model) - -Example Metrics report: - -.. 
code-block:: - - Metric: CompileTime - TotalSamples: 202 - Counter: 06m09s401ms746.001us - ValueRate: 778ms572.062us / second - Rate: 0.425201 / second - Percentiles: 1%=001ms32.778us; 5%=001ms61.283us; 10%=001ms79.236us; 20%=001ms110.973us; 50%=001ms228.773us; 80%=001ms339.183us; 90%=001ms434.305us; 95%=002ms921.063us; 99%=21s102ms853.173us - - -A lot of PyTorch operations aren't lowered to XLA, which could lead to significant slowdown of the training process. -These operations are moved to the CPU memory and evaluated, and then the results are transferred back to the XLA device(s). -By using the `tpu_spawn_debug` Strategy, users could create a metrics report to diagnose issues. - -The report includes things like (`XLA Reference `_): - -* how many times we issue XLA compilations and time spent on issuing. -* how many times we execute and time spent on execution -* how many device data handles we create/destroy etc. - ----- - -**TPU Pod Training Startup script** - -All TPU VMs in a Pod setup are required to access the model code and data. -One easy way to achieve this is to use the following startup script when creating the TPU VM pod. -It will perform the data downloading on all TPU VMs. Note that you need to export the corresponding environment variables following the instruction in Create TPU Node. - -.. code-block:: bash - - gcloud alpha compute tpus tpu-vm create ${TPU_NAME} --zone ${ZONE} --project ${PROJECT_ID} --accelerator-type v3-32 --version ${RUNTIME_VERSION} --metadata startup-script=setup.py - -Then users could ssh to any TPU worker, e.g. worker 0, check if data/model downloading is finished and -start the training after generating the ssh-keys to ssh between VM workers on a pod: - -.. 
code-block:: bash - - python3 -m torch_xla.distributed.xla_dist --tpu=$TPU_NAME -- python3 train.py --max_epochs=5 --batch_size=32 diff --git a/source/accelerators/tpu_faq.rst b/source/accelerators/tpu_faq.rst deleted file mode 100644 index af7c45f..0000000 --- a/source/accelerators/tpu_faq.rst +++ /dev/null @@ -1,255 +0,0 @@ -:orphan: - -TPU training (Basic) -==================== -**Audience:** Users looking to train on single or multiple TPU cores. - ----- - -.. raw:: html - - - -| - -Lightning supports running on TPUs. At this moment, TPUs are available -on Google Cloud (GCP), Google Colab and Kaggle Environments. For more information on TPUs -`watch this video `_. - ----------------- - -What is a TPU? --------------- -Tensor Processing Unit (TPU) is an AI accelerator application-specific integrated circuit (ASIC) developed by Google specifically for neural networks. - -A TPU has 8 cores where each core is optimized for 128x128 matrix multiplies. In general, a single TPU is about as fast as 5 V100 GPUs! - -A TPU pod hosts many TPUs on it. Currently, TPU v3 Pod has up to 2048 TPU cores and 32 TiB of memory! -You can request a full pod from Google cloud or a "slice" which gives you -some subset of those 2048 cores. - ----- - -Run on 1 TPU core ------------------ -Enable the following Trainer arguments to run on 1 TPU. - -.. code:: - - trainer = Trainer(accelerator="tpu", devices=1) - ----- - -Run on multiple TPU cores -------------------------- -For multiple TPU cores, change the value of the devices flag. - -.. code:: - - trainer = Trainer(accelerator="tpu", devices=8) - ----- - -Run on a specific TPU core --------------------------- - -To run on a specific core, specify the index of the TPU core. - -.. code-block:: python - - trainer = pl.Trainer(accelerator="tpu", devices=[5]) - -This example runs on the 5th core, not on five cores. - ----- - -How to access TPUs ------------------- -To access TPUs, there are three main ways. 
- -Google Colab -^^^^^^^^^^^^ -Colab is like a jupyter notebook with a free GPU or TPU -hosted on GCP. - -To get a TPU on colab, follow these steps: - -1. Go to `https://colab.research.google.com/ `_. - -2. Click "new notebook" (bottom right of pop-up). - -3. Click runtime > change runtime settings. Select Python 3, and hardware accelerator "TPU". - This will give you a TPU with 8 cores. - -4. Next, insert this code into the first cell and execute. - This will install the xla library that interfaces between PyTorch and the TPU. - - .. code-block:: - - !pip install cloud-tpu-client==0.10 https://storage.googleapis.com/tpu-pytorch/wheels/torch_xla-1.9-cp37-cp37m-linux_x86_64.whl - -5. Once the above is done, install PyTorch Lightning. - - .. code-block:: - - !pip install pytorch-lightning - -6. Then set up your LightningModule as normal. - -Google Cloud (GCP) -^^^^^^^^^^^^^^^^^^ -? - -Kaggle -^^^^^^ -For starting Kaggle projects with TPUs, refer to this `kernel `_. - ----- - -Optimize Performance --------------------- - -The TPU was designed for specific workloads and operations to carry out large volumes of matrix multiplication, -convolution operations and other commonly used ops in applied deep learning. -The specialization makes it a strong choice for NLP tasks, sequential convolutional networks, and under low precision operation. -There are cases in which training on TPUs is slower when compared with GPUs, for possible reasons listed: - -- Too small batch size. -- Explicit evaluation of tensors during training, e.g. ``tensor.item()`` -- Tensor shapes (e.g. model inputs) change often during training. -- Limited resources when using TPU's with PyTorch `Link `_ -- XLA Graph compilation during the initial steps `Reference `_ -- Some tensor ops are not fully supported on TPU, or not supported at all. These operations will be performed on CPU (context switch). -- PyTorch integration is still experimental. 
Some performance bottlenecks may simply be the result of unfinished implementation. - -The official PyTorch XLA `performance guide `_ -has more detailed information on how PyTorch code can be optimized for TPU. In particular, the -`metrics report `_ allows -one to identify operations that lead to context switching. - ----- - -FAQ ---- - -**XLA configuration is missing** - -.. code-block:: - - File "/usr/local/lib/python3.8/dist-packages/torch_xla/core/xla_model.py", line 18, in - _DEVICES = xu.LazyProperty(lambda: torch_xla._XLAC._xla_get_devices()) - RuntimeError: tensorflow/compiler/xla/xla_client/computation_client.cc:273 : Missing XLA configuration - Traceback (most recent call last): - ... - File "/home/kaushikbokka/pytorch-lightning/pytorch_lightning/utilities/device_parser.py", line 125, in parse_tpu_cores - raise MisconfigurationException('No TPU devices were found.') - pytorch_lightning.utilities.exceptions.MisconfigurationException: No TPU devices were found. - -This means the system is missing XLA configuration. You would need to set up XRT TPU device configuration. - -For TPUVM architecture, you could set it in your terminal by: - -.. code-block:: bash - - export XRT_TPU_CONFIG="localservice;0;localhost:51011" - -And for the old TPU + 2VM architecture, you could set it by: - -.. code-block:: bash - - export TPU_IP_ADDRESS=10.39.209.42 # You could get the IP Address in the GCP TPUs section - export XRT_TPU_CONFIG="tpu_worker;0;$TPU_IP_ADDRESS:8470" - ----- - -**How to clear up the programs using TPUs in the background** - -.. code-block:: bash - - lsof -w /lib/libtpu.so | grep "python" | awk '{print $2}' | xargs -r kill -9 - -Sometimes, there can still be old programs running on the TPUs, which would make the TPUs unavailable to use. You could use the above command in the terminal to kill the running processes. - ----- - -**Replication issue** - -.. 
code-block:: - - File "/usr/local/lib/python3.6/dist-packages/torch_xla/core/xla_model.py", line 200, in set_replication - replication_devices = xla_replication_devices(devices) - File "/usr/local/lib/python3.6/dist-packages/torch_xla/core/xla_model.py", line 187, in xla_replication_devices - .format(len(local_devices), len(kind_devices))) - RuntimeError: Cannot replicate if number of devices (1) is different from 8 - -This error is raised when the XLA device is called outside the spawn process. Internally in `TPUSpawn` Strategy for training on multiple tpu cores, we use XLA's `xmp.spawn`. -Don't use ``xm.xla_device()`` while working on Lightning + TPUs! - ----- - -**Unsupported datatype transfer to TPU** - -.. code-block:: - - File "/usr/local/lib/python3.8/dist-packages/torch_xla/utils/utils.py", line 205, in _for_each_instance_rewrite - v = _for_each_instance_rewrite(result.__dict__[k], select_fn, fn, rwmap) - File "/usr/local/lib/python3.8/dist-packages/torch_xla/utils/utils.py", line 206, in _for_each_instance_rewrite - result.__dict__[k] = v - TypeError: 'mappingproxy' object does not support item assignment - -PyTorch XLA only supports Tensor objects for CPU to TPU data transfer. Might cause issues if the User is trying to send some non-tensor objects through the DataLoader or during saving states. - ----- - -**Using `tpu_spawn_debug` Strategy alias** - -.. code-block:: python - - import pytorch_lightning as pl - - my_model = MyLightningModule() - trainer = pl.Trainer(accelerator="tpu", devices=8, strategy="tpu_spawn_debug") - trainer.fit(my_model) - -Example Metrics report: - -.. 
code-block:: - - Metric: CompileTime - TotalSamples: 202 - Counter: 06m09s401ms746.001us - ValueRate: 778ms572.062us / second - Rate: 0.425201 / second - Percentiles: 1%=001ms32.778us; 5%=001ms61.283us; 10%=001ms79.236us; 20%=001ms110.973us; 50%=001ms228.773us; 80%=001ms339.183us; 90%=001ms434.305us; 95%=002ms921.063us; 99%=21s102ms853.173us - - -A lot of PyTorch operations aren't lowered to XLA, which could lead to significant slowdown of the training process. -These operations are moved to the CPU memory and evaluated, and then the results are transferred back to the XLA device(s). -By using the `tpu_spawn_debug` Strategy, users could create a metrics report to diagnose issues. - -The report includes things like (`XLA Reference `_): - -* how many times we issue XLA compilations and time spent on issuing. -* how many times we execute and time spent on execution -* how many device data handles we create/destroy etc. - ----- - -**TPU Pod Training Startup script** - -All TPU VMs in a Pod setup are required to access the model code and data. -One easy way to achieve this is to use the following startup script when creating the TPU VM pod. -It will perform the data downloading on all TPU VMs. Note that you need to export the corresponding environment variables following the instruction in Create TPU Node. - -.. code-block:: bash - - gcloud alpha compute tpus tpu-vm create ${TPU_NAME} --zone ${ZONE} --project ${PROJECT_ID} --accelerator-type v3-32 --version ${RUNTIME_VERSION} --metadata startup-script=setup.py - -Then users could ssh to any TPU worker, e.g. worker 0, check if data/model downloading is finished and -start the training after generating the ssh-keys to ssh between VM workers on a pod: - -.. 
code-block:: bash - - python3 -m torch_xla.distributed.xla_dist --tpu=$TPU_NAME -- python3 train.py --max_epochs=5 --batch_size=32 diff --git a/source/accelerators/tpu_intermediate.rst b/source/accelerators/tpu_intermediate.rst deleted file mode 100644 index 826f568..0000000 --- a/source/accelerators/tpu_intermediate.rst +++ /dev/null @@ -1,113 +0,0 @@ -:orphan: - -TPU training (Intermediate) -=========================== -**Audience:** Users looking to use cloud TPUs. - ----- - -DistributedSamplers -------------------- -Lightning automatically inserts the correct samplers - no need to do this yourself! - -Usually, with TPUs (and DDP), you would need to define a DistributedSampler to move the right -chunk of data to the appropriate TPU. As mentioned, this is not needed in Lightning - -.. note:: Don't add distributedSamplers. Lightning does this automatically - -If for some reason you still need to, this is how to construct the sampler -for TPU use - -.. code-block:: python - - import torch_xla.core.xla_model as xm - - - def train_dataloader(self): - dataset = MNIST(os.getcwd(), train=True, download=True, transform=transforms.ToTensor()) - - # required for TPU support - sampler = None - if use_tpu: - sampler = torch.utils.data.distributed.DistributedSampler( - dataset, num_replicas=xm.xrt_world_size(), rank=xm.get_ordinal(), shuffle=True - ) - - loader = DataLoader(dataset, sampler=sampler, batch_size=32) - - return loader - -Configure the number of TPU cores in the trainer. You can only choose 1 or 8. -To use a full TPU pod skip to the TPU pod section. - -.. code-block:: python - - import pytorch_lightning as pl - - my_model = MyLightningModule() - trainer = pl.Trainer(accelerator="tpu", devices=8) - trainer.fit(my_model) - -That's it! Your model will train on all 8 TPU cores. - ----------------- - -Distributed Backend with TPU ----------------------------- -The ``accelerator`` option used for GPUs does not apply to TPUs. 
-TPUs work in DDP mode by default (distributing over each core) - ----------------- - -TPU VM ------- -Lightning supports training on the new Cloud TPU VMs. -Previously, we needed separate VMs to connect to the TPU machines, but as -Cloud TPU VMs run on the TPU Host machines, it allows direct SSH access -for the users. Hence, this architecture upgrade leads to cheaper and significantly -better performance and usability while working with TPUs. - -The TPUVMs come pre-installed with latest versions of PyTorch and PyTorch XLA. -After connecting to the VM and before running your Lightning code, you would need -to set the XRT TPU device configuration. - -.. code-block:: bash - - $ export XRT_TPU_CONFIG="localservice;0;localhost:51011" - -You could learn more about the Cloud TPU VM architecture `here `_ - ----------------- - -TPU Pod -------- -To train on more than 8 cores, your code actually doesn't change! -All you need to do is submit the following command: - -.. code-block:: bash - - $ python -m torch_xla.distributed.xla_dist - --tpu=$TPU_POD_NAME - --conda-env=torch-xla-nightly - -- python /usr/share/torch-xla-1.8.1/pytorch/xla/test/test_train_imagenet.py --fake_data - -See `this guide `_ -on how to set up the instance groups and VMs needed to run TPU Pods. - ----------------- - -16 bit precision ----------------- -Lightning also supports training in 16-bit precision with TPUs. -By default, TPU training will use 32-bit precision. To enable 16-bit, -set the 16-bit flag. - -.. code-block:: python - - import pytorch_lightning as pl - - my_model = MyLightningModule() - trainer = pl.Trainer(accelerator="tpu", devices=8, precision=16) - trainer.fit(my_model) - -Under the hood the xla library will use the `bfloat16 type `_. diff --git a/source/advanced/model_parallel.rst b/source/advanced/model_parallel.rst deleted file mode 100644 index 811bc57..0000000 --- a/source/advanced/model_parallel.rst +++ /dev/null @@ -1,905 +0,0 @@ -.. 
_model-parallel: - -Train 1 trillion+ parameter models -================================== - -When training large models, fitting larger batch sizes, or trying to increase throughput using multi-GPU compute, Lightning provides advanced optimized distributed training strategies to support these cases and offer substantial improvements in memory usage. - -In many cases these strategies are some flavour of model parallelism however we only introduce concepts at a high level to get you started. Refer to the `FairScale documentation `_ for more information about model parallelism. - -Note that some of the extreme memory saving configurations will affect the speed of training. This Speed/Memory trade-off in most cases can be adjusted. - -Some of these memory-efficient strategies rely on offloading onto other forms of memory, such as CPU RAM or NVMe. This means you can even see memory benefits on a **single GPU**, using a strategy such as :ref:`deepspeed-zero-stage-3-offload`. - -Check out this amazing video explaining model parallelism and how it works behind the scenes: - -.. raw:: html - - - - -Choosing an Advanced Distributed GPU Strategy -^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ - -If you would like to stick with PyTorch DDP, see :ref:`ddp-optimizations`. - -Unlike :class:`~torch.nn.parallel.DistributedDataParallel` (DDP) where the maximum trainable model size and batch size do not change with respect to the number of GPUs, memory-optimized strategies can accommodate bigger models and larger batches as more GPUs are used. This means as you scale up the number of GPUs, you can reach the number of model parameters you'd like to train. - -There are many considerations when choosing a strategy as described below. In addition, check out the visualization of various strategy benchmarks using `minGPT `__ `here `__. - -Pre-training vs Fine-tuning -""""""""""""""""""""""""""" - -When fine-tuning, we often use a magnitude less data compared to pre-training a model. 
This is important when choosing a distributed strategy as usually for pre-training, **we are compute-bound**. -This means we cannot sacrifice throughput as much as if we were fine-tuning, because in fine-tuning the data requirement is smaller. - -Overall: - -* When **fine-tuning** a model, use advanced memory efficient strategies such as :ref:`deepspeed-zero-stage-3` or :ref:`deepspeed-zero-stage-3-offload`, allowing you to fine-tune larger models if you are limited on compute -* When **pre-training** a model, use simpler optimizations such as :ref:`sharded-training`, :ref:`deepspeed-zero-stage-2` or :ref:`fully-sharded-training`, scaling the number of GPUs to reach larger parameter sizes -* For both fine-tuning and pre-training, use :ref:`deepspeed-activation-checkpointing` or :ref:`fairscale-activation-checkpointing` as the throughput degradation is not significant - -For example when using 128 GPUs, you can **pre-train** large 10 to 20 Billion parameter models using :ref:`deepspeed-zero-stage-2` without having to take a performance hit with a more advanced optimized multi-gpu strategy. - -But for **fine-tuning** a model, you can reach 10 to 20 Billion parameter models using :ref:`deepspeed-zero-stage-3-offload` on a **single GPU**. This does come with a significant throughput hit, which needs to be weighed accordingly. - -When Shouldn't I use an Optimized Distributed Strategy? -""""""""""""""""""""""""""""""""""""""""""""""""""""""" - -Sharding techniques help when model sizes are fairly large; roughly 500M+ parameters is where we've seen benefits. However, in the following cases, we recommend sticking to ordinary distributed strategies: -* When your model is small (ResNet50 of around 80M Parameters), unless you are using unusually large batch sizes or inputs. -* Due to high distributed communication between devices, if running on a slow network/interconnect, the training might be much slower than expected and then it's up to you to determine the tradeoff here.
- ----------- - -.. _sharded-training: - -Sharded Training -^^^^^^^^^^^^^^^^ -Lightning integrates the optimizer sharded training provided by `FairScale `_. -The technique can be found within `DeepSpeed ZeRO `_ and -`ZeRO-2 `_, -however the implementation is built from the ground up to be PyTorch compatible and standalone. -Sharded Training allows you to maintain GPU scaling efficiency, whilst reducing memory overhead drastically. In short, expect near-normal linear scaling (if your network allows), and significantly reduced memory usage when training large models. - -Sharded Training still utilizes Data Parallel Training under the hood, except optimizer states and gradients are sharded across GPUs. -This means the memory overhead per GPU is lower, as each GPU only has to maintain a partition of your optimizer state and gradients. - -The benefits vary by model and parameter sizes, but we've recorded up to a 63% memory reduction per GPU allowing us to double our model sizes. Because of efficient communication, -these benefits in multi-GPU setups are almost free and throughput scales well with multi-node setups. - -It is highly recommended to use Sharded Training in multi-GPU environments where memory is limited, or where training larger models is beneficial (500M+ parameter models). -A technical note: as batch size scales, storing activations for the backwards pass becomes the bottleneck in training. As a result, sharding optimizer state and gradients becomes less impactful. -Use :ref:`fairscale-activation-checkpointing` to see even more benefit at the cost of some throughput. - -To use Sharded Training, you need to first install FairScale using the command below. - -.. code-block:: bash - - pip install fairscale - - -..
code-block:: python - - # train using Sharded DDP - trainer = Trainer(strategy="ddp_sharded") - -Sharded Training can work across all DDP variants by adding the additional ``--strategy ddp_sharded`` flag via command line using a PyTorch Lightning script. - -Internally we re-initialize your optimizers and shard them across your machines and processes. We handle all communication using PyTorch distributed, so no code changes are required. - ----------- - -.. _fully-sharded-training: - -Fully Sharded Training -^^^^^^^^^^^^^^^^^^^^^^ - -.. warning:: - Fully Sharded Training is in beta and the API is subject to change. Please create an `issue `_ if you run into any issues. - -`Fully Sharded `__ shards optimizer state, gradients and parameters across data parallel workers. This allows you to fit much larger models onto multiple GPUs into memory. - -Fully Sharded Training alleviates the need to worry about balancing layers onto specific devices using some form of pipe parallelism, and optimizes for distributed communication with minimal effort. - -Shard Parameters to Reach 10+ Billion Parameters -"""""""""""""""""""""""""""""""""""""""""""""""" - -To reach larger parameter sizes and be memory efficient, we have to shard parameters. There are various ways to enable this. - -.. note:: - Currently Fully Sharded Training relies on the user to wrap the model with Fully Sharded within the ``LightningModule``. - This means you must create a single model that is treated as a ``torch.nn.Module`` within the ``LightningModule``. - This is a limitation of Fully Sharded Training that will be resolved in the future. - -Enabling Module Sharding for Maximum Memory Efficiency -"""""""""""""""""""""""""""""""""""""""""""""""""""""" - -To activate parameter sharding, you must wrap your model using provided ``wrap`` or ``auto_wrap`` functions as described below. 
Internally in Lightning, we enable a context manager around the ``configure_sharded_model`` function to make sure the ``wrap`` and ``auto_wrap`` parameters are passed correctly. - -When not using Fully Sharded these wrap functions are a no-op. This means once the changes have been made, there is no need to remove the changes for other strategies. - -``auto_wrap`` will recursively wrap :class:`~torch.nn.Module` within the ``LightningModule`` with nested Fully Sharded Wrappers, -signalling that we'd like to partition these modules across data parallel devices, discarding the full weights when not required (information :class:`here `). - -``auto_wrap`` can have varying level of success based on the complexity of your model. **Auto Wrap does not support models with shared parameters**. - -``wrap`` will simply wrap the module with a Fully Sharded Parallel class with the correct parameters from the Lightning context manager. - -Below is an example of using both ``wrap`` and ``auto_wrap`` to create your model. - -.. code-block:: python - - import torch - import torch.nn as nn - import pytorch_lightning as pl - from pytorch_lightning import Trainer - from fairscale.nn import checkpoint_wrapper, auto_wrap, wrap - - - class MyModel(pl.LightningModule): - def __init__(self): - super().__init__() - self.linear_layer = nn.Linear(32, 32) - self.block = nn.Sequential(nn.Linear(32, 32), nn.ReLU()) - self.final_block = nn.Sequential(nn.Linear(32, 32), nn.ReLU()) - - def configure_sharded_model(self): - # modules are sharded across processes - # as soon as they are wrapped with ``wrap`` or ``auto_wrap``. - # During the forward/backward passes, weights get synced across processes - # and de-allocated once computation is complete, saving memory. 
- - # Wraps the layer in a Fully Sharded Wrapper automatically - linear_layer = wrap(self.linear_layer) - - # Wraps the module recursively - # based on a minimum number of parameters (default 100M parameters) - block = auto_wrap(self.block) - - # For best memory efficiency, - # add FairScale activation checkpointing - final_block = auto_wrap(checkpoint_wrapper(self.final_block)) - self.model = nn.Sequential(linear_layer, nn.ReLU(), block, final_block) - - def configure_optimizers(self): - return torch.optim.AdamW(self.model.parameters()) - - - model = MyModel() - trainer = Trainer(accelerator="gpu", devices=4, strategy="fsdp", precision=16) - trainer.fit(model) - - trainer.test() - trainer.predict() - - ----------- - -.. _fairscale-activation-checkpointing: - -FairScale Activation Checkpointing -^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ - -Activation checkpointing frees activations from memory as soon as they are not needed during the forward pass. They are then re-computed for the backwards pass as needed. Activation checkpointing is very useful when you have intermediate layers that produce large activations. - -FairScale's checkpointing wrapper also handles batch norm layers correctly unlike the PyTorch implementation, ensuring stats are tracked correctly due to the multiple forward passes. - -This saves memory when training larger models; however, it requires wrapping the modules you'd like to use activation checkpointing on. See :class:`here ` for more information. - -.. warning:: - - Make sure not to wrap the entire model with activation checkpointing. This is not the intended usage of activation checkpointing, and will lead to failures as seen in `this discussion `__. - -..
code-block:: python - - from pytorch_lightning import Trainer - from fairscale.nn import checkpoint_wrapper - - - class MyModel(pl.LightningModule): - def __init__(self): - super().__init__() - # Wrap layers using checkpoint_wrapper - self.block_1 = checkpoint_wrapper(nn.Sequential(nn.Linear(32, 32), nn.ReLU())) - self.block_2 = nn.Linear(32, 2) - - -.. _deepspeed_advanced: - -DeepSpeed -^^^^^^^^^ - -.. note:: - The DeepSpeed strategy is in beta and the API is subject to change. Please create an `issue `_ if you run into any issues. - -`DeepSpeed `__ is a deep learning training optimization library, providing the means to train massive billion parameter models at scale. -Using the DeepSpeed strategy, we were able to **train model sizes of 10 Billion parameters and above**, with a lot of useful information in this `benchmark `_ and the `DeepSpeed docs `__. -DeepSpeed also offers lower level training optimizations, and efficient optimizers such as `1-bit Adam `_. We recommend using DeepSpeed in environments where speed and memory optimizations are important (such as training large billion parameter models). - -Below is a summary of all the configurations of DeepSpeed. - -* :ref:`deepspeed-zero-stage-1` - **Shard optimizer states**, remains at speed parity with DDP whilst providing memory improvement - -* :ref:`deepspeed-zero-stage-2` - **Shard optimizer states and gradients**, remains at speed parity with DDP whilst providing even more memory improvement - -* :ref:`deepspeed-zero-stage-2-offload` - **Offload optimizer states and gradients to CPU**. Increases distributed communication volume and GPU-CPU device transfer, but provides significant memory improvement - -* :ref:`deepspeed-zero-stage-3` - **Shard optimizer states, gradients, parameters and optionally activations**. 
Increases distributed communication volume, but provides even more memory improvement - -* :ref:`deepspeed-zero-stage-3-offload` - **Offload optimizer states, gradients, parameters and optionally activations to CPU**. Increases distributed communication volume and GPU-CPU device transfer, but even more significant memory improvement. - -* :ref:`deepspeed-activation-checkpointing` - **Free activations after forward pass**. Increases computation, but provides memory improvement for all stages. - -To use DeepSpeed, you first need to install DeepSpeed using the commands below. - -.. code-block:: bash - - pip install deepspeed - -If you run into an issue with the install or later in training, ensure that the CUDA version of the PyTorch you've installed matches your locally installed CUDA (you can see which one has been recognized by running ``nvcc --version``). - -.. note:: - - DeepSpeed currently only supports single optimizer, single scheduler within the training loop. - - When saving a checkpoint we rely on DeepSpeed which saves a directory containing the model and various components. - - -.. _deepspeed-zero-stage-1: - -DeepSpeed ZeRO Stage 1 -"""""""""""""""""""""" - -`DeepSpeed ZeRO Stage 1 `_ partitions your optimizer states (Stage 1) across your GPUs to reduce memory. - -It is recommended to skip Stage 1 and use Stage 2, which comes with larger memory improvements and still remains efficient. Stage 1 is useful to pair with certain optimizations such as `Torch ORT `__. - -.. code-block:: python - - from pytorch_lightning import Trainer - - model = MyModel() - trainer = Trainer(accelerator="gpu", devices=4, strategy="deepspeed_stage_1", precision=16) - trainer.fit(model) - - -.. _deepspeed-zero-stage-2: - -DeepSpeed ZeRO Stage 2 -"""""""""""""""""""""" - -`DeepSpeed ZeRO Stage 2 `_ partitions your optimizer states (Stage 1) and your gradients (Stage 2) across your GPUs to reduce memory. 
In most cases, this is more efficient or at parity with DDP, primarily due to the optimized custom communications written by the DeepSpeed team. -As a result, benefits can also be seen on a single GPU. Do note that the default bucket sizes allocate around ``3.6GB`` of VRAM to use during distributed communications, which can be tweaked when instantiating the strategy described in a few sections below. - -.. code-block:: python - - from pytorch_lightning import Trainer - - model = MyModel() - trainer = Trainer(accelerator="gpu", devices=4, strategy="deepspeed_stage_2", precision=16) - trainer.fit(model) - -.. code-block:: bash - - python train.py --strategy deepspeed_stage_2 --precision 16 --accelerator 'gpu' --devices 4 - - -.. _deepspeed-zero-stage-2-offload: - -DeepSpeed ZeRO Stage 2 Offload -"""""""""""""""""""""""""""""" - -Below we show an example of running `ZeRO-Offload `_. ZeRO-Offload leverages the host CPU to offload optimizer memory/computation, reducing the overall memory consumption. - -.. code-block:: python - - from pytorch_lightning import Trainer - - model = MyModel() - trainer = Trainer(accelerator="gpu", devices=4, strategy="deepspeed_stage_2_offload", precision=16) - trainer.fit(model) - - -This can also be done via the command line using a PyTorch Lightning script: - -.. code-block:: bash - - python train.py --strategy deepspeed_stage_2_offload --precision 16 --accelerator 'gpu' --devices 4 - - -You can also modify the ZeRO-Offload parameters via the strategy as below. - -.. code-block:: python - - from pytorch_lightning import Trainer - from pytorch_lightning.strategies import DeepSpeedStrategy - - model = MyModel() - trainer = Trainer( - accelerator="gpu", - devices=4, - strategy=DeepSpeedStrategy(offload_optimizer=True, allgather_bucket_size=5e8, reduce_bucket_size=5e8), - precision=16, - ) - trainer.fit(model) - - -.. 
note:: - We suggest tuning the ``allgather_bucket_size`` parameter and ``reduce_bucket_size`` parameter to find optimum parameters based on your model size. - These control how large a buffer we limit the model to using when reducing gradients/gathering updated parameters. Smaller values will result in less memory, but tradeoff with speed. - - DeepSpeed allocates a reduce buffer size `multiplied by 1.5x `_ so take that into consideration when tweaking the parameters. - - The strategy sets a reasonable default of ``2e8``, which should work for most low VRAM GPUs (less than ``7GB``), allocating roughly ``3.6GB`` of VRAM as buffer. Higher VRAM GPUs should aim for values around ``5e8``. - -For even more speed benefit, DeepSpeed offers an optimized CPU version of ADAM called `DeepSpeedCPUAdam `_ to run the offloaded computation, which is faster than the standard PyTorch implementation. - -.. code-block:: python - - import pytorch_lightning - from pytorch_lightning import Trainer - from deepspeed.ops.adam import DeepSpeedCPUAdam - - - class MyModel(pl.LightningModule): - ... - - def configure_optimizers(self): - # DeepSpeedCPUAdam provides 5x to 7x speedup over torch.optim.adam(w) - return DeepSpeedCPUAdam(self.parameters()) - - - model = MyModel() - trainer = Trainer(accelerator="gpu", devices=4, strategy="deepspeed_stage_2_offload", precision=16) - trainer.fit(model) - - -.. _deepspeed-zero-stage-3: - -DeepSpeed ZeRO Stage 3 -"""""""""""""""""""""" - -DeepSpeed ZeRO Stage 3 shards the optimizer states, gradients and the model parameters (also optionally activations). Sharding model parameters and activations comes with an increase in distributed communication, however allows you to scale your models massively from one GPU to multiple GPUs. 
-**The DeepSpeed team report the ability to fine-tune models with over 40B parameters on a single GPU and over 2 Trillion parameters on 512 GPUs.** For more information we suggest checking the `DeepSpeed ZeRO-3 Offload documentation `__. - -We've run benchmarks for all these features and provided a simple example of how all these features work in Lightning, which you can see at `minGPT `_. - -To reach the highest memory efficiency or model size, you must: - -1. Use the DeepSpeed strategy with the stage 3 parameter -2. Use CPU Offloading to offload weights to CPU, plus have a reasonable amount of CPU RAM to offload onto -3. Use DeepSpeed Activation Checkpointing to shard activations - -Below we describe how to enable all of these to see benefit. **With all these improvements we reached 45 Billion parameters training a GPT model on 8 GPUs with ~1TB of CPU RAM available**. - -Also please have a look at our :ref:`deepspeed-zero-stage-3-tips` which contains a lot of helpful information when configuring your own models. - -.. note:: - - When saving a model using DeepSpeed and Stage 3, model states and optimizer states will be saved in separate sharded states (based on the world size). See :ref:`deepspeed-zero-stage-3-single-file` to obtain a single checkpoint file. - -.. code-block:: python - - from pytorch_lightning import Trainer - from deepspeed.ops.adam import FusedAdam - - - class MyModel(pl.LightningModule): - ... - - def configure_optimizers(self): - return FusedAdam(self.parameters()) - - - model = MyModel() - trainer = Trainer(accelerator="gpu", devices=4, strategy="deepspeed_stage_3", precision=16) - trainer.fit(model) - - trainer.test() - trainer.predict() - - -You can also use the Lightning Trainer to run predict or evaluate with DeepSpeed once the model has been trained. - -.. code-block:: python - - from pytorch_lightning import Trainer - - - class MyModel(pl.LightningModule): - ... 
- - - model = MyModel() - trainer = Trainer(accelerator="gpu", devices=4, strategy="deepspeed_stage_3", precision=16) - trainer.test(ckpt_path="my_saved_deepspeed_checkpoint.ckpt") - - -Shard Model Instantly to Reduce Initialization Time/Memory -"""""""""""""""""""""""""""""""""""""""""""""""""""""""""" - -When instantiating really large models, it is sometimes necessary to shard the model layers instantly. - -This is the case if layers may not fit in a single machine's CPU or GPU memory, but would fit once sharded across multiple machines. -We expose a hook in which any layers that are initialized will be sharded instantly on a per-layer basis, allowing you to instantly shard models. - -This reduces the time taken to initialize very large models, and ensures we do not run out of memory when instantiating larger models. For more information you can refer to the DeepSpeed docs for `Constructing Massive Models `_. - -.. code-block:: python - - import torch.nn as nn - from pytorch_lightning import Trainer - from deepspeed.ops.adam import FusedAdam - - - class MyModel(pl.LightningModule): - ... - - def configure_sharded_model(self): - # Created within sharded model context, modules are instantly sharded across processes - # as soon as they are made. - self.block = nn.Sequential(nn.Linear(32, 32), nn.ReLU()) - - def configure_optimizers(self): - return FusedAdam(self.parameters()) - - - model = MyModel() - trainer = Trainer(accelerator="gpu", devices=4, strategy="deepspeed_stage_3", precision=16) - trainer.fit(model) - - trainer.test() - trainer.predict() - - -.. _deepspeed-zero-stage-3-offload: - -DeepSpeed ZeRO Stage 3 Offload -"""""""""""""""""""""""""""""" - -DeepSpeed ZeRO Stage 3 Offloads optimizer state, gradients to the host CPU to reduce memory usage as ZeRO Stage 2 does, however additionally allows you to offload the parameters as well for even more memory saving. - -.. 
note:: - - When saving a model using DeepSpeed and Stage 3, model states and optimizer states will be saved in separate sharded states (based on the world size). See :ref:`deepspeed-zero-stage-3-single-file` to obtain a single checkpoint file. - -.. code-block:: python - - from pytorch_lightning import Trainer - from pytorch_lightning.strategies import DeepSpeedStrategy - - # Enable CPU Offloading - model = MyModel() - trainer = Trainer(accelerator="gpu", devices=4, strategy="deepspeed_stage_3_offload", precision=16) - trainer.fit(model) - - # Enable CPU Offloading, and offload parameters to CPU - model = MyModel() - trainer = Trainer( - accelerator="gpu", - devices=4, - strategy=DeepSpeedStrategy( - stage=3, - offload_optimizer=True, - offload_parameters=True, - ), - precision=16, - ) - trainer.fit(model) - - -DeepSpeed Infinity (NVMe Offloading) -"""""""""""""""""""""""""""""""""""" - -Additionally, DeepSpeed supports offloading to NVMe drives for even larger models, utilizing the large memory space found in NVMes. DeepSpeed `reports `__ the ability to fine-tune 1 Trillion+ parameters using NVMe Offloading on one 8 GPU machine. Below shows how to enable this, assuming the NVMe drive is mounted in a directory called ``/local_nvme``. - -.. 
code-block:: python - - from pytorch_lightning import Trainer - from pytorch_lightning.strategies import DeepSpeedStrategy - - # Enable CPU Offloading - model = MyModel() - trainer = Trainer(accelerator="gpu", devices=4, strategy="deepspeed_stage_3_offload", precision=16) - trainer.fit(model) - - # Enable CPU Offloading, and offload parameters to CPU - model = MyModel() - trainer = Trainer( - accelerator="gpu", - devices=4, - strategy=DeepSpeedStrategy( - stage=3, - offload_optimizer=True, - offload_parameters=True, - remote_device="nvme", - offload_params_device="nvme", - offload_optimizer_device="nvme", - nvme_path="/local_nvme", - ), - precision=16, - ) - trainer.fit(model) - -When offloading to NVMe you may notice that the speed is slow. There are parameters that need to be tuned based on the drives that you are using. Running the `aio_bench_perf_sweep.py `__ script can help you to find optimum parameters. See the `issue `__ for more information on how to parse the information. - -.. _deepspeed-activation-checkpointing: - -DeepSpeed Activation Checkpointing -"""""""""""""""""""""""""""""""""" - -Activation checkpointing frees activations from memory as soon as they are not needed during the forward pass. -They are then re-computed for the backwards pass as needed. - -Activation checkpointing is very useful when you have intermediate layers that produce large activations. - -This saves memory when training larger models, however requires using a checkpoint function to run modules as shown below. - -.. warning:: - - Ensure to not wrap the entire model with activation checkpointing. This is not the intended usage of activation checkpointing, and will lead to failures as seen in `this discussion `__. - -.. code-block:: python - - from pytorch_lightning import Trainer - import deepspeed - - - class MyModel(LightningModule): - ... 
- - def __init__(self): - super().__init__() - self.block_1 = nn.Sequential(nn.Linear(32, 32), nn.ReLU()) - self.block_2 = torch.nn.Linear(32, 2) - - def forward(self, x): - # Use the DeepSpeed checkpointing function instead of calling the module directly - # checkpointing self.block_1 means the activations are deleted after use, - # and re-calculated during the backward passes - x = deepspeed.checkpointing.checkpoint(self.block_1, x) - return self.block_2(x) - - -.. code-block:: python - - from pytorch_lightning import Trainer - from pytorch_lightning.strategies import DeepSpeedStrategy - import deepspeed - - - class MyModel(pl.LightningModule): - ... - - def configure_sharded_model(self): - self.block_1 = nn.Sequential(nn.Linear(32, 32), nn.ReLU()) - self.block_2 = torch.nn.Linear(32, 2) - - def forward(self, x): - # Use the DeepSpeed checkpointing function instead of calling the module directly - x = deepspeed.checkpointing.checkpoint(self.block_1, x) - return self.block_2(x) - - - model = MyModel() - - trainer = Trainer(accelerator="gpu", devices=4, strategy="deepspeed_stage_3_offload", precision=16) - - # Enable CPU Activation Checkpointing - trainer = Trainer( - accelerator="gpu", - devices=4, - strategy=DeepSpeedStrategy( - stage=3, - offload_optimizer=True, # Enable CPU Offloading - cpu_checkpointing=True, # (Optional) offload activations to CPU - ), - precision=16, - ) - trainer.fit(model) - - -.. _deepspeed-zero-stage-3-tips: - -DeepSpeed ZeRO Stage 3 Tips -""""""""""""""""""""""""""" - -Here is some helpful information when setting up DeepSpeed ZeRO Stage 3 with Lightning. - -* If you're using Adam or AdamW, ensure to use FusedAdam or DeepSpeedCPUAdam (for CPU Offloading) rather than the default torch optimizers as they come with large speed benefits -* Treat your GPU/CPU memory as one large pool. 
In some cases, you may not want to offload certain things (like activations) to provide even more space to offload model parameters -* When offloading to the CPU, make sure to bump up the batch size as GPU memory will be freed -* We also support sharded checkpointing. By passing ``save_full_weights=False`` to the ``DeepSpeedStrategy``, we'll save shards of the model which allows you to save extremely large models. However to load the model and run test/validation/predict you must use the Trainer object. - -.. _deepspeed-zero-stage-3-single-file: - -Collating Single File Checkpoint for DeepSpeed ZeRO Stage 3 -""""""""""""""""""""""""""""""""""""""""""""""""""""""""""" - -After training using ZeRO Stage 3, you'll notice that your checkpoints are a directory of sharded model and optimizer states. If you'd like to collate a single file from the checkpoint directory please use the below command, which handles all the Lightning states additionally when collating the file. - -.. code-block:: python - - from pytorch_lightning.utilities.deepspeed import convert_zero_checkpoint_to_fp32_state_dict - - # lightning deepspeed has saved a directory instead of a file - save_path = "lightning_logs/version_0/checkpoints/epoch=0-step=0.ckpt/" - output_path = "lightning_model.pt" - convert_zero_checkpoint_to_fp32_state_dict(save_path, output_path) - - -.. warning:: - - This single file checkpoint does not include the optimizer/lr-scheduler states. This means we cannot restore training via the ``trainer.fit(ckpt_path=)`` call. Ensure to keep the sharded checkpoint directory if this is required. - -Custom DeepSpeed Config -""""""""""""""""""""""" - -In some cases you may want to define your own DeepSpeed Config, to access all parameters defined. We've exposed most of the important parameters, however, there may be debugging parameters to enable. Also, DeepSpeed allows the use of custom DeepSpeed optimizers and schedulers defined within a config file that is supported. - -.. 
note:: - All strategy default parameters will be ignored when a config object is passed. - All compatible arguments can be seen in the `DeepSpeed docs `_. - -.. code-block:: python - - from pytorch_lightning import Trainer - from pytorch_lightning.strategies import DeepSpeedStrategy - - deepspeed_config = { - "zero_allow_untested_optimizer": True, - "optimizer": { - "type": "OneBitAdam", - "params": { - "lr": 3e-5, - "betas": [0.998, 0.999], - "eps": 1e-5, - "weight_decay": 1e-9, - "cuda_aware": True, - }, - }, - "scheduler": { - "type": "WarmupLR", - "params": { - "last_batch_iteration": -1, - "warmup_min_lr": 0, - "warmup_max_lr": 3e-5, - "warmup_num_steps": 100, - }, - }, - "zero_optimization": { - "stage": 2, # Enable Stage 2 ZeRO (Optimizer/Gradient state partitioning) - "offload_optimizer": True, # Enable Offloading optimizer state/calculation to the host CPU - "contiguous_gradients": True, # Reduce gradient fragmentation. - "overlap_comm": True, # Overlap reduce/backward operation of gradients for speed. - "allgather_bucket_size": 2e8, # Number of elements to all gather at once. - "reduce_bucket_size": 2e8, # Number of elements we reduce/allreduce at once. - }, - } - - model = MyModel() - trainer = Trainer(accelerator="gpu", devices=4, strategy=DeepSpeedStrategy(config=deepspeed_config), precision=16) - trainer.fit(model) - - -We support taking the config as a json formatted file: - -.. code-block:: python - - from pytorch_lightning import Trainer - from pytorch_lightning.strategies import DeepSpeedStrategy - - model = MyModel() - trainer = Trainer( - accelerator="gpu", devices=4, strategy=DeepSpeedStrategy(config="/path/to/deepspeed_config.json"), precision=16 - ) - trainer.fit(model) - - -You can also use an environment variable via your PyTorch Lightning script: - -.. code-block:: bash - - PL_DEEPSPEED_CONFIG_PATH=/path/to/deepspeed_config.json python train.py --strategy deepspeed - ----------- - -.. 
_ddp-optimizations: - -DDP Optimizations -^^^^^^^^^^^^^^^^^ - - -When Using DDP Strategies, Set find_unused_parameters=False -""""""""""""""""""""""""""""""""""""""""""""""""""""""""""" - -By default, we have set ``find_unused_parameters=True`` for compatibility reasons that have been observed in the past (refer to the `discussion `_ for more details). -When enabled, it can result in a performance hit and can be disabled in most cases. Read more about it `here `_. - -.. tip:: - It applies to all DDP strategies that support ``find_unused_parameters`` as input. - -.. code-block:: python - - from pytorch_lightning.strategies import DDPStrategy - - trainer = pl.Trainer( - accelerator="gpu", - devices=2, - strategy=DDPStrategy(find_unused_parameters=False), - ) - -.. code-block:: python - - from pytorch_lightning.strategies import DDPSpawnStrategy - - trainer = pl.Trainer( - accelerator="gpu", - devices=2, - strategy=DDPSpawnStrategy(find_unused_parameters=False), - ) - - -DDP Static Graph -"""""""""""""""" - -`DDP static graph `__ assumes that your model -employs the same set of used/unused parameters in every iteration, so that it can deterministically know the flow of -training and apply special optimizations during runtime. - -.. note:: - DDP static graph support requires PyTorch>=1.11.0 - -.. code-block:: python - - from pytorch_lightning import Trainer - from pytorch_lightning.strategies import DDPStrategy - - trainer = Trainer(devices=4, strategy=DDPStrategy(static_graph=True)) - - -When Using DDP on a Multi-node Cluster, Set NCCL Parameters -""""""""""""""""""""""""""""""""""""""""""""""""""""""""""" - -`NCCL `__ is the NVIDIA Collective Communications Library that is used by PyTorch to handle communication across nodes and GPUs. There are reported benefits in terms of speedups when adjusting NCCL parameters as seen in this `issue `__. 
In the issue, we see a 30% speed improvement when training the Transformer XLM-RoBERTa and a 15% improvement in training with Detectron2. - -NCCL parameters can be adjusted via environment variables. - -.. note:: - - AWS and GCP already set default values for these on their clusters. This is typically useful for custom cluster setups. - -* `NCCL_NSOCKS_PERTHREAD `__ -* `NCCL_SOCKET_NTHREADS `__ -* `NCCL_MIN_NCHANNELS `__ - -.. code-block:: bash - - export NCCL_NSOCKS_PERTHREAD=4 - export NCCL_SOCKET_NTHREADS=2 - - -Gradients as Bucket View -"""""""""""""""""""""""" - -Enabling ``gradient_as_bucket_view=True`` in the ``DDPStrategy`` will make the gradients views that point to different offsets of the ``allreduce`` communication buckets. See :class:`~torch.nn.parallel.DistributedDataParallel` for more information. - -This can reduce peak memory usage and improve throughput: the memory saved is equal to the total gradient memory, and it removes the need to copy gradients to the ``allreduce`` communication buckets. - -.. note:: - - When ``gradient_as_bucket_view=True`` you cannot call ``detach_()`` on gradients. If hitting such errors, please fix it by referring to the :meth:`~torch.optim.Optimizer.zero_grad` function in ``torch/optim/optimizer.py`` as a solution (`source `__). - -.. code-block:: python - - from pytorch_lightning import Trainer - from pytorch_lightning.strategies import DDPStrategy - - model = MyModel() - trainer = Trainer(accelerator="gpu", devices=4, strategy=DDPStrategy(gradient_as_bucket_view=True)) - trainer.fit(model) - -DDP Communication Hooks -""""""""""""""""""""""" - -DDP Communication hooks is an interface to control how gradients are communicated across workers, overriding the standard allreduce in DistributedDataParallel. This allows you to enable performance improving communication hooks when using multiple nodes. - -Enable `FP16 Compress Hook for multi-node throughput improvement `__: - -.. 
code-block:: python - - from pytorch_lightning import Trainer - from pytorch_lightning.strategies import DDPStrategy - from torch.distributed.algorithms.ddp_comm_hooks import default_hooks as default - - model = MyModel() - trainer = Trainer(accelerator="gpu", devices=4, strategy=DDPStrategy(ddp_comm_hook=default.fp16_compress_hook)) - trainer.fit(model) - -Enable `PowerSGD for multi-node throughput improvement `__: - -.. note:: - - PowerSGD typically requires extra memory of the same size as the model’s gradients to enable error feedback, which can compensate for biased compressed communication and improve accuracy (`source `__). - -.. code-block:: python - - from pytorch_lightning import Trainer - from pytorch_lightning.strategies import DDPStrategy - from torch.distributed.algorithms.ddp_comm_hooks import powerSGD_hook as powerSGD - - model = MyModel() - trainer = Trainer( - accelerator="gpu", - devices=4, - strategy=DDPStrategy( - ddp_comm_state=powerSGD.PowerSGDState( - process_group=None, - matrix_approximation_rank=1, - start_powerSGD_iter=5000, - ), - ddp_comm_hook=powerSGD.powerSGD_hook, - ), - ) - trainer.fit(model) - - -Combine hooks for accumulated benefit: - -.. note:: - DDP communication wrappers support requires PyTorch>=1.9.0 - -.. code-block:: python - - from pytorch_lightning import Trainer - from pytorch_lightning.strategies import DDPStrategy - from torch.distributed.algorithms.ddp_comm_hooks import ( - default_hooks as default, - powerSGD_hook as powerSGD, - ) - - model = MyModel() - trainer = Trainer( - accelerator="gpu", - devices=4, - strategy=DDPStrategy( - ddp_comm_state=powerSGD.PowerSGDState( - process_group=None, - matrix_approximation_rank=1, - start_powerSGD_iter=5000, - ), - ddp_comm_hook=powerSGD.powerSGD_hook, - ddp_comm_wrapper=default.fp16_compress_wrapper, - ), - ) - trainer.fit(model) - - -When using Post-localSGD, you must also pass ``model_averaging_period`` to allow for model parameter averaging: - -.. 
note:: - Post-localSGD support requires PyTorch>=1.10.0 - -.. code-block:: python - - from pytorch_lightning import Trainer - from pytorch_lightning.strategies import DDPStrategy - from torch.distributed.algorithms.ddp_comm_hooks import post_localSGD_hook as post_localSGD - - model = MyModel() - trainer = Trainer( - accelerator="gpu", - devices=4, - strategy=DDPStrategy( - ddp_comm_state=post_localSGD.PostLocalSGDState( - process_group=None, - subgroup=None, - start_localSGD_iter=8, - ), - ddp_comm_hook=post_localSGD.post_localSGD_hook, - model_averaging_period=4, - ), - ) - trainer.fit(model) diff --git a/source/advanced/pruning_quantization.rst b/source/advanced/pruning_quantization.rst deleted file mode 100644 index 552a96d..0000000 --- a/source/advanced/pruning_quantization.rst +++ /dev/null @@ -1,115 +0,0 @@ -.. _pruning_quantization: - -######################## -Pruning and Quantization -######################## - -Pruning and Quantization are techniques to compress model size for deployment, allowing inference speed up and energy saving without significant accuracy losses. - -******* -Pruning -******* - -.. warning:: - - Pruning is in beta and subject to change. - -Pruning is a technique which focuses on eliminating some of the model weights to reduce the model size and decrease inference requirements. - -Pruning has been shown to achieve significant efficiency improvements while minimizing the drop in model performance (prediction quality). Model pruning is recommended for cloud endpoints, deploying models on edge devices, or mobile inference (among others). - -To enable pruning during training in Lightning, simply pass in the :class:`~pytorch_lightning.callbacks.ModelPruning` callback to the Lightning Trainer. PyTorch's native pruning implementation is used under the hood. 
- -This callback supports multiple pruning functions: pass any `torch.nn.utils.prune `_ function as a string to select which weights to prune (`random_unstructured `_, `RandomStructured `_, etc) or implement your own by subclassing `BasePruningMethod `_. - -.. code-block:: python - - from pytorch_lightning.callbacks import ModelPruning - - # set the amount to be the fraction of parameters to prune - trainer = Trainer(callbacks=[ModelPruning("l1_unstructured", amount=0.5)]) - -You can also perform iterative pruning, apply the `lottery ticket hypothesis `__, and more! - -.. code-block:: python - - def compute_amount(epoch): - # the sum of all returned values need to be smaller than 1 - if epoch == 10: - return 0.5 - - elif epoch == 50: - return 0.25 - - elif 75 < epoch < 99: - return 0.01 - - - # the amount can be also be a callable - trainer = Trainer(callbacks=[ModelPruning("l1_unstructured", amount=compute_amount)]) - - -************ -Quantization -************ - -.. warning :: - Quantization is in beta and subject to change. - -Model quantization is another performance optimization technique that allows speeding up inference and decreasing memory requirements by performing computations and storing tensors at lower bitwidths (such as INT8 or FLOAT16) than floating-point precision. This is particularly beneficial during model deployment. - -Quantization Aware Training (QAT) mimics the effects of quantization during training: The computations are carried-out in floating-point precision but the subsequent quantization effect is taken into account. The weights and activations are quantized into lower precision only for inference, when training is completed. - -Quantization is useful when it is required to serve large models on machines with limited memory, or when there's a need to switch between models and reducing the I/O time is important. For example, switching between monolingual speech recognition models across multiple languages. 
- -Lightning includes :class:`~pytorch_lightning.callbacks.QuantizationAwareTraining` callback (using PyTorch's native quantization, read more `here `__), which allows creating fully quantized models (compatible with torchscript). - -.. code-block:: python - - from pytorch_lightning.callbacks import QuantizationAwareTraining - - - class RegressionModel(LightningModule): - def __init__(self): - super().__init__() - self.layer_0 = nn.Linear(16, 64) - self.layer_0a = torch.nn.ReLU() - self.layer_1 = nn.Linear(64, 64) - self.layer_1a = torch.nn.ReLU() - self.layer_end = nn.Linear(64, 1) - - def forward(self, x): - x = self.layer_0(x) - x = self.layer_0a(x) - x = self.layer_1(x) - x = self.layer_1a(x) - x = self.layer_end(x) - return x - - - trainer = Trainer(callbacks=[QuantizationAwareTraining()]) - qmodel = RegressionModel() - trainer.fit(qmodel, ...) - - batch = iter(my_dataloader()).next() - qmodel(qmodel.quant(batch[0])) - - tsmodel = qmodel.to_torchscript() - tsmodel(tsmodel.quant(batch[0])) - -You can further customize the callback: - -.. code-block:: python - - - qcb = QuantizationAwareTraining( - # specification of quant estimation quality - observer_type="histogram", - # specify which layers shall be merged together to increase efficiency - modules_to_fuse=[(f"layer_{i}", f"layer_{i}a") for i in range(2)], - # make your model compatible with all original input/outputs, in such case the model is wrapped in a shell with entry/exit layers. - input_compatible=True, - ) - - batch = iter(my_dataloader()).next() - qmodel(batch[0]) diff --git a/source/advanced/training_tricks.rst b/source/advanced/training_tricks.rst deleted file mode 100644 index a8d5c2d..0000000 --- a/source/advanced/training_tricks.rst +++ /dev/null @@ -1,356 +0,0 @@ -.. testsetup:: * - - from pytorch_lightning.callbacks import StochasticWeightAveraging - -.. 
_training_tricks: - -############################# -Effective Training Techniques -############################# - -Lightning implements various techniques that can help make training smoother. - ----------- - -******************** -Accumulate Gradients -******************** - -.. include:: ../common/gradient_accumulation.rst - ----------- - -***************** -Gradient Clipping -***************** - -Gradient clipping can be enabled to avoid exploding gradients. By default, this will clip the gradient norm by calling -:func:`torch.nn.utils.clip_grad_norm_` computed over all model parameters together. -If the Trainer's ``gradient_clip_algorithm`` is set to ``'value'`` (``'norm'`` by default), this will use -:func:`torch.nn.utils.clip_grad_value_` for each parameter instead. - -.. note:: - If using mixed precision, the ``gradient_clip_val`` does not need to be changed as the gradients are unscaled - before applying the clipping function. - -.. seealso:: :class:`~pytorch_lightning.trainer.trainer.Trainer` - -.. testcode:: - - # DEFAULT (ie: don't clip) - trainer = Trainer(gradient_clip_val=0) - - # clip gradients' global norm to <=0.5 using gradient_clip_algorithm='norm' by default - trainer = Trainer(gradient_clip_val=0.5) - - # clip gradients' maximum magnitude to <=0.5 - trainer = Trainer(gradient_clip_val=0.5, gradient_clip_algorithm="value") - -Read more about :ref:`Configuring Gradient Clipping ` for advanced use-cases. - ----------- - -*************************** -Stochastic Weight Averaging -*************************** - -Stochastic Weight Averaging (SWA) can make your models generalize better at virtually no additional cost. -This can be used with both non-trained and trained models. The SWA procedure smooths the loss landscape thus making -it harder to end up in a local minimum during optimization. - -For a more detailed explanation of SWA and how it works, -read `this post `__ by the PyTorch team. - -.. 
seealso:: The :class:`~pytorch_lightning.callbacks.StochasticWeightAveraging` callback - -.. testcode:: - - # Enable Stochastic Weight Averaging using the callback - trainer = Trainer(callbacks=[StochasticWeightAveraging(swa_lrs=1e-2)]) - ----------- - -***************** -Batch Size Finder -***************** - -Auto-scaling of batch size can be enabled to find the largest batch size that fits into -memory. Large batch size often yields a better estimation of the gradients, but may also result in -longer training time. Inspired by https://github.com/BlackHC/toma. - -.. seealso:: :class:`~pytorch_lightning.trainer.trainer.Trainer` - -.. code-block:: python - - # DEFAULT (ie: don't scale batch size automatically) - trainer = Trainer(auto_scale_batch_size=None) - - # Autoscale batch size - trainer = Trainer(auto_scale_batch_size=None | "power" | "binsearch") - - # Find the batch size - trainer.tune(model) - -Currently, this feature supports two modes ``'power'`` scaling and ``'binsearch'`` -scaling. In ``'power'`` scaling, starting from a batch size of 1 keeps doubling -the batch size until an out-of-memory (OOM) error is encountered. Setting the -argument to ``'binsearch'`` will initially also try doubling the batch size until -it encounters an OOM, after which it will do a binary search that will finetune the -batch size. Additionally, it should be noted that the batch size scaler cannot -search for batch sizes larger than the size of the training dataset. - - -.. note:: - - This feature expects that a ``batch_size`` field is either located as a model attribute - i.e. ``model.batch_size`` or as a field in your ``hparams`` i.e. ``model.hparams.batch_size``. - Similarly it can work with datamodules too. The field should exist and will be updated by - the results of this algorithm. Additionally, your ``train_dataloader()`` method should depend - on this field for this feature to work i.e. - - .. 
code-block:: python - - # using LightningModule - class LitModel(LightningModule): - def __init__(self, batch_size): - super().__init__() - self.save_hyperparameters() - # or - self.batch_size = batch_size - - def train_dataloader(self): - return DataLoader(train_dataset, batch_size=self.batch_size | self.hparams.batch_size) - - - trainer = Trainer(...) - model = LitModel(batch_size=32) - trainer.tune(model) - - # using LightningDataModule - class LitDataModule(LightningDataModule): - def __init__(self, batch_size): - super().__init__() - self.save_hyperparameters() - # or - self.batch_size = batch_size - - def train_dataloader(self): - return DataLoader(train_dataset, batch_size=self.batch_size | self.hparams.batch_size) - - - trainer = Trainer(...) - model = MyModel() - datamodule = LitDataModule(batch_size=32) - trainer.tune(model, datamodule=datamodule) - -.. warning:: - - Due to the constraints listed above, this feature does *NOT* work when passing dataloaders directly - to ``.fit()``. - -The scaling algorithm has a number of parameters that the user can control by -invoking the :meth:`~pytorch_lightning.tuner.tuning.Tuner.scale_batch_size` method: - -.. code-block:: python - - # Use default in trainer construction - trainer = Trainer() - tuner = Tuner(trainer) - - # Invoke method - new_batch_size = tuner.scale_batch_size(model, *extra_parameters_here) - - # Override old batch size (this is done automatically) - model.hparams.batch_size = new_batch_size - - # Fit as normal - trainer.fit(model) - -The algorithm in short works by: - 1. Dumping the current state of the model and trainer - 2. Iteratively until convergence or maximum number of tries ``max_trials`` (default 25) has been reached: - - Call ``fit()`` method of trainer. This evaluates ``steps_per_trial`` (default 3) number of - optimization steps. Each training step can trigger an OOM error if the tensors - (training batch, weights, gradients, etc.)
allocated during the steps have a - too large memory footprint. - - If an OOM error is encountered, decrease batch size else increase it. - How much the batch size is increased/decreased is determined by the chosen - strategy. - 3. The found batch size is saved to either ``model.batch_size`` or ``model.hparams.batch_size`` - 4. Restore the initial state of model and trainer - -.. warning:: Batch size finder is not yet supported for DDP or any of its variations, it is coming soon. - ----------- - -.. _learning_rate_finder: - -******************** -Learning Rate Finder -******************** - -.. raw:: html - - - -| - -For training deep neural networks, selecting a good learning rate is essential -for both better performance and faster convergence. Even optimizers such as -:class:`~torch.optim.Adam` that are self-adjusting the learning rate can benefit from more optimal -choices. - -To reduce the amount of guesswork concerning choosing a good initial learning -rate, a `learning rate finder` can be used. As described in `this paper `_ -a learning rate finder does a small run where the learning rate is increased -after each processed batch and the corresponding loss is logged. The result of -this is a ``lr`` vs. ``loss`` plot that can be used as guidance for choosing an optimal -initial learning rate. - -.. warning:: - - For the moment, this feature only works with models having a single optimizer. - LR Finder support for DDP and any of its variations is not implemented yet. It is coming soon. - - -Using Lightning's built-in LR finder -==================================== - -To enable the learning rate finder, your :doc:`lightning module <../common/lightning_module>` needs to -have a ``learning_rate`` or ``lr`` attribute (or as a field in your ``hparams`` i.e. -``hparams.learning_rate`` or ``hparams.lr``). Then, set ``Trainer(auto_lr_find=True)`` -during trainer construction, and then call ``trainer.tune(model)`` to run the LR finder. 
-The suggested ``learning_rate`` will be written to the console and will be automatically -set to your :doc:`lightning module <../common/lightning_module>`, which can be accessed -via ``self.learning_rate`` or ``self.lr``. - -.. seealso:: :ref:`trainer.tune `. - -.. code-block:: python - - class LitModel(LightningModule): - def __init__(self, learning_rate): - super().__init__() - self.learning_rate = learning_rate - self.model = Model(...) - - def configure_optimizers(self): - return Adam(self.parameters(), lr=(self.lr or self.learning_rate)) - - - model = LitModel() - - # finds learning rate automatically - # sets hparams.lr or hparams.learning_rate to that learning rate - trainer = Trainer(auto_lr_find=True) - - trainer.tune(model) - -If your model is using an arbitrary value instead of ``self.lr`` or ``self.learning_rate``, set that value as ``auto_lr_find``: - -.. code-block:: python - - model = LitModel() - - # to set to your own hparams.my_value - trainer = Trainer(auto_lr_find="my_value") - - trainer.tune(model) - -You can also inspect the results of the learning rate finder or just play around -with the parameters of the algorithm. This can be done by invoking the -:meth:`~pytorch_lightning.tuner.tuning.Tuner.lr_find` method. A typical example of this would look like: - -.. code-block:: python - - model = MyModelClass(hparams) - trainer = Trainer() - - # Run learning rate finder - lr_finder = trainer.tuner.lr_find(model) - - # Results can be found in - print(lr_finder.results) - - # Plot with - fig = lr_finder.plot(suggest=True) - fig.show() - - # Pick point based on plot, or get suggestion - new_lr = lr_finder.suggestion() - - # update hparams of the model - model.hparams.lr = new_lr - - # Fit model - trainer.fit(model) - -The figure produced by ``lr_finder.plot()`` should look something like the figure -below. 
It is recommended to not pick the learning rate that achieves the lowest -loss, but instead something in the middle of the sharpest downward slope (red point). -This is the point returned by ``lr_finder.suggestion()``. - -.. figure:: ../_static/images/trainer/lr_finder.png - ----------- - -************************** -Advanced GPU Optimizations -************************** - -When training on single or multiple GPU machines, Lightning offers a host of advanced optimizations to improve throughput, memory efficiency, and model scaling. -Refer to :doc:`Advanced GPU Optimized Training <../advanced/model_parallel>` for more details. - ----------- - - -.. _ddp_spawn_shared_memory: - -****************************************** -Sharing Datasets Across Process Boundaries -****************************************** - -The :class:`~pytorch_lightning.core.datamodule.LightningDataModule` class provides an organized way to decouple data loading from training logic, with :meth:`~pytorch_lightning.core.hooks.DataHooks.prepare_data` being used for downloading and pre-processing the dataset on a single process, and :meth:`~pytorch_lightning.core.hooks.DataHooks.setup` loading the pre-processed data for each process individually: - -.. code-block:: python - - class MNISTDataModule(pl.LightningDataModule): - def prepare_data(self): - MNIST(self.data_dir, download=True) - - def setup(self, stage: Optional[str] = None): - self.mnist = MNIST(self.data_dir) - - def train_loader(self): - return DataLoader(self.mnist, batch_size=128) - -However, for in-memory datasets, that means that each process will hold a (redundant) replica of the dataset in memory, which may be impractical when using many processes while utilizing datasets that nearly fit into CPU memory, as the memory consumption will scale up linearly with the number of processes.
-For example, when training Graph Neural Networks, a common strategy is to load the entire graph into CPU memory for fast access to the entire graph structure and its features, and to then perform neighbor sampling to obtain mini-batches that fit onto the GPU. - -A simple way to prevent redundant dataset replicas is to rely on :obj:`torch.multiprocessing` to share the `data automatically between spawned processes via shared memory `_. -For this, all data pre-loading should be done on the main process inside :meth:`DataModule.__init__`. As a result, all tensor-data will get automatically shared when using the :class:`~pytorch_lightning.plugins.strategies.ddp_spawn.DDPSpawnStrategy` strategy. - -.. warning:: - - :obj:`torch.multiprocessing` will send a handle of each individual tensor to other processes. - In order to prevent any errors due to too many open file handles, try to reduce the number of tensors to share, *e.g.*, by stacking your data into a single tensor. - -.. code-block:: python - - class MNISTDataModule(pl.LightningDataModule): - def __init__(self, data_dir: str): - self.mnist = MNIST(data_dir, download=True, transform=T.ToTensor()) - - def train_loader(self): - return DataLoader(self.mnist, batch_size=128) - - - model = Model(...) - datamodule = MNISTDataModule("data/MNIST") - - trainer = Trainer(accelerator="gpu", devices=2, strategy="ddp_spawn") - trainer.fit(model, datamodule) - -See the `graph-level `_ and `node-level `_ prediction examples in PyTorch Geometric for practical use-cases. diff --git a/source/benchmarking/benchmarks.rst b/source/benchmarking/benchmarks.rst deleted file mode 100644 index af9715f..0000000 --- a/source/benchmarking/benchmarks.rst +++ /dev/null @@ -1,19 +0,0 @@ -:orphan: - -Benchmark with vanilla PyTorch -============================== - -In this section we set grounds for comparison between vanilla PyTorch and PT Lightning for most common scenarios. 
- -Time comparison ---------------- - -We have set up regular benchmarking against a vanilla PyTorch training loop with an RNN and a simple MNIST classifier as part of our CI. -On average, for the simple MNIST CNN classifier we are only about 0.06s slower per epoch; see the detailed chart below. - -.. figure:: ../_static/images/benchmarks/figure-parity-times.png - :alt: Speed parity to vanilla PT, created on 2020-12-16 - :width: 500 - - -Learn more about reproducible benchmarking from the `PyTorch Reproducibility Guide `__. diff --git a/source/cli/lightning_cli.rst b/source/cli/lightning_cli.rst deleted file mode 100644 index 76f3f12..0000000 --- a/source/cli/lightning_cli.rst +++ /dev/null @@ -1,94 +0,0 @@ -:orphan: - -.. _lightning-cli: - -############################ -Eliminate config boilerplate -############################ - -********* -Basic use -********* - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: 1: Control it all from the CLI - :description: Learn to control a LightningModule and LightningDataModule from the CLI - :col_css: col-md-4 - :button_link: lightning_cli_intermediate.html - :height: 150 - :tag: intermediate - -.. displayitem:: - :header: 2: Mix models and datasets - :description: Register models, datasets, optimizers and learning rate schedulers - :col_css: col-md-4 - :button_link: lightning_cli_intermediate_2.html - :height: 150 - :tag: intermediate - -.. displayitem:: - :header: 3: Control it all via YAML - :description: Enable composable YAMLs - :col_css: col-md-4 - :button_link: lightning_cli_advanced.html - :height: 150 - :tag: advanced - -.. raw:: html - -
-
- ----- - -************ -Advanced use -************ - -.. raw:: html - -
-
- -.. displayitem:: - :header: YAML for production - :description: Use the Lightning CLI with YAMLs for production environments - :col_css: col-md-6 - :button_link: lightning_cli_advanced_2.html - :height: 150 - :tag: advanced - -.. displayitem:: - :header: Customize configs for complex projects - :description: Learn how to connect complex projects with each Registry. - :col_css: col-md-6 - :button_link: lightning_cli_advanced_3.html - :height: 150 - :tag: expert - -.. displayitem:: - :header: Extend the Lightning CLI - :description: Customize the Lightning CLI - :col_css: col-md-6 - :button_link: lightning_cli_expert.html - :height: 150 - :tag: expert - -.. displayitem:: - :header: FAQ - :description: Frequently asked questions about working with the Lightning CLI and YAML files - :col_css: col-md-6 - :button_link: lightning_cli_faq.html - :height: 150 - -.. raw:: html - -
-
diff --git a/source/cli/lightning_cli_advanced.rst b/source/cli/lightning_cli_advanced.rst deleted file mode 100644 index 2d4f330..0000000 --- a/source/cli/lightning_cli_advanced.rst +++ /dev/null @@ -1,113 +0,0 @@ -:orphan: - -####################################### -Eliminate config boilerplate (Advanced) -####################################### -**Audience:** Users looking to modularize their code for a professional project. - -**Pre-reqs:** You must have read :doc:`(Control it all from the CLI) `. - ----- - -*************************** -What is a yaml config file? -*************************** -A yaml is a standard configuration file that describes parameters for sections of a program. It is a common tool in engineering, and it has recently started to gain popularity in machine learning. - -.. code:: yaml - - # file.yaml - car: - max_speed:100 - max_passengers:2 - plane: - fuel_capacity: 50 - class_3: - option_1: 'x' - option_2: 'y' - ----- - - -********************* -Print the config used -********************* -Before or after you run a training routine, you can print the full training spec in yaml format using ``--print_config``: - -.. code:: bash - - python main.py fit --print_config - -which generates the following config: - -.. code:: bash - - seed_everything: null - trainer: - logger: true - ... - terminate_on_nan: null - model: - out_dim: 10 - learning_rate: 0.02 - data: - data_dir: ./ - ckpt_path: null - ----- - -******************************** -Write a config yaml from the CLI -******************************** -To have a copy of the configuration that produced this model, save a *yaml* file from the *--print_config* outputs: - -.. code:: bash - - python main.py fit --model.learning_rate 0.001 --print_config > config.yaml - ----- - -********************** -Run from a single yaml -********************** -To run from a yaml, pass a yaml produced with ``--print_config`` to the ``--config`` argument: - -.. 
code:: bash - - python main.py fit --config config.yaml - -when using a yaml to run, you can still pass in inline arguments - -.. code:: bash - - python main.py fit --config config.yaml --trainer.max_epochs 100 - ----- - -****************** -Compose yaml files -****************** -For production or complex research projects it's advisable to have each object in its own config file. To compose all the configs, pass them all inline: - -.. code-block:: bash - - $ python trainer.py fit --config trainer.yaml --config datamodules.yaml --config models.yaml ... - -The configs will be parsed sequentially. Let's say we have two configs with the same args: - -.. code:: yaml - - # trainer.yaml - trainer: - num_epochs: 10 - - - # trainer_2.yaml - trainer: - num_epochs: 20 - -the ones from the last config will be used (num_epochs = 20) in this case: - -.. code-block:: bash - - $ python trainer.py fit --config trainer.yaml --config trainer_2.yaml diff --git a/source/cli/lightning_cli_advanced_2.rst b/source/cli/lightning_cli_advanced_2.rst deleted file mode 100644 index 0474699..0000000 --- a/source/cli/lightning_cli_advanced_2.rst +++ /dev/null @@ -1,207 +0,0 @@ -:orphan: - -.. 
testsetup:: * - :skipif: not _JSONARGPARSE_AVAILABLE - - import torch - from unittest import mock - from typing import List - import pytorch_lightning as pl - from pytorch_lightning import LightningModule, LightningDataModule, Trainer, Callback - - - class NoFitTrainer(Trainer): - def fit(self, *_, **__): - pass - - - class LightningCLI(pl.utilities.cli.LightningCLI): - def __init__(self, *args, trainer_class=NoFitTrainer, run=False, **kwargs): - super().__init__(*args, trainer_class=trainer_class, run=run, **kwargs) - - - class MyModel(LightningModule): - def __init__( - self, - encoder_layers: int = 12, - decoder_layers: List[int] = [2, 4], - batch_size: int = 8, - ): - pass - - - class MyDataModule(LightningDataModule): - def __init__(self, batch_size: int = 8): - self.num_classes = 5 - - - mock_argv = mock.patch("sys.argv", ["any.py"]) - mock_argv.start() - -.. testcleanup:: * - - mock_argv.stop() - -####################################### -Eliminate config boilerplate (Advanced) -####################################### - -****************************** -Customize arguments by command -****************************** -To customize arguments by subcommand, pass the config *before* the subcommand: - -.. code-block:: bash - - $ python main.py [before] [subcommand] [after] - $ python main.py ... fit ... - -For example, here we set the Trainer argument [max_steps = 100] for the full training routine and [max_epochs = 10] for testing: - -.. code-block:: bash - - # config1.yaml - fit: - trainer: - max_steps: 100 - test: - trainer: - max_epochs: 10 - -now you can toggle this behavior by subcommand: - -.. code-block:: bash - - # full routine with max_steps = 100 - $ python main.py --config config1.yaml fit - - # test only with max_epochs = 10 - $ python main.py --config config1.yaml test - ----- - -********************* -Use groups of options -********************* -Groups of options can also be given as independent config files: - -.. 
code-block:: bash - - $ python trainer.py fit --trainer trainer.yaml --model model.yaml --data data.yaml [...] - ----- - -*************************** -Run from cloud yaml configs -*************************** -For certain enterprise workloads, Lightning CLI supports running from hosted configs: - -.. code-block:: bash - - $ python trainer.py [subcommand] --config s3://bucket/config.yaml - -For more options, refer to :doc:`Remote filesystems <../common/remote_fs>`. - ----- - -************************************** -Use a config via environment variables -************************************** -For certain CI/CD systems, it's useful to pass in config files as environment variables: - -.. code-block:: bash - - $ python trainer.py fit --trainer "$TRAINER_CONFIG" --model "$MODEL_CONFIG" [...] - ----- - -*************************************** -Run from environment variables directly -*************************************** -The Lightning CLI can convert every possible CLI flag into an environment variable. To enable this, set the *env_parse* argument: - -.. code:: python - - LightningCLI(env_parse=True) - -now use the ``--help`` CLI flag with any subcommand: - -.. code:: bash - - $ python main.py fit --help - -which will show you ALL possible environment variables you can now set: - -.. code:: bash - - usage: main.py [options] fit [-h] [-c CONFIG] - [--trainer.max_epochs MAX_EPOCHS] [--trainer.min_epochs MIN_EPOCHS] - [--trainer.max_steps MAX_STEPS] [--trainer.min_steps MIN_STEPS] - ... - [--ckpt_path CKPT_PATH] - - optional arguments: - ... - --model CONFIG Path to a configuration file. - --model.out_dim OUT_DIM - (type: int, default: 10) - --model.learning_rate LEARNING_RATE - (type: float, default: 0.02) - -now you can customize the behavior via environment variables: - -.. 
code:: bash - - # set the options via env vars - $ export LEARNING_RATE=0.01 - $ export OUT_DIM=5 - - $ python main.py fit - ----- - -************************ -Set default config files -************************ -To set a path to a config file of defaults, use the ``default_config_files`` argument: - -.. testcode:: - - cli = LightningCLI(MyModel, MyDataModule, parser_kwargs={"default_config_files": ["my_cli_defaults.yaml"]}) - -or if you want defaults per subcommand: - -.. testcode:: - - cli = LightningCLI(MyModel, MyDataModule, parser_kwargs={"fit": {"default_config_files": ["my_fit_defaults.yaml"]}}) - -For more configuration options, refer to the `ArgumentParser API -`_ documentation. - ----- - -***************************** -Enable variable interpolation -***************************** -In certain cases where multiple configs need to share variables, consider using variable interpolation. Variable interpolation -allows you to add variables to your yaml configs like so: - -.. code-block:: yaml - - model: - encoder_layers: 12 - decoder_layers: - - ${model.encoder_layers} - - 4 - -To enable variable interpolation, first install omegaconf: - -.. code:: bash - - pip install omegaconf - -Once this is installed, the Lightning CLI will automatically handle variables in yaml files: - -.. code:: bash - - python main.py --model.encoder_layers=12 diff --git a/source/cli/lightning_cli_advanced_3.rst b/source/cli/lightning_cli_advanced_3.rst deleted file mode 100644 index 2eeae17..0000000 --- a/source/cli/lightning_cli_advanced_3.rst +++ /dev/null @@ -1,415 +0,0 @@ -:orphan: - -.. 
testsetup:: * - :skipif: not _JSONARGPARSE_AVAILABLE - - import torch - from unittest import mock - from typing import List - import pytorch_lightning as pl - from pytorch_lightning import LightningModule, LightningDataModule, Trainer, Callback - - - class NoFitTrainer(Trainer): - def fit(self, *_, **__): - pass - - - class LightningCLI(pl.utilities.cli.LightningCLI): - def __init__(self, *args, trainer_class=NoFitTrainer, run=False, **kwargs): - super().__init__(*args, trainer_class=trainer_class, run=run, **kwargs) - - - class MyModel(LightningModule): - def __init__( - self, - encoder_layers: int = 12, - decoder_layers: List[int] = [2, 4], - batch_size: int = 8, - ): - pass - - - class MyDataModule(LightningDataModule): - def __init__(self, batch_size: int = 8): - self.num_classes = 5 - - - MyModelBaseClass = MyModel - MyDataModuleBaseClass = MyDataModule - - mock_argv = mock.patch("sys.argv", ["any.py"]) - mock_argv.start() - -.. testcleanup:: * - - mock_argv.stop() - -Instantiation only mode -^^^^^^^^^^^^^^^^^^^^^^^ - -The CLI is designed to start fitting with minimal code changes. On class instantiation, the CLI will automatically -call the trainer function associated with the subcommand provided so you don't have to do it. -To avoid this, you can set the following argument: - -.. testcode:: - - cli = LightningCLI(MyModel, run=False) # True by default - # you'll have to call fit yourself: - cli.trainer.fit(cli.model) - -In this mode, there are no subcommands added to the parser. -This can be useful to implement custom logic without having to subclass the CLI, but still using the CLI's instantiation -and argument parsing capabilities. - - -Subclass registration -^^^^^^^^^^^^^^^^^^^^^ - -To use shorthand notation, the options need to be registered beforehand. This can be easily done with: - -.. 
code-block:: - - LightningCLI(auto_registry=True) # False by default - -which will register all subclasses of :class:`torch.optim.Optimizer`, :class:`torch.optim.lr_scheduler._LRScheduler`, -:class:`~pytorch_lightning.core.lightning.LightningModule`, -:class:`~pytorch_lightning.core.datamodule.LightningDataModule`, :class:`~pytorch_lightning.callbacks.Callback`, and -:class:`~pytorch_lightning.loggers.LightningLoggerBase` across all imported modules. This includes those in your own -code. - -Alternatively, if this is left unset, only the subclasses defined in PyTorch's :class:`torch.optim.Optimizer`, -:class:`torch.optim.lr_scheduler._LRScheduler` and Lightning's :class:`~pytorch_lightning.callbacks.Callback` and -:class:`~pytorch_lightning.loggers.LightningLoggerBase` subclasses will be registered. - -In subsequent sections, we will go over adding specific classes to specific registries as well as how to use -shorthand notation. - - -Trainer Callbacks and arguments with class type -^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ - -A very important argument of the :class:`~pytorch_lightning.trainer.trainer.Trainer` class is the :code:`callbacks`. In -contrast to other more simple arguments which just require numbers or strings, :code:`callbacks` expects a list of -instances of subclasses of :class:`~pytorch_lightning.callbacks.Callback`. To specify this kind of argument in a config -file, each callback must be given as a dictionary including a :code:`class_path` entry with an import path of the class, -and optionally an :code:`init_args` entry with arguments required to instantiate it. Therefore, a simple configuration -file example that defines a couple of callbacks is the following: - -.. code-block:: yaml - - trainer: - callbacks: - - class_path: pytorch_lightning.callbacks.EarlyStopping - init_args: - patience: 5 - - class_path: pytorch_lightning.callbacks.LearningRateMonitor - init_args: - ...
- -Similar to the callbacks, any arguments in :class:`~pytorch_lightning.trainer.trainer.Trainer` and user extended -:class:`~pytorch_lightning.core.lightning.LightningModule` and -:class:`~pytorch_lightning.core.datamodule.LightningDataModule` classes that have as type hint a class can be configured -the same way using :code:`class_path` and :code:`init_args`. - -For callbacks in particular, Lightning simplifies the command line so that only -the :class:`~pytorch_lightning.callbacks.Callback` name is required. -The argument's order matters and the user needs to pass the arguments in the following way. - -.. code-block:: bash - - $ python ... \ - --trainer.callbacks={CALLBACK_1_NAME} \ - --trainer.callbacks.{CALLBACK_1_ARGS_1}=... \ - --trainer.callbacks.{CALLBACK_1_ARGS_2}=... \ - ... - --trainer.callbacks={CALLBACK_N_NAME} \ - --trainer.callbacks.{CALLBACK_N_ARGS_1}=... \ - ... - -Here is an example: - -.. code-block:: bash - - $ python ... \ - --trainer.callbacks=EarlyStopping \ - --trainer.callbacks.patience=5 \ - --trainer.callbacks=LearningRateMonitor \ - --trainer.callbacks.logging_interval=epoch - -Lightning provides a mechanism for you to add your own callbacks and benefit from the command line simplification -as described above: - -.. code-block:: python - - from pytorch_lightning.utilities.cli import CALLBACK_REGISTRY - - - @CALLBACK_REGISTRY - class CustomCallback(Callback): - ... - - - cli = LightningCLI(...) - -.. code-block:: bash - - $ python ... --trainer.callbacks=CustomCallback ... - -.. note:: - - This shorthand notation is only supported in the shell and not inside a configuration file. The configuration file - generated by calling the previous command with ``--print_config`` will have the ``class_path`` notation. - - .. code-block:: yaml - - trainer: - callbacks: - - class_path: your_class_path.CustomCallback - init_args: - ... - - -.. 
tip:: - - ``--trainer.logger`` also supports shorthand notation and a ``LOGGER_REGISTRY`` is available to register custom - Loggers. - - -Multiple models and/or datasets -^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ - -Additionally, the tool can be configured such that a model and/or a datamodule is -specified by an import path and init arguments. For example, with a tool implemented as: - -.. code-block:: python - - cli = LightningCLI(MyModelBaseClass, MyDataModuleBaseClass, subclass_mode_model=True, subclass_mode_data=True) - -A possible config file could be as follows: - -.. code-block:: yaml - - model: - class_path: mycode.mymodels.MyModel - init_args: - decoder_layers: - - 2 - - 4 - encoder_layers: 12 - data: - class_path: mycode.mydatamodules.MyDataModule - init_args: - ... - trainer: - callbacks: - - class_path: pytorch_lightning.callbacks.EarlyStopping - init_args: - patience: 5 - ... - -Only model classes that are a subclass of :code:`MyModelBaseClass` would be allowed, and similarly only subclasses of -:code:`MyDataModuleBaseClass`. If as base classes :class:`~pytorch_lightning.core.lightning.LightningModule` and -:class:`~pytorch_lightning.core.datamodule.LightningDataModule` are given, then the tool would allow any lightning -module and data module. - -.. tip:: - - Note that with the subclass modes the :code:`--help` option does not show information for a specific subclass. To - get help for a subclass the options :code:`--model.help` and :code:`--data.help` can be used, followed by the - desired class path. Similarly :code:`--print_config` does not include the settings for a particular subclass. To - include them the class path should be given before the :code:`--print_config` option. Examples for both help and - print config are: - - .. 
code-block:: bash - - $ python trainer.py fit --model.help mycode.mymodels.MyModel - $ python trainer.py fit --model mycode.mymodels.MyModel --print_config - - -Models with multiple submodules -^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ - -Many use cases require to have several modules each with its own configurable options. One possible way to handle this -with LightningCLI is to implement a single module having as init parameters each of the submodules. Since the init -parameters have as type a class, then in the configuration these would be specified with :code:`class_path` and -:code:`init_args` entries. For instance a model could be implemented as: - -.. testcode:: - - class MyMainModel(LightningModule): - def __init__(self, encoder: nn.Module, decoder: nn.Module): - """Example encoder-decoder submodules model - - Args: - encoder: Instance of a module for encoding - decoder: Instance of a module for decoding - """ - super().__init__() - self.encoder = encoder - self.decoder = decoder - -If the CLI is implemented as :code:`LightningCLI(MyMainModel)` the configuration would be as follows: - -.. code-block:: yaml - - model: - encoder: - class_path: mycode.myencoders.MyEncoder - init_args: - ... - decoder: - class_path: mycode.mydecoders.MyDecoder - init_args: - ... - -It is also possible to combine :code:`subclass_mode_model=True` and submodules, thereby having two levels of -:code:`class_path`. - - -Class type defaults -^^^^^^^^^^^^^^^^^^^ - -The support for classes as type hints allows to try many possibilities with the same CLI. This is a useful feature, but -it can make it tempting to use an instance of a class as a default. For example: - -.. code-block:: - - class MyMainModel(LightningModule): - def __init__( - self, - backbone: torch.nn.Module = MyModel(encoder_layers=24), # BAD PRACTICE! - ): - super().__init__() - self.backbone = backbone - -Normally classes are mutable as it is in this case. 
The instance of :code:`MyModel` would be created the moment that the -module that defines :code:`MyMainModel` is first imported. This means that the default of :code:`backbone` will be -initialized before the CLI class runs :code:`seed_everything` making it non-reproducible. Furthermore, if -:code:`MyMainModel` is used more than once in the same Python process and the :code:`backbone` parameter is not -overridden, the same instance would be used in multiple places which very likely is not what the developer intended. -Having an instance as default also makes it impossible to generate the complete config file since for arbitrary classes -it is not known which arguments were used to instantiate it. - -A good solution to these problems is to not have a default or set the default to a special value (e.g. a -string) which would be checked in the init and instantiated accordingly. If a class parameter has no default and the CLI -is subclassed then a default can be set as follows: - -.. testcode:: - - default_backbone = { - "class_path": "import.path.of.MyModel", - "init_args": { - "encoder_layers": 24, - }, - } - - - class MyLightningCLI(LightningCLI): - def add_arguments_to_parser(self, parser): - parser.set_defaults({"model.backbone": default_backbone}) - -A more compact version that avoids writing a dictionary would be: - -.. testcode:: - - from jsonargparse import lazy_instance - - - class MyLightningCLI(LightningCLI): - def add_arguments_to_parser(self, parser): - parser.set_defaults({"model.backbone": lazy_instance(MyModel, encoder_layers=24)}) - -Optimizers -^^^^^^^^^^ - -If you will not be changing the class, you can manually add the arguments for specific optimizers and/or -learning rate schedulers by subclassing the CLI. This has the advantage of providing the proper help message for those -classes. The following code snippet shows how to implement it: - -.. 
testcode:: - - class MyLightningCLI(LightningCLI): - def add_arguments_to_parser(self, parser): - parser.add_optimizer_args(torch.optim.Adam) - parser.add_lr_scheduler_args(torch.optim.lr_scheduler.ExponentialLR) - -With this, in the config the :code:`optimizer` and :code:`lr_scheduler` groups would accept all of the options for the -given classes, in this example :code:`Adam` and :code:`ExponentialLR`. -Therefore, the config file would be structured like: - -.. code-block:: yaml - - optimizer: - lr: 0.01 - lr_scheduler: - gamma: 0.2 - model: - ... - trainer: - ... - -Where the arguments can be passed directly through command line without specifying the class. For example: - -.. code-block:: bash - - $ python trainer.py fit --optimizer.lr=0.01 --lr_scheduler.gamma=0.2 - -The automatic implementation of :code:`configure_optimizers` can be disabled by linking the configuration group. An -example can be when one wants to add support for multiple optimizers: - -.. code-block:: python - - from pytorch_lightning.utilities.cli import instantiate_class - - - class MyModel(LightningModule): - def __init__(self, optimizer1_init: dict, optimizer2_init: dict): - super().__init__() - self.optimizer1_init = optimizer1_init - self.optimizer2_init = optimizer2_init - - def configure_optimizers(self): - optimizer1 = instantiate_class(self.parameters(), self.optimizer1_init) - optimizer2 = instantiate_class(self.parameters(), self.optimizer2_init) - return [optimizer1, optimizer2] - - - class MyLightningCLI(LightningCLI): - def add_arguments_to_parser(self, parser): - parser.add_optimizer_args( - OPTIMIZER_REGISTRY.classes, nested_key="gen_optimizer", link_to="model.optimizer1_init" - ) - parser.add_optimizer_args( - OPTIMIZER_REGISTRY.classes, nested_key="gen_discriminator", link_to="model.optimizer2_init" - ) - - - cli = MyLightningCLI(MyModel) - -The value given to :code:`optimizer*_init` will always be a dictionary including :code:`class_path` and -:code:`init_args` entries. 
The function :func:`~pytorch_lightning.utilities.cli.instantiate_class` -takes care of importing the class defined in :code:`class_path` and instantiating it using some positional arguments, -in this case :code:`self.parameters()`, and the :code:`init_args`. -Any number of optimizers and learning rate schedulers can be added when using :code:`link_to`. - -With shorthand notation: - -.. code-block:: bash - - $ python trainer.py fit \ - --gen_optimizer=Adam \ - --gen_optimizer.lr=0.01 \ - --gen_discriminator=AdamW \ - --gen_discriminator.lr=0.0001 - -You can also pass the class path directly, for example, if the optimizer hasn't been registered to the -``OPTIMIZER_REGISTRY``: - -.. code-block:: bash - - $ python trainer.py fit \ - --gen_optimizer.class_path=torch.optim.Adam \ - --gen_optimizer.init_args.lr=0.01 \ - --gen_discriminator.class_path=torch.optim.AdamW \ - --gen_discriminator.init_args.lr=0.0001 diff --git a/source/cli/lightning_cli_expert.rst b/source/cli/lightning_cli_expert.rst deleted file mode 100644 index dbd6061..0000000 --- a/source/cli/lightning_cli_expert.rst +++ /dev/null @@ -1,266 +0,0 @@ -:orphan: - -.. 
testsetup:: * - :skipif: not _JSONARGPARSE_AVAILABLE - - import torch - from unittest import mock - from typing import List - import pytorch_lightning as pl - from pytorch_lightning import LightningModule, LightningDataModule, Trainer, Callback - - - class NoFitTrainer(Trainer): - def fit(self, *_, **__): - pass - - - class LightningCLI(pl.utilities.cli.LightningCLI): - def __init__(self, *args, trainer_class=NoFitTrainer, run=False, **kwargs): - super().__init__(*args, trainer_class=trainer_class, run=run, **kwargs) - - - class MyModel(LightningModule): - def __init__( - self, - encoder_layers: int = 12, - decoder_layers: List[int] = [2, 4], - batch_size: int = 8, - ): - pass - - - class MyClassModel(LightningModule): - def __init__(self, num_classes: int): - pass - - - class MyDataModule(LightningDataModule): - def __init__(self, batch_size: int = 8): - self.num_classes = 5 - - - def send_email(address, message): - pass - - - mock_argv = mock.patch("sys.argv", ["any.py"]) - mock_argv.start() - -.. testcleanup:: * - - mock_argv.stop() - -####################################### -Eliminate config boilerplate (Advanced) -####################################### -**Audience:** Users who already understand the LightningCLI and want to customize it. - ----- - -************************** -Customize the LightningCLI -************************** - -The init parameters of the :class:`~pytorch_lightning.utilities.cli.LightningCLI` class can be used to customize some -things, namely: the description of the tool, enabling parsing of environment variables and additional arguments to -instantiate the trainer and configuration parser. - -Nevertheless the init arguments are not enough for many use cases. For this reason the class is designed so that can be -extended to customize different parts of the command line tool. 
The argument parser class used by -:class:`~pytorch_lightning.utilities.cli.LightningCLI` is -:class:`~pytorch_lightning.utilities.cli.LightningArgumentParser` which is an extension of Python's argparse, thus -adding arguments can be done using the :func:`add_argument` method. In contrast to argparse it has additional methods to -add arguments, for example :func:`add_class_arguments` adds all arguments from the init of a class, though requiring -parameters to have type hints. For more details about this please refer to the `respective documentation -<https://jsonargparse.readthedocs.io/en/stable/#classes-methods-and-functions>`_. - -The :class:`~pytorch_lightning.utilities.cli.LightningCLI` class has the -:meth:`~pytorch_lightning.utilities.cli.LightningCLI.add_arguments_to_parser` method which can be implemented to include -more arguments. After parsing, the configuration is stored in the :code:`config` attribute of the class instance. The -:class:`~pytorch_lightning.utilities.cli.LightningCLI` class also has two methods that can be used to run code before -and after the trainer runs: :code:`before_<subcommand>` and :code:`after_<subcommand>`. -A realistic example for these would be to send an email before and after the execution. -The code for the :code:`fit` subcommand would be something like: - -.. testcode:: - - class MyLightningCLI(LightningCLI): - def add_arguments_to_parser(self, parser): - parser.add_argument("--notification_email", default="will@email.com") - - def before_fit(self): - send_email(address=self.config["notification_email"], message="trainer.fit starting") - - def after_fit(self): - send_email(address=self.config["notification_email"], message="trainer.fit finished") - - - cli = MyLightningCLI(MyModel) - -Note that the config object :code:`self.config` is a dictionary whose keys are global options or groups of options. It -has the same structure as the yaml format described previously. This means for instance that the parameters used for -instantiating the trainer class can be found in :code:`self.config['fit']['trainer']`. - -.. 
tip:: - - Have a look at the :class:`~pytorch_lightning.utilities.cli.LightningCLI` class API reference to learn about other - methods that can be extended to customize a CLI. - ----- - -************************** -Configure forced callbacks -************************** -As explained previously, any Lightning callback can be added by passing it through command line or -including it in the config via :code:`class_path` and :code:`init_args` entries. - -However, certain callbacks MUST be coupled with a model so they are always present and configurable. -This can be implemented as follows: - -.. testcode:: - - from pytorch_lightning.callbacks import EarlyStopping - - - class MyLightningCLI(LightningCLI): - def add_arguments_to_parser(self, parser): - parser.add_lightning_class_args(EarlyStopping, "my_early_stopping") - parser.set_defaults({"my_early_stopping.monitor": "val_loss", "my_early_stopping.patience": 5}) - - - cli = MyLightningCLI(MyModel) - -To change the configuration of the :code:`EarlyStopping` in the config it would be: - -.. code-block:: yaml - - model: - ... - trainer: - ... - my_early_stopping: - patience: 5 - -.. note:: - - The example above overrides a default in :code:`add_arguments_to_parser`. This is included to show that defaults can - be changed if needed. However, note that overriding of defaults in the source code is not intended to be used to - store the best hyperparameters for a task after experimentation. To ease reproducibility the source code should be - stable. It is better practice to store the best hyperparameters for a task in a configuration file independent from - the source code. - ----- - -******************* -Class type defaults -******************* - -The support for classes as type hints allows to try many possibilities with the same CLI. This is a useful feature, but -it can make it tempting to use an instance of a class as a default. For example: - -.. 
testcode:: - - class MyMainModel(LightningModule): - def __init__( - self, - backbone: torch.nn.Module = MyModel(encoder_layers=24), # BAD PRACTICE! - ): - super().__init__() - self.backbone = backbone - -Normally classes are mutable as it is in this case. The instance of :code:`MyModel` would be created the moment that the -module that defines :code:`MyMainModel` is first imported. This means that the default of :code:`backbone` will be -initialized before the CLI class runs :code:`seed_everything` making it non-reproducible. Furthermore, if -:code:`MyMainModel` is used more than once in the same Python process and the :code:`backbone` parameter is not -overridden, the same instance would be used in multiple places which very likely is not what the developer intended. -Having an instance as default also makes it impossible to generate the complete config file since for arbitrary classes -it is not known which arguments were used to instantiate it. - -A good solution to these problems is to not have a default or set the default to a special value (e.g. a -string) which would be checked in the init and instantiated accordingly. If a class parameter has no default and the CLI -is subclassed then a default can be set as follows: - -.. testcode:: - - default_backbone = { - "class_path": "import.path.of.MyModel", - "init_args": { - "encoder_layers": 24, - }, - } - - - class MyLightningCLI(LightningCLI): - def add_arguments_to_parser(self, parser): - parser.set_defaults({"model.backbone": default_backbone}) - -A more compact version that avoids writing a dictionary would be: - -.. 
testcode:: - - from jsonargparse import lazy_instance - - - class MyLightningCLI(LightningCLI): - def add_arguments_to_parser(self, parser): - parser.set_defaults({"model.backbone": lazy_instance(MyModel, encoder_layers=24)}) - ----- - -************************ -Connect two config files -************************ -Another case in which it might be desired to extend :class:`~pytorch_lightning.utilities.cli.LightningCLI` is that the -model and data module depend on a common parameter. For example in some cases both classes require to know the -:code:`batch_size`. It is a burden and error prone giving the same value twice in a config file. To avoid this the -parser can be configured so that a value is only given once and then propagated accordingly. With a tool implemented -like shown below, the :code:`batch_size` only has to be provided in the :code:`data` section of the config. - -.. testcode:: - - class MyLightningCLI(LightningCLI): - def add_arguments_to_parser(self, parser): - parser.link_arguments("data.batch_size", "model.batch_size") - - - cli = MyLightningCLI(MyModel, MyDataModule) - -The linking of arguments is observed in the help of the tool, which for this example would look like: - -.. code-block:: bash - - $ python trainer.py fit --help - ... - --data.batch_size BATCH_SIZE - Number of samples in a batch (type: int, default: 8) - - Linked arguments: - model.batch_size <-- data.batch_size - Number of samples in a batch (type: int) - -Sometimes a parameter value is only available after class instantiation. An example could be that your model requires -the number of classes to instantiate its fully connected layer (for a classification task) but the value is not -available until the data module has been instantiated. The code below illustrates how to address this. - -.. 
testcode:: - - class MyLightningCLI(LightningCLI): - def add_arguments_to_parser(self, parser): - parser.link_arguments("data.num_classes", "model.num_classes", apply_on="instantiate") - - - cli = MyLightningCLI(MyClassModel, MyDataModule) - -Instantiation links are used to automatically determine the order of instantiation, in this case data first. - -.. tip:: - - The linking of arguments can be used for more complex cases. For example to derive a value via a function that takes - multiple settings as input. For more details have a look at the API of `link_arguments - `_. - - -The linking of arguments is intended for things that are meant to be non-configurable. This improves the CLI user -experience since it avoids the need for providing more parameters. A related concept is -variable interpolation which in contrast keeps things being configurable. diff --git a/source/cli/lightning_cli_faq.rst b/source/cli/lightning_cli_faq.rst deleted file mode 100644 index ca1be71..0000000 --- a/source/cli/lightning_cli_faq.rst +++ /dev/null @@ -1,136 +0,0 @@ -:orphan: - -.. testsetup:: * - :skipif: not _JSONARGPARSE_AVAILABLE - - import torch - from unittest import mock - from typing import List - import pytorch_lightning as pl - from pytorch_lightning import LightningModule, LightningDataModule, Trainer, Callback - - - class NoFitTrainer(Trainer): - def fit(self, *_, **__): - pass - - - class LightningCLI(pl.utilities.cli.LightningCLI): - def __init__(self, *args, trainer_class=NoFitTrainer, run=False, **kwargs): - super().__init__(*args, trainer_class=trainer_class, run=run, **kwargs) - - - class MyModel(LightningModule): - def __init__( - self, - encoder_layers: int = 12, - decoder_layers: List[int] = [2, 4], - batch_size: int = 8, - ): - pass - - - mock_argv = mock.patch("sys.argv", ["any.py"]) - mock_argv.start() - -.. 
testcleanup:: * - - mock_argv.stop() - -##################################### -Eliminate config boilerplate (expert) -##################################### - -*************** -Troubleshooting -*************** -The standard behavior for CLIs, when they fail, is to terminate the process with a non-zero exit code and a short message -to hint the user about the cause. This is problematic while developing the CLI since there is no information to track -down the root of the problem. A simple change in the instantiation of the ``LightningCLI`` can be used such that when -there is a failure an exception is raised and the full stack trace printed. - -.. testcode:: - - cli = LightningCLI(MyModel, parser_kwargs={"error_handler": None}) - -.. note:: - - When asking about problems and reporting issues please set the ``error_handler`` to ``None`` and include the stack - trace in your description. With this, it is more likely for people to help out identifying the cause without needing - to create a reproducible script. - ----- - -************************************* -Reproducibility with the LightningCLI -************************************* -The topic of reproducibility is complex and it is impossible to guarantee reproducibility by just providing a class that -people can use in unexpected ways. Nevertheless, the :class:`~pytorch_lightning.utilities.cli.LightningCLI` tries to -give a framework and recommendations to make reproducibility simpler. - -When an experiment is run, it is good practice to use a stable version of the source code, either being a released -package or at least a commit of some version controlled repository. For each run of a CLI the config file is -automatically saved including all settings. This is useful to figure out what was done for a particular run without -requiring to look at the source code. 
If by mistake the exact version of the source code is lost or some defaults -have changed, having the full config means that most of the information is preserved. - -The class is targeted at implementing CLIs because running a command from a shell provides a separation from the Python -source code. Ideally the CLI would be placed in your path as part of the installation of a stable package, instead of -running from a clone of a repository that could have uncommitted local modifications. Creating installable packages that -include CLIs is out of the scope of this document. This is mentioned only as a teaser for people who would strive for -the best practices possible. - - -For every CLI implemented, users are encouraged to learn how to run it by reading the documentation printed with the -:code:`--help` option and use the :code:`--print_config` option to guide the writing of config files. A few more details -that might not be clear by only reading the help are the following. - -:class:`~pytorch_lightning.utilities.cli.LightningCLI` is based on argparse and as such follows the same arguments style -as many POSIX command line tools. Long options are prefixed with two dashes and their corresponding values should be -separated from them by a space or an equal sign, as :code:`--option value` or :code:`--option=value`. Command line options -are parsed from left to right, therefore if a setting appears multiple times the rightmost value will override -the previous ones. If a class has an init parameter that is required (i.e. no default value), it is given as -:code:`--option` which makes it explicit and more readable instead of relying on positional arguments. - ----- - -********************* -What is a subcommand? -********************* -A subcommand is the action that the LightningCLI applies to the script: - -.. code:: bash - - python main.py [subcommand] - -See the available subcommands with: - -.. code:: bash - - python main.py --help - -which prints: - -.. 
code:: bash - - ... - - fit Runs the full optimization routine. - validate Perform one evaluation epoch over the validation set. - test Perform one evaluation epoch over the test set. - predict Run inference on your data. - tune Runs routines to tune hyperparameters before training. - -use a subcommand as follows: - -.. code:: bash - - python main.py fit - python main.py test - ----- - -**************** -What is the CLI? -**************** -CLI is short for commandline interface. Use your terminal to enter these commands. diff --git a/source/cli/lightning_cli_intermediate.rst b/source/cli/lightning_cli_intermediate.rst deleted file mode 100644 index 36c6adb..0000000 --- a/source/cli/lightning_cli_intermediate.rst +++ /dev/null @@ -1,204 +0,0 @@ -:orphan: - -########################################### -Eliminate config boilerplate (Intermediate) -########################################### -**Audience:** Users who want advanced modularity via the commandline interface (CLI). - -**Pre-reqs:** You must already understand how to use a commandline and :doc:`LightningDataModule <../data/datamodule>`. - ----- - -*************************** -What is config boilerplate? -*************************** -As Lightning projects grow in complexity it becomes desirable to enable full customizability from the commandline (CLI) so you can -change any hyperparameters without changing your code: - -.. code:: bash - - # Mix and match anything - $ python main.py --command fit --model.learning_rate 0.02 - $ python main.py --command fit --model.learning_rate 0.01 --trainer.fast_dev_run True - -This is what the Lightning CLI enables. Without the Lightning CLI, you usually end up with a TON of boilerplate that looks like this: - -.. 
code:: python - - from argparse import ArgumentParser - - if __name__ == "__main__": - parser = ArgumentParser() - parser.add_argument("--learning_rate_1", default=0.02) - parser.add_argument("--learning_rate_2", default=0.03) - parser.add_argument("--model", default="cnn") - parser.add_argument("--command", default="fit") - parser.add_argument("--run_fast", default=True) - ... - # add 100 more of these - ... - - args = parser.parse_args() - - if args.model == "cnn": - model = ConvNet(learning_rate=args.learning_rate_1) - elif args.model == "transformer": - model = Transformer(learning_rate=args.learning_rate_2) - trainer = Trainer(fast_dev_run=args.run_fast) - ... - - if args.command == "fit": - trainer.fit() - elif args.command == "test": - ... - -This kind of boilerplate is unsustainable as projects grow in complexity. - ----- - -************************ -Enable the Lightning CLI -************************ -To enable the Lightning CLI install the extras: - -.. code:: bash - - pip install pytorch-lightning[extra] - -if the above fails, only install jsonargparse: - -.. code:: bash - - pip install -U jsonargparse[signatures] - ----- - -************************** -Connect a model to the CLI -************************** -The simplest way to control a model with the CLI is to wrap it in the LightningCLI object: - -.. 
code:: python - - # main.py - - import torch - from pytorch_lightning.utilities.cli import LightningCLI - from pytorch_lightning import LightningModule, demos - - - class DemoModel(LightningModule): - def __init__(self, out_dim: int = 10, learning_rate: float = 0.02): - super().__init__() - self.l1 = torch.nn.Linear(32, out_dim) - self.learning_rate = learning_rate - - def forward(self, x): - return torch.relu(self.l1(x.view(x.size(0), -1))) - - def training_step(self, batch, batch_nb): - x = batch - x = self(x) - loss = x.sum() - return loss - - def configure_optimizers(self): - return torch.optim.Adam(self.parameters(), lr=self.learning_rate) - - - cli = LightningCLI(DemoModel, demos.BoringDataModule) - # don't call fit!! - -Now your model can be managed via the CLI. To see the available commands type: - -.. code:: bash - - $ python main.py --help - -Which prints out: - -.. code:: bash - - usage: a.py [-h] [-c CONFIG] [--print_config [={comments,skip_null,skip_default}+]] - {fit,validate,test,predict,tune} ... - - pytorch-lightning trainer command line tool - - optional arguments: - -h, --help Show this help message and exit. - -c CONFIG, --config CONFIG - Path to a configuration file in json or yaml format. - --print_config [={comments,skip_null,skip_default}+] - Print configuration and exit. - - subcommands: - For more details of each subcommand add it as argument followed by --help. - - {fit,validate,test,predict,tune} - fit Runs the full optimization routine. - validate Perform one evaluation epoch over the validation set. - test Perform one evaluation epoch over the test set. - predict Run inference on your data. - tune Runs routines to tune hyperparameters before training. - - -the message tells us that we have a few available subcommands: - -.. code:: bash - - python main.py [subcommand] - -which you can use depending on your use case: - -.. 
code:: bash - - $ python main.py fit - $ python main.py validate - $ python main.py test - $ python main.py predict - $ python main.py tune - ----- - -************************** -Train a model with the CLI -************************** -To run the full training routine (train, val, test), use the subcommand ``fit``: - -.. code:: bash - - python main.py fit - -View all available options with the ``--help`` command: - -.. code:: bash - - usage: main.py [options] fit [-h] [-c CONFIG] - [--seed_everything SEED_EVERYTHING] [--trainer CONFIG] - ... - [--ckpt_path CKPT_PATH] - --trainer.logger LOGGER - - optional arguments: - : - --model.out_dim OUT_DIM - (type: int, default: 10) - --model.learning_rate LEARNING_RATE - (type: float, default: 0.02) - : - --data CONFIG Path to a configuration file. - --data.data_dir DATA_DIR - (type: str, default: ./) - -With the Lightning CLI enabled, you can now change the parameters without touching your code: - -.. code:: bash - - # change the out dimensions - python main.py fit --model.out_dim 30 - - # change the learning_rate also - python main.py fit --model.out_dim 10 --model.learning_rate 0.1 - - # change trainer and data arguments too - python main.py fit --model.out_dim 2 --model.learning_rate 0.1 --data.data_dir '~/' --trainer.logger False diff --git a/source/cli/lightning_cli_intermediate_2.rst b/source/cli/lightning_cli_intermediate_2.rst deleted file mode 100644 index 493d536..0000000 --- a/source/cli/lightning_cli_intermediate_2.rst +++ /dev/null @@ -1,251 +0,0 @@ -:orphan: - -########################################### -Eliminate config boilerplate (intermediate) -########################################### -**Audience:** Users who have multiple models and datasets per project. - -**Pre-reqs:** You must have read :doc:`(Control it all from the CLI) <lightning_cli_intermediate>`.
- ----- - -**************************************** -Why do I want to mix models and datasets -**************************************** -Lightning projects usually begin with one model and one dataset. As the project grows in complexity and you introduce more models and more datasets, it becomes desirable -to mix any model with any dataset directly from the commandline without changing your code. - - -.. code:: bash - - # Mix and match anything - $ python main.py fit --model=GAN --data=MNIST - $ python main.py fit --model=Transformer --data=MNIST - -This is what the Lightning CLI enables. Otherwise, this kind of configuration requires a significant amount of boilerplate that often looks like this: - -.. code:: python - - # choose model - if args.model == "gan": - model = GAN(args.feat_dim) - elif args.model == "transformer": - model = Transformer(args.feat_dim) - ... - - # choose datamodule - if args.data == "MNIST": - datamodule = MNIST() - elif args.data == "imagenet": - datamodule = Imagenet() - ... - - # mix them! - trainer.fit(model, datamodule) - ----- - -************************* -Register LightningModules -************************* -Connect models across different files with the ``MODEL_REGISTRY`` to make them available from the CLI: - -.. code:: python - - # main.py - - from pytorch_lightning import demos - from pytorch_lightning.utilities import cli as pl_cli - - - @pl_cli.MODEL_REGISTRY - class Model1(demos.DemoModel): - def configure_optimizers(self): - print("⚡", "using Model1", "⚡") - return super().configure_optimizers() - - - @pl_cli.MODEL_REGISTRY - class Model2(demos.DemoModel): - def configure_optimizers(self): - print("⚡", "using Model2", "⚡") - return super().configure_optimizers() - - - cli = pl_cli.LightningCLI(datamodule_class=demos.BoringDataModule) - -Now you can choose between any model from the CLI: - -.. 
code:: bash - - # use Model1 - python main.py fit --model Model1 - - # use Model2 - python main.py fit --model Model2 - ----- - -******************** -Register DataModules -******************** -Connect DataModules across different files with the ``DATAMODULE_REGISTRY`` to make them available from the CLI: - -.. code:: python - - # main.py - import torch - from pytorch_lightning.utilities import cli as pl_cli - from pytorch_lightning import demos - - - @pl_cli.DATAMODULE_REGISTRY - class FakeDataset1(demos.BoringDataModule): - def train_dataloader(self): - print("⚡", "using FakeDataset1", "⚡") - return torch.utils.data.DataLoader(self.random_train) - - - @pl_cli.DATAMODULE_REGISTRY - class FakeDataset2(demos.BoringDataModule): - def train_dataloader(self): - print("⚡", "using FakeDataset2", "⚡") - return torch.utils.data.DataLoader(self.random_train) - - - cli = pl_cli.LightningCLI(demos.DemoModel) - -Now you can choose between any dataset at runtime: - -.. code:: bash - - # use FakeDataset1 - python main.py fit --data FakeDataset1 - - # use FakeDataset2 - python main.py fit --data FakeDataset2 - ----- - -******************* -Register optimizers -******************* -Connect optimizers with the ``OPTIMIZER_REGISTRY`` to make them available from the CLI: - -.. code:: python - - # main.py - import torch - from pytorch_lightning.utilities import cli as pl_cli - from pytorch_lightning import demos - - - @pl_cli.OPTIMIZER_REGISTRY - class LitAdam(torch.optim.Adam): - def step(self, closure): - print("⚡", "using LitAdam", "⚡") - super().step(closure) - - - @pl_cli.OPTIMIZER_REGISTRY - class FancyAdam(torch.optim.Adam): - def step(self, closure): - print("⚡", "using FancyAdam", "⚡") - super().step(closure) - - - cli = pl_cli.LightningCLI(demos.DemoModel, demos.BoringDataModule) - -Now you can choose between any optimizer at runtime: - -.. 
code:: bash - - # use LitAdam - python main.py fit --optimizer LitAdam - - # use FancyAdam - python main.py fit --optimizer FancyAdam - -Bonus: If you need only 1 optimizer, the Lightning CLI already works out of the box with any Optimizer from ``torch.optim``: - -.. code:: bash - - python main.py fit --optimizer AdamW - -If the optimizer you want needs other arguments, add them via the CLI (no need to change your code)! - -.. code:: bash - - python main.py fit --optimizer SGD --optimizer.lr=0.01 - ----- - -********************** -Register LR schedulers -********************** -Connect learning rate schedulers with the ``LR_SCHEDULER_REGISTRY`` to make them available from the CLI: - -.. code:: python - - # main.py - import torch - from pytorch_lightning.utilities import cli as pl_cli - from pytorch_lightning import demos - - - @pl_cli.LR_SCHEDULER_REGISTRY - class LitLRScheduler(torch.optim.lr_scheduler.CosineAnnealingLR): - def step(self): - print("⚡", "using LitLRScheduler", "⚡") - super().step() - - - cli = pl_cli.LightningCLI(demos.DemoModel, demos.BoringDataModule) - -Now you can choose between any learning rate scheduler at runtime: - -.. code:: bash - - # LitLRScheduler - python main.py fit --lr_scheduler LitLRScheduler - - -Bonus: If you need only 1 LRScheduler, the Lightning CLI already works out of the box with any LRScheduler from ``torch.optim.lr_scheduler``: - -.. code:: bash - - python main.py fit --lr_scheduler CosineAnnealingLR - python main.py fit --lr_scheduler LinearLR - ... - -If the scheduler you want needs other arguments, add them via the CLI (no need to change your code)! - -.. code:: bash - - python main.py fit --lr_scheduler=ReduceLROnPlateau --lr_scheduler.monitor=epoch - ----- - -************************* -Register from any package -************************* -A shortcut to register many classes from a package is to use the ``register_classes`` method. Here we register all optimizers from the ``torch.optim`` library: - -.. 
code:: python - - import torch - from pytorch_lightning.utilities import cli as pl_cli - from pytorch_lightning import demos - - # add all PyTorch optimizers! - pl_cli.OPTIMIZER_REGISTRY.register_classes(module=torch.optim, base_cls=torch.optim.Optimizer) - - cli = pl_cli.LightningCLI(demos.DemoModel, demos.BoringDataModule) - -Now use any of the optimizers in the ``torch.optim`` library: - -.. code:: bash - - python main.py fit --optimizer AdamW - -This method is supported by all the registry classes. diff --git a/source/clouds/cloud_training.rst b/source/clouds/cloud_training.rst deleted file mode 100644 index 1bd57b1..0000000 --- a/source/clouds/cloud_training.rst +++ /dev/null @@ -1,86 +0,0 @@ -.. _grid: - -################## -Train on the cloud -################## -**Audience:** Users who want to develop and train models on the cloud (public cloud, private cloud or onprem clusters). - ----- - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: 1: Access a GPU machine on the cloud - :description: Learn to train models using an interactive cloud machine. - :col_css: col-md-4 - :button_link: session_basic.html - :height: 200 - :tag: basic - -.. displayitem:: - :header: 2: Run a model in the background on the cloud - :description: Learn to run a model in the background on a cloud machine. - :col_css: col-md-4 - :button_link: run_basic.html - :height: 200 - :tag: intermediate - -.. displayitem:: - :header: 3: Save up to 80% on cloud costs with fault-tolerant training - :description: Run on the cloud for 1/10th the price with fault-tolerant training. - :col_css: col-md-4 - :button_link: fault_tolerant_training_basic.html - :height: 200 - :tag: intermediate - -.. displayitem:: - :header: 4: Run many models at once - :description: Run many models at once (sweep) to find the best performing model. - :col_css: col-md-4 - :button_link: run_intermediate.html - :height: 200 - :tag: intermediate - -.. displayitem:: - :header: 5: Run on your own cloud - :description: Learn how to run on your Company or University private clouds. - :col_css: col-md-4 - :button_link: run_expert.html - :height: 200 - :tag: expert - -.. raw:: html - -
-
- ----- - -.. raw:: html - -
-
- -.. raw:: html - - - - -.. raw:: html - -
-
- -`Grid.ai `_ is the official cloud training solution for PyTorch Lightning. Grid is designed to support researcher workloads at both academic labs and major companies. - -.. raw:: html - -
-
diff --git a/source/clouds/cloud_training_intermediate.rst b/source/clouds/cloud_training_intermediate.rst deleted file mode 100644 index c5a65d7..0000000 --- a/source/clouds/cloud_training_intermediate.rst +++ /dev/null @@ -1,7 +0,0 @@ -:orphan: - -.. _grid_cloud_intermediate: - -################################# -Train on the cloud (intermediate) -################################# diff --git a/source/clouds/cluster_advanced.rst b/source/clouds/cluster_advanced.rst deleted file mode 100644 index 918bf06..0000000 --- a/source/clouds/cluster_advanced.rst +++ /dev/null @@ -1,213 +0,0 @@ -#################################### -Run on an on-prem cluster (advanced) -#################################### - -.. _slurm: - ----- - -****************************** -Run on a SLURM managed cluster -****************************** -Lightning automates the details behind training on a SLURM-powered cluster. In contrast to the general purpose -cluster above, the user does not start the jobs manually on each node and instead submits them to SLURM, which -schedules the resources and time for which the job is allowed to run. - ----- - -*************************** -Design your training script -*************************** - -To train a model using multiple nodes, do the following: - -1. Design your :ref:`lightning_module` (no need to add anything specific here). - -2. Enable DDP in the trainer - - .. code-block:: python - - # train on 32 GPUs across 4 nodes - trainer = Trainer(accelerator="gpu", devices=8, num_nodes=4, strategy="ddp") - -3. It's a good idea to structure your training script like this: - - .. 
testcode:: - - # train.py - def main(hparams): - model = LightningTemplateModel(hparams) - - trainer = Trainer(accelerator="gpu", devices=8, num_nodes=4, strategy="ddp") - - trainer.fit(model) - - - if __name__ == "__main__": - root_dir = os.path.dirname(os.path.realpath(__file__)) - parent_parser = ArgumentParser(add_help=False) - hyperparams = parser.parse_args() - - # TRAIN - main(hyperparams) - -4. Create the appropriate SLURM job: - - .. code-block:: bash - - # (submit.sh) - #!/bin/bash -l - - # SLURM SUBMIT SCRIPT - #SBATCH --nodes=4 - #SBATCH --gres=gpu:8 - #SBATCH --ntasks-per-node=8 - #SBATCH --mem=0 - #SBATCH --time=0-02:00:00 - - # activate conda env - source activate $1 - - # debugging flags (optional) - export NCCL_DEBUG=INFO - export PYTHONFAULTHANDLER=1 - - # on your cluster you might need these: - # set the network interface - # export NCCL_SOCKET_IFNAME=^docker0,lo - - # might need the latest CUDA - # module load NCCL/2.4.7-1-cuda.10.0 - - # run script from above - srun python3 train.py - -5. If you want auto-resubmit (read below), add this line to the submit.sh script - - .. code-block:: bash - - #SBATCH --signal=SIGUSR1@90 - -6. Submit the SLURM job - - .. code-block:: bash - - sbatch submit.sh - ----- - -*********************************** -Enable auto wall-time resubmissions -*********************************** -When you use Lightning in a SLURM cluster, it automatically detects when it is about -to run into the wall time and does the following: - -1. Saves a temporary checkpoint. -2. Requeues the job. -3. When the job starts, it loads the temporary checkpoint. - -To get this behavior make sure to add the correct signal to your SLURM script - -.. code-block:: bash - - # 90 seconds before training ends - #SBATCH --signal=SIGUSR1@90 - -If auto-resubmit is not desired, it can be turned off in the :class:`~pytorch_lightning.plugins.environments.slurm_environment.SLURMEnvironment` plugin: - -..
code-block:: python - - from pytorch_lightning.plugins.environments import SLURMEnvironment - - trainer = Trainer(plugins=[SLURMEnvironment(auto_requeue=False)]) - ----- - -*********************** -Build your SLURM script -*********************** -Instead of manually building SLURM scripts, you can use the -`SlurmCluster object `_ -to do this for you. The SlurmCluster can also run a grid search if you pass -in a `HyperOptArgumentParser -`_. - -Here is an example where you run a grid search of 9 combinations of hyperparameters. -See also the multi-node examples -`here `__. - -.. code-block:: python - - # grid search 3 values of learning rate and 3 values of number of layers for your net - # this generates 9 experiments (lr=1e-3, layers=16), (lr=1e-3, layers=32), - # (lr=1e-3, layers=64), ... (lr=1e-1, layers=64) - parser = HyperOptArgumentParser(strategy="grid_search", add_help=False) - parser.opt_list("--learning_rate", default=0.001, type=float, options=[1e-3, 1e-2, 1e-1], tunable=True) - parser.opt_list("--layers", default=1, type=float, options=[16, 32, 64], tunable=True) - hyperparams = parser.parse_args() - - # Slurm cluster submits 9 jobs, each with a set of hyperparams - cluster = SlurmCluster( - hyperparam_optimizer=hyperparams, - log_path="/some/path/to/save", - ) - - # OPTIONAL FLAGS WHICH MAY BE CLUSTER DEPENDENT - # which interface your nodes use for communication - cluster.add_command("export NCCL_SOCKET_IFNAME=^docker0,lo") - - # see the output of the NCCL connection process - # NCCL is how the nodes talk to each other - cluster.add_command("export NCCL_DEBUG=INFO") - - # setting a main port here is a good idea. 
- cluster.add_command("export MASTER_PORT=%r" % PORT) - - # ************** DON'T FORGET THIS *************** - # MUST load the latest NCCL version - cluster.load_modules(["NCCL/2.4.7-1-cuda.10.0"]) - - # configure cluster - cluster.per_experiment_nb_nodes = 12 - cluster.per_experiment_nb_gpus = 8 - - cluster.add_slurm_cmd(cmd="ntasks-per-node", value=8, comment="1 task per gpu") - - # submit a script with 9 combinations of hyper params - # (lr=1e-3, layers=16), (lr=1e-3, layers=32), (lr=1e-3, layers=64), ... (lr=1e-1, layers=64) - cluster.optimize_parallel_cluster_gpu( - main, nb_trials=9, job_name="name_for_squeue" # how many permutations of the grid search to run - ) - - -The other option is that you generate scripts on your own via a bash command or use our -:doc:`native solution <../clouds/cloud_training>`. - ----- - -******** -Get help -******** -Setting up a cluster for distributed training is not trivial. Lightning offers lightning-grid which allows you to configure a cluster easily and run experiments via the CLI and web UI. - -Try it out for free today: - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Train models on the cloud - :description: Learn to run a model in the background on a cloud machine. - :col_css: col-md-6 - :button_link: cloud_training.html - :height: 150 - :tag: intermediate - -.. raw:: html - -
-
bool: - """Return True if the cluster is managed (you don't launch processes yourself)""" - return True - - def world_size(self) -> int: - return int(os.environ["WORLD_SIZE"]) - - def global_rank(self) -> int: - return int(os.environ["RANK"]) - - def local_rank(self) -> int: - return int(os.environ["LOCAL_RANK"]) - - def node_rank(self) -> int: - return int(os.environ["NODE_RANK"]) - - def main_address(self) -> str: - return os.environ["MASTER_ADDRESS"] - - def main_port(self) -> int: - return int(os.environ["MASTER_PORT"]) - - - trainer = Trainer(plugins=[MyClusterEnvironment()]) - ----- - -******** -Get help -******** -Setting up a cluster for distributed training is not trivial. Lightning offers lightning-grid which allows you to configure a cluster easily and run experiments via the CLI and web UI. - -Try it out for free today: - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Train models on the cloud - :description: Learn to run a model in the background on a cloud machine. - :col_css: col-md-6 - :button_link: cloud_training.html - :height: 150 - :tag: intermediate - -.. raw:: html - -
-
`__ provides helper functions to setup distributed environment variables from the `PyTorch distributed communication package `__ that need to be defined on each node. - -Once the script is setup like described in :ref:` Training Script Setup`, you can run the below command across your nodes to start multi-node training. - -Like a custom cluster, you have to ensure that there is network connectivity between the nodes with firewall rules that allow traffic flow on a specified *MASTER_PORT*. - -Finally, you'll need to decide which node you'd like to be the main node (*MASTER_ADDR*), and the ranks of each node (*NODE_RANK*). - -For example: - -* *MASTER_ADDR* 10.10.10.16 -* *MASTER_PORT* 29500 -* *NODE_RANK* 0 for the first node, 1 for the second node - -Run the below command with the appropriate variables set on each node. - -.. code-block:: bash - - python -m torch.distributed.run - --nnodes=2 # number of nodes you'd like to run with - --master_addr - --master_port - --node_rank - train.py (--arg1 ... train script args...) - -.. note:: - - ``torch.distributed.run`` assumes that you'd like to spawn a process per GPU if GPU devices are found on the node. This can be adjusted with ``-nproc_per_node``. - ----- - -******** -Get help -******** -Setting up a cluster for distributed training is not trivial. Lightning offers lightning-grid which allows you to configure a cluster easily and run experiments via the CLI and web UI. - -Try it out for free today: - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Train models on the cloud - :description: Learn to run a model in the background on a cloud machine. - :col_css: col-md-6 - :button_link: cloud_training.html - :height: 150 - :tag: intermediate - -.. raw:: html - -
-
`. - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Basic - :description: Save money with fault-tolerant training on the cloud - :col_css: col-md-4 - :button_link: fault_tolerant_training_basic.html - :height: 150 - :tag: basic - -.. displayitem:: - :header: Expert - :description: Learn how to enable fault tolerance on any cloud or cluster environment - :col_css: col-md-4 - :button_link: fault_tolerant_training_expert.html - :height: 150 - :tag: expert - -.. displayitem:: - :header: FAQ - :description: Frequently asked questions about fault-tolerant training. - :col_css: col-md-4 - :button_link: fault_tolerant_training_faq.html - :height: 150 - -.. raw:: html - -
-
diff --git a/source/clouds/fault_tolerant_training_basic.rst b/source/clouds/fault_tolerant_training_basic.rst deleted file mode 100644 index d5af9ed..0000000 --- a/source/clouds/fault_tolerant_training_basic.rst +++ /dev/null @@ -1,43 +0,0 @@ -:orphan: - -############################### -Fault-tolerant Training (basic) -############################### -**Audience:** Users who want to run on the cloud or a cluster environment. - -**Pre-requisites**: Users must have first read :doc:`Run on the cloud (basic) ` - ----- - -******************************** -What is fault-tolerant training? -******************************** -When developing models on the cloud or cluster environments, you may be forced to restart from scratch in the event of a software or hardware failure (i.e., a *fault*). Lightning models can run fault-proof. - -With Fault Tolerant Training, when ``Trainer.fit()`` fails in the middle of an epoch during training or validation, -Lightning will restart exactly where it failed, and everything will be restored (down to the batch it was on even if the dataset was shuffled). - -.. warning:: Fault-tolerant Training is currently an experimental feature within Lightning. - ----- - -*************************************************** -Use fault-tolerance to save money on cloud training -*************************************************** -Cloud providers offer pre-emptible machines which can be priced as low as 1/10th the cost but can be shut-down automatically at any time. -Because fault-tolerant training can automatically recover from an interruption, you can train models for many weeks/months at a time for the pre-emptible prices. - -To easily run on the cloud with fault-tolerance with lightning-grid, use the following arguments: - -.. code-block:: bash - - grid run --use_spot --auto_resume lightning_script.py - -The ``--use_spot`` argument enables cheap preemptible pricing (but the machines can be interrupted).
-If the machine is interrupted, the ``--auto_resume`` argument automatically restarts the machine. - -As long as you are running a script that runs a lightning model, the model will restore itself and handle all the details of fault tolerance. - ----- - -.. include:: grid_costs.rst diff --git a/source/clouds/fault_tolerant_training_expert.rst b/source/clouds/fault_tolerant_training_expert.rst deleted file mode 100644 index f0051f7..0000000 --- a/source/clouds/fault_tolerant_training_expert.rst +++ /dev/null @@ -1,34 +0,0 @@ -:orphan: - -################################ -Fault-tolerant Training (expert) -################################ -**Audience**: Experts looking to enable and handle their own fault-tolerance. - -**Pre-requisites**: Users must have first read :doc:`Fault-tolerant Training (basic) ` - ----- - -*************************************** -Enable fault-tolerant behavior anywhere -*************************************** -To enable fault tolerance on your own cloud or cluster environment enable the *PL_FAULT_TOLERANT_TRAINING* environment variable: - -.. code-block:: bash - - PL_FAULT_TOLERANT_TRAINING=1 python script.py - -Although Lightning will now be fault-tolerant, you'll have to handle all the nuances of making sure the models are automatically restarted. - -.. note:: This complexity is already handled for you if you use **lightning-grid**. - ----- - -************************************************** -Enable fault-tolerant behavior on your own cluster -************************************************** -The simplest way to enable fault-tolerant behavior is to enable lightning-grid to work on your on-prem cluster or cloud environment which will handle all the nuances of fault-tolerant training at scale.
- -Email us to connect with your own cloud account: - -``_ diff --git a/source/clouds/fault_tolerant_training_faq.rst b/source/clouds/fault_tolerant_training_faq.rst deleted file mode 100644 index 4f2bdf4..0000000 --- a/source/clouds/fault_tolerant_training_faq.rst +++ /dev/null @@ -1,144 +0,0 @@ -:orphan: - -############################# -Fault-tolerant Training (FAQ) -############################# - -******************************* -How do I use iterable datasets? -******************************* -To support fault-tolerance, you will need to use and expose a sampler within your dataset. - -For example, the following implementation for an iterable dataset sub-classing :class:`~torch.utils.data.IterableDataset` won't be supported. - -.. code-block:: python - - from torch.utils.data import IterableDataset, DataLoader - - - # does not support fault tolerance training! - class RandomIterableDataset(IterableDataset): - def __init__(self, size: int, count: int): - self.count = count - self.size = size - - def __iter__(self): - for _ in range(self.count): - yield torch.randn(self.size) - - -There are two primary reasons why Lightning can't support the previous implementation. - -* Lightning cannot infer what you are iterating over, making it difficult to restart training. Lightning Fault Tolerant Training requires a :class:`~torch.utils.data.distributed.Sampler` to be used to encapsulate the fetching logic, requiring both the sampler and an iterator to be made available as attributes within the dataset, so Lightning can access them to track progress. -* Implementing the `__next__` method is required as it separates iterator creation from its consumption, which is essential for Lightning to wrap the iterator before its consumption. - -If your iterable dataset is implemented in the following way, everything should work as expected. - -..
code-block:: python - - import torch - from torch.utils.data import IterableDataset, DataLoader - - - class RandomIterableDataset(IterableDataset): - def __init__(self, size: int, length: int): - self.data = torch.randn(length, size) - - # expose the sampler as an attribute - self.sampler = RandomSampler(range(length)) - - def __iter__(self) -> "RandomIterableDataset": - # expose the generator from the sampler as an attribute - # the ``sampler_iter`` will be wrapped by Lightning to ensure - # we can capture random seeds and iteration count for fast-forward samplers - # while restarting. - self.sampler_iter = iter(self.sampler) - return self - - def __next__(self) -> torch.Tensor: - # call next on the iterator and get the associated data. - # the logic here can become more complex but the sampler - # should be the central piece for fetching the next sample - index = next(self.sampler_iter) - return self.data[index] - ----- - -********************************** -How do I use multiple dataloaders? -********************************** -If you are using multiple training dataloaders, Lightning won't be able to restore the random state properly. - -.. testcode:: - - class LitModel(LightningModule): - def train_dataloader(self): - loader_a = torch.utils.data.DataLoader(range(8), batch_size=4) - loader_b = torch.utils.data.DataLoader(range(16), batch_size=4) - return {"loader_a": loader_a, "loader_b": loader_b} - - def training_step(self, batch, batch_idx): - # access the data in the same format as the collection of dataloaders. - # dict, list are supported. - loader_a = batch["loader_a"] - loader_b = batch["loader_b"] - - -If you believe this to be useful, please open a `feature request `_. - - ----- - -********************************* -What are the performance impacts? -********************************* -Fault-tolerant Training was tested on common and worst-case scenarios in order to measure the impact of the internal state tracking on the total training time. 
-On tiny models like the `BoringModel and RandomDataset `_ -which has virtually no data loading and processing overhead, we noticed up to 50% longer training time with fault tolerance enabled. -In this worst-case scenario, fault-tolerant adds an overhead that is noticeable in comparison to the compute time for dataloading itself. -However, for more realistic training workloads where data loading and preprocessing is more expensive, the constant overhead that fault tolerance adds becomes less noticeable or not noticeable at all. -For example, when training with ResNet50 on CIFAR 10 we have observed a 0.5% to 1% increase in training time depending on ``batch size`` or ``number of workers``. - -More detailed benchmarks will be shared in the future. - -.. note:: - - The extra time is coming from several parts: - - - Capturing the iteration count + random states for each sample within each DataLoader workers and pass it through the data_queue - - Extra logic to handle / store the dataloader's states from each batch. - ----- - -************************************ -What happens to my shuffled dataset? -************************************ -If you are using a single map-based dataset by sub-classing :class:`~torch.utils.data.Dataset`, everything should work as expected. - -.. code-block:: python - - from torch.utils.data import Dataset, DataLoader - - - class RandomDataset(Dataset): - def __init__(self, size: int, length: int): - self.len = length - self.data = torch.randn(length, size) - - def __getitem__(self, index): - return self.data[index] - - def __len__(self): - return self.len - ----- - -****************************** -What parts are fault-tolerant? -****************************** -Lightning keeps track of the following state updates during training: - -* Samplers indices and random states across multiple processes and workers: This enables restoring random transforms and batch fetching to the exact state as it was right before the failure. 
-* Optimizers, learning rate schedulers, callbacks, etc. -* Loop progression -* Logging internal states such that metric reductions on epoch end are not getting affected by the failure and model selection can continue as expected. diff --git a/source/clouds/grid_costs.rst b/source/clouds/grid_costs.rst deleted file mode 100644 index 04b1864..0000000 --- a/source/clouds/grid_costs.rst +++ /dev/null @@ -1,6 +0,0 @@ -**** -Cost -**** -Lightning (via `lightning-grid `_) provides access to cloud machines to the community for free. However, you must buy credits on `lightning-grid `_ which are used to pay the cloud providers on your behalf. - -If you want to run on your own AWS account and pay the cloud provider directly, please contact our onprem team: ``_ diff --git a/source/clouds/run_advanced.rst b/source/clouds/run_advanced.rst deleted file mode 100644 index 3418dee..0000000 --- a/source/clouds/run_advanced.rst +++ /dev/null @@ -1,130 +0,0 @@ -:orphan: - -.. _grid_cloud_advanced: - -############################# -Train on the cloud (advanced) -############################# -**Audience**: Anyone looking to train a model on the cloud in the background - ----- - -**************************** -What is background training? -**************************** -Background training lets you train models in the background without you needing to interact with the machine. As the model trains you can monitor its progress via Tensorboard or an experiment manager of your choice. - ----- - -************************* -0: Install lightning-grid -************************* -First, navigate to https://platform.grid.ai to create a free account. - -Next, install lightning-grid and log in - -.. code:: bash - - pip install lightning-grid - grid login - ----- - -******************* -1: Create a dataset -******************* -Create a datastore which optimizes your datasets for training at scale on the cloud. - -First, let's download a dummy dataset we created. - -..
code:: bash - - # download - curl https://pl-flash-data.s3.amazonaws.com/cifar5.zip -o cifar5.zip - - # unzip - unzip cifar5.zip - -Now create the datastore - -.. code:: bash - - grid datastore create cifar5/ --name cifar5 - -Now your dataset is ready to be used for training on the cloud! - -.. note:: In some *research* workflows, your model script ALSO downloads the dataset. If the dataset is only a few GBs this is fine. Otherwise we recommend you create a Datastore. - ----- - -************************** -2: Choose the model to run -************************** -You can run any python script in the background. For this example, we'll use a simple classifier: - -Clone the code to your machine: - -.. code:: bash - - git clone https://github.com/williamFalcon/cifar5-simple.git - - -.. note:: Code repositories can be as complicated as needed. This is just a simple demo. - ----- - -******************* -3: Run on the cloud -******************* -To run this model on the cloud, use the **grid run** command which has two parts: - -.. code:: bash - - grid run [run args] file.py [file args] - -To attach the datastore **cifar5** to the **cifar5.py** file use the following command: - -.. code:: bash - - # command | the datastore to use | the model | argument to the model - grid run --datastore_name cifar5 cifar5.py --data_dir /datastores/cifar5 - ----- - -********************* -4: Monitor and manage -********************* -Now that your model is running in the background you can monitor and manage it `here `_. - -You can also monitor its progress on the command line: - -.. code:: bash - - grid status - ----- - -********** -Next Steps -********** -Here are the recommended next steps depending on your workflow. - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Run many models at once - :description: Learn how to run many models at once using sweeps. - :col_css: col-md-12 - :button_link: session_intermediate.html - :height: 150 - :tag: basic - -.. raw:: html - -
-
`_. - -You can also monitor its progress on the commandline: - -.. code:: bash - - grid status - ----- - -.. include:: grid_costs.rst - ----- - -********** -Next Steps -********** -Here are the recommended next steps depending on your workflow. - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Run many models at once - :description: Learn how to find the best performing model by running multiple models at once using a sweep. - :col_css: col-md-4 - :button_link: run_intermediate.html - :height: 150 - :tag: basic - -.. raw:: html - -
-
` for more information. - ----- - -*********************************** -Run on your own cloud (hassle free) -*********************************** -Cluster training can get complicated once you start doing multi-node training, fault-tolerant training or sweeps. -If you'd prefer to not deal with any of the hassles of running on your own cloud environments, lightning-grid enables University and Enterprise customers to run on the cloud with their own credentials or even onprem. - -These are some of the benefits of running via lightning-grid: - -- create datasets optimized for scale -- fully configurable on-prem deployment -- SOC-2 compliance (in-progress) (ETA Q3 2022) -- micro cost optimizations everywhere (which add up) -- built-in fault tolerance -- enabled collaboration for teams and enterprises - -Contact our sales support engineering team so we can help you set up Grid with your own cloud credentials. - -Email us to connect with your own cloud account: - -``_. diff --git a/source/clouds/run_intermediate.rst b/source/clouds/run_intermediate.rst deleted file mode 100644 index dad2edf..0000000 --- a/source/clouds/run_intermediate.rst +++ /dev/null @@ -1,229 +0,0 @@ -:orphan: - -.. _grid_cloud_run_intermediate: - -################################# -Train on the cloud (intermediate) -################################# -**Audience**: User looking to run many models at once - ----- - -**************** -What is a sweep? -**************** -A sweep is the term given to running the same model multiple times with different hyperparameters to find the one that performs the best (according to your definition of performance). - -Let's say I have a python script that trains a Lightning model to classify images. We run this file like so: - -.. code:: bash - - grid run file.py --batch_size 8 - -With such a model, I would be interested in knowing how it performs with different batch sizes. In this case, I'm going to train many versions of this model. - -..
code:: bash - - # run 4 models in parallel - grid run file.py --batch_size 8 - grid run file.py --batch_size 16 - grid run file.py --batch_size 32 - grid run file.py --batch_size 64 - -Now I can see how my model performs according to the layers and based on time and cost I can pick my "best" model: - -.. list-table:: Training speed vs cost - :widths: 10 40 15 15 - :header-rows: 1 - - * - Batch size - - classification accuracy (%) - - training time - - cost - * - 8 - - 0.80 - - 5 minutes - - $0.15 - * - 16 - - 0.85 - - 10 minutes - - $0.30 - * - 32 - - 0.90 - - 30 minutes - - $0.50 - * - 64 - - 0.95 - - 60 minutes - - $1.01 - ----- - -************* -Start a Sweep -************* -First, recall that in the `previous tutorial `_ we ran a single model using this command: - -.. code:: bash - - grid run --datastore_name cifar5 cifar5.py --data_dir /datastores/cifar5 - -Now we're going to run that same model 4 different times each with a different number of layers: - -.. code:: bash - - grid run --datastore_name cifar5 cifar5.py --data_dir /datastores/cifar5 --batch_size 8 - grid run --datastore_name cifar5 cifar5.py --data_dir /datastores/cifar5 --batch_size 16 - grid run --datastore_name cifar5 cifar5.py --data_dir /datastores/cifar5 --batch_size 32 - grid run --datastore_name cifar5 cifar5.py --data_dir /datastores/cifar5 --batch_size 64 - -Grid has a special syntax based on python that gives you shortcuts for sweeps. The shortcut for the above commands is: - -.. code:: bash - - grid run --datastore_name cifar5 cifar5.py --data_dir /datastores/cifar5 --batch_size "[8, 16, 32, 64]" - ----- - -**************** -Syntax Shortcuts -**************** - -List -==== - -.. code:: bash - - grid run file.py --batch_size "[8, 16, 32, 64]" - -equivalent to: - -.. code:: bash - - grid run file.py --batch_size 8 - grid run file.py --batch_size 16 - grid run file.py --batch_size 32 - grid run file.py --batch_size 64 - ----- - -Range -===== - -.. 
code:: bash - - grid run file.py --batch_size "range(1, 10, 2)" - -equivalent to: - -.. code:: bash - - grid run file.py --batch_size 1 - grid run file.py --batch_size 3 - grid run file.py --batch_size 5 - grid run file.py --batch_size 7 - grid run file.py --batch_size 9 - ----- - -String list -=========== - -.. code:: bash - - grid run file.py --model_backbone "['resnet18', 'transformer', 'resnet50']" - -equivalent to: - -.. code:: bash - - grid run file.py --model_backbone 'resnet18' - grid run file.py --model_backbone 'transformer' - grid run file.py --model_backbone 'resnet50' - ----- - -Sampling -======== - -.. code:: bash - - grid run file.py --learning_rate "uniform(1e-5, 1e-1, 3)" - -equivalent to: - -.. code:: bash - - grid run file.py --learning_rate 0.03977392 - grid run file.py --learning_rate 0.04835479 - grid run file.py --learning_rate 0.05200016 - ----- - -**************** -Sweep strategies -**************** -Models often have dozens of hyperparameters. We usually don't run all combinations because it would be too prohibitive. Grid supports two strategies: - ----- - -Grid search -=========== -Grid search is a common approach that tries all combinations of hyperparameters. Grid will automatically compute combinations when it detects special syntax: - -.. code:: bash - - grid run file.py --batch_size "[1, 2]" --layers "[3, 5]" - -is equivalent to: - -.. code:: bash - - grid run file.py --batch_size 1 --layers 3 - grid run file.py --batch_size 2 --layers 3 - grid run file.py --batch_size 1 --layers 5 - grid run file.py --batch_size 2 --layers 5 - ----- - -Random search -============= -With random search, we choose only a subset of hyperparameters. The larger the number of trials (*num_trials*) the more probable we'll find a great performing model without needing to try all possible combinations. - -..
code:: bash - - grid run --strategy random_search --num_trials 2 file.py --batch_size "[1, 2]" --layers "[3, 5]" - -the above command generates the 4 combinations and runs only 2 at random - -.. code:: bash - - grid run file.py --batch_size 2 --layers 3 - grid run file.py --batch_size 1 --layers 5 - ----- - -********** -Next Steps -********** -Here are the recommended next steps depending on your workflow. - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Run with your own cloud credentials - :description: Learn how to use Grid products with your Company or University cloud account. - :col_css: col-md-4 - :button_link: run_expert.html - :height: 180 - :tag: expert - -.. raw:: html - -
-
`_ to create a free account, then start a new Grid Session. - -A Grid Session is an interactive machine with 1-16 GPUs per machine. - -.. image:: https://docs.grid.ai/assets/images/new-session-3c58be3fd64ffabcdeb7b52516e0782e.gif - :alt: Start a Grid Session in a few seconds - ----- - -************************* -Open the Jupyter Notebook -************************* -Once the Session starts, open a Jupyter notebook. - -.. raw:: html - - - ----- - -************************ -Clone and run your model -************************ -On the Jupyter page you can use a Notebook, or to clone your code and run via the CLI. - -.. raw:: html - - - ----- - -.. include:: grid_costs.rst - ----- - -********** -Next Steps -********** -Here are the recommended next steps depending on your workflow. - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Run a model in the background - :description: Learn to run a model in the background - :col_css: col-md-6 - :button_link: run_basic.html - :height: 180 - :tag: basic - -.. displayitem:: - :header: Run with your own cloud credentials - :description: Learn how to use Grid products on your Company or University private cloud account. - :col_css: col-md-6 - :button_link: run_expert.html - :height: 180 - :tag: expert - -.. raw:: html - -
-
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Basic - :description: Learn to save and load checkpoints - :col_css: col-md-3 - :button_link: checkpointing_basic.html - :height: 150 - :tag: basic - -.. displayitem:: - :header: Intermediate - :description: Customize checkpointing behavior - :col_css: col-md-3 - :button_link: checkpointing_intermediate.html - :height: 150 - :tag: intermediate - -.. displayitem:: - :header: Advanced - :description: Enable cloud-based checkpointing and composable checkpoints. - :col_css: col-md-3 - :button_link: checkpointing_advanced.html - :height: 150 - :tag: advanced - -.. displayitem:: - :header: Expert - :description: Customize checkpointing for custom distributed strategies and accelerators. - :col_css: col-md-3 - :button_link: checkpointing_expert.html - :height: 150 - :tag: expert - -.. raw:: html - -
-
- ----- - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: ModelCheckpoint API - :description: Dig into the ModelCheckpoint API - :col_css: col-md-4 - :button_link: ../api/pytorch_lightning.callbacks.ModelCheckpoint.html - :height: 150 - -.. raw:: html - -
-
diff --git a/source/common/checkpointing_expert.rst b/source/common/checkpointing_expert.rst deleted file mode 100644 index c1859d6..0000000 --- a/source/common/checkpointing_expert.rst +++ /dev/null @@ -1,89 +0,0 @@ -:orphan: - -.. _checkpointing_expert: - -###################### -Checkpointing (expert) -###################### - -TODO: I don't understand this... - -*********************** -Customize Checkpointing -*********************** - -.. warning:: - - The Checkpoint IO API is experimental and subject to change. - - -Lightning supports modifying the checkpointing save/load functionality through the ``CheckpointIO``. This encapsulates the save/load logic -that is managed by the ``Strategy``. ``CheckpointIO`` is different from :meth:`~pytorch_lightning.core.hooks.CheckpointHooks.on_save_checkpoint` -and :meth:`~pytorch_lightning.core.hooks.CheckpointHooks.on_load_checkpoint` methods as it determines how the checkpoint is saved/loaded to storage rather than -what's saved in the checkpoint. - - -****************************** -Built-in Checkpoint IO Plugins -****************************** - -.. list-table:: Built-in Checkpoint IO Plugins - :widths: 25 75 - :header-rows: 1 - - * - Plugin - - Description - * - :class:`~pytorch_lightning.plugins.io.TorchCheckpointIO` - - CheckpointIO that utilizes :func:`torch.save` and :func:`torch.load` to save and load checkpoints - respectively, common for most use cases. - * - :class:`~pytorch_lightning.plugins.io.XLACheckpointIO` - - CheckpointIO that utilizes :func:`xm.save` to save checkpoints for TPU training strategies. - - -*************************** -Custom Checkpoint IO Plugin -*************************** - -``CheckpointIO`` can be extended to include your custom save/load functionality to and from a path. The ``CheckpointIO`` object can be passed to either a ``Trainer`` directly or a ``Strategy`` as shown below: - -.. 
code-block:: python - - from pytorch_lightning import Trainer - from pytorch_lightning.callbacks import ModelCheckpoint - from pytorch_lightning.plugins import CheckpointIO - from pytorch_lightning.strategies import SingleDeviceStrategy - - - class CustomCheckpointIO(CheckpointIO): - def save_checkpoint(self, checkpoint, path, storage_options=None): - ... - - def load_checkpoint(self, path, storage_options=None): - ... - - def remove_checkpoint(self, path): - ... - - - custom_checkpoint_io = CustomCheckpointIO() - - # Either pass into the Trainer object - model = MyModel() - trainer = Trainer( - plugins=[custom_checkpoint_io], - callbacks=ModelCheckpoint(save_last=True), - ) - trainer.fit(model) - - # or pass into Strategy - model = MyModel() - device = torch.device("cpu") - trainer = Trainer( - strategy=SingleDeviceStrategy(device, checkpoint_io=custom_checkpoint_io), - callbacks=ModelCheckpoint(save_last=True), - ) - trainer.fit(model) - -.. note:: - - Some ``TrainingTypePlugins`` like ``DeepSpeedStrategy`` do not support custom ``CheckpointIO`` as checkpointing logic is not modifiable. diff --git a/source/common/early_stopping.rst b/source/common/early_stopping.rst deleted file mode 100644 index 593106f..0000000 --- a/source/common/early_stopping.rst +++ /dev/null @@ -1,99 +0,0 @@ -.. testsetup:: * - - from pytorch_lightning.callbacks.early_stopping import EarlyStopping - -.. _early_stopping: - - -############## -Early Stopping -############## - -.. raw:: html - - - - -*********************** -Stopping an Epoch Early -*********************** - -You can stop and skip the rest of the current epoch early by overriding :meth:`~pytorch_lightning.core.hooks.ModelHooks.on_train_batch_start` to return ``-1`` when some condition is met. - -If you do this repeatedly, for every epoch you had originally requested, then this will stop your entire training. 
- - -********************** -EarlyStopping Callback -********************** - -The :class:`~pytorch_lightning.callbacks.early_stopping.EarlyStopping` callback can be used to monitor a metric and stop the training when no improvement is observed. - -To enable it: - -- Import the :class:`~pytorch_lightning.callbacks.early_stopping.EarlyStopping` callback. -- Log the metric you want to monitor using the :meth:`~pytorch_lightning.core.lightning.LightningModule.log` method. -- Init the callback, and set ``monitor`` to the logged metric of your choice. -- Set the ``mode`` based on whether the monitored metric should be minimized (``"min"``) or maximized (``"max"``). -- Pass the :class:`~pytorch_lightning.callbacks.early_stopping.EarlyStopping` callback to the :class:`~pytorch_lightning.trainer.trainer.Trainer` ``callbacks`` flag. - -.. code-block:: python - - from pytorch_lightning.callbacks.early_stopping import EarlyStopping - - - class LitModel(LightningModule): - def validation_step(self, batch, batch_idx): - loss = ... - self.log("val_loss", loss) - - - model = LitModel() - trainer = Trainer(callbacks=[EarlyStopping(monitor="val_loss", mode="min")]) - trainer.fit(model) - -You can customize the callback's behaviour by changing its parameters. - -.. testcode:: - - early_stop_callback = EarlyStopping(monitor="val_accuracy", min_delta=0.00, patience=3, verbose=False, mode="max") - trainer = Trainer(callbacks=[early_stop_callback]) - - -Additional parameters that stop training at extreme points: - -- ``stopping_threshold``: Stops training immediately once the monitored quantity reaches this threshold. - It is useful when we know that going beyond a certain optimal value does not further benefit us. -- ``divergence_threshold``: Stops training as soon as the monitored quantity becomes worse than this threshold. - When reaching a value this bad, we believe the model cannot recover anymore, and it is better to stop early and run with different initial conditions.
-- ``check_finite``: When turned on, it stops training if the monitored metric becomes NaN or infinite. -- ``check_on_train_epoch_end``: When turned on, it checks the metric at the end of a training epoch. Use this only when you are monitoring any metric logged within - training-specific hooks on epoch-level. - - -In case you need early stopping in a different part of training, subclass :class:`~pytorch_lightning.callbacks.early_stopping.EarlyStopping` -and change where it is called: - -.. testcode:: - - class MyEarlyStopping(EarlyStopping): - def on_validation_end(self, trainer, pl_module): - # override this to disable early stopping at the end of val loop - pass - - def on_train_end(self, trainer, pl_module): - # instead, do it at the end of training loop - self._run_early_stopping_check(trainer) - -.. note:: - The :class:`~pytorch_lightning.callbacks.early_stopping.EarlyStopping` callback runs - at the end of every validation epoch by default. However, the frequency of validation - can be modified by setting various parameters in the :class:`~pytorch_lightning.trainer.trainer.Trainer`, - for example :paramref:`~pytorch_lightning.trainer.trainer.Trainer.check_val_every_n_epoch` - and :paramref:`~pytorch_lightning.trainer.trainer.Trainer.val_check_interval`. - It must be noted that the ``patience`` parameter counts the number of - validation checks with no improvement, and not the number of training epochs. - Therefore, with parameters ``check_val_every_n_epoch=10`` and ``patience=3``, the trainer - will perform at least 40 training epochs before being stopped. diff --git a/source/common/gradient_accumulation.rst b/source/common/gradient_accumulation.rst deleted file mode 100644 index c65e75e..0000000 --- a/source/common/gradient_accumulation.rst +++ /dev/null @@ -1,43 +0,0 @@ -Accumulated gradients run K small batches of size ``N`` before doing a backward pass. The effect is a large effective batch size of size ``KxN``, where ``N`` is the batch size. 
-Internally, it doesn't stack up the batches and do a single forward pass; rather, it accumulates the gradients for K batches and then does an ``optimizer.step``, so that the -effective batch size is increased but there is no memory overhead. - -.. warning:: - - When using distributed training, e.g. DDP, with, let's say, ``P`` devices, each device accumulates independently, i.e. it stores the gradients - after each ``loss.backward()`` and doesn't sync the gradients across the devices until we call ``optimizer.step()``. So for each accumulation - step, the effective batch size on each device will remain ``N*K``, but right before the ``optimizer.step()``, the gradient sync will make the effective - batch size ``P*N*K``. For DP, since the batch is split across devices, the final effective batch size will be ``N*K``. - -.. seealso:: :class:`~pytorch_lightning.trainer.trainer.Trainer` - -.. testcode:: - - # DEFAULT (ie: no accumulated grads) - trainer = Trainer(accumulate_grad_batches=1) - - # Accumulate gradients for 7 batches - trainer = Trainer(accumulate_grad_batches=7) - -You can set different values for it at different epochs by passing a dictionary, where the key represents the epoch at which the value for gradient accumulation -should be updated. - -.. testcode:: - - # till 5th epoch, it will accumulate every 8 batches. From 5th epoch - # till 9th epoch it will accumulate every 4 batches and after that no accumulation - # will happen. Note that you need to use zero-indexed epoch keys here - trainer = Trainer(accumulate_grad_batches={0: 8, 4: 4, 8: 1}) - -Or, you can create a custom :class:`~pytorch_lightning.callbacks.gradient_accumulation_scheduler.GradientAccumulationScheduler` - -.. testcode:: - - from pytorch_lightning.callbacks import GradientAccumulationScheduler - - - # till 5th epoch, it will accumulate every 8 batches. From 5th epoch - # till 9th epoch it will accumulate every 4 batches and after that no accumulation - # will happen.
Note that you need to use zero-indexed epoch keys here - accumulator = GradientAccumulationScheduler(scheduling={0: 8, 4: 4, 8: 1}) - trainer = Trainer(callbacks=accumulator) diff --git a/source/common/hyperparameters.rst b/source/common/hyperparameters.rst deleted file mode 100644 index 9103100..0000000 --- a/source/common/hyperparameters.rst +++ /dev/null @@ -1,279 +0,0 @@ -.. testsetup:: * - - from argparse import ArgumentParser, Namespace - - sys.argv = ["foo"] - -Configure hyperparameters from the CLI --------------------------------------- - -Lightning has utilities to interact seamlessly with the command line ``ArgumentParser`` -and plays well with the hyperparameter optimization framework of your choice. - ----------- - -ArgumentParser -^^^^^^^^^^^^^^ -Lightning is designed to augment a lot of the functionality of the built-in Python ArgumentParser - -.. testcode:: - - from argparse import ArgumentParser - - parser = ArgumentParser() - parser.add_argument("--layer_1_dim", type=int, default=128) - args = parser.parse_args() - -This allows you to call your program like so: - -.. code-block:: bash - - python trainer.py --layer_1_dim 64 - ----------- - -Argparser Best Practices -^^^^^^^^^^^^^^^^^^^^^^^^ -It is best practice to layer your arguments in three sections. - -1. Trainer args (``accelerator``, ``devices``, ``num_nodes``, etc...) -2. Model specific arguments (``layer_dim``, ``num_layers``, ``learning_rate``, etc...) -3. Program arguments (``data_path``, ``cluster_email``, etc...) - -| - -We can do this as follows. First, in your ``LightningModule``, define the arguments -specific to that module. Remember that data splits or data paths may also be specific to -a module (i.e.: if your project has a model that trains on Imagenet and another on CIFAR-10). - -.. 
testcode:: - - class LitModel(LightningModule): - @staticmethod - def add_model_specific_args(parent_parser): - parser = parent_parser.add_argument_group("LitModel") - parser.add_argument("--encoder_layers", type=int, default=12) - parser.add_argument("--data_path", type=str, default="/some/path") - return parent_parser - -Now in your main trainer file, add the ``Trainer`` args, the program args, and the model args - -.. testcode:: - - # ---------------- - # trainer_main.py - # ---------------- - from argparse import ArgumentParser - - parser = ArgumentParser() - - # add PROGRAM level args - parser.add_argument("--conda_env", type=str, default="some_name") - parser.add_argument("--notification_email", type=str, default="will@email.com") - - # add model specific args - parser = LitModel.add_model_specific_args(parser) - - # add all the available trainer options to argparse - # ie: now --accelerator --devices --num_nodes ... --fast_dev_run all work in the cli - parser = Trainer.add_argparse_args(parser) - - args = parser.parse_args() - -Now you can run your program like so: - -.. code-block:: bash - - python trainer_main.py --accelerator 'gpu' --devices 2 --num_nodes 2 --conda_env 'my_env' --encoder_layers 12 - -Finally, make sure to start the training like so: - -.. code-block:: python - - # init the trainer like this - trainer = Trainer.from_argparse_args(args, early_stopping_callback=...) - - # NOT like this - trainer = Trainer(accelerator=hparams.accelerator, devices=hparams.devices, ...) - - # init the model with Namespace directly - model = LitModel(args) - - # or init the model with all the key-value pairs - dict_args = vars(args) - model = LitModel(**dict_args) - ----------- - -LightningModule hyperparameters -^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ -Oftentimes we train many versions of a model.
You might share that model or come back to it a few months later -at which point it is very useful to know how that model was trained (i.e.: what learning rate, neural network, etc...). - -Lightning has a standardized way of saving the information for you in checkpoints and YAML files. The goal here is to -improve readability and reproducibility. - -save_hyperparameters -"""""""""""""""""""" - -Use :meth:`~pytorch_lightning.core.lightning.LightningModule.save_hyperparameters` within your -:class:`~pytorch_lightning.core.lightning.LightningModule`'s ``__init__`` method. -It will enable Lightning to store all the provided arguments under the ``self.hparams`` attribute. -These hyperparameters will also be stored within the model checkpoint, which simplifies model re-instantiation after training. - -.. code-block:: python - - class LitMNIST(LightningModule): - def __init__(self, layer_1_dim=128, learning_rate=1e-2): - super().__init__() - # call this to save (layer_1_dim=128, learning_rate=1e-2) to the checkpoint - self.save_hyperparameters() - - # equivalent - self.save_hyperparameters("layer_1_dim", "learning_rate") - - # Now possible to access layer_1_dim from hparams - self.hparams.layer_1_dim - - -In addition, loggers that support it will automatically log the contents of ``self.hparams``. - -Excluding hyperparameters -""""""""""""""""""""""""" - -By default, every parameter of the ``__init__`` method will be considered a hyperparameter to the LightningModule. -However, sometimes some parameters need to be excluded from saving, for example when they are not serializable. -Those parameters should be provided back when reloading the LightningModule. -In this case, exclude them explicitly: - -.. 
code-block:: python - - class LitMNIST(LightningModule): - def __init__(self, loss_fx, generator_network, layer_1_dim=128): - super().__init__() - self.layer_1_dim = layer_1_dim - self.loss_fx = loss_fx - - # call this to save only (layer_1_dim=128) to the checkpoint - self.save_hyperparameters("layer_1_dim") - - # equivalent - self.save_hyperparameters(ignore=["loss_fx", "generator_network"]) - - -load_from_checkpoint -"""""""""""""""""""" - -LightningModules that have hyperparameters automatically saved with :meth:`~pytorch_lightning.core.lightning.LightningModule.save_hyperparameters` -can conveniently be loaded and instantiated directly from a checkpoint with :meth:`~pytorch_lightning.core.lightning.LightningModule.load_from_checkpoint`: - -.. code-block:: python - - # to load specify the other args - model = LitMNIST.load_from_checkpoint(PATH, loss_fx=torch.nn.SomeOtherLoss, generator_network=MyGenerator()) - - -If parameters were excluded, they need to be provided at the time of loading: - -.. code-block:: python - - # the excluded parameters were `loss_fx` and `generator_network` - model = LitMNIST.load_from_checkpoint(PATH, loss_fx=torch.nn.SomeOtherLoss, generator_network=MyGenerator()) - - ----------- - -Trainer args -^^^^^^^^^^^^ -To recap, add ALL possible trainer flags to the argparser and init the ``Trainer`` this way - -.. code-block:: python - - parser = ArgumentParser() - parser = Trainer.add_argparse_args(parser) - hparams = parser.parse_args() - - trainer = Trainer.from_argparse_args(hparams) - - # or if you need to pass in callbacks - trainer = Trainer.from_argparse_args(hparams, enable_checkpointing=..., callbacks=[...]) - ----------- - -Multiple Lightning Modules -^^^^^^^^^^^^^^^^^^^^^^^^^^ - -We often have multiple Lightning Modules where each one has different arguments. Instead of -polluting the ``main.py`` file, the ``LightningModule`` lets you define arguments for each one. - -.. 
testcode:: - - class LitMNIST(LightningModule): - def __init__(self, layer_1_dim, **kwargs): - super().__init__() - self.layer_1 = nn.Linear(28 * 28, layer_1_dim) - - @staticmethod - def add_model_specific_args(parent_parser): - parser = parent_parser.add_argument_group("LitMNIST") - parser.add_argument("--layer_1_dim", type=int, default=128) - return parent_parser - -.. testcode:: - - class GoodGAN(LightningModule): - def __init__(self, encoder_layers, **kwargs): - super().__init__() - self.encoder = Encoder(layers=encoder_layers) - - @staticmethod - def add_model_specific_args(parent_parser): - parser = parent_parser.add_argument_group("GoodGAN") - parser.add_argument("--encoder_layers", type=int, default=12) - return parent_parser - - -Now we can allow each model to inject the arguments it needs in the ``main.py`` - -.. code-block:: python - - def main(args): - dict_args = vars(args) - - # pick model - if args.model_name == "gan": - model = GoodGAN(**dict_args) - elif args.model_name == "mnist": - model = LitMNIST(**dict_args) - - trainer = Trainer.from_argparse_args(args) - trainer.fit(model) - - - if __name__ == "__main__": - parser = ArgumentParser() - parser = Trainer.add_argparse_args(parser) - - # figure out which model to use - parser.add_argument("--model_name", type=str, default="gan", help="gan or mnist") - - # THIS LINE IS KEY TO PULL THE MODEL NAME - temp_args, _ = parser.parse_known_args() - - # let the model add what it wants - if temp_args.model_name == "gan": - parser = GoodGAN.add_model_specific_args(parser) - elif temp_args.model_name == "mnist": - parser = LitMNIST.add_model_specific_args(parser) - - args = parser.parse_args() - - # train - main(args) - -and now we can train MNIST or the GAN using the command line interface! - -.. 
code-block:: bash - - $ python main.py --model_name gan --encoder_layers 24 - $ python main.py --model_name mnist --layer_1_dim 128 diff --git a/source/common/lightning_module.rst b/source/common/lightning_module.rst deleted file mode 100644 index 19bb9b0..0000000 --- a/source/common/lightning_module.rst +++ /dev/null @@ -1,1664 +0,0 @@ -.. role:: hidden - :class: hidden-section - -.. _lightning_module: - -############### -LightningModule -############### - -A :class:`~LightningModule` organizes your PyTorch code into 6 sections: - -- Computations (init). -- Train Loop (training_step) -- Validation Loop (validation_step) -- Test Loop (test_step) -- Prediction Loop (predict_step) -- Optimizers and LR Schedulers (configure_optimizers) - -| - -.. raw:: html - - - -| - -Notice a few things. - -1. It is the SAME code. -2. The PyTorch code IS NOT abstracted - just organized. -3. All the other code that's not in the :class:`~LightningModule` - has been automated for you by the Trainer. - -| - - .. code-block:: python - - net = Net() - trainer = Trainer() - trainer.fit(net) - -4. There are no ``.cuda()`` or ``.to(device)`` calls required. Lightning does these for you. - -| - - .. code-block:: python - - # don't do in Lightning - x = torch.Tensor(2, 3) - x = x.cuda() - x = x.to(device) - - # do this instead - x = x # leave it alone! - - # or to init a new tensor - new_x = torch.Tensor(2, 3) - new_x = new_x.type_as(x) - -5. When running under a distributed strategy, Lightning handles the distributed sampler for you by default. - -| - - .. code-block:: python - - # Don't do in Lightning... - data = MNIST(...) - sampler = DistributedSampler(data) - DataLoader(data, sampler=sampler) - - # do this instead - data = MNIST(...) - DataLoader(data) - -6. A :class:`~LightningModule` is a :class:`torch.nn.Module` but with added functionality. Use it as such! - -| - - .. 
code-block:: python - - net = Net.load_from_checkpoint(PATH) - net.freeze() - out = net(x) - -Thus, to use Lightning, you just need to organize your code which takes about 30 minutes, -(and let's be real, you probably should do anyway). - ------------- - -*************** -Starter Example -*************** - -Here are the only required methods. - -.. code-block:: python - - import pytorch_lightning as pl - import torch.nn as nn - import torch.nn.functional as F - - - class LitModel(pl.LightningModule): - def __init__(self): - super().__init__() - self.l1 = nn.Linear(28 * 28, 10) - - def forward(self, x): - return torch.relu(self.l1(x.view(x.size(0), -1))) - - def training_step(self, batch, batch_idx): - x, y = batch - y_hat = self(x) - loss = F.cross_entropy(y_hat, y) - return loss - - def configure_optimizers(self): - return torch.optim.Adam(self.parameters(), lr=0.02) - -Which you can train by doing: - -.. code-block:: python - - train_loader = DataLoader(MNIST(os.getcwd(), download=True, transform=transforms.ToTensor())) - trainer = pl.Trainer(max_epochs=1) - model = LitModel() - - trainer.fit(model, train_dataloaders=train_loader) - -The LightningModule has many convenience methods, but the core ones you need to know about are: - -.. list-table:: - :widths: 50 50 - :header-rows: 1 - - * - Name - - Description - * - init - - Define computations here - * - forward - - Use for inference only (separate from training_step) - * - training_step - - the complete training loop - * - validation_step - - the complete validation loop - * - test_step - - the complete test loop - * - predict_step - - the complete prediction loop - * - configure_optimizers - - define optimizers and LR schedulers - ----------- - -******** -Training -******** - -Training Loop -============= - -To activate the training loop, override the :meth:`~pytorch_lightning.core.lightning.LightningModule.training_step` method. - -.. 
code-block:: python - - class LitClassifier(pl.LightningModule): - def __init__(self, model): - super().__init__() - self.model = model - - def training_step(self, batch, batch_idx): - x, y = batch - y_hat = self.model(x) - loss = F.cross_entropy(y_hat, y) - return loss - -Under the hood, Lightning does the following (pseudocode): - -.. code-block:: python - - # put model in train mode and enable gradient calculation - model.train() - torch.set_grad_enabled(True) - - outs = [] - for batch_idx, batch in enumerate(train_dataloader): - loss = training_step(batch, batch_idx) - outs.append(loss.detach()) - - # clear gradients - optimizer.zero_grad() - - # backward - loss.backward() - - # update parameters - optimizer.step() - - -Train Epoch-level Metrics -========================= - -If you want to calculate epoch-level metrics and log them, use :meth:`~pytorch_lightning.core.lightning.LightningModule.log`. - -.. code-block:: python - - def training_step(self, batch, batch_idx): - x, y = batch - y_hat = self.model(x) - loss = F.cross_entropy(y_hat, y) - - # logs metrics for each training_step, - # and the average across the epoch, to the progress bar and logger - self.log("train_loss", loss, on_step=True, on_epoch=True, prog_bar=True, logger=True) - return loss - -The :meth:`~pytorch_lightning.core.lightning.LightningModule.log` object automatically reduces the -requested metrics across a complete epoch and devices. Here's the pseudocode of what it does under the hood: - -.. 
code-block:: python - - outs = [] - for batch_idx, batch in enumerate(train_dataloader): - # forward - loss = training_step(batch, batch_idx) - outs.append(loss) - - # clear gradients - optimizer.zero_grad() - - # backward - loss.backward() - - # update parameters - optimizer.step() - - epoch_metric = torch.mean(torch.stack([x for x in outs])) - -Train Epoch-level Operations -============================ - -If you need to do something with all the outputs of each :meth:`~pytorch_lightning.core.lightning.LightningModule.training_step`, -override the :meth:`~pytorch_lightning.core.lightning.LightningModule.training_epoch_end` method. - -.. code-block:: python - - def training_step(self, batch, batch_idx): - x, y = batch - y_hat = self.model(x) - loss = F.cross_entropy(y_hat, y) - preds = ... - return {"loss": loss, "other_stuff": preds} - - - def training_epoch_end(self, training_step_outputs): - all_preds = torch.stack(training_step_outputs) - ... - -The matching pseudocode is: - -.. code-block:: python - - outs = [] - for batch_idx, batch in enumerate(train_dataloader): - # forward - loss = training_step(batch, batch_idx) - outs.append(loss) - - # clear gradients - optimizer.zero_grad() - - # backward - loss.backward() - - # update parameters - optimizer.step() - - training_epoch_end(outs) - -Training with DataParallel -========================== - -When training using a ``strategy`` that splits data from each batch across GPUs, sometimes you might -need to aggregate them on the main GPU for processing (DP, or DDP2). - -In this case, implement the :meth:`~pytorch_lightning.core.lightning.LightningModule.training_step_end` -method which will have outputs from all the devices and you can accumulate to get the effective results. - -.. code-block:: python - - def training_step(self, batch, batch_idx): - x, y = batch - y_hat = self.model(x) - loss = F.cross_entropy(y_hat, y) - pred = ... 
- return {"loss": loss, "pred": pred} - - - def training_step_end(self, batch_parts): - # predictions from each GPU - predictions = batch_parts["pred"] - # losses from each GPU - losses = batch_parts["loss"] - - gpu_0_prediction = predictions[0] - gpu_1_prediction = predictions[1] - - # do something with both outputs - return (losses[0] + losses[1]) / 2 - - - def training_epoch_end(self, training_step_outputs): - for out in training_step_outputs: - ... - -Here is the Lightning training pseudo-code for DP: - -.. code-block:: python - - outs = [] - for batch_idx, train_batch in enumerate(train_dataloader): - batches = split_batch(train_batch) - dp_outs = [] - for sub_batch in batches: - # 1 - dp_out = training_step(sub_batch, batch_idx) - dp_outs.append(dp_out) - - # 2 - out = training_step_end(dp_outs) - outs.append(out) - - # do something with the outputs for all batches - # 3 - training_epoch_end(outs) - ------------------- - -********** -Validation -********** - -Validation Loop -=============== - -To activate the validation loop while training, override the :meth:`~pytorch_lightning.core.lightning.LightningModule.validation_step` method. - -.. code-block:: python - - class LitModel(pl.LightningModule): - def validation_step(self, batch, batch_idx): - x, y = batch - y_hat = self.model(x) - loss = F.cross_entropy(y_hat, y) - self.log("val_loss", loss) - -Under the hood, Lightning does the following (pseudocode): - -.. code-block:: python - - # ... - for batch_idx, batch in enumerate(train_dataloader): - loss = model.training_step(batch, batch_idx) - loss.backward() - # ... 
- - if validate_at_some_point: - # disable grads + batchnorm + dropout - torch.set_grad_enabled(False) - model.eval() - - # ----------------- VAL LOOP --------------- - for val_batch_idx, val_batch in enumerate(val_dataloader): - val_out = model.validation_step(val_batch, val_batch_idx) - # ----------------- VAL LOOP --------------- - - # enable grads + batchnorm + dropout - torch.set_grad_enabled(True) - model.train() - -You can also run just the validation loop on your validation dataloaders by overriding :meth:`~pytorch_lightning.core.lightning.LightningModule.validation_step` -and calling :meth:`~pytorch_lightning.trainer.trainer.Trainer.validate`. - -.. code-block:: python - - model = Model() - trainer = Trainer() - trainer.validate(model) - -.. note:: - - It is recommended to validate on single device to ensure each sample/batch gets evaluated exactly once. - This is helpful to make sure benchmarking for research papers is done the right way. Otherwise, in a - multi-device setting, samples could occur duplicated when :class:`~torch.utils.data.distributed.DistributedSampler` - is used, for eg. with ``strategy="ddp"``. It replicates some samples on some devices to make sure all devices have - same batch size in case of uneven inputs. - - -Validation Epoch-level Metrics -============================== - -If you need to do something with all the outputs of each :meth:`~pytorch_lightning.core.lightning.LightningModule.validation_step`, -override the :meth:`~pytorch_lightning.core.lightning.LightningModule.validation_epoch_end` method. Note that this method is called before :meth:`~pytorch_lightning.core.lightning.LightningModule.training_epoch_end`. - -.. code-block:: python - - def validation_step(self, batch, batch_idx): - x, y = batch - y_hat = self.model(x) - loss = F.cross_entropy(y_hat, y) - pred = ... - return pred - - - def validation_epoch_end(self, validation_step_outputs): - all_preds = torch.stack(validation_step_outputs) - ... 
- -Validating with DataParallel -============================ - -When training using a ``strategy`` that splits data from each batch across GPUs, sometimes you might -need to aggregate them on the main GPU for processing (DP, or DDP2). - -In this case, implement the :meth:`~pytorch_lightning.core.lightning.LightningModule.validation_step_end` -method which will have outputs from all the devices and you can accumulate to get the effective results. - -.. code-block:: python - - def validation_step(self, batch, batch_idx): - x, y = batch - y_hat = self.model(x) - loss = F.cross_entropy(y_hat, y) - pred = ... - return {"loss": loss, "pred": pred} - - - def validation_step_end(self, batch_parts): - # predictions from each GPU - predictions = batch_parts["pred"] - # losses from each GPU - losses = batch_parts["loss"] - - gpu_0_prediction = predictions[0] - gpu_1_prediction = predictions[1] - - # do something with both outputs - return (losses[0] + losses[1]) / 2 - - - def validation_epoch_end(self, validation_step_outputs): - for out in validation_step_outputs: - ... - -Here is the Lightning validation pseudo-code for DP: - -.. code-block:: python - - outs = [] - for batch in dataloader: - batches = split_batch(batch) - dp_outs = [] - for sub_batch in batches: - # 1 - dp_out = validation_step(sub_batch) - dp_outs.append(dp_out) - - # 2 - out = validation_step_end(dp_outs) - outs.append(out) - - # do something with the outputs for all batches - # 3 - validation_epoch_end(outs) - ----------------- - -******* -Testing -******* - -Test Loop -========= - -The process for enabling a test loop is the same as the process for enabling a validation loop. Please refer to -the section above for details. For this you need to override the :meth:`~pytorch_lightning.core.lightning.LightningModule.test_step` method. - -The only difference is that the test loop is only called when :meth:`~pytorch_lightning.trainer.trainer.Trainer.test` is used. - -.. 
code-block:: python - - model = Model() - trainer = Trainer() - trainer.fit(model) - - # automatically loads the best weights for you - trainer.test(model) - -There are two ways to call ``test()``: - -.. code-block:: python - - # call after training - trainer = Trainer() - trainer.fit(model) - - # automatically auto-loads the best weights from the previous run - trainer.test(dataloaders=test_dataloader) - - # or call with pretrained model - model = MyLightningModule.load_from_checkpoint(PATH) - trainer = Trainer() - trainer.test(model, dataloaders=test_dataloader) - -.. note:: - - It is recommended to validate on single device to ensure each sample/batch gets evaluated exactly once. - This is helpful to make sure benchmarking for research papers is done the right way. Otherwise, in a - multi-device setting, samples could occur duplicated when :class:`~torch.utils.data.distributed.DistributedSampler` - is used, for eg. with ``strategy="ddp"``. It replicates some samples on some devices to make sure all devices have - same batch size in case of uneven inputs. - - ----------- - -********* -Inference -********* - -Prediction Loop -=============== - -By default, the :meth:`~pytorch_lightning.core.lightning.LightningModule.predict_step` method runs the -:meth:`~pytorch_lightning.core.lightning.LightningModule.forward` method. In order to customize this behaviour, -simply override the :meth:`~pytorch_lightning.core.lightning.LightningModule.predict_step` method. - -For the example let's override ``predict_step`` and try out `Monte Carlo Dropout `_: - -.. 
code-block:: python - - class LitMCdropoutModel(pl.LightningModule): - def __init__(self, model, mc_iteration): - super().__init__() - self.model = model - self.dropout = nn.Dropout() - self.mc_iteration = mc_iteration - - def predict_step(self, batch, batch_idx): - # enable Monte Carlo Dropout - self.dropout.train() - - # take average of `self.mc_iteration` iterations - pred = torch.vstack([self.dropout(self.model(x)).unsqueeze(0) for _ in range(self.mc_iteration)]).mean(dim=0) - return pred - -Under the hood, Lightning does the following (pseudocode): - -.. code-block:: python - - # disable grads + batchnorm + dropout - torch.set_grad_enabled(False) - model.eval() - all_preds = [] - - for batch_idx, batch in enumerate(predict_dataloader): - pred = model.predict_step(batch, batch_idx) - all_preds.append(pred) - -There are two ways to call ``predict()``: - -.. code-block:: python - - # call after training - trainer = Trainer() - trainer.fit(model) - - # automatically auto-loads the best weights from the previous run - predictions = trainer.predict(dataloaders=predict_dataloader) - - # or call with pretrained model - model = MyLightningModule.load_from_checkpoint(PATH) - trainer = Trainer() - predictions = trainer.predict(model, dataloaders=test_dataloader) - -Inference in Research -===================== - -If you want to perform inference with the system, you can add a ``forward`` method to the LightningModule. - -.. note:: When using forward, you are responsible to call :func:`~torch.nn.Module.eval` and use the :func:`~torch.no_grad` context manager. - -.. code-block:: python - - class Autoencoder(pl.LightningModule): - def forward(self, x): - return self.decoder(x) - - - model = Autoencoder() - model.eval() - with torch.no_grad(): - reconstruction = model(embedding) - -The advantage of adding a forward is that in complex systems, you can do a much more involved inference procedure, -such as text generation: - -.. 
code-block:: python - - class Seq2Seq(pl.LightningModule): - def forward(self, x): - embeddings = self(x) - hidden_states = self.encoder(embeddings) - for h in hidden_states: - # decode - ... - return decoded - -In the case where you want to scale your inference, you should be using -:meth:`~pytorch_lightning.core.lightning.LightningModule.predict_step`. - -.. code-block:: python - - class Autoencoder(pl.LightningModule): - def forward(self, x): - return self.decoder(x) - - def predict_step(self, batch, batch_idx, dataloader_idx=0): - # this calls forward - return self(batch) - - - data_module = ... - model = Autoencoder() - trainer = Trainer(accelerator="gpu", devices=2) - trainer.predict(model, data_module) - -Inference in Production -======================= - -For cases like production, you might want to iterate different models inside a LightningModule. - -.. code-block:: python - - from torchmetrics.functional import accuracy - - - class ClassificationTask(pl.LightningModule): - def __init__(self, model): - super().__init__() - self.model = model - - def training_step(self, batch, batch_idx): - x, y = batch - y_hat = self.model(x) - loss = F.cross_entropy(y_hat, y) - return loss - - def validation_step(self, batch, batch_idx): - loss, acc = self._shared_eval_step(batch, batch_idx) - metrics = {"val_acc": acc, "val_loss": loss} - self.log_dict(metrics) - return metrics - - def test_step(self, batch, batch_idx): - loss, acc = self._shared_eval_step(batch, batch_idx) - metrics = {"test_acc": acc, "test_loss": loss} - self.log_dict(metrics) - return metrics - - def _shared_eval_step(self, batch, batch_idx): - x, y = batch - y_hat = self.model(x) - loss = F.cross_entropy(y_hat, y) - acc = accuracy(y_hat, y) - return loss, acc - - def predict_step(self, batch, batch_idx, dataloader_idx=0): - x, y = batch - y_hat = self.model(x) - return y_hat - - def configure_optimizers(self): - return torch.optim.Adam(self.model.parameters(), lr=0.02) - -Then pass in any arbitrary 
model to be fit with this task - -.. code-block:: python - - for model in [resnet50(), vgg16(), BidirectionalRNN()]: - task = ClassificationTask(model) - - trainer = Trainer(accelerator="gpu", devices=2) - trainer.fit(task, train_dataloaders=train_dataloader, val_dataloaders=val_dataloader) - -Tasks can be arbitrarily complex such as implementing GAN training, self-supervised or even RL. - -.. code-block:: python - - class GANTask(pl.LightningModule): - def __init__(self, generator, discriminator): - super().__init__() - self.generator = generator - self.discriminator = discriminator - - ... - -When used like this, the model can be separated from the Task and thus used in production without needing to keep it in -a ``LightningModule``. - -The following example shows how you can run inference in the Python runtime: - -.. code-block:: python - - task = ClassificationTask(model) - trainer = Trainer(accelerator="gpu", devices=2) - trainer.fit(task, train_dataloader, val_dataloader) - trainer.save_checkpoint("best_model.ckpt") - - # use model after training or load weights and drop into the production system - model = ClassificationTask.load_from_checkpoint("best_model.ckpt") - x = ... - model.eval() - with torch.no_grad(): - y_hat = model(x) - -Check out :ref:`Inference in Production ` guide to learn about the possible ways to perform inference in production. - - ------------ - - -************* -Child Modules -************* - -.. include:: ../common/child_modules.rst - ------------ - -******************* -LightningModule API -******************* - - -Methods -======= - -all_gather -~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.all_gather - :noindex: - -configure_callbacks -~~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.configure_callbacks - :noindex: - -configure_optimizers -~~~~~~~~~~~~~~~~~~~~ - -.. 
automethod:: pytorch_lightning.core.lightning.LightningModule.configure_optimizers - :noindex: - -forward -~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.forward - :noindex: - -freeze -~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.freeze - :noindex: - -.. _lm-log: - -log -~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.log - :noindex: - -log_dict -~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.log_dict - :noindex: - -lr_schedulers -~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.lr_schedulers - :noindex: - -manual_backward -~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.manual_backward - :noindex: - -optimizers -~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.optimizers - :noindex: - -print -~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.print - :noindex: - -predict_step -~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.predict_step - :noindex: - -save_hyperparameters -~~~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.save_hyperparameters - :noindex: - -toggle_optimizer -~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.toggle_optimizer - :noindex: - -test_step -~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.test_step - :noindex: - -test_step_end -~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.test_step_end - :noindex: - -test_epoch_end -~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.test_epoch_end - :noindex: - -to_onnx -~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.to_onnx - :noindex: - -to_torchscript -~~~~~~~~~~~~~~ - -.. 
automethod:: pytorch_lightning.core.lightning.LightningModule.to_torchscript - :noindex: - -training_step -~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.training_step - :noindex: - -training_step_end -~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.training_step_end - :noindex: - -training_epoch_end -~~~~~~~~~~~~~~~~~~ -.. automethod:: pytorch_lightning.core.lightning.LightningModule.training_epoch_end - :noindex: - -unfreeze -~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.unfreeze - :noindex: - -untoggle_optimizer -~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.untoggle_optimizer - :noindex: - -validation_step -~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.validation_step - :noindex: - -validation_step_end -~~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.validation_step_end - :noindex: - -validation_epoch_end -~~~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.validation_epoch_end - :noindex: - ------------ - -Properties -========== - -These are properties available in a LightningModule. - -current_epoch -~~~~~~~~~~~~~ - -The number of epochs run. - -.. code-block:: python - - def training_step(self, batch, batch_idx): - if self.current_epoch == 0: - ... - -device -~~~~~~ - -The device the module is on. Use it to keep your code device agnostic. - -.. code-block:: python - - def training_step(self, batch, batch_idx): - z = torch.rand(2, 3, device=self.device) - -global_rank -~~~~~~~~~~~ - -The ``global_rank`` is the index of the current process across all nodes and devices. -Lightning will perform some operations such as logging, weight checkpointing only when ``global_rank=0``. You -usually do not need to use this property, but it is useful to know how to access it if needed. - -.. 
code-block:: python - - def training_step(self, batch, batch_idx): - if self.global_rank == 0: - # do something only once across all the nodes - ... - -global_step -~~~~~~~~~~~ - -The number of optimizer steps taken (does not reset each epoch). -This includes multiple optimizers and TBPTT steps (if enabled). - -.. code-block:: python - - def training_step(self, batch, batch_idx): - self.logger.experiment.log_image(..., step=self.global_step) - -hparams -~~~~~~~ - -The arguments passed through ``LightningModule.__init__()`` and saved by calling -:meth:`~pytorch_lightning.core.mixins.hparams_mixin.HyperparametersMixin.save_hyperparameters` could be accessed by the ``hparams`` attribute. - -.. code-block:: python - - def __init__(self, learning_rate): - self.save_hyperparameters() - - - def configure_optimizers(self): - return Adam(self.parameters(), lr=self.hparams.learning_rate) - -logger -~~~~~~ - -The current logger being used (tensorboard or other supported logger) - -.. code-block:: python - - def training_step(self, batch, batch_idx): - # the generic logger (same no matter if tensorboard or other supported logger) - self.logger - - # the particular logger - tensorboard_logger = self.logger.experiment - -loggers -~~~~~~~ - -The list of loggers currently being used by the Trainer. - -.. code-block:: python - - def training_step(self, batch, batch_idx): - # List of Logger objects - loggers = self.loggers - for logger in loggers: - logger.log_metrics({"foo": 1.0}) - -local_rank -~~~~~~~~~~~ - -The ``local_rank`` is the index of the current process across all the devices for the current node. -You usually do not need to use this property, but it is useful to know how to access it if needed. -For example, if using 10 machines (or nodes), the GPU at index 0 on each machine has local_rank = 0. - -.. code-block:: python - - def training_step(self, batch, batch_idx): - if self.local_rank == 0: - # do something only once across each node - ... 
- -precision -~~~~~~~~~ - -The type of precision used: - -.. code-block:: python - - def training_step(self, batch, batch_idx): - if self.precision == 16: - ... - -trainer -~~~~~~~ - -Pointer to the trainer - -.. code-block:: python - - def training_step(self, batch, batch_idx): - max_steps = self.trainer.max_steps - any_flag = self.trainer.any_flag - -prepare_data_per_node -~~~~~~~~~~~~~~~~~~~~~ - -If set to ``True`` will call ``prepare_data()`` on LOCAL_RANK=0 for every node. -If set to ``False`` will only call from NODE_RANK=0, LOCAL_RANK=0. - -.. testcode:: - - class LitModel(LightningModule): - def __init__(self): - super().__init__() - self.prepare_data_per_node = True - -automatic_optimization -~~~~~~~~~~~~~~~~~~~~~~ - -When set to ``False``, Lightning does not automate the optimization process. This means you are responsible for handling -your optimizers. However, we do take care of precision and any accelerators used. - -See :ref:`manual optimization ` for details. - -.. code-block:: python - - def __init__(self): - self.automatic_optimization = False - - - def training_step(self, batch, batch_idx): - opt = self.optimizers(use_pl_optimizer=True) - - loss = ... - opt.zero_grad() - self.manual_backward(loss) - opt.step() - -This is recommended only if using 2+ optimizers AND if you know how to perform the optimization procedure properly. Note -that automatic optimization can still be used with multiple optimizers by relying on the ``optimizer_idx`` parameter. -Manual optimization is most useful for research topics like reinforcement learning, sparse coding, and GAN research. - -.. code-block:: python - - def __init__(self): - self.automatic_optimization = False - - - def training_step(self, batch, batch_idx): - # access your optimizers with use_pl_optimizer=False. Default is True - opt_a, opt_b = self.optimizers(use_pl_optimizer=True) - - gen_loss = ... - opt_a.zero_grad() - self.manual_backward(gen_loss) - opt_a.step() - - disc_loss = ... 
- opt_b.zero_grad() - self.manual_backward(disc_loss) - opt_b.step() - -example_input_array -~~~~~~~~~~~~~~~~~~~ - -Set and access example_input_array, which basically represents a single batch. - -.. code-block:: python - - def __init__(self): - self.example_input_array = ... - self.generator = ... - - - def on_train_epoch_end(self): - # generate some images using the example_input_array - gen_images = self.generator(self.example_input_array) - -truncated_bptt_steps -~~~~~~~~~~~~~~~~~~~~ - -Truncated Backpropagation Through Time (TBPTT) performs backpropagation every k steps of -a much longer sequence. This is made possible by passing training batches -split along the time-dimension into splits of size k to the -``training_step``. In order to keep the same forward propagation behavior, all -hidden states should be kept in-between each time-dimension split. - - -If this is enabled, your batches will automatically get truncated -and the Trainer will apply Truncated Backprop to it. - -(`Williams et al. "An efficient gradient-based algorithm for on-line training of -recurrent network trajectories." -`_) - -`Tutorial `_ - -.. testcode:: python - - from pytorch_lightning import LightningModule - - - class MyModel(LightningModule): - def __init__(self, input_size, hidden_size, num_layers): - super().__init__() - # batch_first has to be set to True - self.lstm = nn.LSTM( - input_size=input_size, - hidden_size=hidden_size, - num_layers=num_layers, - batch_first=True, - ) - - ... - - # Important: This property activates truncated backpropagation through time - # Setting this value to 2 splits the batch into sequences of size 2 - self.truncated_bptt_steps = 2 - - # Truncated back-propagation through time - def training_step(self, batch, batch_idx, hiddens): - x, y = batch - - # the training step must be updated to accept a ``hiddens`` argument - # hiddens are the hiddens from the previous truncated backprop step - out, hiddens = self.lstm(x, hiddens) - - ...
- - return {"loss": ..., "hiddens": hiddens} - -Lightning takes care of splitting your batch along the time-dimension. It is -assumed to be the second dimension of your batches. Therefore, in the -example above, we have set ``batch_first=True``. - -.. code-block:: python - - # we use the second as the time dimension - # (batch, time, ...) - sub_batch = batch[0, 0:t, ...] - -To modify how the batch is split, -override the :meth:`pytorch_lightning.core.lightning.LightningModule.tbptt_split_batch` method: - -.. testcode:: python - - class LitMNIST(LightningModule): - def tbptt_split_batch(self, batch, split_size): - # do your own splitting on the batch - return splits - --------------- - -.. _lightning_hooks: - -Hooks -===== - -This is the pseudocode to describe the structure of :meth:`~pytorch_lightning.trainer.Trainer.fit`. -The inputs and outputs of each function are not represented for simplicity. Please check each function's API reference -for more information. - -.. code-block:: python - - def fit(self): - if global_rank == 0: - # prepare data is called on GLOBAL_ZERO only - prepare_data() - - configure_callbacks() - - with parallel(devices): - # devices can be GPUs, TPUs, ... 
- train_on_device(model) - - - def train_on_device(model): - # called PER DEVICE - on_fit_start() - setup("fit") - configure_optimizers() - - # the sanity check runs here - - on_train_start() - for epoch in epochs: - fit_loop() - on_train_end() - - on_fit_end() - teardown("fit") - - - def fit_loop(): - on_train_epoch_start() - - for batch in train_dataloader(): - on_train_batch_start() - - on_before_batch_transfer() - transfer_batch_to_device() - on_after_batch_transfer() - - training_step() - - on_before_zero_grad() - optimizer_zero_grad() - - on_before_backward() - backward() - on_after_backward() - - on_before_optimizer_step() - configure_gradient_clipping() - optimizer_step() - - on_train_batch_end() - - if should_check_val: - val_loop() - # end training epoch - training_epoch_end() - - on_train_epoch_end() - - - def val_loop(): - on_validation_model_eval() # calls `model.eval()` - torch.set_grad_enabled(False) - - on_validation_start() - on_validation_epoch_start() - - val_outs = [] - for batch_idx, batch in enumerate(val_dataloader()): - on_validation_batch_start(batch, batch_idx) - - batch = on_before_batch_transfer(batch) - batch = transfer_batch_to_device(batch) - batch = on_after_batch_transfer(batch) - - out = validation_step(batch, batch_idx) - - on_validation_batch_end(batch, batch_idx) - val_outs.append(out) - - validation_epoch_end(val_outs) - - on_validation_epoch_end() - on_validation_end() - - # set up for train - on_validation_model_train() # calls `model.train()` - torch.set_grad_enabled(True) - -backward -~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.backward - :noindex: - -on_before_backward -~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_before_backward - :noindex: - -on_after_backward -~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_after_backward - :noindex: - -on_before_zero_grad -~~~~~~~~~~~~~~~~~~~ -.. 
automethod:: pytorch_lightning.core.lightning.LightningModule.on_before_zero_grad - :noindex: - -on_fit_start -~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_fit_start - :noindex: - -on_fit_end -~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_fit_end - :noindex: - - -on_load_checkpoint -~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_load_checkpoint - :noindex: - -on_save_checkpoint -~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_save_checkpoint - :noindex: - -load_from_checkpoint -~~~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.load_from_checkpoint - :noindex: - -on_hpc_save -~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_hpc_save - :noindex: - -on_hpc_load -~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_hpc_load - :noindex: - -on_train_start -~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_train_start - :noindex: - -on_train_end -~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_train_end - :noindex: - -on_validation_start -~~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_validation_start - :noindex: - -on_validation_end -~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_validation_end - :noindex: - -on_test_batch_start -~~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_test_batch_start - :noindex: - -on_test_batch_end -~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_test_batch_end - :noindex: - -on_test_epoch_start -~~~~~~~~~~~~~~~~~~~ - -.. 
automethod:: pytorch_lightning.core.lightning.LightningModule.on_test_epoch_start - :noindex: - -on_test_epoch_end -~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_test_epoch_end - :noindex: - -on_test_start -~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_test_start - :noindex: - -on_test_end -~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_test_end - :noindex: - -on_predict_batch_start -~~~~~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_predict_batch_start - :noindex: - -on_predict_batch_end -~~~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_predict_batch_end - :noindex: - -on_predict_epoch_start -~~~~~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_predict_epoch_start - :noindex: - -on_predict_epoch_end -~~~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_predict_epoch_end - :noindex: - -on_predict_start -~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_predict_start - :noindex: - -on_predict_end -~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_predict_end - :noindex: - -on_train_batch_start -~~~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_train_batch_start - :noindex: - -on_train_batch_end -~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_train_batch_end - :noindex: - -on_train_epoch_start -~~~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_train_epoch_start - :noindex: - -on_train_epoch_end -~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_train_epoch_end - :noindex: - -on_validation_batch_start -~~~~~~~~~~~~~~~~~~~~~~~~~ - -.. 
automethod:: pytorch_lightning.core.lightning.LightningModule.on_validation_batch_start - :noindex: - -on_validation_batch_end -~~~~~~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_validation_batch_end - :noindex: - -on_validation_epoch_start -~~~~~~~~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_validation_epoch_start - :noindex: - -on_validation_epoch_end -~~~~~~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_validation_epoch_end - :noindex: - -on_post_move_to_device -~~~~~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_post_move_to_device - :noindex: - -configure_sharded_model -~~~~~~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.configure_sharded_model - :noindex: - -on_validation_model_eval -~~~~~~~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_validation_model_eval - :noindex: - -on_validation_model_train -~~~~~~~~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_validation_model_train - :noindex: - -on_test_model_eval -~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_test_model_eval - :noindex: - -on_test_model_train -~~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_test_model_train - :noindex: - -on_before_optimizer_step -~~~~~~~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_before_optimizer_step - :noindex: - -configure_gradient_clipping -~~~~~~~~~~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.configure_gradient_clipping - :noindex: - -optimizer_step -~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.optimizer_step - :noindex: - -optimizer_zero_grad -~~~~~~~~~~~~~~~~~~~ - -.. 
automethod:: pytorch_lightning.core.lightning.LightningModule.optimizer_zero_grad - :noindex: - -prepare_data -~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.prepare_data - :noindex: - -setup -~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.setup - :noindex: - -tbptt_split_batch -~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.tbptt_split_batch - :noindex: - -teardown -~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.teardown - :noindex: - -train_dataloader -~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.train_dataloader - :noindex: - -val_dataloader -~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.val_dataloader - :noindex: - -test_dataloader -~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.test_dataloader - :noindex: - -predict_dataloader -~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.predict_dataloader - :noindex: - -on_train_dataloader -~~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_train_dataloader - :noindex: - -on_val_dataloader -~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_val_dataloader - :noindex: - -on_test_dataloader -~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_test_dataloader - :noindex: - -on_predict_dataloader -~~~~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_predict_dataloader - :noindex: - -transfer_batch_to_device -~~~~~~~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.transfer_batch_to_device - :noindex: - -on_before_batch_transfer -~~~~~~~~~~~~~~~~~~~~~~~~ - -.. 
automethod:: pytorch_lightning.core.lightning.LightningModule.on_before_batch_transfer - :noindex: - -on_after_batch_transfer -~~~~~~~~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.on_after_batch_transfer - :noindex: - -add_to_queue -~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.add_to_queue - :noindex: - -get_from_queue -~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.core.lightning.LightningModule.get_from_queue - :noindex: diff --git a/source/common/optimization.rst b/source/common/optimization.rst deleted file mode 100644 index e7e9e12..0000000 --- a/source/common/optimization.rst +++ /dev/null @@ -1,327 +0,0 @@ -:orphan: - -.. _optimization: - -############ -Optimization -############ - -Lightning offers two modes for managing the optimization process: - -- Manual Optimization -- Automatic Optimization - -For the majority of research cases, **automatic optimization** will do the right thing for you and it is what most -users should use. - -For advanced/expert users who want to do esoteric optimization schedules or techniques, use **manual optimization**. - -.. _manual_optimization: - ----- - -.. include:: ../model/manual_optimization.rst - ------ - -********************** -Automatic Optimization -********************** - -With Lightning, most users don't have to think about when to call ``.zero_grad()``, ``.backward()`` and ``.step()`` -since Lightning automates that for you. - -Under the hood, Lightning does the following: - -.. code-block:: python - - for epoch in epochs: - for batch in data: - - def closure(): - loss = model.training_step(batch, batch_idx, ...) - optimizer.zero_grad() - loss.backward() - return loss - - optimizer.step(closure) - - lr_scheduler.step() - -In the case of multiple optimizers, Lightning does the following: - -.. 
code-block:: python - - for epoch in epochs: - for batch in data: - for opt in optimizers: - - def closure(): - loss = model.training_step(batch, batch_idx, optimizer_idx) - opt.zero_grad() - loss.backward() - return loss - - opt.step(closure) - - for lr_scheduler in lr_schedulers: - lr_scheduler.step() - -As can be seen in the code snippet above, Lightning defines a closure with ``training_step()``, ``optimizer.zero_grad()`` -and ``loss.backward()`` for the optimization. This mechanism is in place to support optimizers which operate on the -output of the closure (e.g. the loss) or need to call the closure several times (e.g. :class:`~torch.optim.LBFGS`). - -.. warning:: - - Before v1.2.2, Lightning internally called ``backward``, ``step`` and ``zero_grad`` in that order. - Since v1.2.2, the order is ``zero_grad``, ``backward`` and ``step``. - - -Gradient Accumulation -===================== - -.. include:: ../common/gradient_accumulation.rst - - -Use Multiple Optimizers (like GANs) -=================================== - -To use multiple optimizers (optionally with learning rate schedulers), return two or more optimizers from -:meth:`~pytorch_lightning.core.lightning.LightningModule.configure_optimizers`. - -.. testcode:: python - - # two optimizers, no schedulers - def configure_optimizers(self): - return Adam(...), SGD(...) - - - # two optimizers, one scheduler for adam only - def configure_optimizers(self): - opt1 = Adam(...) - opt2 = SGD(...) - optimizers = [opt1, opt2] - lr_schedulers = {"scheduler": ReduceLROnPlateau(opt1, ...), "monitor": "metric_to_track"} - return optimizers, lr_schedulers - - - # two optimizers, two schedulers - def configure_optimizers(self): - opt1 = Adam(...) - opt2 = SGD(...) - return [opt1, opt2], [StepLR(opt1, ...), OneCycleLR(opt2, ...)] - -Under the hood, Lightning will call each optimizer sequentially: - -..
code-block:: python - - for epoch in epochs: - for batch in data: - for opt in optimizers: - loss = train_step(batch, batch_idx, optimizer_idx) - opt.zero_grad() - loss.backward() - opt.step() - - for lr_scheduler in lr_schedulers: - lr_scheduler.step() - - -Step Optimizers at Arbitrary Intervals -====================================== - -To do more interesting things with your optimizers such as learning rate warm-up or odd scheduling, -override the :meth:`~pytorch_lightning.core.lightning.LightningModule.optimizer_step` function. - -.. warning:: - If you are overriding this method, make sure that you pass the ``optimizer_closure`` parameter to - ``optimizer.step()`` function as shown in the examples because ``training_step()``, ``optimizer.zero_grad()``, - ``loss.backward()`` are called in the closure function. - -For example, here we step optimizer A every batch and optimizer B every 2 batches. - -.. testcode:: python - - # Alternating schedule for optimizer steps (e.g. GANs) - def optimizer_step( - self, - epoch, - batch_idx, - optimizer, - optimizer_idx, - optimizer_closure, - on_tpu=False, - using_native_amp=False, - using_lbfgs=False, - ): - # update generator every step - if optimizer_idx == 0: - optimizer.step(closure=optimizer_closure) - - # update discriminator every 2 steps - if optimizer_idx == 1: - if (batch_idx + 1) % 2 == 0: - # the closure (which includes the `training_step`) will be executed by `optimizer.step` - optimizer.step(closure=optimizer_closure) - else: - # call the closure by itself to run `training_step` + `backward` without an optimizer step - optimizer_closure() - - # ... - # add as many optimizers as you want - -Here we add a manual learning rate warm-up without an lr scheduler. - -..
testcode:: python - - # learning rate warm-up - def optimizer_step( - self, - epoch, - batch_idx, - optimizer, - optimizer_idx, - optimizer_closure, - on_tpu=False, - using_native_amp=False, - using_lbfgs=False, - ): - # update params - optimizer.step(closure=optimizer_closure) - - # skip the first 500 steps - if self.trainer.global_step < 500: - lr_scale = min(1.0, float(self.trainer.global_step + 1) / 500.0) - for pg in optimizer.param_groups: - pg["lr"] = lr_scale * self.hparams.learning_rate - - -Access your Own Optimizer -========================= - -The provided ``optimizer`` is a :class:`~pytorch_lightning.core.optimizer.LightningOptimizer` object wrapping your own optimizer -configured in your :meth:`~pytorch_lightning.core.lightning.LightningModule.configure_optimizers`. -You can access your own optimizer with ``optimizer.optimizer``. However, if you use your own optimizer -to perform a step, Lightning won't be able to support accelerators, precision and profiling for you. - -.. testcode:: python - - # function hook in LightningModule - def optimizer_step( - self, - epoch, - batch_idx, - optimizer, - optimizer_idx, - optimizer_closure, - on_tpu=False, - using_native_amp=False, - using_lbfgs=False, - ): - optimizer.step(closure=optimizer_closure) - - - # `optimizer` is a `LightningOptimizer` wrapping the optimizer. - # To access it, do the following. - # However, it won't work on TPU, AMP, etc... - def optimizer_step( - self, - epoch, - batch_idx, - optimizer, - optimizer_idx, - optimizer_closure, - on_tpu=False, - using_native_amp=False, - using_lbfgs=False, - ): - optimizer = optimizer.optimizer - optimizer.step(closure=optimizer_closure) - ------ - - -Bring your own Custom Learning Rate Schedulers -============================================== - -Lightning allows using custom learning rate schedulers that aren't available in `PyTorch natively `_. -One good example is `Timm Schedulers `_. 
When using custom learning rate schedulers -relying on a different API from Native PyTorch ones, you should override the :meth:`~pytorch_lightning.core.lightning.LightningModule.lr_scheduler_step` with your desired logic. -If you are using native PyTorch schedulers, there is no need to override this hook since Lightning will handle it automatically by default. - -.. code-block:: python - - from timm.scheduler import TanhLRScheduler - - - def configure_optimizers(self): - optimizer = ... - scheduler = TanhLRScheduler(optimizer, ...) - return [optimizer], [{"scheduler": scheduler, "interval": "epoch"}] - - - def lr_scheduler_step(self, scheduler, optimizer_idx, metric): - scheduler.step(epoch=self.current_epoch) # timm's scheduler need the epoch value - - -.. _configure_gradient_clipping: - -Configure Gradient Clipping -=========================== - -To configure custom gradient clipping, consider overriding -the :meth:`~pytorch_lightning.core.lightning.LightningModule.configure_gradient_clipping` method. -Attributes ``gradient_clip_val`` and ``gradient_clip_algorithm`` from Trainer will be passed in the -respective arguments here and Lightning will handle gradient clipping for you. In case you want to set -different values for your arguments of your choice and let Lightning handle the gradient clipping, you can -use the inbuilt :meth:`~pytorch_lightning.core.lightning.LightningModule.clip_gradients` method and pass -the arguments along with your optimizer. - -.. warning:: - Make sure to not override :meth:`~pytorch_lightning.core.lightning.LightningModule.clip_gradients` - method. If you want to customize gradient clipping, consider using - :meth:`~pytorch_lightning.core.lightning.LightningModule.configure_gradient_clipping` method. - -For example, here we will apply gradient clipping only to the gradients associated with optimizer A. - -.. 
testcode:: python - - def configure_gradient_clipping(self, optimizer, optimizer_idx, gradient_clip_val, gradient_clip_algorithm): - if optimizer_idx == 0: - # Lightning will handle the gradient clipping - self.clip_gradients( - optimizer, gradient_clip_val=gradient_clip_val, gradient_clip_algorithm=gradient_clip_algorithm - ) - -Here we configure gradient clipping differently for optimizer B. - -.. testcode:: python - - def configure_gradient_clipping(self, optimizer, optimizer_idx, gradient_clip_val, gradient_clip_algorithm): - if optimizer_idx == 0: - # Lightning will handle the gradient clipping - self.clip_gradients( - optimizer, gradient_clip_val=gradient_clip_val, gradient_clip_algorithm=gradient_clip_algorithm - ) - elif optimizer_idx == 1: - self.clip_gradients( - optimizer, gradient_clip_val=gradient_clip_val * 2, gradient_clip_algorithm=gradient_clip_algorithm - ) - - -Total Stepping Batches -====================== - -You can use the built-in trainer property :paramref:`~pytorch_lightning.trainer.trainer.Trainer.estimated_stepping_batches` to compute -the total number of stepping batches for the complete training. The property is computed taking gradient accumulation factor and -distributed setting into consideration so you don't have to derive it manually. One good example where this can be helpful is while using -:class:`~torch.optim.lr_scheduler.OneCycleLR` scheduler, which requires pre-computed ``total_steps`` during initialization. - -.. code-block:: python - - def configure_optimizers(self): - optimizer = ... - scheduler = torch.optim.lr_scheduler.OneCycleLR( - optimizer, max_lr=1e-3, total_steps=self.trainer.estimated_stepping_batches - ) - return [optimizer], [scheduler] diff --git a/source/common/precision_basic.rst b/source/common/precision_basic.rst deleted file mode 100644 index 3cc0b3a..0000000 --- a/source/common/precision_basic.rst +++ /dev/null @@ -1,92 +0,0 @@ -:orphan: - -.. 
_precision_basic: - -####################### -N-Bit Precision (Basic) -####################### -**Audience:** Users looking to train models faster and consume less memory. - ----- - -If you're looking to run models faster or consume less memory, consider tweaking the precision settings of your models. - -Lower precision, such as 16-bit floating-point, requires less memory and enables training and deploying larger models. -Higher precision, such as the 64-bit floating-point, can be used for highly sensitive use-cases. - ----- - -**************** -16-bit Precision -**************** - -Use 16-bit precision to cut your memory consumption in half so that you can train and deploy larger models. If your GPUs are [`Tensor Core `_] GPUs, you can also get a ~3x speed improvement. Half precision can sometimes lead to unstable training. - -.. code:: - - Trainer(precision=16) - ----- - -**************** -32-bit Precision -**************** - -32-bit precision is the default used across all models and research. This precision is known to be stable in contrast to lower precision settings. - -.. testcode:: - - Trainer(precision=32) - ----- - -**************** -64-bit Precision -**************** - -For certain scientific computations, 64-bit precision enables more accurate models. However, doubling the precision from 32 to 64 bit also doubles the memory requirements. - -.. testcode:: - - Trainer(precision=64) - -.. note:: - - Since in deep learning, memory is always a bottleneck, especially when dealing with a large volume of data and with limited resources, - it is recommended to use single precision for better speed. However, you can still use 64-bit precision if your particular use-case requires it. - ----- - -******************************** -Precision support by accelerator -******************************** - -.. 
list-table:: Precision with Accelerators - :widths: 20 20 20 20 20 - :header-rows: 1 - - * - Precision - - CPU - - GPU - - TPU - - IPU - * - 16 - - No - - Yes - - No - - Yes - * - BFloat16 - - Yes - - Yes - - Yes - - No - * - 32 - - Yes - - Yes - - Yes - - Yes - * - 64 - - Yes - - Yes - - No - - No diff --git a/source/common/precision_intermediate.rst b/source/common/precision_intermediate.rst deleted file mode 100644 index 9ed4c75..0000000 --- a/source/common/precision_intermediate.rst +++ /dev/null @@ -1,143 +0,0 @@ -:orphan: - -.. _precision_intermediate: - -############################## -N-Bit Precision (Intermediate) -############################## -**Audience:** Users looking to scale larger models or take advantage of optimized accelerators. - ----- - -************************ -What is Mixed Precision? -************************ - -PyTorch, like most deep learning frameworks, trains on 32-bit floating-point (FP32) arithmetic by default. However, many deep learning models do not require this to reach complete accuracy. By conducting -operations in half-precision format while keeping minimum information in single-precision to maintain as much information as possible in crucial areas of the network, mixed precision training delivers -significant computational speedup. Switching to mixed precision has resulted in considerable training speedups since the introduction of Tensor Cores in the Volta and Turing architectures. It combines -FP32 and lower-bit floating-points (such as FP16) to reduce memory footprint and increase performance during model training and evaluation. It accomplishes this by recognizing the steps that require -complete accuracy and employing a 32-bit floating-point for those steps only, while using a 16-bit floating-point for the rest. When compared to complete precision training, mixed precision training -delivers all of these benefits while ensuring that no task-specific accuracy is lost. [`2 `_]. - -.. 
note:: - - In some cases, it is essential to remain in FP32 for numerical stability, so keep this in mind when using mixed precision. - For example, when running scatter operations during the forward (such as torchpoint3d), computation must remain in FP32. - -.. warning:: - - Do not cast anything to other dtypes manually using ``torch.autocast`` or ``tensor.half()`` when using native precision because - this can bring instability. - - .. code-block:: python - - class LitModel(LightningModule): - def training_step(self, batch, batch_idx): - outs = self(batch) - - a_float32 = torch.rand((8, 8), device=self.device, dtype=self.dtype) - b_float32 = torch.rand((8, 4), device=self.device, dtype=self.dtype) - - # casting to float16 manually - with torch.autocast(device_type=self.device.type): - c_float16 = torch.mm(a_float32, b_float32) - target = self.layer(c_float16.flatten()[None]) - - # here outs is of type float32 and target is of type float16 - loss = torch.mm(target @ outs).float() - return loss - - - trainer = Trainer(accelerator="gpu", devices=1, precision=32) - ----- - -******************** -FP16 Mixed Precision -******************** - -In most cases, mixed precision uses FP16. Supported `PyTorch operations `__ automatically run in FP16, saving memory and improving throughput on the supported accelerators. - - -.. note:: - - When using TPUs, setting ``precision=16`` will enable bfloat16, the only supported half precision type on TPUs. - -.. testcode:: - :skipif: not torch.cuda.is_available() - - Trainer(accelerator="gpu", devices=1, precision=16) - - -PyTorch Native --------------- - -PyTorch 1.6 release introduced mixed precision functionality into their core as the AMP package, `torch.cuda.amp `__. It is more flexible and intuitive compared to `NVIDIA APEX `__. -Since computation happens in FP16, there is a chance of numerical instability during training. 
This is handled internally by a dynamic grad scaler which skips invalid steps and adjusts the scaler to ensure subsequent steps fall within a finite range. For more information `see the autocast docs `__. -Lightning uses native amp by default with ``precision=16|"bf16"``. You can also set it using: - -.. testcode:: - - Trainer(precision=16, amp_backend="native") - - -NVIDIA APEX ------------ - -.. warning:: - - We strongly recommend using the above native mixed precision rather than NVIDIA APEX unless you require more refined control. - -`NVIDIA APEX `__ offers additional flexibility in setting mixed precision. This can be useful when trying out different precision configurations, such as keeping most of your weights in FP16 and running computation in FP16. - -.. testcode:: - :skipif: not _APEX_AVAILABLE or not torch.cuda.is_available() - - Trainer(accelerator="gpu", devices=1, amp_backend="apex", precision=16) - -Set the `NVIDIA optimization level `__ via the trainer. - -.. testcode:: - :skipif: not _APEX_AVAILABLE or not torch.cuda.is_available() - - Trainer(accelerator="gpu", devices=1, amp_backend="apex", amp_level="O2", precision=16) - ----- - -************************ -BFloat16 Mixed Precision -************************ - -.. warning:: - - BFloat16 requires PyTorch 1.10 or later and is only supported with PyTorch Native AMP. - - BFloat16 is also experimental and may not provide significant speedups or memory improvements, but offers better numerical stability. - - Do note for GPUs, the most significant benefits require `Ampere `__ based GPUs, such as A100s or 3090s. - -BFloat16 Mixed precision is similar to FP16 mixed precision, however, it maintains more of the "dynamic range" that FP32 offers. This means it is able to provide better numerical stability than FP16 mixed precision. For more information, see `this TPU performance blogpost `__. - -Under the hood, we use `torch.autocast `__ with the dtype set to ``bfloat16``, with no gradient scaling. - -.. 
testcode:: - :skipif: not _TORCH_GREATER_EQUAL_1_10 or not torch.cuda.is_available() - - Trainer(accelerator="gpu", devices=1, precision="bf16") - -It is also possible to use BFloat16 mixed precision on the CPU, relying on MKLDNN under the hood. - -.. testcode:: - :skipif: not _TORCH_GREATER_EQUAL_1_10 - - Trainer(precision="bf16") - ----- - -*************** -8-bit Optimizer -*************** - -It is possible to further reduce the precision using third-party libraries like `bitsandbytes `_. Although, -Lightning doesn't support it out of the box yet but you can still use it by configuring it in your LightningModule and setting ``Trainer(precision=32)``. diff --git a/source/common/progress_bar.rst b/source/common/progress_bar.rst deleted file mode 100644 index d00c716..0000000 --- a/source/common/progress_bar.rst +++ /dev/null @@ -1,138 +0,0 @@ -.. testsetup:: * - - from pytorch_lightning.trainer.trainer import Trainer - -.. _progress_bar: - - -Customize the progress bar -========================== - -Lightning supports two different types of progress bars (`tqdm `_ and `rich `_). :class:`~pytorch_lightning.callbacks.TQDMProgressBar` is used by default, -but you can override it by passing a custom :class:`~pytorch_lightning.callbacks.TQDMProgressBar` or :class:`~pytorch_lightning.callbacks.RichProgressBar` to the ``callbacks`` argument of the :class:`~pytorch_lightning.trainer.trainer.Trainer`. - -You could also use the :class:`~pytorch_lightning.callbacks.ProgressBarBase` class to implement your own progress bar. - -------------- - -TQDMProgressBar ---------------- - -The :class:`~pytorch_lightning.callbacks.TQDMProgressBar` uses the `tqdm `_ library internally and is the default progress bar used by Lightning. -It prints to ``stdout`` and shows up to four different bars: - -- **sanity check progress:** the progress during the sanity check run -- **main progress:** shows training + validation progress combined. 
It also accounts for multiple validation runs during training when :paramref:`~pytorch_lightning.trainer.trainer.Trainer.val_check_interval` is used. -- **validation progress:** only visible during validation; shows total progress over all validation datasets. -- **test progress:** only active when testing; shows total progress over all test datasets. - -For infinite datasets, the progress bar never ends. - -You can update ``refresh_rate`` (rate (number of batches) at which the progress bar gets updated) for :class:`~pytorch_lightning.callbacks.TQDMProgressBar` by: - -.. code-block:: python - - from pytorch_lightning.callbacks import TQDMProgressBar - - trainer = Trainer(callbacks=[TQDMProgressBar(refresh_rate=10)]) - -If you want to customize the default :class:`~pytorch_lightning.callbacks.TQDMProgressBar` used by Lightning, you can override -specific methods of the callback class and pass your custom implementation to the :class:`~pytorch_lightning.trainer.trainer.Trainer`. - -.. code-block:: python - - class LitProgressBar(TQDMProgressBar): - def init_validation_tqdm(self): - bar = super().init_validation_tqdm() - bar.set_description("running validation...") - return bar - - - trainer = Trainer(callbacks=[LitProgressBar()]) - -.. seealso:: - - :class:`~pytorch_lightning.callbacks.TQDMProgressBar` docs. - - `tqdm library `__ - ----------------- - -RichProgressBar ---------------- - -`Rich `_ is a Python library for rich text and beautiful formatting in the terminal. -To use the :class:`~pytorch_lightning.callbacks.RichProgressBar` as your progress bar, first install the package: - -.. code-block:: bash - - pip install rich - -Then configure the callback and pass it to the :class:`~pytorch_lightning.trainer.trainer.Trainer`: - -.. code-block:: python - - from pytorch_lightning.callbacks import RichProgressBar - - trainer = Trainer(callbacks=[RichProgressBar()]) - -Customize the theme for your :class:`~pytorch_lightning.callbacks.RichProgressBar` like this: - -.. 
code-block:: python - - from pytorch_lightning.callbacks import RichProgressBar - from pytorch_lightning.callbacks.progress.rich_progress import RichProgressBarTheme - - # create your own theme! - progress_bar = RichProgressBar( - theme=RichProgressBarTheme( - description="green_yellow", - progress_bar="green1", - progress_bar_finished="green1", - progress_bar_pulse="#6206E0", - batch_progress="green_yellow", - time="grey82", - processing_speed="grey82", - metrics="grey82", - ) - ) - - trainer = Trainer(callbacks=progress_bar) - -You can customize the components used within :class:`~pytorch_lightning.callbacks.RichProgressBar` with ease by overriding the -:func:`~pytorch_lightning.callbacks.RichProgressBar.configure_columns` method. - -.. code-block:: python - - from rich.progress import TextColumn - - custom_column = TextColumn("[progress.description]Custom Rich Progress Bar!") - - - class CustomRichProgressBar(RichProgressBar): - def configure_columns(self, trainer): - return [custom_column] - - - progress_bar = CustomRichProgressBar() - -If you wish for a new progress bar to be displayed at the end of every epoch, you should enable -:paramref:`RichProgressBar.leave ` by passing ``True`` - -.. code-block:: python - - from pytorch_lightning.callbacks import RichProgressBar - - trainer = Trainer(callbacks=[RichProgressBar(leave=True)]) - -.. seealso:: - - :class:`~pytorch_lightning.callbacks.RichProgressBar` docs. - - :class:`~pytorch_lightning.callbacks.RichModelSummary` docs to customize the model summary table. - - `Rich library `__. - - -.. note:: - - Progress bar is automatically enabled with the Trainer, and to disable it, one should do this: - - .. code-block:: python - - trainer = Trainer(enable_progress_bar=False) diff --git a/source/common/trainer.rst b/source/common/trainer.rst deleted file mode 100644 index 848ac8a..0000000 --- a/source/common/trainer.rst +++ /dev/null @@ -1,1832 +0,0 @@ -.. role:: hidden - :class: hidden-section - -.. 
testsetup:: * - - import os - from pytorch_lightning.trainer.trainer import Trainer - from pytorch_lightning.core.lightning import LightningModule - from pytorch_lightning.utilities.seed import seed_everything - -.. _trainer: - -Trainer -======= - -Once you've organized your PyTorch code into a LightningModule, -the Trainer automates everything else. - -.. raw:: html - - - -| - -This abstraction achieves the following: - -1. You maintain control over all aspects via PyTorch code without an added abstraction. - -2. The trainer uses best practices embedded by contributors and users - from top AI labs such as Facebook AI Research, NYU, MIT, Stanford, etc... - -3. The trainer allows overriding any key part that you don't want automated. - -| - ------------ - -Basic use ---------- - -This is the basic use of the trainer: - -.. code-block:: python - - model = MyLightningModule() - - trainer = Trainer() - trainer.fit(model, train_dataloader, val_dataloader) - --------- - -Under the hood --------------- -Under the hood, the Lightning Trainer handles the training loop details for you, some examples include: - -- Automatically enabling/disabling grads -- Running the training, validation and test dataloaders -- Calling the Callbacks at the appropriate times -- Putting batches and computations on the correct devices - -Here's the pseudocode for what the trainer does under the hood (showing the train loop only) - -.. code-block:: python - - # put model in train mode - model.train() - torch.set_grad_enabled(True) - - losses = [] - for batch in train_dataloader: - # calls hooks like this one - on_train_batch_start() - - # train step - loss = training_step(batch) - - # clear gradients - optimizer.zero_grad() - - # backward - loss.backward() - - # update parameters - optimizer.step() - - losses.append(loss) - - --------- - -Trainer in Python scripts -------------------------- -In Python scripts, it's recommended you use a main function to call the Trainer. - -.. 
code-block:: python - - from argparse import ArgumentParser - - - def main(hparams): - model = LightningModule() - trainer = Trainer(accelerator=hparams.accelerator, devices=hparams.devices) - trainer.fit(model) - - - if __name__ == "__main__": - parser = ArgumentParser() - parser.add_argument("--accelerator", default=None) - parser.add_argument("--devices", default=None) - args = parser.parse_args() - - main(args) - -So you can run it like so: - -.. code-block:: bash - - python main.py --accelerator 'gpu' --devices 2 - -.. note:: - - Pro-tip: You don't need to define all flags manually. Lightning can add them automatically - -.. code-block:: python - - from argparse import ArgumentParser - - - def main(args): - model = LightningModule() - trainer = Trainer.from_argparse_args(args) - trainer.fit(model) - - - if __name__ == "__main__": - parser = ArgumentParser() - parser = Trainer.add_argparse_args(parser) - args = parser.parse_args() - - main(args) - -So you can run it like so: - -.. code-block:: bash - - python main.py --accelerator 'gpu' --devices 2 --max_steps 10 --limit_train_batches 10 --any_trainer_arg x - -.. note:: - If you want to stop a training run early, you can press "Ctrl + C" on your keyboard. - The trainer will catch the ``KeyboardInterrupt`` and attempt a graceful shutdown, including - running accelerator callback ``on_train_end`` to clean up memory. The trainer object will also set - an attribute ``interrupted`` to ``True`` in such cases. If you have a callback which shuts down compute - resources, for example, you can conditionally run the shutdown logic for only uninterrupted runs. - ------------- - -Validation ----------- -You can perform an evaluation epoch over the validation set, outside of the training loop, -using :meth:`~pytorch_lightning.trainer.trainer.Trainer.validate`. This might be -useful if you want to collect new metrics from a model right at its initialization -or after it has already been trained. - -.. 
code-block:: python - - trainer.validate(dataloaders=val_dataloaders) - ------------- - -Testing -------- -Once you're done training, feel free to run the test set! -(Only right before publishing your paper or pushing to production) - -.. code-block:: python - - trainer.test(dataloaders=test_dataloaders) - ------------- - -Reproducibility ---------------- - -To ensure full reproducibility from run to run you need to set seeds for pseudo-random generators, -and set ``deterministic`` flag in ``Trainer``. - -Example:: - - from pytorch_lightning import Trainer, seed_everything - - seed_everything(42, workers=True) - # sets seeds for numpy, torch and python.random. - model = Model() - trainer = Trainer(deterministic=True) - - -By setting ``workers=True`` in :func:`~pytorch_lightning.utilities.seed.seed_everything`, Lightning derives -unique seeds across all dataloader workers and processes for :mod:`torch`, :mod:`numpy` and stdlib -:mod:`random` number generators. When turned on, it ensures that e.g. data augmentations are not repeated across workers. - -------- - -.. _trainer_flags: - -Trainer flags -------------- - -accelerator -^^^^^^^^^^^ - -Supports passing different accelerator types (``"cpu", "gpu", "tpu", "ipu", "auto"``) -as well as custom accelerator instances. - -.. code-block:: python - - # CPU accelerator - trainer = Trainer(accelerator="cpu") - - # Training with GPU Accelerator using 2 GPUs - trainer = Trainer(devices=2, accelerator="gpu") - - # Training with TPU Accelerator using 8 tpu cores - trainer = Trainer(devices=8, accelerator="tpu") - - # Training with GPU Accelerator using the DistributedDataParallel strategy - trainer = Trainer(devices=4, accelerator="gpu", strategy="ddp") - -.. note:: The ``"auto"`` option recognizes the machine you are on, and selects the respective ``Accelerator``. - -.. 
code-block:: python - - # If your machine has GPUs, it will use the GPU Accelerator for training - trainer = Trainer(devices=2, accelerator="auto") - -You can also modify hardware behavior by subclassing an existing accelerator to adjust for your needs. - -Example:: - - class MyOwnAcc(CPUAccelerator): - ... - - Trainer(accelerator=MyOwnAcc()) - -.. note:: - - If the ``devices`` flag is not defined, it will assume ``devices`` to be ``"auto"`` and fetch the ``auto_device_count`` - from the accelerator. - - .. code-block:: python - - # This is part of the built-in `GPUAccelerator` - class GPUAccelerator(Accelerator): - """Accelerator for GPU devices.""" - - @staticmethod - def auto_device_count() -> int: - """Get the devices when set to auto.""" - return torch.cuda.device_count() - - - # Training with GPU Accelerator using total number of gpus available on the system - Trainer(accelerator="gpu") - -.. warning:: Passing training strategies (e.g., ``"ddp"``) to ``accelerator`` has been deprecated in v1.5.0 - and will be removed in v1.7.0. Please use the ``strategy`` argument instead. - -accumulate_grad_batches -^^^^^^^^^^^^^^^^^^^^^^^ - -.. raw:: html - - - -| - -Accumulates grads every k batches or as set up in the dict. -Trainer also calls ``optimizer.step()`` for the last indivisible step number. - -.. testcode:: - - # default used by the Trainer (no accumulation) - trainer = Trainer(accumulate_grad_batches=1) - -Example:: - - # accumulate every 4 batches (effective batch size is batch*4) - trainer = Trainer(accumulate_grad_batches=4) - - # no accumulation for epochs 1-4. accumulate 3 for epochs 5-10. accumulate 20 after that - trainer = Trainer(accumulate_grad_batches={5: 3, 10: 20}) - -amp_backend -^^^^^^^^^^^ - -.. raw:: html - - - -| - -Use PyTorch AMP ('native'), or NVIDIA apex ('apex'). - -.. 
testcode:: - - # using PyTorch built-in AMP, default used by the Trainer - trainer = Trainer(amp_backend="native") - - # using NVIDIA Apex - trainer = Trainer(amp_backend="apex") - -amp_level -^^^^^^^^^ - -.. raw:: html - - - -| - -The optimization level to use (O1, O2, etc...) -for 16-bit GPU precision (using NVIDIA apex under the hood). - -Check `NVIDIA apex docs `_ for level - -Example:: - - # default used by the Trainer - trainer = Trainer(amp_level='O2') - -auto_scale_batch_size -^^^^^^^^^^^^^^^^^^^^^ - -.. raw:: html - - - -| - -Automatically tries to find the largest batch size that fits into memory, -before any training. - -.. code-block:: python - - # default used by the Trainer (no scaling of batch size) - trainer = Trainer(auto_scale_batch_size=None) - - # run batch size scaling, result overrides hparams.batch_size - trainer = Trainer(auto_scale_batch_size="binsearch") - - # call tune to find the batch size - trainer.tune(model) - -auto_select_gpus -^^^^^^^^^^^^^^^^ - -.. raw:: html - - - -| - -If enabled and ``devices`` is an integer, pick available GPUs automatically. -This is especially useful when GPUs are configured to be in "exclusive mode", -such that only one process at a time can access them. - -Example:: - - # no auto selection (picks first 2 GPUs on system, may fail if other process is occupying) - trainer = Trainer(accelerator="gpu", devices=2, auto_select_gpus=False) - - # enable auto selection (will find two available GPUs on system) - trainer = Trainer(accelerator="gpu", devices=2, auto_select_gpus=True) - - # specifies all GPUs regardless of its availability - Trainer(accelerator="gpu", devices=-1, auto_select_gpus=False) - - # specifies all available GPUs (if only one GPU is not occupied, uses one gpu) - Trainer(accelerator="gpu", devices=-1, auto_select_gpus=True) - -auto_lr_find -^^^^^^^^^^^^ - -.. 
raw:: html - - - -| - -Runs a learning rate finder algorithm (see this `paper `_) -when calling trainer.tune(), to find optimal initial learning rate. - -.. code-block:: python - - # default used by the Trainer (no learning rate finder) - trainer = Trainer(auto_lr_find=False) - -Example:: - - # run learning rate finder, results override hparams.learning_rate - trainer = Trainer(auto_lr_find=True) - - # call tune to find the lr - trainer.tune(model) - -Example:: - - # run learning rate finder, results override hparams.my_lr_arg - trainer = Trainer(auto_lr_find='my_lr_arg') - - # call tune to find the lr - trainer.tune(model) - -.. note:: - See the :ref:`learning rate finder guide `. - -benchmark -^^^^^^^^^ - -.. raw:: html - - - -| - -Defaults to ``True`` if :paramref:`~pytorch_lightning.trainer.Trainer.deterministic` is not set. -This flag sets the ``torch.backends.cudnn.benchmark`` flag. You can read more about its impact -`here `__ - -This is likely to increase the speed of your system if your input sizes don't change. However, if they do, then it -might make your system slower. The CUDNN auto-tuner will try to find the best algorithm for the hardware when a new -input size is encountered. Read more about it `here `__. - -Example:: - - # defaults to True if not deterministic (which is False by default) - trainer = Trainer() - - # you can overwrite the value - trainer = Trainer(benchmark=False) - -deterministic -^^^^^^^^^^^^^ - -.. raw:: html - - - -| - -This flag sets the ``torch.backends.cudnn.deterministic`` flag. -Might make your system slower, but ensures reproducibility. -Also sets ``$HOROVOD_FUSION_THRESHOLD=0``. - -For more info check `PyTorch docs `_. - -Example:: - - # default used by the Trainer - trainer = Trainer(deterministic=False) - -callbacks -^^^^^^^^^ - -.. raw:: html - - - -| - -Add a list of :class:`~pytorch_lightning.callbacks.Callback`. 
Callbacks run sequentially in the order defined here -with the exception of :class:`~pytorch_lightning.callbacks.model_checkpoint.ModelCheckpoint` callbacks which run -after all others to ensure all states are saved to the checkpoints. - -.. code-block:: python - - # a list of callbacks - callbacks = [PrintCallback()] - trainer = Trainer(callbacks=callbacks) - -Example:: - - from pytorch_lightning.callbacks import Callback - - class PrintCallback(Callback): - def on_train_start(self, trainer, pl_module): - print("Training is started!") - def on_train_end(self, trainer, pl_module): - print("Training is done.") - - -Model-specific callbacks can also be added inside the ``LightningModule`` through -:meth:`~pytorch_lightning.core.lightning.LightningModule.configure_callbacks`. -Callbacks returned in this hook will extend the list initially given to the ``Trainer`` argument, and replace -the trainer callbacks should there be two or more of the same type. -:class:`~pytorch_lightning.callbacks.model_checkpoint.ModelCheckpoint` callbacks always run last. - - -check_val_every_n_epoch -^^^^^^^^^^^^^^^^^^^^^^^ - -.. raw:: html - - - -| - -Check val every n train epochs. - -Example:: - - # default used by the Trainer - trainer = Trainer(check_val_every_n_epoch=1) - - # run val loop every 10 training epochs - trainer = Trainer(check_val_every_n_epoch=10) - -checkpoint_callback -^^^^^^^^^^^^^^^^^^^ - -.. warning:: `checkpoint_callback` has been deprecated in v1.5 and will be removed in v1.7. - To disable checkpointing, pass ``enable_checkpointing = False`` to the Trainer instead. - - -default_root_dir -^^^^^^^^^^^^^^^^ - -.. raw:: html - - - -| - -Default path for logs and weights when no logger or -:class:`pytorch_lightning.callbacks.ModelCheckpoint` callback passed. On -certain clusters you might want to separate where logs and checkpoints are -stored. If you don't then use this argument for convenience. 
Paths can be local -paths or remote paths such as `s3://bucket/path` or 'hdfs://path/'. Credentials -will need to be set up to use remote filepaths. - -.. testcode:: - - # default used by the Trainer - trainer = Trainer(default_root_dir=os.getcwd()) - -devices -^^^^^^^ - -Number of devices to train on (``int``), which devices to train on (``list`` or ``str``), or ``"auto"``. -It will be mapped to either ``gpus``, ``tpu_cores``, ``num_processes`` or ``ipus``, -based on the accelerator type (``"cpu", "gpu", "tpu", "ipu", "auto"``). - -.. code-block:: python - - # Training with CPU Accelerator using 2 processes - trainer = Trainer(devices=2, accelerator="cpu") - - # Training with GPU Accelerator using GPUs 1 and 3 - trainer = Trainer(devices=[1, 3], accelerator="gpu") - - # Training with TPU Accelerator using 8 tpu cores - trainer = Trainer(devices=8, accelerator="tpu") - -.. tip:: The ``"auto"`` option recognizes the devices to train on, depending on the ``Accelerator`` being used. - -.. code-block:: python - - # If your machine has GPUs, it will use all the available GPUs for training - trainer = Trainer(devices="auto", accelerator="auto") - - # Training with CPU Accelerator using 1 process - trainer = Trainer(devices="auto", accelerator="cpu") - - # Training with TPU Accelerator using 8 tpu cores - trainer = Trainer(devices="auto", accelerator="tpu") - - # Training with IPU Accelerator using 4 ipus - trainer = Trainer(devices="auto", accelerator="ipu") - -.. note:: - - If the ``devices`` flag is not defined, it will assume ``devices`` to be ``"auto"`` and fetch the ``auto_device_count`` - from the accelerator. - - .. 
code-block:: python - - # This is part of the built-in `GPUAccelerator` - class GPUAccelerator(Accelerator): - """Accelerator for GPU devices.""" - - @staticmethod - def auto_device_count() -> int: - """Get the devices when set to auto.""" - return torch.cuda.device_count() - - - # Training with GPU Accelerator using total number of gpus available on the system - Trainer(accelerator="gpu") - -enable_checkpointing -^^^^^^^^^^^^^^^^^^^^ - -.. raw:: html - - - -| - -By default Lightning saves a checkpoint for you in your current working directory, with the state of your last training epoch, -Checkpoints capture the exact value of all parameters used by a model. -To disable automatic checkpointing, set this to `False`. - -.. code-block:: python - - # default used by Trainer, saves the most recent model to a single checkpoint after each epoch - trainer = Trainer(enable_checkpointing=True) - - # turn off automatic checkpointing - trainer = Trainer(enable_checkpointing=False) - - -You can override the default behavior by initializing the :class:`~pytorch_lightning.callbacks.ModelCheckpoint` -callback, and adding it to the :paramref:`~pytorch_lightning.trainer.trainer.Trainer.callbacks` list. -See :doc:`Saving and Loading Checkpoints <../common/checkpointing>` for how to customize checkpointing. - -.. testcode:: - - from pytorch_lightning.callbacks import ModelCheckpoint - - # Init ModelCheckpoint callback, monitoring 'val_loss' - checkpoint_callback = ModelCheckpoint(monitor="val_loss") - - # Add your callback to the callbacks list - trainer = Trainer(callbacks=[checkpoint_callback]) - -fast_dev_run -^^^^^^^^^^^^ - -.. raw:: html - - - -| - -Runs n if set to ``n`` (int) else 1 if set to ``True`` batch(es) of train, val and test -to find any bugs (ie: a sort of unit test). - -Under the hood the pseudocode looks like this when running *fast_dev_run* with a single batch: - -.. 
code-block:: python - - # loading - __init__() - prepare_data - - # test training step - training_batch = next(train_dataloader) - training_step(training_batch) - - # test val step - val_batch = next(val_dataloader) - out = validation_step(val_batch) - validation_epoch_end([out]) - -.. testcode:: - - # default used by the Trainer - trainer = Trainer(fast_dev_run=False) - - # runs 1 train, val, test batch and program ends - trainer = Trainer(fast_dev_run=True) - - # runs 7 train, val, test batches and program ends - trainer = Trainer(fast_dev_run=7) - -.. note:: - - This argument is a bit different from ``limit_train/val/test_batches``. Setting this argument will - disable tuner, checkpoint callbacks, early stopping callbacks, loggers and logger callbacks like - ``LearningRateLogger`` and runs for only 1 epoch. This must be used only for debugging purposes. - ``limit_train/val/test_batches`` only limits the number of batches and won't disable anything. - -flush_logs_every_n_steps -^^^^^^^^^^^^^^^^^^^^^^^^ - -.. warning:: ``flush_logs_every_n_steps`` has been deprecated in v1.5 and will be removed in v1.7. - Please configure flushing directly in the logger instead. - -.. raw:: html - - - -| - -Writes logs to disk this often. - -.. testcode:: - - # default used by the Trainer - trainer = Trainer(flush_logs_every_n_steps=100) - -See Also: - - :doc:`logging <../extensions/logging>` - -.. _gpus: - -gpus -^^^^ - -.. warning:: ``gpus=x`` has been deprecated in v1.7 and will be removed in v2.0. - Please use ``accelerator='gpu'`` and ``devices=x`` instead. - -.. raw:: html - - - -| - -- Number of GPUs to train on (int) -- or which GPUs to train on (list) -- can handle strings - -.. 
testcode:: - - # default used by the Trainer (ie: train on CPU) - trainer = Trainer(gpus=None) - - # equivalent - trainer = Trainer(gpus=0) - -Example:: - - # int: train on 2 gpus - trainer = Trainer(gpus=2) - - # list: train on GPUs 1, 4 (by bus ordering) - trainer = Trainer(gpus=[1, 4]) - trainer = Trainer(gpus='1, 4') # equivalent - - # -1: train on all gpus - trainer = Trainer(gpus=-1) - trainer = Trainer(gpus='-1') # equivalent - - # combine with num_nodes to train on multiple GPUs across nodes - # uses 8 gpus in total - trainer = Trainer(gpus=2, num_nodes=4) - - # train only on GPUs 1 and 4 across nodes - trainer = Trainer(gpus=[1, 4], num_nodes=4) - -See Also: - - :ref:`Multi GPU Training ` - -gradient_clip_val -^^^^^^^^^^^^^^^^^ - -.. raw:: html - - - -| - -Gradient clipping value - -- 0 means don't clip. - -.. testcode:: - - # default used by the Trainer - trainer = Trainer(gradient_clip_val=0.0) - -limit_train_batches -^^^^^^^^^^^^^^^^^^^ - -.. raw:: html - - - -| - -How much of training dataset to check. -Useful when debugging or testing something that happens at the end of an epoch. - -.. testcode:: - - # default used by the Trainer - trainer = Trainer(limit_train_batches=1.0) - -Example:: - - # default used by the Trainer - trainer = Trainer(limit_train_batches=1.0) - - # run through only 25% of the training set each epoch - trainer = Trainer(limit_train_batches=0.25) - - # run through only 10 batches of the training set each epoch - trainer = Trainer(limit_train_batches=10) - -limit_test_batches -^^^^^^^^^^^^^^^^^^ - -.. raw:: html - - - -| - -How much of test dataset to check. - -.. testcode:: - - # default used by the Trainer - trainer = Trainer(limit_test_batches=1.0) - - # run through only 25% of the test set each epoch - trainer = Trainer(limit_test_batches=0.25) - - # run for only 10 batches - trainer = Trainer(limit_test_batches=10) - -In the case of multiple test dataloaders, the limit applies to each dataloader individually. 
- -limit_val_batches -^^^^^^^^^^^^^^^^^ - -.. raw:: html - - - -| - -How much of validation dataset to check. -Useful when debugging or testing something that happens at the end of an epoch. - -.. testcode:: - - # default used by the Trainer - trainer = Trainer(limit_val_batches=1.0) - - # run through only 25% of the validation set each epoch - trainer = Trainer(limit_val_batches=0.25) - - # run for only 10 batches - trainer = Trainer(limit_val_batches=10) - -In the case of multiple validation dataloaders, the limit applies to each dataloader individually. - -log_every_n_steps -^^^^^^^^^^^^^^^^^ - -.. raw:: html - - - -| - - -How often to add logging rows (does not write to disk) - -.. testcode:: - - # default used by the Trainer - trainer = Trainer(log_every_n_steps=50) - -See Also: - - :doc:`logging <../extensions/logging>` - -logger -^^^^^^ - -.. raw:: html - - - -| - -:doc:`Logger <../visualize/loggers>` (or iterable collection of loggers) for experiment tracking. A ``True`` value uses the default ``TensorBoardLogger`` shown below. ``False`` will disable logging. - -.. testcode:: - - from pytorch_lightning.loggers import TensorBoardLogger - - # default logger used by trainer - logger = TensorBoardLogger(save_dir=os.getcwd(), version=1, name="lightning_logs") - Trainer(logger=logger) - -max_epochs -^^^^^^^^^^ - -.. raw:: html - - - -| - -Stop training once this number of epochs is reached - -.. testcode:: - - # default used by the Trainer - trainer = Trainer(max_epochs=1000) - -If both ``max_epochs`` and ``max_steps`` aren't specified, ``max_epochs`` will default to ``1000``. -To enable infinite training, set ``max_epochs = -1``. - -min_epochs -^^^^^^^^^^ - -.. raw:: html - - - -| - -Force training for at least these many epochs - -.. testcode:: - - # default used by the Trainer - trainer = Trainer(min_epochs=1) - -max_steps -^^^^^^^^^ - -.. raw:: html - - - -| - -Stop training after this number of :ref:`global steps `. 
-Training will stop when either max_steps or max_epochs has been reached (whichever comes first). - -.. testcode:: - - # Default (disabled) - trainer = Trainer(max_steps=None) - - # Stop after 100 steps - trainer = Trainer(max_steps=100) - -If ``max_steps`` is not specified, ``max_epochs`` will be used instead (and ``max_epochs`` defaults to -``1000`` if ``max_epochs`` is not specified). To disable this default, set ``max_steps = -1``. - -min_steps -^^^^^^^^^ - -.. raw:: html - - - -| - -Force training for at least this number of :ref:`global steps `. -The Trainer will train the model for at least min_steps or min_epochs (whichever is reached later). - -.. testcode:: - - # Default (disabled) - trainer = Trainer(min_steps=None) - - # Run at least for 100 steps (disable min_epochs) - trainer = Trainer(min_steps=100, min_epochs=0) - -max_time -^^^^^^^^ - -Set the maximum amount of time for training. Training will get interrupted mid-epoch. -For customizable options use the :class:`~pytorch_lightning.callbacks.timer.Timer` callback. - -.. testcode:: - - # Default (disabled) - trainer = Trainer(max_time=None) - - # Stop after 12 hours of training or when reaching 10 epochs (string) - trainer = Trainer(max_time="00:12:00:00", max_epochs=10) - - # Stop after 1 day and 5 hours (dict) - trainer = Trainer(max_time={"days": 1, "hours": 5}) - -In case ``max_time`` is used together with ``min_steps`` or ``min_epochs``, the ``min_*`` requirement -always has precedence. - -num_nodes -^^^^^^^^^ - -.. raw:: html - - - -| - -Number of GPU nodes for distributed training. - -.. testcode:: - - # default used by the Trainer - trainer = Trainer(num_nodes=1) - - # to train on 8 nodes - trainer = Trainer(num_nodes=8) - -num_processes -^^^^^^^^^^^^^ - -.. warning:: ``num_processes=x`` has been deprecated in v1.7 and will be removed in v2.0. - Please use ``accelerator='cpu'`` and ``devices=x`` instead. - -.. raw:: html - - - -| - -Number of processes to train with. Automatically set to the number of GPUs -when using ``strategy="ddp"``.
Set to a number greater than 1 when -using ``accelerator="cpu"`` and ``strategy="ddp"`` to mimic distributed training on a -machine without GPUs. This is useful for debugging, but **will not** provide -any speedup, since single-process Torch already makes efficient use of multiple -CPUs. While it would typically spawn subprocesses for training, setting -``num_nodes > 1`` and keeping ``num_processes = 1`` runs training in the main -process. - -.. testcode:: - - # Simulate DDP for debugging on your GPU-less laptop - trainer = Trainer(accelerator="cpu", strategy="ddp", num_processes=2) - -num_sanity_val_steps -^^^^^^^^^^^^^^^^^^^^ - -.. raw:: html - - - -| - -Sanity check runs n batches of val before starting the training routine. -This catches any bugs in your validation without having to wait for the first validation check. -The Trainer uses 2 steps by default. Turn it off or modify it here. - -.. testcode:: - - # default used by the Trainer - trainer = Trainer(num_sanity_val_steps=2) - - # turn it off - trainer = Trainer(num_sanity_val_steps=0) - - # check all validation data - trainer = Trainer(num_sanity_val_steps=-1) - - -This option will reset the validation dataloader unless ``num_sanity_val_steps=0``. - -overfit_batches -^^^^^^^^^^^^^^^ - -.. raw:: html - - - -| - -Uses this fraction (or number of batches) of the training & validation set. -If the training & validation dataloaders have ``shuffle=True``, Lightning will automatically disable it. - -Useful for quickly debugging or trying to overfit on purpose. - -.. testcode:: - - # default used by the Trainer - trainer = Trainer(overfit_batches=0.0) - - # use only 1% of the train & val set - trainer = Trainer(overfit_batches=0.01) - - # overfit on 10 of the same batches - trainer = Trainer(overfit_batches=10) - -plugins -^^^^^^^ - -.. raw:: html - - - -| - -:ref:`Plugins` allow you to connect arbitrary backends, precision libraries, clusters etc.
For example: - -- :ref:`Checkpoint IO ` -- `TorchElastic `_ -- :ref:`Precision Plugins ` - -To define your own behavior, subclass the relevant class and pass it in. Here's an example linking up your own -:class:`~pytorch_lightning.plugins.environments.ClusterEnvironment`. - -.. code-block:: python - - from pytorch_lightning.plugins.environments import ClusterEnvironment - - - class MyCluster(ClusterEnvironment): - def main_address(self): - return your_main_address - - def main_port(self): - return your_main_port - - def world_size(self): - return the_world_size - - - trainer = Trainer(plugins=[MyCluster()], ...) - -precision -^^^^^^^^^ - -.. raw:: html - - - -| - -Lightning supports either double (64), float (32), bfloat16 (bf16), or half (16) precision training. - -Half precision, or mixed precision, is the combined use of 32 and 16 bit floating points to reduce memory footprint during model training. This can result in improved performance, achieving +3X speedups on modern GPUs. - -.. testcode:: - :skipif: not torch.cuda.is_available() - - # default used by the Trainer - trainer = Trainer(precision=32) - - # 16-bit precision - trainer = Trainer(precision=16, accelerator="gpu", devices=1) # works only on CUDA - - # bfloat16 precision - trainer = Trainer(precision="bf16") - - # 64-bit precision - trainer = Trainer(precision=64) - - -.. note:: When running on TPUs, torch.bfloat16 will be used but tensor printing will still show torch.float32. - -.. admonition:: If you are interested in using Apex 16-bit training: - :class: dropdown - - NVIDIA Apex and DDP have instability problems. We recommend using the native AMP for 16-bit precision with multiple GPUs. - To use Apex 16-bit training: - - 1. `Install apex. `__ - - 2. Set the ``precision`` trainer flag to 16. You can customize the `Apex optimization level `_ by setting the `amp_level` flag. - - .. 
testcode:: - :skipif: not _APEX_AVAILABLE or not torch.cuda.is_available() - - # turn on 16-bit - trainer = Trainer(amp_backend="apex", amp_level="O2", precision=16, accelerator="gpu", devices=1) - - -process_position -^^^^^^^^^^^^^^^^ - -.. warning:: ``process_position`` has been deprecated in v1.5 and will be removed in v1.7. - Please pass :class:`~pytorch_lightning.callbacks.progress.TQDMProgressBar` with ``process_position`` - directly to the Trainer's ``callbacks`` argument instead. - -.. raw:: html - - - -| - -Orders the progress bar. Useful when running multiple trainers on the same node. - -.. testcode:: - - # default used by the Trainer - trainer = Trainer(process_position=0) - -.. note:: This argument is ignored if a custom callback is passed to :paramref:`~Trainer.callbacks`. - -profiler -^^^^^^^^ - -.. raw:: html - - - -| - -To profile individual steps during training and assist in identifying bottlenecks. - -See the :doc:`profiler documentation <../tuning/profiler>` for more details. - -.. testcode:: - - from pytorch_lightning.profiler import SimpleProfiler, AdvancedProfiler - - # default used by the Trainer - trainer = Trainer(profiler=None) - - # to profile standard training events, equivalent to `profiler=SimpleProfiler()` - trainer = Trainer(profiler="simple") - - # advanced profiler for function-level stats, equivalent to `profiler=AdvancedProfiler()` - trainer = Trainer(profiler="advanced") - -enable_progress_bar -^^^^^^^^^^^^^^^^^^^ - -Whether to enable or disable the progress bar. Defaults to True. - -.. testcode:: - - # default used by the Trainer - trainer = Trainer(enable_progress_bar=True) - - # disable progress bar - trainer = Trainer(enable_progress_bar=False) - -reload_dataloaders_every_n_epochs -^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ - -.. raw:: html - - - -| - -Set to a positive integer to reload dataloaders every n epochs. - -..
code-block:: python - - # if 0 (default) - train_loader = model.train_dataloader() - for epoch in epochs: - for batch in train_loader: - ... - - # if a positive integer - for epoch in epochs: - if not epoch % reload_dataloaders_every_n_epochs: - train_loader = model.train_dataloader() - for batch in train_loader: - ... - -.. _replace-sampler-ddp: - -replace_sampler_ddp -^^^^^^^^^^^^^^^^^^^ - -.. raw:: html - - - -| - -Enables auto adding of :class:`~torch.utils.data.distributed.DistributedSampler`. In PyTorch, you must use it in -distributed settings such as TPUs or multi-node. The sampler makes sure each GPU sees the appropriate part of your data. -By default it will add ``shuffle=True`` for train sampler and ``shuffle=False`` for val/test sampler. -If you want to customize it, you can set ``replace_sampler_ddp=False`` and add your own distributed sampler. -If ``replace_sampler_ddp=True`` and a distributed sampler was already added, -Lightning will not replace the existing one. - -.. testcode:: - - # default used by the Trainer - trainer = Trainer(replace_sampler_ddp=True) - -By setting to False, you have to add your own distributed sampler: - -.. code-block:: python - - # in your LightningModule or LightningDataModule - def train_dataloader(self): - # default used by the Trainer - sampler = torch.utils.data.distributed.DistributedSampler(dataset, shuffle=True) - dataloader = DataLoader(dataset, batch_size=32, sampler=sampler) - return dataloader - -.. note:: For iterable datasets, we don't do this automatically. - -resume_from_checkpoint -^^^^^^^^^^^^^^^^^^^^^^ - -.. warning:: ``resume_from_checkpoint`` is deprecated in v1.5 and will be removed in v2.0. - Please pass ``trainer.fit(ckpt_path="some/path/to/my_checkpoint.ckpt")`` instead. - - -.. raw:: html - - - -| - -To resume training from a specific checkpoint pass in the path here. If resuming from a mid-epoch -checkpoint, training will start from the beginning of the next epoch. - -.. 
testcode:: - - # default used by the Trainer - trainer = Trainer(resume_from_checkpoint=None) - - # resume from a specific checkpoint - trainer = Trainer(resume_from_checkpoint="some/path/to/my_checkpoint.ckpt") - -strategy -^^^^^^^^ - -Supports passing different training strategies with aliases (ddp, ddp_spawn, etc) as well as custom strategies. - -.. code-block:: python - - # Training with the DistributedDataParallel strategy on 4 GPUs - trainer = Trainer(strategy="ddp", accelerator="gpu", devices=4) - - # Training with the DDP Spawn strategy using 4 cpu processes - trainer = Trainer(strategy="ddp_spawn", accelerator="cpu", devices=4) - -.. note:: Additionally, you can pass your custom strategy to the ``strategy`` argument. - -.. code-block:: python - - from pytorch_lightning.strategies import DDPStrategy - - - class CustomDDPStrategy(DDPStrategy): - def configure_ddp(self): - self._model = MyCustomDistributedDataParallel( - self.model, - device_ids=..., - ) - - - trainer = Trainer(strategy=CustomDDPStrategy(), accelerator="gpu", devices=2) - -See Also: - - :ref:`Multi GPU Training `. - - :doc:`Model Parallel GPU training guide <../advanced/model_parallel>`. - - :doc:`TPU training guide <../accelerators/tpu>`. - -sync_batchnorm -^^^^^^^^^^^^^^ - -.. raw:: html - - - -| - -Enable synchronization between batchnorm layers across all GPUs. - -.. testcode:: - - trainer = Trainer(sync_batchnorm=True) - -track_grad_norm -^^^^^^^^^^^^^^^ - -.. raw:: html - - - -| - -- no tracking (-1) -- Otherwise tracks that norm (2 for 2-norm) - -.. testcode:: - - # default used by the Trainer - trainer = Trainer(track_grad_norm=-1) - - # track the 2-norm - trainer = Trainer(track_grad_norm=2) - -.. _tpu_cores: - -tpu_cores -^^^^^^^^^ - -.. warning:: ``tpu_cores=x`` has been deprecated in v1.7 and will be removed in v2.0. - Please use ``accelerator='tpu'`` and ``devices=x`` instead. - -.. raw:: html - - - -| - -- How many TPU cores to train on (1 or 8). 
-- Which TPU core to train on [1-8] - -A single TPU v2 or v3 has 8 cores. A TPU pod has -up to 2048 cores. A slice of a POD means you get as many cores -as you request. - -Your effective batch size is batch_size * total tpu cores. - -This parameter can be either 1 or 8. - -Example:: - - # your_trainer_file.py - - # default used by the Trainer (ie: train on CPU) - trainer = Trainer(tpu_cores=None) - - # int: train on a single core - trainer = Trainer(tpu_cores=1) - - # list: train on a single selected core - trainer = Trainer(tpu_cores=[2]) - - # int: train on all 8 cores - trainer = Trainer(tpu_cores=8) - - # for 8+ cores must submit via xla script with - # a max of 8 cores specified. The XLA script - # will duplicate script onto each TPU in the POD - trainer = Trainer(tpu_cores=8) - -To train on more than 8 cores (ie: a POD), -submit this script using the xla_dist script. - -Example:: - - python -m torch_xla.distributed.xla_dist - --tpu=$TPU_POD_NAME - --conda-env=torch-xla-nightly - --env=XLA_USE_BF16=1 - -- python your_trainer_file.py - - -val_check_interval -^^^^^^^^^^^^^^^^^^ - -.. raw:: html - - - -| - -How often within one training epoch to check the validation set. -Can specify as float or int. - -- pass a ``float`` in the range [0.0, 1.0] to check after a fraction of the training epoch. -- pass an ``int`` to check after a fixed number of training batches. - -.. testcode:: - - # default used by the Trainer - trainer = Trainer(val_check_interval=1.0) - - # check validation set 4 times during a training epoch - trainer = Trainer(val_check_interval=0.25) - - # check validation set every 1000 training batches - # use this when using IterableDataset and your dataset has no length - # (ie: production cases with streaming data) - trainer = Trainer(val_check_interval=1000) - - -.. code-block:: python - - # Here is the computation to estimate the total number of batches seen within an epoch.
- - # Find the total number of train batches - total_train_batches = total_train_samples // (train_batch_size * world_size) - - # Compute how many times we will call validation during the training loop - val_check_batch = max(1, int(total_train_batches * val_check_interval)) - val_checks_per_epoch = total_train_batches / val_check_batch - - # Find the total number of validation batches - total_val_batches = total_val_samples // (val_batch_size * world_size) - - # Total number of batches run - total_fit_batches = total_train_batches + total_val_batches - - -weights_save_path -^^^^^^^^^^^^^^^^^ - - -.. warning:: `weights_save_path` has been deprecated in v1.6 and will be removed in v1.8. Please pass - ``dirpath`` directly to the :class:`~pytorch_lightning.callbacks.model_checkpoint.ModelCheckpoint` - callback. - - -.. raw:: html - - - -| - -Directory of where to save weights if specified. - -.. testcode:: - - # default used by the Trainer - trainer = Trainer(weights_save_path=os.getcwd()) - - # save to your custom path - trainer = Trainer(weights_save_path="my/path") - -Example:: - - # if checkpoint callback used, then overrides the weights path - # **NOTE: this saves weights to some/path NOT my/path - checkpoint = ModelCheckpoint(dirpath='some/path') - trainer = Trainer( - callbacks=[checkpoint], - weights_save_path='my/path' - ) - -weights_summary -^^^^^^^^^^^^^^^ - -.. warning:: `weights_summary` is deprecated in v1.5 and will be removed in v1.7. Please pass :class:`~pytorch_lightning.callbacks.model_summary.ModelSummary` - directly to the Trainer's ``callbacks`` argument instead. To disable the model summary, - pass ``enable_model_summary = False`` to the Trainer. - - -.. raw:: html - - - -| - -Prints a summary of the weights when training begins. -Options: 'full', 'top', None. - -.. 
testcode:: - - # default used by the Trainer (ie: print summary of top level modules) - trainer = Trainer(weights_summary="top") - - # print full summary of all modules and submodules - trainer = Trainer(weights_summary="full") - - # don't print a summary - trainer = Trainer(weights_summary=None) - - -enable_model_summary -^^^^^^^^^^^^^^^^^^^^ - -Whether to enable or disable the model summarization. Defaults to True. - -.. testcode:: - - # default used by the Trainer - trainer = Trainer(enable_model_summary=True) - - # disable summarization - trainer = Trainer(enable_model_summary=False) - - # enable custom summarization - from pytorch_lightning.callbacks import ModelSummary - - trainer = Trainer(enable_model_summary=True, callbacks=[ModelSummary(max_depth=-1)]) - ------ - -Trainer class API ------------------ - -Methods -^^^^^^^ - -init -**** - -.. automethod:: pytorch_lightning.trainer.Trainer.__init__ - :noindex: - -fit -**** - -.. automethod:: pytorch_lightning.trainer.Trainer.fit - :noindex: - -validate -******** - -.. automethod:: pytorch_lightning.trainer.Trainer.validate - :noindex: - -test -**** - -.. automethod:: pytorch_lightning.trainer.Trainer.test - :noindex: - -predict -******* - -.. automethod:: pytorch_lightning.trainer.Trainer.predict - :noindex: - -tune -**** - -.. automethod:: pytorch_lightning.trainer.Trainer.tune - :noindex: - - -Properties -^^^^^^^^^^ - -callback_metrics -**************** - -The metrics available to callbacks. These are automatically set when you log via `self.log` - -.. code-block:: python - - def training_step(self, batch, batch_idx): - self.log("a_val", 2) - - - callback_metrics = trainer.callback_metrics - assert callback_metrics["a_val"] == 2 - -current_epoch -************* - -The number of epochs run. - -.. code-block:: python - - if trainer.current_epoch >= 10: - ... - -global_step -*********** - -The number of optimizer steps taken (does not reset each epoch). 
-This includes multiple optimizers and TBPTT steps (if enabled). - -.. code-block:: python - - if trainer.global_step >= 100: - ... - -logger -******* - -The current logger being used. Here's an example using tensorboard - -.. code-block:: python - - logger = trainer.logger - tensorboard = logger.experiment - - -loggers -******** - -The list of loggers currently being used by the Trainer. - -.. code-block:: python - - # List of Logger objects - loggers = trainer.loggers - for logger in loggers: - logger.log_metrics({"foo": 1.0}) - - -logged_metrics -************** - -The metrics sent to the logger (visualizer). - -.. code-block:: python - - def training_step(self, batch, batch_idx): - self.log("a_val", 2, logger=True) - - - logged_metrics = trainer.logged_metrics - assert logged_metrics["a_val"] == 2 - -log_dir -******* -The directory for the current experiment. Use this to save images to, etc... - -.. code-block:: python - - def training_step(self, batch, batch_idx): - img = ... - save_img(img, self.trainer.log_dir) - - - -is_global_zero -************** - -Whether this process is the global zero in multi-node training - -.. code-block:: python - - def training_step(self, batch, batch_idx): - if self.trainer.is_global_zero: - print("in node 0, accelerator 0") - -progress_bar_metrics -******************** - -The metrics sent to the progress bar. - -.. code-block:: python - - def training_step(self, batch, batch_idx): - self.log("a_val", 2, prog_bar=True) - - - progress_bar_metrics = trainer.progress_bar_metrics - assert progress_bar_metrics["a_val"] == 2 - - -estimated_stepping_batches -************************** - -Check out :meth:`~pytorch_lightning.trainer.trainer.Trainer.estimated_stepping_batches`. - -state -***** - -The current state of the Trainer, including the current function that is running, the stage of -execution within that function, and the status of the Trainer. - -.. 
code-block:: python - - # fn in ("fit", "validate", "test", "predict", "tune") - trainer.state.fn - # status in ("initializing", "running", "finished", "interrupted") - trainer.state.status - # stage in ("train", "sanity_check", "validate", "test", "predict", "tune") - trainer.state.stage diff --git a/source/conf.py b/source/conf.py deleted file mode 100644 index 2a5cdad..0000000 --- a/source/conf.py +++ /dev/null @@ -1,408 +0,0 @@ -# -# Configuration file for the Sphinx documentation builder. -# -# This file does only contain a selection of the most common options. For a -# full list see the documentation: -# http://www.sphinx-doc.org/en/master/config - -# -- Path setup -------------------------------------------------------------- - -# If extensions (or modules to document with autodoc) are in another directory, -# add these directories to sys.path here. If the directory is relative to the -# documentation root, use os.path.abspath to make it absolute, like shown here. - -# import m2r -import glob -import os -import shutil -import sys -import warnings -from importlib.util import module_from_spec, spec_from_file_location - -import pt_lightning_sphinx_theme - -# ----------------------- -# VARIABLES WHEN WORKING ON DOCS... 
MAKE THIS TRUE TO BUILD FASTER -# ----------------------- -_PL_FAST_DOCS_DEV = bool(int(os.getenv("PL_FAST_DOCS_DEV", 1))) - -# ----------------------- -# BUILD stuff -# ----------------------- -PATH_HERE = os.path.abspath(os.path.dirname(__file__)) -PATH_ROOT = os.path.join(PATH_HERE, "..") -PATH_RAW_NB = os.path.join(PATH_ROOT, "_notebooks") -sys.path.insert(0, os.path.abspath(PATH_ROOT)) -sys.path.append(os.path.join(PATH_RAW_NB, ".actions")) - -_SHOULD_COPY_NOTEBOOKS = False - - -try: - from assistant import AssistantCLI -except ImportError: - _SHOULD_COPY_NOTEBOOKS = False - warnings.warn("To build the code, please run: `git submodule update --init --recursive`", stacklevel=2) - -FOLDER_GENERATED = "generated" -SPHINX_MOCK_REQUIREMENTS = int(os.environ.get("SPHINX_MOCK_REQUIREMENTS", True)) - -spec = spec_from_file_location( - "pytorch_lightning/__about__.py", os.path.join(PATH_ROOT, "__about__.py") -) -about = module_from_spec(spec) -spec.loader.exec_module(about) - -# -- Project documents ------------------------------------------------------- -if _SHOULD_COPY_NOTEBOOKS: - AssistantCLI.copy_notebooks( - PATH_RAW_NB, PATH_HERE, "notebooks", patterns=[".", "course_UvA-DL", "lightning_examples"] - ) - - -def _transform_changelog(path_in: str, path_out: str) -> None: - with open(path_in) as fp: - chlog_lines = fp.readlines() - # enrich short subsub-titles to be unique - chlog_ver = "" - for i, ln in enumerate(chlog_lines): - if ln.startswith("## "): - chlog_ver = ln[2:].split("-")[0].strip() - elif ln.startswith("### "): - ln = ln.replace("###", f"### {chlog_ver} -") - chlog_lines[i] = ln - with open(path_out, "w") as fp: - fp.writelines(chlog_lines) - - -os.makedirs(os.path.join(PATH_HERE, FOLDER_GENERATED), exist_ok=True) -# # copy all documents from GH templates like contribution guide -# for md in glob.glob(os.path.join(PATH_ROOT, ".github", "*.md")): -# shutil.copy(md, os.path.join(PATH_HERE, FOLDER_GENERATED, os.path.basename(md))) -# # copy also the 
changelog -# _transform_changelog(os.path.join(PATH_ROOT, "CHANGELOG.md"), os.path.join(PATH_HERE, FOLDER_GENERATED, "CHANGELOG.md")) - -# -- Project information ----------------------------------------------------- - -project = "PyTorch Lightning" -copyright = about.__copyright__ -author = about.__author__ - -# The short X.Y version -version = about.__version__ -# The full version, including alpha/beta/rc tags -release = about.__version__ - -# -- General configuration --------------------------------------------------- - -# If your documentation needs a minimal Sphinx version, state it here. - -needs_sphinx = "4.0" - -# Add any Sphinx extension module names here, as strings. They can be -# extensions coming with Sphinx (named 'sphinx.ext.*') or your custom -# ones. -extensions = [ - "sphinx.ext.autodoc", - # 'sphinxcontrib.mockautodoc', # raises error: directive 'automodule' is already registered ... - # 'sphinxcontrib.fulltoc', # breaks pytorch-theme with unexpected kw argument 'titles_only' - "sphinx.ext.doctest", - "sphinx.ext.intersphinx", - "sphinx.ext.todo", - "sphinx.ext.coverage", - "sphinx.ext.viewcode", - "sphinx.ext.autosummary", - "sphinx.ext.napoleon", - "sphinx.ext.imgmath", - "sphinx.ext.autosectionlabel", - "myst_parser", - "nbsphinx", - "sphinx_autodoc_typehints", - "sphinx_copybutton", - "sphinx_paramlinks", - "sphinx_togglebutton", - "pt_lightning_sphinx_theme.extensions.lightning_tutorials", -] - -# Suppress warnings about duplicate labels (needed for PL tutorials) -suppress_warnings = [ - "autosectionlabel.*", -] - -# Add any paths that contain templates here, relative to this directory. -templates_path = ["_templates"] - -# https://berkeley-stat159-f17.github.io/stat159-f17/lectures/14-sphinx..html#conf.py-(cont.) -# https://stackoverflow.com/questions/38526888/embed-ipython-notebook-in-sphinx-document -# I execute the notebooks manually in advance. If notebooks test the code, -# they should be run at build time. 
-nbsphinx_execute = "never" -nbsphinx_allow_errors = True -nbsphinx_requirejs_path = "" - -# myst-parser, forcing to parse all html pages with mathjax -# https://github.com/executablebooks/MyST-Parser/issues/394 -myst_update_mathjax = False - -# The suffix(es) of source filenames. -# You can specify multiple suffix as a list of string: -# -source_parsers = {".rst": "restructuredtext", ".txt": "markdown", ".md": "markdown", ".ipynb": "nbsphinx"} - -# The master toctree document. -master_doc = "index" - -# The language for content autogenerated by Sphinx. Refer to documentation -# for a list of supported languages. -# -# This is also used if you do content translation via gettext catalogs. -# Usually you set "language" from the command line for these cases. -language = None - -# List of patterns, relative to source directory, that match files and -# directories to ignore when looking for source files. -# This pattern also affects html_static_path and html_extra_path. -exclude_patterns = [ - f"{FOLDER_GENERATED}/PULL_REQUEST_TEMPLATE.md", - "notebooks/sample-template*", -] - -if _PL_FAST_DOCS_DEV: - exclude_patterns.append("notebooks/*") - exclude_patterns.append("tutorials.rst") - - -# The name of the Pygments (syntax highlighting) style to use. -pygments_style = None - -# -- Options for HTML output ------------------------------------------------- - -# The theme to use for HTML and HTML Help pages. See the documentation for -# a list of builtin themes. -# http://www.sphinx-doc.org/en/master/usage/theming.html#builtin-themes -# html_theme = 'bizstyle' -# https://sphinx-themes.org -html_theme = "pt_lightning_sphinx_theme" -html_theme_path = [pt_lightning_sphinx_theme.get_html_theme_path()] -# html_theme_path = ["/Users/williamfalcon/Developer/opensource/lightning_sphinx_theme"] - -# Theme options are theme-specific and customize the look and feel of a theme -# further. For a list of options available for each theme, see the -# documentation. 
- -html_theme_options = { - "pytorch_project": "https://pytorchlightning.ai", - "canonical_url": about.__docs_url__, - "collapse_navigation": False, - "display_version": True, - "logo_only": False, -} - -html_logo = "_static/images/logo.svg" - -html_favicon = "_static/images/icon.svg" - -# Add any paths that contain custom static files (such as style sheets) here, -# relative to this directory. They are copied after the builtin static files, -# so a file named "default.css" will overwrite the builtin "default.css". -html_static_path = ["_templates", "_static"] - -# Custom sidebar templates, must be a dictionary that maps document names -# to template names. -# -# The default sidebars (for documents that don't match any pattern) are -# defined by theme itself. Builtin themes are using these templates by -# default: ``['localtoc.html', 'relations.html', 'sourcelink.html', -# 'searchbox.html']``. -# -# html_sidebars = {} - -# -- Options for HTMLHelp output --------------------------------------------- - -# Output file base name for HTML help builder. -htmlhelp_basename = project + "-doc" - -# -- Options for LaTeX output ------------------------------------------------ - -latex_elements = { - # The paper size ('letterpaper' or 'a4paper'). - # 'papersize': 'letterpaper', - # The font size ('10pt', '11pt' or '12pt'). - # 'pointsize': '10pt', - # Additional stuff for the LaTeX preamble. - # 'preamble': '', - # Latex figure (float) alignment - "figure_align": "htbp" -} - -# Grouping the document tree into LaTeX files. List of tuples -# (source start file, target name, title, -# author, documentclass [howto, manual, or own class]). -latex_documents = [(master_doc, project + ".tex", project + " Documentation", author, "manual")] - -# -- Options for manual page output ------------------------------------------ - -# One entry per manual page. List of tuples -# (source start file, name, description, authors, manual section). 
-man_pages = [(master_doc, project, project + " Documentation", [author], 1)] - -# -- Options for Texinfo output ---------------------------------------------- - -# Grouping the document tree into Texinfo files. List of tuples -# (source start file, target name, title, author, -# dir menu entry, description, category) -texinfo_documents = [ - ( - master_doc, - project, - project + " Documentation", - author, - project, - "One line description of project.", - "Miscellaneous", - ) -] - -# -- Options for Epub output ------------------------------------------------- - -# Bibliographic Dublin Core info. -epub_title = project - -# The unique identifier of the text. This can be a ISBN number -# or the project homepage. -# -# epub_identifier = '' - -# A unique identification for the text. -# -# epub_uid = '' - -# A list of files that should not be packed into the epub file. -epub_exclude_files = ["search.html"] - -# -- Extension configuration ------------------------------------------------- - -# -- Options for intersphinx extension --------------------------------------- - -# intersphinx_mapping = { -# "python": ("https://docs.python.org/3", None), -# "torch": ("https://pytorch.org/docs/stable/", None), -# "numpy": ("https://numpy.org/doc/stable/", None), -# "PIL": ("https://pillow.readthedocs.io/en/stable/", None), -# "torchmetrics": ("https://torchmetrics.readthedocs.io/en/stable/", None), -# "fairscale": ("https://fairscale.readthedocs.io/en/latest/", None), -# "graphcore": ("https://docs.graphcore.ai/en/latest/", None), -# } - -# -- Options for todo extension ---------------------------------------------- - -# If true, `todo` and `todoList` produce output, else they produce nothing. 
-todo_include_todos = True - - -def setup(app): - # this is for hiding doctest decoration, - # see: http://z4r.github.io/python/2011/12/02/hides-the-prompts-and-output/ - app.add_js_file("copybutton.js") - app.add_css_file("main.css") - - -# copy all notebooks to local folder -# path_nbs = os.path.join(PATH_HERE, 'notebooks') -# if not os.path.isdir(path_nbs): -# os.mkdir(path_nbs) -# for path_ipynb in glob.glob(os.path.join(PATH_ROOT, 'notebooks', '*.ipynb')): -# path_ipynb2 = os.path.join(path_nbs, os.path.basename(path_ipynb)) -# shutil.copy(path_ipynb, path_ipynb2) - - -# Ignoring Third-party packages -# https://stackoverflow.com/questions/15889621/sphinx-how-to-exclude-imports-in-automodule -def package_list_from_file(file): - """List up package name (not containing version and extras) from a package list file.""" - mocked_packages = [] - with open(file) as fp: - for ln in fp.readlines(): - # Example: `tqdm>=4.41.0` => `tqdm` - # `[` is for package with extras - found = [ln.index(ch) for ch in list(",=<>#[") if ch in ln] - pkg = ln[: min(found)] if found else ln - if pkg.rstrip(): - mocked_packages.append(pkg.rstrip()) - return mocked_packages - - -# define mapping from PyPI names to python imports -PACKAGE_MAPPING = { - "Pillow": "PIL", - "opencv-python": "cv2", - "PyYAML": "yaml", - "comet-ml": "comet_ml", - "neptune-client": "neptune", - "hydra-core": "hydra", - "pyDeprecate": "deprecate", -} -MOCK_PACKAGES = [] -if SPHINX_MOCK_REQUIREMENTS: - MOCK_PACKAGES += ["fairscale"] - # mock also base packages when we are on RTD since we don't install them there - MOCK_PACKAGES += package_list_from_file(os.path.join(PATH_ROOT, "requirements.txt")) - # MOCK_PACKAGES += package_list_from_file(os.path.join(PATH_ROOT, "requirements", "extra.txt")) - # MOCK_PACKAGES += package_list_from_file(os.path.join(PATH_ROOT, "requirements", "loggers.txt")) -MOCK_PACKAGES = [PACKAGE_MAPPING.get(pkg, pkg) for pkg in MOCK_PACKAGES] - -autodoc_mock_imports = MOCK_PACKAGES - 
-autosummary_generate = True - -autodoc_member_order = "groupwise" - -autoclass_content = "both" - -autodoc_default_options = { - "members": True, - "methods": True, - "special-members": "__call__", - "exclude-members": "_abc_impl", - "show-inheritance": True, -} - -# Sphinx will add “permalinks” for each heading and description environment as paragraph signs that -# become visible when the mouse hovers over them. -# This value determines the text for the permalink; it defaults to "¶". Set it to None or the empty -# string to disable permalinks. -# https://www.sphinx-doc.org/en/master/usage/configuration.html#confval-html_add_permalinks -html_permalinks = True -html_permalinks_icon = "¶" - -# True to prefix each section label with the name of the document it is in, followed by a colon. -# For example, index:Introduction for a section called Introduction that appears in document index.rst. -# Useful for avoiding ambiguity when the same section heading appears in different documents. -# http://www.sphinx-doc.org/en/master/usage/extensions/autosectionlabel.html -autosectionlabel_prefix_document = True - -# only run doctests marked with a ".. 
doctest::" directive -doctest_test_doctest_blocks = "" -doctest_global_setup = """ -import importlib -import os -import sys -from typing import Optional - -import torch -import pytorch_lightning as pl -from torch import nn -from torch.utils.data import IterableDataset, DataLoader, Dataset -from pytorch_lightning import LightningDataModule, LightningModule, Trainer, seed_everything -from pytorch_lightning.callbacks import Callback -from pytorch_lightning.utilities import ( - _APEX_AVAILABLE, - _XLA_AVAILABLE, - _TPU_AVAILABLE, - _TORCHVISION_AVAILABLE, - _TORCH_GREATER_EQUAL_1_10, - _module_available, -) -_JSONARGPARSE_AVAILABLE = _module_available("jsonargparse") -""" -coverage_skip_undoc_in_source = True diff --git a/source/data/datamodule.rst b/source/data/datamodule.rst deleted file mode 100644 index bce1877..0000000 --- a/source/data/datamodule.rst +++ /dev/null @@ -1,501 +0,0 @@ -.. _datamodules: - -################### -LightningDataModule -################### -A datamodule is a shareable, reusable class that encapsulates all the steps needed to process data: - -.. raw:: html - - - -| - -A datamodule encapsulates the five steps involved in data processing in PyTorch: - -1. Download / tokenize / process. -2. Clean and (maybe) save to disk. -3. Load inside :class:`~torch.utils.data.Dataset`. -4. Apply transforms (rotate, tokenize, etc...). -5. Wrap inside a :class:`~torch.utils.data.DataLoader`. - -| - -This class can then be shared and used anywhere: - -.. code-block:: python - - from pl_bolts.datamodules import CIFAR10DataModule, ImagenetDataModule - - model = LitClassifier() - trainer = Trainer() - - imagenet = ImagenetDataModule() - trainer.fit(model, datamodule=imagenet) - - cifar10 = CIFAR10DataModule() - trainer.fit(model, datamodule=cifar10) - ---------------- - -*************************** -Why do I need a DataModule? -*************************** -In normal PyTorch code, the data cleaning/preparation is usually scattered across many files. 
This makes -sharing and reusing the exact splits and transforms across projects impossible. - -Datamodules are for you if you ever asked the questions: - -- what splits did you use? -- what transforms did you use? -- what normalization did you use? -- how did you prepare/tokenize the data? - --------------- - -********************* -What is a DataModule? -********************* -A DataModule is simply a collection of a train_dataloader(s), val_dataloader(s), test_dataloader(s) and -predict_dataloader(s) along with the matching transforms and data processing/downloads steps required. - -Here's a simple PyTorch example: - -.. code-block:: python - - # regular PyTorch - test_data = MNIST(my_path, train=False, download=True) - predict_data = MNIST(my_path, train=False, download=True) - train_data = MNIST(my_path, train=True, download=True) - train_data, val_data = random_split(train_data, [55000, 5000]) - - train_loader = DataLoader(train_data, batch_size=32) - val_loader = DataLoader(val_data, batch_size=32) - test_loader = DataLoader(test_data, batch_size=32) - predict_loader = DataLoader(predict_data, batch_size=32) - -The equivalent DataModule just organizes the same exact code, but makes it reusable across projects. - -.. 
code-block:: python - - class MNISTDataModule(pl.LightningDataModule): - def __init__(self, data_dir: str = "path/to/dir", batch_size: int = 32): - super().__init__() - self.data_dir = data_dir - self.batch_size = batch_size - - def setup(self, stage: Optional[str] = None): - self.mnist_test = MNIST(self.data_dir, train=False) - self.mnist_predict = MNIST(self.data_dir, train=False) - mnist_full = MNIST(self.data_dir, train=True) - self.mnist_train, self.mnist_val = random_split(mnist_full, [55000, 5000]) - - def train_dataloader(self): - return DataLoader(self.mnist_train, batch_size=self.batch_size) - - def val_dataloader(self): - return DataLoader(self.mnist_val, batch_size=self.batch_size) - - def test_dataloader(self): - return DataLoader(self.mnist_test, batch_size=self.batch_size) - - def predict_dataloader(self): - return DataLoader(self.mnist_predict, batch_size=self.batch_size) - - def teardown(self, stage: Optional[str] = None): - # Used to clean-up when the run is finished - ... - -But now, as the complexity of your processing grows (transforms, multiple-GPU training), you can -let Lightning handle those details for you while making this dataset reusable so you can share with -colleagues or use in different projects. - -.. code-block:: python - - mnist = MNISTDataModule(my_path) - model = LitClassifier() - - trainer = Trainer() - trainer.fit(model, mnist) - -Here's a more realistic, complex DataModule that shows how much more reusable the datamodule is. - -.. 
code-block:: python - - import pytorch_lightning as pl - from torch.utils.data import random_split, DataLoader - - # Note - you must have torchvision installed for this example - from torchvision.datasets import MNIST - from torchvision import transforms - - - class MNISTDataModule(pl.LightningDataModule): - def __init__(self, data_dir: str = "./"): - super().__init__() - self.data_dir = data_dir - self.transform = transforms.Compose([transforms.ToTensor(), transforms.Normalize((0.1307,), (0.3081,))]) - - def prepare_data(self): - # download - MNIST(self.data_dir, train=True, download=True) - MNIST(self.data_dir, train=False, download=True) - - def setup(self, stage: Optional[str] = None): - - # Assign train/val datasets for use in dataloaders - if stage == "fit" or stage is None: - mnist_full = MNIST(self.data_dir, train=True, transform=self.transform) - self.mnist_train, self.mnist_val = random_split(mnist_full, [55000, 5000]) - - # Assign test dataset for use in dataloader(s) - if stage == "test" or stage is None: - self.mnist_test = MNIST(self.data_dir, train=False, transform=self.transform) - - if stage == "predict" or stage is None: - self.mnist_predict = MNIST(self.data_dir, train=False, transform=self.transform) - - def train_dataloader(self): - return DataLoader(self.mnist_train, batch_size=32) - - def val_dataloader(self): - return DataLoader(self.mnist_val, batch_size=32) - - def test_dataloader(self): - return DataLoader(self.mnist_test, batch_size=32) - - def predict_dataloader(self): - return DataLoader(self.mnist_predict, batch_size=32) - ---------------- - -*********************** -LightningDataModule API -*********************** -To define a DataModule the following methods are used to create train/val/test/predict dataloaders: - -- :ref:`prepare_data` (how to download, tokenize, etc...) -- :ref:`setup` (how to split, define dataset, etc...) 
-- :ref:`train_dataloader` -- :ref:`val_dataloader` -- :ref:`test_dataloader` -- :ref:`predict_dataloader` - - -prepare_data -============ -Downloading and saving data with multiple processes (distributed settings) will result in corrupted data. Lightning -ensures the :meth:`~pytorch_lightning.core.hooks.DataHooks.prepare_data` is called only within a single process on CPU, -so you can safely add your downloading logic within. In case of multi-node training, the execution of this hook -depends upon :ref:`prepare_data_per_node`. :meth:`~pytorch_lightning.core.hooks.DataHooks.setup` is called after -``prepare_data`` and there is a barrier in between which ensures that all the processes proceed to ``setup`` once the data is prepared and available for use. - -- download, i.e. download data only once on the disk from a single process -- tokenize. Since it's a one time process, it is not recommended to do it on all processes -- etc... - -.. code-block:: python - - class MNISTDataModule(pl.LightningDataModule): - def prepare_data(self): - # download - MNIST(os.getcwd(), train=True, download=True, transform=transforms.ToTensor()) - MNIST(os.getcwd(), train=False, download=True, transform=transforms.ToTensor()) - - -.. warning:: - - ``prepare_data`` is called from the main process. It is not recommended to assign state here (e.g. ``self.x = y``) since it is called on a single process and if you assign - states here then they won't be available for other processes. - - -setup -===== -There are also data operations you might want to perform on every GPU. Use :meth:`~pytorch_lightning.core.hooks.DataHooks.setup` to do things like: - -- count number of classes -- build vocabulary -- perform train/val/test splits -- create datasets -- apply transforms (defined explicitly in your datamodule) -- etc... - -.. 
code-block:: python - - import pytorch_lightning as pl - - - class MNISTDataModule(pl.LightningDataModule): - def setup(self, stage: Optional[str] = None): - - # Assign Train/val split(s) for use in Dataloaders - if stage in (None, "fit"): - mnist_full = MNIST(self.data_dir, train=True, download=True, transform=self.transform) - self.mnist_train, self.mnist_val = random_split(mnist_full, [55000, 5000]) - - # Assign Test split(s) for use in Dataloaders - if stage in (None, "test"): - self.mnist_test = MNIST(self.data_dir, train=False, download=True, transform=self.transform) - - -For example, if you are working on an NLP task where you need to tokenize the text and use it, you can do something like the following: - -.. code-block:: python - - class LitDataModule(LightningDataModule): - def prepare_data(self): - dataset = load_Dataset(...) - train_dataset = ... - val_dataset = ... - # tokenize - # save it to disk - - def setup(self, stage): - # load it back here - dataset = load_dataset_from_disk(...) - - -This method expects a ``stage`` argument. -It is used to separate setup logic for ``trainer.{fit,validate,test,predict}``. If ``setup`` is called with ``stage=None``, -we assume all stages have been set-up. - -.. note:: :ref:`setup` is called from every process across all the nodes. Setting state here is recommended. -.. note:: :ref:`teardown` can be used to clean up the state. It is also called from every process across all the nodes. - - -train_dataloader -================ -Use the :meth:`~pytorch_lightning.core.hooks.DataHooks.train_dataloader` method to generate the training dataloader(s). -Usually you just wrap the dataset you defined in :ref:`setup`. This is the dataloader that the Trainer -:meth:`~pytorch_lightning.trainer.trainer.Trainer.fit` method uses. - -.. code-block:: python - - import pytorch_lightning as pl - - - class MNISTDataModule(pl.LightningDataModule): - def train_dataloader(self): - return DataLoader(self.mnist_train, batch_size=64) - -.. 
_datamodule_val_dataloader_label: - -val_dataloader -============== -Use the :meth:`~pytorch_lightning.core.hooks.DataHooks.val_dataloader` method to generate the validation dataloader(s). -Usually you just wrap the dataset you defined in :ref:`setup`. This is the dataloader that the Trainer -:meth:`~pytorch_lightning.trainer.trainer.Trainer.fit` and :meth:`~pytorch_lightning.trainer.trainer.Trainer.validate` methods use. - -.. code-block:: python - - import pytorch_lightning as pl - - - class MNISTDataModule(pl.LightningDataModule): - def val_dataloader(self): - return DataLoader(self.mnist_val, batch_size=64) - - -.. _datamodule_test_dataloader_label: - -test_dataloader -=============== -Use the :meth:`~pytorch_lightning.core.hooks.DataHooks.test_dataloader` method to generate the test dataloader(s). -Usually you just wrap the dataset you defined in :ref:`setup`. This is the dataloader that the Trainer -:meth:`~pytorch_lightning.trainer.trainer.Trainer.test` method uses. - -.. code-block:: python - - import pytorch_lightning as pl - - - class MNISTDataModule(pl.LightningDataModule): - def test_dataloader(self): - return DataLoader(self.mnist_test, batch_size=64) - - -predict_dataloader -================== -Use the :meth:`~pytorch_lightning.core.hooks.DataHooks.predict_dataloader` method to generate the prediction dataloader(s). -Usually you just wrap the dataset you defined in :ref:`setup`. This is the dataloader that the Trainer -:meth:`~pytorch_lightning.trainer.trainer.Trainer.predict` method uses. - -.. code-block:: python - - import pytorch_lightning as pl - - - class MNISTDataModule(pl.LightningDataModule): - def predict_dataloader(self): - return DataLoader(self.mnist_predict, batch_size=64) - - -transfer_batch_to_device -======================== - -.. automethod:: pytorch_lightning.core.datamodule.LightningDataModule.transfer_batch_to_device - :noindex: - -on_before_batch_transfer -======================== - -.. 
automethod:: pytorch_lightning.core.datamodule.LightningDataModule.on_before_batch_transfer - :noindex: - -on_after_batch_transfer -======================= - -.. automethod:: pytorch_lightning.core.datamodule.LightningDataModule.on_after_batch_transfer - :noindex: - -load_state_dict -=============== - -.. automethod:: pytorch_lightning.core.datamodule.LightningDataModule.load_state_dict - :noindex: - -state_dict -========== - -.. automethod:: pytorch_lightning.core.datamodule.LightningDataModule.state_dict - :noindex: - -on_train_dataloader -=================== - -.. automethod:: pytorch_lightning.core.datamodule.LightningDataModule.on_train_dataloader - :noindex: - -on_val_dataloader -================= - -.. automethod:: pytorch_lightning.core.datamodule.LightningDataModule.on_val_dataloader - :noindex: - -on_test_dataloader -================== - -.. automethod:: pytorch_lightning.core.datamodule.LightningDataModule.on_test_dataloader - :noindex: - -on_predict_dataloader -===================== - -.. automethod:: pytorch_lightning.core.datamodule.LightningDataModule.on_predict_dataloader - :noindex: - -teardown -======== - -.. automethod:: pytorch_lightning.core.datamodule.LightningDataModule.teardown - :noindex: - -prepare_data_per_node -===================== -If set to ``True`` will call ``prepare_data()`` on LOCAL_RANK=0 for every node. -If set to ``False`` will only call from NODE_RANK=0, LOCAL_RANK=0. - -.. testcode:: - - class LitDataModule(LightningDataModule): - def __init__(self): - super().__init__() - self.prepare_data_per_node = True - - ------------------- - -****************** -Using a DataModule -****************** - -The recommended way to use a DataModule is simply: - -.. 
code-block:: python - - dm = MNISTDataModule() - model = Model() - trainer.fit(model, datamodule=dm) - trainer.test(datamodule=dm) - trainer.validate(datamodule=dm) - trainer.predict(datamodule=dm) - -If you need information from the dataset to build your model, then run -:ref:`prepare_data` and -:ref:`setup` manually (Lightning ensures -the method runs on the correct devices). - -.. code-block:: python - - dm = MNISTDataModule() - dm.prepare_data() - dm.setup(stage="fit") - - model = Model(num_classes=dm.num_classes, width=dm.width, vocab=dm.vocab) - trainer.fit(model, dm) - - dm.setup(stage="test") - trainer.test(datamodule=dm) - ----------------- - -***************************** -DataModules without Lightning -***************************** -You can of course use DataModules in plain PyTorch code as well. - -.. code-block:: python - - # download, etc... - dm = MNISTDataModule() - dm.prepare_data() - - # splits/transforms - dm.setup(stage="fit") - - # use data - for batch in dm.train_dataloader(): - ... - - for batch in dm.val_dataloader(): - ... - - dm.teardown(stage="fit") - - # lazy load test data - dm.setup(stage="test") - for batch in dm.test_dataloader(): - ... - - dm.teardown(stage="test") - -But overall, DataModules encourage reproducibility by allowing all details of a dataset to be specified in a unified -structure. - ----------------- - -****************************** -Hyperparameters in DataModules -****************************** -Like LightningModules, DataModules support hyperparameters with the same API. - -.. code-block:: python - - import pytorch_lightning as pl - - - class CustomDataModule(pl.LightningDataModule): - def __init__(self, *args, **kwargs): - super().__init__() - self.save_hyperparameters() - - def configure_optimizers(self): - # access the saved hyperparameters - opt = optim.Adam(self.parameters(), lr=self.hparams.lr) - -Refer to ``save_hyperparameters`` in :doc:`lightning module <../common/lightning_module>` for more details. 
- - ----- - -.. include:: ../extensions/datamodules_state.rst diff --git a/source/debug/debugging_intermediate.rst b/source/debug/debugging_intermediate.rst deleted file mode 100644 index da8eb59..0000000 --- a/source/debug/debugging_intermediate.rst +++ /dev/null @@ -1,79 +0,0 @@ -:orphan: - -.. _debugging_intermediate: - - -############################### -Debug your model (intermediate) -############################### -**Audience**: Users who want to debug their ML code - ----- - -*************************** -Why should I debug ML code? -*************************** -Machine learning code requires debugging mathematical correctness, which is not something non-ML code has to deal with. Lightning implements a few best-practice techniques to give all users, expert level ML debugging abilities. - ----- - -************************************** -Overfit your model on a Subset of Data -************************************** -A good debugging technique is to take a tiny portion of your data (say 2 samples per class), -and try to get your model to overfit. If it can't, it's a sign it won't work with large datasets. - -(See: :paramref:`~pytorch_lightning.trainer.trainer.Trainer.overfit_batches` -argument of :class:`~pytorch_lightning.trainer.trainer.Trainer`) - -.. testcode:: - - # use only 1% of training data (and turn off validation) - trainer = Trainer(overfit_batches=0.01) - - # similar, but with a fixed 10 batches - trainer = Trainer(overfit_batches=10) - -When using this argument, the validation loop will be disabled. We will also replace the sampler -in the training set to turn off shuffle for you. - ----- - -******************************** -Look-out for exploding gradients -******************************** -One major problem that plagues models is exploding gradients. Gradient norm is one technique that can help keep gradients from exploding. - -.. 
testcode:: - - # the 2-norm - trainer = Trainer(track_grad_norm=2) - -This will plot the 2-norm to your experiment manager. If you notice the norm is going up, there's a good chance your gradients are exploding or will explode. - -One technique to stop exploding gradients is to clip the gradient: - -.. testcode:: - - # DEFAULT (ie: don't clip) - trainer = Trainer(gradient_clip_val=0) - - # clip gradients' global norm to <=0.5 using gradient_clip_algorithm='norm' by default - trainer = Trainer(gradient_clip_val=0.5) - - # clip gradients' maximum magnitude to <=0.5 - trainer = Trainer(gradient_clip_val=0.5, gradient_clip_algorithm="value") - ----- - -************************* -Detect autograd anomalies -************************* -Lightning helps you detect anomalies in the PyTorch autograd engine via PyTorch's built-in -`Anomaly Detection Context-manager `_. - -Enable it via the **detect_anomaly** trainer argument: - -.. testcode:: - - trainer = Trainer(detect_anomaly=True) diff --git a/source/deploy/production_advanced.rst b/source/deploy/production_advanced.rst deleted file mode 100644 index 750355d..0000000 --- a/source/deploy/production_advanced.rst +++ /dev/null @@ -1,60 +0,0 @@ -######################################## -Deploy models into production (advanced) -######################################## -**Audience**: Machine learning engineers optimizing models for enterprise-scale production environments. - ----- - -************************** -Compile your model to ONNX -************************** -`ONNX `_ is a package developed by Microsoft to optimize inference. ONNX allows the model to be independent of PyTorch and run on any ONNX Runtime. - -To export your model to ONNX format call the :meth:`~pytorch_lightning.core.lightning.LightningModule.to_onnx` function on your :class:`~pytorch_lightning.core.lightning.LightningModule` with the ``filepath`` and ``input_sample``. - -.. 
code-block:: python - - class SimpleModel(LightningModule): - def __init__(self): - super().__init__() - self.l1 = torch.nn.Linear(in_features=64, out_features=4) - - def forward(self, x): - return torch.relu(self.l1(x.view(x.size(0), -1))) - - - # create the model - model = SimpleModel() - filepath = "model.onnx" - input_sample = torch.randn((1, 64)) - model.to_onnx(filepath, input_sample, export_params=True) - -You can also skip passing the input sample if the ``example_input_array`` property is specified in your :class:`~pytorch_lightning.core.lightning.LightningModule`. - -.. code-block:: python - - class SimpleModel(LightningModule): - def __init__(self): - super().__init__() - self.l1 = torch.nn.Linear(in_features=64, out_features=4) - self.example_input_array = torch.randn(7, 64) - - def forward(self, x): - return torch.relu(self.l1(x.view(x.size(0), -1))) - - - # create the model - model = SimpleModel() - filepath = "model.onnx" - model.to_onnx(filepath, export_params=True) - -Once you have the exported model, you can run it on your ONNX runtime in the following way: - -.. code-block:: python - - import onnxruntime - - ort_session = onnxruntime.InferenceSession(filepath) - input_name = ort_session.get_inputs()[0].name - ort_inputs = {input_name: np.random.randn(1, 64)} - ort_outs = ort_session.run(None, ort_inputs) diff --git a/source/deploy/production_basic.rst b/source/deploy/production_basic.rst deleted file mode 100644 index 00e9caa..0000000 --- a/source/deploy/production_basic.rst +++ /dev/null @@ -1,80 +0,0 @@ -##################################### -Deploy models into production (basic) -##################################### -**Audience**: All users. - ----- - -***************************** -Load a checkpoint and predict -***************************** -The easiest way to use a model for predictions is to load the weights using **load_from_checkpoint** found in the LightningModule. - -.. 
code-block:: python - - model = LitModel.load_from_checkpoint("best_model.ckpt") - model.eval() - x = torch.randn(1, 64) - - with torch.no_grad(): - y_hat = model(x) - ----- - -************************************** -Predict step with your LightningModule -************************************** -Loading a checkpoint and predicting still leaves you with a lot of boilerplate around the predict epoch. The **predict step** in the LightningModule removes this boilerplate. - -.. code-block:: python - - class MyModel(LightningModule): - def predict_step(self, batch, batch_idx, dataloader_idx=0): - return self(batch) - -And pass in any dataloader to the Lightning Trainer: - -.. code-block:: python - - data_loader = DataLoader(...) - model = MyModel() - trainer = Trainer() - predictions = trainer.predict(model, data_loader) - ----- - -******************************** -Enable complicated predict logic -******************************** -When you need to add complicated pre-processing or post-processing logic to your data use the predict step. For example here we do `Monte Carlo Dropout `_ for predictions: - -.. code-block:: python - - class LitMCdropoutModel(pl.LightningModule): - def __init__(self, model, mc_iteration): - super().__init__() - self.model = model - self.dropout = nn.Dropout() - self.mc_iteration = mc_iteration - - def predict_step(self, batch, batch_idx): - # enable Monte Carlo Dropout - self.dropout.train() - - # take average of `self.mc_iteration` iterations - pred = [self.dropout(self.model(x)).unsqueeze(0) for _ in range(self.mc_iteration)] - pred = torch.vstack(pred).mean(dim=0) - return pred - ----- - -**************************** -Enable distributed inference -**************************** -By using the predict step in Lightning you get free distributed inference - - -.. 
code-block:: python - - trainer = Trainer(devices=8, accelerator="gpu") - predictions = trainer.predict(model, data_loader) diff --git a/source/ecosystem/transformers.rst b/source/ecosystem/transformers.rst deleted file mode 100644 index b20402a..0000000 --- a/source/ecosystem/transformers.rst +++ /dev/null @@ -1,47 +0,0 @@ -:orphan: - -Lightning Transformers -====================== - -`Lightning Transformers `_ offers a flexible interface for training and fine-tuning SOTA Transformer models -using the :doc:`PyTorch Lightning Trainer <../common/trainer>`. - -.. code-block:: bash - - pip install lightning-transformers - -In Lightning Transformers, we offer the following benefits: - -- Powered by `PyTorch Lightning `_ - Accelerators, custom Callbacks, Loggers, and high performance scaling with minimal changes. -- Backed by `HuggingFace Transformers `_ models and datasets, spanning multiple modalities and tasks within NLP/Audio and Vision. -- Task Abstraction for Rapid Research & Experimentation - Build your own custom transformer tasks across all modalities with little friction. -- Powerful config composition backed by `Hydra `_ - simply swap out models, optimizers, schedulers task, and many more configurations without touching the code. -- Seamless Memory and Speed Optimizations - Out-of-the-box training optimizations such as `DeepSpeed ZeRO `_ or `FairScale Sharded Training `_ with no code changes. - ------------------ - -Using Lightning-Transformers ----------------------------- - -Lightning Transformers has a collection of tasks for common NLP problems such as `language_modeling `_, -`translation `_ and more. To use, simply: - -1. Pick a task to train (passed to ``train.py`` as ``task=``) - -2. Pick a dataset (passed to ``train.py`` as ``dataset=``) - -3. Customize the backbone, optimizer, or any component within the config - -4. Add any :doc:`Lightning supported parameters and optimizations <../common/trainer>` - -.. 
code-block:: bash - - python train.py \ - task= \ - dataset= - backbone.pretrained_model_name_or_path= # Optionally change the HF backbone - optimizer= # Optionally specify optimizer (Default AdamW) - trainer. # Optionally specify Lightning trainer arguments - - -To learn more about Lightning Transformers, please refer to the `Lightning Transformers documentation `_. diff --git a/source/extensions/callbacks.rst b/source/extensions/callbacks.rst deleted file mode 100644 index 6def5ee..0000000 --- a/source/extensions/callbacks.rst +++ /dev/null @@ -1,408 +0,0 @@ -.. role:: hidden - :class: hidden-section - -.. _callbacks: - -######## -Callback -######## - -.. raw:: html - - - -| - -A callback is a self-contained program that can be reused across projects. - -Lightning has a callback system to execute them when needed. Callbacks should capture NON-ESSENTIAL -logic that is NOT required for your :doc:`lightning module <../common/lightning_module>` to run. - -Here's the flow of how the callback hooks are executed: - -.. raw:: html - - - -An overall Lightning system should have: - -1. Trainer for all engineering -2. LightningModule for all research code. -3. Callbacks for non-essential code. - -| - -Example: - -.. testcode:: - - from pytorch_lightning.callbacks import Callback - - - class MyPrintingCallback(Callback): - def on_train_start(self, trainer, pl_module): - print("Training is starting") - - def on_train_end(self, trainer, pl_module): - print("Training is ending") - - - trainer = Trainer(callbacks=[MyPrintingCallback()]) - -We successfully extended functionality without polluting our super clean -:doc:`lightning module <../common/lightning_module>` research code. - ------------ - -******** -Examples -******** -You can do pretty much anything with callbacks. - -- `Add a MLP to fine-tune self-supervised networks `_. -- `Find how to modify an image input to trick the classification result `_. -- `Interpolate the latent space of any variational model `_. 
-- `Log images to Tensorboard for any model `_. - - --------------- - -****************** -Built-in Callbacks -****************** -Lightning has a few built-in callbacks. - -.. note:: - For a richer collection of callbacks, check out our - `bolts library `_. - -.. currentmodule:: pytorch_lightning.callbacks - -.. autosummary:: - :nosignatures: - :template: classtemplate.rst - - BackboneFinetuning - BaseFinetuning - BasePredictionWriter - Callback - DeviceStatsMonitor - EarlyStopping - GradientAccumulationScheduler - LambdaCallback - LearningRateMonitor - ModelCheckpoint - ModelPruning - ModelSummary - ProgressBarBase - QuantizationAwareTraining - RichModelSummary - RichProgressBar - StochasticWeightAveraging - Timer - TQDMProgressBar - ----------- - -.. include:: callbacks_state.rst - ----------- - -************** -Best Practices -************** -The following are best practices when using/designing callbacks. - -1. Callbacks should be isolated in their functionality. -2. Your callback should not rely on the behavior of other callbacks in order to work properly. -3. Do not manually call methods from the callback. -4. Directly calling methods (eg. `on_validation_end`) is strongly discouraged. -5. Whenever possible, your callbacks should not depend on the order in which they are executed. - ------------ - -.. _callback_hooks: - -************ -Callback API -************ -Here is the full API of methods available in the Callback base class. - -The :class:`~pytorch_lightning.callbacks.Callback` class is the base for all the callbacks in Lightning just like the :class:`~pytorch_lightning.core.lightning.LightningModule` is the base for all models. -It defines a public interface that each callback implementation must follow, the key ones are: - -Properties -========== - -state_key -^^^^^^^^^ - -.. autoattribute:: pytorch_lightning.callbacks.Callback.state_key - :noindex: - - -Hooks -===== - -on_configure_sharded_model -^^^^^^^^^^^^^^^^^^^^^^^^^^ - -.. 
automethod:: pytorch_lightning.callbacks.Callback.on_configure_sharded_model - :noindex: - -setup -^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.setup - :noindex: - -teardown -^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.teardown - :noindex: - -on_init_start -^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_init_start - :noindex: - -on_init_end -^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_init_end - :noindex: - -on_fit_start -^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_fit_start - :noindex: - -on_fit_end -^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_fit_end - :noindex: - -on_sanity_check_start -^^^^^^^^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_sanity_check_start - :noindex: - -on_sanity_check_end -^^^^^^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_sanity_check_end - :noindex: - -on_train_batch_start -^^^^^^^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_train_batch_start - :noindex: - -on_train_batch_end -^^^^^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_train_batch_end - :noindex: - -on_train_epoch_start -^^^^^^^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_train_epoch_start - :noindex: - -on_train_epoch_end -^^^^^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_train_epoch_end - :noindex: - -on_validation_epoch_start -^^^^^^^^^^^^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_validation_epoch_start - :noindex: - -on_validation_epoch_end -^^^^^^^^^^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_validation_epoch_end - :noindex: - -on_test_epoch_start -^^^^^^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_test_epoch_start - :noindex: - -on_test_epoch_end -^^^^^^^^^^^^^^^^^ - -.. 
automethod:: pytorch_lightning.callbacks.Callback.on_test_epoch_end - :noindex: - -on_predict_epoch_start -^^^^^^^^^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_predict_epoch_start - :noindex: - -on_predict_epoch_end -^^^^^^^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_predict_epoch_end - :noindex: - -.. automethod:: pytorch_lightning.callbacks.Callback.on_epoch_end - :noindex: - -on_validation_batch_start -^^^^^^^^^^^^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_validation_batch_start - :noindex: - -on_validation_batch_end -^^^^^^^^^^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_validation_batch_end - :noindex: - -on_test_batch_start -^^^^^^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_test_batch_start - :noindex: - -on_test_batch_end -^^^^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_test_batch_end - :noindex: - -on_predict_batch_start -^^^^^^^^^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_predict_batch_start - :noindex: - -on_predict_batch_end -^^^^^^^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_predict_batch_end - :noindex: - -on_train_start -^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_train_start - :noindex: - -on_train_end -^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_train_end - :noindex: - -on_validation_start -^^^^^^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_validation_start - :noindex: - -on_validation_end -^^^^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_validation_end - :noindex: - -on_test_start -^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_test_start - :noindex: - -on_test_end -^^^^^^^^^^^ - -.. 
automethod:: pytorch_lightning.callbacks.Callback.on_test_end - :noindex: - -on_predict_start -^^^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_predict_start - :noindex: - -on_predict_end -^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_predict_end - :noindex: - -on_keyboard_interrupt -^^^^^^^^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_keyboard_interrupt - :noindex: - -on_exception -^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_exception - :noindex: - -state_dict -^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.state_dict - :noindex: - -on_save_checkpoint -^^^^^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_save_checkpoint - :noindex: - -load_state_dict -^^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.load_state_dict - :noindex: - -on_load_checkpoint -^^^^^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_load_checkpoint - :noindex: - -on_before_backward -^^^^^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_before_backward - :noindex: - -on_after_backward -^^^^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_after_backward - :noindex: - -on_before_optimizer_step -^^^^^^^^^^^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_before_optimizer_step - :noindex: - -on_before_zero_grad -^^^^^^^^^^^^^^^^^^^ - -.. automethod:: pytorch_lightning.callbacks.Callback.on_before_zero_grad - :noindex: diff --git a/source/extensions/generated/pytorch_lightning.loggers.CSVLogger.rst b/source/extensions/generated/pytorch_lightning.loggers.CSVLogger.rst deleted file mode 100644 index bd8ccbf..0000000 --- a/source/extensions/generated/pytorch_lightning.loggers.CSVLogger.rst +++ /dev/null @@ -1,15 +0,0 @@ -.. role:: hidden - :class: hidden-section -.. 
currentmodule:: pytorch_lightning.loggers - - -CSVLogger -========= - -.. autoclass:: CSVLogger - :members: - - -.. - autogenerated from source/_templates/classtemplate.rst - note it does not have :inherited-members: \ No newline at end of file diff --git a/source/extensions/generated/pytorch_lightning.loggers.CometLogger.rst b/source/extensions/generated/pytorch_lightning.loggers.CometLogger.rst deleted file mode 100644 index 324d77c..0000000 --- a/source/extensions/generated/pytorch_lightning.loggers.CometLogger.rst +++ /dev/null @@ -1,15 +0,0 @@ -.. role:: hidden - :class: hidden-section -.. currentmodule:: pytorch_lightning.loggers - - -CometLogger -=========== - -.. autoclass:: CometLogger - :members: - - -.. - autogenerated from source/_templates/classtemplate.rst - note it does not have :inherited-members: \ No newline at end of file diff --git a/source/extensions/generated/pytorch_lightning.loggers.MLFlowLogger.rst b/source/extensions/generated/pytorch_lightning.loggers.MLFlowLogger.rst deleted file mode 100644 index 2eaf478..0000000 --- a/source/extensions/generated/pytorch_lightning.loggers.MLFlowLogger.rst +++ /dev/null @@ -1,15 +0,0 @@ -.. role:: hidden - :class: hidden-section -.. currentmodule:: pytorch_lightning.loggers - - -MLFlowLogger -============ - -.. autoclass:: MLFlowLogger - :members: - - -.. - autogenerated from source/_templates/classtemplate.rst - note it does not have :inherited-members: \ No newline at end of file diff --git a/source/extensions/generated/pytorch_lightning.loggers.NeptuneLogger.rst b/source/extensions/generated/pytorch_lightning.loggers.NeptuneLogger.rst deleted file mode 100644 index e9da513..0000000 --- a/source/extensions/generated/pytorch_lightning.loggers.NeptuneLogger.rst +++ /dev/null @@ -1,15 +0,0 @@ -.. role:: hidden - :class: hidden-section -.. currentmodule:: pytorch_lightning.loggers - - -NeptuneLogger -============= - -.. autoclass:: NeptuneLogger - :members: - - -.. 
- autogenerated from source/_templates/classtemplate.rst - note it does not have :inherited-members: \ No newline at end of file diff --git a/source/extensions/generated/pytorch_lightning.loggers.TensorBoardLogger.rst b/source/extensions/generated/pytorch_lightning.loggers.TensorBoardLogger.rst deleted file mode 100644 index 6bcd4a2..0000000 --- a/source/extensions/generated/pytorch_lightning.loggers.TensorBoardLogger.rst +++ /dev/null @@ -1,15 +0,0 @@ -.. role:: hidden - :class: hidden-section -.. currentmodule:: pytorch_lightning.loggers - - -TensorBoardLogger -================= - -.. autoclass:: TensorBoardLogger - :members: - - -.. - autogenerated from source/_templates/classtemplate.rst - note it does not have :inherited-members: \ No newline at end of file diff --git a/source/extensions/generated/pytorch_lightning.loggers.WandbLogger.rst b/source/extensions/generated/pytorch_lightning.loggers.WandbLogger.rst deleted file mode 100644 index 3dcb424..0000000 --- a/source/extensions/generated/pytorch_lightning.loggers.WandbLogger.rst +++ /dev/null @@ -1,15 +0,0 @@ -.. role:: hidden - :class: hidden-section -.. currentmodule:: pytorch_lightning.loggers - - -WandbLogger -=========== - -.. autoclass:: WandbLogger - :members: - - -.. - autogenerated from source/_templates/classtemplate.rst - note it does not have :inherited-members: \ No newline at end of file diff --git a/source/extensions/logging.rst b/source/extensions/logging.rst deleted file mode 100644 index 8bad452..0000000 --- a/source/extensions/logging.rst +++ /dev/null @@ -1,410 +0,0 @@ -:orphan: - -.. testsetup:: * - - from pytorch_lightning import loggers as pl_loggers - -.. role:: hidden - :class: hidden-section - -.. _logging: - - -####### -Logging -####### - -***************** -Supported Loggers -***************** - -The following are loggers we support: - -.. currentmodule:: pytorch_lightning.loggers - -.. 
autosummary:: - :toctree: generated - :nosignatures: - :template: classtemplate.rst - - CometLogger - CSVLogger - MLFlowLogger - NeptuneLogger - TensorBoardLogger - WandbLogger - - -The above loggers will normally plot an additional chart (**global_step VS epoch**). Depending on the loggers you use, there might be some additional charts too. - -By default, Lightning uses ``TensorBoard`` logger under the hood, and stores the logs to a directory (by default in ``lightning_logs/``). - -.. testcode:: - - from pytorch_lightning import Trainer - - # Automatically logs to a directory (by default ``lightning_logs/``) - trainer = Trainer() - -To see your logs: - -.. code-block:: bash - - tensorboard --logdir=lightning_logs/ - -To visualize tensorboard in a jupyter notebook environment, run the following command in a jupyter cell: - -.. code-block:: bash - - %reload_ext tensorboard - %tensorboard --logdir=lightning_logs/ - -You can also pass a custom Logger to the :class:`~pytorch_lightning.trainer.trainer.Trainer`. - -.. testcode:: - - from pytorch_lightning import loggers as pl_loggers - - tb_logger = pl_loggers.TensorBoardLogger(save_dir="logs/") - trainer = Trainer(logger=tb_logger) - -Choose from any of the others such as MLflow, Comet, Neptune, WandB, etc. - -.. testcode:: - - comet_logger = pl_loggers.CometLogger(save_dir="logs/") - trainer = Trainer(logger=comet_logger) - -To use multiple loggers, simply pass in a ``list`` or ``tuple`` of loggers. - -.. testcode:: - - tb_logger = pl_loggers.TensorBoardLogger(save_dir="logs/") - comet_logger = pl_loggers.CometLogger(save_dir="logs/") - trainer = Trainer(logger=[tb_logger, comet_logger]) - -.. note:: - - By default, Lightning logs every 50 steps. Use Trainer flags to :ref:`logging_frequency`. - -.. note:: - - By default, all loggers log to ``os.getcwd()``. You can change the logging path using - ``Trainer(default_root_dir="/your/path/to/save/checkpoints")`` without instantiating a logger. 
- ----------- - -****************************** -Logging from a LightningModule -****************************** - -Lightning offers automatic log functionalities for logging scalars, or manual logging for anything else. - -Automatic Logging -================= - -Use the :meth:`~pytorch_lightning.core.lightning.LightningModule.log` or :meth:`~pytorch_lightning.core.lightning.LightningModule.log_dict` -methods to log from anywhere in a :doc:`LightningModule <../common/lightning_module>` and :doc:`callbacks <../extensions/callbacks>`. - -.. code-block:: python - - def training_step(self, batch, batch_idx): - self.log("my_metric", x) - - - # or a dict to get multiple metrics on the same plot if the logger supports it - def training_step(self, batch, batch_idx): - self.log("performance", {"acc": acc, "recall": recall}) - - - # or a dict to log all metrics at once with individual plots - def training_step(self, batch, batch_idx): - self.log_dict({"acc": acc, "recall": recall}) - -.. note:: - Everything explained below applies to both :meth:`~pytorch_lightning.core.lightning.LightningModule.log` or :meth:`~pytorch_lightning.core.lightning.LightningModule.log_dict` methods. - -Depending on where the :meth:`~pytorch_lightning.core.lightning.LightningModule.log` method is called, Lightning auto-determines -the correct logging mode for you. Of course you can override the default behavior by manually setting the -:meth:`~pytorch_lightning.core.lightning.LightningModule.log` parameters. - -.. code-block:: python - - def training_step(self, batch, batch_idx): - self.log("my_loss", loss, on_step=True, on_epoch=True, prog_bar=True, logger=True) - -The :meth:`~pytorch_lightning.core.lightning.LightningModule.log` method has a few options: - -* ``on_step``: Logs the metric at the current step. -* ``on_epoch``: Automatically accumulates and logs at the end of the epoch. -* ``prog_bar``: Logs to the progress bar (Default: ``False``). 
-* ``logger``: Logs to the logger like ``Tensorboard``, or any other custom logger passed to the :class:`~pytorch_lightning.trainer.trainer.Trainer` (Default: ``True``). -* ``reduce_fx``: Reduction function over step values for end of epoch. Uses :meth:`torch.mean` by default. -* ``enable_graph``: If True, will not auto detach the graph. -* ``sync_dist``: If True, reduces the metric across devices. Use with care as this may lead to a significant communication overhead. -* ``sync_dist_group``: The DDP group to sync across. -* ``add_dataloader_idx``: If True, appends the index of the current dataloader to the name (when using multiple dataloaders). If False, user needs to give unique names for each dataloader to not mix the values. -* ``batch_size``: Current batch size used for accumulating logs logged with ``on_epoch=True``. This will be directly inferred from the loaded batch, but for some data structures you might need to explicitly provide it. -* ``rank_zero_only``: Whether the value will be logged only on rank 0. This will prevent synchronization which would produce a deadlock as not all processes would perform this log call. - -.. list-table:: Default behavior of logging in Callback or LightningModule - :widths: 50 25 25 - :header-rows: 1 - - * - Hook - - on_step - - on_epoch - * - on_train_start, on_train_epoch_start, on_train_epoch_end, training_epoch_end - - False - - True - * - on_before_backward, on_after_backward, on_before_optimizer_step, on_before_zero_grad - - True - - False - * - on_train_batch_start, on_train_batch_end, training_step, training_step_end - - True - - False - * - on_validation_start, on_validation_epoch_start, on_validation_epoch_end, validation_epoch_end - - False - - True - * - on_validation_batch_start, on_validation_batch_end, validation_step, validation_step_end - - False - - True - - -.. 
note:: - - While logging tensor metrics with ``on_epoch=True`` inside step-level hooks and using mean-reduction (default) to accumulate the metrics across the current epoch, Lightning tries to extract the - batch size from the current batch. If multiple possible batch sizes are found, a warning is logged and if it fails to extract the batch size from the current batch, which is possible if - the batch is a custom structure/collection, then an error is raised. To avoid this, you can specify the ``batch_size`` inside the ``self.log(... batch_size=batch_size)`` call. - - .. code-block:: python - - def training_step(self, batch, batch_idx): - # extracts the batch size from `batch` - self.log("train_loss", loss, on_epoch=True) - - - def validation_step(self, batch, batch_idx): - # uses `batch_size=10` - self.log("val_loss", loss, batch_size=10) - -.. note:: - - - The above config for ``validation`` applies for ``test`` hooks as well. - - - Setting ``on_epoch=True`` will cache all your logged values during the full training epoch and perform a - reduction in ``on_train_epoch_end``. We recommend using `TorchMetrics `_, when working with custom reduction. - - - Setting both ``on_step=True`` and ``on_epoch=True`` will create two keys per metric you log with - suffix ``_step`` and ``_epoch`` respectively. You can refer to these keys e.g. in the `monitor` - argument of :class:`~pytorch_lightning.callbacks.model_checkpoint.ModelCheckpoint` or in the graphs plotted to the logger of your choice. - - -If your work requires to log in an unsupported method, please open an issue with a clear description of why it is blocking you. - - -Manual Logging Non-Scalar Artifacts -=================================== - -If you want to log anything that is not a scalar, like histograms, text, images, etc., you may need to use the logger object directly. - -.. code-block:: python - - def training_step(self): - ... 
- # the logger you used (in this case tensorboard) - tensorboard = self.logger.experiment - tensorboard.add_image() - tensorboard.add_histogram(...) - tensorboard.add_figure(...) - - ----------- - -******************** -Make a Custom Logger -******************** - -You can implement your own logger by writing a class that inherits from :class:`~pytorch_lightning.loggers.logger.Logger`. -Use the :func:`~pytorch_lightning.loggers.logger.rank_zero_experiment` and :func:`~pytorch_lightning.utilities.rank_zero.rank_zero_only` decorators to make sure that only the first process in DDP training creates the experiment and logs the data respectively. - -.. testcode:: - - from pytorch_lightning.loggers.logger import Logger, rank_zero_experiment - from pytorch_lightning.utilities.distributed import rank_zero_only - - - class MyLogger(Logger): - @property - def name(self): - return "MyLogger" - - @property - def version(self): - # Return the experiment version, int or str. - return "0.1" - - @rank_zero_only - def log_hyperparams(self, params): - # params is an argparse.Namespace - # your code to record hyperparameters goes here - pass - - @rank_zero_only - def log_metrics(self, metrics, step): - # metrics is a dictionary of metric names and values - # your code to record metrics goes here - pass - - @rank_zero_only - def save(self): - # Optional. Any code necessary to save logger data goes here - pass - - @rank_zero_only - def finalize(self, status): - # Optional. Any code that needs to be run after training - # finishes goes here - pass - -If you write a logger that may be useful to others, please send -a pull request to add it to Lightning! - ----------- - -.. _logging_frequency: - - -************************* -Control Logging Frequency -************************* - -Logging frequency -================= - -It may slow down training to log on every single batch. By default, Lightning logs every 50 rows, or 50 training steps. 
-To change this behaviour, set the ``log_every_n_steps`` :class:`~pytorch_lightning.trainer.trainer.Trainer` flag. - -.. testcode:: - - k = 10 - trainer = Trainer(log_every_n_steps=k) - - -Log Writing Frequency -===================== - -Individual logger implementations determine their flushing frequency. For example, on the -:class:`~pytorch_lightning.loggers.csv_logs.CSVLogger` you can set the flag ``flush_logs_every_n_steps``. - ----------- - -************ -Progress Bar -************ - -You can add any metric to the progress bar using :meth:`~pytorch_lightning.core.lightning.LightningModule.log` -method, setting ``prog_bar=True``. - - -.. code-block:: python - - def training_step(self, batch, batch_idx): - self.log("my_loss", loss, prog_bar=True) - - -You can learn more about progress bars supported by Lightning :doc:`here <../common/progress_bar>`. - -Modifying the Progress Bar -========================== - -The progress bar by default already includes the training loss and version number of the experiment -if you are using a logger. These defaults can be customized by overriding the -:meth:`~pytorch_lightning.callbacks.progress.base.ProgressBarBase.get_metrics` hook in your progress bar. - -.. code-block:: python - - from pytorch_lightning.callbacks.progress import TQDMProgressBar - - - class CustomProgressBar(TQDMProgressBar): - def get_metrics(self, *args, **kwargs): - # don't show the version number - items = super().get_metrics(*args, **kwargs) - items.pop("v_num", None) - return items - - ----------- - - -************************* -Configure Console Logging -************************* - -Lightning logs useful information about the training process and user warnings to the console. -You can retrieve the Lightning console logger and change it to your liking. For example, adjust the logging level -or redirect output for certain modules to log files: - -.. 
testcode:: - - import logging - - # configure logging at the root level of Lightning - logging.getLogger("pytorch_lightning").setLevel(logging.ERROR) - - # configure logging on module level, redirect to file - logger = logging.getLogger("pytorch_lightning.core") - logger.addHandler(logging.FileHandler("core.log")) - -Read more about custom Python logging `here `_. - - ----------- - -*********************** -Logging Hyperparameters -*********************** - -When training a model, it is useful to know what hyperparams went into that model. -When Lightning creates a checkpoint, it stores a key ``"hyper_parameters"`` with the hyperparams. - -.. code-block:: python - - lightning_checkpoint = torch.load(filepath, map_location=lambda storage, loc: storage) - hyperparams = lightning_checkpoint["hyper_parameters"] - -Some loggers also allow logging the hyperparams used in the experiment. For instance, -when using the ``TensorBoardLogger``, all hyperparams will show -in the `hparams tab `_. - -.. note:: - If you want to track a metric in the tensorboard hparams tab, log scalars to the key ``hp_metric``. If tracking multiple metrics, initialize ``TensorBoardLogger`` with ``default_hp_metric=False`` and call ``log_hyperparams`` only once with your metric keys and initial values. Subsequent updates can simply be logged to the metric keys. Refer to the examples below for setting up proper hyperparams metrics tracking within the :doc:`LightningModule <../common/lightning_module>`. - - .. 
code-block:: python - - # Using default_hp_metric - def validation_step(self, batch, batch_idx): - self.log("hp_metric", some_scalar) - - - # Using custom or multiple metrics (default_hp_metric=False) - def on_train_start(self): - self.logger.log_hyperparams(self.hparams, {"hp/metric_1": 0, "hp/metric_2": 0}) - - - def validation_step(self, batch, batch_idx): - self.log("hp/metric_1", some_scalar_1) - self.log("hp/metric_2", some_scalar_2) - - In the example, using ``"hp/"`` as a prefix allows for the metrics to be grouped under "hp" in the tensorboard scalar tab where you can collapse them. - ------------ - -*************************** -Managing Remote Filesystems -*************************** - -Lightning supports saving logs to a variety of filesystems, including local filesystems and several cloud storage providers. - -Check out the :doc:`Remote Filesystems <../common/remote_fs>` doc for more info. diff --git a/source/extensions/loops.rst b/source/extensions/loops.rst deleted file mode 100644 index c24d4ce..0000000 --- a/source/extensions/loops.rst +++ /dev/null @@ -1,461 +0,0 @@ -.. _loop-customization-extensions: - - -Loops -===== - -Loops let advanced users swap out the default gradient descent optimization loop at the core of Lightning with a different optimization paradigm. - -The Lightning Trainer is built on top of the standard gradient descent optimization loop which works for 90%+ of machine learning use cases: - -.. code-block:: python - - for i, batch in enumerate(dataloader): - x, y = batch - y_hat = model(x) - loss = loss_function(y_hat, y) - optimizer.zero_grad() - loss.backward() - optimizer.step() - -However, some new research use cases such as meta-learning, active learning, recommendation systems, etc., require a different loop structure. -For example here is a simple loop that guides the weight updates with a loss from a special validation split: - -.. 
code-block:: python - - for i, batch in enumerate(train_dataloader): - x, y = batch - y_hat = model(x) - loss = loss_function(y_hat, y) - optimizer.zero_grad() - loss.backward() - - val_loss = 0 - for i, val_batch in enumerate(val_dataloader): - x, y = val_batch - y_hat = model(x) - val_loss += loss_function(y_hat, y) - - scale_gradients(model, 1 / val_loss) - optimizer.step() - - -With Lightning Loops, you can customize the Trainer for non-standard gradient descent optimizations and get the same loop as above: - -.. code-block:: python - - trainer = Trainer() - trainer.fit_loop.epoch_loop = MyGradientDescentLoop() - -Think of this as swapping out the engine in a car! - ----------- - -Understanding the Default Trainer Loop --------------------------------------- - -The Lightning :class:`~pytorch_lightning.trainer.trainer.Trainer` automates the standard optimization loop which every PyTorch user is familiar with: - -.. code-block:: python - - for i, batch in enumerate(dataloader): - x, y = batch - y_hat = model(x) - loss = loss_function(y_hat, y) - optimizer.zero_grad() - loss.backward() - optimizer.step() - -The core research logic is simply shifted to the :class:`~pytorch_lightning.core.lightning.LightningModule`: - -.. code-block:: python - - for i, batch in enumerate(dataloader): - # x, y = batch moved to training_step - # y_hat = model(x) moved to training_step - # loss = loss_function(y_hat, y) moved to training_step - loss = lightning_module.training_step(batch, i) - - # Lightning handles automatically: - optimizer.zero_grad() - loss.backward() - optimizer.step() - -Under the hood, the above loop is implemented using the :class:`~pytorch_lightning.loops.base.Loop` API like so: - -.. 
code-block:: python - - class DefaultLoop(Loop): - def advance(self, batch, i): - loss = lightning_module.training_step(batch, i) - optimizer.zero_grad() - loss.backward() - optimizer.step() - - def run(self, dataloader): - for i, batch in enumerate(dataloader): - self.advance(batch, i) - -Defining a loop within a class interface instead of hard-coding a raw Python for/while loop has several benefits: - -1. You can have full control over the data flow through loops. -2. You can add new loops and nest as many of them as you want. -3. If needed, the state of a loop can be :ref:`saved and resumed `. -4. New hooks can be injected at any point. - -.. image:: https://pl-public-data.s3.amazonaws.com/docs/static/images/loops/epoch-loop-steps.gif - :alt: Animation showing how to convert a standard training loop to a Lightning loop - ----------- - -.. _override-default-loops-extensions: - -Overriding the default Loops ----------------------------- - -The fastest way to get started with loops is to override the functionality of an existing loop. -Lightning has 4 main loops, which rely on: :class:`~pytorch_lightning.loops.fit_loop.FitLoop` for fitting (training and validating), -:class:`~pytorch_lightning.loops.dataloader.evaluation_loop.EvaluationLoop` for validating or testing, and -:class:`~pytorch_lightning.loops.dataloader.prediction_loop.PredictionLoop` for predicting. - -For simple changes that don't require a custom loop, you can modify each of these loops. - -Each loop has a series of methods that can be modified. -For example, with the :class:`~pytorch_lightning.loops.fit_loop.FitLoop`: - -.. 
code-block:: python - - from pytorch_lightning.loops import FitLoop - - - class MyLoop(FitLoop): - def advance(self): - """Advance from one iteration to the next.""" - - def on_advance_end(self): - """Do something at the end of an iteration.""" - - def on_run_end(self): - """Do something when the loop ends.""" - -A full list with all built-in loops and subloops can be found :ref:`here `. - -To add your own modifications to a loop, simply subclass an existing loop class and override what you need. -Here is a simple example of how to add a new hook: - -.. code-block:: python - - from pytorch_lightning.loops import FitLoop - - - class CustomFitLoop(FitLoop): - def advance(self): - # ... whatever code before - - # pass anything you want to the hook - self.trainer.call_hook("my_new_hook", *args, **kwargs) - - # ... whatever code after - -Now simply attach the correct loop in the trainer directly: - -.. code-block:: python - - trainer = Trainer(...) - trainer.fit_loop = CustomFitLoop() - - # fit() now uses the new FitLoop! - trainer.fit(...) - - # the equivalent for validate() - val_loop = CustomValLoop() - trainer = Trainer() - trainer.validate_loop = val_loop - trainer.validate(...) - -Now your code is FULLY flexible and you can still leverage ALL the best parts of Lightning! - -.. image:: https://pl-public-data.s3.amazonaws.com/docs/static/images/loops/replace-fit-loop.gif - :alt: Animation showing how to replace a loop on the Trainer - ----------- - -Creating a New Loop From Scratch --------------------------------- - -You can also go wild and implement a full loop from scratch by sub-classing the :class:`~pytorch_lightning.loops.base.Loop` base class. -You will need to override a minimum of two things: - -.. code-block:: python - - from pytorch_lightning.loops import Loop - - - class MyFancyLoop(Loop): - @property - def done(self): - """Provide a condition to stop the loop.""" - - def advance(self): - """ - Access your dataloader/s in whatever way you want. 
- Do your fancy optimization things. - Call the LightningModule methods at your leisure. - """ - -Finally, attach it into the :class:`~pytorch_lightning.trainer.trainer.Trainer`: - -.. code-block:: python - - trainer = Trainer(...) - trainer.fit_loop = MyFancyLoop() - - # fit() now uses your fancy loop! - trainer.fit(...) - -But beware: Loop customization gives you more power and full control over the Trainer and with great power comes great responsibility. -We recommend that you familiarize yourself with :ref:`overriding the default loops ` first before you start building a new loop from the ground up. - ----------- - -Loop API --------- -Here is the full API of methods available in the Loop base class. - -The :class:`~pytorch_lightning.loops.base.Loop` class is the base of all loops in the same way as the :class:`~pytorch_lightning.core.lightning.LightningModule` is the base of all models. -It defines a public interface that each loop implementation must follow, the key ones are: - -Properties -^^^^^^^^^^ - -done -~~~~ - -.. autoattribute:: pytorch_lightning.loops.base.Loop.done - :noindex: - -skip (optional) -~~~~~~~~~~~~~~~ - -.. autoattribute:: pytorch_lightning.loops.base.Loop.skip - :noindex: - -Methods -^^^^^^^ - -reset (optional) -~~~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.loops.base.Loop.reset - :noindex: - -advance -~~~~~~~ - -.. automethod:: pytorch_lightning.loops.base.Loop.advance - :noindex: - -run (optional) -~~~~~~~~~~~~~~ - -.. automethod:: pytorch_lightning.loops.base.Loop.run - :noindex: - - ----------- - -Subloops --------- - -When you want to customize nested loops within loops, use the :meth:`~pytorch_lightning.loops.base.Loop.replace` method: - -.. code-block:: python - - # This takes care of properly instantiating the new Loop and setting all references - trainer.fit_loop.replace(epoch_loop=MyEpochLoop) - # Trainer runs the fit loop with your new epoch loop! 
- trainer.fit(model) - -Alternatively, for more fine-grained control, use the :meth:`~pytorch_lightning.loops.base.Loop.connect` method: - -.. code-block:: python - - # Optional: stitch back the trainer arguments - epoch_loop = MyEpochLoop(trainer.fit_loop.epoch_loop.min_steps, trainer.fit_loop.epoch_loop.max_steps) - # Optional: connect children loops as they might have existing state - epoch_loop.connect(trainer.fit_loop.epoch_loop.batch_loop, trainer.fit_loop.epoch_loop.val_loop) - # Instantiate and connect the loop. - trainer.fit_loop.connect(epoch_loop=epoch_loop) - trainer.fit(model) - -More about the built-in loops and how they are composed is explained in the next section. - -.. image:: https://pl-public-data.s3.amazonaws.com/docs/static/images/loops/connect-epoch-loop.gif - :alt: Animation showing how to connect a custom subloop - ----------- - -Built-in Loops --------------- - -.. _loop-structure-extensions: - -The training loop in Lightning is called *fit loop* and is actually a combination of several loops. -Here is what the structure would look like in plain Python: - -.. code-block:: python - - # FitLoop - for epoch in range(max_epochs): - - # TrainingEpochLoop - for batch_idx, batch in enumerate(train_dataloader): - - # TrainingBatchLoop - for split_batch in tbptt_split(batch): - - # OptimizerLoop - for optimizer_idx, opt in enumerate(optimizers): - - loss = lightning_module.training_step(batch, batch_idx, optimizer_idx) - ... - - # ValidationEpochLoop - for batch_idx, batch in enumerate(val_dataloader): - lightning_module.validation_step(batch, batch_idx, optimizer_idx) - ... - - -Each of these :code:`for`-loops represents a class implementing the :class:`~pytorch_lightning.loops.base.Loop` interface. - - -.. 
list-table:: Trainer entry points and associated loops - :widths: 25 75 - :header-rows: 1 - - * - Built-in loop - - Description - * - :class:`~pytorch_lightning.loops.fit_loop.FitLoop` - - The :class:`~pytorch_lightning.loops.fit_loop.FitLoop` is the top-level loop where training starts. - It simply counts the epochs and iterates from one to the next by calling :code:`TrainingEpochLoop.run()` in its :code:`advance()` method. - * - :class:`~pytorch_lightning.loops.epoch.training_epoch_loop.TrainingEpochLoop` - - The :class:`~pytorch_lightning.loops.epoch.training_epoch_loop.TrainingEpochLoop` is the one that iterates over the dataloader that the user returns in their :meth:`~pytorch_lightning.core.lightning.LightningModule.train_dataloader` method. - Its main responsibilities are calling the :code:`*_epoch_start` and :code:`*_epoch_end` hooks, accumulating outputs if the user requests them in one of these hooks, and running validation at the requested interval. - The validation is carried out by yet another loop, :class:`~pytorch_lightning.loops.epoch.validation_epoch_loop.ValidationEpochLoop`. - - In the :code:`run()` method, the training epoch loop could in theory simply call the :code:`LightningModule.training_step` already and perform the optimization. - However, Lightning has built-in support for automatic optimization with multiple optimizers and on top of that also supports :ref:`TBPTT `. - For this reason there are actually two more loops nested under :class:`~pytorch_lightning.loops.epoch.training_epoch_loop.TrainingEpochLoop`. - * - :class:`~pytorch_lightning.loops.batch.training_batch_loop.TrainingBatchLoop` - - The responsibility of the :class:`~pytorch_lightning.loops.batch.training_batch_loop.TrainingBatchLoop` is to split a batch given by the :class:`~pytorch_lightning.loops.epoch.training_epoch_loop.TrainingEpochLoop` along the time-dimension and iterate over the list of splits. 
- It also keeps track of the hidden state *hiddens* returned by the training step. - By default, when truncated back-propagation through time (TBPTT) is turned off, this loop does not do anything except redirect the call to the :class:`~pytorch_lightning.loops.optimization.optimizer_loop.OptimizerLoop`. - Read more about :ref:`TBPTT `. - * - :class:`~pytorch_lightning.loops.optimization.optimizer_loop.OptimizerLoop` - - The :class:`~pytorch_lightning.loops.optimization.optimizer_loop.OptimizerLoop` iterates over one or multiple optimizers and for each one it calls the :meth:`~pytorch_lightning.core.lightning.LightningModule.training_step` method with the batch, the current batch index and the optimizer index if multiple optimizers are requested. - It is the leaf node in the tree of loops and performs the actual optimization (forward, zero grad, backward, optimizer step). - * - :class:`~pytorch_lightning.loops.optimization.manual_loop.ManualOptimization` - - Substitutes the :class:`~pytorch_lightning.loops.optimization.optimizer_loop.OptimizerLoop` in case of :doc:`manual optimization <../model/manual_optimization>` and implements the manual optimization step. - * - :class:`~pytorch_lightning.loops.dataloader.evaluation_loop.EvaluationLoop` - - The :class:`~pytorch_lightning.loops.dataloader.evaluation_loop.EvaluationLoop` is the top-level loop where validation/testing starts. - It simply iterates over each evaluation dataloader from one to the next by calling :code:`EvaluationEpochLoop.run()` in its :code:`advance()` method. - * - :class:`~pytorch_lightning.loops.dataloader.prediction_loop.PredictionLoop` - - The :class:`~pytorch_lightning.loops.dataloader.prediction_loop.PredictionLoop` is the top-level loop where prediction starts. - It simply iterates over each prediction dataloader from one to the next by calling :code:`PredictionEpochLoop.run()` in its :code:`advance()` method. 
- - ----------- - -Available Loops in Lightning Flash ----------------------------------- - -`Active Learning `__ is a machine learning practice in which the user interacts with the learner in order to provide new labels when required. - -You can find a real use case in `Lightning Flash `_. - -Flash implements the :code:`ActiveLearningLoop` that you can use together with the :code:`ActiveLearningDataModule` to label new data on the fly. -To run the following demo, install Flash and `BaaL `__ first: - -.. code-block:: bash - - pip install lightning-flash baal - -.. code-block:: python - - import torch - - import flash - from flash.core.classification import Probabilities - from flash.core.data.utils import download_data - from flash.image import ImageClassificationData, ImageClassifier - from flash.image.classification.integrations.baal import ActiveLearningDataModule, ActiveLearningLoop - - # 1. Create the DataModule - download_data("https://pl-flash-data.s3.amazonaws.com/hymenoptera_data.zip", "./data") - - # Implement the research use-case where we mask labels from labelled dataset. - datamodule = ActiveLearningDataModule( - ImageClassificationData.from_folders(train_folder="data/hymenoptera_data/train/", batch_size=2), - initial_num_labels=5, - val_split=0.1, - ) - - # 2. Build the task - head = torch.nn.Sequential( - torch.nn.Dropout(p=0.1), - torch.nn.Linear(512, datamodule.num_classes), - ) - model = ImageClassifier(backbone="resnet18", head=head, num_classes=datamodule.num_classes, output=Probabilities()) - - - # 3.1 Create the trainer - trainer = flash.Trainer(max_epochs=3) - - # 3.2 Create the active learning loop and connect it to the trainer - active_learning_loop = ActiveLearningLoop(label_epoch_frequency=1) - active_learning_loop.connect(trainer.fit_loop) - trainer.fit_loop = active_learning_loop - - # 3.3 Finetune - trainer.finetune(model, datamodule=datamodule, strategy="freeze") - - # 4. Predict what's on a few images! ants or bees? 
- predictions = model.predict("data/hymenoptera_data/val/bees/65038344_52a45d090d.jpg") - print(predictions) - - # 5. Save the model! - trainer.save_checkpoint("image_classification_model.pt") - -Here is the `Active Learning Loop example `_ and the `code for the active learning loop `_. - - ----------- - -Advanced Examples ------------------ - - -.. list-table:: Ready-to-run loop examples and tutorials - :widths: 25 75 - :header-rows: 1 - - * - Link to Example - - Description - * - `K-fold Cross Validation `_ - - `KFold / Cross Validation `__ is a machine learning practice in which the training dataset is partitioned into ``num_folds`` complementary subsets. - One cross validation round will perform fitting where one fold is left out for validation and the other folds are used for training. - To reduce variability, once all rounds are performed using the different folds, the trained models are ensembled and their predictions are - averaged when estimating the model's predictive performance on the test dataset. - * - `Yielding Training Step `_ - - This loop enables you to write the :meth:`~pytorch_lightning.core.lightning.LightningModule.training_step` hook - as a Python Generator for automatic optimization with multiple optimizers, i.e., you can :code:`yield` loss - values from it instead of returning them. This can enable more elegant and expressive implementations, as - shown with a GAN in this example. - - ----------- - -Advanced Features ------------------ - -Next: :doc:`Advanced loop features <../extensions/loops_advanced>` diff --git a/source/extensions/loops_advanced.rst b/source/extensions/loops_advanced.rst deleted file mode 100644 index e71c827..0000000 --- a/source/extensions/loops_advanced.rst +++ /dev/null @@ -1,41 +0,0 @@ -:orphan: - -Loops (Advanced) -================ - -.. _persisting loop state: - -Persisting the State of Loops ------------------------------ - -.. 
note:: - - This is an experimental feature and is not activated by default. - Set the environment variable `PL_FAULT_TOLERANT_TRAINING = 1` to enable saving the progress of loops. - Read more about :doc:`fault-tolerant training <../clouds/fault_tolerant_training>`. - -A powerful property of the class-based loop interface is that it can own an internal state. -Loop instances can save their state to the checkpoint through corresponding hooks and if implemented accordingly, resume the state of execution at the appropriate place. -This design is particularly interesting for fault-tolerant training which is an experimental feature released in Lightning v1.5. - -The two hooks :meth:`~pytorch_lightning.loops.base.Loop.on_save_checkpoint` and :meth:`~pytorch_lightning.loops.base.Loop.on_load_checkpoint` function very similarly to how LightningModules and Callbacks save and load state. - -.. code-block:: python - - def on_save_checkpoint(self): - state_dict["iteration"] = self.iteration - return state_dict - - - def on_load_checkpoint(self, state_dict): - self.iteration = state_dict["iteration"] - -When the Trainer is restarting from a checkpoint (e.g., through :code:`trainer.fit(ckpt_path=...)`), the loop exposes a boolean attribute :attr:`~pytorch_lightning.loops.base.Loop.restarting`. -Based around the value of this variable, the user can write the loop in such a way that it can restart from an arbitrary point given the state loaded from the checkpoint. -For example, the implementation of the :meth:`~pytorch_lightning.loops.base.Loop.reset` method could look like this given our previous example: - -.. code-block:: python - - def reset(self): - if not self.restarting: - self.iteration = 0 diff --git a/source/extensions/strategy.rst b/source/extensions/strategy.rst deleted file mode 100644 index ad9d799..0000000 --- a/source/extensions/strategy.rst +++ /dev/null @@ -1,122 +0,0 @@ -:orphan: - -################### -What is a Strategy? 
-################### - -A Strategy controls the model distribution across training, evaluation, and prediction to be used by the :doc:`Trainer <../common/trainer>`. It can be selected by passing a -strategy alias (``"ddp"``, ``"ddp_spawn"``, ``"deepspeed"`` and so on) or a custom strategy instance to the ``strategy`` parameter of the Trainer. - -The Strategy in PyTorch Lightning handles the following responsibilities: - -* Launches and tears down training processes (if applicable). -* Sets up communication between processes (NCCL, GLOO, MPI, and so on). -* Provides a unified communication interface for reduction, broadcast, and so on. -* Owns the :class:`~pytorch_lightning.core.lightning.LightningModule`. -* Handles/owns optimizers and schedulers. - - -:class:`~pytorch_lightning.strategies.strategy.Strategy` also manages the accelerator, precision, and checkpointing plugins. - -.. image:: https://pl-public-data.s3.amazonaws.com/docs/static/images/strategies/overview.jpeg - :alt: Illustration of the Strategy as a composition of the Accelerator and several plugins - -We expose Strategies mainly for expert users that want to extend Lightning for new hardware support or new distributed backends (e.g. a backend not yet supported by `PyTorch `_ itself). - - ----- - -########################### -Enable Different Strategies -########################### - -.. 
code-block:: python - - # Training with the DistributedDataParallel strategy on 4 GPUs - trainer = Trainer(strategy="ddp", accelerator="gpu", devices=4) - - # Training with the custom DistributedDataParallel strategy on 4 GPUs - trainer = Trainer(strategy=DDPStrategy(...), accelerator="gpu", devices=4) - - # Training with the DDP Spawn strategy using auto accelerator selection - trainer = Trainer(strategy="ddp_spawn", accelerator="auto", devices=4) - - # Training with the DeepSpeed strategy on available GPUs - trainer = Trainer(strategy="deepspeed", accelerator="gpu", devices="auto") - - # Training with the DDP strategy using 3 CPU processes - trainer = Trainer(strategy="ddp", accelerator="cpu", devices=3) - - # Training with the DDP Spawn strategy on 8 TPU cores - trainer = Trainer(strategy="ddp_spawn", accelerator="tpu", devices=8) - - # Training with the default IPU strategy on 8 IPUs - trainer = Trainer(accelerator="ipu", devices=8) - ----- - -######################## -Create a Custom Strategy -######################## - -Expert users may choose to extend an existing strategy by overriding its methods. - -.. code-block:: python - - from pytorch_lightning.strategies import DDPStrategy - - - class CustomDDPStrategy(DDPStrategy): - def configure_ddp(self): - self.model = MyCustomDistributedDataParallel( - self.model, - device_ids=..., - ) - -or by subclassing the base class :class:`~pytorch_lightning.strategies.Strategy` to create new ones. These custom strategies -can then be passed into the ``Trainer`` directly via the ``strategy`` parameter. - -.. code-block:: python - - # custom plugins - trainer = Trainer(strategy=CustomDDPStrategy()) - - # fully custom accelerator and plugins - accelerator = MyAccelerator() - precision_plugin = MyPrecisionPlugin() - training_strategy = CustomDDPStrategy(accelerator=accelerator, precision_plugin=precision_plugin) - trainer = Trainer(strategy=training_strategy) - - -The complete list of built-in strategies is listed below. 
- ----- - -############################# -Available Training Strategies -############################# - -.. currentmodule:: pytorch_lightning.strategies - -.. autosummary:: - :nosignatures: - :template: classtemplate.rst - - BaguaStrategy - DDP2Strategy - DDPFullyShardedStrategy - DDPShardedStrategy - DDPSpawnShardedStrategy - DDPSpawnStrategy - DDPStrategy - DataParallelStrategy - DeepSpeedStrategy - HorovodStrategy - HPUParallelStrategy - IPUStrategy - ParallelStrategy - SingleDeviceStrategy - SingleHPUStrategy - SingleTPUStrategy - Strategy - TPUSpawnStrategy diff --git a/source/guides/data.rst b/source/guides/data.rst deleted file mode 100644 index 72dba27..0000000 --- a/source/guides/data.rst +++ /dev/null @@ -1,423 +0,0 @@ -:orphan: - -.. _data: - -############# -Managing Data -############# - -**************************** -Data Containers in Lightning -**************************** - -There are a few different data containers used in Lightning: - -.. list-table:: Data objects - :widths: 20 80 - :header-rows: 1 - - * - Object - - Definition - * - :class:`~torch.utils.data.Dataset` - - The PyTorch :class:`~torch.utils.data.Dataset` represents a map from keys to data samples. - * - :class:`~torch.utils.data.IterableDataset` - - The PyTorch :class:`~torch.utils.data.IterableDataset` represents a stream of data. - * - :class:`~torch.utils.data.DataLoader` - - The PyTorch :class:`~torch.utils.data.DataLoader` represents a Python iterable over a Dataset. - * - :class:`~pytorch_lightning.core.datamodule.LightningDataModule` - - A :class:`~pytorch_lightning.core.datamodule.LightningDataModule` is simply a collection of: training DataLoader(s), validation DataLoader(s), test DataLoader(s) and predict DataLoader(s), along with the matching transforms and data processing/downloads steps required. - - -Why Use LightningDataModule? 
-============================ - -The :class:`~pytorch_lightning.core.datamodule.LightningDataModule` was designed as a way of decoupling data-related hooks from the :class:`~pytorch_lightning.core.lightning.LightningModule` so you can develop dataset-agnostic models. The :class:`~pytorch_lightning.core.datamodule.LightningDataModule` makes it easy to hot swap different Datasets with your model, so you can test it and benchmark it across domains. It also makes sharing and reusing the exact data splits and transforms across projects possible. - -Read :ref:`this ` for more details on LightningDataModule. - ---------- - -.. _multiple-dataloaders: - -***************** -Multiple Datasets -***************** - -There are a few ways to pass multiple Datasets to Lightning: - -1. Create a DataLoader that iterates over multiple Datasets under the hood. -2. In the training loop, you can pass multiple DataLoaders as a dict or list/tuple, and Lightning will - automatically combine the batches from different DataLoaders. -3. In validation, test, or prediction, you have the option to return multiple DataLoaders as a list/tuple, which Lightning will iterate over sequentially, - or to combine the DataLoaders using :class:`~pytorch_lightning.trainer.supporters.CombinedLoader`, in which case Lightning will - automatically combine the batches from the different DataLoaders. - - -Using LightningDataModule -========================= - -You can set more than one :class:`~torch.utils.data.DataLoader` in your :class:`~pytorch_lightning.core.datamodule.LightningDataModule` using its DataLoader hooks -and Lightning will use the correct one. - -.. testcode:: - - class DataModule(LightningDataModule): - - ... 
- - def train_dataloader(self): - return DataLoader(self.train_dataset) - - def val_dataloader(self): - return [DataLoader(self.val_dataset_1), DataLoader(self.val_dataset_2)] - - def test_dataloader(self): - return DataLoader(self.test_dataset) - - def predict_dataloader(self): - return DataLoader(self.predict_dataset) - - -Using LightningModule Hooks -=========================== - -Concatenated Dataset --------------------- - -For training with multiple Datasets, you can create a :class:`~torch.utils.data.DataLoader` class -which wraps your multiple Datasets using :class:`~torch.utils.data.ConcatDataset`. This, of course, -also works for testing, validation, and prediction Datasets. - -.. testcode:: - - from torch.utils.data import ConcatDataset - - - class LitModel(LightningModule): - def train_dataloader(self): - concat_dataset = ConcatDataset(datasets.ImageFolder(traindir_A), datasets.ImageFolder(traindir_B)) - - loader = DataLoader( - concat_dataset, batch_size=args.batch_size, shuffle=True, num_workers=args.workers, pin_memory=True - ) - return loader - - def val_dataloader(self): - # SAME - ... - - def test_dataloader(self): - # SAME - ... - - -Return Multiple DataLoaders ---------------------------- - -You can set multiple DataLoaders in your :class:`~pytorch_lightning.core.lightning.LightningModule`, and Lightning will take care of batch combination. - -For more details, refer to :paramref:`~pytorch_lightning.trainer.trainer.Trainer.multiple_trainloader_mode` - -.. testcode:: - - class LitModel(LightningModule): - def train_dataloader(self): - - loader_a = DataLoader(range(6), batch_size=4) - loader_b = DataLoader(range(15), batch_size=5) - - # pass loaders as a dict. This will create batches like this: - # {'a': batch from loader_a, 'b': batch from loader_b} - loaders = {"a": loader_a, "b": loader_b} - - # OR: - # pass loaders as sequence. 
This will create batches like this: - # [batch from loader_a, batch from loader_b] - loaders = [loader_a, loader_b] - - return loaders - -Furthermore, Lightning also supports nested lists and dicts (or a combination). - -.. testcode:: - - class LitModel(LightningModule): - def train_dataloader(self): - - loader_a = DataLoader(range(8), batch_size=4) - loader_b = DataLoader(range(16), batch_size=2) - - return {"a": loader_a, "b": loader_b} - - def training_step(self, batch, batch_idx): - # access a dictionary with a batch from each DataLoader - batch_a = batch["a"] - batch_b = batch["b"] - - -.. testcode:: - - class LitModel(LightningModule): - def train_dataloader(self): - - loader_a = DataLoader(range(8), batch_size=4) - loader_b = DataLoader(range(16), batch_size=4) - loader_c = DataLoader(range(32), batch_size=4) - loader_d = DataLoader(range(64), batch_size=4) - - # pass loaders as a nested dict. This will create batches like this: - loaders = {"loaders_a_b": [loader_a, loader_b], "loaders_c_d": {"c": loader_c, "d": loader_d}} - return loaders - - def training_step(self, batch, batch_idx): - # access the data - batch_a_b = batch["loaders_a_b"] - batch_c_d = batch["loaders_c_d"] - - batch_a = batch_a_b[0] - batch_b = batch_a_b[1] - - batch_c = batch_c_d["c"] - batch_d = batch_c_d["d"] - -Alternatively, you can also pass in a :class:`~pytorch_lightning.trainer.supporters.CombinedLoader` containing multiple DataLoaders. - -.. 
testcode:: - - from pytorch_lightning.trainer.supporters import CombinedLoader - - - def train_dataloader(self): - loader_a = DataLoader() - loader_b = DataLoader() - loaders = {"a": loader_a, "b": loader_b} - combined_loader = CombinedLoader(loaders, mode="max_size_cycle") - return combined_loader - - - def training_step(self, batch, batch_idx): - batch_a = batch["a"] - batch_b = batch["b"] - - -Multiple Validation/Test/Predict DataLoaders -============================================ - -For validation, test and predict DataLoaders, you can pass a single DataLoader or a list of them. This optional named -parameter can be used in conjunction with any of the above use cases. You can choose to pass -the batches sequentially or simultaneously, as is done for the training step. -The default mode for these DataLoaders is sequential. Note that when using a sequence of DataLoaders you need -to add an additional argument ``dataloader_idx`` in their corresponding step specific hook. The corresponding loop will process -the DataLoaders in sequential order; that is, the first DataLoader will be processed completely, then the second one, and so on. - -Refer to the following for more details for the default sequential option: - -- :meth:`~pytorch_lightning.core.hooks.DataHooks.val_dataloader` -- :meth:`~pytorch_lightning.core.hooks.DataHooks.test_dataloader` -- :meth:`~pytorch_lightning.core.hooks.DataHooks.predict_dataloader` - -.. testcode:: - - def val_dataloader(self): - loader_1 = DataLoader() - loader_2 = DataLoader() - return [loader_1, loader_2] - - - def validation_step(self, batch, batch_idx, dataloader_idx): - ... - - -Evaluation DataLoaders are iterated over sequentially. If you want to iterate over them in parallel, PyTorch Lightning provides a :class:`~pytorch_lightning.trainer.supporters.CombinedLoader` object which supports collections of DataLoaders such as list, tuple, or dictionary. 
The DataLoaders can be accessed in the same way as the provided structure: - -.. testcode:: - - from pytorch_lightning.trainer.supporters import CombinedLoader - - - def val_dataloader(self): - loader_a = DataLoader() - loader_b = DataLoader() - loaders = {"a": loader_a, "b": loader_b} - combined_loaders = CombinedLoader(loaders, mode="max_size_cycle") - return combined_loaders - - - def validation_step(self, batch, batch_idx): - batch_a = batch["a"] - batch_b = batch["b"] - - -Evaluate with Additional DataLoaders -==================================== - -You can evaluate your models using additional DataLoaders even if the DataLoader specific hooks haven't been defined within your -:class:`~pytorch_lightning.core.lightning.LightningModule`. For example, this would be the case if your test data -set is not available at the time your model was declared. Simply pass the test set to the :meth:`~pytorch_lightning.trainer.trainer.Trainer.test` method: - -.. code-block:: python - - # setup your DataLoader - test = DataLoader(...) - - # test (pass in the loader) - trainer.test(dataloaders=test) - --------------- - -******************************************** -Accessing DataLoaders within LightningModule -******************************************** - -In the case that you require access to the DataLoader or Dataset objects, DataLoaders for each step can be accessed using the ``Trainer`` object: - -.. testcode:: - - from pytorch_lightning import LightningModule - - - class Model(LightningModule): - def test_step(self, batch, batch_idx, dataloader_idx): - test_dl = self.trainer.test_dataloaders[dataloader_idx] - test_dataset = test_dl.dataset - test_sampler = test_dl.sampler - ... - # extract metadata, etc. from the dataset: - ... 
- -If you are using a :class:`~pytorch_lightning.trainer.supporters.CombinedLoader` object, which allows you to fetch batches from a collection of DataLoaders -simultaneously and supports collections of DataLoaders such as a list, tuple, or dictionary, the DataLoaders can be accessed using the same collection structure: - -.. code-block:: python - - from pytorch_lightning.trainer.supporters import CombinedLoader - - test_dl1 = ... - test_dl2 = ... - - # If you provided a list of DataLoaders: - - combined_loader = CombinedLoader([test_dl1, test_dl2]) - list_of_loaders = combined_loader.loaders - test_dl1 = list_of_loaders[0] - - - # If you provided a dictionary of DataLoaders: - - combined_loader = CombinedLoader({"dl1": test_dl1, "dl2": test_dl2}) - dictionary_of_loaders = combined_loader.loaders - test_dl1 = dictionary_of_loaders["dl1"] - --------------- - -.. _sequential-data: - -*************** -Sequential Data -*************** - -Lightning has built-in support for dealing with sequential data. - - -Packed Sequences as Inputs -========================== - -When using :class:`~torch.nn.utils.rnn.PackedSequence`, do two things: - -1. Return either a padded tensor in dataset or a list of variable length tensors in the DataLoader's `collate_fn `_ (example shows the list implementation). -2. Pack the sequence in forward or training and validation steps depending on use case. - -| - -.. testcode:: - - # For use in DataLoader - def collate_fn(batch): - x = [item[0] for item in batch] - y = [item[1] for item in batch] - return x, y - - - # In LightningModule - def training_step(self, batch, batch_idx): - x = rnn.pack_sequence(batch[0], enforce_sorted=False) - y = rnn.pack_sequence(batch[1], enforce_sorted=False) - - -Truncated Backpropagation Through Time (TBPTT) -============================================== - -There are times when multiple backwards passes are needed for each batch. 
-For example, it may save memory to use **Truncated Backpropagation Through Time** when training RNNs. - -Lightning can handle TBPTT automatically via this flag. - -.. testcode:: - - from pytorch_lightning import LightningModule - - - class MyModel(LightningModule): - def __init__(self): - super().__init__() - # Important: This property activates truncated backpropagation through time - # Setting this value to 2 splits the batch into sequences of size 2 - self.truncated_bptt_steps = 2 - - # Truncated back-propagation through time - def training_step(self, batch, batch_idx, hiddens): - # the training step must be updated to accept a ``hiddens`` argument - # hiddens are the hiddens from the previous truncated backprop step - out, hiddens = self.lstm(data, hiddens) - return {"loss": ..., "hiddens": hiddens} - -.. note:: If you need to modify how the batch is split, - override :func:`~pytorch_lightning.core.lightning.LightningModule.tbptt_split_batch`. - - -Iterable Datasets -================= -Lightning supports using :class:`~torch.utils.data.IterableDataset` as well as map-style Datasets. IterableDatasets provide a more natural -option when using sequential data. - -.. note:: When using an :class:`~torch.utils.data.IterableDataset` you must set the ``val_check_interval`` to 1.0 (the default) or an int - (specifying the number of training batches to run before each validation loop) when initializing the Trainer. This is - because the IterableDataset does not have a ``__len__`` and Lightning requires this to calculate the validation - interval when ``val_check_interval`` is less than one. Similarly, you can set ``limit_{mode}_batches`` to a float or - an int. If it is set to 0.0 or 0, it will set ``num_{mode}_batches`` to 0, if it is an int, it will set ``num_{mode}_batches`` - to ``limit_{mode}_batches``, if it is set to 1.0 it will run for the whole dataset, otherwise it will throw an exception. - Here ``mode`` can be train/val/test/predict. 
- -When iterable datasets are used, Lightning will pre-fetch 1 batch (in addition to the current batch) so it can detect -when the training will stop and run validation if necessary. - -.. testcode:: - - # IterableDataset - class CustomDataset(IterableDataset): - def __init__(self, data): - self.data_source = data - - def __iter__(self): - return iter(self.data_source) - - - # Setup DataLoader - def train_dataloader(self): - seq_data = ["A", "long", "time", "ago", "in", "a", "galaxy", "far", "far", "away"] - iterable_dataset = CustomDataset(seq_data) - - dataloader = DataLoader(dataset=iterable_dataset, batch_size=5) - return dataloader - - -.. testcode:: - - # Set val_check_interval - trainer = Trainer(val_check_interval=100) - - # Set limit_val_batches to 0.0 or 0 - trainer = Trainer(limit_val_batches=0.0) - - # Set limit_val_batches as an int - trainer = Trainer(limit_val_batches=100) diff --git a/source/index.rst b/source/index.rst deleted file mode 100644 index d646beb..0000000 --- a/source/index.rst +++ /dev/null @@ -1,275 +0,0 @@ -.. PyTorch-Lightning documentation master file, created by - sphinx-quickstart on Fri Nov 15 07:48:22 2019. - You can adapt this file completely to your liking, but it should at least - contain the root `toctree` directive. - -⚡ PyTorch Lightning에 오신 것을 환영합니다! -============================================== - -.. twocolumns:: - :left: - .. image:: https://pl-bolts-doc-images.s3.us-east-2.amazonaws.com/mov.gif - :alt: Animation showing how to convert a standard training loop to a Lightning loop - :right: - PyTorch Lightning(파이토치 라이트닝)은 대규모에서 성능을 포기하지 않으면서 최대한의 유연성을 필요로 하는 전문적인 AI 연구자들과 머신러닝 엔지니어들을 위한 딥러닝 프레임워크입니다. - Lightning(라이트닝)은 프로젝트가 아이디어로부터 논문 / 제품화에 이르는 동안 함께 발전합니다. - -.. raw:: html - -
-
-
-
- -.. join_slack:: - :align: center - :margin: 0 - -.. raw:: html - -
-
- - -.. raw:: html - -
- - -Lightning 설치하기 ----------------------- - - -.. raw:: html - -
-
- -Pip 사용자라면, - -.. code-block:: bash - - pip install pytorch-lightning - -.. raw:: html - -
-
- -Conda 사용자라면, - -.. code-block:: bash - - conda install pytorch-lightning -c conda-forge - -.. raw:: html - -
-
- -또는 `advanced install guide `_ 참조하세요. - -.. raw:: html - -
- -처음이신가요? ------------------ - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. customcalloutitem:: - :header: LIGHTNING 15분 만에 배워보기 - :description: 일반적인 Lightning 워크플로우의 주요한 7단계를 배웁니다. - :button_link: starter/introduction.html - -.. customcalloutitem:: - :header: Benchmarking - :description: Learn how to benchmark PyTorch Lightning. - :button_link: benchmarking/benchmarks.html - -.. raw:: html - -
-
- -.. End of callout item section - -.. raw:: html - -
- -이미 Lightning 사용자라면? ---------------------------- - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. customcalloutitem:: - :description: Learn Lightning in small bites at 4 levels of expertise: Introductory, intermediate, advanced and expert. - :header: Level Up! - :button_link: expertise_levels.html - -.. customcalloutitem:: - :description: Detailed description of API each package. Assumes you already have basic Lightning knowledge. - :header: API Reference - :button_link: api_references.html - -.. customcalloutitem:: - :description: From NLP, Computer vision to RL and meta learning - see how to use Lightning in ALL research areas. - :header: Hands-on Examples - :button_link: tutorials.html - -.. customcalloutitem:: - :description: Learn how to do everything from hyperparameters sweeps to cloud training to Pruning and Quantization with Lightning. - :header: Common Workflows - :button_link: common_usecases.html - -.. customcalloutitem:: - :description: Convert your current code to Lightning - :header: Convert code to PyTorch Lightning - :button_link: starter/converting.html - - -.. raw:: html - -
-
- -.. End of callout item section - -.. raw:: html - -
- -.. toctree:: - :maxdepth: 1 - :name: start - :caption: Get Started - - starter/introduction - Organize existing PyTorch into Lightning - - -.. toctree:: - :maxdepth: 2 - :name: levels - :caption: Level Up - - levels/core_skills - levels/intermediate - levels/advanced - levels/expert - -.. toctree:: - :maxdepth: 2 - :name: pl_docs - :caption: Core API - - common/lightning_module - common/trainer - -.. toctree:: - :maxdepth: 1 - :name: Common Workflows - :caption: Common Workflows - - Avoid overfitting - model/build_model.rst - common/hyperparameters - common/progress_bar - deploy/production - advanced/training_tricks - cli/lightning_cli - tuning/profiler - Finetune a model - Manage experiments - clouds/cluster - advanced/model_parallel - clouds/cloud_training - Save and load model progress - Save memory with half-precision - Train on single or multiple GPUs - Train on single or multiple HPUs - Train on single or multiple IPUs - Train on single or multiple TPUs - model/own_your_loop - -.. toctree:: - :maxdepth: 1 - :name: Glossary - :caption: Glossary - - Accelerators - Callback - Checkpointing - Cluster - Cloud checkpoint - Console Logging - Debugging - Early stopping - Experiment manager (Logger) - Fault tolerant training - Flash - Grid AI - GPU - Half precision - HPU - Inference - IPU - Lightning CLI - Lightning Lite - LightningDataModule - LightningModule - Lightning Transformers - Log - Loops - TPU - Metrics - Model - Model Parallel - Plugins - Progress bar - Production - Predict - Profiler - Pruning and Quantization - Remote filesystem and FSSPEC - Strategy registry - Style guide - Sweep - SWA - SLURM - Transfer learning - Trainer - Torch distributed - -.. toctree:: - :maxdepth: 1 - :name: Hands-on Examples - :caption: Hands-on Examples - :glob: - - PyTorch Lightning 101 class - From PyTorch to PyTorch Lightning [Blog] - From PyTorch to PyTorch Lightning [Video] - - -.. raw:: html - -
- -색인 및 검색 ------------------- - -* :ref:`genindex` -* :ref:`search` diff --git a/source/levels/advanced.rst b/source/levels/advanced.rst deleted file mode 100644 index 4ffe090..0000000 --- a/source/levels/advanced.rst +++ /dev/null @@ -1,87 +0,0 @@ - -############### -Advanced skills -############### - -Configure all aspects of Lightning for advanced usecases. - -.. join_slack:: - :align: left - ----- - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Level 15: Customize configs to run in production - :description: Enable composable YAMLs - :col_css: col-md-6 - :button_link: advanced_level_15.html - :height: 150 - :tag: advanced - -.. displayitem:: - :header: Level 16: Customize the trainer - :description: Inject custom code into the trainer and modify the progress bar. - :col_css: col-md-6 - :button_link: advanced_level_16.html - :height: 150 - :tag: advanced - -.. displayitem:: - :header: Level 17: Own the training loop - :description: Learn all the ways of owning your raw PyTorch loops with Lightning. - :col_css: col-md-6 - :button_link: advanced_level_17.html - :height: 150 - :tag: advanced - -.. displayitem:: - :header: Level 18: Enable advanced checkpointing - :description: Enable composable or cloud based checkpoints. - :col_css: col-md-6 - :button_link: advanced_level_18.html - :height: 150 - :tag: advanced - -.. displayitem:: - :header: Level 19: Explore IPUs - :description: Explore Intelligence Processing Unit (IPU) for model scaling. - :col_css: col-md-6 - :button_link: advanced_level_19.html - :height: 150 - :tag: advanced - -.. displayitem:: - :header: Level 20: Explore HPUs - :description: Explore Habana Gaudi Processing Unit (HPU) for model scaling. - :col_css: col-md-6 - :button_link: advanced_level_20.html - :height: 150 - :tag: advanced - -.. displayitem:: - :header: Level 21: Master TPUs - :description: Master TPUs and run on cloud TPUs. - :col_css: col-md-6 - :button_link: advanced_level_21.html - :height: 150 - :tag: advanced - -.. displayitem:: - :header: Level 22: Reach 1 trillion parameters on GPUs - :description: Scale to 1 trillion params on GPUs. - :col_css: col-md-6 - :button_link: advanced_level_22.html - :height: 150 - :tag: advanced - -.. raw:: html - -
-
diff --git a/source/levels/advanced_level_17.rst b/source/levels/advanced_level_17.rst deleted file mode 100644 index c05c8c9..0000000 --- a/source/levels/advanced_level_17.rst +++ /dev/null @@ -1,45 +0,0 @@ -:orphan: - -############################### -Level 17: Own the training loop -############################### - -Learn all the ways of owning your raw PyTorch loops with Lightning. - ----- - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Enable manual optimization - :description: Gain control of the training loop with manual optimization and LightningModule methods. - :col_css: col-md-4 - :button_link: ../model/build_model_advanced.html - :height: 150 - :tag: advanced - -.. displayitem:: - :header: Use a Raw PyTorch Loop - :description: Migrate complex PyTorch projects to Lightning and push bleeding-edge research with the raw PyTorch loop. - :col_css: col-md-4 - :button_link: ../model/build_model_expert.html - :height: 150 - :tag: advanced - -.. displayitem:: - :header: Make a custom Lightning Loop - :description: Conduct bleeding-edge research like meta-learning and RL with a custom Loop. - :col_css: col-md-4 - :button_link: ../extensions/loops.html - :height: 150 - :tag: expert - -.. raw:: html - -
-
diff --git a/source/levels/expert.rst b/source/levels/expert.rst deleted file mode 100644 index d41680b..0000000 --- a/source/levels/expert.rst +++ /dev/null @@ -1,63 +0,0 @@ - -############# -Expert skills -############# - -Customize and extend Lightning for things like custom hardware or distributed strategies. - -.. join_slack:: - :align: left - ----- - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Level 23: Extend the Lightning CLI - :description: Extend the functionality of the Lightning CLI. - :col_css: col-md-6 - :button_link: expert_level_23.html - :height: 150 - :tag: expert - -.. displayitem:: - :header: Level 24: Integrate a custom cluster - :description: Integrate a custom cluster into Lightning. - :col_css: col-md-6 - :button_link: expert_level_24.html - :height: 150 - :tag: expert - -.. displayitem:: - :header: Level 25: Explore fault-tolerance in-depth - :description: Understand the details of fault-tolerance. - :col_css: col-md-6 - :button_link: ../clouds/fault_tolerant_training_faq.html - :height: 150 - :tag: expert - -.. displayitem:: - :header: Level 26: Make your own profiler - :description: Make your own profiler. - :col_css: col-md-6 - :button_link: ../tuning/profiler_expert.html - :height: 150 - :tag: expert - -.. displayitem:: - :header: Level 27: Add a new accelerator or Strategy - :description: Integrate a new accelerator or distributed strategy. - :col_css: col-md-6 - :button_link: expert_level_27.html - :height: 150 - :tag: expert - -.. raw:: html - -
-
diff --git a/source/levels/expert_level_24.rst b/source/levels/expert_level_24.rst deleted file mode 100644 index b32a8ac..0000000 --- a/source/levels/expert_level_24.rst +++ /dev/null @@ -1,37 +0,0 @@ -:orphan: - -#################################### -Level 24: Integrate a custom cluster -#################################### - -Integrate a custom cluster into Lightning. - ----- - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Integrate your own cluster - :description: Learn how to integrate your own cluster - :col_css: col-md-6 - :button_link: ../clouds/cluster_expert.html - :height: 150 - :tag: expert - -.. displayitem:: - :header: Run on your own cloud - :description: Learn how to run on your Company or University private clouds. - :col_css: col-md-6 - :button_link: ../clouds/run_expert.html - :height: 150 - :tag: expert - -.. raw:: html - -
-
diff --git a/source/levels/intermediate.rst b/source/levels/intermediate.rst deleted file mode 100644 index 331e477..0000000 --- a/source/levels/intermediate.rst +++ /dev/null @@ -1,89 +0,0 @@ - -################### -Intermediate skills -################### - -Learn to scale up your models and enable collaborative model development at academic or industry research labs. - -.. join_slack:: - :align: left - ----- - -.. include:: ../links.rst - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Level 7: Interactive cloud development - :description: Learn how to access GPUs and TPUs on the cloud. - :button_link: intermediate_level_7.html - :col_css: col-md-6 - :height: 150 - :tag: intermediate - -.. displayitem:: - :header: Level 8: Train in the background on the cloud - :description: Learn how to run models on the cloud in the background. - :button_link: intermediate_level_8.html - :col_css: col-md-6 - :height: 150 - :tag: intermediate - -.. displayitem:: - :header: Level 9: Modularize your projects - :description: Create DataModules to enable dataset reusability. - :col_css: col-md-6 - :button_link: intermediate_level_9.html - :height: 150 - :tag: intermediate - -.. displayitem:: - :header: Level 10: Understand your model - :description: Use advanced visuals to find the best performing model. - :col_css: col-md-6 - :button_link: intermediate_level_10.html - :height: 150 - :tag: intermediate - -.. displayitem:: - :header: Level 11: Explore SOTA scaling techniques - :description: Explore SOTA techniques to help convergence, stability and scalability. - :col_css: col-md-6 - :button_link: intermediate_level_11.html - :height: 150 - :tag: intermediate - -.. displayitem:: - :header: Level 12: Deploy your models - :description: Learn how to deploy your models with optimizations like ONNX and torchscript. - :col_css: col-md-6 - :button_link: intermediate_level_12.html - :height: 150 - :tag: intermediate - -.. displayitem:: - :header: Level 13: Optimize training speed - :description: Use advanced profilers to mixed precision to train bigger models, faster. - :col_css: col-md-6 - :button_link: intermediate_level_13.html - :height: 150 - :tag: intermediate - -.. displayitem:: - :header: Level 14: Run on on-prem clusters - :description: Run on a custom on-prem cluster or SLURM cluster. - :col_css: col-md-6 - :button_link: intermediate_level_14.html - :height: 150 - :tag: intermediate - -.. 
raw:: html - -
-
diff --git a/source/levels/intermediate_level_8.rst b/source/levels/intermediate_level_8.rst deleted file mode 100644 index 190364a..0000000 --- a/source/levels/intermediate_level_8.rst +++ /dev/null @@ -1,53 +0,0 @@ -:orphan: - -################################ -Level 8: Run models on the cloud -################################ - -Learn to run models on the cloud in the background asynchronously. - ----- - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: 1: Run a model in the background on the cloud - :description: Learn to run a model in the background on a cloud machine. - :col_css: col-md-6 - :button_link: ../clouds/run_basic.html - :height: 150 - :tag: intermediate - -.. displayitem:: - :header: 2: Save up to 80% on cloud costs with fault-tolerant training - :description: Run on the cloud for 1/10th the price with fault-tolerant training. - :col_css: col-md-6 - :button_link: ../clouds/fault_tolerant_training_basic.html - :height: 150 - :tag: intermediate - -.. displayitem:: - :header: 3: Run many models at once - :description: Run many models at once (sweep) to find the best performing model. - :col_css: col-md-6 - :button_link: ../clouds/run_intermediate.html - :height: 150 - :tag: intermediate - -.. displayitem:: - :header: 4: Run on your own cloud - :description: Learn how to run on your Company or University private clouds. - :col_css: col-md-6 - :button_link: ../clouds/run_expert.html - :height: 150 - :tag: expert - -.. raw:: html - -
-
diff --git a/source/model/build_model.rst b/source/model/build_model.rst deleted file mode 100644 index 8d12110..0000000 --- a/source/model/build_model.rst +++ /dev/null @@ -1,55 +0,0 @@ -:orphan: - -############# -Build a Model -############# - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: 1: Train a model - :description: Build a model to learn the basic ideas of Lightning - :col_css: col-md-4 - :button_link: train_model_basic.html - :height: 150 - :tag: basic - -.. displayitem:: - :header: 2: Validate and test a model - :description: Add a validation and test data split to avoid overfitting. - :col_css: col-md-4 - :button_link: validate_model_basic.html - :height: 150 - :tag: basic - -.. displayitem:: - :header: 3: Supercharge training - :description: Enable state-of-the-art training techniques with the Trainer features. - :col_css: col-md-4 - :button_link: build_model_intermediate.html - :height: 150 - :tag: intermediate - -.. displayitem:: - :header: LightningModule API - :description: Dig into LightningModule API in depth - :col_css: col-md-4 - :button_link: ../common/lightning_module.html#lightningmodule-api - :height: 150 - -.. displayitem:: - :header: Trainer API - :description: Dig into Trainer API in depth - :col_css: col-md-4 - :button_link: ../common/trainer.html#trainer-class-api - :height: 150 - -.. raw:: html - -
-
diff --git a/source/model/build_model_expert.rst b/source/model/build_model_expert.rst deleted file mode 100644 index f321e90..0000000 --- a/source/model/build_model_expert.rst +++ /dev/null @@ -1,7 +0,0 @@ -:orphan: - -######################### -Raw PyTorch loop (expert) -######################### - -.. include:: ../starter/lightning_lite.rst diff --git a/source/model/manual_optimization.rst b/source/model/manual_optimization.rst deleted file mode 100644 index e4a31dd..0000000 --- a/source/model/manual_optimization.rst +++ /dev/null @@ -1,290 +0,0 @@ -******************* -Manual Optimization -******************* - -For advanced research topics like reinforcement learning, sparse coding, or GAN research, it may be desirable to -manually manage the optimization process. - -This is only recommended for experts who need ultimate flexibility. -Lightning will handle only accelerator, precision and strategy logic. -The users are left with ``optimizer.zero_grad()``, gradient accumulation, model toggling, etc.. - -To manually optimize, do the following: - -* Set ``self.automatic_optimization=False`` in your ``LightningModule``'s ``__init__``. -* Use the following functions and call them manually: - - * ``self.optimizers()`` to access your optimizers (one or multiple) - * ``optimizer.zero_grad()`` to clear the gradients from the previous training step - * ``self.manual_backward(loss)`` instead of ``loss.backward()`` - * ``optimizer.step()`` to update your model parameters - -Here is a minimal example of manual optimization. - -.. testcode:: python - - from pytorch_lightning import LightningModule - - - class MyModel(LightningModule): - def __init__(self): - super().__init__() - # Important: This property activates manual optimization. - self.automatic_optimization = False - - def training_step(self, batch, batch_idx): - opt = self.optimizers() - opt.zero_grad() - loss = self.compute_loss(batch) - self.manual_backward(loss) - opt.step() - -.. 
warning:: - Before 1.2, ``optimizer.step()`` was calling ``optimizer.zero_grad()`` internally. - From 1.2, it is left to the user's expertise. - -.. tip:: - Be careful where you call ``optimizer.zero_grad()``, or your model won't converge. - It is good practice to call ``optimizer.zero_grad()`` before ``self.manual_backward(loss)``. - - -Access your Own Optimizer -========================= - -The provided ``optimizer`` is a :class:`~pytorch_lightning.core.optimizer.LightningOptimizer` object wrapping your own optimizer -configured in your :meth:`~pytorch_lightning.core.lightning.LightningModule.configure_optimizers`. You can access your own optimizer -with ``optimizer.optimizer``. However, if you use your own optimizer to perform a step, Lightning won't be able to -support accelerators, precision and profiling for you. - -.. testcode:: python - - class Model(LightningModule): - def __init__(self): - super().__init__() - self.automatic_optimization = False - ... - - def training_step(self, batch, batch_idx): - optimizer = self.optimizers() - - # `optimizer` is a `LightningOptimizer` wrapping the optimizer. - # To access it, do the following. - # However, it won't work on TPU, AMP, etc... - optimizer = optimizer.optimizer - ... - -Gradient Accumulation -===================== - -You can accumulate gradients over batches similarly to ``accumulate_grad_batches`` argument in -:ref:`Trainer ` for automatic optimization. To perform gradient accumulation with one optimizer -after every ``N`` steps, you can do as such. - -.. 
testcode:: python - - def __init__(self): - super().__init__() - self.automatic_optimization = False - - - def training_step(self, batch, batch_idx): - opt = self.optimizers() - - loss = self.compute_loss(batch) - self.manual_backward(loss) - - # accumulate gradients of N batches - if (batch_idx + 1) % N == 0: - opt.step() - opt.zero_grad() - - -Use Multiple Optimizers (like GANs) -=================================== - -Here is an example training a simple GAN with multiple optimizers using manual optimization. - -.. testcode:: python - - import torch - from torch import Tensor - from pytorch_lightning import LightningModule - - - class SimpleGAN(LightningModule): - def __init__(self): - super().__init__() - self.G = Generator() - self.D = Discriminator() - - # Important: This property activates manual optimization. - self.automatic_optimization = False - - def sample_z(self, n) -> Tensor: - sample = self._Z.sample((n,)) - return sample - - def sample_G(self, n) -> Tensor: - z = self.sample_z(n) - return self.G(z) - - def training_step(self, batch, batch_idx): - # Implementation follows the PyTorch tutorial: - # https://pytorch.org/tutorials/beginner/dcgan_faces_tutorial.html - g_opt, d_opt = self.optimizers() - - X, _ = batch - batch_size = X.shape[0] - - real_label = torch.ones((batch_size, 1), device=self.device) - fake_label = torch.zeros((batch_size, 1), device=self.device) - - g_X = self.sample_G(batch_size) - - ########################## - # Optimize Discriminator # - ########################## - d_x = self.D(X) - errD_real = self.criterion(d_x, real_label) - - d_z = self.D(g_X.detach()) - errD_fake = self.criterion(d_z, fake_label) - - errD = errD_real + errD_fake - - d_opt.zero_grad() - self.manual_backward(errD) - d_opt.step() - - ###################### - # Optimize Generator # - ###################### - d_z = self.D(g_X) - errG = self.criterion(d_z, real_label) - - g_opt.zero_grad() - self.manual_backward(errG) - g_opt.step() - - self.log_dict({"g_loss": 
errG, "d_loss": errD}, prog_bar=True) - - def configure_optimizers(self): - g_opt = torch.optim.Adam(self.G.parameters(), lr=1e-5) - d_opt = torch.optim.Adam(self.D.parameters(), lr=1e-5) - return g_opt, d_opt - - -Learning Rate Scheduling -======================== - -Every optimizer you use can be paired with any -`Learning Rate Scheduler `_. Please see the -documentation of :meth:`~pytorch_lightning.core.lightning.LightningModule.configure_optimizers` for all the available options - -You can call ``lr_scheduler.step()`` at arbitrary intervals. -Use ``self.lr_schedulers()`` in your :class:`~pytorch_lightning.core.lightning.LightningModule` to access any learning rate schedulers -defined in your :meth:`~pytorch_lightning.core.lightning.LightningModule.configure_optimizers`. - -.. warning:: - * Before v1.3, Lightning automatically called ``lr_scheduler.step()`` in both automatic and manual optimization. From - 1.3, ``lr_scheduler.step()`` is now for the user to call at arbitrary intervals. - * Note that the ``lr_scheduler_config`` keys, such as ``"frequency"`` and ``"interval"``, will be ignored even if they are provided in - your :meth:`~pytorch_lightning.core.lightning.LightningModule.configure_optimizers` during manual optimization. - -Here is an example calling ``lr_scheduler.step()`` every step. - -.. testcode:: python - - # step every batch - def __init__(self): - super().__init__() - self.automatic_optimization = False - - - def training_step(self, batch, batch_idx): - # do forward, backward, and optimization - ... - - # single scheduler - sch = self.lr_schedulers() - sch.step() - - # multiple schedulers - sch1, sch2 = self.lr_schedulers() - sch1.step() - sch2.step() - -If you want to call ``lr_scheduler.step()`` every ``N`` steps/epochs, do the following. - -.. testcode:: python - - def __init__(self): - super().__init__() - self.automatic_optimization = False - - - def training_step(self, batch, batch_idx): - # do forward, backward, and optimization - ... 
- - sch = self.lr_schedulers() - - # step every N batches - if (batch_idx + 1) % N == 0: - sch.step() - - # step every N epochs - if self.trainer.is_last_batch and (self.trainer.current_epoch + 1) % N == 0: - sch.step() - -If you want to call schedulers that require a metric value after each epoch, consider doing the following: - -.. testcode:: - - def __init__(self): - super().__init__() - self.automatic_optimization = False - - - def training_epoch_end(self, outputs): - sch = self.lr_schedulers() - - # If the selected scheduler is a ReduceLROnPlateau scheduler. - if isinstance(sch, torch.optim.lr_scheduler.ReduceLROnPlateau): - sch.step(self.trainer.callback_metrics["loss"]) - -Use Closure for LBFGS-like Optimizers -===================================== - -It is a good practice to provide the optimizer with a closure function that performs a ``forward``, ``zero_grad`` and -``backward`` of your model. It is optional for most optimizers, but makes your code compatible if you switch to an -optimizer which requires a closure, such as :class:`~torch.optim.LBFGS`. - -See `the PyTorch docs `_ for more about the closure. - -Here is an example using a closure function. - -.. testcode:: python - - def __init__(self): - super().__init__() - self.automatic_optimization = False - - - def configure_optimizers(self): - return torch.optim.LBFGS(...) - - - def training_step(self, batch, batch_idx): - opt = self.optimizers() - - def closure(): - loss = self.compute_loss(batch) - opt.zero_grad() - self.manual_backward(loss) - return loss - - opt.step(closure=closure) - -.. warning:: - The :class:`~torch.optim.LBFGS` optimizer is not supported for apex AMP, native AMP, IPUs, or DeepSpeed. 
diff --git a/source/model/own_your_loop.rst b/source/model/own_your_loop.rst deleted file mode 100644 index 5982b0a..0000000 --- a/source/model/own_your_loop.rst +++ /dev/null @@ -1,41 +0,0 @@ -:orphan: - -################################ -Use a pure PyTorch training loop -################################ - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Enable manual optimization - :description: Gain control of the training loop with manual optimization and LightningModule methods. - :col_css: col-md-4 - :button_link: build_model_advanced.html - :height: 150 - :tag: advanced - -.. displayitem:: - :header: Use a Raw PyTorch Loop - :description: Migrate complex PyTorch projects to Lightning and push bleeding-edge research with the raw PyTorch loop. - :col_css: col-md-4 - :button_link: build_model_expert.html - :height: 150 - :tag: advanced - -.. displayitem:: - :header: Make a custom Lightning Loop - :description: Conduct bleeding-edge research like meta-learning and RL with a custom Loop. - :col_css: col-md-4 - :button_link: loops.html - :height: 150 - :tag: expert - -.. raw:: html - -
-
diff --git a/source/notebooks/course_UvA-DL/01-introduction-to-pytorch.ipynb b/source/notebooks/course_UvA-DL/01-introduction-to-pytorch.ipynb deleted file mode 100644 index cdf4ec3..0000000 --- a/source/notebooks/course_UvA-DL/01-introduction-to-pytorch.ipynb +++ /dev/null @@ -1 +0,0 @@ -{"cells": [{"cell_type": "markdown", "id": "c1ca2a69", "metadata": {"papermill": {"duration": 0.179789, "end_time": "2021-12-04T15:53:22.277549", "exception": false, "start_time": "2021-12-04T15:53:22.097760", "status": "completed"}, "tags": []}, "source": ["\n", "# Tutorial 1: Introduction to PyTorch\n", "\n", "* **Author:** Phillip Lippe\n", "* **License:** CC BY-SA\n", "* **Generated:** 2021-12-04T16:52:44.026092\n", "\n", "This tutorial will give a short introduction to PyTorch basics, and get you setup for writing your own neural networks.\n", "This notebook is part of a lecture series on Deep Learning at the University of Amsterdam.\n", "The full list of tutorials can be found at https://uvadlc-notebooks.rtfd.io.\n", "\n", "\n", "---\n", "Open in [![Open In Colab](){height=\"20px\" width=\"117px\"}](https://colab.research.google.com/github/PytorchLightning/lightning-tutorials/blob/publication/.notebooks/course_UvA-DL/01-introduction-to-pytorch.ipynb)\n", "\n", "Give us a \u2b50 [on Github](https://www.github.com/PytorchLightning/pytorch-lightning/)\n", "| Check out [the documentation](https://pytorch-lightning.readthedocs.io/en/latest/)\n", "| Join us [on Slack](https://join.slack.com/t/pytorch-lightning/shared_invite/zt-pw5v393p-qRaDgEk24~EjiZNBpSQFgQ)"]}, {"cell_type": "markdown", "id": "8387d057", "metadata": {"papermill": {"duration": 0.177673, "end_time": "2021-12-04T15:53:22.631831", "exception": false, "start_time": "2021-12-04T15:53:22.454158", "status": "completed"}, "tags": []}, "source": ["## Setup\n", "This notebook requires some packages besides pytorch-lightning."]}, {"cell_type": "code", "execution_count": 1, "id": "9d8201a6", "metadata": {"colab": {}, 
"colab_type": "code", "execution": {"iopub.execute_input": "2021-12-04T15:53:22.994731Z", "iopub.status.busy": "2021-12-04T15:53:22.994231Z", "iopub.status.idle": "2021-12-04T15:53:25.459580Z", "shell.execute_reply": "2021-12-04T15:53:25.459996Z"}, "id": "LfrJLKPFyhsK", "lines_to_next_cell": 0, "papermill": {"duration": 2.651811, "end_time": "2021-12-04T15:53:25.460282", "exception": false, "start_time": "2021-12-04T15:53:22.808471", "status": "completed"}, "tags": []}, "outputs": [], "source": ["! pip install --quiet \"torchmetrics>=0.3\" \"matplotlib\" \"torch>=1.6, <1.9\" \"pytorch-lightning>=1.3\""]}, {"cell_type": "markdown", "id": "3ef762bf", "metadata": {"papermill": {"duration": 0.180076, "end_time": "2021-12-04T15:53:25.821045", "exception": false, "start_time": "2021-12-04T15:53:25.640969", "status": "completed"}, "tags": []}, "source": ["
\n", "Welcome to our PyTorch tutorial for the Deep Learning course 2020 at the University of Amsterdam!\n", "The following notebook is meant to give a short introduction to PyTorch basics, and get you setup for writing your own neural networks.\n", "PyTorch is an open source machine learning framework that allows you to write your own neural networks and optimize them efficiently.\n", "However, PyTorch is not the only framework of its kind.\n", "Alternatives to PyTorch include [TensorFlow](https://www.tensorflow.org/), [JAX](https://github.com/google/jax) and [Caffe](http://caffe.berkeleyvision.org/).\n", "We choose to teach PyTorch at the University of Amsterdam because it is well established, has a huge developer community (originally developed by Facebook), is very flexible and especially used in research.\n", "Many current papers publish their code in PyTorch, and thus it is good to be familiar with PyTorch as well.\n", "Meanwhile, TensorFlow (developed by Google) is usually known for being a production-grade deep learning library.\n", "Still, if you know one machine learning framework in depth, it is very easy to learn another one because many of them use the same concepts and ideas.\n", "For instance, TensorFlow's version 2 was heavily inspired by the most popular features of PyTorch, making the frameworks even more similar.\n", "If you are already familiar with PyTorch and have created your own neural network projects, feel free to just skim this notebook.\n", "\n", "We are of course not the first ones to create a PyTorch tutorial.\n", "There are many great tutorials online, including the [\"60-min blitz\"](https://pytorch.org/tutorials/beginner/deep_learning_60min_blitz.html) on the official [PyTorch website](https://pytorch.org/tutorials/).\n", "Yet, we choose to create our own tutorial which is designed to give you the basics particularly necessary for the practicals, but still understand how PyTorch works under the hood.\n", "Over the next few weeks, we 
will also keep exploring new PyTorch features in the series of Jupyter notebook tutorials about deep learning.\n", "\n", "We will use a set of standard libraries that are often used in machine learning projects.\n", "If you are running this notebook on Google Colab, all libraries should be pre-installed.\n", "If you are running this notebook locally, make sure you have installed our `dl2020` environment ([link](https://github.com/uvadlc/uvadlc_practicals_2020/blob/master/environment.yml)) and have activated it."]}, {"cell_type": "code", "execution_count": 2, "id": "fd4e9d73", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:53:26.189594Z", "iopub.status.busy": "2021-12-04T15:53:26.189116Z", "iopub.status.idle": "2021-12-04T15:53:27.107430Z", "shell.execute_reply": "2021-12-04T15:53:27.107817Z"}, "papermill": {"duration": 1.106304, "end_time": "2021-12-04T15:53:27.107981", "exception": false, "start_time": "2021-12-04T15:53:26.001677", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["/tmp/ipykernel_739/4100430984.py:14: DeprecationWarning: `set_matplotlib_formats` is deprecated since IPython 7.23, directly use `matplotlib_inline.backend_inline.set_matplotlib_formats()`\n", " set_matplotlib_formats(\"svg\", \"pdf\")\n"]}], "source": ["import time\n", "\n", "import matplotlib.pyplot as plt\n", "import numpy as np\n", "import torch\n", "import torch.nn as nn\n", "import torch.utils.data as data\n", "\n", "%matplotlib inline\n", "from IPython.display import set_matplotlib_formats\n", "from matplotlib.colors import to_rgba\n", "from tqdm.notebook import tqdm # Progress bar\n", "\n", "set_matplotlib_formats(\"svg\", \"pdf\")"]}, {"cell_type": "markdown", "id": "e6ab2b50", "metadata": {"papermill": {"duration": 0.177291, "end_time": "2021-12-04T15:53:27.467274", "exception": false, "start_time": "2021-12-04T15:53:27.289983", "status": "completed"}, "tags": []}, "source": ["## The Basics of PyTorch\n", 
"\n", "We will start with reviewing the very basic concepts of PyTorch.\n", "As a prerequisite, we recommend to be familiar with the `numpy` package as most machine learning frameworks are based on very similar concepts.\n", "If you are not familiar with numpy yet, don't worry: here is a [tutorial](https://numpy.org/devdocs/user/quickstart.html) to go through.\n", "\n", "So, let's start with importing PyTorch.\n", "The package is called `torch`, based on its original framework [Torch](http://torch.ch/).\n", "As a first step, we can check its version:"]}, {"cell_type": "code", "execution_count": 3, "id": "11531bd1", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:53:27.828703Z", "iopub.status.busy": "2021-12-04T15:53:27.828236Z", "iopub.status.idle": "2021-12-04T15:53:27.830237Z", "shell.execute_reply": "2021-12-04T15:53:27.830613Z"}, "papermill": {"duration": 0.186067, "end_time": "2021-12-04T15:53:27.830761", "exception": false, "start_time": "2021-12-04T15:53:27.644694", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Using torch 1.8.1+cu102\n"]}], "source": ["print(\"Using torch\", torch.__version__)"]}, {"cell_type": "markdown", "id": "09c6bc8c", "metadata": {"papermill": {"duration": 0.180813, "end_time": "2021-12-04T15:53:28.192377", "exception": false, "start_time": "2021-12-04T15:53:28.011564", "status": "completed"}, "tags": []}, "source": ["At the time of writing this tutorial (mid of August 2021), the current stable version is 1.9.\n", "You should therefore see the output `Using torch 1.9.0`, eventually with some extension for the CUDA version on Colab.\n", "In case you use the `dl2020` environment, you should see `Using torch 1.6.0` since the environment was provided in October 2020.\n", "It is recommended to update the PyTorch version to the newest one.\n", "If you see a lower version number than 1.6, make sure you have installed the correct the environment, or ask one of your 
TAs.\n", "In case PyTorch 1.10 or newer is published during the time of the course, don't worry.\n", "The interface between PyTorch versions doesn't change too much, and hence all code should also be runnable with newer versions.\n", "\n", "As in every machine learning framework, PyTorch provides functions that are stochastic, like generating random numbers.\n", "However, a very good practice is to set up your code to be reproducible with the exact same random numbers.\n", "This is why we set a seed below."]}, {"cell_type": "code", "execution_count": 4, "id": "541190c5", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:53:28.555309Z", "iopub.status.busy": "2021-12-04T15:53:28.554820Z", "iopub.status.idle": "2021-12-04T15:53:28.559934Z", "shell.execute_reply": "2021-12-04T15:53:28.560320Z"}, "papermill": {"duration": 0.188101, "end_time": "2021-12-04T15:53:28.560451", "exception": false, "start_time": "2021-12-04T15:53:28.372350", "status": "completed"}, "tags": []}, "outputs": [{"data": {"text/plain": [""]}, "execution_count": 4, "metadata": {}, "output_type": "execute_result"}], "source": ["torch.manual_seed(42) # Setting the seed"]}, {"cell_type": "markdown", "id": "07432939", "metadata": {"papermill": {"duration": 0.179782, "end_time": "2021-12-04T15:53:28.920061", "exception": false, "start_time": "2021-12-04T15:53:28.740279", "status": "completed"}, "tags": []}, "source": ["### Tensors\n", "\n", "Tensors are the PyTorch equivalent to Numpy arrays, with the addition of support for GPU acceleration (more on that later).\n", "The name \"tensor\" is a generalization of concepts you already know.\n", "For instance, a vector is a 1-D tensor, and a matrix a 2-D tensor.\n", "When working with neural networks, we will use tensors of various shapes and number of dimensions.\n", "\n", "Most common functions you know from numpy can be used on tensors as well.\n", "Actually, since numpy arrays are so similar to tensors, we can convert most 
tensors to numpy arrays (and back) but we don't need it too often.\n", "\n", "#### Initialization\n", "\n", "Let's first start by looking at different ways of creating a tensor.\n", "There are many possible options, the most simple one is to call\n", "`torch.Tensor` passing the desired shape as input argument:"]}, {"cell_type": "code", "execution_count": 5, "id": "9a7c7abb", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:53:29.290240Z", "iopub.status.busy": "2021-12-04T15:53:29.289779Z", "iopub.status.idle": "2021-12-04T15:53:29.293533Z", "shell.execute_reply": "2021-12-04T15:53:29.293096Z"}, "papermill": {"duration": 0.186675, "end_time": "2021-12-04T15:53:29.293645", "exception": false, "start_time": "2021-12-04T15:53:29.106970", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["tensor([[[-8.4362e+34, 4.5652e-41, -2.7143e-34, -4.6629e+13],\n", " [-1.2059e+35, 4.5652e-41, -8.4184e+34, 4.5652e-41],\n", " [ 9.5052e-38, 2.5041e-19, -1.1549e+35, 4.5652e-41]],\n", "\n", " [[-8.4185e+34, 4.5652e-41, 1.1811e+06, 6.3794e+25],\n", " [-1.2059e+35, 4.5652e-41, -8.4186e+34, 4.5652e-41],\n", " [ 1.1561e+02, 3.9652e+37, -1.2049e+35, 4.5652e-41]]])\n"]}], "source": ["x = torch.Tensor(2, 3, 4)\n", "print(x)"]}, {"cell_type": "markdown", "id": "c3259cdd", "metadata": {"papermill": {"duration": 0.182347, "end_time": "2021-12-04T15:53:29.658142", "exception": false, "start_time": "2021-12-04T15:53:29.475795", "status": "completed"}, "tags": []}, "source": ["The function `torch.Tensor` allocates memory for the desired tensor, but reuses any values that have already been in the memory.\n", "To directly assign values to the tensor during initialization, there are many alternatives including:\n", "\n", "* `torch.zeros`: Creates a tensor filled with zeros\n", "* `torch.ones`: Creates a tensor filled with ones\n", "* `torch.rand`: Creates a tensor with random values uniformly sampled between 0 and 1\n", "* 
`torch.randn`: Creates a tensor with random values sampled from a normal distribution with mean 0 and variance 1\n", "* `torch.arange`: Creates a tensor containing the values $N,N+1,N+2,...,M$\n", "* `torch.Tensor` (input list): Creates a tensor from the list elements you provide"]}, {"cell_type": "code", "execution_count": 6, "id": "d7d674fc", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:53:30.029266Z", "iopub.status.busy": "2021-12-04T15:53:30.028795Z", "iopub.status.idle": "2021-12-04T15:53:30.031289Z", "shell.execute_reply": "2021-12-04T15:53:30.031670Z"}, "papermill": {"duration": 0.18988, "end_time": "2021-12-04T15:53:30.031801", "exception": false, "start_time": "2021-12-04T15:53:29.841921", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["tensor([[1., 2.],\n", " [3., 4.]])\n"]}], "source": ["# Create a tensor from a (nested) list\n", "x = torch.Tensor([[1, 2], [3, 4]])\n", "print(x)"]}, {"cell_type": "code", "execution_count": 7, "id": "2267c81e", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:53:30.409461Z", "iopub.status.busy": "2021-12-04T15:53:30.408988Z", "iopub.status.idle": "2021-12-04T15:53:30.411852Z", "shell.execute_reply": "2021-12-04T15:53:30.412236Z"}, "papermill": {"duration": 0.192911, "end_time": "2021-12-04T15:53:30.412364", "exception": false, "start_time": "2021-12-04T15:53:30.219453", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["tensor([[[0.8823, 0.9150, 0.3829, 0.9593],\n", " [0.3904, 0.6009, 0.2566, 0.7936],\n", " [0.9408, 0.1332, 0.9346, 0.5936]],\n", "\n", " [[0.8694, 0.5677, 0.7411, 0.4294],\n", " [0.8854, 0.5739, 0.2666, 0.6274],\n", " [0.2696, 0.4414, 0.2969, 0.8317]]])\n"]}], "source": ["# Create a tensor with random values between 0 and 1 with the shape [2, 3, 4]\n", "x = torch.rand(2, 3, 4)\n", "print(x)"]}, {"cell_type": "markdown", "id": "f11f5cfd", "metadata": {"papermill": 
{"duration": 0.184187, "end_time": "2021-12-04T15:53:30.778847", "exception": false, "start_time": "2021-12-04T15:53:30.594660", "status": "completed"}, "tags": []}, "source": ["You can obtain the shape of a tensor in the same way as in numpy (`x.shape`), or using the `.size` method:"]}, {"cell_type": "code", "execution_count": 8, "id": "217f784e", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:53:31.151326Z", "iopub.status.busy": "2021-12-04T15:53:31.150840Z", "iopub.status.idle": "2021-12-04T15:53:31.153313Z", "shell.execute_reply": "2021-12-04T15:53:31.153693Z"}, "papermill": {"duration": 0.191823, "end_time": "2021-12-04T15:53:31.153829", "exception": false, "start_time": "2021-12-04T15:53:30.962006", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Shape: torch.Size([2, 3, 4])\n", "Size: torch.Size([2, 3, 4])\n", "Size: 2 3 4\n"]}], "source": ["shape = x.shape\n", "print(\"Shape:\", x.shape)\n", "\n", "size = x.size()\n", "print(\"Size:\", size)\n", "\n", "dim1, dim2, dim3 = x.size()\n", "print(\"Size:\", dim1, dim2, dim3)"]}, {"cell_type": "markdown", "id": "692ea692", "metadata": {"papermill": {"duration": 0.18425, "end_time": "2021-12-04T15:53:31.521916", "exception": false, "start_time": "2021-12-04T15:53:31.337666", "status": "completed"}, "tags": []}, "source": ["#### Tensor to Numpy, and Numpy to Tensor\n", "\n", "Tensors can be converted to numpy arrays, and numpy arrays back to tensors.\n", "To transform a numpy array into a tensor, we can use the function `torch.from_numpy`:"]}, {"cell_type": "code", "execution_count": 9, "id": "52c87663", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:53:31.897321Z", "iopub.status.busy": "2021-12-04T15:53:31.896848Z", "iopub.status.idle": "2021-12-04T15:53:31.899783Z", "shell.execute_reply": "2021-12-04T15:53:31.899380Z"}, "papermill": {"duration": 0.193907, "end_time": "2021-12-04T15:53:31.899893", "exception": false, 
"start_time": "2021-12-04T15:53:31.705986", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Numpy array: [[1 2]\n", " [3 4]]\n", "PyTorch tensor: tensor([[1, 2],\n", " [3, 4]])\n"]}], "source": ["np_arr = np.array([[1, 2], [3, 4]])\n", "tensor = torch.from_numpy(np_arr)\n", "\n", "print(\"Numpy array:\", np_arr)\n", "print(\"PyTorch tensor:\", tensor)"]}, {"cell_type": "markdown", "id": "fe3837cb", "metadata": {"papermill": {"duration": 0.183323, "end_time": "2021-12-04T15:53:32.270124", "exception": false, "start_time": "2021-12-04T15:53:32.086801", "status": "completed"}, "tags": []}, "source": ["To transform a PyTorch tensor back to a numpy array, we can use the function `.numpy()` on tensors:"]}, {"cell_type": "code", "execution_count": 10, "id": "4a036f09", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:53:32.645038Z", "iopub.status.busy": "2021-12-04T15:53:32.644564Z", "iopub.status.idle": "2021-12-04T15:53:32.647718Z", "shell.execute_reply": "2021-12-04T15:53:32.647247Z"}, "papermill": {"duration": 0.193847, "end_time": "2021-12-04T15:53:32.647829", "exception": false, "start_time": "2021-12-04T15:53:32.453982", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["PyTorch tensor: tensor([0, 1, 2, 3])\n", "Numpy array: [0 1 2 3]\n"]}], "source": ["tensor = torch.arange(4)\n", "np_arr = tensor.numpy()\n", "\n", "print(\"PyTorch tensor:\", tensor)\n", "print(\"Numpy array:\", np_arr)"]}, {"cell_type": "markdown", "id": "7ed5a7da", "metadata": {"papermill": {"duration": 0.184638, "end_time": "2021-12-04T15:53:33.016987", "exception": false, "start_time": "2021-12-04T15:53:32.832349", "status": "completed"}, "tags": []}, "source": ["The conversion of tensors to numpy require the tensor to be on the CPU, and not the GPU (more on GPU support in a later section).\n", "In case you have a tensor on GPU, you need to call `.cpu()` on the tensor 
beforehand.\n", "Hence, you get a line like `np_arr = tensor.cpu().numpy()`."]}, {"cell_type": "markdown", "id": "e8e882b6", "metadata": {"papermill": {"duration": 0.183883, "end_time": "2021-12-04T15:53:33.386141", "exception": false, "start_time": "2021-12-04T15:53:33.202258", "status": "completed"}, "tags": []}, "source": ["#### Operations\n", "\n", "Most operations that exist in numpy, also exist in PyTorch.\n", "A full list of operations can be found in the [PyTorch documentation](https://pytorch.org/docs/stable/tensors.html#), but we will review the most important ones here.\n", "\n", "The simplest operation is to add two tensors:"]}, {"cell_type": "code", "execution_count": 11, "id": "a66afde2", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:53:33.763575Z", "iopub.status.busy": "2021-12-04T15:53:33.763098Z", "iopub.status.idle": "2021-12-04T15:53:33.768208Z", "shell.execute_reply": "2021-12-04T15:53:33.767800Z"}, "papermill": {"duration": 0.195513, "end_time": "2021-12-04T15:53:33.768317", "exception": false, "start_time": "2021-12-04T15:53:33.572804", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["X1 tensor([[0.1053, 0.2695, 0.3588],\n", " [0.1994, 0.5472, 0.0062]])\n", "X2 tensor([[0.9516, 0.0753, 0.8860],\n", " [0.5832, 0.3376, 0.8090]])\n", "Y tensor([[1.0569, 0.3448, 1.2448],\n", " [0.7826, 0.8848, 0.8151]])\n"]}], "source": ["x1 = torch.rand(2, 3)\n", "x2 = torch.rand(2, 3)\n", "y = x1 + x2\n", "\n", "print(\"X1\", x1)\n", "print(\"X2\", x2)\n", "print(\"Y\", y)"]}, {"cell_type": "markdown", "id": "3510743a", "metadata": {"papermill": {"duration": 0.188609, "end_time": "2021-12-04T15:53:34.145802", "exception": false, "start_time": "2021-12-04T15:53:33.957193", "status": "completed"}, "tags": []}, "source": ["Calling `x1 + x2` creates a new tensor containing the sum of the two inputs.\n", "However, we can also use in-place operations that are applied directly on the memory of a 
tensor.\n", "We therefore change the values of `x2` without the chance to re-access the values of `x2` before the operation.\n", "An example is shown below:"]}, {"cell_type": "code", "execution_count": 12, "id": "93e2d0e2", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:53:34.523641Z", "iopub.status.busy": "2021-12-04T15:53:34.523169Z", "iopub.status.idle": "2021-12-04T15:53:34.528393Z", "shell.execute_reply": "2021-12-04T15:53:34.528008Z"}, "papermill": {"duration": 0.195416, "end_time": "2021-12-04T15:53:34.528506", "exception": false, "start_time": "2021-12-04T15:53:34.333090", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["X1 (before) tensor([[0.5779, 0.9040, 0.5547],\n", " [0.3423, 0.6343, 0.3644]])\n", "X2 (before) tensor([[0.7104, 0.9464, 0.7890],\n", " [0.2814, 0.7886, 0.5895]])\n", "X1 (after) tensor([[0.5779, 0.9040, 0.5547],\n", " [0.3423, 0.6343, 0.3644]])\n", "X2 (after) tensor([[1.2884, 1.8504, 1.3437],\n", " [0.6237, 1.4230, 0.9539]])\n"]}], "source": ["x1 = torch.rand(2, 3)\n", "x2 = torch.rand(2, 3)\n", "print(\"X1 (before)\", x1)\n", "print(\"X2 (before)\", x2)\n", "\n", "x2.add_(x1)\n", "print(\"X1 (after)\", x1)\n", "print(\"X2 (after)\", x2)"]}, {"cell_type": "markdown", "id": "acae6209", "metadata": {"papermill": {"duration": 0.189916, "end_time": "2021-12-04T15:53:34.905098", "exception": false, "start_time": "2021-12-04T15:53:34.715182", "status": "completed"}, "tags": []}, "source": ["In-place operations are usually marked with an underscore postfix (e.g. \"add_\" instead of \"add\").\n", "\n", "Another common operation aims at changing the shape of a tensor.\n", "A tensor of size (2,3) can be re-organized to any other shape with the same number of elements (e.g. 
a tensor of size (6), or (3,2), ...).\n", "In PyTorch, this operation is called `view`:"]}, {"cell_type": "code", "execution_count": 13, "id": "12e785e2", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:53:35.283833Z", "iopub.status.busy": "2021-12-04T15:53:35.283366Z", "iopub.status.idle": "2021-12-04T15:53:35.285936Z", "shell.execute_reply": "2021-12-04T15:53:35.290804Z"}, "papermill": {"duration": 0.19887, "end_time": "2021-12-04T15:53:35.290937", "exception": false, "start_time": "2021-12-04T15:53:35.092067", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["X tensor([0, 1, 2, 3, 4, 5])\n"]}], "source": ["x = torch.arange(6)\n", "print(\"X\", x)"]}, {"cell_type": "code", "execution_count": 14, "id": "68681255", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:53:35.669862Z", "iopub.status.busy": "2021-12-04T15:53:35.669397Z", "iopub.status.idle": "2021-12-04T15:53:35.672118Z", "shell.execute_reply": "2021-12-04T15:53:35.671721Z"}, "papermill": {"duration": 0.193577, "end_time": "2021-12-04T15:53:35.672223", "exception": false, "start_time": "2021-12-04T15:53:35.478646", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["X tensor([[0, 1, 2],\n", " [3, 4, 5]])\n"]}], "source": ["x = x.view(2, 3)\n", "print(\"X\", x)"]}, {"cell_type": "code", "execution_count": 15, "id": "b87c271d", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:53:36.053012Z", "iopub.status.busy": "2021-12-04T15:53:36.052549Z", "iopub.status.idle": "2021-12-04T15:53:36.055288Z", "shell.execute_reply": "2021-12-04T15:53:36.054885Z"}, "papermill": {"duration": 0.195401, "end_time": "2021-12-04T15:53:36.055396", "exception": false, "start_time": "2021-12-04T15:53:35.859995", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["X tensor([[0, 3],\n", " [1, 4],\n", " [2, 5]])\n"]}], "source": ["x = 
x.permute(1, 0) # Swapping dimension 0 and 1\n", "print(\"X\", x)"]}, {"cell_type": "markdown", "id": "b45990ab", "metadata": {"papermill": {"duration": 0.191632, "end_time": "2021-12-04T15:53:36.435435", "exception": false, "start_time": "2021-12-04T15:53:36.243803", "status": "completed"}, "tags": []}, "source": ["Other commonly used operations include matrix multiplications, which are essential for neural networks.\n", "Quite often, we have an input vector $\\mathbf{x}$, which is transformed using a learned weight matrix $\\mathbf{W}$.\n", "There are multiple ways and functions to perform matrix multiplication, some of which we list below:\n", "\n", "* `torch.matmul`: Performs the matrix product over two tensors, where the specific behavior depends on the dimensions.\n", "If both inputs are matrices (2-dimensional tensors), it performs the standard matrix product.\n", "For higher dimensional inputs, the function supports broadcasting (for details see the [documentation](https://pytorch.org/docs/stable/generated/torch.matmul.html?highlight=matmul#torch.matmul)).\n", "Can also be written as `a @ b`, similar to numpy.\n", "* `torch.mm`: Performs the matrix product over two matrices, but doesn't support broadcasting (see [documentation](https://pytorch.org/docs/stable/generated/torch.mm.html?highlight=torch%20mm#torch.mm))\n", "* `torch.bmm`: Performs the matrix product with support for a batch dimension.\n", "If the first tensor $T$ is of shape ($b\\times n\\times m$), and the second tensor $R$ ($b\\times m\\times p$), the output $O$ is of shape ($b\\times n\\times p$), and has been calculated by performing $b$ matrix multiplications of the submatrices of $T$ and $R$: $O_i = T_i @ R_i$\n", "* `torch.einsum`: Performs matrix multiplications and more (i.e. sums of products) using the Einstein summation convention.\n", "An explanation of the Einstein sum can be found in assignment 1.\n", "\n", "Usually, we use `torch.matmul` or `torch.bmm`. 
We can try a matrix multiplication with `torch.matmul` below."]}, {"cell_type": "code", "execution_count": 16, "id": "913092b1", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:53:36.816103Z", "iopub.status.busy": "2021-12-04T15:53:36.815637Z", "iopub.status.idle": "2021-12-04T15:53:36.818033Z", "shell.execute_reply": "2021-12-04T15:53:36.818409Z"}, "papermill": {"duration": 0.195078, "end_time": "2021-12-04T15:53:36.818538", "exception": false, "start_time": "2021-12-04T15:53:36.623460", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["X tensor([[0, 1, 2],\n", " [3, 4, 5]])\n"]}], "source": ["x = torch.arange(6)\n", "x = x.view(2, 3)\n", "print(\"X\", x)"]}, {"cell_type": "code", "execution_count": 17, "id": "aed345cb", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:53:37.208721Z", "iopub.status.busy": "2021-12-04T15:53:37.208252Z", "iopub.status.idle": "2021-12-04T15:53:37.212000Z", "shell.execute_reply": "2021-12-04T15:53:37.211600Z"}, "papermill": {"duration": 0.199386, "end_time": "2021-12-04T15:53:37.212109", "exception": false, "start_time": "2021-12-04T15:53:37.012723", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["W tensor([[0, 1, 2],\n", " [3, 4, 5],\n", " [6, 7, 8]])\n"]}], "source": ["W = torch.arange(9).view(3, 3) # We can also stack multiple operations in a single line\n", "print(\"W\", W)"]}, {"cell_type": "code", "execution_count": 18, "id": "ba15bb65", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:53:37.596703Z", "iopub.status.busy": "2021-12-04T15:53:37.596239Z", "iopub.status.idle": "2021-12-04T15:53:37.599133Z", "shell.execute_reply": "2021-12-04T15:53:37.598757Z"}, "papermill": {"duration": 0.197023, "end_time": "2021-12-04T15:53:37.599245", "exception": false, "start_time": "2021-12-04T15:53:37.402222", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", 
"output_type": "stream", "text": ["h tensor([[15, 18, 21],\n", " [42, 54, 66]])\n"]}], "source": ["h = torch.matmul(x, W) # Verify the result by calculating it by hand too!\n", "print(\"h\", h)"]}, {"cell_type": "markdown", "id": "e2969a0e", "metadata": {"papermill": {"duration": 0.191191, "end_time": "2021-12-04T15:53:37.983302", "exception": false, "start_time": "2021-12-04T15:53:37.792111", "status": "completed"}, "tags": []}, "source": ["#### Indexing\n", "\n", "We often have the situation where we need to select a part of a tensor.\n", "Indexing works just like in numpy, so let's try it:"]}, {"cell_type": "code", "execution_count": 19, "id": "9eabb311", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:53:38.371801Z", "iopub.status.busy": "2021-12-04T15:53:38.371341Z", "iopub.status.idle": "2021-12-04T15:53:38.373967Z", "shell.execute_reply": "2021-12-04T15:53:38.374339Z"}, "papermill": {"duration": 0.198334, "end_time": "2021-12-04T15:53:38.374469", "exception": false, "start_time": "2021-12-04T15:53:38.176135", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["X tensor([[ 0, 1, 2, 3],\n", " [ 4, 5, 6, 7],\n", " [ 8, 9, 10, 11]])\n"]}], "source": ["x = torch.arange(12).view(3, 4)\n", "print(\"X\", x)"]}, {"cell_type": "code", "execution_count": 20, "id": "9e961958", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:53:38.762589Z", "iopub.status.busy": "2021-12-04T15:53:38.762126Z", "iopub.status.idle": "2021-12-04T15:53:38.764774Z", "shell.execute_reply": "2021-12-04T15:53:38.764396Z"}, "papermill": {"duration": 0.199401, "end_time": "2021-12-04T15:53:38.764881", "exception": false, "start_time": "2021-12-04T15:53:38.565480", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["tensor([1, 5, 9])\n"]}], "source": ["print(x[:, 1]) # Second column"]}, {"cell_type": "code", "execution_count": 21, "id": "8df1b8d5", "metadata": 
{"execution": {"iopub.execute_input": "2021-12-04T15:53:39.158549Z", "iopub.status.busy": "2021-12-04T15:53:39.158081Z", "iopub.status.idle": "2021-12-04T15:53:39.160695Z", "shell.execute_reply": "2021-12-04T15:53:39.160291Z"}, "papermill": {"duration": 0.199565, "end_time": "2021-12-04T15:53:39.160802", "exception": false, "start_time": "2021-12-04T15:53:38.961237", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["tensor([0, 1, 2, 3])\n"]}], "source": ["print(x[0]) # First row"]}, {"cell_type": "code", "execution_count": 22, "id": "91fda3e0", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:53:39.553851Z", "iopub.status.busy": "2021-12-04T15:53:39.553387Z", "iopub.status.idle": "2021-12-04T15:53:39.555977Z", "shell.execute_reply": "2021-12-04T15:53:39.555511Z"}, "papermill": {"duration": 0.201859, "end_time": "2021-12-04T15:53:39.556086", "exception": false, "start_time": "2021-12-04T15:53:39.354227", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["tensor([3, 7])\n"]}], "source": ["print(x[:2, -1]) # First two rows, last column"]}, {"cell_type": "code", "execution_count": 23, "id": "a9cf47ae", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:53:39.949800Z", "iopub.status.busy": "2021-12-04T15:53:39.949338Z", "iopub.status.idle": "2021-12-04T15:53:39.951698Z", "shell.execute_reply": "2021-12-04T15:53:39.952071Z"}, "papermill": {"duration": 0.201325, "end_time": "2021-12-04T15:53:39.952202", "exception": false, "start_time": "2021-12-04T15:53:39.750877", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["tensor([[ 4, 5, 6, 7],\n", " [ 8, 9, 10, 11]])\n"]}], "source": ["print(x[1:3, :]) # Middle two rows"]}, {"cell_type": "markdown", "id": "9fea92c8", "metadata": {"papermill": {"duration": 0.198501, "end_time": "2021-12-04T15:53:40.352499", "exception": false, "start_time": 
"2021-12-04T15:53:40.153998", "status": "completed"}, "tags": []}, "source": ["### Dynamic Computation Graph and Backpropagation\n", "\n", "One of the main reasons for using PyTorch in Deep Learning projects is that we can automatically get **gradients/derivatives** of functions that we define.\n", "We will mainly use PyTorch for implementing neural networks, and they are just fancy functions.\n", "If we use weight matrices in our function that we want to learn, then those are called the **parameters** or simply the **weights**.\n", "\n", "If our neural network would output a single scalar value, we would talk about taking the **derivative**, but you will see that quite often we will have **multiple** output variables (\"values\"); in that case we talk about **gradients**.\n", "It's a more general term.\n", "\n", "Given an input $\\mathbf{x}$, we define our function by **manipulating** that input, usually by matrix-multiplications with weight matrices and additions with so-called bias vectors.\n", "As we manipulate our input, we are automatically creating a **computational graph**.\n", "This graph shows how to arrive at our output from our input.\n", "PyTorch is a **define-by-run** framework; this means that we can just do our manipulations, and PyTorch will keep track of that graph for us.\n", "Thus, we create a dynamic computation graph along the way.\n", "\n", "So, to recap: the only thing we have to do is to compute the **output**, and then we can ask PyTorch to automatically get the **gradients**.\n", "\n", "> **Note: Why do we want gradients?\n", "** Consider that we have defined a function, a neural net, that is supposed to compute a certain output $y$ for an input vector $\\mathbf{x}$.\n", "We then define an **error measure** that tells us how wrong our network is; how bad it is in predicting output $y$ from input $\\mathbf{x}$.\n", "Based on this error measure, we can use the gradients to **update** the weights $\\mathbf{W}$ that were responsible for the 
output, so that the next time we present input $\\mathbf{x}$ to our network, the output will be closer to what we want.\n", "\n", "The first thing we have to do is to specify which tensors require gradients.\n", "By default, when we create a tensor, it does not require gradients."]}, {"cell_type": "code", "execution_count": 24, "id": "c2cc2ed7", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:53:40.750883Z", "iopub.status.busy": "2021-12-04T15:53:40.750396Z", "iopub.status.idle": "2021-12-04T15:53:40.752681Z", "shell.execute_reply": "2021-12-04T15:53:40.752209Z"}, "papermill": {"duration": 0.203425, "end_time": "2021-12-04T15:53:40.752790", "exception": false, "start_time": "2021-12-04T15:53:40.549365", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["False\n"]}], "source": ["x = torch.ones((3,))\n", "print(x.requires_grad)"]}, {"cell_type": "markdown", "id": "95fb29d4", "metadata": {"papermill": {"duration": 0.202898, "end_time": "2021-12-04T15:53:41.153550", "exception": false, "start_time": "2021-12-04T15:53:40.950652", "status": "completed"}, "tags": []}, "source": ["We can change this for an existing tensor using the function `requires_grad_()` (underscore indicating that this is an in-place operation).\n", "Alternatively, when creating a tensor, you can pass the argument\n", "`requires_grad=True` to most initializers we have seen above."]}, {"cell_type": "code", "execution_count": 25, "id": "7c78f25f", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:53:41.555039Z", "iopub.status.busy": "2021-12-04T15:53:41.554541Z", "iopub.status.idle": "2021-12-04T15:53:41.556872Z", "shell.execute_reply": "2021-12-04T15:53:41.556397Z"}, "papermill": {"duration": 0.20518, "end_time": "2021-12-04T15:53:41.556986", "exception": false, "start_time": "2021-12-04T15:53:41.351806", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["True\n"]}], 
"source": ["x.requires_grad_(True)\n", "print(x.requires_grad)"]}, {"cell_type": "markdown", "id": "20803bcc", "metadata": {"papermill": {"duration": 0.196387, "end_time": "2021-12-04T15:53:41.950177", "exception": false, "start_time": "2021-12-04T15:53:41.753790", "status": "completed"}, "tags": []}, "source": ["In order to get familiar with the concept of a computation graph, we will create one for the following function:\n", "\n", "$$y = \\frac{1}{|x|}\\sum_i \\left[(x_i + 2)^2 + 3\\right]$$\n", "\n", "You could imagine that $x$ are our parameters, and we want to optimize (either maximize or minimize) the output $y$.\n", "For this, we want to obtain the gradients $\\partial y / \\partial \\mathbf{x}$.\n", "For our example, we'll use $\\mathbf{x}=[0,1,2]$ as our input."]}, {"cell_type": "code", "execution_count": 26, "id": "1736b0d5", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:53:42.353546Z", "iopub.status.busy": "2021-12-04T15:53:42.353077Z", "iopub.status.idle": "2021-12-04T15:53:42.355812Z", "shell.execute_reply": "2021-12-04T15:53:42.356193Z"}, "papermill": {"duration": 0.206211, "end_time": "2021-12-04T15:53:42.356325", "exception": false, "start_time": "2021-12-04T15:53:42.150114", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["X tensor([0., 1., 2.], requires_grad=True)\n"]}], "source": ["x = torch.arange(3, dtype=torch.float32, requires_grad=True) # Only float tensors can have gradients\n", "print(\"X\", x)"]}, {"cell_type": "markdown", "id": "cf511f52", "metadata": {"papermill": {"duration": 0.200601, "end_time": "2021-12-04T15:53:42.755512", "exception": false, "start_time": "2021-12-04T15:53:42.554911", "status": "completed"}, "tags": []}, "source": ["Now let's build the computation graph step by step.\n", "You can combine multiple operations in a single line, but we will\n", "separate them here to get a better understanding of how each operation\n", "is added to the 
computation graph."]}, {"cell_type": "code", "execution_count": 27, "id": "fbcee41c", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:53:43.160150Z", "iopub.status.busy": "2021-12-04T15:53:43.159591Z", "iopub.status.idle": "2021-12-04T15:53:43.163509Z", "shell.execute_reply": "2021-12-04T15:53:43.163027Z"}, "papermill": {"duration": 0.209982, "end_time": "2021-12-04T15:53:43.163620", "exception": false, "start_time": "2021-12-04T15:53:42.953638", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Y tensor(12.6667, grad_fn=)\n"]}], "source": ["a = x + 2\n", "b = a ** 2\n", "c = b + 3\n", "y = c.mean()\n", "print(\"Y\", y)"]}, {"cell_type": "markdown", "id": "c012a822", "metadata": {"papermill": {"duration": 0.201708, "end_time": "2021-12-04T15:53:43.567654", "exception": false, "start_time": "2021-12-04T15:53:43.365946", "status": "completed"}, "tags": []}, "source": ["Using the statements above, we have created a computation graph that looks similar to the figure below:\n", "\n", "
\n", "\n", "We calculate $a$ based on the inputs $x$ and the constant $2$, $b$ is $a$ squared, and so on.\n", "The visualization is an abstraction of the dependencies between inputs and outputs of the operations we have applied.\n", "Each node of the computation graph has automatically defined a function for calculating the gradients with respect to its inputs, `grad_fn`.\n", "You can see this when we printed the output tensor $y$.\n", "This is why the computation graph is usually visualized in the reverse direction (arrows point from the result to the inputs).\n", "We can perform backpropagation on the computation graph by calling the\n", "function `backward()` on the last output, which effectively calculates\n", "the gradients for each tensor that has the property\n", "`requires_grad=True`:"]}, {"cell_type": "code", "execution_count": 28, "id": "3afeb787", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:53:43.969958Z", "iopub.status.busy": "2021-12-04T15:53:43.969494Z", "iopub.status.idle": "2021-12-04T15:53:44.203064Z", "shell.execute_reply": "2021-12-04T15:53:44.203439Z"}, "papermill": {"duration": 0.436371, "end_time": "2021-12-04T15:53:44.203621", "exception": false, "start_time": "2021-12-04T15:53:43.767250", "status": "completed"}, "tags": []}, "outputs": [], "source": ["y.backward()"]}, {"cell_type": "markdown", "id": "6b048147", "metadata": {"papermill": {"duration": 0.198366, "end_time": "2021-12-04T15:53:44.603913", "exception": false, "start_time": "2021-12-04T15:53:44.405547", "status": "completed"}, "tags": []}, "source": ["`x.grad` will now contain the gradient $\\partial y/ \\partial \\mathcal{x}$, and this gradient indicates how a change in $\\mathbf{x}$ will affect output $y$ given the current input $\\mathbf{x}=[0,1,2]$:"]}, {"cell_type": "code", "execution_count": 29, "id": "2a36cc4c", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:53:45.011258Z", "iopub.status.busy": "2021-12-04T15:53:45.010791Z", 
"iopub.status.idle": "2021-12-04T15:53:45.013643Z", "shell.execute_reply": "2021-12-04T15:53:45.013258Z"}, "papermill": {"duration": 0.210613, "end_time": "2021-12-04T15:53:45.013754", "exception": false, "start_time": "2021-12-04T15:53:44.803141", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["tensor([1.3333, 2.0000, 2.6667])\n"]}], "source": ["print(x.grad)"]}, {"cell_type": "markdown", "id": "01673131", "metadata": {"papermill": {"duration": 0.200204, "end_time": "2021-12-04T15:53:45.415831", "exception": false, "start_time": "2021-12-04T15:53:45.215627", "status": "completed"}, "tags": []}, "source": ["We can also verify these gradients by hand.\n", "We will calculate the gradients using the chain rule, in the same way as PyTorch did it:\n", "\n", "$$\\frac{\\partial y}{\\partial x_i} = \\frac{\\partial y}{\\partial c_i}\\frac{\\partial c_i}{\\partial b_i}\\frac{\\partial b_i}{\\partial a_i}\\frac{\\partial a_i}{\\partial x_i}$$\n", "\n", "Note that we have simplified this equation to index notation, and by using the fact that all operation besides the mean do not combine the elements in the tensor.\n", "The partial derivatives are:\n", "\n", "$$\n", "\\frac{\\partial a_i}{\\partial x_i} = 1,\\hspace{1cm}\n", "\\frac{\\partial b_i}{\\partial a_i} = 2\\cdot a_i\\hspace{1cm}\n", "\\frac{\\partial c_i}{\\partial b_i} = 1\\hspace{1cm}\n", "\\frac{\\partial y}{\\partial c_i} = \\frac{1}{3}\n", "$$\n", "\n", "Hence, with the input being $\\mathbf{x}=[0,1,2]$, our gradients are $\\partial y/\\partial \\mathbf{x}=[4/3,2,8/3]$.\n", "The previous code cell should have printed the same result."]}, {"cell_type": "markdown", "id": "7d826bdb", "metadata": {"papermill": {"duration": 0.198481, "end_time": "2021-12-04T15:53:45.813968", "exception": false, "start_time": "2021-12-04T15:53:45.615487", "status": "completed"}, "tags": []}, "source": ["### GPU support\n", "\n", "A crucial feature of PyTorch is the support of 
GPUs, short for Graphics Processing Units.\n", "A GPU can perform many thousands of small operations in parallel, making it well suited for performing large matrix operations in neural networks.\n", "When comparing GPUs to CPUs, we can list the following main differences (credit: [Kevin Krewell, 2009](https://blogs.nvidia.com/blog/2009/12/16/whats-the-difference-between-a-cpu-and-a-gpu/))\n", "\n", "
\n", "\n", "CPUs and GPUs have both different advantages and disadvantages, which is why many computers contain both components and use them for different tasks.\n", "In case you are not familiar with GPUs, you can read up more details in this [NVIDIA blog post](https://blogs.nvidia.com/blog/2009/12/16/whats-the-difference-between-a-cpu-and-a-gpu/) or [here](https://www.intel.com/content/www/us/en/products/docs/processors/what-is-a-gpu.html).\n", "\n", "GPUs can accelerate the training of your network up to a factor of $100$ which is essential for large neural networks.\n", "PyTorch implements a lot of functionality for supporting GPUs (mostly those of NVIDIA due to the libraries [CUDA](https://developer.nvidia.com/cuda-zone) and [cuDNN](https://developer.nvidia.com/cudnn)).\n", "First, let's check whether you have a GPU available:"]}, {"cell_type": "code", "execution_count": 30, "id": "8fe50089", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:53:46.222636Z", "iopub.status.busy": "2021-12-04T15:53:46.222150Z", "iopub.status.idle": "2021-12-04T15:53:46.224494Z", "shell.execute_reply": "2021-12-04T15:53:46.224024Z"}, "papermill": {"duration": 0.209045, "end_time": "2021-12-04T15:53:46.224603", "exception": false, "start_time": "2021-12-04T15:53:46.015558", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Is the GPU available? True\n"]}], "source": ["gpu_avail = torch.cuda.is_available()\n", "print(f\"Is the GPU available? 
{gpu_avail}\")"]}, {"cell_type": "markdown", "id": "cc6dd1a9", "metadata": {"papermill": {"duration": 0.201657, "end_time": "2021-12-04T15:53:46.632585", "exception": false, "start_time": "2021-12-04T15:53:46.430928", "status": "completed"}, "tags": []}, "source": ["If you have a GPU on your computer but the command above returns False, make sure you have the correct CUDA-version installed.\n", "The `dl2020` environment comes with the CUDA-toolkit 10.1, which is selected for the Lisa supercomputer.\n", "Please change it if necessary (CUDA 10.2 is currently common).\n", "On Google Colab, make sure that you have selected a GPU in your runtime setup (in the menu, check under `Runtime -> Change runtime type`).\n", "\n", "By default, all tensors you create are stored on the CPU.\n", "We can push a tensor to the GPU by using the function `.to(...)`, or `.cuda()`.\n", "However, it is often a good practice to define a `device` object in your code which points to the GPU if you have one, and otherwise to the CPU.\n", "Then, you can write your code with respect to this device object, and it allows you to run the same code on both a CPU-only system, and one with a GPU.\n", "Let's try it below.\n", "We can specify the device as follows:"]}, {"cell_type": "code", "execution_count": 31, "id": "5a3d8e38", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:53:47.042732Z", "iopub.status.busy": "2021-12-04T15:53:47.042239Z", "iopub.status.idle": "2021-12-04T15:53:47.044024Z", "shell.execute_reply": "2021-12-04T15:53:47.044398Z"}, "papermill": {"duration": 0.208184, "end_time": "2021-12-04T15:53:47.044529", "exception": false, "start_time": "2021-12-04T15:53:46.836345", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Device cuda\n"]}], "source": ["device = torch.device(\"cuda\") if torch.cuda.is_available() else torch.device(\"cpu\")\n", "print(\"Device\", device)"]}, {"cell_type": "markdown", "id": "83f280ae", 
"metadata": {"papermill": {"duration": 0.203434, "end_time": "2021-12-04T15:53:47.452136", "exception": false, "start_time": "2021-12-04T15:53:47.248702", "status": "completed"}, "tags": []}, "source": ["Now let's create a tensor and push it to the device:"]}, {"cell_type": "code", "execution_count": 32, "id": "31cbb86a", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:53:47.862514Z", "iopub.status.busy": "2021-12-04T15:53:47.862045Z", "iopub.status.idle": "2021-12-04T15:53:51.511287Z", "shell.execute_reply": "2021-12-04T15:53:51.510793Z"}, "papermill": {"duration": 3.856813, "end_time": "2021-12-04T15:53:51.511416", "exception": false, "start_time": "2021-12-04T15:53:47.654603", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["X tensor([[0., 0., 0.],\n", " [0., 0., 0.]], device='cuda:0')\n"]}], "source": ["x = torch.zeros(2, 3)\n", "x = x.to(device)\n", "print(\"X\", x)"]}, {"cell_type": "markdown", "id": "de20fb36", "metadata": {"papermill": {"duration": 0.205639, "end_time": "2021-12-04T15:53:51.921267", "exception": false, "start_time": "2021-12-04T15:53:51.715628", "status": "completed"}, "tags": []}, "source": ["In case you have a GPU, you should now see the attribute `device='cuda:0'` being printed next to your tensor.\n", "The zero next to cuda indicates that this is the zero-th GPU device on your computer.\n", "PyTorch also supports multi-GPU systems, but this you will only need once you have very big networks to train (if interested, see the [PyTorch documentation](https://pytorch.org/docs/stable/distributed.html#distributed-basics)).\n", "We can also compare the runtime of a large matrix multiplication on the CPU with a operation on the GPU:"]}, {"cell_type": "code", "execution_count": 33, "id": "bbf73c6d", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:53:52.333482Z", "iopub.status.busy": "2021-12-04T15:53:52.333010Z", "iopub.status.idle": 
"2021-12-04T15:53:52.904067Z", "shell.execute_reply": "2021-12-04T15:53:52.904461Z"}, "papermill": {"duration": 0.778998, "end_time": "2021-12-04T15:53:52.904626", "exception": false, "start_time": "2021-12-04T15:53:52.125628", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["CPU time: 0.27197s\n", "GPU time: 0.02201s\n"]}], "source": ["x = torch.randn(5000, 5000)\n", "\n", "# CPU version\n", "start_time = time.time()\n", "_ = torch.matmul(x, x)\n", "end_time = time.time()\n", "print(f\"CPU time: {(end_time - start_time):6.5f}s\")\n", "\n", "# GPU version\n", "if torch.cuda.is_available():\n", " x = x.to(device)\n", " # CUDA is asynchronous, so we need to use different timing functions\n", " start = torch.cuda.Event(enable_timing=True)\n", " end = torch.cuda.Event(enable_timing=True)\n", " start.record()\n", " _ = torch.matmul(x, x)\n", " end.record()\n", " torch.cuda.synchronize() # Waits for everything to finish running on the GPU\n", " print(f\"GPU time: {0.001 * start.elapsed_time(end):6.5f}s\") # Milliseconds to seconds"]}, {"cell_type": "markdown", "id": "b6483a54", "metadata": {"papermill": {"duration": 0.208145, "end_time": "2021-12-04T15:53:53.320523", "exception": false, "start_time": "2021-12-04T15:53:53.112378", "status": "completed"}, "tags": []}, "source": ["Depending on the size of the operation and the CPU/GPU in your system, the speedup of this operation can be >50x.\n", "As `matmul` operations are very common in neural networks, we can already see the great benefit of training a NN on a GPU.\n", "The time estimate can be relatively noisy here because we haven't run it for multiple times.\n", "Feel free to extend this, but it also takes longer to run.\n", "\n", "When generating random numbers, the seed between CPU and GPU is not synchronized.\n", "Hence, we need to set the seed on the GPU separately to ensure a reproducible code.\n", "Note that due to different GPU architectures, running the 
same code on different GPUs does not guarantee the same random numbers.\n", "Still, we don't want our code to give us a different output every time we run it on the exact same hardware.\n", "Hence, we also set the seed on the GPU:"]}, {"cell_type": "code", "execution_count": 34, "id": "119c0085", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:53:53.736717Z", "iopub.status.busy": "2021-12-04T15:53:53.736247Z", "iopub.status.idle": "2021-12-04T15:53:53.737755Z", "shell.execute_reply": "2021-12-04T15:53:53.738129Z"}, "papermill": {"duration": 0.215091, "end_time": "2021-12-04T15:53:53.738260", "exception": false, "start_time": "2021-12-04T15:53:53.523169", "status": "completed"}, "tags": []}, "outputs": [], "source": ["# GPU operations have a separate seed we also want to set\n", "if torch.cuda.is_available():\n", " torch.cuda.manual_seed(42)\n", " torch.cuda.manual_seed_all(42)\n", "\n", "# Additionally, some operations on a GPU are implemented stochastic for efficiency\n", "# We want to ensure that all operations are deterministic on GPU (if used) for reproducibility\n", "torch.backends.cudnn.deterministic = True\n", "torch.backends.cudnn.benchmark = False"]}, {"cell_type": "markdown", "id": "d3e51727", "metadata": {"papermill": {"duration": 0.201794, "end_time": "2021-12-04T15:53:54.143745", "exception": false, "start_time": "2021-12-04T15:53:53.941951", "status": "completed"}, "tags": []}, "source": ["## Learning by example: Continuous XOR\n", "
\n", "\n", "If we want to build a neural network in PyTorch, we could specify all our parameters (weight matrices, bias vectors) using `Tensors` (with `requires_grad=True`), ask PyTorch to calculate the gradients and then adjust the parameters.\n", "But things can quickly get cumbersome if we have a lot of parameters.\n", "In PyTorch, there is a package called `torch.nn` that makes building neural networks more convenient.\n", "\n", "We will introduce the libraries and all additional parts you might need to train a neural network in PyTorch, using a simple example classifier on a simple yet well known example: XOR.\n", "Given two binary inputs $x_1$ and $x_2$, the label to predict is $1$ if either $x_1$ or $x_2$ is $1$ while the other is $0$, or the label is $0$ in all other cases.\n", "The example became famous by the fact that a single neuron, i.e. a linear classifier, cannot learn this simple function.\n", "Hence, we will learn how to build a small neural network that can learn this function.\n", "To make it a little bit more interesting, we move the XOR into continuous space and introduce some gaussian noise on the binary inputs.\n", "Our desired separation of an XOR dataset could look as follows:\n", "\n", "
"]}, {"cell_type": "markdown", "id": "be79359e", "metadata": {"papermill": {"duration": 0.205221, "end_time": "2021-12-04T15:53:54.552887", "exception": false, "start_time": "2021-12-04T15:53:54.347666", "status": "completed"}, "tags": []}, "source": ["### The model\n", "\n", "The package `torch.nn` defines a series of useful classes like linear networks layers, activation functions, loss functions etc.\n", "A full list can be found [here](https://pytorch.org/docs/stable/nn.html).\n", "In case you need a certain network layer, check the documentation of the package first before writing the layer yourself as the package likely contains the code for it already.\n", "We import it below:"]}, {"cell_type": "code", "execution_count": null, "id": "43daa017", "metadata": {"lines_to_next_cell": 0, "papermill": {"duration": 0.203631, "end_time": "2021-12-04T15:53:54.958970", "exception": false, "start_time": "2021-12-04T15:53:54.755339", "status": "completed"}, "tags": []}, "outputs": [], "source": []}, {"cell_type": "code", "execution_count": null, "id": "961da892", "metadata": {"papermill": {"duration": 0.204014, "end_time": "2021-12-04T15:53:55.368098", "exception": false, "start_time": "2021-12-04T15:53:55.164084", "status": "completed"}, "tags": []}, "outputs": [], "source": []}, {"cell_type": "markdown", "id": "5b961e6a", "metadata": {"papermill": {"duration": 0.203803, "end_time": "2021-12-04T15:53:55.774983", "exception": false, "start_time": "2021-12-04T15:53:55.571180", "status": "completed"}, "tags": []}, "source": ["Additionally to `torch.nn`, there is also `torch.nn.functional`.\n", "It contains functions that are used in network layers.\n", "This is in contrast to `torch.nn` which defines them as `nn.Modules` (more on it below), and `torch.nn` actually uses a lot of functionalities from `torch.nn.functional`.\n", "Hence, the functional package is useful in many situations, and so we import it as well here."]}, {"cell_type": "markdown", "id": "e60690c4", 
"metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.205786, "end_time": "2021-12-04T15:53:56.185307", "exception": false, "start_time": "2021-12-04T15:53:55.979521", "status": "completed"}, "tags": []}, "source": ["#### nn.Module\n", "\n", "In PyTorch, a neural network is built up out of modules.\n", "Modules can contain other modules, and a neural network is considered to be a module itself as well.\n", "The basic template of a module is as follows:"]}, {"cell_type": "code", "execution_count": 35, "id": "71eaf6ae", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:53:56.605744Z", "iopub.status.busy": "2021-12-04T15:53:56.605272Z", "iopub.status.idle": "2021-12-04T15:53:56.606804Z", "shell.execute_reply": "2021-12-04T15:53:56.607182Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 0.216416, "end_time": "2021-12-04T15:53:56.607313", "exception": false, "start_time": "2021-12-04T15:53:56.390897", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class MyModule(nn.Module):\n", " def __init__(self):\n", " super().__init__()\n", " # Some init for my module\n", "\n", " def forward(self, x):\n", " # Function for performing the calculation of the module.\n", " pass"]}, {"cell_type": "markdown", "id": "63463f01", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.229323, "end_time": "2021-12-04T15:53:57.045874", "exception": false, "start_time": "2021-12-04T15:53:56.816551", "status": "completed"}, "tags": []}, "source": ["The forward function is where the computation of the module is taken place, and is executed when you call the module (`nn = MyModule(); nn(x)`).\n", "In the init function, we usually create the parameters of the module, using `nn.Parameter`, or defining other modules that are used in the forward function.\n", "The backward calculation is done automatically, but could be overwritten as well if wanted.\n", "\n", "#### Simple classifier\n", "We can now make use of the pre-defined modules in the 
`torch.nn` package, and define our own small neural network.\n", "We will use a minimal network with an input layer, one hidden layer with tanh as activation function, and an output layer.\n", "In other words, our network should look something like this:\n", "\n", "
\n", "\n", "The input neurons are shown in blue, which represent the coordinates $x_1$ and $x_2$ of a data point.\n", "The hidden neurons including a tanh activation are shown in white, and the output neuron in red.\n", "In PyTorch, we can define this as follows:"]}, {"cell_type": "code", "execution_count": 36, "id": "6c0cc064", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:53:57.460540Z", "iopub.status.busy": "2021-12-04T15:53:57.460070Z", "iopub.status.idle": "2021-12-04T15:53:57.461979Z", "shell.execute_reply": "2021-12-04T15:53:57.461520Z"}, "papermill": {"duration": 0.213388, "end_time": "2021-12-04T15:53:57.462086", "exception": false, "start_time": "2021-12-04T15:53:57.248698", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class SimpleClassifier(nn.Module):\n", " def __init__(self, num_inputs, num_hidden, num_outputs):\n", " super().__init__()\n", " # Initialize the modules we need to build the network\n", " self.linear1 = nn.Linear(num_inputs, num_hidden)\n", " self.act_fn = nn.Tanh()\n", " self.linear2 = nn.Linear(num_hidden, num_outputs)\n", "\n", " def forward(self, x):\n", " # Perform the calculation of the model to determine the prediction\n", " x = self.linear1(x)\n", " x = self.act_fn(x)\n", " x = self.linear2(x)\n", " return x"]}, {"cell_type": "markdown", "id": "84553ec2", "metadata": {"papermill": {"duration": 0.204402, "end_time": "2021-12-04T15:53:57.868446", "exception": false, "start_time": "2021-12-04T15:53:57.664044", "status": "completed"}, "tags": []}, "source": ["For the examples in this notebook, we will use a tiny neural network with two input neurons and four hidden neurons.\n", "As we perform binary classification, we will use a single output neuron.\n", "Note that we do not apply a sigmoid on the output yet.\n", "This is because other functions, especially the loss, are more efficient and precise to calculate on the original outputs instead of the sigmoid output.\n", "We will discuss the detailed 
reason later."]}, {"cell_type": "code", "execution_count": 37, "id": "4f9b83e1", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:53:58.283224Z", "iopub.status.busy": "2021-12-04T15:53:58.282754Z", "iopub.status.idle": "2021-12-04T15:53:58.285141Z", "shell.execute_reply": "2021-12-04T15:53:58.285538Z"}, "papermill": {"duration": 0.213062, "end_time": "2021-12-04T15:53:58.285669", "exception": false, "start_time": "2021-12-04T15:53:58.072607", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["SimpleClassifier(\n", " (linear1): Linear(in_features=2, out_features=4, bias=True)\n", " (act_fn): Tanh()\n", " (linear2): Linear(in_features=4, out_features=1, bias=True)\n", ")\n"]}], "source": ["model = SimpleClassifier(num_inputs=2, num_hidden=4, num_outputs=1)\n", "# Printing a module shows all its submodules\n", "print(model)"]}, {"cell_type": "markdown", "id": "360961ed", "metadata": {"papermill": {"duration": 0.202451, "end_time": "2021-12-04T15:53:58.691398", "exception": false, "start_time": "2021-12-04T15:53:58.488947", "status": "completed"}, "tags": []}, "source": ["Printing the model lists all submodules it contains.\n", "The parameters of a module can be obtained by using its `parameters()` functions, or `named_parameters()` to get a name to each parameter object.\n", "For our small neural network, we have the following parameters:"]}, {"cell_type": "code", "execution_count": 38, "id": "780fcc13", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:53:59.102900Z", "iopub.status.busy": "2021-12-04T15:53:59.102421Z", "iopub.status.idle": "2021-12-04T15:53:59.104603Z", "shell.execute_reply": "2021-12-04T15:53:59.104977Z"}, "papermill": {"duration": 0.211481, "end_time": "2021-12-04T15:53:59.105106", "exception": false, "start_time": "2021-12-04T15:53:58.893625", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Parameter 
linear1.weight, shape torch.Size([4, 2])\n", "Parameter linear1.bias, shape torch.Size([4])\n", "Parameter linear2.weight, shape torch.Size([1, 4])\n", "Parameter linear2.bias, shape torch.Size([1])\n"]}], "source": ["for name, param in model.named_parameters():\n", " print(f\"Parameter {name}, shape {param.shape}\")"]}, {"cell_type": "markdown", "id": "bc034c95", "metadata": {"papermill": {"duration": 0.203191, "end_time": "2021-12-04T15:53:59.512934", "exception": false, "start_time": "2021-12-04T15:53:59.309743", "status": "completed"}, "tags": []}, "source": ["Each linear layer has a weight matrix of the shape `[output, input]`, and a bias of the shape `[output]`.\n", "The tanh activation function does not have any parameters.\n", "Note that parameters are only registered for `nn.Module` objects that are direct object attributes, i.e. `self.a = ...`.\n", "If you define a list of modules, the parameters of those are not registered for the outer module and can cause some issues when you try to optimize your module.\n", "There are alternatives, like `nn.ModuleList`, `nn.ModuleDict` and `nn.Sequential`, that allow you to have different data structures of modules.\n", "We will use them in a few later tutorials and explain them there."]}, {"cell_type": "markdown", "id": "136035b4", "metadata": {"papermill": {"duration": 0.204985, "end_time": "2021-12-04T15:53:59.921347", "exception": false, "start_time": "2021-12-04T15:53:59.716362", "status": "completed"}, "tags": []}, "source": ["### The data\n", "\n", "PyTorch also provides a few functionalities to load the training and\n", "test data efficiently, summarized in the package `torch.utils.data`."]}, {"cell_type": "code", "execution_count": null, "id": "1cf8b77a", "metadata": {"papermill": {"duration": 0.204911, "end_time": "2021-12-04T15:54:00.331565", "exception": false, "start_time": "2021-12-04T15:54:00.126654", "status": "completed"}, "tags": []}, "outputs": [], "source": []}, {"cell_type": "markdown", "id": 
"056c9971", "metadata": {"papermill": {"duration": 0.203757, "end_time": "2021-12-04T15:54:00.743646", "exception": false, "start_time": "2021-12-04T15:54:00.539889", "status": "completed"}, "tags": []}, "source": ["The data package defines two classes which are the standard interface for handling data in PyTorch: `data.Dataset`, and `data.DataLoader`.\n", "The dataset class provides an uniform interface to access the\n", "training/test data, while the data loader makes sure to efficiently load\n", "and stack the data points from the dataset into batches during training."]}, {"cell_type": "markdown", "id": "92ffaea5", "metadata": {"papermill": {"duration": 0.20609, "end_time": "2021-12-04T15:54:01.153489", "exception": false, "start_time": "2021-12-04T15:54:00.947399", "status": "completed"}, "tags": []}, "source": ["#### The dataset class\n", "\n", "The dataset class summarizes the basic functionality of a dataset in a natural way.\n", "To define a dataset in PyTorch, we simply specify two functions: `__getitem__`, and `__len__`.\n", "The get-item function has to return the $i$-th data point in the dataset, while the len function returns the size of the dataset.\n", "For the XOR dataset, we can define the dataset class as follows:"]}, {"cell_type": "code", "execution_count": 39, "id": "9eadd4ba", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:54:01.569750Z", "iopub.status.busy": "2021-12-04T15:54:01.569274Z", "iopub.status.idle": "2021-12-04T15:54:01.571170Z", "shell.execute_reply": "2021-12-04T15:54:01.570790Z"}, "papermill": {"duration": 0.213645, "end_time": "2021-12-04T15:54:01.571284", "exception": false, "start_time": "2021-12-04T15:54:01.357639", "status": "completed"}, "tags": []}, "outputs": [], "source": ["\n", "\n", "class XORDataset(data.Dataset):\n", " def __init__(self, size, std=0.1):\n", " \"\"\"\n", " Inputs:\n", " size - Number of data points we want to generate\n", " std - Standard deviation of the noise (see 
generate_continuous_xor function)\n", " \"\"\"\n", " super().__init__()\n", " self.size = size\n", " self.std = std\n", " self.generate_continuous_xor()\n", "\n", " def generate_continuous_xor(self):\n", " # Each data point in the XOR dataset has two variables, x and y, that can be either 0 or 1\n", " # The label is their XOR combination, i.e. 1 if only x or only y is 1 while the other is 0.\n", " # If x=y, the label is 0.\n", " data = torch.randint(low=0, high=2, size=(self.size, 2), dtype=torch.float32)\n", " label = (data.sum(dim=1) == 1).to(torch.long)\n", " # To make it slightly more challenging, we add a bit of gaussian noise to the data points.\n", " data += self.std * torch.randn(data.shape)\n", "\n", " self.data = data\n", " self.label = label\n", "\n", " def __len__(self):\n", " # Number of data point we have. Alternatively self.data.shape[0], or self.label.shape[0]\n", " return self.size\n", "\n", " def __getitem__(self, idx):\n", " # Return the idx-th data point of the dataset\n", " # If we have multiple things to return (data point and label), we can return them as tuple\n", " data_point = self.data[idx]\n", " data_label = self.label[idx]\n", " return data_point, data_label"]}, {"cell_type": "markdown", "id": "170ab9ba", "metadata": {"papermill": {"duration": 0.207351, "end_time": "2021-12-04T15:54:01.984743", "exception": false, "start_time": "2021-12-04T15:54:01.777392", "status": "completed"}, "tags": []}, "source": ["Let's try to create such a dataset and inspect it:"]}, {"cell_type": "code", "execution_count": 40, "id": "be2c0ec7", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:54:02.398061Z", "iopub.status.busy": "2021-12-04T15:54:02.397602Z", "iopub.status.idle": "2021-12-04T15:54:02.401563Z", "shell.execute_reply": "2021-12-04T15:54:02.401095Z"}, "papermill": {"duration": 0.211018, "end_time": "2021-12-04T15:54:02.401672", "exception": false, "start_time": "2021-12-04T15:54:02.190654", "status": "completed"}, "tags": []}, 
"outputs": [{"name": "stdout", "output_type": "stream", "text": ["Size of dataset: 200\n", "Data point 0: (tensor([0.9632, 0.1117]), tensor(1))\n"]}], "source": ["dataset = XORDataset(size=200)\n", "print(\"Size of dataset:\", len(dataset))\n", "print(\"Data point 0:\", dataset[0])"]}, {"cell_type": "markdown", "id": "86828a5c", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.206005, "end_time": "2021-12-04T15:54:02.812653", "exception": false, "start_time": "2021-12-04T15:54:02.606648", "status": "completed"}, "tags": []}, "source": ["To better relate to the dataset, we visualize the samples below."]}, {"cell_type": "code", "execution_count": 41, "id": "84457292", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:54:03.229327Z", "iopub.status.busy": "2021-12-04T15:54:03.228861Z", "iopub.status.idle": "2021-12-04T15:54:03.230785Z", "shell.execute_reply": "2021-12-04T15:54:03.230390Z"}, "papermill": {"duration": 0.213933, "end_time": "2021-12-04T15:54:03.230894", "exception": false, "start_time": "2021-12-04T15:54:03.016961", "status": "completed"}, "tags": []}, "outputs": [], "source": ["def visualize_samples(data, label):\n", " if isinstance(data, torch.Tensor):\n", " data = data.cpu().numpy()\n", " if isinstance(label, torch.Tensor):\n", " label = label.cpu().numpy()\n", " data_0 = data[label == 0]\n", " data_1 = data[label == 1]\n", "\n", " plt.figure(figsize=(4, 4))\n", " plt.scatter(data_0[:, 0], data_0[:, 1], edgecolor=\"#333\", label=\"Class 0\")\n", " plt.scatter(data_1[:, 0], data_1[:, 1], edgecolor=\"#333\", label=\"Class 1\")\n", " plt.title(\"Dataset samples\")\n", " plt.ylabel(r\"$x_2$\")\n", " plt.xlabel(r\"$x_1$\")\n", " plt.legend()"]}, {"cell_type": "code", "execution_count": 42, "id": "7b382126", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:54:03.657738Z", "iopub.status.busy": "2021-12-04T15:54:03.645550Z", "iopub.status.idle": "2021-12-04T15:54:04.134432Z", "shell.execute_reply": 
"2021-12-04T15:54:04.134847Z"}, "papermill": {"duration": 0.697237, "end_time": "2021-12-04T15:54:04.135014", "exception": false, "start_time": "2021-12-04T15:54:03.437777", "status": "completed"}, "tags": []}, "outputs": [{"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-12-04T16:54:03.873238\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}], "source": ["visualize_samples(dataset.data, dataset.label)\n", "plt.show()"]}, {"cell_type": "markdown", "id": "c4ff362d", "metadata": {"papermill": {"duration": 0.209873, "end_time": "2021-12-04T15:54:04.554262", "exception": false, "start_time": "2021-12-04T15:54:04.344389", "status": "completed"}, "tags": []}, "source": ["#### The data loader class\n", "\n", "The class `torch.utils.data.DataLoader` represents a Python iterable over a dataset with support for automatic batching, multi-process data loading and many more features.\n", "The data loader communicates with the dataset using the function `__getitem__`, and stacks its outputs as tensors over the first dimension to form a batch.\n", "In contrast to the dataset class, we usually don't have to define our own data loader class, but can just create an object of it with the dataset as input.\n", "Additionally, we can configure our data loader with the following input arguments (only a selection, see full list [here](https://pytorch.org/docs/stable/data.html#torch.utils.data.DataLoader)):\n", "\n", "* `batch_size`: Number of samples to stack per batch\n", "* `shuffle`: If True, the data is returned in a random order.\n", "This is important during training for introducing stochasticity.\n", "* `num_workers`: Number of subprocesses to use for data loading.\n", "The default, 0, means that the data will be loaded in the main process which can slow down training for datasets where loading a data point takes a considerable amount of time (e.g. 
large images).\n", "More workers are recommended for those, but can cause issues on Windows computers.\n", "For tiny datasets as ours, 0 workers are usually faster.\n", "* `pin_memory`: If True, the data loader will copy Tensors into CUDA pinned memory before returning them.\n", "This can save some time for large data points on GPUs.\n", "Usually a good practice to use for a training set, but not necessarily for validation and test to save memory on the GPU.\n", "* `drop_last`: If True, the last batch is dropped in case it is smaller than the specified batch size.\n", "This occurs when the dataset size is not a multiple of the batch size.\n", "Only potentially helpful during training to keep a consistent batch size.\n", "\n", "Let's create a simple data loader below:"]}, {"cell_type": "code", "execution_count": 43, "id": "93c89ea5", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:54:04.976648Z", "iopub.status.busy": "2021-12-04T15:54:04.976186Z", "iopub.status.idle": "2021-12-04T15:54:04.977746Z", "shell.execute_reply": "2021-12-04T15:54:04.978119Z"}, "papermill": {"duration": 0.215753, "end_time": "2021-12-04T15:54:04.978250", "exception": false, "start_time": "2021-12-04T15:54:04.762497", "status": "completed"}, "tags": []}, "outputs": [], "source": ["data_loader = data.DataLoader(dataset, batch_size=8, shuffle=True)"]}, {"cell_type": "code", "execution_count": 44, "id": "b7a50dd3", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:54:05.404638Z", "iopub.status.busy": "2021-12-04T15:54:05.404165Z", "iopub.status.idle": "2021-12-04T15:54:05.408587Z", "shell.execute_reply": "2021-12-04T15:54:05.408963Z"}, "papermill": {"duration": 0.219528, "end_time": "2021-12-04T15:54:05.409092", "exception": false, "start_time": "2021-12-04T15:54:05.189564", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Data inputs torch.Size([8, 2]) \n", " tensor([[ 1.2108, -0.1180],\n", " [-0.1895, 
0.0415],\n", " [ 1.1542, -0.0989],\n", " [ 1.1135, 0.1228],\n", " [-0.0280, 0.0046],\n", " [-0.0378, 1.0500],\n", " [-0.0636, 0.9167],\n", " [-0.0392, 0.8611]])\n", "Data labels torch.Size([8]) \n", " tensor([1, 0, 1, 1, 0, 1, 1, 1])\n"]}], "source": ["# next(iter(...)) catches the first batch of the data loader\n", "# If shuffle is True, this will return a different batch every time we run this cell\n", "# For iterating over the whole dataset, we can simply use \"for batch in data_loader: ...\"\n", "data_inputs, data_labels = next(iter(data_loader))\n", "\n", "# The shape of the outputs is [batch_size, d_1,...,d_N] where d_1,...,d_N are the\n", "# dimensions of the data point returned from the dataset class\n", "print(\"Data inputs\", data_inputs.shape, \"\\n\", data_inputs)\n", "print(\"Data labels\", data_labels.shape, \"\\n\", data_labels)"]}, {"cell_type": "markdown", "id": "40090168", "metadata": {"papermill": {"duration": 0.213288, "end_time": "2021-12-04T15:54:05.833809", "exception": false, "start_time": "2021-12-04T15:54:05.620521", "status": "completed"}, "tags": []}, "source": ["### Optimization\n", "\n", "After defining the model and the dataset, it is time to prepare the optimization of the model.\n", "During training, we will perform the following steps:\n", "\n", "1. Get a batch from the data loader\n", "2. Obtain the predictions from the model for the batch\n", "3. Calculate the loss based on the difference between predictions and labels\n", "4. Backpropagation: calculate the gradients for every parameter with respect to the loss\n", "5. Update the parameters of the model in the direction of the gradients\n", "\n", "We have seen how we can do step 1, 2 and 4 in PyTorch. 
Now, we will look at step 3 and 5."]}, {"cell_type": "markdown", "id": "202634de", "metadata": {"papermill": {"duration": 0.216115, "end_time": "2021-12-04T15:54:06.271200", "exception": false, "start_time": "2021-12-04T15:54:06.055085", "status": "completed"}, "tags": []}, "source": ["#### Loss modules\n", "\n", "We can calculate the loss for a batch by simply performing a few tensor operations as those are automatically added to the computation graph.\n", "For instance, for binary classification, we can use Binary Cross Entropy (BCE) which is defined as follows:\n", "\n", "$$\\mathcal{L}_{BCE} = -\\sum_i \\left[ y_i \\log x_i + (1 - y_i) \\log (1 - x_i) \\right]$$\n", "\n", "where $y$ are our labels, and $x$ our predictions, both in the range of $[0,1]$.\n", "However, PyTorch already provides a list of predefined loss functions which we can use (see [here](https://pytorch.org/docs/stable/nn.html#loss-functions) for a full list).\n", "For instance, for BCE, PyTorch has two modules: `nn.BCELoss()`, `nn.BCEWithLogitsLoss()`.\n", "While `nn.BCELoss` expects the inputs $x$ to be in the range $[0,1]$, i.e. 
the output of a sigmoid, `nn.BCEWithLogitsLoss` combines a sigmoid layer and the BCE loss in a single class.\n", "This version is numerically more stable than using a plain Sigmoid followed by a BCE loss because of the logarithms applied in the loss function.\n", "Hence, it is advised to use loss functions applied on \"logits\" where possible (remember to not apply a sigmoid on the output of the model in this case!).\n", "For our model defined above, we therefore use the module `nn.BCEWithLogitsLoss`."]}, {"cell_type": "code", "execution_count": 45, "id": "5427b133", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:54:06.708663Z", "iopub.status.busy": "2021-12-04T15:54:06.708193Z", "iopub.status.idle": "2021-12-04T15:54:06.710106Z", "shell.execute_reply": "2021-12-04T15:54:06.709723Z"}, "papermill": {"duration": 0.221156, "end_time": "2021-12-04T15:54:06.710216", "exception": false, "start_time": "2021-12-04T15:54:06.489060", "status": "completed"}, "tags": []}, "outputs": [], "source": ["loss_module = nn.BCEWithLogitsLoss()"]}, {"cell_type": "markdown", "id": "af76ed16", "metadata": {"papermill": {"duration": 0.21844, "end_time": "2021-12-04T15:54:07.146700", "exception": false, "start_time": "2021-12-04T15:54:06.928260", "status": "completed"}, "tags": []}, "source": ["#### Stochastic Gradient Descent\n", "\n", "For updating the parameters, PyTorch provides the package `torch.optim` that has the most popular optimizers implemented.\n", "We will discuss the specific optimizers and their differences later in the course, but will for now use the simplest of them: `torch.optim.SGD`.\n", "Stochastic Gradient Descent updates parameters by multiplying the gradients with a small constant, called learning rate, and subtracting those from the parameters (hence minimizing the loss).\n", "Therefore, we slowly move towards the direction of minimizing the loss.\n", "A good default value of the learning rate for a small network as ours is 0.1."]}, {"cell_type": 
"code", "execution_count": 46, "id": "60eae78b", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:54:07.623913Z", "iopub.status.busy": "2021-12-04T15:54:07.623439Z", "iopub.status.idle": "2021-12-04T15:54:07.625388Z", "shell.execute_reply": "2021-12-04T15:54:07.625006Z"}, "papermill": {"duration": 0.22472, "end_time": "2021-12-04T15:54:07.625501", "exception": false, "start_time": "2021-12-04T15:54:07.400781", "status": "completed"}, "tags": []}, "outputs": [], "source": ["# Input to the optimizer are the parameters of the model: model.parameters()\n", "optimizer = torch.optim.SGD(model.parameters(), lr=0.1)"]}, {"cell_type": "markdown", "id": "cab67e22", "metadata": {"papermill": {"duration": 0.214969, "end_time": "2021-12-04T15:54:08.054953", "exception": false, "start_time": "2021-12-04T15:54:07.839984", "status": "completed"}, "tags": []}, "source": ["The optimizer provides two useful functions: `optimizer.step()`, and `optimizer.zero_grad()`.\n", "The step function updates the parameters based on the gradients as explained above.\n", "The function `optimizer.zero_grad()` sets the gradients of all parameters to zero.\n", "While this function seems less relevant at first, it is a crucial pre-step before performing backpropagation.\n", "If we would call the `backward` function on the loss while the parameter gradients are non-zero from the previous batch, the new gradients would actually be added to the previous ones instead of overwriting them.\n", "This is done because a parameter might occur multiple times in a computation graph, and we need to sum the gradients in this case instead of replacing them.\n", "Hence, remember to call `optimizer.zero_grad()` before calculating the gradients of a batch."]}, {"cell_type": "markdown", "id": "815da7f3", "metadata": {"papermill": {"duration": 0.214692, "end_time": "2021-12-04T15:54:08.483699", "exception": false, "start_time": "2021-12-04T15:54:08.269007", "status": "completed"}, "tags": []}, "source": 
["### Training\n", "\n", "Finally, we are ready to train our model.\n", "As a first step, we create a slightly larger dataset and specify a data loader with a larger batch size."]}, {"cell_type": "code", "execution_count": 47, "id": "be9ac2d0", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:54:08.929206Z", "iopub.status.busy": "2021-12-04T15:54:08.928716Z", "iopub.status.idle": "2021-12-04T15:54:08.931250Z", "shell.execute_reply": "2021-12-04T15:54:08.930773Z"}, "papermill": {"duration": 0.229194, "end_time": "2021-12-04T15:54:08.931361", "exception": false, "start_time": "2021-12-04T15:54:08.702167", "status": "completed"}, "tags": []}, "outputs": [], "source": ["train_dataset = XORDataset(size=1000)\n", "train_data_loader = data.DataLoader(train_dataset, batch_size=128, shuffle=True)"]}, {"cell_type": "markdown", "id": "0271a836", "metadata": {"papermill": {"duration": 0.214622, "end_time": "2021-12-04T15:54:09.363363", "exception": false, "start_time": "2021-12-04T15:54:09.148741", "status": "completed"}, "tags": []}, "source": ["Now, we can write a small training function.\n", "Remember our five steps: load a batch, obtain the predictions, calculate the loss, backpropagate, and update.\n", "Additionally, we have to push all data and model parameters to the device of our choice (GPU if available).\n", "For the tiny neural network we have, communicating the data to the GPU actually takes much more time than we could save from running the operation on GPU.\n", "For large networks, the communication time is significantly smaller than the actual runtime making a GPU crucial in these cases.\n", "Still, to practice, we will push the data to GPU here."]}, {"cell_type": "code", "execution_count": 48, "id": "c7b13460", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:54:09.806935Z", "iopub.status.busy": "2021-12-04T15:54:09.806433Z", "iopub.status.idle": "2021-12-04T15:54:09.810018Z", "shell.execute_reply": 
"2021-12-04T15:54:09.809609Z"}, "papermill": {"duration": 0.222561, "end_time": "2021-12-04T15:54:09.810128", "exception": false, "start_time": "2021-12-04T15:54:09.587567", "status": "completed"}, "tags": []}, "outputs": [{"data": {"text/plain": ["SimpleClassifier(\n", " (linear1): Linear(in_features=2, out_features=4, bias=True)\n", " (act_fn): Tanh()\n", " (linear2): Linear(in_features=4, out_features=1, bias=True)\n", ")"]}, "execution_count": 48, "metadata": {}, "output_type": "execute_result"}], "source": ["# Push model to device. Has to be only done once\n", "model.to(device)"]}, {"cell_type": "markdown", "id": "cadf5955", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.214526, "end_time": "2021-12-04T15:54:10.247009", "exception": false, "start_time": "2021-12-04T15:54:10.032483", "status": "completed"}, "tags": []}, "source": ["In addition, we set our model to training mode.\n", "This is done by calling `model.train()`.\n", "There exist certain modules that need to perform a different forward\n", "step during training than during testing (e.g. 
BatchNorm and Dropout),\n", "and we can switch between them using `model.train()` and `model.eval()`."]}, {"cell_type": "code", "execution_count": 49, "id": "b2e9a50f", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:54:10.679237Z", "iopub.status.busy": "2021-12-04T15:54:10.678761Z", "iopub.status.idle": "2021-12-04T15:54:10.680363Z", "shell.execute_reply": "2021-12-04T15:54:10.680739Z"}, "papermill": {"duration": 0.219695, "end_time": "2021-12-04T15:54:10.680870", "exception": false, "start_time": "2021-12-04T15:54:10.461175", "status": "completed"}, "tags": []}, "outputs": [], "source": ["def train_model(model, optimizer, data_loader, loss_module, num_epochs=100):\n", " # Set model to train mode\n", " model.train()\n", "\n", " # Training loop\n", " for epoch in tqdm(range(num_epochs)):\n", " for data_inputs, data_labels in data_loader:\n", "\n", " # Step 1: Move input data to device (only strictly necessary if we use GPU)\n", " data_inputs = data_inputs.to(device)\n", " data_labels = data_labels.to(device)\n", "\n", " # Step 2: Run the model on the input data\n", " preds = model(data_inputs)\n", " preds = preds.squeeze(dim=1) # Output is [Batch size, 1], but we want [Batch size]\n", "\n", " # Step 3: Calculate the loss\n", " loss = loss_module(preds, data_labels.float())\n", "\n", " # Step 4: Perform backpropagation\n", " # Before calculating the gradients, we need to ensure that they are all zero.\n", " # The gradients would not be overwritten, but actually added to the existing ones.\n", " optimizer.zero_grad()\n", " # Perform backpropagation\n", " loss.backward()\n", "\n", " # Step 5: Update the parameters\n", " optimizer.step()"]}, {"cell_type": "code", "execution_count": 50, "id": "6857c620", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:54:11.110005Z", "iopub.status.busy": "2021-12-04T15:54:11.109541Z", "iopub.status.idle": "2021-12-04T15:54:12.322199Z", "shell.execute_reply": "2021-12-04T15:54:12.322585Z"}, "papermill": 
{"duration": 1.429741, "end_time": "2021-12-04T15:54:12.322764", "exception": false, "start_time": "2021-12-04T15:54:10.893023", "status": "completed"}, "tags": []}, "outputs": [{"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "8222db0c1ce847c18b82712853539f5e", "version_major": 2, "version_minor": 0}, "text/plain": [" 0%| | 0/100 [00:00 Don't drop the last batch although it is smaller than 128\n", "test_data_loader = data.DataLoader(test_dataset, batch_size=128, shuffle=False, drop_last=False)"]}, {"cell_type": "markdown", "id": "9b0c0259", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.223015, "end_time": "2021-12-04T15:54:16.659749", "exception": false, "start_time": "2021-12-04T15:54:16.436734", "status": "completed"}, "tags": []}, "source": ["As metric, we will use accuracy which is calculated as follows:\n", "\n", "$$acc = \\frac{\\#\\text{correct predictions}}{\\#\\text{all predictions}} = \\frac{TP+TN}{TP+TN+FP+FN}$$\n", "\n", "where TP are the true positives, TN true negatives, FP false positives, and FN the false negatives.\n", "\n", "When evaluating the model, we don't need to keep track of the computation graph as we don't intend to calculate the gradients.\n", "This reduces the required memory and speeds up the model.\n", "In PyTorch, we can deactivate the computation graph using `with torch.no_grad(): ...`.\n", "Remember to additionally set the model to eval mode."]}, {"cell_type": "code", "execution_count": 55, "id": "81d5e627", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:54:17.100737Z", "iopub.status.busy": "2021-12-04T15:54:17.100266Z", "iopub.status.idle": "2021-12-04T15:54:17.102233Z", "shell.execute_reply": "2021-12-04T15:54:17.101833Z"}, "papermill": {"duration": 0.228058, "end_time": "2021-12-04T15:54:17.102341", "exception": false, "start_time": "2021-12-04T15:54:16.874283", "status": "completed"}, "tags": []}, "outputs": [], "source": ["def eval_model(model, data_loader):\n", " 
model.eval() # Set model to eval mode\n", " true_preds, num_preds = 0.0, 0.0\n", "\n", " with torch.no_grad(): # Deactivate gradients for the following code\n", " for data_inputs, data_labels in data_loader:\n", "\n", " # Determine prediction of model on dev set\n", " data_inputs, data_labels = data_inputs.to(device), data_labels.to(device)\n", " preds = model(data_inputs)\n", " preds = preds.squeeze(dim=1)\n", " preds = torch.sigmoid(preds) # Sigmoid to map predictions between 0 and 1\n", " pred_labels = (preds >= 0.5).long() # Binarize predictions to 0 and 1\n", "\n", " # Keep records of predictions for the accuracy metric (true_preds=TP+TN, num_preds=TP+TN+FP+FN)\n", " true_preds += (pred_labels == data_labels).sum()\n", " num_preds += data_labels.shape[0]\n", "\n", " acc = true_preds / num_preds\n", " print(f\"Accuracy of the model: {100.0*acc:4.2f}%\")"]}, {"cell_type": "code", "execution_count": 56, "id": "71db7937", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:54:17.540450Z", "iopub.status.busy": "2021-12-04T15:54:17.539985Z", "iopub.status.idle": "2021-12-04T15:54:17.546678Z", "shell.execute_reply": "2021-12-04T15:54:17.547057Z"}, "papermill": {"duration": 0.228671, "end_time": "2021-12-04T15:54:17.547187", "exception": false, "start_time": "2021-12-04T15:54:17.318516", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Accuracy of the model: 100.00%\n"]}], "source": ["eval_model(model, test_data_loader)"]}, {"cell_type": "markdown", "id": "0b763086", "metadata": {"papermill": {"duration": 0.216167, "end_time": "2021-12-04T15:54:17.978220", "exception": false, "start_time": "2021-12-04T15:54:17.762053", "status": "completed"}, "tags": []}, "source": ["If we trained our model correctly, we should see a score close to 100% accuracy.\n", "However, this is only possible because of our simple task, and\n", "unfortunately, we usually don't get such high scores on test sets of\n", "more 
complex tasks."]}, {"cell_type": "markdown", "id": "5fc4b4e1", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.215766, "end_time": "2021-12-04T15:54:18.415334", "exception": false, "start_time": "2021-12-04T15:54:18.199568", "status": "completed"}, "tags": []}, "source": ["#### Visualizing classification boundaries\n", "\n", "To visualize what our model has learned, we can perform a prediction for every data point in a range of $[-0.5, 1.5]$, and visualize the predicted class as in the sample figure at the beginning of this section.\n", "This shows where the model has created decision boundaries, and which points would be classified as $0$, and which as $1$.\n", "We therefore get a background image out of blue (class 0) and orange (class 1).\n", "The spots where the model is uncertain we will see a blurry overlap.\n", "The specific code is less relevant compared to the output figure which\n", "should hopefully show us a clear separation of classes:"]}, {"cell_type": "code", "execution_count": 57, "id": "9b2cdd8a", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:54:18.862084Z", "iopub.status.busy": "2021-12-04T15:54:18.861126Z", "iopub.status.idle": "2021-12-04T15:54:19.252452Z", "shell.execute_reply": "2021-12-04T15:54:19.252841Z"}, "papermill": {"duration": 0.618628, "end_time": "2021-12-04T15:54:19.253007", "exception": false, "start_time": "2021-12-04T15:54:18.634379", "status": "completed"}, "tags": []}, "outputs": [{"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-12-04T16:54:18.983966\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}], "source": ["@torch.no_grad() # Decorator, same effect as \"with torch.no_grad(): ...\" over the whole function.\n", "def visualize_classification(model, data, label):\n", " if isinstance(data, torch.Tensor):\n", " data = data.cpu().numpy()\n", " if isinstance(label, torch.Tensor):\n", " label = label.cpu().numpy()\n", " data_0 = data[label == 0]\n", " data_1 = data[label == 1]\n", "\n", " plt.figure(figsize=(4, 4))\n", " plt.scatter(data_0[:, 0], data_0[:, 1], edgecolor=\"#333\", label=\"Class 0\")\n", " plt.scatter(data_1[:, 0], data_1[:, 1], edgecolor=\"#333\", label=\"Class 1\")\n", " plt.title(\"Dataset samples\")\n", " plt.ylabel(r\"$x_2$\")\n", " plt.xlabel(r\"$x_1$\")\n", " plt.legend()\n", "\n", " # Let's make use of a lot of operations we have learned above\n", " model.to(device)\n", " c0 = torch.Tensor(to_rgba(\"C0\")).to(device)\n", " c1 = torch.Tensor(to_rgba(\"C1\")).to(device)\n", " x1 = torch.arange(-0.5, 1.5, step=0.01, device=device)\n", " x2 = torch.arange(-0.5, 1.5, step=0.01, device=device)\n", " xx1, xx2 = torch.meshgrid(x1, x2) # Meshgrid function as in numpy\n", " model_inputs = torch.stack([xx1, xx2], dim=-1)\n", " preds = model(model_inputs)\n", " preds = torch.sigmoid(preds)\n", " # Specifying \"None\" in a dimension creates a new one\n", " output_image = (1 - preds) * c0[None, None] + preds * c1[None, None]\n", " output_image = (\n", " output_image.cpu().numpy()\n", " ) # Convert to numpy array. 
This only works for tensors on CPU, hence first push to CPU\n", " plt.imshow(output_image, origin=\"lower\", extent=(-0.5, 1.5, -0.5, 1.5))\n", " plt.grid(False)\n", "\n", "\n", "visualize_classification(model, dataset.data, dataset.label)\n", "plt.show()"]}, {"cell_type": "markdown", "id": "34a5111d", "metadata": {"papermill": {"duration": 0.21845, "end_time": "2021-12-04T15:54:19.694395", "exception": false, "start_time": "2021-12-04T15:54:19.475945", "status": "completed"}, "tags": []}, "source": ["The decision boundaries might not look exactly as in the figure in the preamble of this section which can be caused by running it on CPU or a different GPU architecture.\n", "Nevertheless, the result on the accuracy metric should be approximately the same."]}, {"cell_type": "markdown", "id": "a501a3ba", "metadata": {"papermill": {"duration": 0.219567, "end_time": "2021-12-04T15:54:20.134648", "exception": false, "start_time": "2021-12-04T15:54:19.915081", "status": "completed"}, "tags": []}, "source": ["## Additional features we didn't get to discuss yet\n", "\n", "Finally, you are all set to start with your own PyTorch project!\n", "In summary, we have looked at how we can build neural networks in PyTorch, and train and test them on data.\n", "However, there is still much more to PyTorch we haven't discussed yet.\n", "In the coming series of Jupyter notebooks, we will discover more and more functionalities of PyTorch, so that you also get familiar with PyTorch concepts beyond the basics.\n", "If you are already interested in learning more of PyTorch, we recommend the official [tutorial website](https://pytorch.org/tutorials/) that contains many tutorials on various topics.\n", "Especially logging with Tensorboard ([tutorial\n", "here](https://pytorch.org/tutorials/intermediate/tensorboard_tutorial.html))\n", "is a good practice that we will explore from Tutorial 5 on."]}, {"cell_type": "markdown", "id": "96f1e6ba", "metadata": {"papermill": {"duration": 0.227432, 
"end_time": "2021-12-04T15:54:20.580697", "exception": false, "start_time": "2021-12-04T15:54:20.353265", "status": "completed"}, "tags": []}, "source": ["## Congratulations - Time to Join the Community!\n", "\n", "Congratulations on completing this notebook tutorial! If you enjoyed this and would like to join the Lightning\n", "movement, you can do so in the following ways!\n", "\n", "### Star [Lightning](https://github.com/PyTorchLightning/pytorch-lightning) on GitHub\n", "The easiest way to help our community is just by starring the GitHub repos! This helps raise awareness of the cool\n", "tools we're building.\n", "\n", "### Join our [Slack](https://join.slack.com/t/pytorch-lightning/shared_invite/zt-pw5v393p-qRaDgEk24~EjiZNBpSQFgQ)!\n", "The best way to keep up to date on the latest advancements is to join our community! Make sure to introduce yourself\n", "and share your interests in `#general` channel\n", "\n", "\n", "### Contributions !\n", "The best way to contribute to our community is to become a code contributor! At any time you can go to\n", "[Lightning](https://github.com/PyTorchLightning/pytorch-lightning) or [Bolt](https://github.com/PyTorchLightning/lightning-bolts)\n", "GitHub Issues page and filter for \"good first issue\".\n", "\n", "* [Lightning good first issue](https://github.com/PyTorchLightning/pytorch-lightning/issues?q=is%3Aopen+is%3Aissue+label%3A%22good+first+issue%22)\n", "* [Bolt good first issue](https://github.com/PyTorchLightning/lightning-bolts/issues?q=is%3Aopen+is%3Aissue+label%3A%22good+first+issue%22)\n", "* You can also contribute your own notebooks with useful examples !\n", "\n", "### Great thanks from the entire Pytorch Lightning Team for your interest !\n", "\n", "[![Pytorch Lightning](){height=\"60px\" width=\"240px\"}](https://pytorchlightning.ai)"]}, {"cell_type": "raw", "metadata": {"raw_mimetype": "text/restructuredtext"}, "source": [".. 
customcarditem::\n", " :header: Tutorial 1: Introduction to PyTorch\n", " :card_description: This tutorial will give a short introduction to PyTorch basics, and get you setup for writing your own neural networks. This notebook is part of a lecture series on Deep...\n", " :tags: GPU/TPU,UvA-DL-Course\n", " :image: _static/images/course_UvA-DL/01-introduction-to-pytorch.jpg"]}], "metadata": {"jupytext": {"cell_metadata_filter": "colab,colab_type,id,-all", "formats": "ipynb,py:percent", "main_language": "python"}, "language_info": {"codemirror_mode": {"name": "ipython", "version": 3}, "file_extension": ".py", "mimetype": "text/x-python", "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.9.7"}, "papermill": {"default_parameters": {}, "duration": 60.734817, "end_time": "2021-12-04T15:54:21.407766", "environment_variables": {}, "exception": null, "input_path": "course_UvA-DL/01-introduction-to-pytorch/Introduction_to_PyTorch.ipynb", "output_path": ".notebooks/course_UvA-DL/01-introduction-to-pytorch.ipynb", "parameters": {}, "start_time": "2021-12-04T15:53:20.672949", "version": "2.3.3"}, "widgets": {"application/vnd.jupyter.widget-state+json": {"state": {"1258f7118a0c424184d1474fa7c7c996": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_2a2ddc2695ca450cbb62218c40c78f0d", "placeholder": "\u200b", "style": "IPY_MODEL_c9b7c58a69a648deb8285855bed4a010", "value": "100%"}}, "2a2ddc2695ca450cbb62218c40c78f0d": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": 
"@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "3ae1c6ddf0434903b17b358d083da8db": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": 
null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "4d30509a31df4d158d2bb33eb9986e6a": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "61c30cfd473447a38bffb83685bd5f10": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_cd512299253f4dca9324b2260bf7d58c", "placeholder": "\u200b", "style": "IPY_MODEL_eaacc50a6b044949945e0b3f82453cca", "value": " 100/100 [00:01<00:00, 84.02it/s]"}}, "8222db0c1ce847c18b82712853539f5e": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_1258f7118a0c424184d1474fa7c7c996", "IPY_MODEL_fa1ac1649a95469d9415b8ad881b0c26", "IPY_MODEL_61c30cfd473447a38bffb83685bd5f10"], "layout": "IPY_MODEL_3ae1c6ddf0434903b17b358d083da8db"}}, "9c98efcaa23c420fa86f3b36f45e2f83": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": 
"@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "c9b7c58a69a648deb8285855bed4a010": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "cd512299253f4dca9324b2260bf7d58c": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, 
"grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "eaacc50a6b044949945e0b3f82453cca": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "fa1ac1649a95469d9415b8ad881b0c26": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_9c98efcaa23c420fa86f3b36f45e2f83", "max": 100.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_4d30509a31df4d158d2bb33eb9986e6a", "value": 100.0}}}, "version_major": 2, "version_minor": 0}}}, "nbformat": 4, "nbformat_minor": 5} \ No newline at end of file diff --git a/source/notebooks/course_UvA-DL/02-activation-functions.ipynb b/source/notebooks/course_UvA-DL/02-activation-functions.ipynb deleted file mode 100644 index f71b969..0000000 --- 
a/source/notebooks/course_UvA-DL/02-activation-functions.ipynb +++ /dev/null @@ -1 +0,0 @@ -{"cells": [{"cell_type": "markdown", "id": "ed3501af", "metadata": {"papermill": {"duration": 0.023462, "end_time": "2021-09-16T12:33:15.496875", "exception": false, "start_time": "2021-09-16T12:33:15.473413", "status": "completed"}, "tags": []}, "source": ["\n", "# Tutorial 2: Activation Functions\n", "\n", "* **Author:** Phillip Lippe\n", "* **License:** CC BY-SA\n", "* **Generated:** 2021-09-16T14:32:18.973374\n", "\n", "In this tutorial, we will take a closer look at (popular) activation functions and investigate their effect on optimization properties in neural networks.\n", "Activation functions are a crucial part of deep learning models as they add the non-linearity to neural networks.\n", "There is a great variety of activation functions in the literature, and some are more beneficial than others.\n", "The goal of this tutorial is to show the importance of choosing a good activation function (and how to do so), and what problems might occur if we don't.\n", "This notebook is part of a lecture series on Deep Learning at the University of Amsterdam.\n", "The full list of tutorials can be found at https://uvadlc-notebooks.rtfd.io.\n", "\n", "\n", "---\n", "Open in [![Open In Colab](){height=\"20px\" width=\"117px\"}](https://colab.research.google.com/github/PytorchLightning/lightning-tutorials/blob/publication/.notebooks/course_UvA-DL/02-activation-functions.ipynb)\n", "\n", "Give us a \u2b50 [on Github](https://www.github.com/PytorchLightning/pytorch-lightning/)\n", "| Check out [the documentation](https://pytorch-lightning.readthedocs.io/en/latest/)\n", "| Join us [on Slack](https://join.slack.com/t/pytorch-lightning/shared_invite/zt-pw5v393p-qRaDgEk24~EjiZNBpSQFgQ)"]}, {"cell_type": "markdown", "id": "66b84901", "metadata": {"papermill": {"duration": 0.021804, "end_time": "2021-09-16T12:33:15.540678", "exception": false, "start_time": "2021-09-16T12:33:15.518874", 
"status": "completed"}, "tags": []}, "source": ["## Setup\n", "This notebook requires some packages besides pytorch-lightning."]}, {"cell_type": "code", "execution_count": 1, "id": "4d7c8160", "metadata": {"colab": {}, "colab_type": "code", "execution": {"iopub.execute_input": "2021-09-16T12:33:15.587749Z", "iopub.status.busy": "2021-09-16T12:33:15.587280Z", "iopub.status.idle": "2021-09-16T12:33:15.589355Z", "shell.execute_reply": "2021-09-16T12:33:15.589747Z"}, "id": "LfrJLKPFyhsK", "lines_to_next_cell": 0, "papermill": {"duration": 0.027383, "end_time": "2021-09-16T12:33:15.589924", "exception": false, "start_time": "2021-09-16T12:33:15.562541", "status": "completed"}, "tags": []}, "outputs": [], "source": ["# ! pip install --quiet \"torchmetrics>=0.3\" \"torch>=1.6, <1.9\" \"pytorch-lightning>=1.3\" \"torchvision\" \"seaborn\" \"matplotlib\""]}, {"cell_type": "markdown", "id": "94e4c637", "metadata": {"papermill": {"duration": 0.021895, "end_time": "2021-09-16T12:33:15.635408", "exception": false, "start_time": "2021-09-16T12:33:15.613513", "status": "completed"}, "tags": []}, "source": ["
\n", "Before we start, we import our standard libraries and set up basic functions:"]}, {"cell_type": "code", "execution_count": 2, "id": "afda8dd1", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:33:15.687272Z", "iopub.status.busy": "2021-09-16T12:33:15.686802Z", "iopub.status.idle": "2021-09-16T12:33:16.799385Z", "shell.execute_reply": "2021-09-16T12:33:16.799794Z"}, "papermill": {"duration": 1.142099, "end_time": "2021-09-16T12:33:16.799933", "exception": false, "start_time": "2021-09-16T12:33:15.657834", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["/tmp/ipykernel_749/3776275675.py:24: DeprecationWarning: `set_matplotlib_formats` is deprecated since IPython 7.23, directly use `matplotlib_inline.backend_inline.set_matplotlib_formats()`\n", " set_matplotlib_formats(\"svg\", \"pdf\") # For export\n"]}], "source": ["import json\n", "import math\n", "import os\n", "import urllib.request\n", "import warnings\n", "from urllib.error import HTTPError\n", "\n", "import matplotlib.pyplot as plt\n", "import numpy as np\n", "import seaborn as sns\n", "import torch\n", "import torch.nn as nn\n", "import torch.nn.functional as F\n", "import torch.optim as optim\n", "import torch.utils.data as data\n", "import torchvision\n", "\n", "# %matplotlib inline\n", "from IPython.display import set_matplotlib_formats\n", "from torchvision import transforms\n", "from torchvision.datasets import FashionMNIST\n", "from tqdm.notebook import tqdm\n", "\n", "set_matplotlib_formats(\"svg\", \"pdf\") # For export\n", "sns.set()"]}, {"cell_type": "markdown", "id": "2587fcef", "metadata": {"papermill": {"duration": 0.022118, "end_time": "2021-09-16T12:33:16.844975", "exception": false, "start_time": "2021-09-16T12:33:16.822857", "status": "completed"}, "tags": []}, "source": ["We will define a function to set a seed on all libraries we might interact with in this tutorial (here numpy and torch).\n", "This allows us to 
make our training reproducible.\n", "However, note that in contrast to the CPU, the same seed on different GPU architectures can give different results.\n", "All models here have been trained on an NVIDIA GTX1080Ti.\n", "\n", "Additionally, the following cell defines two paths: `DATASET_PATH` and `CHECKPOINT_PATH`.\n", "The dataset path is the directory where we will download datasets used in the notebooks.\n", "It is recommended to store all datasets from PyTorch in one joined directory to prevent duplicate downloads.\n", "The checkpoint path is the directory where we will store trained model weights and additional files.\n", "The needed files will be automatically downloaded.\n", "In case you are on Google Colab, it is recommended to change the\n", "directories to start from the current directory (i.e. remove `../` for\n", "both dataset and checkpoint path)."]}, {"cell_type": "code", "execution_count": 3, "id": "5ad210ad", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:33:16.894843Z", "iopub.status.busy": "2021-09-16T12:33:16.894366Z", "iopub.status.idle": "2021-09-16T12:33:16.964040Z", "shell.execute_reply": "2021-09-16T12:33:16.963624Z"}, "papermill": {"duration": 0.096979, "end_time": "2021-09-16T12:33:16.964150", "exception": false, "start_time": "2021-09-16T12:33:16.867171", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Using device cuda:0\n"]}], "source": ["# Path to the folder where the datasets are/should be downloaded (e.g. 
MNIST)\n", "DATASET_PATH = os.environ.get(\"PATH_DATASETS\", \"data/\")\n", "# Path to the folder where the pretrained models are saved\n", "CHECKPOINT_PATH = os.environ.get(\"PATH_CHECKPOINT\", \"saved_models/Activation_Functions/\")\n", "\n", "\n", "# Function for setting the seed\n", "def set_seed(seed):\n", " np.random.seed(seed)\n", " torch.manual_seed(seed)\n", " if torch.cuda.is_available(): # GPU operation have separate seed\n", " torch.cuda.manual_seed(seed)\n", " torch.cuda.manual_seed_all(seed)\n", "\n", "\n", "set_seed(42)\n", "\n", "# Additionally, some operations on a GPU are implemented stochastic for efficiency\n", "# We want to ensure that all operations are deterministic on GPU (if used) for reproducibility\n", "torch.backends.cudnn.determinstic = True\n", "torch.backends.cudnn.benchmark = False\n", "\n", "# Fetching the device that will be used throughout this notebook\n", "device = torch.device(\"cpu\") if not torch.cuda.is_available() else torch.device(\"cuda:0\")\n", "print(\"Using device\", device)"]}, {"cell_type": "markdown", "id": "5aa7e547", "metadata": {"papermill": {"duration": 0.022623, "end_time": "2021-09-16T12:33:17.010058", "exception": false, "start_time": "2021-09-16T12:33:16.987435", "status": "completed"}, "tags": []}, "source": ["The following cell downloads all pretrained models we will use in this notebook.\n", "The files are stored on a separate [repository](https://github.com/phlippe/saved_models) to reduce the size of the notebook repository, especially for building the documentation on ReadTheDocs.\n", "In case the download below fails, you can download the models from a [Google Drive folder](https://drive.google.com/drive/folders/1sFpZUpDJVjiYEvIqISqfkFizfsTnPf4s?usp=sharing).\n", "Please let me (Phillip) know if an error occurs so it can be fixed for all students."]}, {"cell_type": "code", "execution_count": 4, "id": "58e26273", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:33:17.060096Z", 
"iopub.status.busy": "2021-09-16T12:33:17.059620Z", "iopub.status.idle": "2021-09-16T12:33:18.470969Z", "shell.execute_reply": "2021-09-16T12:33:18.470514Z"}, "papermill": {"duration": 1.438459, "end_time": "2021-09-16T12:33:18.471082", "exception": false, "start_time": "2021-09-16T12:33:17.032623", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Downloading https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial3/FashionMNIST_elu.config...\n", "Downloading https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial3/FashionMNIST_elu.tar...\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Downloading https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial3/FashionMNIST_leakyrelu.config...\n", "Downloading https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial3/FashionMNIST_leakyrelu.tar...\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Downloading https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial3/FashionMNIST_relu.config...\n", "Downloading https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial3/FashionMNIST_relu.tar...\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Downloading https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial3/FashionMNIST_sigmoid.config...\n", "Downloading https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial3/FashionMNIST_sigmoid.tar...\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Downloading https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial3/FashionMNIST_swish.config...\n", "Downloading https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial3/FashionMNIST_swish.tar...\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Downloading https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial3/FashionMNIST_tanh.config...\n", "Downloading 
https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial3/FashionMNIST_tanh.tar...\n"]}], "source": ["# Github URL where saved models are stored for this tutorial\n", "base_url = \"https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial3/\"\n", "# Files to download\n", "pretrained_files = [\n", " \"FashionMNIST_elu.config\",\n", " \"FashionMNIST_elu.tar\",\n", " \"FashionMNIST_leakyrelu.config\",\n", " \"FashionMNIST_leakyrelu.tar\",\n", " \"FashionMNIST_relu.config\",\n", " \"FashionMNIST_relu.tar\",\n", " \"FashionMNIST_sigmoid.config\",\n", " \"FashionMNIST_sigmoid.tar\",\n", " \"FashionMNIST_swish.config\",\n", " \"FashionMNIST_swish.tar\",\n", " \"FashionMNIST_tanh.config\",\n", " \"FashionMNIST_tanh.tar\",\n", "]\n", "# Create checkpoint path if it doesn't exist yet\n", "os.makedirs(CHECKPOINT_PATH, exist_ok=True)\n", "\n", "# For each file, check whether it already exists. If not, try downloading it.\n", "for file_name in pretrained_files:\n", " file_path = os.path.join(CHECKPOINT_PATH, file_name)\n", " if not os.path.isfile(file_path):\n", " file_url = base_url + file_name\n", " print(f\"Downloading {file_url}...\")\n", " try:\n", " urllib.request.urlretrieve(file_url, file_path)\n", " except HTTPError as e:\n", " print(\n", " \"Something went wrong. 
Please try to download the file from the GDrive folder, or contact the author with the full output including the following error:\\n\",\n", " e,\n", " )"]}, {"cell_type": "markdown", "id": "acbb3e50", "metadata": {"papermill": {"duration": 0.023807, "end_time": "2021-09-16T12:33:18.519257", "exception": false, "start_time": "2021-09-16T12:33:18.495450", "status": "completed"}, "tags": []}, "source": ["## Common activation functions"]}, {"cell_type": "markdown", "id": "aa4d6503", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.023651, "end_time": "2021-09-16T12:33:18.566824", "exception": false, "start_time": "2021-09-16T12:33:18.543173", "status": "completed"}, "tags": []}, "source": ["As a first step, we will implement some common activation functions by ourselves.\n", "Of course, most of them can also be found in the `torch.nn` package (see the [documentation](https://pytorch.org/docs/stable/nn.html#non-linear-activations-weighted-sum-nonlinearity) for an overview).\n", "However, we'll write our own functions here for a better understanding and insights.\n", "\n", "For an easier time of comparing various activation functions, we start\n", "with defining a base class from which all our future modules will\n", "inherit:"]}, {"cell_type": "code", "execution_count": 5, "id": "3dcfd06e", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:33:18.618629Z", "iopub.status.busy": "2021-09-16T12:33:18.618166Z", "iopub.status.idle": "2021-09-16T12:33:18.620230Z", "shell.execute_reply": "2021-09-16T12:33:18.619833Z"}, "papermill": {"duration": 0.029814, "end_time": "2021-09-16T12:33:18.620328", "exception": false, "start_time": "2021-09-16T12:33:18.590514", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class ActivationFunction(nn.Module):\n", " def __init__(self):\n", " super().__init__()\n", " self.name = self.__class__.__name__\n", " self.config = {\"name\": self.name}"]}, {"cell_type": "markdown", "id": "d528e8e9", 
"metadata": {"papermill": {"duration": 0.023943, "end_time": "2021-09-16T12:33:18.668417", "exception": false, "start_time": "2021-09-16T12:33:18.644474", "status": "completed"}, "tags": []}, "source": ["Every activation function will be an `nn.Module` so that we can integrate them nicely in a network.\n", "We will use the `config` dictionary to store adjustable parameters for some activation functions.\n", "\n", "Next, we implement two of the \"oldest\" activation functions that are still commonly used for various tasks: sigmoid and tanh.\n", "Both the sigmoid and tanh activation can be also found as PyTorch functions (`torch.sigmoid`, `torch.tanh`) or as modules (`nn.Sigmoid`, `nn.Tanh`).\n", "Here, we implement them by hand:"]}, {"cell_type": "code", "execution_count": 6, "id": "e86a8cd3", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:33:18.720307Z", "iopub.status.busy": "2021-09-16T12:33:18.719843Z", "iopub.status.idle": "2021-09-16T12:33:18.721916Z", "shell.execute_reply": "2021-09-16T12:33:18.721501Z"}, "papermill": {"duration": 0.029566, "end_time": "2021-09-16T12:33:18.722011", "exception": false, "start_time": "2021-09-16T12:33:18.692445", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class Sigmoid(ActivationFunction):\n", " def forward(self, x):\n", " return 1 / (1 + torch.exp(-x))\n", "\n", "\n", "class Tanh(ActivationFunction):\n", " def forward(self, x):\n", " x_exp, neg_x_exp = torch.exp(x), torch.exp(-x)\n", " return (x_exp - neg_x_exp) / (x_exp + neg_x_exp)"]}, {"cell_type": "markdown", "id": "b2beae98", "metadata": {"papermill": {"duration": 0.023891, "end_time": "2021-09-16T12:33:18.770175", "exception": false, "start_time": "2021-09-16T12:33:18.746284", "status": "completed"}, "tags": []}, "source": ["Another popular activation function that has allowed the training of deeper networks, is the Rectified Linear Unit (ReLU).\n", "Despite its simplicity of being a piecewise linear function, ReLU has one major 
benefit compared to sigmoid and tanh: a strong, stable gradient for a large range of values.\n", "Based on this idea, a lot of variations of ReLU have been proposed, of which we will implement the following three: LeakyReLU, ELU, and Swish.\n", "LeakyReLU replaces the zero settings in the negative part with a smaller slope to allow gradients to flow also in this part of the input.\n", "Similarly, ELU replaces the negative part with an exponential decay.\n", "The third, most recently proposed activation function is Swish, which is actually the result of a large experiment with the purpose of finding the \"optimal\" activation function.\n", "Compared to the other activation functions, Swish is both smooth and non-monotonic (i.e. contains a change of sign in the gradient).\n", "This has been shown to prevent dead neurons as in standard ReLU activation, especially for deep networks.\n", "If interested, a more detailed discussion of the benefits of Swish can be found in [this paper](https://arxiv.org/abs/1710.05941) [1].\n", "\n", "Let's implement the four activation functions below:"]}, {"cell_type": "code", "execution_count": 7, "id": "68254625", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:33:18.823746Z", "iopub.status.busy": "2021-09-16T12:33:18.823281Z", "iopub.status.idle": "2021-09-16T12:33:18.825314Z", "shell.execute_reply": "2021-09-16T12:33:18.824855Z"}, "papermill": {"duration": 0.030969, "end_time": "2021-09-16T12:33:18.825411", "exception": false, "start_time": "2021-09-16T12:33:18.794442", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class ReLU(ActivationFunction):\n", " def forward(self, x):\n", " return x * (x > 0).float()\n", "\n", "\n", "class LeakyReLU(ActivationFunction):\n", " def __init__(self, alpha=0.1):\n", " super().__init__()\n", " self.config[\"alpha\"] = alpha\n", "\n", " def forward(self, x):\n", " return torch.where(x > 0, x, self.config[\"alpha\"] * x)\n", "\n", "\n", "class 
ELU(ActivationFunction):\n", " def forward(self, x):\n", " return torch.where(x > 0, x, torch.exp(x) - 1)\n", "\n", "\n", "class Swish(ActivationFunction):\n", " def forward(self, x):\n", " return x * torch.sigmoid(x)"]}, {"cell_type": "markdown", "id": "587dfd90", "metadata": {"papermill": {"duration": 0.023958, "end_time": "2021-09-16T12:33:18.873222", "exception": false, "start_time": "2021-09-16T12:33:18.849264", "status": "completed"}, "tags": []}, "source": ["For later usage, we summarize all our activation functions in a dictionary mapping the name to the class object.\n", "In case you implement a new activation function by yourself, add it here to include it in future comparisons as well:"]}, {"cell_type": "code", "execution_count": 8, "id": "61e3706d", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:33:18.924380Z", "iopub.status.busy": "2021-09-16T12:33:18.923908Z", "iopub.status.idle": "2021-09-16T12:33:18.925974Z", "shell.execute_reply": "2021-09-16T12:33:18.925558Z"}, "papermill": {"duration": 0.02888, "end_time": "2021-09-16T12:33:18.926069", "exception": false, "start_time": "2021-09-16T12:33:18.897189", "status": "completed"}, "tags": []}, "outputs": [], "source": ["act_fn_by_name = {\"sigmoid\": Sigmoid, \"tanh\": Tanh, \"relu\": ReLU, \"leakyrelu\": LeakyReLU, \"elu\": ELU, \"swish\": Swish}"]}, {"cell_type": "markdown", "id": "21624a4a", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.024088, "end_time": "2021-09-16T12:33:18.974301", "exception": false, "start_time": "2021-09-16T12:33:18.950213", "status": "completed"}, "tags": []}, "source": ["### Visualizing activation functions\n", "\n", "To get an idea of what each activation function actually does, we will visualize them in the following.\n", "Next to the actual activation value, the gradient of the function is an important aspect as it is crucial for optimizing the neural network.\n", "PyTorch allows us to compute the gradients simply by calling the 
`backward` function:"]}, {"cell_type": "code", "execution_count": 9, "id": "f0c123df", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:33:19.026746Z", "iopub.status.busy": "2021-09-16T12:33:19.026268Z", "iopub.status.idle": "2021-09-16T12:33:19.027904Z", "shell.execute_reply": "2021-09-16T12:33:19.028280Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 0.029948, "end_time": "2021-09-16T12:33:19.028393", "exception": false, "start_time": "2021-09-16T12:33:18.998445", "status": "completed"}, "tags": []}, "outputs": [], "source": ["def get_grads(act_fn, x):\n", " \"\"\"Computes the gradients of an activation function at specified positions.\n", "\n", " Args:\n", " act_fn: An object of the class \"ActivationFunction\" with an implemented forward pass.\n", " x: 1D input tensor.\n", " Returns:\n", " A tensor with the same size of x containing the gradients of act_fn at x.\n", " \"\"\"\n", " x = x.clone().requires_grad_() # Mark the input as tensor for which we want to store gradients\n", " out = act_fn(x)\n", " out.sum().backward() # Summing results in an equal gradient flow to each element in x\n", " return x.grad # Accessing the gradients of x by \"x.grad\""]}, {"cell_type": "markdown", "id": "76f9c1ee", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.024154, "end_time": "2021-09-16T12:33:19.077839", "exception": false, "start_time": "2021-09-16T12:33:19.053685", "status": "completed"}, "tags": []}, "source": ["Now we can visualize all our activation functions including their gradients:"]}, {"cell_type": "code", "execution_count": 10, "id": "a03e014f", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:33:19.132841Z", "iopub.status.busy": "2021-09-16T12:33:19.132367Z", "iopub.status.idle": "2021-09-16T12:33:20.711026Z", "shell.execute_reply": "2021-09-16T12:33:20.711412Z"}, "papermill": {"duration": 1.60939, "end_time": "2021-09-16T12:33:20.711553", "exception": false, "start_time": "2021-09-16T12:33:19.102163", 
"status": "completed"}, "tags": []}, "outputs": [{"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:33:19.790904\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}], "source": ["def vis_act_fn(act_fn, ax, x):\n", " # Run activation function\n", " y = act_fn(x)\n", " y_grads = get_grads(act_fn, x)\n", " # Push x, y and gradients back to cpu for plotting\n", " x, y, y_grads = x.cpu().numpy(), y.cpu().numpy(), y_grads.cpu().numpy()\n", " # Plotting\n", " ax.plot(x, y, linewidth=2, label=\"ActFn\")\n", " ax.plot(x, y_grads, linewidth=2, label=\"Gradient\")\n", " ax.set_title(act_fn.name)\n", " ax.legend()\n", " ax.set_ylim(-1.5, x.max())\n", "\n", "\n", "# Add activation functions if wanted\n", "act_fns = [act_fn() for act_fn in act_fn_by_name.values()]\n", "x = torch.linspace(-5, 5, 1000) # Range on which we want to visualize the activation functions\n", "# Plotting\n", "cols = 2\n", "rows = math.ceil(len(act_fns) / float(cols))\n", "fig, ax = plt.subplots(rows, cols, figsize=(cols * 4, rows * 4))\n", "for i, act_fn in enumerate(act_fns):\n", " vis_act_fn(act_fn, ax[divmod(i, cols)], x)\n", "fig.subplots_adjust(hspace=0.3)\n", "plt.show()"]}, {"cell_type": "markdown", "id": "350e27aa", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.027663, "end_time": "2021-09-16T12:33:20.771273", "exception": false, "start_time": "2021-09-16T12:33:20.743610", "status": "completed"}, "tags": []}, "source": ["## Analysing the effect of activation functions\n", "
"]}, {"cell_type": "markdown", "id": "683c2c7d", "metadata": {"papermill": {"duration": 0.027646, "end_time": "2021-09-16T12:33:20.826418", "exception": false, "start_time": "2021-09-16T12:33:20.798772", "status": "completed"}, "tags": []}, "source": ["After implementing and visualizing the activation functions, we are aiming to gain insights into their effect.\n", "We do this by using a simple neural network trained on\n", "[FashionMNIST](https://github.com/zalandoresearch/fashion-mnist) and\n", "examine various aspects of the model, including the performance and\n", "gradient flow."]}, {"cell_type": "markdown", "id": "84e11974", "metadata": {"papermill": {"duration": 0.027431, "end_time": "2021-09-16T12:33:20.881415", "exception": false, "start_time": "2021-09-16T12:33:20.853984", "status": "completed"}, "tags": []}, "source": ["### Setup"]}, {"cell_type": "markdown", "id": "cf662ea5", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.027344, "end_time": "2021-09-16T12:33:20.936216", "exception": false, "start_time": "2021-09-16T12:33:20.908872", "status": "completed"}, "tags": []}, "source": ["Firstly, let's set up a neural network.\n", "The chosen network views the images as 1D tensors and pushes them through a sequence of linear layers and a specified activation function.\n", "Feel free to experiment with other network architectures."]}, {"cell_type": "code", "execution_count": 11, "id": "517f9479", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:33:20.997665Z", "iopub.status.busy": "2021-09-16T12:33:20.997195Z", "iopub.status.idle": "2021-09-16T12:33:20.999429Z", "shell.execute_reply": "2021-09-16T12:33:20.998822Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 0.035645, "end_time": "2021-09-16T12:33:20.999530", "exception": false, "start_time": "2021-09-16T12:33:20.963885", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class BaseNetwork(nn.Module):\n", " def __init__(self, act_fn, input_size=784, 
num_classes=10, hidden_sizes=[512, 256, 256, 128]):\n", " \"\"\"\n", " Args:\n", " act_fn: Object of the activation function that should be used as non-linearity in the network.\n", " input_size: Size of the input images in pixels\n", " num_classes: Number of classes we want to predict\n", " hidden_sizes: A list of integers specifying the hidden layer sizes in the NN\n", " \"\"\"\n", " super().__init__()\n", "\n", " # Create the network based on the specified hidden sizes\n", " layers = []\n", " layer_sizes = [input_size] + hidden_sizes\n", " layer_size_last = layer_sizes[0]\n", " for layer_size in layer_sizes[1:]:\n", " layers += [nn.Linear(layer_size_last, layer_size), act_fn]\n", " layer_size_last = layer_size\n", " layers += [nn.Linear(layer_sizes[-1], num_classes)]\n", " # nn.Sequential summarizes a list of modules into a single module, applying them in sequence\n", " self.layers = nn.Sequential(*layers)\n", "\n", " # We store all hyperparameters in a dictionary for saving and loading of the model\n", " self.config = {\n", " \"act_fn\": act_fn.config,\n", " \"input_size\": input_size,\n", " \"num_classes\": num_classes,\n", " \"hidden_sizes\": hidden_sizes,\n", " }\n", "\n", " def forward(self, x):\n", " x = x.view(x.size(0), -1) # Reshape images to a flat vector\n", " out = self.layers(x)\n", " return out"]}, {"cell_type": "markdown", "id": "6f191c6f", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.027564, "end_time": "2021-09-16T12:33:21.054674", "exception": false, "start_time": "2021-09-16T12:33:21.027110", "status": "completed"}, "tags": []}, "source": ["We also add functions for loading and saving the model.\n", "The hyperparameters are stored in a configuration file (simple json file):"]}, {"cell_type": "code", "execution_count": 12, "id": "36782eee", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:33:21.117432Z", "iopub.status.busy": "2021-09-16T12:33:21.116957Z", "iopub.status.idle": "2021-09-16T12:33:21.119088Z", 
"shell.execute_reply": "2021-09-16T12:33:21.118695Z"}, "papermill": {"duration": 0.036557, "end_time": "2021-09-16T12:33:21.119184", "exception": false, "start_time": "2021-09-16T12:33:21.082627", "status": "completed"}, "tags": []}, "outputs": [], "source": ["def _get_config_file(model_path, model_name):\n", " # Name of the file for storing hyperparameter details\n", " return os.path.join(model_path, model_name + \".config\")\n", "\n", "\n", "def _get_model_file(model_path, model_name):\n", " # Name of the file for storing network parameters\n", " return os.path.join(model_path, model_name + \".tar\")\n", "\n", "\n", "def load_model(model_path, model_name, net=None):\n", " \"\"\"Loads a saved model from disk.\n", "\n", " Args:\n", " model_path: Path of the checkpoint directory\n", " model_name: Name of the model (str)\n", " net: (Optional) If given, the state dict is loaded into this model. Otherwise, a new model is created.\n", " \"\"\"\n", " config_file, model_file = _get_config_file(model_path, model_name), _get_model_file(model_path, model_name)\n", " assert os.path.isfile(\n", " config_file\n", " ), f'Could not find the config file \"{config_file}\". Are you sure this is the correct path and you have your model config stored here?'\n", " assert os.path.isfile(\n", " model_file\n", " ), f'Could not find the model file \"{model_file}\". 
Are you sure this is the correct path and you have your model stored here?'\n", " with open(config_file) as f:\n", " config_dict = json.load(f)\n", " if net is None:\n", " act_fn_name = config_dict[\"act_fn\"].pop(\"name\").lower()\n", " act_fn = act_fn_by_name[act_fn_name](**config_dict.pop(\"act_fn\"))\n", " net = BaseNetwork(act_fn=act_fn, **config_dict)\n", " net.load_state_dict(torch.load(model_file, map_location=device))\n", " return net\n", "\n", "\n", "def save_model(model, model_path, model_name):\n", " \"\"\"Given a model, we save the state_dict and hyperparameters.\n", "\n", " Args:\n", " model: Network object to save parameters from\n", " model_path: Path of the checkpoint directory\n", " model_name: Name of the model (str)\n", " \"\"\"\n", " config_dict = model.config\n", " os.makedirs(model_path, exist_ok=True)\n", " config_file, model_file = _get_config_file(model_path, model_name), _get_model_file(model_path, model_name)\n", " with open(config_file, \"w\") as f:\n", " json.dump(config_dict, f)\n", " torch.save(model.state_dict(), model_file)"]}, {"cell_type": "markdown", "id": "b2ca0082", "metadata": {"papermill": {"duration": 0.027629, "end_time": "2021-09-16T12:33:21.174646", "exception": false, "start_time": "2021-09-16T12:33:21.147017", "status": "completed"}, "tags": []}, "source": ["We also set up the dataset we want to train it on, namely [FashionMNIST](https://github.com/zalandoresearch/fashion-mnist).\n", "FashionMNIST is a more complex version of MNIST and contains black-and-white images of clothes instead of digits.\n", "The 10 classes include trousers, coats, shoes, bags and more.\n", "To load this dataset, we will make use of yet another PyTorch package, namely `torchvision` ([documentation](https://pytorch.org/vision/stable/index.html)).\n", "The `torchvision` package consists of popular datasets, model architectures, and common image transformations for computer vision.\n", "We will use the package for many of the notebooks in this 
course to simplify our dataset handling.\n", "\n", "Let's load the dataset below, and visualize a few images to get an impression of the data."]}, {"cell_type": "code", "execution_count": 13, "id": "d28b09ac", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:33:21.234912Z", "iopub.status.busy": "2021-09-16T12:33:21.234444Z", "iopub.status.idle": "2021-09-16T12:33:25.742469Z", "shell.execute_reply": "2021-09-16T12:33:25.741983Z"}, "papermill": {"duration": 4.539991, "end_time": "2021-09-16T12:33:25.742582", "exception": false, "start_time": "2021-09-16T12:33:21.202591", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to /__w/2/s/.datasets/FashionMNIST/raw/train-images-idx3-ubyte.gz\n"]}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "783d0fee8e0b4746ad687e2606ab92b1", "version_major": 2, "version_minor": 0}, "text/plain": [" 0%| | 0/26421880 [00:00 first make them a tensor, then normalize them in the range -1 to 1\n", "transform = transforms.Compose([transforms.ToTensor(), transforms.Normalize((0.5,), (0.5,))])\n", "\n", "# Loading the training dataset. 
We need to split it into a training and validation part\n", "train_dataset = FashionMNIST(root=DATASET_PATH, train=True, transform=transform, download=True)\n", "train_set, val_set = torch.utils.data.random_split(train_dataset, [50000, 10000])\n", "\n", "# Loading the test set\n", "test_set = FashionMNIST(root=DATASET_PATH, train=False, transform=transform, download=True)"]}, {"cell_type": "markdown", "id": "22d8c0df", "metadata": {"papermill": {"duration": 0.031277, "end_time": "2021-09-16T12:33:25.805768", "exception": false, "start_time": "2021-09-16T12:33:25.774491", "status": "completed"}, "tags": []}, "source": ["We define a set of data loaders that we can use for various purposes later.\n", "Note that for actually training a model, we will use different data loaders\n", "with a lower batch size."]}, {"cell_type": "code", "execution_count": 14, "id": "079a68d3", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:33:25.874180Z", "iopub.status.busy": "2021-09-16T12:33:25.873691Z", "iopub.status.idle": "2021-09-16T12:33:25.875574Z", "shell.execute_reply": "2021-09-16T12:33:25.875949Z"}, "papermill": {"duration": 0.036986, "end_time": "2021-09-16T12:33:25.876059", "exception": false, "start_time": "2021-09-16T12:33:25.839073", "status": "completed"}, "tags": []}, "outputs": [], "source": ["train_loader = data.DataLoader(train_set, batch_size=1024, shuffle=True, drop_last=False)\n", "val_loader = data.DataLoader(val_set, batch_size=1024, shuffle=False, drop_last=False)\n", "test_loader = data.DataLoader(test_set, batch_size=1024, shuffle=False, drop_last=False)"]}, {"cell_type": "code", "execution_count": 15, "id": "09ec856b", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:33:25.943298Z", "iopub.status.busy": "2021-09-16T12:33:25.942829Z", "iopub.status.idle": "2021-09-16T12:33:26.149461Z", "shell.execute_reply": "2021-09-16T12:33:26.148976Z"}, "papermill": {"duration": 0.241991, "end_time": "2021-09-16T12:33:26.149573", 
"exception": false, "start_time": "2021-09-16T12:33:25.907582", "status": "completed"}, "tags": []}, "outputs": [{"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:33:26.023661\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}], "source": ["exmp_imgs = [train_set[i][0] for i in range(16)]\n", "# Organize the images into a grid for nicer visualization\n", "img_grid = torchvision.utils.make_grid(torch.stack(exmp_imgs, dim=0), nrow=4, normalize=True, pad_value=0.5)\n", "img_grid = img_grid.permute(1, 2, 0)\n", "\n", "plt.figure(figsize=(8, 8))\n", "plt.title(\"FashionMNIST examples\")\n", "plt.imshow(img_grid)\n", "plt.axis(\"off\")\n", "plt.show()\n", "plt.close()"]}, {"cell_type": "markdown", "id": "23a0bd21", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.032861, "end_time": "2021-09-16T12:33:26.216246", "exception": false, "start_time": "2021-09-16T12:33:26.183385", "status": "completed"}, "tags": []}, "source": ["### Visualizing the gradient flow after initialization\n", "\n", "As mentioned previously, one important aspect of activation functions is how they propagate gradients through the network.\n", "Imagine we have a very deep neural network with more than 50 layers.\n", "The gradients for the input layer, i.e. 
the very first layer, have passed through the activation function more than 50 times, but we still want them to be of a reasonable size.\n", "If the gradient through the activation function is (in expectation) considerably smaller than 1, our gradients will have vanished by the time they reach the input layer.\n", "If the gradient through the activation function is larger than 1, the gradients exponentially increase and might explode.\n", "\n", "To get a feeling of how every activation function influences the\n", "gradients, we can look at a freshly initialized network and measure the\n", "gradients for each parameter for a batch of 256 images:"]}, {"cell_type": "code", "execution_count": 16, "id": "d0313697", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:33:26.290315Z", "iopub.status.busy": "2021-09-16T12:33:26.289838Z", "iopub.status.idle": "2021-09-16T12:33:26.291904Z", "shell.execute_reply": "2021-09-16T12:33:26.291439Z"}, "papermill": {"duration": 0.043006, "end_time": "2021-09-16T12:33:26.292005", "exception": false, "start_time": "2021-09-16T12:33:26.248999", "status": "completed"}, "tags": []}, "outputs": [], "source": ["def visualize_gradients(net, color=\"C0\"):\n", " \"\"\"\n", " Args:\n", " net: Object of class BaseNetwork\n", " color: Color in which we want to visualize the histogram (for easier separation of activation functions)\n", " \"\"\"\n", " net.eval()\n", " small_loader = data.DataLoader(train_set, batch_size=256, shuffle=False)\n", " imgs, labels = next(iter(small_loader))\n", " imgs, labels = imgs.to(device), labels.to(device)\n", "\n", " # Pass one batch through the network, and calculate the gradients for the weights\n", " net.zero_grad()\n", " preds = net(imgs)\n", " loss = F.cross_entropy(preds, labels)\n", " loss.backward()\n", " # We limit our visualization to the weight parameters and exclude the bias to reduce the number of plots\n", " grads = {\n", " name: params.grad.data.view(-1).cpu().clone().numpy()\n", " for name, params in 
net.named_parameters()\n", " if \"weight\" in name\n", " }\n", " net.zero_grad()\n", "\n", " # Plotting\n", " columns = len(grads)\n", " fig, ax = plt.subplots(1, columns, figsize=(columns * 3.5, 2.5))\n", " fig_index = 0\n", " for key in grads:\n", " key_ax = ax[fig_index % columns]\n", " sns.histplot(data=grads[key], bins=30, ax=key_ax, color=color, kde=True)\n", " key_ax.set_title(str(key))\n", " key_ax.set_xlabel(\"Grad magnitude\")\n", " fig_index += 1\n", " fig.suptitle(\n", " f\"Gradient magnitude distribution for activation function {net.config['act_fn']['name']}\", fontsize=14, y=1.05\n", " )\n", " fig.subplots_adjust(wspace=0.45)\n", " plt.show()\n", " plt.close()"]}, {"cell_type": "code", "execution_count": 17, "id": "41a44b36", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:33:26.364210Z", "iopub.status.busy": "2021-09-16T12:33:26.363743Z", "iopub.status.idle": "2021-09-16T12:33:55.550270Z", "shell.execute_reply": "2021-09-16T12:33:55.550658Z"}, "papermill": {"duration": 29.22383, "end_time": "2021-09-16T12:33:55.550789", "exception": false, "start_time": "2021-09-16T12:33:26.326959", "status": "completed"}, "tags": []}, "outputs": [{"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:33:32.587230\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:33:37.105241\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:33:41.454585\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:33:45.830177\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:33:50.374176\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:33:54.684961\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}], "source": ["# Seaborn prints warnings if histogram has small values. We can ignore them for now\n", "warnings.filterwarnings(\"ignore\")\n", "# Create a plot for every activation function\n", "for i, act_fn_name in enumerate(act_fn_by_name):\n", " # Setting the seed ensures that we have the same weight initialization for each activation function\n", " set_seed(42)\n", " act_fn = act_fn_by_name[act_fn_name]()\n", " net_actfn = BaseNetwork(act_fn=act_fn).to(device)\n", " visualize_gradients(net_actfn, color=f\"C{i}\")"]}, {"cell_type": "markdown", "id": "f73b5f3f", "metadata": {"papermill": {"duration": 0.062002, "end_time": "2021-09-16T12:33:55.677984", "exception": false, "start_time": "2021-09-16T12:33:55.615982", "status": "completed"}, "tags": []}, "source": ["The sigmoid activation function shows a clearly undesirable behavior.\n", "While the gradients for the output layer are very large with up to 0.1, the input layer has the lowest gradient norm across all activation functions with only 1e-5.\n", "This is due to its small maximum gradient of 1/4, and finding a suitable learning rate across all layers is not possible in this setup.\n", "All the other activation functions show to have similar gradient norms across all layers.\n", "Interestingly, the ReLU activation has a spike around 0 which is caused by its zero-part on the left, and dead neurons (we will take a closer look at this later on).\n", "\n", "Note that additionally to the activation, the initialization of the weight parameters can be crucial.\n", "By default, PyTorch uses the [Kaiming](https://pytorch.org/docs/stable/nn.init.html#torch.nn.init.kaiming_uniform_) initialization for linear layers optimized for Tanh activations.\n", "In Tutorial 4, we will take a closer look at initialization, but assume\n", "for now that the Kaiming initialization works for all activation\n", "functions reasonably well."]}, {"cell_type": "markdown", "id": 
"b6081434", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.061601, "end_time": "2021-09-16T12:33:55.800993", "exception": false, "start_time": "2021-09-16T12:33:55.739392", "status": "completed"}, "tags": []}, "source": ["### Training a model\n", "\n", "Next, we want to train our model with different activation functions on FashionMNIST and compare the gained performance.\n", "All in all, our final goal is to achieve the best possible performance on a dataset of our choice.\n", "Therefore, we write a training loop in the next cell including a\n", "validation after every epoch and a final test on the best model:"]}, {"cell_type": "code", "execution_count": 18, "id": "827e3645", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:33:55.937494Z", "iopub.status.busy": "2021-09-16T12:33:55.936999Z", "iopub.status.idle": "2021-09-16T12:33:55.939074Z", "shell.execute_reply": "2021-09-16T12:33:55.938676Z"}, "papermill": {"duration": 0.07601, "end_time": "2021-09-16T12:33:55.939174", "exception": false, "start_time": "2021-09-16T12:33:55.863164", "status": "completed"}, "tags": []}, "outputs": [], "source": ["def train_model(net, model_name, max_epochs=50, patience=7, batch_size=256, overwrite=False):\n", " \"\"\"Train a model on the training set of FashionMNIST.\n", "\n", " Args:\n", " net: Object of BaseNetwork\n", " model_name: (str) Name of the model, used for creating the checkpoint names\n", " max_epochs: Number of epochs we want to (maximally) train for\n", " patience: If the performance on the validation set has not improved for #patience epochs, we stop training early\n", " batch_size: Size of batches used in training\n", " overwrite: Determines how to handle the case when there already exists a checkpoint. If True, it will be overwritten. 
Otherwise, we skip training.\n", " \"\"\"\n", " file_exists = os.path.isfile(_get_model_file(CHECKPOINT_PATH, model_name))\n", " if file_exists and not overwrite:\n", " print(\"Model file already exists. Skipping training...\")\n", " else:\n", " if file_exists:\n", " print(\"Model file exists, but will be overwritten...\")\n", "\n", " # Defining optimizer, loss and data loader\n", " optimizer = optim.SGD(net.parameters(), lr=1e-2, momentum=0.9) # Default parameters, feel free to change\n", " loss_module = nn.CrossEntropyLoss()\n", " train_loader_local = data.DataLoader(\n", " train_set, batch_size=batch_size, shuffle=True, drop_last=True, pin_memory=True\n", " )\n", "\n", " val_scores = []\n", " best_val_epoch = -1\n", " for epoch in range(max_epochs):\n", " ############\n", " # Training #\n", " ############\n", " net.train()\n", " true_preds, count = 0.0, 0\n", " for imgs, labels in tqdm(train_loader_local, desc=f\"Epoch {epoch+1}\", leave=False):\n", " imgs, labels = imgs.to(device), labels.to(device) # To GPU\n", " optimizer.zero_grad() # Zero-grad can be placed anywhere before \"loss.backward()\"\n", " preds = net(imgs)\n", " loss = loss_module(preds, labels)\n", " loss.backward()\n", " optimizer.step()\n", " # Record statistics during training\n", " true_preds += (preds.argmax(dim=-1) == labels).sum()\n", " count += labels.shape[0]\n", " train_acc = true_preds / count\n", "\n", " ##############\n", " # Validation #\n", " ##############\n", " val_acc = test_model(net, val_loader)\n", " val_scores.append(val_acc)\n", " print(\n", " f\"[Epoch {epoch+1:2d}] Training accuracy: {train_acc*100.0:05.2f}%, Validation accuracy: {val_acc*100.0:05.2f}%\"\n", " )\n", "\n", " if len(val_scores) == 1 or val_acc > val_scores[best_val_epoch]:\n", " print(\"\\t (New best performance, saving model...)\")\n", " save_model(net, CHECKPOINT_PATH, model_name)\n", " best_val_epoch = epoch\n", " elif best_val_epoch <= epoch - patience:\n", " print(f\"Early stopping due to no 
improvement over the last {patience} epochs\")\n", " break\n", "\n", " # Plot a curve of the validation accuracy\n", " plt.plot([i for i in range(1, len(val_scores) + 1)], val_scores)\n", " plt.xlabel(\"Epochs\")\n", " plt.ylabel(\"Validation accuracy\")\n", " plt.title(f\"Validation performance of {model_name}\")\n", " plt.show()\n", " plt.close()\n", "\n", " load_model(CHECKPOINT_PATH, model_name, net=net)\n", " test_acc = test_model(net, test_loader)\n", " print((f\" Test accuracy: {test_acc*100.0:4.2f}% \").center(50, \"=\") + \"\\n\")\n", " return test_acc\n", "\n", "\n", "def test_model(net, data_loader):\n", " \"\"\"Test a model on a specified dataset.\n", "\n", " Args:\n", " net: Trained model of type BaseNetwork\n", " data_loader: DataLoader object of the dataset to test on (validation or test)\n", " \"\"\"\n", " net.eval()\n", " true_preds, count = 0.0, 0\n", " for imgs, labels in data_loader:\n", " imgs, labels = imgs.to(device), labels.to(device)\n", " with torch.no_grad():\n", " preds = net(imgs).argmax(dim=-1)\n", " true_preds += (preds == labels).sum().item()\n", " count += labels.shape[0]\n", " test_acc = true_preds / count\n", " return test_acc"]}, {"cell_type": "markdown", "id": "685326ae", "metadata": {"papermill": {"duration": 0.06232, "end_time": "2021-09-16T12:33:56.062996", "exception": false, "start_time": "2021-09-16T12:33:56.000676", "status": "completed"}, "tags": []}, "source": ["We train one model for each activation function.\n", "We recommend using the pretrained models to save time if you are running this notebook on CPU."]}, {"cell_type": "code", "execution_count": 19, "id": "1a2237a5", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:33:56.192395Z", "iopub.status.busy": "2021-09-16T12:33:56.191926Z", "iopub.status.idle": "2021-09-16T12:34:06.194481Z", "shell.execute_reply": "2021-09-16T12:34:06.193995Z"}, "papermill": {"duration": 10.068153, "end_time": "2021-09-16T12:34:06.194591", "exception": false, "start_time": 
"2021-09-16T12:33:56.126438", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Training BaseNetwork with sigmoid activation...\n", "Model file already exists. Skipping training...\n"]}, {"name": "stdout", "output_type": "stream", "text": ["============= Test accuracy: 10.00% ==============\n", "\n", "Training BaseNetwork with tanh activation...\n", "Model file already exists. Skipping training...\n"]}, {"name": "stdout", "output_type": "stream", "text": ["============= Test accuracy: 87.59% ==============\n", "\n", "Training BaseNetwork with relu activation...\n", "Model file already exists. Skipping training...\n"]}, {"name": "stdout", "output_type": "stream", "text": ["============= Test accuracy: 88.62% ==============\n", "\n", "Training BaseNetwork with leakyrelu activation...\n", "Model file already exists. Skipping training...\n"]}, {"name": "stdout", "output_type": "stream", "text": ["============= Test accuracy: 88.92% ==============\n", "\n", "Training BaseNetwork with elu activation...\n", "Model file already exists. Skipping training...\n"]}, {"name": "stdout", "output_type": "stream", "text": ["============= Test accuracy: 87.27% ==============\n", "\n", "Training BaseNetwork with swish activation...\n", "Model file already exists. 
Skipping training...\n"]}, {"name": "stdout", "output_type": "stream", "text": ["============= Test accuracy: 88.73% ==============\n", "\n"]}], "source": ["for act_fn_name in act_fn_by_name:\n", " print(f\"Training BaseNetwork with {act_fn_name} activation...\")\n", " set_seed(42)\n", " act_fn = act_fn_by_name[act_fn_name]()\n", " net_actfn = BaseNetwork(act_fn=act_fn).to(device)\n", " train_model(net_actfn, f\"FashionMNIST_{act_fn_name}\", overwrite=False)"]}, {"cell_type": "markdown", "id": "34dd5b86", "metadata": {"papermill": {"duration": 0.062788, "end_time": "2021-09-16T12:34:06.322278", "exception": false, "start_time": "2021-09-16T12:34:06.259490", "status": "completed"}, "tags": []}, "source": ["Not surprisingly, the model using the sigmoid activation function fails and does not improve upon random performance (10 classes => 1/10 for random chance).\n", "\n", "All the other activation functions achieve similar performance.\n", "To have a more accurate conclusion, we would have to train the models for multiple seeds and look at the averages.\n", "However, the \"optimal\" activation function also depends on many other factors (hidden sizes, number of layers, type of layers, task, dataset, optimizer, learning rate, etc.)\n", "so that a thorough grid search would not be useful in our case.\n", "In the literature, activation functions that have been shown to work well\n", "with deep networks are all types of ReLU functions we experiment with\n", "here, with small gains for specific activation functions in specific\n", "networks."]}, {"cell_type": "markdown", "id": "5a74d87d", "metadata": {"papermill": {"duration": 0.063695, "end_time": "2021-09-16T12:34:06.449135", "exception": false, "start_time": "2021-09-16T12:34:06.385440", "status": "completed"}, "tags": []}, "source": ["### Visualizing the activation distribution"]}, {"cell_type": "markdown", "id": "68596e03", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.062527, "end_time": 
"2021-09-16T12:34:06.574529", "exception": false, "start_time": "2021-09-16T12:34:06.512002", "status": "completed"}, "tags": []}, "source": ["After we have trained the models, we can look at the actual activation values that find inside the model.\n", "For instance, how many neurons are set to zero in ReLU?\n", "Where do we find most values in Tanh?\n", "To answer these questions, we can write a simple function which takes a\n", "trained model, applies it to a batch of images, and plots the histogram\n", "of the activations inside the network:"]}, {"cell_type": "code", "execution_count": 20, "id": "24bf9b21", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:34:06.708975Z", "iopub.status.busy": "2021-09-16T12:34:06.708490Z", "iopub.status.idle": "2021-09-16T12:34:06.710629Z", "shell.execute_reply": "2021-09-16T12:34:06.710158Z"}, "papermill": {"duration": 0.073035, "end_time": "2021-09-16T12:34:06.710735", "exception": false, "start_time": "2021-09-16T12:34:06.637700", "status": "completed"}, "tags": []}, "outputs": [], "source": ["def visualize_activations(net, color=\"C0\"):\n", " activations = {}\n", "\n", " net.eval()\n", " small_loader = data.DataLoader(train_set, batch_size=1024)\n", " imgs, labels = next(iter(small_loader))\n", " with torch.no_grad():\n", " layer_index = 0\n", " imgs = imgs.to(device)\n", " imgs = imgs.view(imgs.size(0), -1)\n", " # We need to manually loop through the layers to save all activations\n", " for layer_index, layer in enumerate(net.layers[:-1]):\n", " imgs = layer(imgs)\n", " activations[layer_index] = imgs.view(-1).cpu().numpy()\n", "\n", " # Plotting\n", " columns = 4\n", " rows = math.ceil(len(activations) / columns)\n", " fig, ax = plt.subplots(rows, columns, figsize=(columns * 2.7, rows * 2.5))\n", " fig_index = 0\n", " for key in activations:\n", " key_ax = ax[fig_index // columns][fig_index % columns]\n", " sns.histplot(data=activations[key], bins=50, ax=key_ax, color=color, kde=True, stat=\"density\")\n", 
" key_ax.set_title(f\"Layer {key} - {net.layers[key].__class__.__name__}\")\n", " fig_index += 1\n", " fig.suptitle(f\"Activation distribution for activation function {net.config['act_fn']['name']}\", fontsize=14)\n", " fig.subplots_adjust(hspace=0.4, wspace=0.4)\n", " plt.show()\n", " plt.close()"]}, {"cell_type": "code", "execution_count": 21, "id": "d8f346ab", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:34:06.842909Z", "iopub.status.busy": "2021-09-16T12:34:06.842437Z", "iopub.status.idle": "2021-09-16T12:35:27.581742Z", "shell.execute_reply": "2021-09-16T12:35:27.582143Z"}, "papermill": {"duration": 80.807, "end_time": "2021-09-16T12:35:27.582289", "exception": false, "start_time": "2021-09-16T12:34:06.775289", "status": "completed"}, "tags": []}, "outputs": [{"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:34:19.777697\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:34:33.923518\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:34:46.777369\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:34:59.806501\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:35:13.285964\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:35:25.997012\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}], "source": ["for i, act_fn_name in enumerate(act_fn_by_name):\n", " net_actfn = load_model(model_path=CHECKPOINT_PATH, model_name=f\"FashionMNIST_{act_fn_name}\").to(device)\n", " visualize_activations(net_actfn, color=f\"C{i}\")"]}, {"cell_type": "markdown", "id": "1a945558", "metadata": {"papermill": {"duration": 0.111895, "end_time": "2021-09-16T12:35:27.806164", "exception": false, "start_time": "2021-09-16T12:35:27.694269", "status": "completed"}, "tags": []}, "source": ["As the model with sigmoid activation was not able to train properly, the activations are also less informative and all gathered around 0.5 (the activation at input 0).\n", "\n", "The tanh shows a more diverse behavior.\n", "While for the input layer we experience a larger amount of neurons to be close to -1 and 1, where the gradients are close to zero, the activations in the two consecutive layers are closer to zero.\n", "This is probably because the input layers look for specific features in the input image, and the consecutive layers combine those together.\n", "The activations for the last layer are again more biased to the extreme points because the classification layer can be seen as a weighted average of those values (the gradients push the activations to those extremes).\n", "\n", "The ReLU has a strong peak at 0, as we initially expected.\n", "The effect of having no gradients for negative values is that the network does not have a Gaussian-like distribution after the linear layers, but a longer tail towards the positive values.\n", "The LeakyReLU shows a very similar behavior while ELU follows again a more Gaussian-like distribution.\n", "The Swish activation seems to lie in between, although it is worth noting that Swish uses significantly higher values than other activation functions (up to 20).\n", "\n", "As all activation functions show slightly different behavior although\n", "obtaining similar performance for our simple 
network, it becomes\n", "apparent that the selection of the \"optimal\" activation function really\n", "depends on many factors, and is not the same for all possible networks."]}, {"cell_type": "markdown", "id": "57bfc158", "metadata": {"papermill": {"duration": 0.110593, "end_time": "2021-09-16T12:35:28.026614", "exception": false, "start_time": "2021-09-16T12:35:27.916021", "status": "completed"}, "tags": []}, "source": ["### Finding dead neurons in ReLU networks"]}, {"cell_type": "markdown", "id": "3dbcab2c", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.114666, "end_time": "2021-09-16T12:35:28.251636", "exception": false, "start_time": "2021-09-16T12:35:28.136970", "status": "completed"}, "tags": []}, "source": ["One known drawback of the ReLU activation is the occurrence of \"dead neurons\", i.e. neurons with no gradient for any training input.\n", "The issue of dead neurons is that as no gradient is provided for the layer, we cannot train the parameters of this neuron in the previous layer to obtain output values besides zero.\n", "For dead neurons to happen, the output value of a specific neuron of the linear layer before the ReLU has to be negative for all input images.\n", "Considering the large number of neurons we have in a neural network, it is not unlikely for this to happen.\n", "\n", "To get a better understanding of how much of a problem this is, and when we need to be careful, we will measure how many dead neurons different networks have.\n", "For this, we implement a function which runs the network on the whole\n", "training set and records whether a neuron is exactly 0 for all data\n", "points or not:"]}, {"cell_type": "code", "execution_count": 22, "id": "edc02b80", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:35:28.479594Z", "iopub.status.busy": "2021-09-16T12:35:28.479110Z", "iopub.status.idle": "2021-09-16T12:35:28.481273Z", "shell.execute_reply": "2021-09-16T12:35:28.481901Z"}, "papermill": 
{"duration": 0.119951, "end_time": "2021-09-16T12:35:28.482036", "exception": false, "start_time": "2021-09-16T12:35:28.362085", "status": "completed"}, "tags": []}, "outputs": [], "source": ["@torch.no_grad()\n", "def measure_number_dead_neurons(net):\n", " \"\"\"Function to measure the number of dead neurons in a trained neural network.\n", "\n", " For each neuron, we create a boolean variable initially set to 1. If it has an activation unequals 0 at any time, we\n", " set this variable to 0. After running through the whole training set, only dead neurons will have a 1.\n", " \"\"\"\n", " neurons_dead = [\n", " torch.ones(layer.weight.shape[0], device=device, dtype=torch.bool)\n", " for layer in net.layers[:-1]\n", " if isinstance(layer, nn.Linear)\n", " ] # Same shapes as hidden size in BaseNetwork\n", "\n", " net.eval()\n", " for imgs, labels in tqdm(train_loader, leave=False): # Run through whole training set\n", " layer_index = 0\n", " imgs = imgs.to(device)\n", " imgs = imgs.view(imgs.size(0), -1)\n", " for layer in net.layers[:-1]:\n", " imgs = layer(imgs)\n", " if isinstance(layer, ActivationFunction):\n", " # Are all activations == 0 in the batch, and we did not record the opposite in the last batches?\n", " neurons_dead[layer_index] = torch.logical_and(neurons_dead[layer_index], (imgs == 0).all(dim=0))\n", " layer_index += 1\n", " number_neurons_dead = [t.sum().item() for t in neurons_dead]\n", " print(\"Number of dead neurons:\", number_neurons_dead)\n", " print(\n", " \"In percentage:\",\n", " \", \".join(\n", " [f\"{(100.0 * num_dead / tens.shape[0]):4.2f}%\" for tens, num_dead in zip(neurons_dead, number_neurons_dead)]\n", " ),\n", " )"]}, {"cell_type": "markdown", "id": "39be5f1b", "metadata": {"papermill": {"duration": 0.109828, "end_time": "2021-09-16T12:35:28.702763", "exception": false, "start_time": "2021-09-16T12:35:28.592935", "status": "completed"}, "tags": []}, "source": ["First, we can measure the number of dead neurons for an untrained 
network:"]}, {"cell_type": "code", "execution_count": 23, "id": "1f83d14a", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:35:28.929900Z", "iopub.status.busy": "2021-09-16T12:35:28.929410Z", "iopub.status.idle": "2021-09-16T12:35:37.256636Z", "shell.execute_reply": "2021-09-16T12:35:37.256221Z"}, "papermill": {"duration": 8.441781, "end_time": "2021-09-16T12:35:37.256748", "exception": false, "start_time": "2021-09-16T12:35:28.814967", "status": "completed"}, "tags": []}, "outputs": [{"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "4f3bb9c6b5c64d568faac8e14240eab4", "version_major": 2, "version_minor": 0}, "text/plain": [" 0%| | 0/49 [00:00=0.3\" \"torchvision\" \"pytorch-lightning>=1.3\" \"torch>=1.6, <1.9\" \"matplotlib\""]}, {"cell_type": "markdown", "id": "6502723b", "metadata": {"papermill": {"duration": 0.116681, "end_time": "2021-12-04T15:54:35.117128", "exception": false, "start_time": "2021-12-04T15:54:35.000447", "status": "completed"}, "tags": []}, "source": ["
\n", "In the first half of the notebook, we will review different initialization techniques, and go step by step from the simplest initialization to methods that are nowadays used in very deep networks.\n", "In the second half, we focus on optimization comparing the optimizers SGD, SGD with Momentum, and Adam.\n", "\n", "Let's start with importing our standard libraries:"]}, {"cell_type": "code", "execution_count": 2, "id": "7b848761", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:54:35.354836Z", "iopub.status.busy": "2021-12-04T15:54:35.354335Z", "iopub.status.idle": "2021-12-04T15:54:37.277810Z", "shell.execute_reply": "2021-12-04T15:54:37.278195Z"}, "papermill": {"duration": 2.046832, "end_time": "2021-12-04T15:54:37.278357", "exception": false, "start_time": "2021-12-04T15:54:35.231525", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["/tmp/ipykernel_875/1682095326.py:24: DeprecationWarning: `set_matplotlib_formats` is deprecated since IPython 7.23, directly use `matplotlib_inline.backend_inline.set_matplotlib_formats()`\n", " set_matplotlib_formats(\"svg\", \"pdf\") # For export\n"]}], "source": ["import copy\n", "import json\n", "import math\n", "import os\n", "import urllib.request\n", "from urllib.error import HTTPError\n", "\n", "import matplotlib.pyplot as plt\n", "import numpy as np\n", "import pytorch_lightning as pl\n", "import seaborn as sns\n", "import torch\n", "import torch.nn as nn\n", "import torch.nn.functional as F\n", "import torch.utils.data as data\n", "\n", "%matplotlib inline\n", "from IPython.display import set_matplotlib_formats\n", "from matplotlib import cm\n", "from torchvision import transforms\n", "from torchvision.datasets import FashionMNIST\n", "from tqdm.notebook import tqdm\n", "\n", "set_matplotlib_formats(\"svg\", \"pdf\") # For export\n", "sns.set()"]}, {"cell_type": "markdown", "id": "34ff3be8", "metadata": {"papermill": {"duration": 0.117573, 
"end_time": "2021-12-04T15:54:37.513508", "exception": false, "start_time": "2021-12-04T15:54:37.395935", "status": "completed"}, "tags": []}, "source": ["Instead of the `set_seed` function as in Tutorial 3, we can use PyTorch Lightning's build-in function `pl.seed_everything`.\n", "We will reuse the path variables `DATASET_PATH` and `CHECKPOINT_PATH` as in Tutorial 3.\n", "Adjust the paths if necessary."]}, {"cell_type": "code", "execution_count": 3, "id": "35b849b3", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:54:37.749217Z", "iopub.status.busy": "2021-12-04T15:54:37.748745Z", "iopub.status.idle": "2021-12-04T15:54:37.951118Z", "shell.execute_reply": "2021-12-04T15:54:37.951502Z"}, "papermill": {"duration": 0.323033, "end_time": "2021-12-04T15:54:37.951669", "exception": false, "start_time": "2021-12-04T15:54:37.628636", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["Global seed set to 42\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Using device cuda:0\n"]}], "source": ["# Path to the folder where the datasets are/should be downloaded (e.g. 
MNIST)\n", "DATASET_PATH = os.environ.get(\"PATH_DATASETS\", \"data/\")\n", "# Path to the folder where the pretrained models are saved\n", "CHECKPOINT_PATH = os.environ.get(\"PATH_CHECKPOINT\", \"saved_models/InitOptim/\")\n", "\n", "# Seed everything\n", "pl.seed_everything(42)\n", "\n", "# Ensure that all operations are deterministic on GPU (if used) for reproducibility\n", "torch.backends.cudnn.determinstic = True\n", "torch.backends.cudnn.benchmark = False\n", "\n", "# Fetching the device that will be used throughout this notebook\n", "device = torch.device(\"cpu\") if not torch.cuda.is_available() else torch.device(\"cuda:0\")\n", "print(\"Using device\", device)"]}, {"cell_type": "markdown", "id": "94ce8a6e", "metadata": {"papermill": {"duration": 0.116608, "end_time": "2021-12-04T15:54:38.185784", "exception": false, "start_time": "2021-12-04T15:54:38.069176", "status": "completed"}, "tags": []}, "source": ["In the last part of the notebook, we will train models using three different optimizers.\n", "The pretrained models for those are downloaded below."]}, {"cell_type": "code", "execution_count": 4, "id": "8e55f09c", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:54:38.430163Z", "iopub.status.busy": "2021-12-04T15:54:38.429683Z", "iopub.status.idle": "2021-12-04T15:54:39.458838Z", "shell.execute_reply": "2021-12-04T15:54:39.458384Z"}, "papermill": {"duration": 1.155736, "end_time": "2021-12-04T15:54:39.458964", "exception": false, "start_time": "2021-12-04T15:54:38.303228", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Downloading https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial4/FashionMNIST_SGD.config...\n", "Downloading https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial4/FashionMNIST_SGD_results.json...\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Downloading 
https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial4/FashionMNIST_SGD.tar...\n", "Downloading https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial4/FashionMNIST_SGDMom.config...\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Downloading https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial4/FashionMNIST_SGDMom_results.json...\n", "Downloading https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial4/FashionMNIST_SGDMom.tar...\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Downloading https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial4/FashionMNIST_Adam.config...\n", "Downloading https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial4/FashionMNIST_Adam_results.json...\n", "Downloading https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial4/FashionMNIST_Adam.tar...\n"]}], "source": ["# Github URL where saved models are stored for this tutorial\n", "base_url = \"https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial4/\"\n", "# Files to download\n", "pretrained_files = [\n", " \"FashionMNIST_SGD.config\",\n", " \"FashionMNIST_SGD_results.json\",\n", " \"FashionMNIST_SGD.tar\",\n", " \"FashionMNIST_SGDMom.config\",\n", " \"FashionMNIST_SGDMom_results.json\",\n", " \"FashionMNIST_SGDMom.tar\",\n", " \"FashionMNIST_Adam.config\",\n", " \"FashionMNIST_Adam_results.json\",\n", " \"FashionMNIST_Adam.tar\",\n", "]\n", "# Create checkpoint path if it doesn't exist yet\n", "os.makedirs(CHECKPOINT_PATH, exist_ok=True)\n", "\n", "# For each file, check whether it already exists. 
If not, try downloading it.\n", "for file_name in pretrained_files:\n", " file_path = os.path.join(CHECKPOINT_PATH, file_name)\n", " if not os.path.isfile(file_path):\n", " file_url = base_url + file_name\n", " print(f\"Downloading {file_url}...\")\n", " try:\n", " urllib.request.urlretrieve(file_url, file_path)\n", " except HTTPError as e:\n", " print(\n", " \"Something went wrong. Please try to download the file from the GDrive folder, or contact the author with the full output including the following error:\\n\",\n", " e,\n", " )"]}, {"cell_type": "markdown", "id": "30caea5b", "metadata": {"papermill": {"duration": 0.120012, "end_time": "2021-12-04T15:54:39.700194", "exception": false, "start_time": "2021-12-04T15:54:39.580182", "status": "completed"}, "tags": []}, "source": ["## Preparation"]}, {"cell_type": "markdown", "id": "231720c6", "metadata": {"papermill": {"duration": 0.120402, "end_time": "2021-12-04T15:54:39.942112", "exception": false, "start_time": "2021-12-04T15:54:39.821710", "status": "completed"}, "tags": []}, "source": ["Throughout this notebook, we will use a deep fully connected network, similar to our previous tutorial.\n", "We will also again apply the network to FashionMNIST, so you can relate to the results of Tutorial 3.\n", "We start by loading the FashionMNIST dataset:"]}, {"cell_type": "code", "execution_count": 5, "id": "f973c6a6", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:54:40.192819Z", "iopub.status.busy": "2021-12-04T15:54:40.192347Z", "iopub.status.idle": "2021-12-04T15:54:45.087304Z", "shell.execute_reply": "2021-12-04T15:54:45.087688Z"}, "papermill": {"duration": 5.025264, "end_time": "2021-12-04T15:54:45.087853", "exception": false, "start_time": "2021-12-04T15:54:40.062589", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz\n"]}, {"name": "stdout", 
"output_type": "stream", "text": ["Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to /__w/1/s/.datasets/FashionMNIST/raw/train-images-idx3-ubyte.gz\n"]}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "0fdf1596470d464fa9a290533416cb26", "version_major": 2, "version_minor": 0}, "text/plain": [" 0%| | 0/26421880 [00:00 first make them a tensor, then normalize them with mean 0 and std 1\n", "transform = transforms.Compose([transforms.ToTensor(), transforms.Normalize((0.2861,), (0.3530,))])\n", "\n", "# Loading the training dataset. We need to split it into a training and validation part\n", "train_dataset = FashionMNIST(root=DATASET_PATH, train=True, transform=transform, download=True)\n", "train_set, val_set = torch.utils.data.random_split(train_dataset, [50000, 10000])\n", "\n", "# Loading the test set\n", "test_set = FashionMNIST(root=DATASET_PATH, train=False, transform=transform, download=True)"]}, {"cell_type": "markdown", "id": "62d14135", "metadata": {"papermill": {"duration": 0.132716, "end_time": "2021-12-04T15:54:45.352571", "exception": false, "start_time": "2021-12-04T15:54:45.219855", "status": "completed"}, "tags": []}, "source": ["We define a set of data loaders that we can use for various purposes later.\n", "Note that for actually training a model, we will use different data loaders\n", "with a lower batch size."]}, {"cell_type": "code", "execution_count": 6, "id": "3d28e67a", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:54:45.623150Z", "iopub.status.busy": "2021-12-04T15:54:45.622650Z", "iopub.status.idle": "2021-12-04T15:54:45.624735Z", "shell.execute_reply": "2021-12-04T15:54:45.624337Z"}, "papermill": {"duration": 0.139138, "end_time": "2021-12-04T15:54:45.624842", "exception": false, "start_time": "2021-12-04T15:54:45.485704", "status": "completed"}, "tags": []}, "outputs": [], "source": ["train_loader = data.DataLoader(train_set, batch_size=1024, 
shuffle=True, drop_last=False)\n", "val_loader = data.DataLoader(val_set, batch_size=1024, shuffle=False, drop_last=False)\n", "test_loader = data.DataLoader(test_set, batch_size=1024, shuffle=False, drop_last=False)"]}, {"cell_type": "markdown", "id": "b7b214a6", "metadata": {"papermill": {"duration": 0.132224, "end_time": "2021-12-04T15:54:45.888887", "exception": false, "start_time": "2021-12-04T15:54:45.756663", "status": "completed"}, "tags": []}, "source": ["In comparison to the previous tutorial, we have changed the parameters of the normalization transformation `transforms.Normalize`.\n", "The normalization is now designed to give us an expected mean of 0 and a standard deviation of 1 across pixels.\n", "This will be particularly relevant for the discussion about initialization we will look at below, and hence we change it here.\n", "It should be noted that in most classification tasks, both normalization techniques (between -1 and 1 or mean 0 and stddev 1) have been shown to work well.\n", "We can calculate the normalization parameters by determining the mean and standard deviation on the original images:"]}, {"cell_type": "code", "execution_count": 7, "id": "f3c58d88", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:54:46.162358Z", "iopub.status.busy": "2021-12-04T15:54:46.161597Z", "iopub.status.idle": "2021-12-04T15:54:46.309115Z", "shell.execute_reply": "2021-12-04T15:54:46.309503Z"}, "papermill": {"duration": 0.288556, "end_time": "2021-12-04T15:54:46.309671", "exception": false, "start_time": "2021-12-04T15:54:46.021115", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Mean 0.28604060411453247\n", "Std 0.3530242443084717\n"]}], "source": ["print(\"Mean\", (train_dataset.data.float() / 255.0).mean().item())\n", "print(\"Std\", (train_dataset.data.float() / 255.0).std().item())"]}, {"cell_type": "markdown", "id": "205aa3d4", "metadata": {"papermill": {"duration": 0.134209, "end_time": 
"2021-12-04T15:54:46.580091", "exception": false, "start_time": "2021-12-04T15:54:46.445882", "status": "completed"}, "tags": []}, "source": ["We can verify the transformation by looking at the statistics of a single batch:"]}, {"cell_type": "code", "execution_count": 8, "id": "eb1baf45", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:54:46.853983Z", "iopub.status.busy": "2021-12-04T15:54:46.853514Z", "iopub.status.idle": "2021-12-04T15:54:47.034146Z", "shell.execute_reply": "2021-12-04T15:54:47.034531Z"}, "papermill": {"duration": 0.319767, "end_time": "2021-12-04T15:54:47.034711", "exception": false, "start_time": "2021-12-04T15:54:46.714944", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Mean: 0.009\n", "Standard deviation: 1.012\n", "Maximum: 2.022\n", "Minimum: -0.810\n"]}], "source": ["imgs, _ = next(iter(train_loader))\n", "print(f\"Mean: {imgs.mean().item():5.3f}\")\n", "print(f\"Standard deviation: {imgs.std().item():5.3f}\")\n", "print(f\"Maximum: {imgs.max().item():5.3f}\")\n", "print(f\"Minimum: {imgs.min().item():5.3f}\")"]}, {"cell_type": "markdown", "id": "b800ca4a", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.134539, "end_time": "2021-12-04T15:54:47.304930", "exception": false, "start_time": "2021-12-04T15:54:47.170391", "status": "completed"}, "tags": []}, "source": ["Note that the maximum and minimum are not 1 and -1 anymore, but shifted towards the positive values.\n", "This is because FashionMNIST contains a lot of black pixels, similar to MNIST.\n", "\n", "Next, we create a linear neural network. 
We use the same setup as in the previous tutorial."]}, {"cell_type": "code", "execution_count": 9, "id": "eb8177c7", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:54:47.584349Z", "iopub.status.busy": "2021-12-04T15:54:47.583870Z", "iopub.status.idle": "2021-12-04T15:54:47.585900Z", "shell.execute_reply": "2021-12-04T15:54:47.585499Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 0.147005, "end_time": "2021-12-04T15:54:47.586011", "exception": false, "start_time": "2021-12-04T15:54:47.439006", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class BaseNetwork(nn.Module):\n", " def __init__(self, act_fn, input_size=784, num_classes=10, hidden_sizes=[512, 256, 256, 128]):\n", " \"\"\"\n", " Args:\n", " act_fn: Object of the activation function that should be used as non-linearity in the network.\n", " input_size: Size of the input images in pixels\n", " num_classes: Number of classes we want to predict\n", " hidden_sizes: A list of integers specifying the hidden layer sizes in the NN\n", " \"\"\"\n", " super().__init__()\n", "\n", " # Create the network based on the specified hidden sizes\n", " layers = []\n", " layer_sizes = [input_size] + hidden_sizes\n", " for layer_index in range(1, len(layer_sizes)):\n", " layers += [nn.Linear(layer_sizes[layer_index - 1], layer_sizes[layer_index]), act_fn]\n", " layers += [nn.Linear(layer_sizes[-1], num_classes)]\n", " # A module list registers a list of modules as submodules (e.g. 
for parameters)\n", " self.layers = nn.ModuleList(layers)\n", "\n", " self.config = {\n", " \"act_fn\": act_fn.__class__.__name__,\n", " \"input_size\": input_size,\n", " \"num_classes\": num_classes,\n", " \"hidden_sizes\": hidden_sizes,\n", " }\n", "\n", " def forward(self, x):\n", " x = x.view(x.size(0), -1)\n", " for layer in self.layers:\n", " x = layer(x)\n", " return x"]}, {"cell_type": "markdown", "id": "8635213a", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.133716, "end_time": "2021-12-04T15:54:47.853607", "exception": false, "start_time": "2021-12-04T15:54:47.719891", "status": "completed"}, "tags": []}, "source": ["For the activation functions, we make use of PyTorch's `torch.nn` library instead of implementing ourselves.\n", "However, we also define an `Identity` activation function.\n", "Although this activation function would significantly limit the\n", "network's modeling capabilities, we will use it in the first steps of\n", "our discussion about initialization (for simplicity)."]}, {"cell_type": "code", "execution_count": 10, "id": "9f352558", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:54:48.130790Z", "iopub.status.busy": "2021-12-04T15:54:48.130299Z", "iopub.status.idle": "2021-12-04T15:54:48.132296Z", "shell.execute_reply": "2021-12-04T15:54:48.131898Z"}, "papermill": {"duration": 0.144009, "end_time": "2021-12-04T15:54:48.132404", "exception": false, "start_time": "2021-12-04T15:54:47.988395", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class Identity(nn.Module):\n", " def forward(self, x):\n", " return x\n", "\n", "\n", "act_fn_by_name = {\"tanh\": nn.Tanh, \"relu\": nn.ReLU, \"identity\": Identity}"]}, {"cell_type": "markdown", "id": "8eeb9167", "metadata": {"papermill": {"duration": 0.133812, "end_time": "2021-12-04T15:54:48.399825", "exception": false, "start_time": "2021-12-04T15:54:48.266013", "status": "completed"}, "tags": []}, "source": ["Finally, we define a few plotting 
functions that we will use for our discussions.\n", "These functions help us to (1) visualize the weight/parameter distribution inside a network, (2) visualize the gradients that the parameters at different layers receive, and (3) the activations, i.e. the output of the linear layers.\n", "The detailed code is not important, but feel free to take a closer look if interested."]}, {"cell_type": "code", "execution_count": 11, "id": "16bbefb4", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:54:48.682589Z", "iopub.status.busy": "2021-12-04T15:54:48.682093Z", "iopub.status.idle": "2021-12-04T15:54:48.683729Z", "shell.execute_reply": "2021-12-04T15:54:48.684129Z"}, "papermill": {"duration": 0.151108, "end_time": "2021-12-04T15:54:48.684257", "exception": false, "start_time": "2021-12-04T15:54:48.533149", "status": "completed"}, "tags": []}, "outputs": [], "source": ["##############################################################\n", "\n", "\n", "def plot_dists(val_dict, color=\"C0\", xlabel=None, stat=\"count\", use_kde=True):\n", " columns = len(val_dict)\n", " fig, ax = plt.subplots(1, columns, figsize=(columns * 3, 2.5))\n", " fig_index = 0\n", " for key in sorted(val_dict.keys()):\n", " key_ax = ax[fig_index % columns]\n", " sns.histplot(\n", " val_dict[key],\n", " ax=key_ax,\n", " color=color,\n", " bins=50,\n", " stat=stat,\n", " kde=use_kde and ((val_dict[key].max() - val_dict[key].min()) > 1e-8),\n", " ) # Only plot kde if there is variance\n", " hidden_dim_str = (\n", " r\"(%i $\\to$ %i)\" % (val_dict[key].shape[1], val_dict[key].shape[0]) if len(val_dict[key].shape) > 1 else \"\"\n", " )\n", " key_ax.set_title(f\"{key} {hidden_dim_str}\")\n", " if xlabel is not None:\n", " key_ax.set_xlabel(xlabel)\n", " fig_index += 1\n", " fig.subplots_adjust(wspace=0.4)\n", " return fig\n", "\n", "\n", "##############################################################\n", "\n", "\n", "def visualize_weight_distribution(model, color=\"C0\"):\n", " weights = 
{}\n", " for name, param in model.named_parameters():\n", " if name.endswith(\".bias\"):\n", " continue\n", " key_name = f\"Layer {name.split('.')[1]}\"\n", " weights[key_name] = param.detach().view(-1).cpu().numpy()\n", "\n", " # Plotting\n", " fig = plot_dists(weights, color=color, xlabel=\"Weight vals\")\n", " fig.suptitle(\"Weight distribution\", fontsize=14, y=1.05)\n", " plt.show()\n", " plt.close()\n", "\n", "\n", "##############################################################\n", "\n", "\n", "def visualize_gradients(model, color=\"C0\", print_variance=False):\n", " \"\"\"\n", " Args:\n", " net: Object of class BaseNetwork\n", " color: Color in which we want to visualize the histogram (for easier separation of activation functions)\n", " \"\"\"\n", " model.eval()\n", " small_loader = data.DataLoader(train_set, batch_size=1024, shuffle=False)\n", " imgs, labels = next(iter(small_loader))\n", " imgs, labels = imgs.to(device), labels.to(device)\n", "\n", " # Pass one batch through the network, and calculate the gradients for the weights\n", " model.zero_grad()\n", " preds = model(imgs)\n", " loss = F.cross_entropy(preds, labels) # Same as nn.CrossEntropyLoss, but as a function instead of module\n", " loss.backward()\n", " # We limit our visualization to the weight parameters and exclude the bias to reduce the number of plots\n", " grads = {\n", " name: params.grad.view(-1).cpu().clone().numpy()\n", " for name, params in model.named_parameters()\n", " if \"weight\" in name\n", " }\n", " model.zero_grad()\n", "\n", " # Plotting\n", " fig = plot_dists(grads, color=color, xlabel=\"Grad magnitude\")\n", " fig.suptitle(\"Gradient distribution\", fontsize=14, y=1.05)\n", " plt.show()\n", " plt.close()\n", "\n", " if print_variance:\n", " for key in sorted(grads.keys()):\n", " print(f\"{key} - Variance: {np.var(grads[key])}\")\n", "\n", "\n", "##############################################################\n", "\n", "\n", "def visualize_activations(model, color=\"C0\", 
print_variance=False):\n", " model.eval()\n", " small_loader = data.DataLoader(train_set, batch_size=1024, shuffle=False)\n", " imgs, labels = next(iter(small_loader))\n", " imgs, labels = imgs.to(device), labels.to(device)\n", "\n", " # Pass one batch through the network, and calculate the gradients for the weights\n", " feats = imgs.view(imgs.shape[0], -1)\n", " activations = {}\n", " with torch.no_grad():\n", " for layer_index, layer in enumerate(model.layers):\n", " feats = layer(feats)\n", " if isinstance(layer, nn.Linear):\n", " activations[f\"Layer {layer_index}\"] = feats.view(-1).detach().cpu().numpy()\n", "\n", " # Plotting\n", " fig = plot_dists(activations, color=color, stat=\"density\", xlabel=\"Activation vals\")\n", " fig.suptitle(\"Activation distribution\", fontsize=14, y=1.05)\n", " plt.show()\n", " plt.close()\n", "\n", " if print_variance:\n", " for key in sorted(activations.keys()):\n", " print(f\"{key} - Variance: {np.var(activations[key])}\")\n", "\n", "\n", "##############################################################"]}, {"cell_type": "markdown", "id": "307d0193", "metadata": {"papermill": {"duration": 0.134573, "end_time": "2021-12-04T15:54:48.953411", "exception": false, "start_time": "2021-12-04T15:54:48.818838", "status": "completed"}, "tags": []}, "source": ["## Initialization\n", "\n", "Before starting our discussion about initialization, it should be noted that there exist many very good blog posts about the topic of neural network initialization (for example [deeplearning.ai](https://www.deeplearning.ai/ai-notes/initialization/), or a more [math-focused blog post](https://pouannes.github.io/blog/initialization)).\n", "In case something remains unclear after this tutorial, we recommend skimming through these blog posts as well.\n", "\n", "When initializing a neural network, there are a few properties we would like to have.\n", "First, the variance of the input should be propagated through the model to the last layer, so that we 
have a similar standard deviation for the output neurons.\n", "If the variance vanishes the deeper we go in our model, it becomes much harder to optimize the model as the input to the next layer is basically a single constant value.\n", "Similarly, if the variance increases, it is likely to explode (i.e. head to infinity) the deeper we design our model.\n", "The second property we look out for in initialization techniques is a gradient distribution with equal variance across layers.\n", "If the first layer receives much smaller gradients than the last layer, we will have difficulties in choosing an appropriate learning rate.\n", "\n", "As a starting point for finding a good method, we will analyze different initializations based on our linear neural network with no activation function (i.e. an identity).\n", "We do this because initializations depend on the specific activation\n", "function used in the network, and we can adjust the initialization\n", "schemes later on for our specific choice."]}, {"cell_type": "code", "execution_count": 12, "id": "cc7ba656", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:54:49.227365Z", "iopub.status.busy": "2021-12-04T15:54:49.226898Z", "iopub.status.idle": "2021-12-04T15:54:53.850761Z", "shell.execute_reply": "2021-12-04T15:54:53.850280Z"}, "papermill": {"duration": 4.762201, "end_time": "2021-12-04T15:54:53.850902", "exception": false, "start_time": "2021-12-04T15:54:49.088701", "status": "completed"}, "tags": []}, "outputs": [], "source": ["model = BaseNetwork(act_fn=Identity()).to(device)"]}, {"cell_type": "markdown", "id": "7f1e34a7", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.136138, "end_time": "2021-12-04T15:54:54.121872", "exception": false, "start_time": "2021-12-04T15:54:53.985734", "status": "completed"}, "tags": []}, "source": ["### Constant initialization\n", "\n", "The first initialization we can consider is to initialize all weights with the same constant value.\n", 
"Intuitively, setting all weights to zero is not a good idea as the propagated gradient will be zero.\n", "However, what happens if we set all weights to a value slightly larger or smaller than 0?\n", "To find out, we can implement a function for setting all parameters below and visualize the gradients."]}, {"cell_type": "code", "execution_count": 13, "id": "e3710c8c", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:54:54.396221Z", "iopub.status.busy": "2021-12-04T15:54:54.395746Z", "iopub.status.idle": "2021-12-04T15:55:04.530115Z", "shell.execute_reply": "2021-12-04T15:55:04.530499Z"}, "papermill": {"duration": 10.27465, "end_time": "2021-12-04T15:55:04.530680", "exception": false, "start_time": "2021-12-04T15:54:54.256030", "status": "completed"}, "tags": []}, "outputs": [{"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-12-04T16:54:55.723291\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-12-04T16:55:03.610810\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}, {"name": "stdout", "output_type": "stream", "text": ["Layer 0 - Variance: 2.0582761764526367\n", "Layer 2 - Variance: 13.489120483398438\n", "Layer 4 - Variance: 22.100574493408203\n", "Layer 6 - Variance: 36.20957946777344\n", "Layer 8 - Variance: 14.831440925598145\n"]}], "source": ["def const_init(model, fill=0.0):\n", " for name, param in model.named_parameters():\n", " param.data.fill_(fill)\n", "\n", "\n", "const_init(model, fill=0.005)\n", "visualize_gradients(model)\n", "visualize_activations(model, print_variance=True)"]}, {"cell_type": "markdown", "id": "8da1230d", "metadata": {"papermill": {"duration": 0.152167, "end_time": "2021-12-04T15:55:04.833884", "exception": false, "start_time": "2021-12-04T15:55:04.681717", "status": "completed"}, "tags": []}, "source": ["As we can see, only the first and the last layer have diverse gradient distributions while the other three layers have the same gradient for all weights (note that this value is unequal 0, but often very close to it).\n", "Having the same gradient for parameters that have been initialized with the same values means that we will always have the same value for those parameters.\n", "This would make our layer useless and reduce our effective number of parameters to 1.\n", "Thus, we cannot use a constant initialization to train our networks."]}, {"cell_type": "markdown", "id": "65128840", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.151605, "end_time": "2021-12-04T15:55:05.137267", "exception": false, "start_time": "2021-12-04T15:55:04.985662", "status": "completed"}, "tags": []}, "source": ["### Constant variance\n", "\n", "From the experiment above, we have seen that a constant value is not working.\n", "So instead, how about we initialize the parameters by randomly sampling from a distribution like a Gaussian?\n", "The most intuitive way would be to choose one variance that is used for all layers in the network.\n", "Let's 
implement it below, and visualize the activation distribution across layers."]}, {"cell_type": "code", "execution_count": 14, "id": "d6173456", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:55:05.442031Z", "iopub.status.busy": "2021-12-04T15:55:05.441560Z", "iopub.status.idle": "2021-12-04T15:55:13.063195Z", "shell.execute_reply": "2021-12-04T15:55:13.065428Z"}, "papermill": {"duration": 7.778761, "end_time": "2021-12-04T15:55:13.065600", "exception": false, "start_time": "2021-12-04T15:55:05.286839", "status": "completed"}, "tags": []}, "outputs": [{"data": {"application/pdf": "JVBERi0xLjQKJazcIKu6CjEgMCBvYmoKPDwgL1BhZ2VzIDIgMCBSIC9UeXBlIC9DYXRhbG9nID4+CmVuZG9iago4IDAgb2JqCjw8IC9FeHRHU3RhdGUgNCAwIFIgL0ZvbnQgMyAwIFIgL1BhdHRlcm4gNSAwIFIKL1Byb2NTZXQgWyAvUERGIC9UZXh0IC9JbWFnZUIgL0ltYWdlQyAvSW1hZ2VJIF0gL1NoYWRpbmcgNiAwIFIKL1hPYmplY3QgNyAwIFIgPj4KZW5kb2JqCjExIDAgb2JqCjw8IC9Bbm5vdHMgMTAgMCBSIC9Db250ZW50cyA5IDAgUgovR3JvdXAgPDwgL0NTIC9EZXZpY2VSR0IgL1MgL1RyYW5zcGFyZW5jeSAvVHlwZSAvR3JvdXAgPj4KL01lZGlhQm94IFsgMCAwIDg5NC4wMjUgMjE2LjY2NTYyNSBdIC9QYXJlbnQgMiAwIFIgL1Jlc291cmNlcyA4IDAgUgovVHlwZSAvUGFnZSA+PgplbmRvYmoKOSAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDEyIDAgUiA+PgpzdHJlYW0KeJzVfU2zJLmR3P39ijruHpjE98eRNEpjtqYLd2nSQaYDxZ2VhjY9a+SQXNt/L/dAVmYkKuqxX/frboFjpM1zVqEyPANAAAh4+NsfX375K3/7Pz/f8D83d/sj/vsf+Pfv+PeLw18fXlpPmwsZ//7j8e/Bl62UXPCvP+Jjlz//78vLv724rftaUnW5tdv8R+rO9+Jqu/2ZP/rdwweOP16mT7+8pL41/EwKWx8/+OEFn95Kir4FBf+oYV/b1u743sIFk2f+0+2hcR/K1vz+D9qJeeu3P39/+x+3n26//FUYxP0T/vtH/FeIe/nlb77/2w9/+P6fv/v17Q8/v9S0xZR7b5cnPtHLU7z8y8tvb3+6N+w2n/FS7m3Ln9/t6MufXjyY+4XD/1XKFmIpIbSU0y3kzTs294cPL7/+3e2X/9XfvL/97t9e+oa3VHtpla/yd//68j9v/+D/8fa/br/7p5f/8jsY7zbn2ahT//aHD2zhF7/5/o+//+9//Zff//TzLz788NNff7795t9vv335rTzt+3PmfYZFLbR6fc0n/A6see+3ytZKj+0V2txBljvJ+mKW57L56HItV8tP+D0sz2Er0pqL+P8+wnKvLdeeB59qrdaWXPe3vlXdRri28at/vGGQ6KG6Fvmf2z/84S8//O33f/nh33+6/e33P/785cn9+JHj03gNQdqPbast91hf9aXtK3jT3mLDC04+18ngE/5MgxvG6OLhB3jC9qrN+avZ7EPdoq85pKvRCv9Mq32I6JO1xVKrL691nq/4qj16ZOo
x1dnsE/9cs0sGgbC7JFfjq2bn66jBRn7B5jAMRLpNw7gT/XXgmQaN33z/088//OU/P5O/OOwMvbnYA1weUUUa8UWImAy3co8wkgQkWyicZ1LKO9mXL9/0l1+mL7+85LxlREklXgaaXLfW4XXtMs5cUfSfGIheWrijiFB+/f+/8YaZH14KWnB41/Fi/IS2hABvpuSOLmG8ZSaMD1t2BQ93Nf6C1t56eKDkjq5hvGEmjE94voA442r8Ba3VxfZIyY6uYbxhJoyvm/cttunNX9COGbg9UHJH1zDeMBPGY8IJyWPCuRh/onFD8w2zxoUSha5hvGEmlndYWoTec78Yr1CY2ZOTIORKyR1dwnjLTFnbuphrur55hUYsRL1zfabkQNcw3jATxiO2QecN05s/0Yi3jdbjTMmBrmG8YSaMb4g3a/TTmz/RiJVRjVjFTpQc6BrGG2Z+eOEqKEfXr29eoWlLDQskf6VEoUsYb5kJ49F78Y12ffMKzdwoCD5cKVHoGsYbZsJ4xOsllTK9+RMtW84hyLiuWlDoGsYbZsJ4xOvVpZyvxp8oXL2UHK6MnOAaphtGfnjpWCTXEq4+f4DZbzH7JMPa+X2NLmG6YSQsDxi1ggvXl36imVuKDivXCyEKXMN0w0rYnjhdYcC+mH4HsYKrIeXSLnxodA3TH42E5RXxacx9eusHWtrWY4nD9oMQBa5humElbO9b7D1el3IHiPnct15CuPCh0TVMfzTyw4t3iNFd9uX62hXcOaE3n4KmRINLGG/aSfMRpXvXZ+vvqHdl88Xl0K6kXPBFCHi0lPYjUPelxjIRcMCyEe59b/VKjIYXIcAwlQwgWgkhBz8xcMA++Y2/USZiFLwIAYalPHdFXw4tuskFThhN88wr9DoRo/E1KLBsJQWI26Occl4pOGC88i1GDHhtokbji1Bg2DpO33NEd5694IB9DRj8kx/9QFGj8UUoMGwlBYjjEcaV2QsO2FfHcMeXmZkTXoQAw1IQEHgu6FOafOCEfQmbi6X6mRiNr0GBZSspQFSfa4iTD5wwujqG/Tx6gWJGwYsQYFhKAhDal+h8nQg4YB/DlkNtbeJFwYsQYFhKAhDhl9bclG12wtLzQ3bFT8RofBEKDFtJAcL8mnKbfeCAe9sqRvxUrsxoeBECDEtBQPRbQRN18oETbnjm3H3uV140vAYBlqUkIG69FX7/SsABV/q6r61cedHwIgQYlpKAgjbgyrMHHHBh9g3WgvXKi4YXIcCwlAS0Lfdaw+wBB5z7lnMdu16qEQ0vQoBhKQhICOpczH7ygBPOeXOhYM6beFHwGgRYlpIAhPiuh94mAg44+y3F6urMi4IXIcCwlARgMPPZtTgRcMJ46SU256+8aHgRAgxLSQAC/OBamT3ghAteemtjb0g1ouBFCDAsZWI24vtQSp48QMEZ8a9rMy0nuob5lp00H9F9DGnaF9dwwitPfUyCqhEFL0KAYSkJSHKJIMzv/4Tj1hDtyAG/bkTBixBgWEoCENun5NzsAScc8ap52eWBlwNehADDUhKA2D712mcPOGEM+xXjfnvg5YAXIcCwFAQUxPYZEd01/UHDcfOuhf5Ayx1dw3zLTpqPyL4gvE2T+SccNx79+/rAygEvQoBhKQlAZF8qRvOJgBOGpT5hDfjIyx1ehADDUhKAaK6GHmcPuMD3fOapkaXSnE1Lec/EcTKrfvKAK1yTbxYvO/ypBFzvxmz59h8vTy260vHP392ud2jmixf4ZGNWI76VQZofCbqlSNheE2KZlqK4d/SwkyfdtfJ2LKY5yWoMqUu2S23cAfRN4h7PWY+vvIUt4CGTZzQYi8e8MBLEIsZHrjXz1hAkywDREC9xH10i54L35+JIqKpMocQz1I2PK+dsrW0u0sVujLcir9gQ7Rt8DYvPwHTjktNIzcFyJLZyw7wcc8h1T1tBaO5gT8ZvwVO9fBbTVSoVT44hvOSKhdxI80guJzx5IQtY4XNfp5cNi51UIy8IlpS
D7Pl2RL8NMWC41bIBi2nkC7jkPD4AOmKCc8g04RyetgW01uXsaN9IdAFBQwmJx+sYR7CG8uPjcIkeYOqNW23ZuVLH50EL0Aiv4VuqMbq0H8+5BDrSjRMSluZJ3hOvhAZX8E59gWHe73vYHs9QsuNBDpw3+ZBj2fEO2/EM9HV8ERPafvQFh6mF9449rGqljp9NcuPJZTkSoyOkvuN8p6mNozKH19v2A6RQfJUjNA8L4bbjMQveIQ2Q363R+7TDvff9tldr2fW2H8JgvsHAK08fW61lfBxeGdERaG3cUkUrMkV5fBldD92F0QqmqH0PL2Dqguviy565i6WUJu0EMhsypnQYtOEFx7HeDxzoeoQpQlQPuQXB0f8bvnzr0koch8Z4bzWB18LMEZfQd+8bqqnF2POtgcmI7hf27bTm8ELqDcTgfQ/P59CQYWAvN95Sg5+n8emKUKtwVCloO7bW+74jkyJmYHQU2lnccJoESumy8ZajhOtuLN7Qcbrr3L7AuBZ9HAENenQIGDQ8F/UV/bLdtwDwIIXduKITxSBdXs6AmAyV2bvRFfCmJCryGwY3xy1GdHQMzmksF/D7vaWRI42Rog93zLwGXTiIMIjGwBbvoRUG28Ct+sibnUH6ON8tumIoI+Bw+2NPYzM+1Z7D1wuDgYPtBjLH/PF379ha1+3Ronn19sPTS/v4xpvu7z7+6qttOxj1sTchMcC2DFfgP+iaGJv3lp7fY/xvv//P7/+Mv/RFxl134S1CCUOdYRZMeNBauAomBF55fcxejRjzMe6WKbFHwReOVCuPwgn0juMD/OdT5+8Xy6dCCuPM4LrwUPA7XIoPIW+lcOTF6F7fpqKAgCO/g5DCF2QQY2pzko13YfCE34NBNJEl5Q+j2scJKmzu4Wr0lyMBwyTvV2V3Pc9W8DuQEPmUia25hgjpo0gI+Ym8AgIuzDQpYMwGGe+sr/AFve1NA84nOpt3I6V+PP3HaS58EwoQtzgE6blfKTjhd6Kg0lcQrHm4wGtyBOGbsMCo0pWEQOlKg8LfiQdG0wh+GcfnHF4hIn0bIjIvu3JNNBFx4u9FBJZ6WGW3hEAgvKbLUZ7oNGCJofn4DL2GT2SWmxsfu5r/+5sbr+6MIEyK1PPAiv16yovP4muuTtk+E9ywiI4CXxq5w8fmxhpEGBaTCCymE7pqm4i4wCcRJj+LEWFYzLgTcUuGAdcd/wk+iTD5WYsIy+IRgMfcXJ48QsFYcgYXZRGpG1HwYkQYFpOIhLVDbGn2iBPmsJD5bzM/B7wYEYbFJAIRaOklzB5xwnIpJIfyyM8dXowIw2ISgXVizdxWvBJxwnGL3KJ7oOeOLkaDYS9oyH7DitBPGUIajlgz5ujqAzsHvBYRlsUkIiIoLX3KFNIwIsEYmpyG6UYUvBgRhsUkomyyQukTESecsIhFmFke+DngxYgwLCYRjZu7OaeJiBPO3M9NzU/8KHgxIgyLQUThJlTiJvaFCAVX/G4schCmG1HwWkRYFpMIToLOT4ICGu5brrHKeZ5uRMGLEWFYTCKwdvDcYZ+IOGAejGQMiu3Kj4YXI8KwmERg7TB2U69EHDAPrgJ+JE38KHgxIgyLQQSPV0NNU46RguEE3P0accTZiIbXIsKymERg7RBjmLKNFExFrYjfjVd+NLwYEYbFJAJrh9hdnni4ow0NoZ0RTp1NaHgxGh7tJQuFGQhw8YmGA+4IpEuokthxtqHRxWgwDCYPWDlkV6Y9ugNlIkguPUiCg2rjgi9GxKPF4KF55gmluVucMLM1QvJJ8nQUQRpeiwjLZDKBkb+EKSXtROU6TuJqc+JH44sR8WgxeaAMSe119ogDZk526rylfSVIw4sRYZhMJrByEJnBKxF3lMLWrqV9a0rxo/HFiHi0eBz61yoHyhciTphJaIEphBNBGl6LCMtkMhHxZnOcrvIrmGl3rWK92WeGFL4YFYbNpCJvsXvvp95xwsxb9lhbpIkhBS9GhGExiaj4JD87EXH
ArMVRe2Ae65UgjS9GhWHzh5fomJ8TSpsSxE6YAkfoED6kiSKNL0WFaTOpYFpuS9VPVBwwNQ4a5kuJJDVFGl+MCsNmUoFFhE8hz15xwMyiziUiuJwo0vhiVBg2kwrmWzmXZq84YHSJhHZkQ0o1ouHFiDAsJhFYRzC9e/aJA25pCwwiypUfDS9GhGExiKCLR18mSQAFV8ycGVNFv/Kj4bWIsCwmEdx4q8ztvxJxwCXxrk0UEQTViIYXI8KwmETIXZg5QV3BucEJ0rjxoRrR8GJEGBaTCKwjUuOV7ysRB8zd+zQ00jQ9J7oYDYa9oCHwdkmqefIHBVMeJY9KTboRBa9FhGUxicCQVxxz7a9EnHDdfBPRpCs/Cl6MCMNiEsHbf4iLZo844by10PoYKlUjCl6MCMNiEsGbUsG72SNOOG0wLdSZHwUvRoRhMYnovBjcJkkBDVNNSi4YXPlR8GJEGBbzakbYAgvsXdOHNEwVCbz5+MDPAa9FhGUxiUiPReV+vMDcv89BRLWu/BzwYkQYFpOIYtXR07BKqbzys2ampWnxuLVk1NTTMEtptVHe88rPAS9GhGExiEjeqq83wbWOq9NTI3d4LSIsi0lEtGrtTXD1Va7Az/zs8GJEGBaTiGLV3ZvgkwiTn8WIMCwmEc2qwTfBJxEmP59LhL4d9SL6HLePpOVRn2O6XVNLdX1Pv/ewKKYxzPc8cq0rawnuAjQhhyAaD8ytLTXuUQK1EPKAWQ259yxqHM6FKmU7mG7oUsF/KLwRUsEoKnDf8IiFtRLACuUH7jl5PUWRCmkba4CMnfESNu+CG6u4lvDvcU9cwzcYpfCZME+P5CW8hlzxS5Tf6DGnEvacJu6Q5ET9jRSoxCAwT+cS2GL1TLDq/J73Ezwrm7P8Sug9jQOsis9QXcLzsmAtJY+nrnErTRYSjfv2Lcgik9kiLVVqjrS6de5OjSSSRhlH55PIOpRau8gZh5aZvF1ZnB1cdqafxf0kFW+GYiAUP6rZl5H0zutkVY5LKEsBxyuykiGODzWeshUEdJ67QYL3LUZPpRCevvlaU4873j0WRLtIhoiu7Kd1MLvBFhHVAB7GKZ7HAgq+V6+69MRLanmcc8LNQxwfRywVaqe0CLU8MvXrdpwaKWmIu0e8kVr3o7HYCqIOMauDHHfH0V9oCysChOj7uAzS4XdoBeMwJdIpFT7Y74UH8SXVcRIPL91PWeCQ8GRwSznB7FobNHd4JJpnLgcm+4pHuJ9EgEJHaRGExwmds8qiwVGdP/Pit2dAABeW6dFlFiWrfSg1++6lRld0Ur/KM4Eqb8lRyF12JxzeW6UYCnwloA2RreBuHgaTgA6EF5gDaxzue1uuJfQ/ZuUl9NLxJB5fxavBgha9BzPzkGKJnj8ESiKTGSO8TErhckMEFPDqEEVEfayioAI2qTLuRo5s3f09BvhJz456gzyFaVX8HUtGvEfusrFPt1aHjgn4pdoN/iPaHD0N+RRe6GYVAynVV7Mboo1ca4CsxoGQGRMxlRFesCPjB2QthnfmxIkihkSMEaHJp312acTpGMQc3vh+7lZjEFd5GJ/jeBAbfoM2x5N72c+UHdCyeWX7w1ONCHzjzXe/7V9/9TfeotXB4TTtkxaHlI8X6wjfRKwDz7r1x0xgDG9bfaw/ouALSaoVW6zj/IC7/tRnX3VO6F01Phig4HdQWUiOlyBKxrqGSQhvFOtw7yHW8QUZ5OxNnbFrNKfg92Awc05HaxhYMQt8oljHlyMh+4qgBCPkdWtMwe9AAqYGTERsLfJCyceR8EysA2MzBrLha++r1PEFXe1No80nKqIwgex8+k9T6vgqFCAuQ1jQQ7lScMLvRAEVuSjb1dD1+iss5G/CQqcynQuiT6FYOOFPZ8FrFrioQAiFX0aU/goL/ts4A9X0KBkX+pUHhb8TEVxGYRmEdWFHjPoaE9/GIZjNFXLiHdQrEyf+XkxELNmx+KN2ZK+vadh8I58oPHJD5B0mJk78vZi
gTjBWgin1ml5V88lPxFuwMtKEfIZ4yydS+1V3wBKWokaVmkThyccqNRNc49hMmRq5w6cy7RJEGBaTiLwZ1WqewiZtixFhmEYiqlW1ZoJbq7InMDVyhxcjwrCYRHSreo2Gqc+NFUKc+FHwYkQYFo+VqVHFRsPcuKKs4SM/d3gtIiyLSUSyqtlomKfJMcu14is/B7wYEYbFJKJYVW00HCl7XaSm65WfA16MCMNiEtGt6jYajlvD+Ngf6Lmji9Fg2AsaKEL9WOVGw3CBGOoDOwpeiwjLYhIRrWo3GqaqdR5Zq7oRBS9GhGExiShW1RsNly3lNI6udCMKXowIw2IS0azqNxpuW09uHI7pRhS8GBGGxSAiOasKjoIzV/nVtys9Cl2LBste0sA/HqrhKJj7ziU7EavR7Ch4MSIMi0lEtqriKLhkefMjvD4b0fBiRBgWk4hqVcdRMCupYJqM8cqPhhcjwrCYRHSrSo6CW95cLcVP/Gh4MSIMi0EExjzmd7jJI064V9aHSSOsPBvR8FpEWBaTCEosuNAmjzhh71jNxlfJsFGtXPDFqDBsJhW8PI2PzT5xwFJGvfoY60SRxhejwrCZVGD94Px06/pEqVASY2qiHK8J0vhiRDxaDB4Klg+O+XlXIk6Y9UTlBki9EqThtYiwTCYTWD/4OKkLnyhL/HhXo2RIaX40vhgRjxaTh8KtR3x/IuKAmVrXCiWmr/yc6GI0GAaTB/T0MJMwsEtOo2ZG44uRMFs7cmFKxEcmEk6YSZke0WOIF3IUuBYJlsHkAX/EMh9vHaiUq8PvSrqhZkfjixHxaDF5yEwijXn2hwNmcm0J3s38nOhiNBgGkweEyKn5KYo6UM9lNmsw1okdjS9GxKPF5AGLhhz7JEihYCZVh9CrJC9oghS8GBGGyWCiYdGQe/XXVC4Fs4JhY1XTNjGk8bWosGwmFVg0lJz65BQnjLmBeqlS7lIzpODFiDAsJhGFS6bQZp84YKkwilhatLU1QRpfjArDZlLRN1erK7NPHLBnEaTSfK4TRRpfjArDZpbp9Bva5O3xCxUnzKswvkapqaoa0fBaRFgWkwi5DzXfVVBwQ7sUfbvSo9DFaDDsJQ0sqpyY33Cl4YBZwxiT5USOQhejwbCXNGDt4FyYVCkUXBIWWVXSg1UbCl2MBsPeDy/Z4ZMu8xaWpkHBFCzKLZYrOQpdigbTXtKAP7yvtU40HHDmdbouaWKanBNdjAbDXtKQOebnMnvDAWeHFXfILk3sKHgxIgyLSQTPJGJMsz+ccNtcodb4hR6FLkaDYS9pYLXtzgToKw0nXJgrTmHpKzsKXowIw2LeTwqPRSR/vMC871u9REu6EQWvRYRlMYngpeWHspka5nWpFmWlrRtR8GJEGBaTiGKVzdSwyBB4kVDWjSh4MSIMi0lEt8pmajhuoaZx//vKzwEvRoRhMYgI3iqbqWFmFvPK+UzPHV2LBste0hCtopkapihqC3LIPbFzhxcjwrCYROCRHotmTnDzrqSJHwV/LhHvKdMy36PxLXbJJnaY9ntw482W4O/p5Q4ejtfJjt6i27OqCyPFMoSscsVH6p5ci2ghJsm5DRQEqXuqaY6lyjzKliWgYN5ly8l1CT9c6tXJ6oRqDF6q3yTKoERXwp6c6DEDF6ks13gqMOC6xeh4BMef9kPUnBl8GJu4sEFI2woaG4l9nde20F+Z2If/t4V7nlvDr7h2yxlmYcYfOT4eL0dqn2OZFLsfihOJGhGguVHTxRWsH/yeGYV2Oh6qgkfe3fZ7npCvDX5wq3LKWeJoo1FmwPlbg+UVjytPnT1cIDIh2TtP4Zgs4jcps9ymZ9ETinQXmj7wjCY7iy56eGPFj46j9gbackvcPOaxYh5aJgnPG5Jvfdxf8zmHYSdw8BmoNkLpj+PVyx9U0ZAbdN5VLwuDRBHg3AM1wyl7g3hR9Dx4nNlqKWlosSSHbwy8bnjUzrN/SsCApOFDBVF2zOB74KGnssMF77kOxZg
MVtJ+PBYzL5ZTtQR/jVRNfsL7yLaLBO1elFJ4hlTglTVICQQXwp6GUPOWSxkyOKzLB2NG63CYEkXuJiPECb6kfb/dpSBqN/AYJnyNn22OOmWiakPdD3Q30YZODcNgcaJew06E11/DvludwTxlaij/AkcZ7kGF7VxEdgZvMLUY2vi8bFTwQ95TlxzDzPjdxtT9UgsFYBCGpX1Bj9cMJ2c2Gl2ojKUsd33Qc/FeqSeEOL7dd4gAJubwwVNb4KBNuLKoaQui/4LXHkUbhXsFeFwePWUq+fjc96UzKKO0DH0wptHtMry2wH/D0AWG443wEQtMOqcTVZjqETwUgePGch3sX2gOY9aYShwWHZVXmLgMC+jTLu6rkoSxYJeYRbzhRyNNFKmjjBbAkh9hC1eylUI47JghDbFJBrKFYkdSx5S9dP80vCL5lEWhqmIsSOPT6LIcU4sU/nXNyfXqjIGSuV3jao1n8l95nBAQEon3P4HfoAvzRAXgmYgIWjYFAj48lSPBN96sNGD/+qu/8RZdGA6y/U16MOmb6MGg+8BzH9KLK6XjH4v4KPhCjmrF1oM5PsB/0idFDc+EPDpGR46I191lBb+HkAdG3dIrpmmMe2+WgwnvoQfz5RgsdFWEIJPwpYLfgUEMH9RgY3knrDo/Vg/m4Rr+F2ShY+JxPU6Jowp+DxYqvZKtBcQfH8nCfAX/bM0x6EB0EUTe6n1FYb5gj33TkPOJHbbkceFhPP2nicJ8FQoYVTuESvVKwQl/MgWIohUFFGGM8KWOgONNaihfhQWRekSAV/qVBoW/Ew/eiaIlIkVEcf5NGiBfh4lUpQB59xMTJ/5eTDAmlJg+U7LzORPRPdEAwQJME/IZGiCfSO3X3V5pzarJgxDSqsmjYS5H+pB20I0o+NheWYIIy2ISEayaPBqGw2EQkn2PKz8HvBgRhsUkIls1eTSMNWdzTjK+dCMKXowIw2ISgTHrsSaPgrlu7qlM9Ch0MRoMe0lDt2ryKJiCxi65sQxX7Ch4MSIMixFMu2DV5FEwJalLlNo7mp4TXYoG017SkKyKPArOiQmhcjVVk3Oii9Fg2EsailWPR8Fl6HzLrqpqRMOLEWFYTCKaVY9HwQgagGU5i1CNaHgxIgyLQYT3Vj0eBXuW+/Sp5Hgl6IKvRYVlM6mIVkUeBXP/POBvf2VIw4sRYVhMIrJVkUfBXo6wXZ0JuuCLUWHYTCqaVZNHwT7yLLM1uYqoKdL4YlQYNoMKnvU+VuVRsGdFP4ROsnOgKdL4WlRYNpOKYNXlUbCP/OHS20yRxhejwrCZVGSrMo+CfWZ1jixno5ohBS9GhGExiahWZR4F+8zyKHmchl4IUvhiVBg2k4rOY++e+0TFAcsBOH7W9YkijS9GhWEzqOA9s5hrmrzihH1gBZ8eZNtZU6TxtaiwbCYVWE0kT5XtKxUHzHkCUUSVjJQLRQpfjArDZlJRmFMU/ewVB+xT3grsLjNFGl+MCsNmUoEFRWa5rYmKAx61mFyTezeaIo0vRoVhM09/mc7RWpu84oQvig8XiiwliCWosGweB+EIDRgxXqk4YKZWee5UxYkijS9GhWEzqWBdnKn60o8a9pL8mJykU2mKNL4YFYbNpIKBUglz/7ijPkcmeTnJLNQEaXwxIh4tBg/crEeQFCaXOGHmKSYWQk0TQQpeiwjLZDIRttrqdOv9RJmX6X3Itcz8KHwxIh4tJg+sRsfqlBMRB0wFrdBDK2UiSMGLEWGYTCYqpsI+6TqfKOuRIMIeKbaaH40vRsSjxeQBKwmXfZk94oA9KyUy0zdeCdLwYkQYJoMJptx7N3eNAx05GXmk9V/4UfhaRBgWk4fEXOc6aSAo2Efu3qYsWe+KIA0vRoRhMpnAIiKEPMkgKNgH3ifwToqfaoY0vhgVhs2kovFgL7rZKQ5Y7hjAfCmOdaFI4YtRYdgMKioWEY956wr2vm49lSpCzpoija9FhWUzqYjce2p18ooT7jwh73K/RLWh0MV
oMOwlDVhCpFzK7BEHzPqdOed2JUehi9Fg2EsasH5gFevZGw6YRcBr9WML82xEw4sRYVgMIigHlGuIkz+cMBaarPgsF7xVIxpeiwjLYhIR5JLlJImgYC61XIkjnUbxo+DFiDAsJhG8m9raJImgYMbVLcaxAFX8KHgxIgyLSQRLfqfcZo844MJBMRa5yKYa0fBiRBgWk4j+WLXwRw2zyD1GRxE3V41oeDEiDIvHLR6j4KCG64ZJ0o8zQNWIgtciwrKYRKTNKMio4b41apuHiR8FL0aEYTGJKFadRgXnsEUsvuWmt2pEw4sRYVhMIppVp1HBGAx6jeOYR9FzoovRYNjLmzbeqtKo4AzTW9vPeBQ7Cl6KCNNiEhGtKo0a5tV+l+Sev25EwZ9LxHuqhUw3bkJPLjEpH4M8k8p5rMP6kin6cS3FU14yJ5ELKbypKZfgKULaPDUYUkLY2KrocOYetxR798IK5oxe5YJ95938lnmmWrdU49CX4J3kGAtv0lPUA62l4zpEzzxGpoxfyKBE4Marb8z6rmjQ368MhEjVBBH6SCKBOGBmMjVRM2CdaLklVpyjOorM8xTqj7mNtFkwyhpQmTDWBMmNT1Mji3IZhFOJ8cg/r67zM5myBbG5kZxMMZXGjAhqi6R7DAG4gYcRY/nWS5IZ1VF2quKxi4hQFCkZURw4c8V7LNr6VvF7+2M3qVeOEL2LSsNQWygOszLmIgSsnY9dgugnFO9YFpKqL2QB3WG07Tk+tSZFbiLWPmX/TRZDhzNQsAI/D9LB0G3kjVaPCa+JRAlFG0Ys4LNU1MO60QdGRcGPs38PRmMKo0AMBWZq2mFx9zgUTVwp49jLgzu4Eq+jw/NzQsAZd7xyNdIFxxusw1iPASbiGUZPgUcMDbviO7qhoz4N8YjOMMwKjuJNhRtDYbymwQ5wWI4vyHZhYx3VkeYEG1OLFWZFj/eXnHguc+IoD8b02diYFDZqx2Gc2XLJNY2sj5AoviJ4wo9lSuAwXSqAkHbHKzvVXkXFtRDumWYRkRVTuTMLvKbqw46DEc+9POD97qqBnhiomSPyJfCzMh6nbi755qqk7lG+R6Q3iFOdhxvmnT7c3WiG6Z8uMVE8gX30hDw+3jfw4WsXazuWQGNtFB0+VBs33slO9a6MNCC/oYtTZ4dsohOV4TzA8U02KuOa64O0GLj3Qv0deVk5tuZ3vEVMGVVeVkD3GrNKxGgCNtk6XjPoq3mHe4/8DJXCe6m1j49n+HUoVLBIzLmodbzbiEfojkI9cA+W79k3Q2KlSAmlfCif02ouo7/BdHLDM9mS0D7V0Ha88DSuigQNX8+OYxByzQ31HLhycHe4tgor5ePoMWF8PDle3CiU96YKT8UQHHe8JwwYXcokRGoNyGNyOEavEen4CsvhVPdkgpaCiAhxsKUS0Thbx9gSMAlVkZTnwdE4M6BUk+MjC4wO1++5ChmO06I0g3HN7yf36GYYGkWZvtLAIEN8oVgTaxeMo3uMqaPMKA+yU0WHIMv4JZg72Ew8oCgiXiT3t1wePQs43oyXtBAqQblRSYkHwYG9qY7PJ7jFHa89tQHHiGlhwJ6JNjkXeZyIl5jHWVrkIbJoIPGbHG2FtUz1GLqA0MBB0w8c4xdGjDyEftCz/RipRzwTxaV4uWJ4Mod+eHgaeMPL6vejzAqfonqRyKaVnXveNMZfVC8SQRq43f3EL7Xs/DjRQriwn31isqBmDV2f0y563ti2Ag6YOlNepGpSHL4G/w0B/57keTz62xgv6EjN1yjnRCC7jLtDBRZi2vdF1IsQtw1JHp4goHVelvCS94lHvp84MAm2jMRHDDt7M4030rIbWeRMgtt33zGMxNjS2H3HnynvMCIDzynIs+wDhd1vY4+aJTlr3qegFuTGZ6mJulDoB7cKh8IYO7ivYx7B60d36zXnMSrUQjUKrEU4p+Jf0niWis4cGJJwXoYThDGi1Y5JhNobjBAw8pd9nxh9Fv133DjDbJ7rvke
G/odZTDYLXdsHXcA9cHLgIqjj7Q7PaxiAHUdXCV9Ac7zvv7nKYYtwDvcxrqF3R/Y/eZBS45gXGnsuPYxRhuMUkXYYcybvOgFGuB2lGjq3bHLmrXii6MpjzmyFIp9S9ZSzLQyLO1wpt1QkrvG77hp3O1oNbb9th4BvTAnUnY8MdLnCgT/7cIfxGJRhR+/KmOLHmIQAxTP4TLJAlmh2h2vpcu8ProEJzMd9OR2p6kYUX4vlWGSHUb0XA2u5B0ddKrdmqkhRLyy1dKzAMG8VWaAi/B1qTGUoYvcu+7t4ij1m4m0gRM1R3g3iNT+iEURKCdFok3fDcgMyVmAWpYo0c1Iy69Zgedd2GF0JI6ioXyHyFU9j6F8ronCxPdQwBpDqZPpmFraMJKk9rB4SnsiF5/AbpKWeaIk80yNCy6bMyIenykYUo3qrXon966/+xlukpRi7JbbCf94kMVW+icRU5eD+eG+lNeZ2XMm7Yxd61PdtcanzA/76I5+ty8GWMemUKU9Ywe8gClRl/YlwsLEszpvFpd5BW+rLEdjYQCxuUlVS8DsQiOELIw1aw8ozfayqknsiqoTgeqMn41mpDfe+okpf1lM/spN9upfm89E/TVHpq9gvYVRjgHraf2KfbD8CR2U/8/3RFbmOwAT4nIL8bThAB0AsJFHASYICP5kFLkzPh6fKa8+eezT178hKfSMemEmJtUC88HCC78UD79dGrFOxtnlVVMp/K3/AWoRBo7vwcILvxQMX+JQFRtznXxsZwjz+HppSNURNx2doSn0isV93Ex6EGWXDKqWAH8uGKZi7iwgExxaIauWCH9vwa1Bh2AwqONI+lg1TsEjyxrFboxrR8FpEWBaTiGCVDXsKm7QtRoRhGolIVuGwp7DJz2JEGKaRiGqVDnsKm/wsRoRhGonoVvGwp7DJz2JEGKaBiOat8mHPYJuftYiwTCMRySog9hQ2+VmMCMM0ElGsAmJPYZOfxYgwTCMRzSoh9hQ2+VmMCMM0EMEMh8cSYs9gm5+1iLBMIxFxM0qIPYVNfhYjwjCNRGSrhNhT2ORnMSIM00hEs0qIPYVNfhYjwjDtw0tzzioh9gR+ws9SRJimkYhgFRF7Cpv8LEaEYRqJYGbIQxGxp7DJz2JEGKaRCGbsZJ7oXi1+Apv8LEaEYRqJ6Ky35Pv86p/AJj+LEWGYBiK831orfcqYfQbb/KxFhGUaiUhMcqyTUM5T2ORnMSIM00hEkVoNOU0WP4FNfhYjwjCNRGD14BLzT64WP4FNfhYjwjCNB95YPXjnJ7mgZ7DNz1pEWKaRCOa4TnXaftRwLSwyN0pVqkY0vBgRhsUkAquH4EufPeKAPaPJ4rLkRKlWLvhiVBg2kwrmLFZmsl2pOOEkqf+SJqkbUfBiRBgWg4jomEgayuQTJ8wE8OhHmVTViIbXIsKymERg/RC7m7LDTjRK8V7RcNZNKHgxGh7tJQtYPKTU4kzDE9jibDEaDMvIA9YO2U2b0s9Qk5zFaHi0jCxg4ZBLeugUT2CLncVoMCwDD8mzDrWfJgsbtclZiwbDMrKQeCOj1+m1P4MtdhajwbCMPBS5YFkme23UJGcxGh4tIwttq4+56BrmtbTY5OqDakOhi9FgGAweqOPfcpxEcRTMmgc5uirXElQrF3wtKiybSQWCoe55ufZKxQnzwlZqI6hWjSh4MSIMi0kEazfzsxMRB8w7YSn4seI8G9HwYkQYFpMIrBec3BK/EnHAXEZkRA5SRelCkMIXo8KwGVTg0aNrqU4+ccIXFXNNkaluvgQVls2kAssGn0KevOKEe6YITJXr8KoRDS9GhGExiUi83kg5zSsRB+xD5K0VL3fBVSsXfDEqDJtJRX2sdPujhjFKpt6SKESoRjS8GBGGxSSiW7V9n8ImbYsRYZgGIqq3avs+g21+1iLCMo1EJKu271PY5GcxIgzTSASio8favk9hk5/FiDBMIxHNqu6r4bjV0nqd+VHwYkQYFvNakbeq+ypYrkk
ZBF3wz6XiPbWj1MUaqVbhmlwkq4UiEo5VLOQmcBySHYR76Hy3gDERhqGRRZUU17G0oprFXaBIbqo0KjgQzp7353e4lMqL/Gw6uVjHvZa+BazZeZFfpGFGVTLe8kggN4gSAq8Gi/wG7zz4lNxQj3Iwzg0YcUoLvG4voiMUABKY8iVOzp+pBMPLrwKXzfcudU9gbohDpUKy53PzDBmyKH7k0UiDEaUNgSzfKUFx21PMa85M+4iU8uhDaaA5jIuIorvs2fvORyVMtY0QmC2DVWhLOY4c1Lwl9JQ9m6g5J+odTDurPbYzNVVkbpqDESXGMFay0YnSBdMummMCp8h9UeRTYhfv8E20J2cK2UlBDsJBtI+CLIfxQlMaML5aa3JiJN5GEIUOHuCnWFwf2mg+UieQcN5yT7WKCljx6Ah9P+WulOvI1E3oIXi5f9eo2+0DVShyYMptF6kGfGcr2eF3WJjPUXJLjn6CaEj1TE2QQPmT+yEh3h7eDu+n4m2kcUIS0hZa6jxFZZ1Yl0VcgzBitwB3pb/gpYa6n68lmMPLfRt8P4vaA29suxA6XjZguGcQXQzChXgRuPYaRtOVIhQF7lolE6zsjVQMeY4SUYDhO6HcD/oiPB3U4/l8jb6OB0GX65332Nkp0DNi2M97Soa3Sn1oPH6SjsON/+ojD4gHf0ObsEVW3vHs3pldNbgU9+1xF10aPu9d7aXsMJ/Pi/JnotCWWEkprNb96ArdU2p9h/FUlAACXGJt9b7pHFOlAhAlMPiBsMM9VAoAJSqSoC/Lcyepx8mOi590Nbt037F1TQRd8Ui5+H3DyoPNHNidGiU8hixcS7Q4NnQn0f5xow5yo+/idbbMwByeFoY7wEnRffEoHDQ6mPT3XUF4HRWBikj8DKEg7pFhEKLED14O5WSkY7fMVMdMxZ4mYneiy8PdE8pEcffEJYytiAHHHgPvHjnQf/PocT62JGorTQToMBO0IZETQw19xytGXW7YoRdh3BjKII1Sxa4mVmdEN8o11kE5cN7+91VwjFqx7et26tgWQeUD49N9Yy0m6vgAD3iWwQBwjOlDxyfzXQzJKC56A+XGKOTD7SEMp2HHef+bWnLUjMOgLGWXW/HUcQpyQRpPX+6eWyhh5Dqo4tAFV3Bj/dREh657OnQsMcS6B9EY8SnZw9/3mBPk05WTSBBxHnpX7HucGXjxVgQAKe89HBRw7V6keRIlScZtyMY9jOp2aZ7O23Flh3vqNYq7gMteR9uU7+mi2BOp+VnjPaDDCI1RIFO6B/1tTOoi6iOCPeh4Pg4VqoZJI7fEo2pwzDJxze8hgOeMGAhTTjTd4cpyDlnm0ZxSHXDn8S6leUg82Qs7DNfiTUfC/J78JIW+mWcnczS6TBg/eUYjDC8yBqZX4Dco0TwRYHgmXoKWH7UZPtgCKFSteZO8g/2jz1t/i/oM3JDRQh//vEV9pt2eSG6gE6OTiB6WVC+/NJUsxY2Kobn6xIhEKW786w8//+XPP/zvv/KPy2Xwl/8Hi5HogQplbmRzdHJlYW0KZW5kb2JqCjEyIDAgb2JqCjEyMjMyCmVuZG9iagoxMCAwIG9iagpbIF0KZW5kb2JqCjE3IDAgb2JqCjw8IC9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9MZW5ndGggOTEgPj4Kc3RyZWFtCnicNYy7DcAwCER7prgR+DiA94miFPb+bYgtF9w96YnzbGBknYcjtOMWsqZwU0xSTqh3DGqlNx076CXN/TTJei4a9A9x9RW2mwOSUSSRh0SXy5Vn5V98PgxvHGIKZW5kc3RyZWFtCmVuZG9iagoxOCAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDE2NCA+PgpzdHJlYW0KeJw9kMERQyEIRO9WsSWAgEA9yWRy+L//a0CTXGQdYPepO4GQUYczw2fiyYPTsTRwbxWMawivI/QITQKTwMTBmngMCwGnYZFjLt9VllWnla6
ajZ7XvWNB1WmXNQ1t2oHyrY8/wjXeo/Aa7B5CB7EodG5lWguZWDxrnDvMo8znfk7bdz0YrabUrDdy2dc9OsvUUF5a+4TOaLT9J9cvuzFeH4UUOQgKZW5kc3RyZWFtCmVuZG9iagoxOSAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDYxID4+CnN0cmVhbQp4nDM1NVcwULC0ABKmpkYK5kaWCimGXEA+iJXLZWhpDmblgFkWxkAGSBmcYQCkwZpzYHpyuDK40gDLFRDMCmVuZHN0cmVhbQplbmRvYmoKMjAgMCBvYmoKPDwgL0ZpbHRlciAvRmxhdGVEZWNvZGUgL0xlbmd0aCAzMDcgPj4Kc3RyZWFtCnicPZJLbgMxDEP3PoUuEMD62Z7zpCi6mN5/2ycl6Yoc2RZFapa6TFlTHpA0k4R/6fBwsZ3yO2zPZmbgWqKXieWU59AVYu6ifNnMRl1ZJ8XqhGY6t+hRORcHNk2qn6sspd0ueA7XJp5b9hE/vNCgHtQ1Lgk3dFejZSk0Y6r7f9J7/Iwy4GpMXWxSq3sfPF5EVejoB0eJImOXF+fjQQnpSsJoWoiVd0UDQe7ytMp7Ce7b3mrIsgepmM47KWaw63RSLm4XhyEeyPKo8OWj2GtCz/iwKyX0SNiGM3In7mjG5tTI4pD+3o0ES4+uaCHz4K9u1i5gvFM6RWJkTnKsaYtVTvdQFNO5w70MEPVsRUMpc5HV6l/DzgtrlmwWeEr6BR6j3SZLDlbZ26hO76082dD3H1rXdB8KZW5kc3RyZWFtCmVuZG9iagoyMSAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDI0NCA+PgpzdHJlYW0KeJxFkU1yBSEIhPeeoi/wquRXPc+kUllM7r8NzbwkK1qF5gPTAhNH8BJD7ImVEx8yfC/oMny3MjvwOtmZcE+4blzDZcMzYVvgOyrLO15Dd7ZSP52hqu8aOd4uUjV0ZWSfeqGaC8yQiK4RWXQrl3VA05TuUuEabFuCFPVKrCedoDToEcrwd5RrfHUTT6+x5FTNIVrNrRMairBseEHUySQRtQ2LJ5ZzIVH5qhurOi5gkyXi9IDcoJVmfHpSSREwg3ysyWjMAjbQk7tnF8aaSx5Fjlc0mLA7STXwgPfitr73NnGP8xf4hXff/ysOfdcCPn8AS/5dBgplbmRzdHJlYW0KZW5kb2JqCjIyIDAgb2JqCjw8IC9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9MZW5ndGggMjMyID4+CnN0cmVhbQp4nDVRSW7EMAy7+xX8wADW7rwnxaCH9v/XUsoUCEAltrglYmMjAi8x+DmI3PiSNaMmfmdyV/wsT4VHwq3gSRSBl+FedoLLG8ZlPw4zH7yXVs6kxpMMyEU2PTwRMtglEDowuwZ12Gbaib4h4bMjUs1GltPXEvTSKgTKU7bf6YISbav6c/usC2372hNOdnvqSeUTiOeWrMBl4xWTxVgGPVG5SzF9kOpsoSehvCifg2w+aohElyhn4InBwSjQDuy57WfiVSFoXd2nbWOoRkrH078NTU2SCPlECWe2NO4W/n/Pvb7X+w9OIVQRCmVuZHN0cmVhbQplbmRvYmoKMjMgMCBvYmoKPDwgL0ZpbHRlciAvRmxhdGVEZWNvZGUgL0xlbmd0aCAyMzEgPj4Kc3RyZWFtCnicNU85kgQhDMt5hT4wVRjbQL+np7Y22Pl/upKZTpDwIcnTEx2ZeJkjI7Bmx9taZCBm4FNMxb/2tA8TqvfgHiKUiwthhpFw1qzjbp6OF/92lc9YB+82+IpZXhDYwkzWVxZnLtsFY2mcxDnJboxdE7GNda2nU1hHMKEMhHS2w5Qgc1Sk9MmOMuboOJEnnovv9tssdjl+DusLNo0hFef4KnqCNoOi7HnvAhpyQf9d3fgeRbvoJSAbCRbWUWLunOWEX712dB61KBJzQppBLhMhzek
qphCaUKyzo6BSUXCpPqforJ9/5V9cLQplbmRzdHJlYW0KZW5kb2JqCjI0IDAgb2JqCjw8IC9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9MZW5ndGggMjQ5ID4+CnN0cmVhbQp4nD1QO45EIQzrOYUv8CTyI3AeRqstZu/frgOaKVBMfrYzJNARgUcMMZSv4yWtoK6Bv4tC8W7i64PCIKtDUiDOeg+IdOymNpETOh2cMz9hN2OOwEUxBpzpdKY9ByY5+8IKhHMbZexWSCeJqiKO6jOOKZ4qe594FiztyDZbJ5I95CDhUlKJyaWflMo/bcqUCjpm0QQsErngZBNNOMu7SVKMGZQy6h6mdiJ9rDzIozroZE3OrCOZ2dNP25n4HHC3X9pkTpXHdB7M+Jy0zoM5Fbr344k2B02N2ujs9xNpKi9Sux1anX51EpXdGOcYEpdnfxnfZP/5B/6HWiIKZW5kc3RyZWFtCmVuZG9iagoyNSAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDM5NSA+PgpzdHJlYW0KeJw9UktuxUAI2+cUXKDS8JvPeVJV3bz7b2tDUqkqvIkxxjB9ypC55UtdEnGFybderls8pnwuW1qZeYi7i40lPrbcl+4htl10LrE4HUfyCzKdKkSozarRofhCloUHkE7woQvCfTn+4y+AwdewDbjhPTJBsCTmKULGblEZmhJBEWHnkRWopFCfWcLfUe7r9zIFam+MpQtjHPQJtAVCbUjEAupAAETslFStkI5nJBO/Fd1nYhxg59GyAa4ZVESWe+zHiKnOqIy8RMQ+T036KJZMLVbGblMZX/yUjNR8dAUqqTTylPLQVbPQC1iJeRL2OfxI+OfWbCGGOm7W8onlHzPFMhLOYEs5YKGX40fg21l1Ea4dubjOdIEfldZwTLTrfsj1T/5021rNdbxyCKJA5U1B8LsOrkaxxMQyPp2NKXqiLLAamrxGM8FhEBHW98PIAxr9crwQNKdrIrRYIpu1YkSNimxzPb0E1kzvxTnWwxPCbO+d1qGyMzMqIYLauoZq60B2s77zcLafPzPoom0KZW5kc3RyZWFtCmVuZG9iagoyNiAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDI0OSA+PgpzdHJlYW0KeJxNUUmKAzAMu+cV+kAhXpO8p0OZQ+f/18oOhTkECa+Sk5aYWAsPMYQfLD34kSFzN/0bfqLZu1l6ksnZ/5jnIlNR+FKoLmJCXYgbz6ER8D2haxJZsb3xOSyjmXO+Bx+FuAQzoQFjfUkyuajmlSETTgx1HA5apMK4a2LD4lrRPI3cbvtGZmUmhA2PZELcGICIIOsCshgslDY2EzJZzgPtDckNWmDXqRtRi4IrlNYJdKJWxKrM4LPm1nY3Qy3y4Kh98fpoVpdghdFL9Vh4X4U+mKmZdu6SQnrhTTsizB4KpDI7LSu1e8TqboH6P8tS8P3J9/gdrw/N/FycCmVuZHN0cmVhbQplbmRvYmoKMjcgMCBvYmoKPDwgL0ZpbHRlciAvRmxhdGVEZWNvZGUgL0xlbmd0aCA5NCA+PgpzdHJlYW0KeJxFjcERwCAIBP9UQQkKCtpPJpOH9v+NEDJ8YOcO7oQFC7Z5Rh8FlSZeFVgHSmPcUI9AveFyLcncBQ9wJ3/a0FScltN3aZFJVSncpBJ5/w5nJpCoedFjnfcLY/sjPAplbmRzdHJlYW0KZW5kb2JqCjI4IDAgb2JqCjw8IC9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9MZW5ndGggNzIgPj4Kc3RyZWFtCnicMzK3UDBQsDQBEoYWJgrmZgYKKYZcQL6piblCLhdIDMTKAbMMgLQlnIKIZ4CYIG0QxSAWRLGZiRlEHZwBkcvgSgMAJdsWyQplbmRzdHJlYW0KZW5kb2JqCjI5IDAgb2JqCjw8IC9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9MZW5
ndGggNDcgPj4Kc3RyZWFtCnicMzK3UDBQsDQBEoYWJgrmZgYKKYZclhBWLhdMLAfMAtGWcAoinsGVBgC5Zw0nCmVuZHN0cmVhbQplbmRvYmoKMzAgMCBvYmoKPDwgL0JCb3ggWyAtMTAyMSAtNDYzIDE3OTQgMTIzMyBdIC9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9MZW5ndGggMzkKL1N1YnR5cGUgL0Zvcm0gL1R5cGUgL1hPYmplY3QgPj4Kc3RyZWFtCnic4zI0MFMwNjVVyOUyNzYCs3LALCNzIyALJItgQWQzuNIAFfMKfAplbmRzdHJlYW0KZW5kb2JqCjMxIDAgb2JqCjw8IC9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9MZW5ndGggMTYzID4+CnN0cmVhbQp4nEWQOxIDIQxDe06hI/gjAz7PZjIpNvdvY9hsUsDTWCCDuxOC1NqCieiCh7Yl3QXvrQRnY/zpNm41EuQEdYBWpONolFJ9ucVplXTxaDZzKwutEx1mDnqUoxmgEDoV3u2i5HKm7s75Q3D1X/W/Yt05m4mBycodCM3qU9z5NjuiurrJ/qTH3KzXfivsVWFpWUvLCbedu2ZACdxTOdqrPT8fCjr2CmVuZHN0cmVhbQplbmRvYmoKMzIgMCBvYmoKPDwgL0ZpbHRlciAvRmxhdGVEZWNvZGUgL0xlbmd0aCAyMTggPj4Kc3RyZWFtCnicPVC5jQQxDMtdhRpYwHrtqWcWi0um//RI+fYi0RZFUio1mZIpL3WUJVlT3jp8lsQOeYblbmQ2JSpFL5OwJffQCvF9ieYU993VlrNDNJdoOX4LMyqqGx3TSzaacCoTuqDcwzP6DW10A1aHHrFbINCkYNe2IHLHDxgMwZkTiyIMSk0G/65yj59eixs+w/FDFJGSDuY1/1j98nMNr1OPJ5Fub77iXpypDgMRHJKavCNdWLEuEhFpNUFNz8BaLYC7t17+G7QjugxA9onEcZpSjqG/a3Clzy/lJ1PYCmVuZHN0cmVhbQplbmRvYmoKMzMgMCBvYmoKPDwgL0ZpbHRlciAvRmxhdGVEZWNvZGUgL0xlbmd0aCA4MyA+PgpzdHJlYW0KeJxFjLsNwDAIRHumYAR+JvY+UZTC3r8NECVuuCfdPVwdCZkpbjPDQwaeDCyGXXGB9JYwC1xHUI6d7KNh1b7qBI31plLz7w+Unuys4obrAQJCGmYKZW5kc3RyZWFtCmVuZG9iagozNCAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDUxID4+CnN0cmVhbQp4nDM2tFAwUDA0MAeSRoZAlpGJQoohF0gAxMzlggnmgFkGQBqiOAeuJocrgysNAOG0DZgKZW5kc3RyZWFtCmVuZG9iagozNSAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDE2MCA+PgpzdHJlYW0KeJxFkDkSAzEIBHO9gidIXIL3rMu1wfr/qQfWR6LpAjQcuhZNynoUaD7psUahutBr6CxKkkTBFpIdUKdjiDsoSExIY5JIth6DI5pYs12YmVQqs1LhtGnFwr/ZWtXIRI1wjfyJ6QZU/E/qXJTwTYOvkjH6GFS8O4OMSfheRdxaMe3+RDCxGfYJb0UmBYSJsanZvs9ghsz3Ctc4x/MNTII36wplbmRzdHJlYW0KZW5kb2JqCjM2IDAgb2JqCjw8IC9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9MZW5ndGggMzM0ID4+CnN0cmVhbQp4nC1SS3LFIAzbcwpdoDP4B+Q86XS6eL3/tpKTRUYOYPQx5YaJSnxZILej1sS3jcxAheGvq8yFz0jbyDqIy5CLuJIthXtELOQxxDzEgu+r8R4e+azMybMHxi/Zdw8r9tSEZSHjxRnaYRXHYRXkWLB1Iap7eFOkw6kk2OOL/z7Fcy0ELXxG0IBf5J+vjuD5khZp95ht0656sEw
7qqSwHGxPc14mX1pnuToezwfJ9q7YEVK7AhSFuTPOc+Eo01ZGtBZ2NkhqXGxvjv1YStCFblxGiiOQn6kiPKCkycwmCuKPnB5yKgNh6pqudHIbVXGnnsw1m4u3M0lm675IsZnCeV04s/4MU2a1eSfPcqLUqQjvsWdL0NA5rp69lllodJsTvKSEz8ZOT06+VzPrITkVCaliWlfBaRSZYgnbEl9TUVOaehn++/Lu8Tt+/gEsc3xzCmVuZHN0cmVhbQplbmRvYmoKMzcgMCBvYmoKPDwgL0ZpbHRlciAvRmxhdGVEZWNvZGUgL0xlbmd0aCAzMjAgPj4Kc3RyZWFtCnicNVJLbgUxCNvPKbhApfBPzvOqqou++29rE70VTDBg4ykvWdJLvtQl26XD5Fsf9yWxQt6P7ZrMUsX3FrMUzy2vR88Rty0KBFETPViZLxUi1M/06DqocEqfgVcItxQbvINJAINq+AcepTMgUOdAxrtiMlIDgiTYc2lxCIlyJol/pLye3yetpKH0PVmZy9+TS6XQHU1O6AHFysVJoF1J+aCZmEpEkpfrfbFC9IbAkjw+RzHJgOw2iW2iBSbnHqUlzMQUOrDHArxmmtVV6GDCHocpjFcLs6gebPJbE5WkHa3jGdkw3sswU2Kh4bAF1OZiZYLu5eM1r8KI7VGTXcNw7pbNdwjRaP4bFsrgYxWSgEensRINaTjAiMCeXjjFXvMTOQ7AiGOdmiwMY2gmp3qOicDQnrOlYcbHHlr18w9U6XyHCmVuZHN0cmVhbQplbmRvYmoKMzggMCBvYmoKPDwgL0ZpbHRlciAvRmxhdGVEZWNvZGUgL0xlbmd0aCAxOCA+PgpzdHJlYW0KeJwzNrRQMIDDFEOuNAAd5gNSCmVuZHN0cmVhbQplbmRvYmoKMzkgMCBvYmoKPDwgL0ZpbHRlciAvRmxhdGVEZWNvZGUgL0xlbmd0aCAxMzMgPj4Kc3RyZWFtCnicRY9LDgQhCET3nKKOwMcf53Ey6YVz/+2AnW4TYz2FVIG5gqE9LmsDnRUfIRm28beplo5FWT5UelJWD8ngh6zGyyHcoCzwgkkqhiFQi5gakS1lbreA2zYNsrKVU6WOsIujMI/2tGwVHl+iWyJ1kj+DxCov3OO6Hcil1rveoou+f6QBMQkKZW5kc3RyZWFtCmVuZG9iago0MCAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDM0MCA+PgpzdHJlYW0KeJw1UjluBDEM6/0KfSCAbtvv2SBIkfy/DanZFANxdFKUO1pUdsuHhVS17HT5tJXaEjfkd2WFxAnJqxLtUoZIqLxWIdXvmTKvtzVnBMhSpcLkpORxyYI/w6WnC8f5trGv5cgdjx5YFSOhRMAyxcToGpbO7rBmW36WacCPeIScK9Ytx1gFUhvdOO2K96F5LbIGiL2ZlooKHVaJFn5B8aBHjX32GFRYINHtHElwjIlQkYB2gdpIDDl7LHZRH/QzKDET6NobRdxBgSWSmDnFunT03/jQsaD+2Iw3vzoq6VtaWWPSPhvtlMYsMul6WPR089bHgws076L859UMEjRljZLGB63aOYaimVFWeLdDkw3NMcch8w6ewxkJSvo8FL+PJRMdlMjfDg2hf18eo4ycNt4C5qI/bRUHDuKzw165gRVKF2uS9wGpTOiB6f+v8bW+19cfHe2AxgplbmRzdHJlYW0KZW5kb2JqCjQxIDAgb2JqCjw8IC9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9MZW5ndGggMjUxID4+CnN0cmVhbQp4nC1RSXIDQQi7zyv0hGan32OXK4fk/9cIygcGDYtAdFrioIyfICxXvOWRq2jD3zMxgt8Fh34r121Y5EBUIEljUDWhdvF69B7YcZgJzJPWsAxmrA/8jCnc6MXhMRlnt9dl1BDsXa89mUHJrFzEJRMXTNVhI2cOP5kyLrRzPTcg50ZYl2GQblYaMxKONIVIIYW
qm6TOBEESjK5GjTZyFPulL490hlWNqDHscy1tX89NOGvQ7Fis8uSUHl1xLicXL6wc9PU2AxdRaazyQEjA/W4P9XOyk994S+fOFtPje83J8sJUYMWb125ANtXi37yI4/uMr+fn+fwDX2BbiAplbmRzdHJlYW0KZW5kb2JqCjQyIDAgb2JqCjw8IC9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9MZW5ndGggMTc0ID4+CnN0cmVhbQp4nE2QSQ5DIQxD95zCF6iEM8DnPL+qumjvv61DB3WB/OQgcDw80HEkLnRk6IyOK5sc48CzIGPi0Tj/ybg+xDFB3aItWJd2x9nMEnPCMjECtkbJ2TyiwA/HXAgSZJcfvsAgIl2P+VbzWZP0z7c73Y+6tGZfPaLAiewIxbABV4D9useBS8L5XtPklyolYxOH8oHqIlI2O6EQtVTscqqKs92bK3AV9PzRQ+7tBbUjPN8KZW5kc3RyZWFtCmVuZG9iago0MyAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDc1ID4+CnN0cmVhbQp4nDO1NFIwUDA2ABKmZkYKpibmCimGXEA+iJXLZWhkCmblcBlZmilYWAAZJmbmUCGYhhwuY1NzoAFARcamYBqqP4crgysNAJWQEu8KZW5kc3RyZWFtCmVuZG9iago0NCAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDE0MSA+PgpzdHJlYW0KeJw9j8EOwzAIQ+/5Cv9ApNgpoXxPp2qH7v+vI0u7C3oCY4yF0NAbqprDhmCb48XSJVRr+BTFQCU3yJlgDqWk0h1HkXpiOBhcHrQbjuKx6PoRu5JmfdDGQrolaIB7rFNp3KZxE8QdNQXqKeqco7wQuZ+pZ9g0kt00s5JzuA2/e89T1/+nq7zL+QW9dy7+CmVuZHN0cmVhbQplbmRvYmoKNDUgMCBvYmoKPDwgL0ZpbHRlciAvRmxhdGVEZWNvZGUgL0xlbmd0aCAyMTUgPj4Kc3RyZWFtCnicNVE5DgMhDOz3Ff5AJIwveE+iKM3+v82M0VYewVyGtJQhmfJSk6gh5VM+epkunLrc18xqNOeWtC1zgLi2vC+tksCJZoiDwWmYuAGaPAFD19GoUUMXHtDUpVMosNwEPoq3bg/dY7WBl7Yh54kgYigZLEHNqUUTFm3PJ6Q1v16LG96X7d3IU6XGlhiBBgFWOBzX6NfwlT1PJtF0FTLUqzXLGAkTRSI8+Y6m1RPrWjTSMhLUxhGsagO8O/0wTgAAE3HLAmSfSpSz5MRvsfSzBlf6/gGfR1SWCmVuZHN0cmVhbQplbmRvYmoKMTUgMCBvYmoKPDwgL0Jhc2VGb250IC9EZWphVnVTYW5zIC9DaGFyUHJvY3MgMTYgMCBSCi9FbmNvZGluZyA8PAovRGlmZmVyZW5jZXMgWyAzMiAvc3BhY2UgNDYgL3BlcmlvZCA0OCAvemVybyAvb25lIC90d28gL3RocmVlIC9mb3VyIC9maXZlIC9zaXggNTYKL2VpZ2h0IDY1IC9BIDY4IC9EIDc2IC9MIDk3IC9hIC9iIC9jIC9kIC9lIDEwNSAvaSAxMDggL2wgMTEwIC9uIC9vIDExNCAvcgovcyAvdCAvdSAvdiAxMjEgL3kgXQovVHlwZSAvRW5jb2RpbmcgPj4KL0ZpcnN0Q2hhciAwIC9Gb250QkJveCBbIC0xMDIxIC00NjMgMTc5NCAxMjMzIF0gL0ZvbnREZXNjcmlwdG9yIDE0IDAgUgovRm9udE1hdHJpeCBbIDAuMDAxIDAgMCAwLjAwMSAwIDAgXSAvTGFzdENoYXIgMjU1IC9OYW1lIC9EZWphVnVTYW5zCi9TdWJ0eXBlIC9UeXBlMyAvVHlwZSAvRm9udCAvV2lkdGhzIDEzIDAgUiA+PgplbmRvYmoKMTQgMCBvYmoKPDwgL0FzY2VudCA5MjkgL0N
hcEhlaWdodCAwIC9EZXNjZW50IC0yMzYgL0ZsYWdzIDMyCi9Gb250QkJveCBbIC0xMDIxIC00NjMgMTc5NCAxMjMzIF0gL0ZvbnROYW1lIC9EZWphVnVTYW5zIC9JdGFsaWNBbmdsZSAwCi9NYXhXaWR0aCAxMzQyIC9TdGVtViAwIC9UeXBlIC9Gb250RGVzY3JpcHRvciAvWEhlaWdodCAwID4+CmVuZG9iagoxMyAwIG9iagpbIDYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwCjYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwIDYwMCA2MDAgMzE4IDQwMSA0NjAgODM4IDYzNgo5NTAgNzgwIDI3NSAzOTAgMzkwIDUwMCA4MzggMzE4IDM2MSAzMTggMzM3IDYzNiA2MzYgNjM2IDYzNiA2MzYgNjM2IDYzNiA2MzYKNjM2IDYzNiAzMzcgMzM3IDgzOCA4MzggODM4IDUzMSAxMDAwIDY4NCA2ODYgNjk4IDc3MCA2MzIgNTc1IDc3NSA3NTIgMjk1CjI5NSA2NTYgNTU3IDg2MyA3NDggNzg3IDYwMyA3ODcgNjk1IDYzNSA2MTEgNzMyIDY4NCA5ODkgNjg1IDYxMSA2ODUgMzkwIDMzNwozOTAgODM4IDUwMCA1MDAgNjEzIDYzNSA1NTAgNjM1IDYxNSAzNTIgNjM1IDYzNCAyNzggMjc4IDU3OSAyNzggOTc0IDYzNCA2MTIKNjM1IDYzNSA0MTEgNTIxIDM5MiA2MzQgNTkyIDgxOCA1OTIgNTkyIDUyNSA2MzYgMzM3IDYzNiA4MzggNjAwIDYzNiA2MDAgMzE4CjM1MiA1MTggMTAwMCA1MDAgNTAwIDUwMCAxMzQyIDYzNSA0MDAgMTA3MCA2MDAgNjg1IDYwMCA2MDAgMzE4IDMxOCA1MTggNTE4CjU5MCA1MDAgMTAwMCA1MDAgMTAwMCA1MjEgNDAwIDEwMjMgNjAwIDUyNSA2MTEgMzE4IDQwMSA2MzYgNjM2IDYzNiA2MzYgMzM3CjUwMCA1MDAgMTAwMCA0NzEgNjEyIDgzOCAzNjEgMTAwMCA1MDAgNTAwIDgzOCA0MDEgNDAxIDUwMCA2MzYgNjM2IDMxOCA1MDAKNDAxIDQ3MSA2MTIgOTY5IDk2OSA5NjkgNTMxIDY4NCA2ODQgNjg0IDY4NCA2ODQgNjg0IDk3NCA2OTggNjMyIDYzMiA2MzIgNjMyCjI5NSAyOTUgMjk1IDI5NSA3NzUgNzQ4IDc4NyA3ODcgNzg3IDc4NyA3ODcgODM4IDc4NyA3MzIgNzMyIDczMiA3MzIgNjExIDYwNQo2MzAgNjEzIDYxMyA2MTMgNjEzIDYxMyA2MTMgOTgyIDU1MCA2MTUgNjE1IDYxNSA2MTUgMjc4IDI3OCAyNzggMjc4IDYxMiA2MzQKNjEyIDYxMiA2MTIgNjEyIDYxMiA4MzggNjEyIDYzNCA2MzQgNjM0IDYzNCA1OTIgNjM1IDU5MiBdCmVuZG9iagoxNiAwIG9iago8PCAvQSAxNyAwIFIgL0QgMTggMCBSIC9MIDE5IDAgUiAvYSAyMCAwIFIgL2IgMjEgMCBSIC9jIDIyIDAgUiAvZCAyMyAwIFIKL2UgMjQgMCBSIC9laWdodCAyNSAwIFIgL2ZpdmUgMjYgMCBSIC9mb3VyIDI3IDAgUiAvaSAyOCAwIFIgL2wgMjkgMCBSCi9uIDMxIDAgUiAvbyAzMiAwIFIgL29uZSAzMyAwIFIgL3BlcmlvZCAzNCAwIFIgL3IgMzUgMCBSIC9zIDM2IDAgUgovc2l4IDM3IDAgUiAvc3BhY2UgMzggMCBSIC90IDM5IDAgUiAvdGhyZWUgNDAgMCBSIC90d28
gNDEgMCBSIC91IDQyIDAgUgovdiA0MyAwIFIgL3kgNDQgMCBSIC96ZXJvIDQ1IDAgUiA+PgplbmRvYmoKMyAwIG9iago8PCAvRjEgMTUgMCBSID4+CmVuZG9iago0IDAgb2JqCjw8IC9BMSA8PCAvQ0EgMCAvVHlwZSAvRXh0R1N0YXRlIC9jYSAxID4+Ci9BMiA8PCAvQ0EgMSAvVHlwZSAvRXh0R1N0YXRlIC9jYSAxID4+Ci9BMyA8PCAvQ0EgMSAvVHlwZSAvRXh0R1N0YXRlIC9jYSAwLjUgPj4gPj4KZW5kb2JqCjUgMCBvYmoKPDwgPj4KZW5kb2JqCjYgMCBvYmoKPDwgPj4KZW5kb2JqCjcgMCBvYmoKPDwgL0YxLURlamFWdVNhbnMtbWludXMgMzAgMCBSID4+CmVuZG9iagoyIDAgb2JqCjw8IC9Db3VudCAxIC9LaWRzIFsgMTEgMCBSIF0gL1R5cGUgL1BhZ2VzID4+CmVuZG9iago0NiAwIG9iago8PCAvQ3JlYXRpb25EYXRlIChEOjIwMjExMjA0MTY1NTEyKzAyJzAwJykKL0NyZWF0b3IgKE1hdHBsb3RsaWIgdjMuNC4zLCBodHRwczovL21hdHBsb3RsaWIub3JnKQovUHJvZHVjZXIgKE1hdHBsb3RsaWIgcGRmIGJhY2tlbmQgdjMuNC4zKSA+PgplbmRvYmoKeHJlZgowIDQ3CjAwMDAwMDAwMDAgNjU1MzUgZiAKMDAwMDAwMDAxNiAwMDAwMCBuIAowMDAwMDIyMzcwIDAwMDAwIG4gCjAwMDAwMjIxMDcgMDAwMDAgbiAKMDAwMDAyMjEzOSAwMDAwMCBuIAowMDAwMDIyMjc5IDAwMDAwIG4gCjAwMDAwMjIzMDAgMDAwMDAgbiAKMDAwMDAyMjMyMSAwMDAwMCBuIAowMDAwMDAwMDY1IDAwMDAwIG4gCjAwMDAwMDAzOTkgMDAwMDAgbiAKMDAwMDAxMjcyOCAwMDAwMCBuIAowMDAwMDAwMjA4IDAwMDAwIG4gCjAwMDAwMTI3MDYgMDAwMDAgbiAKMDAwMDAyMDcyMCAwMDAwMCBuIAowMDAwMDIwNTIwIDAwMDAwIG4gCjAwMDAwMjAwNjcgMDAwMDAgbiAKMDAwMDAyMTc3MyAwMDAwMCBuIAowMDAwMDEyNzQ4IDAwMDAwIG4gCjAwMDAwMTI5MTEgMDAwMDAgbiAKMDAwMDAxMzE0OCAwMDAwMCBuIAowMDAwMDEzMjgxIDAwMDAwIG4gCjAwMDAwMTM2NjEgMDAwMDAgbiAKMDAwMDAxMzk3OCAwMDAwMCBuIAowMDAwMDE0MjgzIDAwMDAwIG4gCjAwMDAwMTQ1ODcgMDAwMDAgbiAKMDAwMDAxNDkwOSAwMDAwMCBuIAowMDAwMDE1Mzc3IDAwMDAwIG4gCjAwMDAwMTU2OTkgMDAwMDAgbiAKMDAwMDAxNTg2NSAwMDAwMCBuIAowMDAwMDE2MDA5IDAwMDAwIG4gCjAwMDAwMTYxMjggMDAwMDAgbiAKMDAwMDAxNjMwMCAwMDAwMCBuIAowMDAwMDE2NTM2IDAwMDAwIG4gCjAwMDAwMTY4MjcgMDAwMDAgbiAKMDAwMDAxNjk4MiAwMDAwMCBuIAowMDAwMDE3MTA1IDAwMDAwIG4gCjAwMDAwMTczMzggMDAwMDAgbiAKMDAwMDAxNzc0NSAwMDAwMCBuIAowMDAwMDE4MTM4IDAwMDAwIG4gCjAwMDAwMTgyMjggMDAwMDAgbiAKMDAwMDAxODQzNCAwMDAwMCBuIAowMDAwMDE4ODQ3IDAwMDAwIG4gCjAwMDAwMTkxNzEgMDAwMDAgbiAKMDAwMDAxOTQxOCAwMDAwMCBuIAowMDAwMDE5NTY1IDAwMDAwIG4gCjAwMDAwMTk3NzkgMDAwMDAgbiAKMDAwMDAyMjQzMCAwMDAwMCBuIAp0cmFpbGVyCjw
8IC9JbmZvIDQ2IDAgUiAvUm9vdCAxIDAgUiAvU2l6ZSA0NyA+PgpzdGFydHhyZWYKMjI1ODcKJSVFT0YK\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-12-04T16:55:12.112890\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}, {"name": "stdout", "output_type": "stream", "text": ["Layer 0 - Variance: 0.0768686905503273\n", "Layer 2 - Variance: 0.00374085595831275\n", "Layer 4 - Variance: 0.00021300435764715075\n", "Layer 6 - Variance: 0.000116668117698282\n", "Layer 8 - Variance: 8.082647400442511e-05\n"]}], "source": ["def var_init(model, std=0.01):\n", " for name, param in model.named_parameters():\n", " param.data.normal_(mean=0.0, std=std)\n", "\n", "\n", "var_init(model, std=0.01)\n", "visualize_activations(model, print_variance=True)"]}, {"cell_type": "markdown", "id": "7c95cf24", "metadata": {"papermill": {"duration": 0.163132, "end_time": "2021-12-04T15:55:13.391937", "exception": false, "start_time": "2021-12-04T15:55:13.228805", "status": "completed"}, "tags": []}, "source": ["The variance of the activation becomes smaller and smaller across layers, and almost vanishes in the last layer.\n", "Alternatively, we could use a higher standard deviation:"]}, {"cell_type": "code", "execution_count": 15, "id": "c6819982", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:55:13.709227Z", "iopub.status.busy": "2021-12-04T15:55:13.708760Z", "iopub.status.idle": "2021-12-04T15:55:21.442388Z", "shell.execute_reply": "2021-12-04T15:55:21.442802Z"}, "papermill": {"duration": 7.894595, "end_time": "2021-12-04T15:55:21.442993", "exception": false, "start_time": "2021-12-04T15:55:13.548398", "status": "completed"}, "tags": []}, "outputs": [{"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-12-04T16:55:20.476417\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}, {"name": "stdout", "output_type": "stream", "text": ["Layer 0 - Variance: 8.08608341217041\n", "Layer 2 - Variance: 41.400367736816406\n", "Layer 4 - Variance: 104.29255676269531\n", "Layer 6 - Variance: 270.63995361328125\n", "Layer 8 - Variance: 288.26495361328125\n"]}], "source": ["var_init(model, std=0.1)\n", "visualize_activations(model, print_variance=True)"]}, {"cell_type": "markdown", "id": "4e4a9097", "metadata": {"papermill": {"duration": 0.165816, "end_time": "2021-12-04T15:55:21.775202", "exception": false, "start_time": "2021-12-04T15:55:21.609386", "status": "completed"}, "tags": []}, "source": ["With a higher standard deviation, the activations are likely to explode.\n", "You can play around with the specific standard deviation values, but it will be hard to find one that gives us a good activation distribution across layers, and any value we find would be very specific to our model.\n", "If we changed the hidden sizes or number of layers, we would have\n", "to search all over again, which is neither efficient nor recommended."]}, {"cell_type": "markdown", "id": "b785fdfc", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.165929, "end_time": "2021-12-04T15:55:22.105283", "exception": false, "start_time": "2021-12-04T15:55:21.939354", "status": "completed"}, "tags": []}, "source": ["### How to find appropriate initialization values\n", "\n", "From our experiments above, we have seen that we need to sample the weights from a distribution, but are not sure which one exactly.\n", "As a next step, we will try to find the optimal initialization from the perspective of the activation distribution.\n", "For this, we state two requirements:\n", "\n", "1. The mean of the activations should be zero\n", "2. 
The variance of the activations should stay the same across every layer\n", "\n", "Suppose we want to design an initialization for the following layer: $y=Wx+b$ with $y\\in\\mathbb{R}^{d_y}$, $x\\in\\mathbb{R}^{d_x}$.\n", "Our goal is that the variance of each element of $y$ is the same as the input, i.e. $\\text{Var}(y_i)=\\text{Var}(x_i)=\\sigma_x^{2}$, and that the mean is zero.\n", "We assume $x$ to also have a mean of zero, because, in deep neural networks, $y$ would be the input of another layer.\n", "This requires the bias and weight to have an expectation of 0.\n", "Actually, as $b$ is a single element per output neuron and is constant across different inputs, we set it to 0 overall.\n", "\n", "Next, we need to calculate the variance with which we need to initialize the weight parameters.\n", "Along the calculation, we will need the following variance rule: given two independent random variables, the variance of their product is $\\text{Var}(X\\cdot Y) = \\mathbb{E}(Y)^2\\text{Var}(X) + \\mathbb{E}(X)^2\\text{Var}(Y) + \\text{Var}(X)\\text{Var}(Y) = \\mathbb{E}(Y^2)\\mathbb{E}(X^2)-\\mathbb{E}(Y)^2\\mathbb{E}(X)^2$ ($X$ and $Y$ do not refer to $x$ and $y$, but to any random variable).\n", "\n", "The needed variance of the weights, $\\text{Var}(w_{ij})$, is calculated as follows:\n", "\n", "$$\n", "\\begin{split}\n", " y_i & = \\sum_{j} w_{ij}x_{j}\\hspace{10mm}\\text{Calculation of a single output neuron without bias}\\\\\n", " \\text{Var}(y_i) = \\sigma_x^{2} & = \\text{Var}\\left(\\sum_{j} w_{ij}x_{j}\\right)\\\\\n", " & = \\sum_{j} \\text{Var}(w_{ij}x_{j}) \\hspace{10mm}\\text{Inputs and weights are independent of each other}\\\\\n", " & = \\sum_{j} \\text{Var}(w_{ij})\\cdot\\text{Var}(x_{j}) \\hspace{10mm}\\text{Variance rule (see above) with expectations being zero}\\\\\n", " & = d_x \\cdot \\text{Var}(w_{ij})\\cdot\\text{Var}(x_{j}) \\hspace{10mm}\\text{Variance equal for all $d_x$ elements}\\\\\n", " & = \\sigma_x^{2} \\cdot d_x \\cdot 
\\text{Var}(w_{ij})\\\\\n", " \\Rightarrow \\text{Var}(w_{ij}) = \\sigma_{W}^2 & = \\frac{1}{d_x}\\\\\n", "\\end{split}\n", "$$\n", "\n", "Thus, we should initialize the weight distribution with a variance of the inverse of the input dimension $d_x$.\n", "Let's implement it below and check whether this holds:"]}, {"cell_type": "code", "execution_count": 16, "id": "85fe111a", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:55:22.441463Z", "iopub.status.busy": "2021-12-04T15:55:22.440990Z", "iopub.status.idle": "2021-12-04T15:55:35.037471Z", "shell.execute_reply": "2021-12-04T15:55:35.037861Z"}, "papermill": {"duration": 12.767059, "end_time": "2021-12-04T15:55:35.038029", "exception": false, "start_time": "2021-12-04T15:55:22.270970", "status": "completed"}, "tags": []}, "outputs": [{"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-12-04T16:55:26.361643\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-12-04T16:55:34.092028\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}, {"name": "stdout", "output_type": "stream", "text": ["Layer 0 - Variance: 1.0374585390090942\n", "Layer 2 - Variance: 1.0698715448379517\n", "Layer 4 - Variance: 1.1412183046340942\n", "Layer 6 - Variance: 1.0962424278259277\n", "Layer 8 - Variance: 1.0699418783187866\n"]}], "source": ["def equal_var_init(model):\n", " for name, param in model.named_parameters():\n", " if name.endswith(\".bias\"):\n", " param.data.fill_(0)\n", " else:\n", " param.data.normal_(std=1.0 / math.sqrt(param.shape[1]))\n", "\n", "\n", "equal_var_init(model)\n", "visualize_weight_distribution(model)\n", "visualize_activations(model, print_variance=True)"]}, {"cell_type": "markdown", "id": "ca9c629c", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.183436, "end_time": "2021-12-04T15:55:35.408994", "exception": false, "start_time": "2021-12-04T15:55:35.225558", "status": "completed"}, "tags": []}, "source": ["As we expected, the variance stays indeed constant across layers.\n", "Note that our initialization does not restrict us to a normal distribution, but allows any other distribution with a mean of 0 and variance of $1/d_x$.\n", "You often see that a uniform distribution is used for initialization.\n", "A small benefit of using a uniform instead of a normal distribution is that we can exclude the chance of initializing very large or small weights.\n", "\n", "Besides the variance of the activations, another variance we would like to stabilize is the one of the gradients.\n", "This ensures a stable optimization for deep networks.\n", "It turns out that we can do the same calculation as above starting from $\\Delta x=W\\Delta y$, and come to the conclusion that we should initialize our layers with $1/d_y$ where $d_y$ is the number of output neurons.\n", "You can do the calculation as a practice, or check a thorough explanation in [this blog post](https://pouannes.github.io/blog/initialization).\n", "As a compromise 
between both constraints, [Glorot and Bengio (2010)](http://proceedings.mlr.press/v9/glorot10a/glorot10a.pdf?hc_location=ufi) proposed to use the harmonic mean of both values.\n", "This leads us to the well-known Xavier initialization:\n", "\n", "$$W\\sim \\mathcal{N}\\left(0,\\frac{2}{d_x+d_y}\\right)$$\n", "\n", "If we use a uniform distribution, we would initialize the weights with:\n", "\n", "$$W\\sim U\\left[-\\frac{\\sqrt{6}}{\\sqrt{d_x+d_y}}, \\frac{\\sqrt{6}}{\\sqrt{d_x+d_y}}\\right]$$\n", "\n", "Let's shortly implement it and validate its effectiveness:"]}, {"cell_type": "code", "execution_count": 17, "id": "886f5024", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:55:35.773825Z", "iopub.status.busy": "2021-12-04T15:55:35.773355Z", "iopub.status.idle": "2021-12-04T15:55:48.170979Z", "shell.execute_reply": "2021-12-04T15:55:48.170552Z"}, "papermill": {"duration": 12.581276, "end_time": "2021-12-04T15:55:48.171111", "exception": false, "start_time": "2021-12-04T15:55:35.589835", "status": "completed"}, "tags": []}, "outputs": [{"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-12-04T16:55:39.652330\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}, {"name": "stdout", "output_type": "stream", "text": ["layers.0.weight - Variance: 0.000457785528851673\n", "layers.2.weight - Variance: 0.0006751694600097835\n", "layers.4.weight - Variance: 0.0008508111932314932\n", "layers.6.weight - Variance: 0.001484374050050974\n", "layers.8.weight - Variance: 0.011529149487614632\n"]}, {"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-12-04T16:55:47.230788\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}, {"name": "stdout", "output_type": "stream", "text": ["Layer 0 - Variance: 1.1692266464233398\n", "Layer 2 - Variance: 1.520001769065857\n", "Layer 4 - Variance: 1.585775375366211\n", "Layer 6 - Variance: 1.9146416187286377\n", "Layer 8 - Variance: 3.2868599891662598\n"]}], "source": ["def xavier_init(model):\n", " for name, param in model.named_parameters():\n", " if name.endswith(\".bias\"):\n", " param.data.fill_(0)\n", " else:\n", " bound = math.sqrt(6) / math.sqrt(param.shape[0] + param.shape[1])\n", " param.data.uniform_(-bound, bound)\n", "\n", "\n", "xavier_init(model)\n", "visualize_gradients(model, print_variance=True)\n", "visualize_activations(model, print_variance=True)"]}, {"cell_type": "markdown", "id": "920b63e6", "metadata": {"papermill": {"duration": 0.203664, "end_time": "2021-12-04T15:55:48.573926", "exception": false, "start_time": "2021-12-04T15:55:48.370262", "status": "completed"}, "tags": []}, "source": ["We see that the Xavier initialization balances the variance of gradients and activations.\n", "Note that the significantly higher variance for the output layer is due to the large difference of input and output dimension ($128$ vs $10$).\n", "However, we currently assumed the activation function to be linear.\n", "So what happens if we add a non-linearity?\n", "In a tanh-based network, a common assumption is that for small values during the initial steps in training, the $\\tanh$ works as a linear function such that we don't have to adjust our calculation.\n", "We can check if that is the case for us as well:"]}, {"cell_type": "code", "execution_count": 18, "id": "dff6e720", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:55:48.968877Z", "iopub.status.busy": "2021-12-04T15:55:48.968403Z", "iopub.status.idle": "2021-12-04T15:56:01.734151Z", "shell.execute_reply": "2021-12-04T15:56:01.733706Z"}, "papermill": {"duration": 12.965651, "end_time": "2021-12-04T15:56:01.734278", 
"exception": false, "start_time": "2021-12-04T15:55:48.768627", "status": "completed"}, "tags": []}, "outputs": [{"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-12-04T16:55:53.100667\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}, {"name": "stdout", "output_type": "stream", "text": ["layers.0.weight - Variance: 2.4351327738258988e-05\n", "layers.2.weight - Variance: 3.7693978811148554e-05\n", "layers.4.weight - Variance: 5.152593075763434e-05\n", "layers.6.weight - Variance: 6.856555410195142e-05\n", "layers.8.weight - Variance: 0.0004877124447375536\n"]}, {"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-12-04T16:56:00.772458\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}, {"name": "stdout", "output_type": "stream", "text": ["Layer 0 - Variance: 1.2570290565490723\n", "Layer 2 - Variance: 0.5786585807800293\n", "Layer 4 - Variance: 0.2740468978881836\n", "Layer 6 - Variance: 0.2201044261455536\n", "Layer 8 - Variance: 0.3423171937465668\n"]}], "source": ["model = BaseNetwork(act_fn=nn.Tanh()).to(device)\n", "xavier_init(model)\n", "visualize_gradients(model, print_variance=True)\n", "visualize_activations(model, print_variance=True)"]}, {"cell_type": "markdown", "id": "3609de04", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.215252, "end_time": "2021-12-04T15:56:02.163103", "exception": false, "start_time": "2021-12-04T15:56:01.947851", "status": "completed"}, "tags": []}, "source": ["Although the variance decreases over depth, it is apparent that the activation distribution becomes more focused on the low values.\n", "Therefore, our variance will stabilize around 0.25 if we went even deeper.\n", "Hence, we can conclude that the Xavier initialization works well for Tanh networks.\n", "But what about ReLU networks?\n", "Here, we can no longer rely on the previous assumption that the non-linearity is approximately linear for small values.\n", "The ReLU activation function sets (in expectation) half of the inputs to 0, so the expectation of the input is no longer zero.\n", "However, as long as the expectation of $W$ is zero and $b=0$, the expectation of the output is zero.\n", "The part where the calculation of the ReLU initialization differs from the identity is when determining $\\text{Var}(w_{ij}x_{j})$:\n", "\n", "$$\\text{Var}(w_{ij}x_{j})=\\underbrace{\\mathbb{E}[w_{ij}^2]}_{=\\text{Var}(w_{ij})}\\mathbb{E}[x_{j}^2]-\\underbrace{\\mathbb{E}[w_{ij}]^2}_{=0}\\mathbb{E}[x_{j}]^2=\\text{Var}(w_{ij})\\mathbb{E}[x_{j}^2]$$\n", "\n", "If we assume now that $x$ is the output of a ReLU activation (from a previous layer, $x=\\max(0,\\tilde{y})$), we can calculate the expectation as 
follows:\n", "\n", "\n", "$$\n", "\\begin{split}\n", " \\mathbb{E}[x^2] & =\\mathbb{E}[\\max(0,\\tilde{y})^2]\\\\\n", " & =\\frac{1}{2}\\mathbb{E}[{\\tilde{y}}^2]\\hspace{2cm}\\tilde{y}\\text{ is zero-centered and symmetric}\\\\\n", " & =\\frac{1}{2}\\text{Var}(\\tilde{y})\n", "\\end{split}$$\n", "\n", "Thus, we see that we have an additional factor of 1/2 in the equation, so that our desired weight variance becomes $2/d_x$.\n", "This gives us the Kaiming initialization (see [He, K. et al.\n", "(2015)](https://arxiv.org/pdf/1502.01852.pdf)).\n", "Note that the Kaiming initialization does not use the harmonic mean between input and output size.\n", "In their paper (Section 2.2, Backward Propagation, last paragraph), they argue that using $d_x$ or $d_y$ both lead to stable gradients throughout the network, and only depend on the overall input and output size of the network.\n", "Hence, we can use here only the input $d_x$:"]}, {"cell_type": "code", "execution_count": 19, "id": "d4b7f43f", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:56:02.594108Z", "iopub.status.busy": "2021-12-04T15:56:02.593625Z", "iopub.status.idle": "2021-12-04T15:56:15.072435Z", "shell.execute_reply": "2021-12-04T15:56:15.071951Z"}, "papermill": {"duration": 12.695197, "end_time": "2021-12-04T15:56:15.072560", "exception": false, "start_time": "2021-12-04T15:56:02.377363", "status": "completed"}, "tags": []}, "outputs": [{"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-12-04T16:56:06.552473\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}, {"name": "stdout", "output_type": "stream", "text": ["layers.0.weight - Variance: 4.737732888315804e-05\n", "layers.2.weight - Variance: 5.9308793424861506e-05\n", "layers.4.weight - Variance: 7.343693141592667e-05\n", "layers.6.weight - Variance: 0.00016474377480335534\n", "layers.8.weight - Variance: 0.0029673215467482805\n"]}, {"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-12-04T16:56:14.115116\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}, {"name": "stdout", "output_type": "stream", "text": ["Layer 0 - Variance: 1.037200689315796\n", "Layer 2 - Variance: 1.0582876205444336\n", "Layer 4 - Variance: 1.0638010501861572\n", "Layer 6 - Variance: 1.3167966604232788\n", "Layer 8 - Variance: 0.6909096837043762\n"]}], "source": ["def kaiming_init(model):\n", " for name, param in model.named_parameters():\n", " if name.endswith(\".bias\"):\n", " param.data.fill_(0)\n", " elif name.startswith(\"layers.0\"): # The first layer does not have ReLU applied on its input\n", " param.data.normal_(0, 1 / math.sqrt(param.shape[1]))\n", " else:\n", " param.data.normal_(0, math.sqrt(2) / math.sqrt(param.shape[1]))\n", "\n", "\n", "model = BaseNetwork(act_fn=nn.ReLU()).to(device)\n", "kaiming_init(model)\n", "visualize_gradients(model, print_variance=True)\n", "visualize_activations(model, print_variance=True)"]}, {"cell_type": "markdown", "id": "6af2f0ac", "metadata": {"papermill": {"duration": 0.227785, "end_time": "2021-12-04T15:56:15.529106", "exception": false, "start_time": "2021-12-04T15:56:15.301321", "status": "completed"}, "tags": []}, "source": ["The variance stays stable across layers.\n", "We can conclude that the Kaiming initialization indeed works well for ReLU-based networks.\n", "Note that for Leaky-ReLU etc., we have to slightly adjust the factor of $2$ in the variance as half of the values are not set to zero anymore.\n", "PyTorch provides a function to calculate this factor for many activation\n", "functions, see `torch.nn.init.calculate_gain`\n", "([link](https://pytorch.org/docs/stable/nn.init.html#torch.nn.init.calculate_gain))."]}, {"cell_type": "markdown", "id": "0d736eff", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.22843, "end_time": "2021-12-04T15:56:15.988215", "exception": false, "start_time": "2021-12-04T15:56:15.759785", "status": "completed"}, "tags": []}, "source": ["## Optimization\n", "\n", "
\n", "\n", "Besides initialization, selecting a suitable optimization algorithm can be an important choice for deep neural networks.\n", "Before taking a closer look at them, we should define code for training the models.\n", "Most of the following code is copied from the previous tutorial, and only slightly altered to fit our needs."]}, {"cell_type": "code", "execution_count": 20, "id": "b9bfe5e2", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:56:16.464612Z", "iopub.status.busy": "2021-12-04T15:56:16.453313Z", "iopub.status.idle": "2021-12-04T15:56:16.468178Z", "shell.execute_reply": "2021-12-04T15:56:16.467704Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 0.251694, "end_time": "2021-12-04T15:56:16.468294", "exception": false, "start_time": "2021-12-04T15:56:16.216600", "status": "completed"}, "tags": []}, "outputs": [], "source": ["def _get_config_file(model_path, model_name):\n", " return os.path.join(model_path, model_name + \".config\")\n", "\n", "\n", "def _get_model_file(model_path, model_name):\n", " return os.path.join(model_path, model_name + \".tar\")\n", "\n", "\n", "def _get_result_file(model_path, model_name):\n", " return os.path.join(model_path, model_name + \"_results.json\")\n", "\n", "\n", "def load_model(model_path, model_name, net=None):\n", " config_file = _get_config_file(model_path, model_name)\n", " model_file = _get_model_file(model_path, model_name)\n", " assert os.path.isfile(\n", " config_file\n", " ), f'Could not find the config file \"{config_file}\". Are you sure this is the correct path and you have your model config stored here?'\n", " assert os.path.isfile(\n", " model_file\n", " ), f'Could not find the model file \"{model_file}\". 
Are you sure this is the correct path and you have your model stored here?'\n", " with open(config_file) as f:\n", " config_dict = json.load(f)\n", " if net is None:\n", " act_fn_name = config_dict[\"act_fn\"].pop(\"name\").lower()\n", " assert (\n", " act_fn_name in act_fn_by_name\n", " ), f'Unknown activation function \"{act_fn_name}\". Please add it to the \"act_fn_by_name\" dict.'\n", " act_fn = act_fn_by_name[act_fn_name]()\n", " net = BaseNetwork(act_fn=act_fn, **config_dict)\n", " net.load_state_dict(torch.load(model_file))\n", " return net\n", "\n", "\n", "def save_model(model, model_path, model_name):\n", " config_dict = model.config\n", " os.makedirs(model_path, exist_ok=True)\n", " config_file = _get_config_file(model_path, model_name)\n", " model_file = _get_model_file(model_path, model_name)\n", " with open(config_file, \"w\") as f:\n", " json.dump(config_dict, f)\n", " torch.save(model.state_dict(), model_file)\n", "\n", "\n", "def train_model(net, model_name, optim_func, max_epochs=50, batch_size=256, overwrite=False):\n", " \"\"\"Train a model on the training set of FashionMNIST.\n", "\n", " Args:\n", " net: Object of BaseNetwork\n", " model_name: (str) Name of the model, used for creating the checkpoint names\n", " max_epochs: Number of epochs we want to (maximally) train for\n", " patience: If the performance on the validation set has not improved for #patience epochs, we stop training early\n", " batch_size: Size of batches used in training\n", " overwrite: Determines how to handle the case when there already exists a checkpoint. If True, it will be overwritten. Otherwise, we skip training.\n", " \"\"\"\n", " file_exists = os.path.isfile(_get_model_file(CHECKPOINT_PATH, model_name))\n", " if file_exists and not overwrite:\n", " print(f'Model file of \"{model_name}\" already exists. 
Skipping training...')\n", " with open(_get_result_file(CHECKPOINT_PATH, model_name)) as f:\n", " results = json.load(f)\n", " else:\n", " if file_exists:\n", " print(\"Model file exists, but will be overwritten...\")\n", "\n", " # Defining optimizer, loss and data loader\n", " optimizer = optim_func(net.parameters())\n", " loss_module = nn.CrossEntropyLoss()\n", " train_loader_local = data.DataLoader(\n", " train_set, batch_size=batch_size, shuffle=True, drop_last=True, pin_memory=True\n", " )\n", "\n", " results = None\n", " val_scores = []\n", " train_losses, train_scores = [], []\n", " best_val_epoch = -1\n", " for epoch in range(max_epochs):\n", " train_acc, val_acc, epoch_losses = epoch_iteration(\n", " net, loss_module, optimizer, train_loader_local, val_loader, epoch\n", " )\n", " train_scores.append(train_acc)\n", " val_scores.append(val_acc)\n", " train_losses += epoch_losses\n", "\n", " if len(val_scores) == 1 or val_acc > val_scores[best_val_epoch]:\n", " print(\"\\t (New best performance, saving model...)\")\n", " save_model(net, CHECKPOINT_PATH, model_name)\n", " best_val_epoch = epoch\n", "\n", " if results is None:\n", " load_model(CHECKPOINT_PATH, model_name, net=net)\n", " test_acc = test_model(net, test_loader)\n", " results = {\n", " \"test_acc\": test_acc,\n", " \"val_scores\": val_scores,\n", " \"train_losses\": train_losses,\n", " \"train_scores\": train_scores,\n", " }\n", " with open(_get_result_file(CHECKPOINT_PATH, model_name), \"w\") as f:\n", " json.dump(results, f)\n", "\n", " # Plot a curve of the validation accuracy\n", " sns.set()\n", " plt.plot([i for i in range(1, len(results[\"train_scores\"]) + 1)], results[\"train_scores\"], label=\"Train\")\n", " plt.plot([i for i in range(1, len(results[\"val_scores\"]) + 1)], results[\"val_scores\"], label=\"Val\")\n", " plt.xlabel(\"Epochs\")\n", " plt.ylabel(\"Validation accuracy\")\n", " plt.ylim(min(results[\"val_scores\"]), max(results[\"train_scores\"]) * 1.01)\n", " 
plt.title(f\"Validation performance of {model_name}\")\n", " plt.legend()\n", " plt.show()\n", " plt.close()\n", "\n", " print((f\" Test accuracy: {results['test_acc']*100.0:4.2f}% \").center(50, \"=\") + \"\\n\")\n", " return results\n", "\n", "\n", "def epoch_iteration(net, loss_module, optimizer, train_loader_local, val_loader, epoch):\n", " ############\n", " # Training #\n", " ############\n", " net.train()\n", " true_preds, count = 0.0, 0\n", " epoch_losses = []\n", " t = tqdm(train_loader_local, leave=False)\n", " for imgs, labels in t:\n", " imgs, labels = imgs.to(device), labels.to(device)\n", " optimizer.zero_grad()\n", " preds = net(imgs)\n", " loss = loss_module(preds, labels)\n", " loss.backward()\n", " optimizer.step()\n", " # Record statistics during training\n", " true_preds += (preds.argmax(dim=-1) == labels).sum().item()\n", " count += labels.shape[0]\n", " t.set_description(f\"Epoch {epoch+1}: loss={loss.item():4.2f}\")\n", " epoch_losses.append(loss.item())\n", " train_acc = true_preds / count\n", "\n", " ##############\n", " # Validation #\n", " ##############\n", " val_acc = test_model(net, val_loader)\n", " print(\n", " f\"[Epoch {epoch+1:2i}] Training accuracy: {train_acc*100.0:05.2f}%, Validation accuracy: {val_acc*100.0:05.2f}%\"\n", " )\n", " return train_acc, val_acc, epoch_losses\n", "\n", "\n", "def test_model(net, data_loader):\n", " \"\"\"Test a model on a specified dataset.\n", "\n", " Args:\n", " net: Trained model of type BaseNetwork\n", " data_loader: DataLoader object of the dataset to test on (validation or test)\n", " \"\"\"\n", " net.eval()\n", " true_preds, count = 0.0, 0\n", " for imgs, labels in data_loader:\n", " imgs, labels = imgs.to(device), labels.to(device)\n", " with torch.no_grad():\n", " preds = net(imgs).argmax(dim=-1)\n", " true_preds += (preds == labels).sum().item()\n", " count += labels.shape[0]\n", " test_acc = true_preds / count\n", " return test_acc"]}, {"cell_type": "markdown", "id": "ebc0236d", 
"metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.226171, "end_time": "2021-12-04T15:56:16.921208", "exception": false, "start_time": "2021-12-04T15:56:16.695037", "status": "completed"}, "tags": []}, "source": ["First, we need to understand what an optimizer actually does.\n", "The optimizer is responsible for updating the network's parameters given the gradients.\n", "Hence, we effectively implement a function $w^{(t)} = f(w^{(t-1)}, g^{(t)}, ...)$ with $w$ being the parameters, and $g^{(t)} = \\nabla_{w^{(t-1)}} \\mathcal{L}^{(t)}$ the gradients at time step $t$.\n", "A common, additional parameter to this function is the learning rate, here denoted by $\\eta$.\n", "Usually, the learning rate can be seen as the \"step size\" of the update.\n", "A higher learning rate means that we change the weights more in the direction of the gradients, while a smaller one means we take shorter steps.\n", "\n", "As most optimizers only differ in the implementation of $f$, we can define a template for an optimizer in PyTorch below.\n", "We take as input the parameters of a model and a learning rate.\n", "The function `zero_grad` sets the gradients of all parameters to zero, which we have to do before calling `loss.backward()`.\n", "Finally, the `step()` function tells the optimizer to update all weights based on their gradients.\n", "The template is set up below:"]}, {"cell_type": "code", "execution_count": 21, "id": "8115a144", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:56:17.381962Z", "iopub.status.busy": "2021-12-04T15:56:17.381485Z", "iopub.status.idle": "2021-12-04T15:56:17.383062Z", "shell.execute_reply": "2021-12-04T15:56:17.383442Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 0.234647, "end_time": "2021-12-04T15:56:17.383573", "exception": false, "start_time": "2021-12-04T15:56:17.148926", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class OptimizerTemplate:\n", " def __init__(self, params, lr):\n", " self.params = 
list(params)\n", " self.lr = lr\n", "\n", " def zero_grad(self):\n", " # Set gradients of all parameters to zero\n", " for p in self.params:\n", " if p.grad is not None:\n", " p.grad.detach_() # For second-order optimizers important\n", " p.grad.zero_()\n", "\n", " @torch.no_grad()\n", " def step(self):\n", " # Apply update step to all parameters\n", " for p in self.params:\n", " if p.grad is None: # We skip parameters without any gradients\n", " continue\n", " self.update_param(p)\n", "\n", " def update_param(self, p):\n", " # To be implemented in optimizer-specific classes\n", " raise NotImplementedError"]}, {"cell_type": "markdown", "id": "11fc5bd8", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.225818, "end_time": "2021-12-04T15:56:17.836069", "exception": false, "start_time": "2021-12-04T15:56:17.610251", "status": "completed"}, "tags": []}, "source": ["The first optimizer we are going to implement is the standard Stochastic Gradient Descent (SGD).\n", "SGD updates the parameters using the following equation:\n", "\n", "$$\n", "\\begin{split}\n", " w^{(t)} & = w^{(t-1)} - \\eta \\cdot g^{(t)}\n", "\\end{split}\n", "$$\n", "\n", "Our implementation of SGD is as simple as the equation:"]}, {"cell_type": "code", "execution_count": 22, "id": "7c5f4955", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:56:18.300285Z", "iopub.status.busy": "2021-12-04T15:56:18.299810Z", "iopub.status.idle": "2021-12-04T15:56:18.301728Z", "shell.execute_reply": "2021-12-04T15:56:18.301262Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 0.237501, "end_time": "2021-12-04T15:56:18.301837", "exception": false, "start_time": "2021-12-04T15:56:18.064336", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class SGD(OptimizerTemplate):\n", " def __init__(self, params, lr):\n", " super().__init__(params, lr)\n", "\n", " def update_param(self, p):\n", " p_update = -self.lr * p.grad\n", " p.add_(p_update) # In-place update => saves 
memory and does not create computation graph"]}, {"cell_type": "markdown", "id": "0f34b439", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.226849, "end_time": "2021-12-04T15:56:18.754221", "exception": false, "start_time": "2021-12-04T15:56:18.527372", "status": "completed"}, "tags": []}, "source": ["In the lecture, we also have discussed the concept of momentum which replaces the gradient in the update by an exponential average of all past gradients including the current one:\n", "\n", "$$\n", "\\begin{split}\n", " m^{(t)} & = \\beta_1 m^{(t-1)} + (1 - \\beta_1)\\cdot g^{(t)}\\\\\n", " w^{(t)} & = w^{(t-1)} - \\eta \\cdot m^{(t)}\\\\\n", "\\end{split}\n", "$$\n", "\n", "Let's also implement it below:"]}, {"cell_type": "code", "execution_count": 23, "id": "48028221", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:56:19.214485Z", "iopub.status.busy": "2021-12-04T15:56:19.214011Z", "iopub.status.idle": "2021-12-04T15:56:19.215560Z", "shell.execute_reply": "2021-12-04T15:56:19.215939Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 0.23626, "end_time": "2021-12-04T15:56:19.216068", "exception": false, "start_time": "2021-12-04T15:56:18.979808", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class SGDMomentum(OptimizerTemplate):\n", " def __init__(self, params, lr, momentum=0.0):\n", " super().__init__(params, lr)\n", " self.momentum = momentum # Corresponds to beta_1 in the equation above\n", " self.param_momentum = {p: torch.zeros_like(p.data) for p in self.params} # Dict to store m_t\n", "\n", " def update_param(self, p):\n", " self.param_momentum[p] = (1 - self.momentum) * p.grad + self.momentum * self.param_momentum[p]\n", " p_update = -self.lr * self.param_momentum[p]\n", " p.add_(p_update)"]}, {"cell_type": "markdown", "id": "f9f83484", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.2256, "end_time": "2021-12-04T15:56:19.667175", "exception": false, "start_time": 
"2021-12-04T15:56:19.441575", "status": "completed"}, "tags": []}, "source": ["Finally, we arrive at Adam.\n", "Adam combines the idea of momentum with an adaptive learning rate, which is based on an exponential average of the squared gradients, i.e. the gradient norm.\n", "Furthermore, we add a bias correction for the momentum and adaptive learning rate for the first iterations:\n", "\n", "$$\n", "\\begin{split}\n", " m^{(t)} & = \\beta_1 m^{(t-1)} + (1 - \\beta_1)\\cdot g^{(t)}\\\\\n", " v^{(t)} & = \\beta_2 v^{(t-1)} + (1 - \\beta_2)\\cdot \\left(g^{(t)}\\right)^2\\\\\n", " \\hat{m}^{(t)} & = \\frac{m^{(t)}}{1-\\beta^{t}_1}, \\hat{v}^{(t)} = \\frac{v^{(t)}}{1-\\beta^{t}_2}\\\\\n", " w^{(t)} & = w^{(t-1)} - \\frac{\\eta}{\\sqrt{\\hat{v}^{(t)}} + \\epsilon}\\circ \\hat{m}^{(t)}\\\\\n", "\\end{split}\n", "$$\n", "\n", "Epsilon is a small constant used to improve numerical stability for very small gradient norms.\n", "Remember that the adaptive learning rate does not replace the learning\n", "rate hyperparameter $\\eta$, but rather acts as an extra factor and\n", "ensures that the gradients of various parameters have a similar norm."]}, {"cell_type": "code", "execution_count": 24, "id": "3f028169", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:56:20.130949Z", "iopub.status.busy": "2021-12-04T15:56:20.130446Z", "iopub.status.idle": "2021-12-04T15:56:20.132399Z", "shell.execute_reply": "2021-12-04T15:56:20.131929Z"}, "papermill": {"duration": 0.238498, "end_time": "2021-12-04T15:56:20.132510", "exception": false, "start_time": "2021-12-04T15:56:19.894012", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class Adam(OptimizerTemplate):\n", " def __init__(self, params, lr, beta1=0.9, beta2=0.999, eps=1e-8):\n", " super().__init__(params, lr)\n", " self.beta1 = beta1\n", " self.beta2 = beta2\n", " self.eps = eps\n", " self.param_step = {p: 0 for p in self.params} # Remembers \"t\" for each parameter for bias correction\n", " 
self.param_momentum = {p: torch.zeros_like(p.data) for p in self.params}\n", " self.param_2nd_momentum = {p: torch.zeros_like(p.data) for p in self.params}\n", "\n", " def update_param(self, p):\n", " self.param_step[p] += 1\n", "\n", " self.param_momentum[p] = (1 - self.beta1) * p.grad + self.beta1 * self.param_momentum[p]\n", " self.param_2nd_momentum[p] = (1 - self.beta2) * (p.grad) ** 2 + self.beta2 * self.param_2nd_momentum[p]\n", "\n", " bias_correction_1 = 1 - self.beta1 ** self.param_step[p]\n", " bias_correction_2 = 1 - self.beta2 ** self.param_step[p]\n", "\n", " p_2nd_mom = self.param_2nd_momentum[p] / bias_correction_2\n", " p_mom = self.param_momentum[p] / bias_correction_1\n", " p_lr = self.lr / (torch.sqrt(p_2nd_mom) + self.eps)\n", " p_update = -p_lr * p_mom\n", "\n", " p.add_(p_update)"]}, {"cell_type": "markdown", "id": "b6db76a2", "metadata": {"papermill": {"duration": 0.227049, "end_time": "2021-12-04T15:56:20.587369", "exception": false, "start_time": "2021-12-04T15:56:20.360320", "status": "completed"}, "tags": []}, "source": ["### Comparing optimizers on model training\n", "\n", "After we have implemented three optimizers (SGD, SGD with momentum, and Adam), we can start to analyze and compare them.\n", "First, we test them on how well they can optimize a neural network on the FashionMNIST dataset.\n", "We again use our linear network, this time with a ReLU activation and the Kaiming initialization, which we have found before to work well for ReLU-based networks.\n", "Note that the model is over-parameterized for this task, and we can achieve similar performance with a much smaller network (for example `100,100,100`).\n", "However, our main interest is in how well the optimizer can train *deep*\n", "neural networks, hence the over-parameterization."]}, {"cell_type": "code", "execution_count": 25, "id": "99328e5e", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:56:21.045265Z", "iopub.status.busy": 
"2021-12-04T15:56:21.044794Z", "iopub.status.idle": "2021-12-04T15:56:21.057645Z", "shell.execute_reply": "2021-12-04T15:56:21.058024Z"}, "papermill": {"duration": 0.24428, "end_time": "2021-12-04T15:56:21.058155", "exception": false, "start_time": "2021-12-04T15:56:20.813875", "status": "completed"}, "tags": []}, "outputs": [], "source": ["base_model = BaseNetwork(act_fn=nn.ReLU(), hidden_sizes=[512, 256, 256, 128])\n", "kaiming_init(base_model)"]}, {"cell_type": "markdown", "id": "1636493f", "metadata": {"papermill": {"duration": 0.226015, "end_time": "2021-12-04T15:56:21.512106", "exception": false, "start_time": "2021-12-04T15:56:21.286091", "status": "completed"}, "tags": []}, "source": ["For a fair comparison, we train the exact same model with the same seed with the three optimizers below.\n", "Feel free to change the hyperparameters if you want (however, you have to train your own model then)."]}, {"cell_type": "code", "execution_count": 26, "id": "83cf00ee", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:56:21.971222Z", "iopub.status.busy": "2021-12-04T15:56:21.970734Z", "iopub.status.idle": "2021-12-04T15:56:22.354403Z", "shell.execute_reply": "2021-12-04T15:56:22.353972Z"}, "papermill": {"duration": 0.615668, "end_time": "2021-12-04T15:56:22.354532", "exception": false, "start_time": "2021-12-04T15:56:21.738864", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Model file of \"FashionMNIST_SGD\" already exists. 
Skipping training...\n"]}, {"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-12-04T16:56:22.120363\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}, {"name": "stdout", "output_type": "stream", "text": ["============= Test accuracy: 89.09% ==============\n", "\n"]}], "source": ["SGD_model = copy.deepcopy(base_model).to(device)\n", "SGD_results = train_model(\n", " SGD_model, \"FashionMNIST_SGD\", lambda params: SGD(params, lr=1e-1), max_epochs=40, batch_size=256\n", ")"]}, {"cell_type": "code", "execution_count": 27, "id": "8e4625d5", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:56:22.825235Z", "iopub.status.busy": "2021-12-04T15:56:22.824735Z", "iopub.status.idle": "2021-12-04T15:56:23.187783Z", "shell.execute_reply": "2021-12-04T15:56:23.187344Z"}, "papermill": {"duration": 0.600767, "end_time": "2021-12-04T15:56:23.187909", "exception": false, "start_time": "2021-12-04T15:56:22.587142", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Model file of \"FashionMNIST_SGDMom\" already exists. Skipping training...\n"]}, {"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-12-04T16:56:22.966259\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}, {"name": "stdout", "output_type": "stream", "text": ["============= Test accuracy: 88.83% ==============\n", "\n"]}], "source": ["SGDMom_model = copy.deepcopy(base_model).to(device)\n", "SGDMom_results = train_model(\n", " SGDMom_model,\n", " \"FashionMNIST_SGDMom\",\n", " lambda params: SGDMomentum(params, lr=1e-1, momentum=0.9),\n", " max_epochs=40,\n", " batch_size=256,\n", ")"]}, {"cell_type": "code", "execution_count": 28, "id": "2d326436", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:56:23.673283Z", "iopub.status.busy": "2021-12-04T15:56:23.672814Z", "iopub.status.idle": "2021-12-04T15:56:24.028499Z", "shell.execute_reply": "2021-12-04T15:56:24.028068Z"}, "papermill": {"duration": 0.601587, "end_time": "2021-12-04T15:56:24.028625", "exception": false, "start_time": "2021-12-04T15:56:23.427038", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Model file of \"FashionMNIST_Adam\" already exists. 
Skipping training...\n"]}, {"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-12-04T16:56:23.812352\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}, {"name": "stdout", "output_type": "stream", "text": ["============= Test accuracy: 89.46% ==============\n", "\n"]}], "source": ["Adam_model = copy.deepcopy(base_model).to(device)\n", "Adam_results = train_model(\n", " Adam_model, \"FashionMNIST_Adam\", lambda params: Adam(params, lr=1e-3), max_epochs=40, batch_size=256\n", ")"]}, {"cell_type": "markdown", "id": "d48d9738", "metadata": {"papermill": {"duration": 0.242293, "end_time": "2021-12-04T15:56:24.518095", "exception": false, "start_time": "2021-12-04T15:56:24.275802", "status": "completed"}, "tags": []}, "source": ["The result is that all optimizers perform similarly well with the given model.\n", "The differences are too small to find any significant conclusion.\n", "However, keep in mind that this can also be attributed to the initialization we chose.\n", "When changing the initialization to worse (e.g. constant initialization), Adam usually shows to be more robust because of its adaptive learning rate.\n", "To show the specific benefits of the optimizers, we will continue to\n", "look at some possible loss surfaces in which momentum and adaptive\n", "learning rate are crucial."]}, {"cell_type": "markdown", "id": "650284a9", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.243267, "end_time": "2021-12-04T15:56:25.002092", "exception": false, "start_time": "2021-12-04T15:56:24.758825", "status": "completed"}, "tags": []}, "source": ["### Pathological curvatures\n", "\n", "A pathological curvature is a type of surface that is similar to ravines and is particularly tricky for plain SGD optimization.\n", "In words, pathological curvatures typically have a steep gradient in one direction with an optimum at the center, while in a second direction we have a slower gradient towards a (global) optimum.\n", "Let's first create an example surface of this and visualize it:"]}, {"cell_type": "code", "execution_count": 29, "id": "b739a90c", 
"metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:56:25.513474Z", "iopub.status.busy": "2021-12-04T15:56:25.513001Z", "iopub.status.idle": "2021-12-04T15:56:25.514972Z", "shell.execute_reply": "2021-12-04T15:56:25.514568Z"}, "papermill": {"duration": 0.271487, "end_time": "2021-12-04T15:56:25.515085", "exception": false, "start_time": "2021-12-04T15:56:25.243598", "status": "completed"}, "tags": []}, "outputs": [], "source": ["def pathological_curve_loss(w1, w2):\n", " # Example of a pathological curvature. There are many more possible, feel free to experiment here!\n", " x1_loss = torch.tanh(w1) ** 2 + 0.01 * torch.abs(w1)\n", " x2_loss = torch.sigmoid(w2)\n", " return x1_loss + x2_loss"]}, {"cell_type": "code", "execution_count": 30, "id": "31ad8756", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:56:26.015141Z", "iopub.status.busy": "2021-12-04T15:56:26.014659Z", "iopub.status.idle": "2021-12-04T15:56:27.270117Z", "shell.execute_reply": "2021-12-04T15:56:27.270502Z"}, "papermill": {"duration": 1.508289, "end_time": "2021-12-04T15:56:27.270685", "exception": false, "start_time": "2021-12-04T15:56:25.762396", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["/tmp/ipykernel_875/1102210584.py:5: MatplotlibDeprecationWarning: Calling gca() with keyword arguments was deprecated in Matplotlib 3.4. Starting two minor releases later, gca() will take no keyword arguments. The gca() function should only be used to get the current axes, or if no axes exist, create new axes with default keyword arguments. 
To create a new axes with non-default arguments, use plt.axes() or plt.subplot().\n", " ax = fig.gca(projection=\"3d\") if plot_3d else fig.gca()\n"]}, {"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-12-04T16:56:26.317299\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}], "source": ["def plot_curve(\n", " curve_fn, x_range=(-5, 5), y_range=(-5, 5), plot_3d=False, cmap=cm.viridis, title=\"Pathological curvature\"\n", "):\n", " fig = plt.figure()\n", " ax = fig.gca(projection=\"3d\") if plot_3d else fig.gca()\n", "\n", " x = torch.arange(x_range[0], x_range[1], (x_range[1] - x_range[0]) / 100.0)\n", " y = torch.arange(y_range[0], y_range[1], (y_range[1] - y_range[0]) / 100.0)\n", " x, y = torch.meshgrid([x, y])\n", " z = curve_fn(x, y)\n", " x, y, z = x.numpy(), y.numpy(), z.numpy()\n", "\n", " if plot_3d:\n", " ax.plot_surface(x, y, z, cmap=cmap, linewidth=1, color=\"#000\", antialiased=False)\n", " ax.set_zlabel(\"loss\")\n", " else:\n", " ax.imshow(z.T[::-1], cmap=cmap, extent=(x_range[0], x_range[1], y_range[0], y_range[1]))\n", " plt.title(title)\n", " ax.set_xlabel(r\"$w_1$\")\n", " ax.set_ylabel(r\"$w_2$\")\n", " plt.tight_layout()\n", " return ax\n", "\n", "\n", "sns.reset_orig()\n", "_ = plot_curve(pathological_curve_loss, plot_3d=True)\n", "plt.show()"]}, {"cell_type": "markdown", "id": "3a07e352", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.279049, "end_time": "2021-12-04T15:56:27.829838", "exception": false, "start_time": "2021-12-04T15:56:27.550789", "status": "completed"}, "tags": []}, "source": ["In terms of optimization, you can image that $w_1$ and $w_2$ are weight parameters, and the curvature represents the loss surface over the space of $w_1$ and $w_2$.\n", "Note that in typical networks, we have many, many more parameters than two, and such curvatures can occur in multi-dimensional spaces as well.\n", "\n", "Ideally, our optimization algorithm would find the center of the ravine and focuses on optimizing the parameters towards the direction of $w_2$.\n", "However, if we encounter a point along the ridges, the gradient is much greater in $w_1$ than $w_2$, and we might end up jumping from one side to the other.\n", 
"Due to the large gradients, we would have to reduce our learning rate slowing down learning significantly.\n", "\n", "To test our algorithms, we can implement a simple function to train two parameters on such a surface:"]}, {"cell_type": "code", "execution_count": 31, "id": "5d2f28de", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:56:28.389879Z", "iopub.status.busy": "2021-12-04T15:56:28.389383Z", "iopub.status.idle": "2021-12-04T15:56:28.391395Z", "shell.execute_reply": "2021-12-04T15:56:28.390988Z"}, "papermill": {"duration": 0.285299, "end_time": "2021-12-04T15:56:28.391509", "exception": false, "start_time": "2021-12-04T15:56:28.106210", "status": "completed"}, "tags": []}, "outputs": [], "source": ["def train_curve(optimizer_func, curve_func=pathological_curve_loss, num_updates=100, init=[5, 5]):\n", " \"\"\"\n", " Args:\n", " optimizer_func: Constructor of the optimizer to use. Should only take a parameter list\n", " curve_func: Loss function (e.g. pathological curvature)\n", " num_updates: Number of updates/steps to take when optimizing\n", " init: Initial values of parameters. 
Must be a list/tuple with two elements representing w_1 and w_2\n", " Returns:\n", " Numpy array of shape [num_updates, 3] with [t,:2] being the parameter values at step t, and [t,2] the loss at t.\n", " \"\"\"\n", " weights = nn.Parameter(torch.FloatTensor(init), requires_grad=True)\n", " optim = optimizer_func([weights])\n", "\n", " list_points = []\n", " for _ in range(num_updates):\n", " loss = curve_func(weights[0], weights[1])\n", " list_points.append(torch.cat([weights.data.detach(), loss.unsqueeze(dim=0).detach()], dim=0))\n", " optim.zero_grad()\n", " loss.backward()\n", " optim.step()\n", " points = torch.stack(list_points, dim=0).numpy()\n", " return points"]}, {"cell_type": "markdown", "id": "34d620d2", "metadata": {"papermill": {"duration": 0.277293, "end_time": "2021-12-04T15:56:28.945849", "exception": false, "start_time": "2021-12-04T15:56:28.668556", "status": "completed"}, "tags": []}, "source": ["Next, let's apply the different optimizers on our curvature.\n", "Note that we set a much higher learning rate for the optimization algorithms than you would in a standard neural network.\n", "This is because we only have 2 parameters instead of tens of thousands or even millions."]}, {"cell_type": "code", "execution_count": 32, "id": "41d2cd89", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:56:29.513423Z", "iopub.status.busy": "2021-12-04T15:56:29.512941Z", "iopub.status.idle": "2021-12-04T15:56:29.600337Z", "shell.execute_reply": "2021-12-04T15:56:29.599941Z"}, "papermill": {"duration": 0.369932, "end_time": "2021-12-04T15:56:29.600456", "exception": false, "start_time": "2021-12-04T15:56:29.230524", "status": "completed"}, "tags": []}, "outputs": [], "source": ["SGD_points = train_curve(lambda params: SGD(params, lr=10))\n", "SGDMom_points = train_curve(lambda params: SGDMomentum(params, lr=10, momentum=0.9))\n", "Adam_points = train_curve(lambda params: Adam(params, lr=1))"]}, {"cell_type": "markdown", "id": "f8145cab", "metadata": 
{"papermill": {"duration": 0.28425, "end_time": "2021-12-04T15:56:30.165657", "exception": false, "start_time": "2021-12-04T15:56:29.881407", "status": "completed"}, "tags": []}, "source": ["To understand best how the different algorithms worked, we visualize the update step as a line plot through the loss surface.\n", "We will stick with a 2D representation for readability."]}, {"cell_type": "code", "execution_count": 33, "id": "54af4578", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:56:30.745262Z", "iopub.status.busy": "2021-12-04T15:56:30.744720Z", "iopub.status.idle": "2021-12-04T15:56:31.275773Z", "shell.execute_reply": "2021-12-04T15:56:31.276161Z"}, "papermill": {"duration": 0.832259, "end_time": "2021-12-04T15:56:31.276328", "exception": false, "start_time": "2021-12-04T15:56:30.444069", "status": "completed"}, "tags": []}, "outputs": [{"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-12-04T16:56:30.860693\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}], "source": ["all_points = np.concatenate([SGD_points, SGDMom_points, Adam_points], axis=0)\n", "ax = plot_curve(\n", " pathological_curve_loss,\n", " x_range=(-np.absolute(all_points[:, 0]).max(), np.absolute(all_points[:, 0]).max()),\n", " y_range=(all_points[:, 1].min(), all_points[:, 1].max()),\n", " plot_3d=False,\n", ")\n", "ax.plot(SGD_points[:, 0], SGD_points[:, 1], color=\"red\", marker=\"o\", zorder=1, label=\"SGD\")\n", "ax.plot(SGDMom_points[:, 0], SGDMom_points[:, 1], color=\"blue\", marker=\"o\", zorder=2, label=\"SGDMom\")\n", "ax.plot(Adam_points[:, 0], Adam_points[:, 1], color=\"grey\", marker=\"o\", zorder=3, label=\"Adam\")\n", "plt.legend()\n", "plt.show()"]}, {"cell_type": "markdown", "id": "0e880578", "metadata": {"papermill": {"duration": 0.281894, "end_time": "2021-12-04T15:56:31.843290", "exception": false, "start_time": "2021-12-04T15:56:31.561396", "status": "completed"}, "tags": []}, "source": ["We can clearly see that SGD is not able to find the center of the optimization curve and has a problem converging due to the steep gradients in $w_1$.\n", "In contrast, Adam and SGD with momentum nicely converge as the changing direction of $w_1$ is canceling itself out.\n", "On such surfaces, it is crucial to use momentum."]}, {"cell_type": "markdown", "id": "23673b0c", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.283817, "end_time": "2021-12-04T15:56:32.414094", "exception": false, "start_time": "2021-12-04T15:56:32.130277", "status": "completed"}, "tags": []}, "source": ["### Steep optima\n", "\n", "A second type of challenging loss surfaces are steep optima.\n", "In those, we have a larger part of the surface having very small gradients while around the optimum, we have very large gradients.\n", "For instance, take the following loss surfaces:"]}, {"cell_type": "code", "execution_count": 34, "id": "93f0e0e9", "metadata": {"execution": 
{"iopub.execute_input": "2021-12-04T15:56:33.000196Z", "iopub.status.busy": "2021-12-04T15:56:32.994290Z", "iopub.status.idle": "2021-12-04T15:56:34.120588Z", "shell.execute_reply": "2021-12-04T15:56:34.120986Z"}, "papermill": {"duration": 1.424954, "end_time": "2021-12-04T15:56:34.121153", "exception": false, "start_time": "2021-12-04T15:56:32.696199", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["/tmp/ipykernel_875/1102210584.py:5: MatplotlibDeprecationWarning: Calling gca() with keyword arguments was deprecated in Matplotlib 3.4. Starting two minor releases later, gca() will take no keyword arguments. The gca() function should only be used to get the current axes, or if no axes exist, create new axes with default keyword arguments. To create a new axes with non-default arguments, use plt.axes() or plt.subplot().\n", " ax = fig.gca(projection=\"3d\") if plot_3d else fig.gca()\n"]}, {"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-12-04T16:56:33.220652\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}], "source": ["def bivar_gaussian(w1, w2, x_mean=0.0, y_mean=0.0, x_sig=1.0, y_sig=1.0):\n", " norm = 1 / (2 * np.pi * x_sig * y_sig)\n", " x_exp = (-1 * (w1 - x_mean) ** 2) / (2 * x_sig ** 2)\n", " y_exp = (-1 * (w2 - y_mean) ** 2) / (2 * y_sig ** 2)\n", " return norm * torch.exp(x_exp + y_exp)\n", "\n", "\n", "def comb_func(w1, w2):\n", " z = -bivar_gaussian(w1, w2, x_mean=1.0, y_mean=-0.5, x_sig=0.2, y_sig=0.2)\n", " z -= bivar_gaussian(w1, w2, x_mean=-1.0, y_mean=0.5, x_sig=0.2, y_sig=0.2)\n", " z -= bivar_gaussian(w1, w2, x_mean=-0.5, y_mean=-0.8, x_sig=0.2, y_sig=0.2)\n", " return z\n", "\n", "\n", "_ = plot_curve(comb_func, x_range=(-2, 2), y_range=(-2, 2), plot_3d=True, title=\"Steep optima\")"]}, {"cell_type": "markdown", "id": "7ef1175a", "metadata": {"papermill": {"duration": 0.332877, "end_time": "2021-12-04T15:56:34.786176", "exception": false, "start_time": "2021-12-04T15:56:34.453299", "status": "completed"}, "tags": []}, "source": ["Most of the loss surface has very little to no gradients.\n", "However, close to the optima, we have very steep gradients.\n", "To reach the minimum when starting in a region with lower gradients, we expect an adaptive learning rate to be crucial.\n", "To verify this hypothesis, we can run our three optimizers on the surface:"]}, {"cell_type": "code", "execution_count": 35, "id": "4f8818bb", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:56:35.429165Z", "iopub.status.busy": "2021-12-04T15:56:35.428679Z", "iopub.status.idle": "2021-12-04T15:56:36.013195Z", "shell.execute_reply": "2021-12-04T15:56:36.013583Z"}, "papermill": {"duration": 0.911295, "end_time": "2021-12-04T15:56:36.013752", "exception": false, "start_time": "2021-12-04T15:56:35.102457", "status": "completed"}, "tags": []}, "outputs": [{"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-12-04T16:56:35.780390\n", 
" image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}], "source": ["SGD_points = train_curve(lambda params: SGD(params, lr=0.5), comb_func, init=[0, 0])\n", "SGDMom_points = train_curve(lambda params: SGDMomentum(params, lr=1, momentum=0.9), comb_func, init=[0, 0])\n", "Adam_points = train_curve(lambda params: Adam(params, lr=0.2), comb_func, init=[0, 0])\n", "\n", "all_points = np.concatenate([SGD_points, SGDMom_points, Adam_points], axis=0)\n", "ax = plot_curve(comb_func, x_range=(-2, 2), y_range=(-2, 2), plot_3d=False, title=\"Steep optima\")\n", "ax.plot(SGD_points[:, 0], SGD_points[:, 1], color=\"red\", marker=\"o\", zorder=3, label=\"SGD\", alpha=0.7)\n", "ax.plot(SGDMom_points[:, 0], SGDMom_points[:, 1], color=\"blue\", marker=\"o\", zorder=2, label=\"SGDMom\", alpha=0.7)\n", "ax.plot(Adam_points[:, 0], Adam_points[:, 1], color=\"grey\", marker=\"o\", zorder=1, label=\"Adam\", alpha=0.7)\n", "ax.set_xlim(-2, 2)\n", "ax.set_ylim(-2, 2)\n", "plt.legend()\n", "plt.show()"]}, {"cell_type": "markdown", "id": "494d99c5", "metadata": {"papermill": {"duration": 0.323237, "end_time": "2021-12-04T15:56:36.662651", "exception": false, "start_time": "2021-12-04T15:56:36.339414", "status": "completed"}, "tags": []}, "source": ["SGD first takes very small steps until it touches the border of the optimum.\n", "First reaching a point around $(-0.75,-0.5)$, the gradient direction has changed and pushes the parameters to $(0.8,0.5)$ from which SGD cannot recover anymore (only with many, many steps).\n", "A similar problem has SGD with momentum, only that it continues the direction of the touch of the optimum.\n", "The gradients from this time step are so much larger than any other point that the momentum $m_t$ is overpowered by it.\n", "Finally, Adam is able to converge in the optimum showing the importance of adaptive learning rates."]}, {"cell_type": "markdown", "id": "753e94b5", "metadata": {"papermill": {"duration": 0.327421, "end_time": 
"2021-12-04T15:56:37.310853", "exception": false, "start_time": "2021-12-04T15:56:36.983432", "status": "completed"}, "tags": []}, "source": ["### What optimizer to take\n", "\n", "After seeing the results on optimization, what is our conclusion?\n", "Should we always use Adam and never look at SGD anymore?\n", "The short answer: no.\n", "There are many papers saying that in certain situations, SGD (with momentum) generalizes better where Adam often tends to overfit [5,6].\n", "This is related to the idea of finding wider optima.\n", "For instance, see the illustration of different optima below (credit: [Keskar et al., 2017](https://arxiv.org/pdf/1609.04836.pdf)):\n", "\n", "
\n", "\n", "The black line represents the training loss surface, while the dotted red line is the test loss.\n", "Finding sharp, narrow minima can be helpful for finding the minimal training loss.\n", "However, this doesn't mean that it also minimizes the test loss as especially flat minima have been shown to generalize better.\n", "You can imagine that the test dataset has a slightly shifted loss surface because it contains different examples than the training set.\n", "A small change can have a significant influence for sharp minima, while flat minima are generally more robust to this change.\n", "\n", "In the next tutorial, we will see that some network types can still be better optimized with SGD and learning rate scheduling than Adam.\n", "Nevertheless, Adam is the most commonly used optimizer in Deep Learning\n", "as it usually performs better than other optimizers, especially for deep\n", "networks."]}, {"cell_type": "markdown", "id": "7c5857ba", "metadata": {"papermill": {"duration": 0.328086, "end_time": "2021-12-04T15:56:37.960730", "exception": false, "start_time": "2021-12-04T15:56:37.632644", "status": "completed"}, "tags": []}, "source": ["## Conclusion\n", "\n", "In this tutorial, we have looked at initialization and optimization techniques for neural networks.\n", "We have seen that a good initialization has to balance the preservation of the gradient variance as well as the activation variance.\n", "This can be achieved with the Xavier initialization for tanh-based networks, and the Kaiming initialization for ReLU-based networks.\n", "In optimization, concepts like momentum and adaptive learning rate can help with challenging loss surfaces but don't guarantee an increase in performance for neural networks.\n", "\n", "\n", "## References\n", "\n", "[1] Glorot, Xavier, and Yoshua Bengio.\n", "\"Understanding the difficulty of training deep feedforward neural networks.\"\n", "Proceedings of the thirteenth international conference on artificial intelligence and 
statistics.\n", "2010.\n", "[link](http://proceedings.mlr.press/v9/glorot10a/glorot10a.pdf)\n", "\n", "[2] He, Kaiming, et al.\n", "\"Delving deep into rectifiers: Surpassing human-level performance on imagenet classification.\"\n", "Proceedings of the IEEE international conference on computer vision.\n", "2015.\n", "[link](https://www.cv-foundation.org/openaccess/content_iccv_2015/html/He_Delving_Deep_into_ICCV_2015_paper.html)\n", "\n", "[3] Kingma, Diederik P. & Ba, Jimmy.\n", "\"Adam: A Method for Stochastic Optimization.\"\n", "Proceedings of the third international conference for learning representations (ICLR).\n", "2015.\n", "[link](https://arxiv.org/abs/1412.6980)\n", "\n", "[4] Keskar, Nitish Shirish, et al.\n", "\"On large-batch training for deep learning: Generalization gap and sharp minima.\"\n", "Proceedings of the fifth international conference for learning representations (ICLR).\n", "2017.\n", "[link](https://arxiv.org/abs/1609.04836)\n", "\n", "[5] Wilson, Ashia C., et al.\n", "\"The Marginal Value of Adaptive Gradient Methods in Machine Learning.\"\n", "Advances in neural information processing systems.\n", "2017.\n", "[link](https://papers.nips.cc/paper/7003-the-marginal-value-of-adaptive-gradient-methods-in-machine-learning.pdf)\n", "\n", "[6] Ruder, Sebastian.\n", "\"An overview of gradient descent optimization algorithms.\"\n", "arXiv preprint.\n", "2017.\n", "[link](https://arxiv.org/abs/1609.04747)"]}, {"cell_type": "markdown", "id": "717a390c", "metadata": {"papermill": {"duration": 0.321185, "end_time": "2021-12-04T15:56:38.605839", "exception": false, "start_time": "2021-12-04T15:56:38.284654", "status": "completed"}, "tags": []}, "source": ["## Congratulations - Time to Join the Community!\n", "\n", "Congratulations on completing this notebook tutorial! 
If you enjoyed this and would like to join the Lightning\n", "movement, you can do so in the following ways!\n", "\n", "### Star [Lightning](https://github.com/PyTorchLightning/pytorch-lightning) on GitHub\n", "The easiest way to help our community is just by starring the GitHub repos! This helps raise awareness of the cool\n", "tools we're building.\n", "\n", "### Join our [Slack](https://join.slack.com/t/pytorch-lightning/shared_invite/zt-pw5v393p-qRaDgEk24~EjiZNBpSQFgQ)!\n", "The best way to keep up to date on the latest advancements is to join our community! Make sure to introduce yourself\n", "and share your interests in the `#general` channel.\n", "\n", "\n", "### Contributions!\n", "The best way to contribute to our community is to become a code contributor! At any time you can go to\n", "[Lightning](https://github.com/PyTorchLightning/pytorch-lightning) or [Bolt](https://github.com/PyTorchLightning/lightning-bolts)\n", "GitHub Issues page and filter for \"good first issue\".\n", "\n", "* [Lightning good first issue](https://github.com/PyTorchLightning/pytorch-lightning/issues?q=is%3Aopen+is%3Aissue+label%3A%22good+first+issue%22)\n", "* [Bolt good first issue](https://github.com/PyTorchLightning/lightning-bolts/issues?q=is%3Aopen+is%3Aissue+label%3A%22good+first+issue%22)\n", "* You can also contribute your own notebooks with useful examples!\n", "\n", "### Great thanks from the entire PyTorch Lightning Team for your interest!\n", "\n", "[![Pytorch Lightning](){height=\"60px\" width=\"240px\"}](https://pytorchlightning.ai)"]}, {"cell_type": "raw", "metadata": {"raw_mimetype": "text/restructuredtext"}, "source": [".. customcarditem::\n", " :header: Tutorial 3: Initialization and Optimization\n", " :card_description: In this tutorial, we will review techniques for optimization and initialization of neural networks. 
When increasing the depth of neural networks, there are various challenges...\n", " :tags: Image,Initialization,Optimizers,GPU/TPU,UvA-DL-Course\n", " :image: _static/images/course_UvA-DL/03-initialization-and-optimization.jpg"]}], "metadata": {"jupytext": {"cell_metadata_filter": "colab,colab_type,id,-all", "formats": "ipynb,py:percent", "main_language": "python"}, "language_info": {"codemirror_mode": {"name": "ipython", "version": 3}, "file_extension": ".py", "mimetype": "text/x-python", "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.9.7"}, "papermill": {"default_parameters": {}, "duration": 129.529808, "end_time": "2021-12-04T15:56:39.938276", "environment_variables": {}, "exception": null, "input_path": "course_UvA-DL/03-initialization-and-optimization/Initialization_and_Optimization.ipynb", "output_path": ".notebooks/course_UvA-DL/03-initialization-and-optimization.ipynb", "parameters": {}, "start_time": "2021-12-04T15:54:30.408468", "version": "2.3.3"}, "widgets": {"application/vnd.jupyter.widget-state+json": {"state": {"016d946a5dab4a79a18764f5c0041ba5": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": 
null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "026aebbc34a44feb8b457365361afafd": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_22e8949053614c0192e311e8ff9aef02", "max": 26421880.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_093f9a4bfafa4740b5f88601d54044ac", "value": 26421880.0}}, "08483ba1c3a04915abdbad783c25de3c": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": 
null, "top": null, "visibility": null, "width": null}}, "093f9a4bfafa4740b5f88601d54044ac": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "0d49022c934a4041bdedb88894434ccb": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "0fdf1596470d464fa9a290533416cb26": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_354ac47ccada4df9998175a3f34d76c9", "IPY_MODEL_026aebbc34a44feb8b457365361afafd", "IPY_MODEL_27b5f2c48c6a4bad9b67ba6eae81cbfb"], "layout": "IPY_MODEL_7c2dc452217b4a448d843765a9de3589"}}, "165b31c1d551419c9c3e957a59b4dbe8": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", 
"description_tooltip": null, "layout": "IPY_MODEL_016d946a5dab4a79a18764f5c0041ba5", "placeholder": "\u200b", "style": "IPY_MODEL_f08b86836fdc45349d6e4f05cb5a13b9", "value": " 4422656/? [00:00<00:00, 5533630.76it/s]"}}, "17db2890ca0d456d8cf158dc64abf9d5": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "19d14e54732d4a498f8b2802a85f5149": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "221bb2a4278543d480edebc7722b71fc": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", 
"_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "22e8949053614c0192e311e8ff9aef02": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, 
"padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "27b5f2c48c6a4bad9b67ba6eae81cbfb": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_a4e1072e043c4055a83cd5a886ed7ee2", "placeholder": "\u200b", "style": "IPY_MODEL_f07427933ca0436591fbab57cc611476", "value": " 26422272/? [00:01<00:00, 28038507.13it/s]"}}, "2c36103f487546b8b37b85e3aefafdd5": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "354ac47ccada4df9998175a3f34d76c9": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": 
"HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_221bb2a4278543d480edebc7722b71fc", "placeholder": "\u200b", "style": "IPY_MODEL_fc2fa21a06584df18e1935b0d4c97740", "value": ""}}, "3d1754bbcdcf43fab677cb91b0efa22e": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "44bb90b0e4f54124ba64039651776ce9": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_cf04ff1d2808421493a90ea67b0c6c65", "max": 5148.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_3d1754bbcdcf43fab677cb91b0efa22e", "value": 5148.0}}, "4c894e4c1ae9405faec2c75640591ff0": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", 
"align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "4ef9603d92f346419ff8be3c2984b0e6": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "5552c3e370d84c4abe093fd198faf878": {"model_module": "@jupyter-widgets/controls", "model_module_version": 
"1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "56a2c8c742d5459e92de2eb14a2908ed": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_7c769972b877422bb50730dcab448940", "IPY_MODEL_5d9e259f88794c08b0124f67612517ba", "IPY_MODEL_165b31c1d551419c9c3e957a59b4dbe8"], "layout": "IPY_MODEL_17db2890ca0d456d8cf158dc64abf9d5"}}, "5d9e259f88794c08b0124f67612517ba": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_4c894e4c1ae9405faec2c75640591ff0", "max": 4422102.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_7a0e21be27384807ab12f5a8bfac4978", "value": 4422102.0}}, "65057ed2e8c044468d5be827e3a2e007": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": 
"@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_4ef9603d92f346419ff8be3c2984b0e6", "max": 29515.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_d0fa3935d2454032aa3820b5314c22e5", "value": 29515.0}}, "68ab1848fe7942fd914800ef133729fd": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_e6202326d4104925b4cb7cfba26f1f56", "IPY_MODEL_65057ed2e8c044468d5be827e3a2e007", "IPY_MODEL_98a9c5a0f7f1451e8a11f46e53321208"], "layout": "IPY_MODEL_a06f5823643545f49353d80444b7313f"}}, "7136c44874c14f3a9db1e1bea7d49b11": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_b16b51a3dfd9446aa90ad8458f381041", "placeholder": "\u200b", "style": "IPY_MODEL_5552c3e370d84c4abe093fd198faf878", "value": ""}}, "7198121599234cd586ed1a5516fd079d": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, 
"align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "7a0e21be27384807ab12f5a8bfac4978": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "7c2dc452217b4a448d843765a9de3589": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, 
"justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "7c769972b877422bb50730dcab448940": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_c9bee2a106034b52b0f23a884a670400", "placeholder": "\u200b", "style": "IPY_MODEL_0d49022c934a4041bdedb88894434ccb", "value": ""}}, "94ba0c8691ce48feb9c6331ba8e9396b": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "98a9c5a0f7f1451e8a11f46e53321208": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_2c36103f487546b8b37b85e3aefafdd5", "placeholder": "\u200b", "style": "IPY_MODEL_a0566c7ab89149f4b7490c6da055358f", "value": " 29696/? 
[00:00<00:00, 318811.85it/s]"}}, "a0566c7ab89149f4b7490c6da055358f": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "a06f5823643545f49353d80444b7313f": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "a4e1072e043c4055a83cd5a886ed7ee2": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": 
null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "b16b51a3dfd9446aa90ad8458f381041": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "b34dadf61f28405fbaf0146f3b1a4611": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", 
"model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_7136c44874c14f3a9db1e1bea7d49b11", "IPY_MODEL_44bb90b0e4f54124ba64039651776ce9", "IPY_MODEL_d568fb874f04460aafc60684ebbc0770"], "layout": "IPY_MODEL_7198121599234cd586ed1a5516fd079d"}}, "c9bee2a106034b52b0f23a884a670400": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "cf04ff1d2808421493a90ea67b0c6c65": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": 
"1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "d0fa3935d2454032aa3820b5314c22e5": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "d568fb874f04460aafc60684ebbc0770": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_ec31a74304f344579b5f66384dd658be", "placeholder": "\u200b", "style": "IPY_MODEL_19d14e54732d4a498f8b2802a85f5149", "value": " 6144/? 
[00:00<00:00, 355068.46it/s]"}}, "e6202326d4104925b4cb7cfba26f1f56": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_08483ba1c3a04915abdbad783c25de3c", "placeholder": "\u200b", "style": "IPY_MODEL_94ba0c8691ce48feb9c6331ba8e9396b", "value": ""}}, "ec31a74304f344579b5f66384dd658be": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "f07427933ca0436591fbab57cc611476": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", 
"_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "f08b86836fdc45349d6e4f05cb5a13b9": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "fc2fa21a06584df18e1935b0d4c97740": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}}, "version_major": 2, "version_minor": 0}}}, "nbformat": 4, "nbformat_minor": 5} \ No newline at end of file diff --git a/source/notebooks/course_UvA-DL/04-inception-resnet-densenet.ipynb b/source/notebooks/course_UvA-DL/04-inception-resnet-densenet.ipynb deleted file mode 100644 index 8ede350..0000000 --- a/source/notebooks/course_UvA-DL/04-inception-resnet-densenet.ipynb +++ /dev/null @@ -1 +0,0 @@ -{"cells": [{"cell_type": "markdown", "id": "ab9a7af5", "metadata": {"papermill": {"duration": 0.123414, "end_time": "2021-12-04T15:56:50.350891", "exception": false, "start_time": "2021-12-04T15:56:50.227477", "status": "completed"}, "tags": []}, "source": ["\n", "# Tutorial 4: Inception, ResNet and DenseNet\n", "\n", "* **Author:** Phillip Lippe\n", "* **License:** CC BY-SA\n", "* **Generated:** 2021-12-04T16:52:48.435460\n", "\n", "In this tutorial, we will implement and discuss variants of modern 
CNN architectures.\n", "There have been many different architectures been proposed over the past few years.\n", "Some of the most impactful ones, and still relevant today, are the following: [GoogleNet](https://arxiv.org/abs/1409.4842)/Inception architecture (winner of ILSVRC 2014), [ResNet](https://arxiv.org/abs/1512.03385) (winner of ILSVRC 2015), and [DenseNet](https://arxiv.org/abs/1608.06993) (best paper award CVPR 2017).\n", "All of them were state-of-the-art models when being proposed, and the core ideas of these networks are the foundations for most current state-of-the-art architectures.\n", "Thus, it is important to understand these architectures in detail and learn how to implement them.\n", "This notebook is part of a lecture series on Deep Learning at the University of Amsterdam.\n", "The full list of tutorials can be found at https://uvadlc-notebooks.rtfd.io.\n", "\n", "\n", "---\n", "Open in [![Open In Colab](){height=\"20px\" width=\"117px\"}](https://colab.research.google.com/github/PytorchLightning/lightning-tutorials/blob/publication/.notebooks/course_UvA-DL/04-inception-resnet-densenet.ipynb)\n", "\n", "Give us a \u2b50 [on Github](https://www.github.com/PytorchLightning/pytorch-lightning/)\n", "| Check out [the documentation](https://pytorch-lightning.readthedocs.io/en/latest/)\n", "| Join us [on Slack](https://join.slack.com/t/pytorch-lightning/shared_invite/zt-pw5v393p-qRaDgEk24~EjiZNBpSQFgQ)"]}, {"cell_type": "markdown", "id": "047ed0ea", "metadata": {"papermill": {"duration": 0.122263, "end_time": "2021-12-04T15:56:50.594054", "exception": false, "start_time": "2021-12-04T15:56:50.471791", "status": "completed"}, "tags": []}, "source": ["## Setup\n", "This notebook requires some packages besides pytorch-lightning."]}, {"cell_type": "code", "execution_count": 1, "id": "487ba510", "metadata": {"colab": {}, "colab_type": "code", "execution": {"iopub.execute_input": "2021-12-04T15:56:50.845118Z", "iopub.status.busy": 
"2021-12-04T15:56:50.844642Z", "iopub.status.idle": "2021-12-04T15:56:53.309346Z", "shell.execute_reply": "2021-12-04T15:56:53.309758Z"}, "id": "LfrJLKPFyhsK", "lines_to_next_cell": 0, "papermill": {"duration": 2.594206, "end_time": "2021-12-04T15:56:53.310042", "exception": false, "start_time": "2021-12-04T15:56:50.715836", "status": "completed"}, "tags": []}, "outputs": [], "source": ["! pip install --quiet \"pytorch-lightning>=1.3\" \"torchvision\" \"matplotlib\" \"torch>=1.6, <1.9\" \"tabulate\" \"seaborn\" \"torchmetrics>=0.3\""]}, {"cell_type": "markdown", "id": "3d41adef", "metadata": {"papermill": {"duration": 0.122031, "end_time": "2021-12-04T15:56:53.555792", "exception": false, "start_time": "2021-12-04T15:56:53.433761", "status": "completed"}, "tags": []}, "source": ["
\n", "Let's start with importing our standard libraries here."]}, {"cell_type": "code", "execution_count": 2, "id": "b6e98e07", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:56:53.808117Z", "iopub.status.busy": "2021-12-04T15:56:53.807640Z", "iopub.status.idle": "2021-12-04T15:56:55.699547Z", "shell.execute_reply": "2021-12-04T15:56:55.699937Z"}, "papermill": {"duration": 2.02344, "end_time": "2021-12-04T15:56:55.700099", "exception": false, "start_time": "2021-12-04T15:56:53.676659", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["/tmp/ipykernel_1009/1100401100.py:25: DeprecationWarning: `set_matplotlib_formats` is deprecated since IPython 7.23, directly use `matplotlib_inline.backend_inline.set_matplotlib_formats()`\n", " set_matplotlib_formats(\"svg\", \"pdf\") # For export\n"]}], "source": ["import os\n", "import urllib.request\n", "from types import SimpleNamespace\n", "from urllib.error import HTTPError\n", "\n", "import matplotlib\n", "import matplotlib.pyplot as plt\n", "import numpy as np\n", "import pytorch_lightning as pl\n", "import seaborn as sns\n", "import tabulate\n", "import torch\n", "import torch.nn as nn\n", "import torch.optim as optim\n", "import torch.utils.data as data\n", "import torchvision\n", "\n", "%matplotlib inline\n", "from IPython.display import HTML, display, set_matplotlib_formats\n", "from PIL import Image\n", "from pytorch_lightning.callbacks import LearningRateMonitor, ModelCheckpoint\n", "from torchvision import transforms\n", "from torchvision.datasets import CIFAR10\n", "\n", "set_matplotlib_formats(\"svg\", \"pdf\") # For export\n", "matplotlib.rcParams[\"lines.linewidth\"] = 2.0\n", "sns.reset_orig()\n", "\n", "# PyTorch\n", "# Torchvision"]}, {"cell_type": "markdown", "id": "ca1ba35c", "metadata": {"papermill": {"duration": 0.122671, "end_time": "2021-12-04T15:56:55.949046", "exception": false, "start_time": "2021-12-04T15:56:55.826375", "status": 
"completed"}, "tags": []}, "source": ["We will use the same `set_seed` function as in the previous tutorials, as well as the path variables `DATASET_PATH` and `CHECKPOINT_PATH`.\n", "Adjust the paths if necessary."]}, {"cell_type": "code", "execution_count": 3, "id": "8c2ed3ca", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:56:56.198762Z", "iopub.status.busy": "2021-12-04T15:56:56.198264Z", "iopub.status.idle": "2021-12-04T15:56:56.395384Z", "shell.execute_reply": "2021-12-04T15:56:56.394919Z"}, "papermill": {"duration": 0.324279, "end_time": "2021-12-04T15:56:56.395518", "exception": false, "start_time": "2021-12-04T15:56:56.071239", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["Global seed set to 42\n"]}], "source": ["# Path to the folder where the datasets are/should be downloaded (e.g. CIFAR10)\n", "DATASET_PATH = os.environ.get(\"PATH_DATASETS\", \"data/\")\n", "# Path to the folder where the pretrained models are saved\n", "CHECKPOINT_PATH = os.environ.get(\"PATH_CHECKPOINT\", \"saved_models/ConvNets\")\n", "\n", "\n", "# Function for setting the seed\n", "pl.seed_everything(42)\n", "\n", "# Ensure that all operations are deterministic on GPU (if used) for reproducibility\n", "torch.backends.cudnn.determinstic = True\n", "torch.backends.cudnn.benchmark = False\n", "\n", "device = torch.device(\"cuda:0\") if torch.cuda.is_available() else torch.device(\"cpu\")"]}, {"cell_type": "markdown", "id": "335391a2", "metadata": {"papermill": {"duration": 0.122428, "end_time": "2021-12-04T15:56:56.642177", "exception": false, "start_time": "2021-12-04T15:56:56.519749", "status": "completed"}, "tags": []}, "source": ["We also have pretrained models and Tensorboards (more on this later) for this tutorial, and download them below."]}, {"cell_type": "code", "execution_count": 4, "id": "218d11ab", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:56:56.895357Z", "iopub.status.busy": 
"2021-12-04T15:56:56.893762Z", "iopub.status.idle": "2021-12-04T15:56:57.854104Z", "shell.execute_reply": "2021-12-04T15:56:57.853693Z"}, "papermill": {"duration": 1.089563, "end_time": "2021-12-04T15:56:57.854235", "exception": false, "start_time": "2021-12-04T15:56:56.764672", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Downloading https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial5/GoogleNet.ckpt...\n", "Downloading https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial5/ResNet.ckpt...\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Downloading https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial5/ResNetPreAct.ckpt...\n", "Downloading https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial5/DenseNet.ckpt...\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Downloading https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial5/tensorboards/GoogleNet/events.out.tfevents.googlenet...\n", "Downloading https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial5/tensorboards/ResNet/events.out.tfevents.resnet...\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Downloading https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial5/tensorboards/ResNetPreAct/events.out.tfevents.resnetpreact...\n", "Downloading https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial5/tensorboards/DenseNet/events.out.tfevents.densenet...\n"]}], "source": ["# Github URL where saved models are stored for this tutorial\n", "base_url = \"https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial5/\"\n", "# Files to download\n", "pretrained_files = [\n", " \"GoogleNet.ckpt\",\n", " \"ResNet.ckpt\",\n", " \"ResNetPreAct.ckpt\",\n", " \"DenseNet.ckpt\",\n", " \"tensorboards/GoogleNet/events.out.tfevents.googlenet\",\n", " \"tensorboards/ResNet/events.out.tfevents.resnet\",\n", " 
\"tensorboards/ResNetPreAct/events.out.tfevents.resnetpreact\",\n", " \"tensorboards/DenseNet/events.out.tfevents.densenet\",\n", "]\n", "# Create checkpoint path if it doesn't exist yet\n", "os.makedirs(CHECKPOINT_PATH, exist_ok=True)\n", "\n", "# For each file, check whether it already exists. If not, try downloading it.\n", "for file_name in pretrained_files:\n", " file_path = os.path.join(CHECKPOINT_PATH, file_name)\n", " if \"/\" in file_name:\n", " os.makedirs(file_path.rsplit(\"/\", 1)[0], exist_ok=True)\n", " if not os.path.isfile(file_path):\n", " file_url = base_url + file_name\n", " print(f\"Downloading {file_url}...\")\n", " try:\n", " urllib.request.urlretrieve(file_url, file_path)\n", " except HTTPError as e:\n", " print(\n", " \"Something went wrong. Please try to download the file from the GDrive folder, or contact the author with the full output including the following error:\\n\",\n", " e,\n", " )"]}, {"cell_type": "markdown", "id": "8e425fea", "metadata": {"papermill": {"duration": 0.128244, "end_time": "2021-12-04T15:56:58.108919", "exception": false, "start_time": "2021-12-04T15:56:57.980675", "status": "completed"}, "tags": []}, "source": ["Throughout this tutorial, we will train and evaluate the models on the CIFAR10 dataset.\n", "This allows you to compare the results obtained here with the model you have implemented in the first assignment.\n", "As we have learned from the previous tutorial about initialization, it is important to have the data preprocessed with a zero mean.\n", "Therefore, as a first step, we will calculate the mean and standard deviation of the CIFAR dataset:"]}, {"cell_type": "code", "execution_count": 5, "id": "f33e6af1", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:56:58.376340Z", "iopub.status.busy": "2021-12-04T15:56:58.375859Z", "iopub.status.idle": "2021-12-04T15:57:01.995135Z", "shell.execute_reply": "2021-12-04T15:57:01.995523Z"}, "papermill": {"duration": 3.752594, "end_time": 
"2021-12-04T15:57:01.995688", "exception": false, "start_time": "2021-12-04T15:56:58.243094", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Files already downloaded and verified\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Data mean [0.49139968 0.48215841 0.44653091]\n", "Data std [0.24703223 0.24348513 0.26158784]\n"]}], "source": ["train_dataset = CIFAR10(root=DATASET_PATH, train=True, download=True)\n", "DATA_MEANS = (train_dataset.data / 255.0).mean(axis=(0, 1, 2))\n", "DATA_STD = (train_dataset.data / 255.0).std(axis=(0, 1, 2))\n", "print(\"Data mean\", DATA_MEANS)\n", "print(\"Data std\", DATA_STD)"]}, {"cell_type": "markdown", "id": "b37fa62e", "metadata": {"papermill": {"duration": 0.128325, "end_time": "2021-12-04T15:57:02.252178", "exception": false, "start_time": "2021-12-04T15:57:02.123853", "status": "completed"}, "tags": []}, "source": ["We will use this information to define a `transforms.Normalize` module which will normalize our data accordingly.\n", "Additionally, we will use data augmentation during training.\n", "This reduces the risk of overfitting and helps CNNs to generalize better.\n", "Specifically, we will apply two random augmentations.\n", "\n", "First, we will flip each image horizontally by a chance of 50% (`transforms.RandomHorizontalFlip`).\n", "The object class usually does not change when flipping an image, and we don't expect any image information to be dependent on the horizontal orientation.\n", "This would be however different if we would try to detect digits or letters in an image, as those have a certain orientation.\n", "\n", "The second augmentation we use is called `transforms.RandomResizedCrop`.\n", "This transformation scales the image in a small range, while eventually changing the aspect ratio, and crops it afterward in the previous size.\n", "Therefore, the actual pixel values change while the content or overall semantics of the image stays the 
same.\n", "\n", "We will randomly split the training dataset into a training and a validation set.\n", "The validation set will be used for determining early stopping.\n", "After finishing the training, we test the models on the CIFAR test set."]}, {"cell_type": "code", "execution_count": 6, "id": "5e411a23", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:57:02.522094Z", "iopub.status.busy": "2021-12-04T15:57:02.521619Z", "iopub.status.idle": "2021-12-04T15:57:05.007752Z", "shell.execute_reply": "2021-12-04T15:57:05.007283Z"}, "papermill": {"duration": 2.621367, "end_time": "2021-12-04T15:57:05.007890", "exception": false, "start_time": "2021-12-04T15:57:02.386523", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Files already downloaded and verified\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Files already downloaded and verified\n"]}, {"name": "stderr", "output_type": "stream", "text": ["Global seed set to 42\n"]}, {"name": "stderr", "output_type": "stream", "text": ["Global seed set to 42\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Files already downloaded and verified\n"]}], "source": ["test_transform = transforms.Compose([transforms.ToTensor(), transforms.Normalize(DATA_MEANS, DATA_STD)])\n", "# For training, we add some augmentation. Networks are too powerful and would overfit.\n", "train_transform = transforms.Compose(\n", " [\n", " transforms.RandomHorizontalFlip(),\n", " transforms.RandomResizedCrop((32, 32), scale=(0.8, 1.0), ratio=(0.9, 1.1)),\n", " transforms.ToTensor(),\n", " transforms.Normalize(DATA_MEANS, DATA_STD),\n", " ]\n", ")\n", "# Loading the training dataset. 
We need to split it into a training and validation part\n", "# We need to do a little trick because the validation set should not use the augmentation.\n", "train_dataset = CIFAR10(root=DATASET_PATH, train=True, transform=train_transform, download=True)\n", "val_dataset = CIFAR10(root=DATASET_PATH, train=True, transform=test_transform, download=True)\n", "pl.seed_everything(42)\n", "train_set, _ = torch.utils.data.random_split(train_dataset, [45000, 5000])\n", "pl.seed_everything(42)\n", "_, val_set = torch.utils.data.random_split(val_dataset, [45000, 5000])\n", "\n", "# Loading the test set\n", "test_set = CIFAR10(root=DATASET_PATH, train=False, transform=test_transform, download=True)\n", "\n", "# We define a set of data loaders that we can use for various purposes later.\n", "train_loader = data.DataLoader(train_set, batch_size=128, shuffle=True, drop_last=True, pin_memory=True, num_workers=4)\n", "val_loader = data.DataLoader(val_set, batch_size=128, shuffle=False, drop_last=False, num_workers=4)\n", "test_loader = data.DataLoader(test_set, batch_size=128, shuffle=False, drop_last=False, num_workers=4)"]}, {"cell_type": "markdown", "id": "939e3864", "metadata": {"papermill": {"duration": 0.132752, "end_time": "2021-12-04T15:57:05.272691", "exception": false, "start_time": "2021-12-04T15:57:05.139939", "status": "completed"}, "tags": []}, "source": ["To verify that our normalization works, we can print out the mean and standard deviation of the single batch.\n", "The mean should be close to 0 and the standard deviation close to 1 for each channel:"]}, {"cell_type": "code", "execution_count": 7, "id": "1cecadf2", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:57:05.545013Z", "iopub.status.busy": "2021-12-04T15:57:05.544534Z", "iopub.status.idle": "2021-12-04T15:57:09.246817Z", "shell.execute_reply": "2021-12-04T15:57:09.247213Z"}, "papermill": {"duration": 3.840259, "end_time": "2021-12-04T15:57:09.247384", "exception": false, "start_time": 
"2021-12-04T15:57:05.407125", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Batch mean tensor([-0.0088, -0.0180, -0.0446])\n", "Batch std tensor([0.9446, 0.9240, 0.9487])\n"]}], "source": ["imgs, _ = next(iter(train_loader))\n", "print(\"Batch mean\", imgs.mean(dim=[0, 2, 3]))\n", "print(\"Batch std\", imgs.std(dim=[0, 2, 3]))"]}, {"cell_type": "markdown", "id": "4523d138", "metadata": {"papermill": {"duration": 0.134355, "end_time": "2021-12-04T15:57:09.514896", "exception": false, "start_time": "2021-12-04T15:57:09.380541", "status": "completed"}, "tags": []}, "source": ["Finally, let's visualize a few images from the training set, and how they look like after random data augmentation:"]}, {"cell_type": "code", "execution_count": 8, "id": "380c3c39", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:57:09.787847Z", "iopub.status.busy": "2021-12-04T15:57:09.787368Z", "iopub.status.idle": "2021-12-04T15:57:09.932044Z", "shell.execute_reply": "2021-12-04T15:57:09.932440Z"}, "papermill": {"duration": 0.284584, "end_time": "2021-12-04T15:57:09.932602", "exception": false, "start_time": "2021-12-04T15:57:09.648018", "status": "completed"}, "tags": []}, "outputs": [{"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-12-04T16:57:09.848870\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}], "source": ["NUM_IMAGES = 4\n", "images = [train_dataset[idx][0] for idx in range(NUM_IMAGES)]\n", "orig_images = [Image.fromarray(train_dataset.data[idx]) for idx in range(NUM_IMAGES)]\n", "orig_images = [test_transform(img) for img in orig_images]\n", "\n", "img_grid = torchvision.utils.make_grid(torch.stack(images + orig_images, dim=0), nrow=4, normalize=True, pad_value=0.5)\n", "img_grid = img_grid.permute(1, 2, 0)\n", "\n", "plt.figure(figsize=(8, 8))\n", "plt.title(\"Augmentation examples on CIFAR10\")\n", "plt.imshow(img_grid)\n", "plt.axis(\"off\")\n", "plt.show()\n", "plt.close()"]}, {"cell_type": "markdown", "id": "1cf109b4", "metadata": {"papermill": {"duration": 0.136475, "end_time": "2021-12-04T15:57:10.205519", "exception": false, "start_time": "2021-12-04T15:57:10.069044", "status": "completed"}, "tags": []}, "source": ["## PyTorch Lightning\n", "\n", "In this notebook and in many following ones, we will make use of the library [PyTorch Lightning](https://www.pytorchlightning.ai/).\n", "PyTorch Lightning is a framework that simplifies your code needed to train, evaluate, and test a model in PyTorch.\n", "It also handles logging into [TensorBoard](https://pytorch.org/tutorials/intermediate/tensorboard_tutorial.html), a visualization toolkit for ML experiments, and saving model checkpoints automatically with minimal code overhead from our side.\n", "This is extremely helpful for us as we want to focus on implementing different model architectures and spend little time on other code overhead.\n", "Note that at the time of writing/teaching, the framework has been released in version 1.3.\n", "Future versions might have a slightly changed interface and thus might not work perfectly with the code (we will try to keep it up-to-date as much as possible).\n", "\n", "Now, we will take the first step in PyTorch Lightning, and continue to explore the framework in our other 
tutorials.\n", "PyTorch Lightning comes with a lot of useful functions, such as one for setting the seed as we have seen before:"]}, {"cell_type": "code", "execution_count": 9, "id": "9f8167cf", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:57:10.483015Z", "iopub.status.busy": "2021-12-04T15:57:10.482484Z", "iopub.status.idle": "2021-12-04T15:57:10.486516Z", "shell.execute_reply": "2021-12-04T15:57:10.486045Z"}, "papermill": {"duration": 0.143057, "end_time": "2021-12-04T15:57:10.486644", "exception": false, "start_time": "2021-12-04T15:57:10.343587", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["Global seed set to 42\n"]}, {"data": {"text/plain": ["42"]}, "execution_count": 9, "metadata": {}, "output_type": "execute_result"}], "source": ["# Setting the seed\n", "pl.seed_everything(42)"]}, {"cell_type": "markdown", "id": "b8164877", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.137277, "end_time": "2021-12-04T15:57:10.761911", "exception": false, "start_time": "2021-12-04T15:57:10.624634", "status": "completed"}, "tags": []}, "source": ["Thus, in the future, we don't have to define our own `set_seed` function anymore.\n", "\n", "In PyTorch Lightning, we define `pl.LightningModule`s (inheriting from `torch.nn.Module`) that organize our code into 5 main sections:\n", "\n", "1. Initialization (`__init__`), where we create all necessary parameters/models\n", "2. Optimizers (`configure_optimizers`) where we create the optimizers, learning rate scheduler, etc.\n", "3. Training loop (`training_step`) where we only have to define the loss calculation for a single batch (the loop of optimizer.zero_grad(), loss.backward() and optimizer.step(), as well as any logging/saving operation, is done in the background)\n", "4. Validation loop (`validation_step`) where, similarly to the training, we only have to define what should happen per step\n", "5. 
Test loop (`test_step`) which is the same as validation, only on a test set.\n", "\n", "Therefore, we don't abstract the PyTorch code, but rather organize it and define some default operations that are commonly used.\n", "If you need to change something else in your training/validation/test loop, there are many possible functions you can override (see the [docs](https://pytorch-lightning.readthedocs.io/en/stable/common/lightning_module.html) for details).\n", "\n", "Now we can look at an example of what a Lightning Module for training a CNN looks like:"]}, {"cell_type": "code", "execution_count": 10, "id": "6fac8494", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:57:11.047878Z", "iopub.status.busy": "2021-12-04T15:57:11.039872Z", "iopub.status.idle": "2021-12-04T15:57:11.049883Z", "shell.execute_reply": "2021-12-04T15:57:11.049481Z"}, "papermill": {"duration": 0.14967, "end_time": "2021-12-04T15:57:11.049991", "exception": false, "start_time": "2021-12-04T15:57:10.900321", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class CIFARModule(pl.LightningModule):\n", " def __init__(self, model_name, model_hparams, optimizer_name, optimizer_hparams):\n", " \"\"\"\n", " Inputs:\n", " model_name - Name of the model/CNN to run. Used for creating the model (see function below)\n", " model_hparams - Hyperparameters for the model, as dictionary.\n", " optimizer_name - Name of the optimizer to use. Currently supported: Adam, SGD\n", " optimizer_hparams - Hyperparameters for the optimizer, as dictionary. 
This includes learning rate, weight decay, etc.\n", " \"\"\"\n", " super().__init__()\n", " # Exports the hyperparameters to a YAML file, and create \"self.hparams\" namespace\n", " self.save_hyperparameters()\n", " # Create model\n", " self.model = create_model(model_name, model_hparams)\n", " # Create loss module\n", " self.loss_module = nn.CrossEntropyLoss()\n", " # Example input for visualizing the graph in Tensorboard\n", " self.example_input_array = torch.zeros((1, 3, 32, 32), dtype=torch.float32)\n", "\n", " def forward(self, imgs):\n", " # Forward function that is run when visualizing the graph\n", " return self.model(imgs)\n", "\n", " def configure_optimizers(self):\n", " # We will support Adam or SGD as optimizers.\n", " if self.hparams.optimizer_name == \"Adam\":\n", " # AdamW is Adam with a correct implementation of weight decay (see here\n", " # for details: https://arxiv.org/pdf/1711.05101.pdf)\n", " optimizer = optim.AdamW(self.parameters(), **self.hparams.optimizer_hparams)\n", " elif self.hparams.optimizer_name == \"SGD\":\n", " optimizer = optim.SGD(self.parameters(), **self.hparams.optimizer_hparams)\n", " else:\n", " assert False, f'Unknown optimizer: \"{self.hparams.optimizer_name}\"'\n", "\n", " # We will reduce the learning rate by 0.1 after 100 and 150 epochs\n", " scheduler = optim.lr_scheduler.MultiStepLR(optimizer, milestones=[100, 150], gamma=0.1)\n", " return [optimizer], [scheduler]\n", "\n", " def training_step(self, batch, batch_idx):\n", " # \"batch\" is the output of the training data loader.\n", " imgs, labels = batch\n", " preds = self.model(imgs)\n", " loss = self.loss_module(preds, labels)\n", " acc = (preds.argmax(dim=-1) == labels).float().mean()\n", "\n", " # Logs the accuracy per epoch to tensorboard (weighted average over batches)\n", " self.log(\"train_acc\", acc, on_step=False, on_epoch=True)\n", " self.log(\"train_loss\", loss)\n", " return loss # Return tensor to call \".backward\" on\n", "\n", " def 
validation_step(self, batch, batch_idx):\n", " imgs, labels = batch\n", " preds = self.model(imgs).argmax(dim=-1)\n", " acc = (labels == preds).float().mean()\n", " # By default logs it per epoch (weighted average over batches)\n", " self.log(\"val_acc\", acc)\n", "\n", " def test_step(self, batch, batch_idx):\n", " imgs, labels = batch\n", " preds = self.model(imgs).argmax(dim=-1)\n", " acc = (labels == preds).float().mean()\n", " # By default logs it per epoch (weighted average over batches), and returns it afterwards\n", " self.log(\"test_acc\", acc)"]}, {"cell_type": "markdown", "id": "41d60bc2", "metadata": {"papermill": {"duration": 0.137514, "end_time": "2021-12-04T15:57:11.325129", "exception": false, "start_time": "2021-12-04T15:57:11.187615", "status": "completed"}, "tags": []}, "source": ["We see that the code is organized and clear, which helps if someone else tries to understand your code.\n", "\n", "Another important part of PyTorch Lightning is the concept of callbacks.\n", "Callbacks are self-contained functions that contain the non-essential logic of your Lightning Module.\n", "They are usually called after finishing a training epoch, but can also influence other parts of your training loop.\n", "For instance, we will use the following two pre-defined callbacks: `LearningRateMonitor` and `ModelCheckpoint`.\n", "The learning rate monitor adds the current learning rate to our TensorBoard, which helps to verify that our learning rate scheduler works correctly.\n", "The model checkpoint callback allows you to customize the saving routine of your checkpoints.\n", "For instance, how many checkpoints to keep, when to save, which metric to look out for, etc.\n", "We import them below:"]}, {"cell_type": "code", "execution_count": 11, "id": "e1f870e3", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:57:11.605285Z", "iopub.status.busy": "2021-12-04T15:57:11.604819Z", "iopub.status.idle": "2021-12-04T15:57:11.606792Z", "shell.execute_reply": 
"2021-12-04T15:57:11.606380Z"}, "papermill": {"duration": 0.143447, "end_time": "2021-12-04T15:57:11.606903", "exception": false, "start_time": "2021-12-04T15:57:11.463456", "status": "completed"}, "tags": []}, "outputs": [], "source": ["# Callbacks"]}, {"cell_type": "markdown", "id": "b3894841", "metadata": {"papermill": {"duration": 0.137143, "end_time": "2021-12-04T15:57:11.881319", "exception": false, "start_time": "2021-12-04T15:57:11.744176", "status": "completed"}, "tags": []}, "source": ["To allow running multiple different models with the same Lightning module, we define a function below that maps a model name to the model class.\n", "At this stage, the dictionary `model_dict` is empty, but we will fill it throughout the notebook with our new models."]}, {"cell_type": "code", "execution_count": 12, "id": "df79310c", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:57:12.170411Z", "iopub.status.busy": "2021-12-04T15:57:12.169937Z", "iopub.status.idle": "2021-12-04T15:57:12.171891Z", "shell.execute_reply": "2021-12-04T15:57:12.171423Z"}, "papermill": {"duration": 0.151484, "end_time": "2021-12-04T15:57:12.172000", "exception": false, "start_time": "2021-12-04T15:57:12.020516", "status": "completed"}, "tags": []}, "outputs": [], "source": ["model_dict = {}\n", "\n", "\n", "def create_model(model_name, model_hparams):\n", " if model_name in model_dict:\n", " return model_dict[model_name](**model_hparams)\n", " else:\n", " assert False, f'Unknown model name \"{model_name}\". 
Available models are: {str(model_dict.keys())}'"]}, {"cell_type": "markdown", "id": "c4ffa0dc", "metadata": {"papermill": {"duration": 0.140094, "end_time": "2021-12-04T15:57:12.450270", "exception": false, "start_time": "2021-12-04T15:57:12.310176", "status": "completed"}, "tags": []}, "source": ["Similarly, to use the activation function as another hyperparameter in\n", "our model, we define a \"name to function\" dict below:"]}, {"cell_type": "code", "execution_count": 13, "id": "75f7c5d8", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:57:12.729899Z", "iopub.status.busy": "2021-12-04T15:57:12.729422Z", "iopub.status.idle": "2021-12-04T15:57:12.731428Z", "shell.execute_reply": "2021-12-04T15:57:12.730960Z"}, "papermill": {"duration": 0.142657, "end_time": "2021-12-04T15:57:12.731536", "exception": false, "start_time": "2021-12-04T15:57:12.588879", "status": "completed"}, "tags": []}, "outputs": [], "source": ["act_fn_by_name = {\"tanh\": nn.Tanh, \"relu\": nn.ReLU, \"leakyrelu\": nn.LeakyReLU, \"gelu\": nn.GELU}"]}, {"cell_type": "markdown", "id": "9e4e507a", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.137281, "end_time": "2021-12-04T15:57:13.005846", "exception": false, "start_time": "2021-12-04T15:57:12.868565", "status": "completed"}, "tags": []}, "source": ["If we passed the classes or objects directly as an argument to the Lightning module, we couldn't take advantage of PyTorch Lightning's automatic hyperparameter saving and loading.\n", "\n", "Besides the Lightning module, the second most important module in PyTorch Lightning is the `Trainer`.\n", "The trainer is responsible for executing the training steps defined in the Lightning module and completes the framework.\n", "Similar to the Lightning module, you can override any key part that you don't want to be automated, but the default settings are often the best practice.\n", "For a full overview, see the 
[documentation](https://pytorch-lightning.readthedocs.io/en/stable/common/trainer.html).\n", "The most important functions we use below are:\n", "\n", "* `trainer.fit`: Takes as input a lightning module, a training dataset, and an (optional) validation dataset.\n", "This function trains the given module on the training dataset with occasional validation (default once per epoch, can be changed)\n", "* `trainer.test`: Takes as input a model and a dataset on which we want to test.\n", "It returns the test metric on the dataset.\n", "\n", "For training and testing, we don't have to worry about things like setting the model to eval mode (`model.eval()`) as this is all done automatically.\n", "See below how we define a training function for our models:"]}, {"cell_type": "code", "execution_count": 14, "id": "70fa7f16", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:57:13.293251Z", "iopub.status.busy": "2021-12-04T15:57:13.292766Z", "iopub.status.idle": "2021-12-04T15:57:13.294781Z", "shell.execute_reply": "2021-12-04T15:57:13.294298Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 0.149211, "end_time": "2021-12-04T15:57:13.294889", "exception": false, "start_time": "2021-12-04T15:57:13.145678", "status": "completed"}, "tags": []}, "outputs": [], "source": ["def train_model(model_name, save_name=None, **kwargs):\n", " \"\"\"\n", " Inputs:\n", " model_name - Name of the model you want to run. 
Is used to look up the class in \"model_dict\"\n", " save_name (optional) - If specified, this name will be used for creating the checkpoint and logging directory.\n", " \"\"\"\n", " if save_name is None:\n", " save_name = model_name\n", "\n", " # Create a PyTorch Lightning trainer with the generation callback\n", " trainer = pl.Trainer(\n", " default_root_dir=os.path.join(CHECKPOINT_PATH, save_name), # Where to save models\n", " # We run on a single GPU (if possible)\n", " gpus=1 if str(device) == \"cuda:0\" else 0,\n", " # How many epochs to train for if no patience is set\n", " max_epochs=180,\n", " callbacks=[\n", " ModelCheckpoint(\n", " save_weights_only=True, mode=\"max\", monitor=\"val_acc\"\n", " ), # Save the best checkpoint based on the maximum val_acc recorded. Saves only weights and not optimizer\n", " LearningRateMonitor(\"epoch\"),\n", " ], # Log learning rate every epoch\n", " progress_bar_refresh_rate=1,\n", " ) # In case your notebook crashes due to the progress bar, consider increasing the refresh rate\n", " trainer.logger._log_graph = True # If True, we plot the computation graph in tensorboard\n", " trainer.logger._default_hp_metric = None # Optional logging argument that we don't need\n", "\n", " # Check whether pretrained model exists. 
If yes, load it and skip training\n", " pretrained_filename = os.path.join(CHECKPOINT_PATH, save_name + \".ckpt\")\n", " if os.path.isfile(pretrained_filename):\n", " print(f\"Found pretrained model at {pretrained_filename}, loading...\")\n", " # Automatically loads the model with the saved hyperparameters\n", " model = CIFARModule.load_from_checkpoint(pretrained_filename)\n", " else:\n", " pl.seed_everything(42) # To be reproducable\n", " model = CIFARModule(model_name=model_name, **kwargs)\n", " trainer.fit(model, train_loader, val_loader)\n", " model = CIFARModule.load_from_checkpoint(\n", " trainer.checkpoint_callback.best_model_path\n", " ) # Load best checkpoint after training\n", "\n", " # Test best model on validation and test set\n", " val_result = trainer.test(model, test_dataloaders=val_loader, verbose=False)\n", " test_result = trainer.test(model, test_dataloaders=test_loader, verbose=False)\n", " result = {\"test\": test_result[0][\"test_acc\"], \"val\": val_result[0][\"test_acc\"]}\n", "\n", " return model, result"]}, {"cell_type": "markdown", "id": "3091fdb8", "metadata": {"papermill": {"duration": 0.139091, "end_time": "2021-12-04T15:57:13.571355", "exception": false, "start_time": "2021-12-04T15:57:13.432264", "status": "completed"}, "tags": []}, "source": ["Finally, we can focus on the Convolutional Neural Networks we want to\n", "implement today: GoogleNet, ResNet, and DenseNet."]}, {"cell_type": "markdown", "id": "13b5e914", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.137839, "end_time": "2021-12-04T15:57:13.846237", "exception": false, "start_time": "2021-12-04T15:57:13.708398", "status": "completed"}, "tags": []}, "source": ["## Inception\n", "\n", "
\n", "\n", "The [GoogleNet](https://arxiv.org/abs/1409.4842), proposed in 2014, won the ImageNet Challenge because of its usage of the Inception modules.\n", "In general, we will mainly focus on the concept of Inception in this tutorial instead of the specifics of the GoogleNet, as based on Inception, there have been many follow-up works ([Inception-v2](https://arxiv.org/abs/1512.00567), [Inception-v3](https://arxiv.org/abs/1512.00567), [Inception-v4](https://arxiv.org/abs/1602.07261), [Inception-ResNet](https://arxiv.org/abs/1602.07261),...).\n", "The follow-up works mainly focus on increasing efficiency and enabling very deep Inception networks.\n", "However, for a fundamental understanding, it is sufficient to look at the original Inception block.\n", "\n", "An Inception block applies four convolution blocks separately on the same feature map: a 1x1, 3x3, and 5x5 convolution, and a max pool operation.\n", "This allows the network to look at the same data with different receptive fields.\n", "Of course, learning only 5x5 convolution would be theoretically more powerful.\n", "However, this is not only more computation and memory heavy but also tends to overfit much easier.\n", "The overall inception block looks like below (figure credit - [Szegedy et al. ](https://arxiv.org/abs/1409.4842)):\n", "\n", "
\n", "\n", "The additional 1x1 convolutions before the 3x3 and 5x5 convolutions are used for dimensionality reduction.\n", "This is especially crucial as the feature maps of all branches are merged afterward, and we don't want any explosion of feature size.\n", "As 5x5 convolutions are 25 times more expensive than 1x1 convolutions, we can save a lot of computation and parameters by reducing the dimensionality before the large convolutions.\n", "\n", "We can now try to implement the Inception Block ourselves:"]}, {"cell_type": "code", "execution_count": 15, "id": "4fa882ae", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:57:14.130278Z", "iopub.status.busy": "2021-12-04T15:57:14.129749Z", "iopub.status.idle": "2021-12-04T15:57:14.132368Z", "shell.execute_reply": "2021-12-04T15:57:14.131969Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 0.148391, "end_time": "2021-12-04T15:57:14.132478", "exception": false, "start_time": "2021-12-04T15:57:13.984087", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class InceptionBlock(nn.Module):\n", " def __init__(self, c_in, c_red: dict, c_out: dict, act_fn):\n", " \"\"\"\n", " Inputs:\n", " c_in - Number of input feature maps from the previous layers\n", " c_red - Dictionary with keys \"3x3\" and \"5x5\" specifying the output of the dimensionality reducing 1x1 convolutions\n", " c_out - Dictionary with keys \"1x1\", \"3x3\", \"5x5\", and \"max\"\n", " act_fn - Activation class constructor (e.g. 
nn.ReLU)\n", " \"\"\"\n", " super().__init__()\n", "\n", " # 1x1 convolution branch\n", " self.conv_1x1 = nn.Sequential(\n", " nn.Conv2d(c_in, c_out[\"1x1\"], kernel_size=1), nn.BatchNorm2d(c_out[\"1x1\"]), act_fn()\n", " )\n", "\n", " # 3x3 convolution branch\n", " self.conv_3x3 = nn.Sequential(\n", " nn.Conv2d(c_in, c_red[\"3x3\"], kernel_size=1),\n", " nn.BatchNorm2d(c_red[\"3x3\"]),\n", " act_fn(),\n", " nn.Conv2d(c_red[\"3x3\"], c_out[\"3x3\"], kernel_size=3, padding=1),\n", " nn.BatchNorm2d(c_out[\"3x3\"]),\n", " act_fn(),\n", " )\n", "\n", " # 5x5 convolution branch\n", " self.conv_5x5 = nn.Sequential(\n", " nn.Conv2d(c_in, c_red[\"5x5\"], kernel_size=1),\n", " nn.BatchNorm2d(c_red[\"5x5\"]),\n", " act_fn(),\n", " nn.Conv2d(c_red[\"5x5\"], c_out[\"5x5\"], kernel_size=5, padding=2),\n", " nn.BatchNorm2d(c_out[\"5x5\"]),\n", " act_fn(),\n", " )\n", "\n", " # Max-pool branch\n", " self.max_pool = nn.Sequential(\n", " nn.MaxPool2d(kernel_size=3, padding=1, stride=1),\n", " nn.Conv2d(c_in, c_out[\"max\"], kernel_size=1),\n", " nn.BatchNorm2d(c_out[\"max\"]),\n", " act_fn(),\n", " )\n", "\n", " def forward(self, x):\n", " x_1x1 = self.conv_1x1(x)\n", " x_3x3 = self.conv_3x3(x)\n", " x_5x5 = self.conv_5x5(x)\n", " x_max = self.max_pool(x)\n", " x_out = torch.cat([x_1x1, x_3x3, x_5x5, x_max], dim=1)\n", " return x_out"]}, {"cell_type": "markdown", "id": "bffa7c2d", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.137965, "end_time": "2021-12-04T15:57:14.408272", "exception": false, "start_time": "2021-12-04T15:57:14.270307", "status": "completed"}, "tags": []}, "source": ["The GoogleNet architecture consists of stacking multiple Inception blocks with occasional max pooling to reduce the height and width of the feature maps.\n", "The original GoogleNet was designed for image sizes of ImageNet (224x224 pixels) and had almost 7 million parameters.\n", "As we train on CIFAR10 with image sizes of 32x32, we don't require such a heavy architecture, and 
instead, apply a reduced version.\n", "The number of channels for dimensionality reduction and output per filter (1x1, 3x3, 5x5, and max pooling) need to be manually specified and can be changed if interested.\n", "The general intuition is to have the most filters for the 3x3\n", "convolutions, as they are powerful enough to take the context into\n", "account while requiring almost a third of the parameters of the 5x5\n", "convolution."]}, {"cell_type": "code", "execution_count": 16, "id": "85cd0c39", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:57:14.698719Z", "iopub.status.busy": "2021-12-04T15:57:14.693514Z", "iopub.status.idle": "2021-12-04T15:57:14.700699Z", "shell.execute_reply": "2021-12-04T15:57:14.700227Z"}, "papermill": {"duration": 0.152836, "end_time": "2021-12-04T15:57:14.700807", "exception": false, "start_time": "2021-12-04T15:57:14.547971", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class GoogleNet(nn.Module):\n", " def __init__(self, num_classes=10, act_fn_name=\"relu\", **kwargs):\n", " super().__init__()\n", " self.hparams = SimpleNamespace(\n", " num_classes=num_classes, act_fn_name=act_fn_name, act_fn=act_fn_by_name[act_fn_name]\n", " )\n", " self._create_network()\n", " self._init_params()\n", "\n", " def _create_network(self):\n", " # A first convolution on the original image to scale up the channel size\n", " self.input_net = nn.Sequential(\n", " nn.Conv2d(3, 64, kernel_size=3, padding=1), nn.BatchNorm2d(64), self.hparams.act_fn()\n", " )\n", " # Stacking inception blocks\n", " self.inception_blocks = nn.Sequential(\n", " InceptionBlock(\n", " 64,\n", " c_red={\"3x3\": 32, \"5x5\": 16},\n", " c_out={\"1x1\": 16, \"3x3\": 32, \"5x5\": 8, \"max\": 8},\n", " act_fn=self.hparams.act_fn,\n", " ),\n", " InceptionBlock(\n", " 64,\n", " c_red={\"3x3\": 32, \"5x5\": 16},\n", " c_out={\"1x1\": 24, \"3x3\": 48, \"5x5\": 12, \"max\": 12},\n", " act_fn=self.hparams.act_fn,\n", " ),\n", " nn.MaxPool2d(3, stride=2, 
padding=1), # 32x32 => 16x16\n", " InceptionBlock(\n", " 96,\n", " c_red={\"3x3\": 32, \"5x5\": 16},\n", " c_out={\"1x1\": 24, \"3x3\": 48, \"5x5\": 12, \"max\": 12},\n", " act_fn=self.hparams.act_fn,\n", " ),\n", " InceptionBlock(\n", " 96,\n", " c_red={\"3x3\": 32, \"5x5\": 16},\n", " c_out={\"1x1\": 16, \"3x3\": 48, \"5x5\": 16, \"max\": 16},\n", " act_fn=self.hparams.act_fn,\n", " ),\n", " InceptionBlock(\n", " 96,\n", " c_red={\"3x3\": 32, \"5x5\": 16},\n", " c_out={\"1x1\": 16, \"3x3\": 48, \"5x5\": 16, \"max\": 16},\n", " act_fn=self.hparams.act_fn,\n", " ),\n", " InceptionBlock(\n", " 96,\n", " c_red={\"3x3\": 32, \"5x5\": 16},\n", " c_out={\"1x1\": 32, \"3x3\": 48, \"5x5\": 24, \"max\": 24},\n", " act_fn=self.hparams.act_fn,\n", " ),\n", " nn.MaxPool2d(3, stride=2, padding=1), # 16x16 => 8x8\n", " InceptionBlock(\n", " 128,\n", " c_red={\"3x3\": 48, \"5x5\": 16},\n", " c_out={\"1x1\": 32, \"3x3\": 64, \"5x5\": 16, \"max\": 16},\n", " act_fn=self.hparams.act_fn,\n", " ),\n", " InceptionBlock(\n", " 128,\n", " c_red={\"3x3\": 48, \"5x5\": 16},\n", " c_out={\"1x1\": 32, \"3x3\": 64, \"5x5\": 16, \"max\": 16},\n", " act_fn=self.hparams.act_fn,\n", " ),\n", " )\n", " # Mapping to classification output\n", " self.output_net = nn.Sequential(\n", " nn.AdaptiveAvgPool2d((1, 1)), nn.Flatten(), nn.Linear(128, self.hparams.num_classes)\n", " )\n", "\n", " def _init_params(self):\n", " # Based on our discussion in Tutorial 4, we should initialize the\n", " # convolutions according to the activation function\n", " for m in self.modules():\n", " if isinstance(m, nn.Conv2d):\n", " nn.init.kaiming_normal_(m.weight, nonlinearity=self.hparams.act_fn_name)\n", " elif isinstance(m, nn.BatchNorm2d):\n", " nn.init.constant_(m.weight, 1)\n", " nn.init.constant_(m.bias, 0)\n", "\n", " def forward(self, x):\n", " x = self.input_net(x)\n", " x = self.inception_blocks(x)\n", " x = self.output_net(x)\n", " return x"]}, {"cell_type": "markdown", "id": "5a8f15ba", "metadata": 
{"papermill": {"duration": 0.138296, "end_time": "2021-12-04T15:57:14.978565", "exception": false, "start_time": "2021-12-04T15:57:14.840269", "status": "completed"}, "tags": []}, "source": ["Now, we can integrate our model to the model dictionary we defined above:"]}, {"cell_type": "code", "execution_count": 17, "id": "0d93d35b", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:57:15.257555Z", "iopub.status.busy": "2021-12-04T15:57:15.257085Z", "iopub.status.idle": "2021-12-04T15:57:15.259035Z", "shell.execute_reply": "2021-12-04T15:57:15.258543Z"}, "papermill": {"duration": 0.143062, "end_time": "2021-12-04T15:57:15.259141", "exception": false, "start_time": "2021-12-04T15:57:15.116079", "status": "completed"}, "tags": []}, "outputs": [], "source": ["model_dict[\"GoogleNet\"] = GoogleNet"]}, {"cell_type": "markdown", "id": "d57cb4bb", "metadata": {"papermill": {"duration": 0.138614, "end_time": "2021-12-04T15:57:15.536507", "exception": false, "start_time": "2021-12-04T15:57:15.397893", "status": "completed"}, "tags": []}, "source": ["The training of the model is handled by PyTorch Lightning, and we just have to define the command to start.\n", "Note that we train for almost 200 epochs, which takes about an hour on Lisa's default GPUs (GTX1080Ti).\n", "We would recommend using the saved models and train your own model if you are interested."]}, {"cell_type": "code", "execution_count": 18, "id": "0a7d2c3d", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:57:15.822049Z", "iopub.status.busy": "2021-12-04T15:57:15.821573Z", "iopub.status.idle": "2021-12-04T15:57:20.480077Z", "shell.execute_reply": "2021-12-04T15:57:20.480477Z"}, "papermill": {"duration": 4.805519, "end_time": "2021-12-04T15:57:20.480642", "exception": false, "start_time": "2021-12-04T15:57:15.675123", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": 
["/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/pytorch_lightning/trainer/connectors/callback_connector.py:90: LightningDeprecationWarning: Setting `Trainer(progress_bar_refresh_rate=1)` is deprecated in v1.5 and will be removed in v1.7. Please pass `pytorch_lightning.callbacks.progress.TQDMProgressBar` with `refresh_rate` directly to the Trainer's `callbacks` argument instead. Or, to disable the progress bar pass `enable_progress_bar = False` to the Trainer.\n", " rank_zero_deprecation(\n", "GPU available: True, used: True\n"]}, {"name": "stderr", "output_type": "stream", "text": ["TPU available: False, using: 0 TPU cores\n"]}, {"name": "stderr", "output_type": "stream", "text": ["IPU available: False, using: 0 IPUs\n"]}, {"name": "stderr", "output_type": "stream", "text": ["/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/pytorch_lightning/trainer/trainer.py:901: LightningDeprecationWarning: `trainer.test(test_dataloaders)` is deprecated in v1.4 and will be removed in v1.6. 
Use `trainer.test(dataloaders)` instead.\n", " rank_zero_deprecation(\n", "LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n"]}, {"name": "stderr", "output_type": "stream", "text": ["/usr/local/lib/python3.9/dist-packages/torch/_jit_internal.py:603: LightningDeprecationWarning: The `LightningModule.loaded_optimizer_states_dict` property is deprecated in v1.4 and will be removed in v1.6.\n", " if hasattr(mod, name):\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Found pretrained model at saved_models/ConvNets/GoogleNet.ckpt, loading...\n"]}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "d4a54ef3af5d4bcaafad8c61c3360423", "version_major": 2, "version_minor": 0}, "text/plain": ["Testing: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"name": "stderr", "output_type": "stream", "text": ["LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n"]}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "88b1b202de814778ae51007742b5610c", "version_major": 2, "version_minor": 0}, "text/plain": ["Testing: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}], "source": ["googlenet_model, googlenet_results = train_model(\n", " model_name=\"GoogleNet\",\n", " model_hparams={\"num_classes\": 10, \"act_fn_name\": \"relu\"},\n", " optimizer_name=\"Adam\",\n", " optimizer_hparams={\"lr\": 1e-3, \"weight_decay\": 1e-4},\n", ")"]}, {"cell_type": "markdown", "id": "580ed6ce", "metadata": {"papermill": {"duration": 0.145507, "end_time": "2021-12-04T15:57:20.772152", "exception": false, "start_time": "2021-12-04T15:57:20.626645", "status": "completed"}, "tags": []}, "source": ["We will compare the results later in the notebooks, but we can already print them here for a first glance:"]}, {"cell_type": "code", "execution_count": 19, "id": "00f40b04", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:57:21.066499Z", "iopub.status.busy": "2021-12-04T15:57:21.066033Z", "iopub.status.idle": 
"2021-12-04T15:57:21.068511Z", "shell.execute_reply": "2021-12-04T15:57:21.068131Z"}, "papermill": {"duration": 0.151434, "end_time": "2021-12-04T15:57:21.068618", "exception": false, "start_time": "2021-12-04T15:57:20.917184", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["GoogleNet Results {'test': 0.8970000147819519, 'val': 0.9039999842643738}\n"]}], "source": ["print(\"GoogleNet Results\", googlenet_results)"]}, {"cell_type": "markdown", "id": "c1e798a1", "metadata": {"papermill": {"duration": 0.15013, "end_time": "2021-12-04T15:57:21.364739", "exception": false, "start_time": "2021-12-04T15:57:21.214609", "status": "completed"}, "tags": []}, "source": ["### Tensorboard log\n", "\n", "A nice extra of PyTorch Lightning is the automatic logging into TensorBoard.\n", "To give you a better intuition of what TensorBoard can be used, we can look at the board that PyTorch Lightning has been generated when training the GoogleNet.\n", "TensorBoard provides an inline functionality for Jupyter notebooks, and we use it here:"]}, {"cell_type": "code", "execution_count": 20, "id": "636c7e8a", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:57:21.662240Z", "iopub.status.busy": "2021-12-04T15:57:21.661769Z", "iopub.status.idle": "2021-12-04T15:57:21.665743Z", "shell.execute_reply": "2021-12-04T15:57:21.665337Z"}, "papermill": {"duration": 0.154976, "end_time": "2021-12-04T15:57:21.665854", "exception": false, "start_time": "2021-12-04T15:57:21.510878", "status": "completed"}, "tags": []}, "outputs": [], "source": ["# Import tensorboard\n", "%load_ext tensorboard"]}, {"cell_type": "code", "execution_count": 21, "id": "172e6d41", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:57:21.964674Z", "iopub.status.busy": "2021-12-04T15:57:21.964207Z", "iopub.status.idle": "2021-12-04T15:57:23.517538Z", "shell.execute_reply": "2021-12-04T15:57:23.517924Z"}, "papermill": {"duration": 1.704031, 
"end_time": "2021-12-04T15:57:23.518088", "exception": false, "start_time": "2021-12-04T15:57:21.814057", "status": "completed"}, "tags": []}, "outputs": [{"data": {"text/html": ["\n", " \n", " \n", " "], "text/plain": [""]}, "metadata": {}, "output_type": "display_data"}], "source": ["# Opens tensorboard in notebook. Adjust the path to your CHECKPOINT_PATH!\n", "%tensorboard --logdir ../saved_models/tutorial5/tensorboards/GoogleNet/"]}, {"cell_type": "markdown", "id": "12cc6a1a", "metadata": {"papermill": {"duration": 0.152112, "end_time": "2021-12-04T15:57:23.821918", "exception": false, "start_time": "2021-12-04T15:57:23.669806", "status": "completed"}, "tags": []}, "source": ["
\n", "\n", "TensorBoard is organized in multiple tabs.\n", "The main tab is the scalar tab where we can log the development of single numbers.\n", "For example, we have plotted the training loss, accuracy, learning rate, etc.\n", "If we look at the training or validation accuracy, we can really see the impact of using a learning rate scheduler.\n", "Reducing the learning rate gives our model a nice increase in training performance.\n", "Similarly, when looking at the training loss, we see a sudden decrease at this point.\n", "However, the high numbers on the training set compared to validation indicate that our model was overfitting which is inevitable for such large networks.\n", "\n", "Another interesting tab in TensorBoard is the graph tab.\n", "It shows us the network architecture organized by building blocks from the input to the output.\n", "It basically shows the operations taken in the forward step of `CIFARModule`.\n", "Double-click on a module to open it.\n", "Feel free to explore the architecture from a different perspective.\n", "The graph visualization can often help you to validate that your model\n", "is actually doing what it is supposed to do, and you don't miss any\n", "layers in the computation graph."]}, {"cell_type": "markdown", "id": "9836e715", "metadata": {"papermill": {"duration": 0.149221, "end_time": "2021-12-04T15:57:24.120321", "exception": false, "start_time": "2021-12-04T15:57:23.971100", "status": "completed"}, "tags": []}, "source": ["## ResNet\n", "\n", "The [ResNet](https://arxiv.org/abs/1512.03385) paper is one of the [most cited AI papers](https://www.natureindex.com/news-blog/google-scholar-reveals-most-influential-papers-research-citations-twenty-twenty), and has been the foundation for neural networks with more than 1,000 layers.\n", "Despite its simplicity, the idea of residual connections is highly effective as it supports stable gradient propagation through the network.\n", "Instead of modeling $x_{l+1}=F(x_{l})$, we model 
$x_{l+1}=x_{l}+F(x_{l})$ where $F$ is a non-linear mapping (usually a sequence of NN modules like convolutions, activation functions, and normalizations).\n", "If we do backpropagation on such residual connections, we obtain:\n", "\n", "$$\\frac{\\partial x_{l+1}}{\\partial x_{l}} = \\mathbf{I} + \\frac{\\partial F(x_{l})}{\\partial x_{l}}$$\n", "\n", "The bias towards the identity matrix guarantees a stable gradient propagation that is less affected by $F$ itself.\n", "There have been many variants of ResNet proposed, which mostly concern the function $F$, or operations applied on the sum.\n", "In this tutorial, we look at two of them: the original ResNet block, and the [Pre-Activation ResNet block](https://arxiv.org/abs/1603.05027).\n", "We visually compare the blocks below (figure credit - [He et al.](https://arxiv.org/abs/1603.05027)):\n", "\n", "
\n", "\n", "The original ResNet block applies a non-linear activation function, usually ReLU, after the skip connection.\n", "In contrast, the pre-activation ResNet block applies the non-linearity at the beginning of $F$.\n", "Both have their advantages and disadvantages.\n", "For very deep networks, however, the pre-activation ResNet has been shown to perform better as the gradient flow is guaranteed to have the identity matrix as calculated above, and is not harmed by any non-linear activation applied to it.\n", "For comparison, in this notebook, we implement both ResNet types as shallow networks.\n", "\n", "Let's start with the original ResNet block.\n", "The visualization above already shows what layers are included in $F$.\n", "One special case we have to handle is when we want to reduce the image dimensions in terms of width and height.\n", "The basic ResNet block requires $F(x_{l})$ to be of the same shape as $x_{l}$.\n", "Thus, we need to change the dimensionality of $x_{l}$ as well before adding to $F(x_{l})$.\n", "The original implementation used an identity mapping with stride 2 and padded additional feature dimensions with 0.\n", "However, the more common implementation is to use a 1x1 convolution with stride 2 as it allows us to change the feature dimensionality while being efficient in parameter and computation cost.\n", "The code for the ResNet block is relatively simple, and is shown below:"]}, {"cell_type": "code", "execution_count": 22, "id": "9a388e6a", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:57:24.427355Z", "iopub.status.busy": "2021-12-04T15:57:24.426861Z", "iopub.status.idle": "2021-12-04T15:57:24.428757Z", "shell.execute_reply": "2021-12-04T15:57:24.428366Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 0.16061, "end_time": "2021-12-04T15:57:24.428877", "exception": false, "start_time": "2021-12-04T15:57:24.268267", "status": "completed"}, "tags": []}, "outputs": [], "source": ["\n", "\n", "class 
ResNetBlock(nn.Module):\n", " def __init__(self, c_in, act_fn, subsample=False, c_out=-1):\n", " \"\"\"\n", " Inputs:\n", " c_in - Number of input features\n", " act_fn - Activation class constructor (e.g. nn.ReLU)\n", " subsample - If True, we want to apply a stride inside the block and reduce the output shape by 2 in height and width\n", " c_out - Number of output features. Note that this is only relevant if subsample is True, as otherwise, c_out = c_in\n", " \"\"\"\n", " super().__init__()\n", " if not subsample:\n", " c_out = c_in\n", "\n", " # Network representing F\n", " self.net = nn.Sequential(\n", " nn.Conv2d(\n", " c_in, c_out, kernel_size=3, padding=1, stride=1 if not subsample else 2, bias=False\n", " ), # No bias needed as the Batch Norm handles it\n", " nn.BatchNorm2d(c_out),\n", " act_fn(),\n", " nn.Conv2d(c_out, c_out, kernel_size=3, padding=1, bias=False),\n", " nn.BatchNorm2d(c_out),\n", " )\n", "\n", " # 1x1 convolution with stride 2 means we take the upper left value, and transform it to new output size\n", " self.downsample = nn.Conv2d(c_in, c_out, kernel_size=1, stride=2) if subsample else None\n", " self.act_fn = act_fn()\n", "\n", " def forward(self, x):\n", " z = self.net(x)\n", " if self.downsample is not None:\n", " x = self.downsample(x)\n", " out = z + x\n", " out = self.act_fn(out)\n", " return out"]}, {"cell_type": "markdown", "id": "5935648f", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.153709, "end_time": "2021-12-04T15:57:24.734386", "exception": false, "start_time": "2021-12-04T15:57:24.580677", "status": "completed"}, "tags": []}, "source": ["The second block we implement is the pre-activation ResNet block.\n", "For this, we have to change the order of layer in `self.net`, and do not apply an activation function on the output.\n", "Additionally, the downsampling operation has to apply a non-linearity as well as the input, $x_l$, has not been processed by a non-linearity yet.\n", "Hence, the block looks as 
follows:"]}, {"cell_type": "code", "execution_count": 23, "id": "d3772982", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:57:25.038147Z", "iopub.status.busy": "2021-12-04T15:57:25.037663Z", "iopub.status.idle": "2021-12-04T15:57:25.039227Z", "shell.execute_reply": "2021-12-04T15:57:25.039608Z"}, "papermill": {"duration": 0.15651, "end_time": "2021-12-04T15:57:25.039740", "exception": false, "start_time": "2021-12-04T15:57:24.883230", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class PreActResNetBlock(nn.Module):\n", " def __init__(self, c_in, act_fn, subsample=False, c_out=-1):\n", " \"\"\"\n", " Inputs:\n", " c_in - Number of input features\n", " act_fn - Activation class constructor (e.g. nn.ReLU)\n", " subsample - If True, we want to apply a stride inside the block and reduce the output shape by 2 in height and width\n", " c_out - Number of output features. Note that this is only relevant if subsample is True, as otherwise, c_out = c_in\n", " \"\"\"\n", " super().__init__()\n", " if not subsample:\n", " c_out = c_in\n", "\n", " # Network representing F\n", " self.net = nn.Sequential(\n", " nn.BatchNorm2d(c_in),\n", " act_fn(),\n", " nn.Conv2d(c_in, c_out, kernel_size=3, padding=1, stride=1 if not subsample else 2, bias=False),\n", " nn.BatchNorm2d(c_out),\n", " act_fn(),\n", " nn.Conv2d(c_out, c_out, kernel_size=3, padding=1, bias=False),\n", " )\n", "\n", " # 1x1 convolution needs to apply non-linearity as well as not done on skip connection\n", " self.downsample = (\n", " nn.Sequential(nn.BatchNorm2d(c_in), act_fn(), nn.Conv2d(c_in, c_out, kernel_size=1, stride=2, bias=False))\n", " if subsample\n", " else None\n", " )\n", "\n", " def forward(self, x):\n", " z = self.net(x)\n", " if self.downsample is not None:\n", " x = self.downsample(x)\n", " out = z + x\n", " return out"]}, {"cell_type": "markdown", "id": "ca3b8840", "metadata": {"papermill": {"duration": 0.154836, "end_time": "2021-12-04T15:57:25.343780", 
"exception": false, "start_time": "2021-12-04T15:57:25.188944", "status": "completed"}, "tags": []}, "source": ["Similarly to the model selection, we define a dictionary to create a mapping from string to block class.\n", "We will use the string name as hyperparameter value in our model to choose between the ResNet blocks.\n", "Feel free to implement any other ResNet block type and add it here as well."]}, {"cell_type": "code", "execution_count": 24, "id": "c456c8ca", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:57:25.653668Z", "iopub.status.busy": "2021-12-04T15:57:25.653194Z", "iopub.status.idle": "2021-12-04T15:57:25.654948Z", "shell.execute_reply": "2021-12-04T15:57:25.654524Z"}, "papermill": {"duration": 0.157547, "end_time": "2021-12-04T15:57:25.655397", "exception": false, "start_time": "2021-12-04T15:57:25.497850", "status": "completed"}, "tags": []}, "outputs": [], "source": ["resnet_blocks_by_name = {\"ResNetBlock\": ResNetBlock, \"PreActResNetBlock\": PreActResNetBlock}"]}, {"cell_type": "markdown", "id": "c37cfa5a", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.149278, "end_time": "2021-12-04T15:57:25.960549", "exception": false, "start_time": "2021-12-04T15:57:25.811271", "status": "completed"}, "tags": []}, "source": ["The overall ResNet architecture consists of stacking multiple ResNet blocks, of which some are downsampling the input.\n", "When talking about ResNet blocks in the whole network, we usually group them by the same output shape.\n", "Hence, if we say the ResNet has `[3,3,3]` blocks, it means that we have 3 times a group of 3 ResNet blocks, where a subsampling is taking place in the fourth and seventh block.\n", "The ResNet with `[3,3,3]` blocks on CIFAR10 is visualized below.\n", "\n", "
\n", "\n", "The three groups operate on the resolutions $32\\times32$, $16\\times16$ and $8\\times8$ respectively.\n", "The blocks in orange denote ResNet blocks with downsampling.\n", "The same notation is used by many other implementations such as in the [torchvision library](https://pytorch.org/vision/0.11/models.html#torchvision.models.resnet18) from PyTorch.\n", "Thus, our code looks as follows:"]}, {"cell_type": "code", "execution_count": 25, "id": "8c994805", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:57:26.274254Z", "iopub.status.busy": "2021-12-04T15:57:26.273764Z", "iopub.status.idle": "2021-12-04T15:57:26.275799Z", "shell.execute_reply": "2021-12-04T15:57:26.275419Z"}, "papermill": {"duration": 0.162052, "end_time": "2021-12-04T15:57:26.275911", "exception": false, "start_time": "2021-12-04T15:57:26.113859", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class ResNet(nn.Module):\n", " def __init__(\n", " self,\n", " num_classes=10,\n", " num_blocks=[3, 3, 3],\n", " c_hidden=[16, 32, 64],\n", " act_fn_name=\"relu\",\n", " block_name=\"ResNetBlock\",\n", " **kwargs,\n", " ):\n", " \"\"\"\n", " Inputs:\n", " num_classes - Number of classification outputs (10 for CIFAR10)\n", " num_blocks - List with the number of ResNet blocks to use. The first block of each group uses downsampling, except the first.\n", " c_hidden - List with the hidden dimensionalities in the different blocks. 
Usually multiplied by 2 the deeper we go.\n", " act_fn_name - Name of the activation function to use, looked up in \"act_fn_by_name\"\n", " block_name - Name of the ResNet block, looked up in \"resnet_blocks_by_name\"\n", " \"\"\"\n", " super().__init__()\n", " assert block_name in resnet_blocks_by_name\n", " self.hparams = SimpleNamespace(\n", " num_classes=num_classes,\n", " c_hidden=c_hidden,\n", " num_blocks=num_blocks,\n", " act_fn_name=act_fn_name,\n", " act_fn=act_fn_by_name[act_fn_name],\n", " block_class=resnet_blocks_by_name[block_name],\n", " )\n", " self._create_network()\n", " self._init_params()\n", "\n", " def _create_network(self):\n", " c_hidden = self.hparams.c_hidden\n", "\n", " # A first convolution on the original image to scale up the channel size\n", " if self.hparams.block_class == PreActResNetBlock: # => Don't apply non-linearity on output\n", " self.input_net = nn.Sequential(nn.Conv2d(3, c_hidden[0], kernel_size=3, padding=1, bias=False))\n", " else:\n", " self.input_net = nn.Sequential(\n", " nn.Conv2d(3, c_hidden[0], kernel_size=3, padding=1, bias=False),\n", " nn.BatchNorm2d(c_hidden[0]),\n", " self.hparams.act_fn(),\n", " )\n", "\n", " # Creating the ResNet blocks\n", " blocks = []\n", " for block_idx, block_count in enumerate(self.hparams.num_blocks):\n", " for bc in range(block_count):\n", " # Subsample the first block of each group, except the very first one.\n", " subsample = bc == 0 and block_idx > 0\n", " blocks.append(\n", " self.hparams.block_class(\n", " c_in=c_hidden[block_idx if not subsample else (block_idx - 1)],\n", " act_fn=self.hparams.act_fn,\n", " subsample=subsample,\n", " c_out=c_hidden[block_idx],\n", " )\n", " )\n", " self.blocks = nn.Sequential(*blocks)\n", "\n", " # Mapping to classification output\n", " self.output_net = nn.Sequential(\n", " nn.AdaptiveAvgPool2d((1, 1)), nn.Flatten(), nn.Linear(c_hidden[-1], self.hparams.num_classes)\n", " )\n", "\n", " def _init_params(self):\n", " # Based on our discussion in 
Tutorial 4, we should initialize the convolutions according to the activation function\n", " # Fan-out focuses on the gradient distribution, and is commonly used in ResNets\n", " for m in self.modules():\n", " if isinstance(m, nn.Conv2d):\n", " nn.init.kaiming_normal_(m.weight, mode=\"fan_out\", nonlinearity=self.hparams.act_fn_name)\n", " elif isinstance(m, nn.BatchNorm2d):\n", " nn.init.constant_(m.weight, 1)\n", " nn.init.constant_(m.bias, 0)\n", "\n", " def forward(self, x):\n", " x = self.input_net(x)\n", " x = self.blocks(x)\n", " x = self.output_net(x)\n", " return x"]}, {"cell_type": "markdown", "id": "37b8bdf0", "metadata": {"papermill": {"duration": 0.149083, "end_time": "2021-12-04T15:57:26.573227", "exception": false, "start_time": "2021-12-04T15:57:26.424144", "status": "completed"}, "tags": []}, "source": ["We also need to add the new ResNet class to our model dictionary:"]}, {"cell_type": "code", "execution_count": 26, "id": "468df0ab", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:57:26.873446Z", "iopub.status.busy": "2021-12-04T15:57:26.872978Z", "iopub.status.idle": "2021-12-04T15:57:26.874996Z", "shell.execute_reply": "2021-12-04T15:57:26.874511Z"}, "papermill": {"duration": 0.153475, "end_time": "2021-12-04T15:57:26.875104", "exception": false, "start_time": "2021-12-04T15:57:26.721629", "status": "completed"}, "tags": []}, "outputs": [], "source": ["model_dict[\"ResNet\"] = ResNet"]}, {"cell_type": "markdown", "id": "b23a2b2b", "metadata": {"papermill": {"duration": 0.151943, "end_time": "2021-12-04T15:57:27.179422", "exception": false, "start_time": "2021-12-04T15:57:27.027479", "status": "completed"}, "tags": []}, "source": ["Finally, we can train our ResNet models.\n", "One difference to the GoogleNet training is that we explicitly use SGD with Momentum as optimizer instead of Adam.\n", "Adam often leads to a slightly worse accuracy on plain, shallow ResNets.\n", "It is not 100% clear why Adam performs worse in this 
context, but one possible explanation is related to ResNet's loss surface.\n", "ResNet has been shown to produce smoother loss surfaces than networks without skip connections (see [Li et al., 2018](https://arxiv.org/pdf/1712.09913.pdf) for details).\n", "A possible visualization of the loss surface with and without skip connections is below (figure credit - [Li et al.](https://arxiv.org/pdf/1712.09913.pdf)):\n", "\n", "
\n", "\n", "The $x$ and $y$ axes show a projection of the parameter space, and the $z$ axis shows the loss values achieved by different parameter values.\n", "On smooth surfaces like the one on the right, we might not require an adaptive learning rate such as the one Adam provides.\n", "Instead, Adam can get stuck in local optima while SGD finds the wider minima that tend to generalize better.\n", "However, to answer this question in detail, we would need an extra tutorial because it is not easy to answer.\n", "For now, we conclude: for ResNet architectures, consider the optimizer to be an important hyperparameter, and try training with both Adam and SGD.\n", "Let's train the model below with SGD:"]}, {"cell_type": "code", "execution_count": 27, "id": "73edd595", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:57:27.485930Z", "iopub.status.busy": "2021-12-04T15:57:27.485459Z", "iopub.status.idle": "2021-12-04T15:57:29.804705Z", "shell.execute_reply": "2021-12-04T15:57:29.804239Z"}, "papermill": {"duration": 2.475739, "end_time": "2021-12-04T15:57:29.804902", "exception": false, "start_time": "2021-12-04T15:57:27.329163", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/pytorch_lightning/trainer/connectors/callback_connector.py:90: LightningDeprecationWarning: Setting `Trainer(progress_bar_refresh_rate=1)` is deprecated in v1.5 and will be removed in v1.7. Please pass `pytorch_lightning.callbacks.progress.TQDMProgressBar` with `refresh_rate` directly to the Trainer's `callbacks` argument instead. 
Or, to disable the progress bar pass `enable_progress_bar = False` to the Trainer.\n", " rank_zero_deprecation(\n", "GPU available: True, used: True\n"]}, {"name": "stderr", "output_type": "stream", "text": ["TPU available: False, using: 0 TPU cores\n"]}, {"name": "stderr", "output_type": "stream", "text": ["IPU available: False, using: 0 IPUs\n"]}, {"name": "stderr", "output_type": "stream", "text": ["/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/pytorch_lightning/trainer/trainer.py:901: LightningDeprecationWarning: `trainer.test(test_dataloaders)` is deprecated in v1.4 and will be removed in v1.6. Use `trainer.test(dataloaders)` instead.\n", " rank_zero_deprecation(\n", "LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Found pretrained model at saved_models/ConvNets/ResNet.ckpt, loading...\n"]}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "b92f8c8a741b439084618bba61742bb0", "version_major": 2, "version_minor": 0}, "text/plain": ["Testing: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"name": "stderr", "output_type": "stream", "text": ["LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n"]}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "6000f7a133b44b9b96fd7c1bf554a644", "version_major": 2, "version_minor": 0}, "text/plain": ["Testing: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}], "source": ["resnet_model, resnet_results = train_model(\n", " model_name=\"ResNet\",\n", " model_hparams={\"num_classes\": 10, \"c_hidden\": [16, 32, 64], \"num_blocks\": [3, 3, 3], \"act_fn_name\": \"relu\"},\n", " optimizer_name=\"SGD\",\n", " optimizer_hparams={\"lr\": 0.1, \"momentum\": 0.9, \"weight_decay\": 1e-4},\n", ")"]}, {"cell_type": "markdown", "id": "48da8881", "metadata": {"papermill": {"duration": 0.159561, "end_time": "2021-12-04T15:57:30.121598", "exception": false, "start_time": "2021-12-04T15:57:29.962037", 
"status": "completed"}, "tags": []}, "source": ["Let's also train the pre-activation ResNet as comparison:"]}, {"cell_type": "code", "execution_count": 28, "id": "2a7deb12", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:57:30.440774Z", "iopub.status.busy": "2021-12-04T15:57:30.440297Z", "iopub.status.idle": "2021-12-04T15:57:32.785696Z", "shell.execute_reply": "2021-12-04T15:57:32.786096Z"}, "papermill": {"duration": 2.508623, "end_time": "2021-12-04T15:57:32.786264", "exception": false, "start_time": "2021-12-04T15:57:30.277641", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["GPU available: True, used: True\n"]}, {"name": "stderr", "output_type": "stream", "text": ["TPU available: False, using: 0 TPU cores\n"]}, {"name": "stderr", "output_type": "stream", "text": ["IPU available: False, using: 0 IPUs\n"]}, {"name": "stderr", "output_type": "stream", "text": ["LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Found pretrained model at saved_models/ConvNets/ResNetPreAct.ckpt, loading...\n"]}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "e84f1647ff4244d5992786cbc17d3e1b", "version_major": 2, "version_minor": 0}, "text/plain": ["Testing: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"name": "stderr", "output_type": "stream", "text": ["LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n"]}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "4542daedea6845f9b0e7df869e150283", "version_major": 2, "version_minor": 0}, "text/plain": ["Testing: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}], "source": ["resnetpreact_model, resnetpreact_results = train_model(\n", " model_name=\"ResNet\",\n", " model_hparams={\n", " \"num_classes\": 10,\n", " \"c_hidden\": [16, 32, 64],\n", " \"num_blocks\": [3, 3, 3],\n", " \"act_fn_name\": \"relu\",\n", " \"block_name\": 
\"PreActResNetBlock\",\n", " },\n", " optimizer_name=\"SGD\",\n", " optimizer_hparams={\"lr\": 0.1, \"momentum\": 0.9, \"weight_decay\": 1e-4},\n", " save_name=\"ResNetPreAct\",\n", ")"]}, {"cell_type": "markdown", "id": "9753f382", "metadata": {"papermill": {"duration": 0.166613, "end_time": "2021-12-04T15:57:33.120458", "exception": false, "start_time": "2021-12-04T15:57:32.953845", "status": "completed"}, "tags": []}, "source": ["### Tensorboard log\n", "\n", "Similarly to our GoogleNet model, we also have a TensorBoard log for the ResNet model. We can open it below."]}, {"cell_type": "code", "execution_count": 29, "id": "0880db27", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:57:33.458069Z", "iopub.status.busy": "2021-12-04T15:57:33.457596Z", "iopub.status.idle": "2021-12-04T15:57:35.014300Z", "shell.execute_reply": "2021-12-04T15:57:35.014709Z"}, "papermill": {"duration": 1.728728, "end_time": "2021-12-04T15:57:35.014873", "exception": false, "start_time": "2021-12-04T15:57:33.286145", "status": "completed"}, "tags": []}, "outputs": [{"data": {"text/html": ["\n", " \n", " \n", " "], "text/plain": [""]}, "metadata": {}, "output_type": "display_data"}], "source": ["# Opens tensorboard in notebook. Adjust the path to your CHECKPOINT_PATH! Feel free to change \"ResNet\" to \"ResNetPreAct\"\n", "%tensorboard --logdir ../saved_models/tutorial5/tensorboards/ResNet/"]}, {"cell_type": "markdown", "id": "99d58ffe", "metadata": {"papermill": {"duration": 0.167371, "end_time": "2021-12-04T15:57:35.347711", "exception": false, "start_time": "2021-12-04T15:57:35.180340", "status": "completed"}, "tags": []}, "source": ["
\n", "\n", "Feel free to explore the TensorBoard yourself, including the computation graph.\n", "In general, we can see that with SGD, the ResNet has a higher training loss than the GoogleNet in the first stage of the training.\n", "After reducing the learning rate however, the model achieves even higher validation accuracies.\n", "We compare the precise scores at the end of the notebook."]}, {"cell_type": "markdown", "id": "d632a3fd", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.165036, "end_time": "2021-12-04T15:57:35.677544", "exception": false, "start_time": "2021-12-04T15:57:35.512508", "status": "completed"}, "tags": []}, "source": ["## DenseNet\n", "\n", "
\n", "\n", "[DenseNet](https://arxiv.org/abs/1608.06993) is another architecture for enabling very deep neural networks and takes a slightly different perspective on residual connections.\n", "Instead of modeling the difference between layers, DenseNet considers residual connections as a possible way to reuse features across layers, removing any necessity to learn redundant feature maps.\n", "If we go deeper into the network, the model learns abstract features to recognize patterns.\n", "However, some complex patterns consist of a combination of abstract features (e.g. hand, face, etc.),\n", "and low-level features (e.g. edges, basic color, etc.).\n", "To find these low-level features in the deep layers, standard CNNs have to learn to copy such feature maps, which wastes a lot of parameter complexity.\n", "DenseNet provides an efficient way of reusing features by having each convolution depend on all previous input features, but add only a small number of filters to it.\n", "See the figure below for an illustration (figure credit - [Huang et al.](https://arxiv.org/abs/1608.06993)):\n", "\n", "
\n", "\n", "The last layer, called the transition layer, is responsible for reducing the dimensionality of the feature maps in height, width, and channel size.\n", "Although transition layers technically break the identity backpropagation, there are only a few of them in a network, so they don't affect the gradient flow much.\n", "\n", "We split the implementation of the layers in DenseNet into three parts: a `DenseLayer`, a `DenseBlock`, and a `TransitionLayer`.\n", "The module `DenseLayer` implements a single layer inside a dense block.\n", "It applies a 1x1 convolution for dimensionality reduction with a subsequent 3x3 convolution.\n", "The output channels are concatenated to the originals and returned.\n", "Note that we apply the Batch Normalization as the first layer of each block.\n", "This allows slightly different activations for the same features to different layers, depending on what is needed.\n", "Overall, we can implement it as follows:"]}, {"cell_type": "code", "execution_count": 30, "id": "a46957dd", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:57:36.017059Z", "iopub.status.busy": "2021-12-04T15:57:36.016566Z", "iopub.status.idle": "2021-12-04T15:57:36.018483Z", "shell.execute_reply": "2021-12-04T15:57:36.018007Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 0.173649, "end_time": "2021-12-04T15:57:36.018596", "exception": false, "start_time": "2021-12-04T15:57:35.844947", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class DenseLayer(nn.Module):\n", " def __init__(self, c_in, bn_size, growth_rate, act_fn):\n", " \"\"\"\n", " Inputs:\n", " c_in - Number of input channels\n", " bn_size - Bottleneck size (factor of growth rate) for the output of the 1x1 convolution. Typically between 2 and 4.\n", " growth_rate - Number of output channels of the 3x3 convolution\n", " act_fn - Activation class constructor (e.g. 
nn.ReLU)\n", " \"\"\"\n", " super().__init__()\n", " self.net = nn.Sequential(\n", " nn.BatchNorm2d(c_in),\n", " act_fn(),\n", " nn.Conv2d(c_in, bn_size * growth_rate, kernel_size=1, bias=False),\n", " nn.BatchNorm2d(bn_size * growth_rate),\n", " act_fn(),\n", " nn.Conv2d(bn_size * growth_rate, growth_rate, kernel_size=3, padding=1, bias=False),\n", " )\n", "\n", " def forward(self, x):\n", " out = self.net(x)\n", " out = torch.cat([out, x], dim=1)\n", " return out"]}, {"cell_type": "markdown", "id": "22c3bb8d", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.166194, "end_time": "2021-12-04T15:57:36.351919", "exception": false, "start_time": "2021-12-04T15:57:36.185725", "status": "completed"}, "tags": []}, "source": ["The module `DenseBlock` summarizes multiple dense layers applied in sequence.\n", "Each dense layer takes as input the original input concatenated with all previous layers' feature maps:"]}, {"cell_type": "code", "execution_count": 31, "id": "e2b77d5c", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:57:36.689854Z", "iopub.status.busy": "2021-12-04T15:57:36.689367Z", "iopub.status.idle": "2021-12-04T15:57:36.691378Z", "shell.execute_reply": "2021-12-04T15:57:36.690906Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 0.173592, "end_time": "2021-12-04T15:57:36.691485", "exception": false, "start_time": "2021-12-04T15:57:36.517893", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class DenseBlock(nn.Module):\n", " def __init__(self, c_in, num_layers, bn_size, growth_rate, act_fn):\n", " \"\"\"\n", " Inputs:\n", " c_in - Number of input channels\n", " num_layers - Number of dense layers to apply in the block\n", " bn_size - Bottleneck size to use in the dense layers\n", " growth_rate - Growth rate to use in the dense layers\n", " act_fn - Activation function to use in the dense layers\n", " \"\"\"\n", " super().__init__()\n", " layers = []\n", " for layer_idx in range(num_layers):\n", " # Input 
channels are original plus the feature maps from previous layers\n", " layer_c_in = c_in + layer_idx * growth_rate\n", " layers.append(DenseLayer(c_in=layer_c_in, bn_size=bn_size, growth_rate=growth_rate, act_fn=act_fn))\n", " self.block = nn.Sequential(*layers)\n", "\n", " def forward(self, x):\n", " out = self.block(x)\n", " return out"]}, {"cell_type": "markdown", "id": "41bcb65f", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.168003, "end_time": "2021-12-04T15:57:37.026310", "exception": false, "start_time": "2021-12-04T15:57:36.858307", "status": "completed"}, "tags": []}, "source": ["Finally, the `TransitionLayer` takes as input the final output of a dense block and reduces its channel dimensionality using a 1x1 convolution.\n", "To reduce the height and width dimension, we take a slightly different approach than in ResNet and apply an average pooling with kernel size 2 and stride 2.\n", "This is because we don't have an additional connection to the output that would consider the full 2x2 patch instead of a single value.\n", "Besides, it is more parameter efficient than using a 3x3 convolution with stride 2.\n", "Thus, the layer is implemented as follows:"]}, {"cell_type": "code", "execution_count": 32, "id": "2ea6e9bd", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:57:37.371597Z", "iopub.status.busy": "2021-12-04T15:57:37.371122Z", "iopub.status.idle": "2021-12-04T15:57:37.373121Z", "shell.execute_reply": "2021-12-04T15:57:37.372717Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 0.178559, "end_time": "2021-12-04T15:57:37.373229", "exception": false, "start_time": "2021-12-04T15:57:37.194670", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class TransitionLayer(nn.Module):\n", " def __init__(self, c_in, c_out, act_fn):\n", " super().__init__()\n", " self.transition = nn.Sequential(\n", " nn.BatchNorm2d(c_in),\n", " act_fn(),\n", " nn.Conv2d(c_in, c_out, kernel_size=1, bias=False),\n", " 
nn.AvgPool2d(kernel_size=2, stride=2), # Average the output for each 2x2 pixel group\n", " )\n", "\n", " def forward(self, x):\n", " return self.transition(x)"]}, {"cell_type": "markdown", "id": "2a5d631f", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.167305, "end_time": "2021-12-04T15:57:37.707771", "exception": false, "start_time": "2021-12-04T15:57:37.540466", "status": "completed"}, "tags": []}, "source": ["Now we can put everything together and create our DenseNet.\n", "To specify the number of layers, we use a similar notation as in ResNets and pass on a list of ints representing the number of layers per block.\n", "After each dense block except the last one, we apply a transition layer to reduce the dimensionality by 2."]}, {"cell_type": "code", "execution_count": 33, "id": "e61967ce", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:57:38.057964Z", "iopub.status.busy": "2021-12-04T15:57:38.049763Z", "iopub.status.idle": "2021-12-04T15:57:38.059615Z", "shell.execute_reply": "2021-12-04T15:57:38.060000Z"}, "papermill": {"duration": 0.187694, "end_time": "2021-12-04T15:57:38.060130", "exception": false, "start_time": "2021-12-04T15:57:37.872436", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class DenseNet(nn.Module):\n", " def __init__(\n", " self, num_classes=10, num_layers=[6, 6, 6, 6], bn_size=2, growth_rate=16, act_fn_name=\"relu\", **kwargs\n", " ):\n", " super().__init__()\n", " self.hparams = SimpleNamespace(\n", " num_classes=num_classes,\n", " num_layers=num_layers,\n", " bn_size=bn_size,\n", " growth_rate=growth_rate,\n", " act_fn_name=act_fn_name,\n", " act_fn=act_fn_by_name[act_fn_name],\n", " )\n", " self._create_network()\n", " self._init_params()\n", "\n", " def _create_network(self):\n", " c_hidden = self.hparams.growth_rate * self.hparams.bn_size # The start number of hidden channels\n", "\n", " # A first convolution on the original image to scale up the channel size\n", " self.input_net 
= nn.Sequential(\n", " # No batch norm or activation function as done inside the Dense layers\n", " nn.Conv2d(3, c_hidden, kernel_size=3, padding=1)\n", " )\n", "\n", " # Creating the dense blocks, eventually including transition layers\n", " blocks = []\n", " for block_idx, num_layers in enumerate(self.hparams.num_layers):\n", " blocks.append(\n", " DenseBlock(\n", " c_in=c_hidden,\n", " num_layers=num_layers,\n", " bn_size=self.hparams.bn_size,\n", " growth_rate=self.hparams.growth_rate,\n", " act_fn=self.hparams.act_fn,\n", " )\n", " )\n", " c_hidden = c_hidden + num_layers * self.hparams.growth_rate # Overall output of the dense block\n", " if block_idx < len(self.hparams.num_layers) - 1: # Don't apply transition layer on last block\n", " blocks.append(TransitionLayer(c_in=c_hidden, c_out=c_hidden // 2, act_fn=self.hparams.act_fn))\n", " c_hidden = c_hidden // 2\n", "\n", " self.blocks = nn.Sequential(*blocks)\n", "\n", " # Mapping to classification output\n", " self.output_net = nn.Sequential(\n", " nn.BatchNorm2d(c_hidden), # The features have not passed a non-linearity until here.\n", " self.hparams.act_fn(),\n", " nn.AdaptiveAvgPool2d((1, 1)),\n", " nn.Flatten(),\n", " nn.Linear(c_hidden, self.hparams.num_classes),\n", " )\n", "\n", " def _init_params(self):\n", " # Based on our discussion in Tutorial 4, we should initialize the\n", " # convolutions according to the activation function\n", " for m in self.modules():\n", " if isinstance(m, nn.Conv2d):\n", " nn.init.kaiming_normal_(m.weight, nonlinearity=self.hparams.act_fn_name)\n", " elif isinstance(m, nn.BatchNorm2d):\n", " nn.init.constant_(m.weight, 1)\n", " nn.init.constant_(m.bias, 0)\n", "\n", " def forward(self, x):\n", " x = self.input_net(x)\n", " x = self.blocks(x)\n", " x = self.output_net(x)\n", " return x"]}, {"cell_type": "markdown", "id": "8a17a3e1", "metadata": {"papermill": {"duration": 0.169685, "end_time": "2021-12-04T15:57:38.400764", "exception": false, "start_time": 
"2021-12-04T15:57:38.231079", "status": "completed"}, "tags": []}, "source": ["Let's also add the DenseNet to our model dictionary:"]}, {"cell_type": "code", "execution_count": 34, "id": "42fb9154", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:57:38.737268Z", "iopub.status.busy": "2021-12-04T15:57:38.736793Z", "iopub.status.idle": "2021-12-04T15:57:38.738365Z", "shell.execute_reply": "2021-12-04T15:57:38.738764Z"}, "papermill": {"duration": 0.172954, "end_time": "2021-12-04T15:57:38.738890", "exception": false, "start_time": "2021-12-04T15:57:38.565936", "status": "completed"}, "tags": []}, "outputs": [], "source": ["model_dict[\"DenseNet\"] = DenseNet"]}, {"cell_type": "markdown", "id": "4be858c3", "metadata": {"papermill": {"duration": 0.168419, "end_time": "2021-12-04T15:57:39.078283", "exception": false, "start_time": "2021-12-04T15:57:38.909864", "status": "completed"}, "tags": []}, "source": ["Lastly, we train our network.\n", "In contrast to ResNet, DenseNet does not show any issues with Adam, and hence we train it with this optimizer.\n", "The other hyperparameters are chosen to result in a network with a similar parameter size as the ResNet and GoogleNet.\n", "Commonly, when designing very deep networks, DenseNet is more parameter\n", "efficient than ResNet while achieving a similar or even better\n", "performance."]}, {"cell_type": "code", "execution_count": 35, "id": "e36f4881", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:57:39.415290Z", "iopub.status.busy": "2021-12-04T15:57:39.414811Z", "iopub.status.idle": "2021-12-04T15:57:44.113020Z", "shell.execute_reply": "2021-12-04T15:57:44.113406Z"}, "papermill": {"duration": 4.869343, "end_time": "2021-12-04T15:57:44.113572", "exception": false, "start_time": "2021-12-04T15:57:39.244229", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": 
["/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/pytorch_lightning/trainer/connectors/callback_connector.py:90: LightningDeprecationWarning: Setting `Trainer(progress_bar_refresh_rate=1)` is deprecated in v1.5 and will be removed in v1.7. Please pass `pytorch_lightning.callbacks.progress.TQDMProgressBar` with `refresh_rate` directly to the Trainer's `callbacks` argument instead. Or, to disable the progress bar pass `enable_progress_bar = False` to the Trainer.\n", " rank_zero_deprecation(\n", "GPU available: True, used: True\n"]}, {"name": "stderr", "output_type": "stream", "text": ["TPU available: False, using: 0 TPU cores\n"]}, {"name": "stderr", "output_type": "stream", "text": ["IPU available: False, using: 0 IPUs\n"]}, {"name": "stderr", "output_type": "stream", "text": ["/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/pytorch_lightning/trainer/trainer.py:901: LightningDeprecationWarning: `trainer.test(test_dataloaders)` is deprecated in v1.4 and will be removed in v1.6. 
Use `trainer.test(dataloaders)` instead.\n", " rank_zero_deprecation(\n", "LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Found pretrained model at saved_models/ConvNets/DenseNet.ckpt, loading...\n"]}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "c37fd9f09225462dbf011a96be37c084", "version_major": 2, "version_minor": 0}, "text/plain": ["Testing: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"name": "stderr", "output_type": "stream", "text": ["LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n"]}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "cf02514bd53f4511a0b664fc86c842b7", "version_major": 2, "version_minor": 0}, "text/plain": ["Testing: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}], "source": ["densenet_model, densenet_results = train_model(\n", " model_name=\"DenseNet\",\n", " model_hparams={\n", " \"num_classes\": 10,\n", " \"num_layers\": [6, 6, 6, 6],\n", " \"bn_size\": 2,\n", " \"growth_rate\": 16,\n", " \"act_fn_name\": \"relu\",\n", " },\n", " optimizer_name=\"Adam\",\n", " optimizer_hparams={\"lr\": 1e-3, \"weight_decay\": 1e-4},\n", ")"]}, {"cell_type": "markdown", "id": "6a712390", "metadata": {"papermill": {"duration": 0.170458, "end_time": "2021-12-04T15:57:44.457192", "exception": false, "start_time": "2021-12-04T15:57:44.286734", "status": "completed"}, "tags": []}, "source": ["### Tensorboard log\n", "\n", "Finally, we also have another TensorBoard for the DenseNet training. 
We take a look at it below:"]}, {"cell_type": "code", "execution_count": 36, "id": "1b728973", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:57:44.807975Z", "iopub.status.busy": "2021-12-04T15:57:44.807514Z", "iopub.status.idle": "2021-12-04T15:57:46.369275Z", "shell.execute_reply": "2021-12-04T15:57:46.368869Z"}, "papermill": {"duration": 1.742356, "end_time": "2021-12-04T15:57:46.369408", "exception": false, "start_time": "2021-12-04T15:57:44.627052", "status": "completed"}, "tags": []}, "outputs": [{"data": {"text/html": ["\n", " \n", " \n", " "], "text/plain": [""]}, "metadata": {}, "output_type": "display_data"}], "source": ["# Opens tensorboard in notebook. Adjust the path to your CHECKPOINT_PATH! Feel free to change \"ResNet\" to \"ResNetPreAct\"\n", "%tensorboard --logdir ../saved_models/tutorial5/tensorboards/DenseNet/"]}, {"cell_type": "markdown", "id": "e39ad034", "metadata": {"papermill": {"duration": 0.172568, "end_time": "2021-12-04T15:57:46.718239", "exception": false, "start_time": "2021-12-04T15:57:46.545671", "status": "completed"}, "tags": []}, "source": ["
\n", "\n", "The overall course of the validation accuracy and training loss resemble the training of GoogleNet, which is also related to training the network with Adam.\n", "Feel free to explore the training metrics yourself."]}, {"cell_type": "markdown", "id": "6bad2177", "metadata": {"papermill": {"duration": 0.171587, "end_time": "2021-12-04T15:57:47.073199", "exception": false, "start_time": "2021-12-04T15:57:46.901612", "status": "completed"}, "tags": []}, "source": ["## Conclusion and Comparison\n", "\n", "After discussing each model separately, and training all of them, we can finally compare them.\n", "First, let's organize the results of all models in a table:"]}, {"cell_type": "code", "execution_count": 37, "id": "8e60b85a", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:57:47.427909Z", "iopub.status.busy": "2021-12-04T15:57:47.427445Z", "iopub.status.idle": "2021-12-04T15:57:47.430369Z", "shell.execute_reply": "2021-12-04T15:57:47.429973Z"}, "papermill": {"duration": 0.183449, "end_time": "2021-12-04T15:57:47.430477", "exception": false, "start_time": "2021-12-04T15:57:47.247028", "status": "completed"}, "tags": []}, "outputs": [{"data": {"text/html": ["\n", "\n"], "text/plain": [""]}, "metadata": {}, "output_type": "display_data"}], "source": ["%%html\n", "\n", ""]}, {"cell_type": "code", "execution_count": 38, "id": "800aabe6", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:57:47.801905Z", "iopub.status.busy": "2021-12-04T15:57:47.801437Z", "iopub.status.idle": "2021-12-04T15:57:47.804116Z", "shell.execute_reply": "2021-12-04T15:57:47.803654Z"}, "papermill": {"duration": 0.198645, "end_time": "2021-12-04T15:57:47.804225", "exception": false, "start_time": "2021-12-04T15:57:47.605580", "status": "completed"}, "tags": []}, "outputs": [{"data": {"text/html": ["\n", "\n", "\n", "\n", "\n", "\n", "\n", "\n", "\n", "\n", "
Model Val Accuracy Test Accuracy Num Parameters
GoogleNet 90.40% 89.70% 260,650
ResNet 91.84% 91.06% 272,378
ResNetPreAct91.80% 91.07% 272,250
DenseNet 90.72% 90.23% 239,146
"], "text/plain": [""]}, "metadata": {}, "output_type": "display_data"}], "source": ["all_models = [\n", " (\"GoogleNet\", googlenet_results, googlenet_model),\n", " (\"ResNet\", resnet_results, resnet_model),\n", " (\"ResNetPreAct\", resnetpreact_results, resnetpreact_model),\n", " (\"DenseNet\", densenet_results, densenet_model),\n", "]\n", "table = [\n", " [\n", " model_name,\n", " f\"{100.0*model_results['val']:4.2f}%\",\n", " f\"{100.0*model_results['test']:4.2f}%\",\n", " f\"{sum(np.prod(p.shape) for p in model.parameters()):,}\",\n", " ]\n", " for model_name, model_results, model in all_models\n", "]\n", "display(\n", " HTML(\n", " tabulate.tabulate(table, tablefmt=\"html\", headers=[\"Model\", \"Val Accuracy\", \"Test Accuracy\", \"Num Parameters\"])\n", " )\n", ")"]}, {"cell_type": "markdown", "id": "73c70307", "metadata": {"papermill": {"duration": 0.17902, "end_time": "2021-12-04T15:57:48.160604", "exception": false, "start_time": "2021-12-04T15:57:47.981584", "status": "completed"}, "tags": []}, "source": ["First of all, we see that all models are performing reasonably well.\n", "Simple models as you have implemented them in the practical achieve considerably lower performance, which is beside the lower number of parameters also attributed to the architecture design choice.\n", "GoogleNet is the model to obtain the lowest performance on the validation and test set, although it is very close to DenseNet.\n", "A proper hyperparameter search over all the channel sizes in GoogleNet would likely improve the accuracy of the model to a similar level, but this is also expensive given a large number of hyperparameters.\n", "ResNet outperforms both DenseNet and GoogleNet by more than 1% on the validation set, while there is a minor difference between both versions, original and pre-activation.\n", "We can conclude that for shallow networks, the place of the activation function does not seem to be crucial, although papers have reported the contrary for very deep 
networks (e.g. [He et al.](https://arxiv.org/abs/1603.05027)).\n", "\n", "In general, we can conclude that ResNet is a simple but powerful architecture.\n", "If we applied the models to more complex tasks with larger images and more layers inside the networks, we would likely see a bigger gap between GoogleNet and skip-connection architectures like ResNet and DenseNet.\n", "A comparison with deeper models on CIFAR10 can, for example, be found [here](https://github.com/kuangliu/pytorch-cifar).\n", "Interestingly, DenseNet outperforms the original ResNet on their setup but comes closely behind the Pre-Activation ResNet.\n", "The best model, a Dual Path Network\n", "([Chen et al.](https://arxiv.org/abs/1707.01629)), is actually a combination of\n", "ResNet and DenseNet, showing that both offer different advantages."]}, {"cell_type": "markdown", "id": "202e03f1", "metadata": {"papermill": {"duration": 0.175905, "end_time": "2021-12-04T15:57:48.512460", "exception": false, "start_time": "2021-12-04T15:57:48.336555", "status": "completed"}, "tags": []}, "source": ["### Which model should I choose for my task?\n", "\n", "We have reviewed four different models.\n", "So, which one should we choose if we are given a new task?\n", "Usually, starting with a ResNet is a good idea given its superior performance on the CIFAR dataset and its simple implementation.\n", "Besides, for the parameter number we have chosen here, ResNet is the fastest as DenseNet and GoogleNet have many more layers that are applied in sequence in our primitive implementation.\n", "However, if you have a really difficult task, such as semantic\n", "segmentation on HD images, more complex variants of ResNet and DenseNet\n", "are recommended."]}, {"cell_type": "markdown", "id": "50fb705d", "metadata": {"papermill": {"duration": 0.175468, "end_time": "2021-12-04T15:57:48.863314", "exception": false, "start_time": "2021-12-04T15:57:48.687846", "status": "completed"}, "tags": []}, "source": ["## 
Congratulations - Time to Join the Community!\n", "\n", "Congratulations on completing this notebook tutorial! If you enjoyed this and would like to join the Lightning\n", "movement, you can do so in the following ways!\n", "\n", "### Star [Lightning](https://github.com/PyTorchLightning/pytorch-lightning) on GitHub\n", "The easiest way to help our community is just by starring the GitHub repos! This helps raise awareness of the cool\n", "tools we're building.\n", "\n", "### Join our [Slack](https://join.slack.com/t/pytorch-lightning/shared_invite/zt-pw5v393p-qRaDgEk24~EjiZNBpSQFgQ)!\n", "The best way to keep up to date on the latest advancements is to join our community! Make sure to introduce yourself\n", "and share your interests in `#general` channel\n", "\n", "\n", "### Contributions !\n", "The best way to contribute to our community is to become a code contributor! At any time you can go to\n", "[Lightning](https://github.com/PyTorchLightning/pytorch-lightning) or [Bolt](https://github.com/PyTorchLightning/lightning-bolts)\n", "GitHub Issues page and filter for \"good first issue\".\n", "\n", "* [Lightning good first issue](https://github.com/PyTorchLightning/pytorch-lightning/issues?q=is%3Aopen+is%3Aissue+label%3A%22good+first+issue%22)\n", "* [Bolt good first issue](https://github.com/PyTorchLightning/lightning-bolts/issues?q=is%3Aopen+is%3Aissue+label%3A%22good+first+issue%22)\n", "* You can also contribute your own notebooks with useful examples !\n", "\n", "### Great thanks from the entire Pytorch Lightning Team for your interest !\n", "\n", "[![Pytorch Lightning](){height=\"60px\" width=\"240px\"}](https://pytorchlightning.ai)"]}, {"cell_type": "raw", "metadata": {"raw_mimetype": "text/restructuredtext"}, "source": [".. customcarditem::\n", " :header: Tutorial 4: Inception, ResNet and DenseNet\n", " :card_description: In this tutorial, we will implement and discuss variants of modern CNN architectures. 
There have been many different architectures been proposed over the past few years. Some...\n", " :tags: Image,GPU/TPU,UvA-DL-Course\n", " :image: _static/images/course_UvA-DL/04-inception-resnet-densenet.jpg"]}], "metadata": {"jupytext": {"cell_metadata_filter": "id,colab,colab_type,-all", "formats": "ipynb,py:percent", "main_language": "python"}, "language_info": {"codemirror_mode": {"name": "ipython", "version": 3}, "file_extension": ".py", "mimetype": "text/x-python", "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.9.7"}, "papermill": {"default_parameters": {}, "duration": 61.494311, "end_time": "2021-12-04T15:57:50.353007", "environment_variables": {}, "exception": null, "input_path": "course_UvA-DL/04-inception-resnet-densenet/Inception_ResNet_DenseNet.ipynb", "output_path": ".notebooks/course_UvA-DL/04-inception-resnet-densenet.ipynb", "parameters": {}, "start_time": "2021-12-04T15:56:48.858696", "version": "2.3.3"}, "widgets": {"application/vnd.jupyter.widget-state+json": {"state": {"004122da18ba429f94c52eb1fae5340c": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_38d235ee850740368e877d28bb73f631", "placeholder": "\u200b", "style": "IPY_MODEL_022d04c15a7a40c1870c2a80cd397672", "value": "Testing: 100%"}}, "00a940952c5f49e98ca15e3623f74168": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", 
"_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "022d04c15a7a40c1870c2a80cd397672": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "04e7c8c74bca444e941f03d85f3cfb3f": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_e627c1b61a864374b8d87fead8d00fd1", "max": 1.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_b02d79366d6a49c7b9f5840d94533fae", "value": 1.0}}, "076947cb26da40f89c1c1972f76139a3": {"model_module": 
"@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "0da45269292640a09a53ff5a1a4d44ab": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, 
"min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "118ae85712494119a362f39f76d62852": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "14b309fa97bf436ebea932b9d1c99b7a": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_6d72bfd4b6f94f61a3f626f29c690a39", "placeholder": "\u200b", "style": "IPY_MODEL_42a8b2e0205b4d1097c8b97d532f6ed9", "value": " 40/40 [00:00<00:00, 74.95it/s]"}}, "16bf296c023d48c0a08547e9c8332279": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "185245d8a5a14167bfdcddbd1262cd1a": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", 
"_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_076947cb26da40f89c1c1972f76139a3", "placeholder": "\u200b", "style": "IPY_MODEL_8390973957a74be9969d427649734c45", "value": " 79/79 [00:01<00:00, 88.62it/s]"}}, "1963d06751de49fba491644790475b8d": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_7d5327eea6524d07acda5225f552e010", "max": 1.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_6f8ec09e1ef24c11ae3bc5ae151a4568", "value": 1.0}}, "1c5ea7a5eb5d46f18b5b5d2da5d0e1cc": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_00a940952c5f49e98ca15e3623f74168", "placeholder": "\u200b", "style": "IPY_MODEL_74efd30822274ed89911d1bf644ce3ca", "value": " 79/79 [00:00<00:00, 123.78it/s]"}}, "352ddbe0e937449b9c2cac2f6e201121": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": 
"@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "38d235ee850740368e877d28bb73f631": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "3a6311c097a3455cb2d71f023e8d4d8f": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "3b2ff86eb87949bcaa63b16a35aebaca": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": 
"FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_93686022ddb8443faf4f5451d731b796", "max": 1.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_3a6311c097a3455cb2d71f023e8d4d8f", "value": 1.0}}, "41a45b5de3914d8f942a3cef02cf377b": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "4296ffe355d14d4bac17df7d1425a410": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": 
"100%"}}, "42a8b2e0205b4d1097c8b97d532f6ed9": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "44586163a7ec4db7bd0c32aff969aefc": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "4542daedea6845f9b0e7df869e150283": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": 
"HBoxView", "box_style": "", "children": ["IPY_MODEL_c0250bb5c8c4472fafccb35b520586e4", "IPY_MODEL_c0d08635227c47b4ad6cad2c2a37f925", "IPY_MODEL_1c5ea7a5eb5d46f18b5b5d2da5d0e1cc"], "layout": "IPY_MODEL_a125c1f239c640b1ab4cbec01e92bbb6"}}, "473521a5bc274985a92e69de0abd4f4b": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "4a3504d97bfa49f0ac3f87e109978777": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "4b76c0b6cd5e461e84eba9db81f50cbe": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", 
"_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "513cfb186fbd4c01bdacc7feea4bdb5c": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, 
"padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "53f2e1fd00bc487297fc47bac77b0732": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_a92128f9324349a7aefb31c2e503006c", "placeholder": "\u200b", "style": "IPY_MODEL_f974bb4fc58d40ccac4644c1c3e6666d", "value": "Testing: 100%"}}, "591231fc56eb4c06ad9194cff69c82c8": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "5cafd0505815497a88ef0bd271cef82a": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_473521a5bc274985a92e69de0abd4f4b", "placeholder": "\u200b", "style": "IPY_MODEL_fc013fd8d5e14e40a7d95a00ac2e2f90", "value": " 40/40 [00:00<00:00, 88.89it/s]"}}, "6000f7a133b44b9b96fd7c1bf554a644": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", 
"_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_004122da18ba429f94c52eb1fae5340c", "IPY_MODEL_6a5c7a9b7da04f2e82ef909e900754f0", "IPY_MODEL_e9a8f29f80c94231b08fadfd08e7467d"], "layout": "IPY_MODEL_dab6f379137447b0ace973fcdb0c4883"}}, "64a7eb6a4ab24ae098f0c43f6cd7af26": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "65496b20e7a24e40b31fa8f48e60a2d4": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": 
"success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_d7d3481e866640fbac41b5386ad2e9c3", "max": 1.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_41a45b5de3914d8f942a3cef02cf377b", "value": 1.0}}, "6a5c7a9b7da04f2e82ef909e900754f0": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_513cfb186fbd4c01bdacc7feea4bdb5c", "max": 1.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_ed64940063374f128c2013deb6314870", "value": 1.0}}, "6ca97f4b62c14c7bbfeb1db85fc993a2": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_77cca86506734df5b72869411d27da60", "placeholder": "\u200b", "style": "IPY_MODEL_b7279c1fe219460498493b83c026738e", "value": "Testing: 100%"}}, "6d72bfd4b6f94f61a3f626f29c690a39": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, 
"bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "6e026d193e4743a69f3692b485b5ac17": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_0da45269292640a09a53ff5a1a4d44ab", "placeholder": "\u200b", "style": "IPY_MODEL_591231fc56eb4c06ad9194cff69c82c8", "value": " 40/40 [00:00<00:00, 75.32it/s]"}}, "6f2f0240233b41469935805c777db4c2": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": 
null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "6f8ec09e1ef24c11ae3bc5ae151a4568": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "74efd30822274ed89911d1bf644ce3ca": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "75655468633246a19e817d74aa226268": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": 
null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "77cca86506734df5b72869411d27da60": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "7b7ad0926c604a54834aa8f89f2c0ebc": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", 
"align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "7d5327eea6524d07acda5225f552e010": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "7f0bfa83aa584625b4fb04a2f3e7ec2a": {"model_module": "@jupyter-widgets/controls", "model_module_version": 
"1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_4b76c0b6cd5e461e84eba9db81f50cbe", "placeholder": "\u200b", "style": "IPY_MODEL_be040e2360db45b0a40f43d3787798b1", "value": "Testing: 100%"}}, "8390973957a74be9969d427649734c45": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "863d7a5eb148478c8c413b42460f9e98": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_c53aaa5c2481470289ce280db63719e4", "placeholder": "\u200b", "style": "IPY_MODEL_4a3504d97bfa49f0ac3f87e109978777", "value": "Testing: 100%"}}, "88b1b202de814778ae51007742b5610c": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": 
["IPY_MODEL_ad24953ed75e41d6bfcc8077104e37db", "IPY_MODEL_fb3273ec5ef647f4aeccf20834da1954", "IPY_MODEL_185245d8a5a14167bfdcddbd1262cd1a"], "layout": "IPY_MODEL_f55ab7d5e72a4c4a9ef5848f433e1b3d"}}, "8b06c3c950c14130b00f529e021afdac": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_fb6d4630bdf244f99cbf9e68a82bdc20", "placeholder": "\u200b", "style": "IPY_MODEL_16bf296c023d48c0a08547e9c8332279", "value": "Testing: 100%"}}, "8f66c046bbff4be7bd5a9214f0f14626": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "93686022ddb8443faf4f5451d731b796": 
{"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "9441a5cfb1b14598abb9a6c652e59289": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_b697e02382f6498b8a29aba192f231db", "max": 1.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_352ddbe0e937449b9c2cac2f6e201121", "value": 1.0}}, "9704fd63690c487b9beb24e4d7e2209c": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", 
"_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "9f659821a81047c2b875574e3a5e54f7": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "a125c1f239c640b1ab4cbec01e92bbb6": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, 
"grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "a92128f9324349a7aefb31c2e503006c": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "ad24953ed75e41d6bfcc8077104e37db": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": 
"@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_64a7eb6a4ab24ae098f0c43f6cd7af26", "placeholder": "\u200b", "style": "IPY_MODEL_e53518709a804cdab8e26116c179730b", "value": "Testing: 100%"}}, "b02d79366d6a49c7b9f5840d94533fae": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "b0d8426a216e46af8354fe3ad3d2249f": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "b49f280f709c4cc1908bc5280cc5e728": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, 
"justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "b697e02382f6498b8a29aba192f231db": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "b7279c1fe219460498493b83c026738e": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "b92f8c8a741b439084618bba61742bb0": {"model_module": "@jupyter-widgets/controls", 
"model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_7f0bfa83aa584625b4fb04a2f3e7ec2a", "IPY_MODEL_65496b20e7a24e40b31fa8f48e60a2d4", "IPY_MODEL_5cafd0505815497a88ef0bd271cef82a"], "layout": "IPY_MODEL_6f2f0240233b41469935805c777db4c2"}}, "bbbcce7c1cd14711a307fac5253f8d00": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_75655468633246a19e817d74aa226268", "placeholder": "\u200b", "style": "IPY_MODEL_bfc08e0d2dc94323808770cf5150de04", "value": " 40/40 [00:00<00:00, 94.67it/s]"}}, "be040e2360db45b0a40f43d3787798b1": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "bfc08e0d2dc94323808770cf5150de04": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", 
"_view_name": "StyleView", "description_width": ""}}, "c0250bb5c8c4472fafccb35b520586e4": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_9f659821a81047c2b875574e3a5e54f7", "placeholder": "\u200b", "style": "IPY_MODEL_9704fd63690c487b9beb24e4d7e2209c", "value": "Testing: 100%"}}, "c0d08635227c47b4ad6cad2c2a37f925": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_7b7ad0926c604a54834aa8f89f2c0ebc", "max": 1.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_c2080e16ca2f44b28902656b9c395539", "value": 1.0}}, "c2080e16ca2f44b28902656b9c395539": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "c37fd9f09225462dbf011a96be37c084": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": 
"@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_863d7a5eb148478c8c413b42460f9e98", "IPY_MODEL_3b2ff86eb87949bcaa63b16a35aebaca", "IPY_MODEL_14b309fa97bf436ebea932b9d1c99b7a"], "layout": "IPY_MODEL_44586163a7ec4db7bd0c32aff969aefc"}}, "c53aaa5c2481470289ce280db63719e4": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "cf02514bd53f4511a0b664fc86c842b7": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": 
"", "children": ["IPY_MODEL_53f2e1fd00bc487297fc47bac77b0732", "IPY_MODEL_1963d06751de49fba491644790475b8d", "IPY_MODEL_da95394060554551a2465f7a2505d130"], "layout": "IPY_MODEL_ff9888303fc846d189e4ce73414c0a85"}}, "d4a54ef3af5d4bcaafad8c61c3360423": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_6ca97f4b62c14c7bbfeb1db85fc993a2", "IPY_MODEL_04e7c8c74bca444e941f03d85f3cfb3f", "IPY_MODEL_6e026d193e4743a69f3692b485b5ac17"], "layout": "IPY_MODEL_eb6d3d7ea0714bf181daacd91321c814"}}, "d7d3481e866640fbac41b5386ad2e9c3": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, 
"da95394060554551a2465f7a2505d130": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_b49f280f709c4cc1908bc5280cc5e728", "placeholder": "\u200b", "style": "IPY_MODEL_f1dc0af14e3a4e15b57164c87a249c7d", "value": " 79/79 [00:01<00:00, 91.28it/s]"}}, "dab6f379137447b0ace973fcdb0c4883": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "dfc83023ccbd496084ceb29ff0a8612c": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", 
"_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "e53518709a804cdab8e26116c179730b": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "e627c1b61a864374b8d87fead8d00fd1": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, 
"grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "e84f1647ff4244d5992786cbc17d3e1b": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_8b06c3c950c14130b00f529e021afdac", "IPY_MODEL_9441a5cfb1b14598abb9a6c652e59289", "IPY_MODEL_bbbcce7c1cd14711a307fac5253f8d00"], "layout": "IPY_MODEL_4296ffe355d14d4bac17df7d1425a410"}}, "e9a8f29f80c94231b08fadfd08e7467d": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_8f66c046bbff4be7bd5a9214f0f14626", "placeholder": "\u200b", "style": "IPY_MODEL_118ae85712494119a362f39f76d62852", "value": " 79/79 [00:00<00:00, 121.91it/s]"}}, "eb6d3d7ea0714bf181daacd91321c814": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", 
"_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "ed64940063374f128c2013deb6314870": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "f1dc0af14e3a4e15b57164c87a249c7d": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "f55ab7d5e72a4c4a9ef5848f433e1b3d": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": 
{"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "f974bb4fc58d40ccac4644c1c3e6666d": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "fb3273ec5ef647f4aeccf20834da1954": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_dfc83023ccbd496084ceb29ff0a8612c", "max": 
1.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_b0d8426a216e46af8354fe3ad3d2249f", "value": 1.0}}, "fb6d4630bdf244f99cbf9e68a82bdc20": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "fc013fd8d5e14e40a7d95a00ac2e2f90": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "ff9888303fc846d189e4ce73414c0a85": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": 
"@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}}, "version_major": 2, "version_minor": 0}}}, "nbformat": 4, "nbformat_minor": 5} \ No newline at end of file diff --git a/source/notebooks/course_UvA-DL/05-transformers-and-MH-attention.ipynb b/source/notebooks/course_UvA-DL/05-transformers-and-MH-attention.ipynb deleted file mode 100644 index 1700ac0..0000000 --- a/source/notebooks/course_UvA-DL/05-transformers-and-MH-attention.ipynb +++ /dev/null @@ -1 +0,0 @@ -{"cells": [{"cell_type": "markdown", "id": "829d77e5", "metadata": {"papermill": {"duration": 0.139908, "end_time": "2021-12-04T15:58:00.173929", "exception": false, "start_time": "2021-12-04T15:58:00.034021", "status": "completed"}, "tags": []}, "source": ["\n", "# Tutorial 5: Transformers and Multi-Head Attention\n", "\n", "* **Author:** Phillip Lippe\n", "* **License:** CC BY-SA\n", "* **Generated:** 2021-12-04T16:52:50.580472\n", "\n", "In this tutorial, we will discuss one of the most impactful architectures of the last 2 years: the Transformer model.\n", "Since the paper Attention Is All You Need by Vaswani et al. 
had been published in 2017,\n", "the Transformer architecture has continued to beat benchmarks in many domains, most importantly in Natural Language Processing.\n", "Transformers with an incredible amount of parameters can generate long, convincing essays, and opened up new application fields of AI.\n", "As the hype of the Transformer architecture seems not to come to an end in the next years,\n", "it is important to understand how it works, and have implemented it yourself, which we will do in this notebook.\n", "This notebook is part of a lecture series on Deep Learning at the University of Amsterdam.\n", "The full list of tutorials can be found at https://uvadlc-notebooks.rtfd.io.\n", "\n", "\n", "---\n", "Open in [![Open In Colab](){height=\"20px\" width=\"117px\"}](https://colab.research.google.com/github/PytorchLightning/lightning-tutorials/blob/publication/.notebooks/course_UvA-DL/05-transformers-and-MH-attention.ipynb)\n", "\n", "Give us a \u2b50 [on Github](https://www.github.com/PytorchLightning/pytorch-lightning/)\n", "| Check out [the documentation](https://pytorch-lightning.readthedocs.io/en/latest/)\n", "| Join us [on Slack](https://join.slack.com/t/pytorch-lightning/shared_invite/zt-pw5v393p-qRaDgEk24~EjiZNBpSQFgQ)"]}, {"cell_type": "markdown", "id": "4bd97ecd", "metadata": {"papermill": {"duration": 0.139186, "end_time": "2021-12-04T15:58:00.454648", "exception": false, "start_time": "2021-12-04T15:58:00.315462", "status": "completed"}, "tags": []}, "source": ["## Setup\n", "This notebook requires some packages besides pytorch-lightning."]}, {"cell_type": "code", "execution_count": 1, "id": "6df421c0", "metadata": {"colab": {}, "colab_type": "code", "execution": {"iopub.execute_input": "2021-12-04T15:58:00.739046Z", "iopub.status.busy": "2021-12-04T15:58:00.738548Z", "iopub.status.idle": "2021-12-04T15:58:03.208213Z", "shell.execute_reply": "2021-12-04T15:58:03.207638Z"}, "id": "LfrJLKPFyhsK", "lines_to_next_cell": 0, "papermill": {"duration": 
2.615354, "end_time": "2021-12-04T15:58:03.208358", "exception": false, "start_time": "2021-12-04T15:58:00.593004", "status": "completed"}, "tags": []}, "outputs": [], "source": ["! pip install --quiet \"torchmetrics>=0.3\" \"pytorch-lightning>=1.3\" \"torchvision\" \"torch>=1.6, <1.9\" \"matplotlib\" \"seaborn\""]}, {"cell_type": "markdown", "id": "a5126640", "metadata": {"papermill": {"duration": 0.138671, "end_time": "2021-12-04T15:58:03.486977", "exception": false, "start_time": "2021-12-04T15:58:03.348306", "status": "completed"}, "tags": []}, "source": ["
\n", "Despite the huge success of Transformers in NLP, we will _not_ include the NLP domain in our notebook here.\n", "There are many courses at the University of Amsterdam that focus on Natural Language Processing\n", "and take a closer look at the application of the Transformer architecture in NLP\n", "([NLP2](https://studiegids.uva.nl/xmlpages/page/2020-2021/zoek-vak/vak/79628),\n", "[Advanced Topics in Computational Semantics](https://studiegids.uva.nl/xmlpages/page/2020-2021/zoek-vak/vak/80162)).\n", "Furthermore, and most importantly, there is so much more to the Transformer architecture.\n", "NLP is the domain the Transformer architecture has been originally proposed for and had the greatest impact on,\n", "but it also accelerated research in other domains, recently even [Computer Vision](https://arxiv.org/abs/2010.11929).\n", "Thus, we focus here on what makes the Transformer and self-attention so powerful in general.\n", "In a second notebook, we will look at Vision Transformers, i.e. 
Transformers for image classification\n", "([link to notebook](https://uvadlc-notebooks.readthedocs.io/en/latest/tutorial_notebooks/tutorial15/Vision_Transformer.html)).\n", "\n", "Below, we import our standard libraries."]}, {"cell_type": "code", "execution_count": 2, "id": "31508898", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:58:03.772463Z", "iopub.status.busy": "2021-12-04T15:58:03.771979Z", "iopub.status.idle": "2021-12-04T15:58:05.871634Z", "shell.execute_reply": "2021-12-04T15:58:05.871226Z"}, "papermill": {"duration": 2.246581, "end_time": "2021-12-04T15:58:05.871763", "exception": false, "start_time": "2021-12-04T15:58:03.625182", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["/tmp/ipykernel_1492/2689201066.py:34: DeprecationWarning: `set_matplotlib_formats` is deprecated since IPython 7.23, directly use `matplotlib_inline.backend_inline.set_matplotlib_formats()`\n", " set_matplotlib_formats(\"svg\", \"pdf\") # For export\n", "Global seed set to 42\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Device: cuda:0\n"]}], "source": ["# Standard libraries\n", "import math\n", "import os\n", "import urllib.request\n", "from functools import partial\n", "from urllib.error import HTTPError\n", "\n", "# Plotting\n", "import matplotlib\n", "import matplotlib.pyplot as plt\n", "import numpy as np\n", "\n", "# PyTorch Lightning\n", "import pytorch_lightning as pl\n", "import seaborn as sns\n", "\n", "# PyTorch\n", "import torch\n", "import torch.nn as nn\n", "import torch.nn.functional as F\n", "import torch.optim as optim\n", "import torch.utils.data as data\n", "\n", "# Torchvision\n", "import torchvision\n", "from IPython.display import set_matplotlib_formats\n", "from pytorch_lightning.callbacks import ModelCheckpoint\n", "from torchvision import transforms\n", "from torchvision.datasets import CIFAR100\n", "from tqdm.notebook import tqdm\n", "\n", 
"plt.set_cmap(\"cividis\")\n", "%matplotlib inline\n", "set_matplotlib_formats(\"svg\", \"pdf\") # For export\n", "matplotlib.rcParams[\"lines.linewidth\"] = 2.0\n", "sns.reset_orig()\n", "\n", "# Path to the folder where the datasets are/should be downloaded (e.g. CIFAR10)\n", "DATASET_PATH = os.environ.get(\"PATH_DATASETS\", \"data/\")\n", "# Path to the folder where the pretrained models are saved\n", "CHECKPOINT_PATH = os.environ.get(\"PATH_CHECKPOINT\", \"saved_models/Transformers/\")\n", "\n", "# Setting the seed\n", "pl.seed_everything(42)\n", "\n", "# Ensure that all operations are deterministic on GPU (if used) for reproducibility\n", "torch.backends.cudnn.determinstic = True\n", "torch.backends.cudnn.benchmark = False\n", "\n", "device = torch.device(\"cuda:0\") if torch.cuda.is_available() else torch.device(\"cpu\")\n", "print(\"Device:\", device)"]}, {"cell_type": "markdown", "id": "940525e1", "metadata": {"papermill": {"duration": 0.144686, "end_time": "2021-12-04T15:58:06.158145", "exception": false, "start_time": "2021-12-04T15:58:06.013459", "status": "completed"}, "tags": []}, "source": ["Two pre-trained models are downloaded below.\n", "Make sure to have adjusted your `CHECKPOINT_PATH` before running this code if not already done."]}, {"cell_type": "code", "execution_count": 3, "id": "a7a72c1a", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:58:06.442497Z", "iopub.status.busy": "2021-12-04T15:58:06.442012Z", "iopub.status.idle": "2021-12-04T15:58:06.793103Z", "shell.execute_reply": "2021-12-04T15:58:06.792670Z"}, "papermill": {"duration": 0.496404, "end_time": "2021-12-04T15:58:06.793239", "exception": false, "start_time": "2021-12-04T15:58:06.296835", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Downloading https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial6/ReverseTask.ckpt...\n", "Downloading 
https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial6/SetAnomalyTask.ckpt...\n"]}], "source": ["# Github URL where saved models are stored for this tutorial\n", "base_url = \"https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial6/\"\n", "# Files to download\n", "pretrained_files = [\"ReverseTask.ckpt\", \"SetAnomalyTask.ckpt\"]\n", "\n", "# Create checkpoint path if it doesn't exist yet\n", "os.makedirs(CHECKPOINT_PATH, exist_ok=True)\n", "\n", "# For each file, check whether it already exists. If not, try downloading it.\n", "for file_name in pretrained_files:\n", " file_path = os.path.join(CHECKPOINT_PATH, file_name)\n", " if \"/\" in file_name:\n", " os.makedirs(file_path.rsplit(\"/\", 1)[0], exist_ok=True)\n", " if not os.path.isfile(file_path):\n", " file_url = base_url + file_name\n", " print(\"Downloading %s...\" % file_url)\n", " try:\n", " urllib.request.urlretrieve(file_url, file_path)\n", " except HTTPError as e:\n", " print(\n", " \"Something went wrong. 
Please try to download the file manually,\"\n", " \" or contact the author with the full output including the following error:\\n\",\n", " e,\n", " )"]}, {"cell_type": "markdown", "id": "1e17404e", "metadata": {"papermill": {"duration": 0.140163, "end_time": "2021-12-04T15:58:07.075728", "exception": false, "start_time": "2021-12-04T15:58:06.935565", "status": "completed"}, "tags": []}, "source": ["## The Transformer architecture\n", "\n", "In the first part of this notebook, we will implement the Transformer architecture by hand.\n", "As the architecture is so popular, there already exists a Pytorch module `nn.Transformer`\n", "([documentation](https://pytorch.org/docs/stable/generated/torch.nn.Transformer.html))\n", "and a [tutorial](https://pytorch.org/tutorials/beginner/transformer_tutorial.html)\n", "on how to use it for next token prediction.\n", "However, we will implement it here ourselves, to get through to the smallest details.\n", "\n", "There are of course many more tutorials out there about attention and Transformers.\n", "Below, we list a few that are worth exploring if you are interested in the topic\n", "and might want yet another perspective on the topic after this one:\n", "\n", "* [Transformer: A Novel Neural Network Architecture for Language Understanding\n", "(Jakob Uszkoreit, 2017)](https://ai.googleblog.com/2017/08/transformer-novel-neural-network.html) - The original Google blog post about the Transformer paper, focusing on the application in machine translation.\n", "* [The Illustrated Transformer (Jay Alammar, 2018)](http://jalammar.github.io/illustrated-transformer/) - A very popular and great blog post intuitively explaining the Transformer architecture with many nice visualizations.\n", "The focus is on NLP.\n", "* [Attention?\n", "Attention!\n", "(Lilian Weng, 2018)](https://lilianweng.github.io/lil-log/2018/06/24/attention-attention.html) - A nice blog post summarizing attention mechanisms in many domains including vision.\n", "* 
[Illustrated: Self-Attention (Raimi Karim, 2019)](https://towardsdatascience.com/illustrated-self-attention-2d627e33b20a) - A nice visualization of the steps of self-attention.\n", "Recommended going through if the explanation below is too abstract for you.\n", "* [The Transformer family (Lilian Weng, 2020)](https://lilianweng.github.io/lil-log/2020/04/07/the-transformer-family.html) - A very detailed blog post reviewing more variants of Transformers besides the original one."]}, {"cell_type": "markdown", "id": "c7a1d465", "metadata": {"papermill": {"duration": 0.14018, "end_time": "2021-12-04T15:58:07.355646", "exception": false, "start_time": "2021-12-04T15:58:07.215466", "status": "completed"}, "tags": []}, "source": ["### What is Attention?\n", "\n", "The attention mechanism describes a recent new group of layers in neural networks that has attracted\n", "a lot of interest in the past few years, especially in sequence tasks.\n", "There are a lot of different possible definitions of \"attention\" in the literature,\n", "but the one we will use here is the following: _the attention mechanism describes a weighted average\n", "of (sequence) elements with the weights dynamically computed based on an input query and elements' keys_.\n", "So what does this exactly mean?\n", "The goal is to take an average over the features of multiple elements.\n", "However, instead of weighting each element equally, we want to weight them depending on their actual values.\n", "In other words, we want to dynamically decide on which inputs we want to \"attend\" more than others.\n", "In particular, an attention mechanism has usually four parts we need to specify:\n", "\n", "* **Query**: The query is a feature vector that describes what we are looking for in the sequence, i.e. 
what we might want to pay attention to.\n", "* **Keys**: For each input element, we have a key which is again a feature vector.\n", "This feature vector roughly describes what the element is \"offering\", or when it might be important.\n", "The keys should be designed such that we can identify the elements we want to pay attention to based on the query.\n", "* **Values**: For each input element, we also have a value vector.\n", "This feature vector is the one we want to average over.\n", "* **Score function**: To rate which elements we want to pay attention to, we need to specify a score function $f_{attn}$.\n", "The score function takes the query and a key as input, and outputs the score/attention weight of the query-key pair.\n", "It is usually implemented by simple similarity metrics like a dot product, or a small MLP.\n", "\n", "\n", "The weights of the average are calculated by a softmax over all score function outputs.\n", "Hence, we assign those value vectors a higher weight whose corresponding key is most similar to the query.\n", "If we try to describe it with pseudo-math, we can write:\n", "\n", "$$\n", "\\alpha_i = \\frac{\\exp\\left(f_{attn}\\left(\\text{key}_i, \\text{query}\\right)\\right)}{\\sum_j \\exp\\left(f_{attn}\\left(\\text{key}_j, \\text{query}\\right)\\right)}, \\hspace{5mm} \\text{out} = \\sum_i \\alpha_i \\cdot \\text{value}_i\n", "$$\n", "\n", "Visually, we can show the attention over a sequence of words as follows:\n", "\n", "
\n", "\n", "For every word, we have one key and one value vector.\n", "The query is compared to all keys with a score function (in this case the dot product) to determine the weights.\n", "The softmax is not visualized for simplicity.\n", "Finally, the value vectors of all words are averaged using the attention weights.\n", "\n", "Most attention mechanisms differ in terms of what queries they use, how the key and value vectors are defined,\n", "and what score function is used.\n", "The attention applied inside the Transformer architecture is called **self-attention**.\n", "In self-attention, each sequence element provides a key, value, and query.\n", "For each element, we perform an attention layer where, based on its query,\n", "we check the similarity of all sequence elements' keys, and return a different,\n", "averaged value vector for each element.\n", "We will now go into a bit more detail by first looking at the specific implementation of the attention mechanism\n", "which is in the Transformer case the scaled dot product attention."]}, {"cell_type": "markdown", "id": "d9697f03", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.139603, "end_time": "2021-12-04T15:58:07.635701", "exception": false, "start_time": "2021-12-04T15:58:07.496098", "status": "completed"}, "tags": []}, "source": ["### Scaled Dot Product Attention\n", "\n", "The core concept behind self-attention is the scaled dot product attention.\n", "Our goal is to have an attention mechanism with which any element in a sequence can attend to any other while\n", "still being efficient to compute.\n", "The dot product attention takes as input a set of queries\n", "$Q\\in\\mathbb{R}^{T\\times d_k}$, keys $K\\in\\mathbb{R}^{T\\times d_k}$\n", "and values $V\\in\\mathbb{R}^{T\\times d_v}$ where $T$ is the sequence length,\n", "and $d_k$ and $d_v$ are the hidden dimensionality for queries/keys and values respectively.\n", "For simplicity, we neglect the batch dimension for now.\n", 
"The attention value from element $i$ to $j$ is based on its similarity of the query $Q_i$ and key $K_j$,\n", "using the dot product as the similarity metric.\n", "In math, we calculate the dot product attention as follows:\n", "\n", "$$\\text{Attention}(Q,K,V)=\\text{softmax}\\left(\\frac{QK^T}{\\sqrt{d_k}}\\right)V$$\n", "\n", "The matrix multiplication $QK^T$ performs the dot product for every possible pair of queries and keys,\n", "resulting in a matrix of the shape $T\\times T$.\n", "Each row represents the attention logits for a specific element $i$ to all other elements in the sequence.\n", "On these, we apply a softmax and multiply with the value vector to obtain a weighted mean\n", "(the weights being determined by the attention).\n", "Another perspective on this attention mechanism offers the computation graph which is visualized below\n", "(figure credit - [Vaswani et al., 2017](https://arxiv.org/abs/1706.03762)).\n", "\n", "
\n", "\n", "One aspect we haven't discussed yet is the scaling factor of $1/\\sqrt{d_k}$.\n", "This scaling factor is crucial to maintain an appropriate variance of attention values after initialization.\n", "Remember that we initialize our layers with the intention of having equal variance throughout the model, and hence,\n", "$Q$ and $K$ might also have a variance close to $1$.\n", "However, performing a dot product over two vectors with a variance $\\sigma^2$ results\n", "in a scalar having $d_k$-times higher variance:\n", "\n", "$$q_i \\sim \\mathcal{N}(0,\\sigma^2), k_i \\sim \\mathcal{N}(0,\\sigma^2) \\to \\text{Var}\\left(\\sum_{i=1}^{d_k} q_i\\cdot k_i\\right) = \\sigma^4\\cdot d_k$$\n", "\n", "\n", "If we do not scale down the variance back to $\\sim\\sigma^2$, the softmax over the logits will already saturate\n", "to $1$ for one random element and $0$ for all others.\n", "The gradients through the softmax will be close to zero so that we can't learn the parameters appropriately.\n", "Note that the extra factor of $\\sigma^2$, i.e. having $\\sigma^4$ instead of $\\sigma^2$, is usually not an issue,\n", "since we keep the original variance $\\sigma^2$ close to $1$ anyway.\n", "\n", "The block `Mask (opt.)` in the diagram above represents the optional masking of specific entries in the attention matrix.\n", "This is for instance used if we stack multiple sequences with different lengths into a batch.\n", "To still benefit from parallelization in PyTorch, we pad the sentences to the same length and mask out the padding\n", "tokens during the calculation of the attention values.\n", "This is usually done by setting the respective attention logits to a very low value.\n", "\n", "After we have discussed the details of the scaled dot product attention block, we can write a function below\n", "which computes the output features given the triple of queries, keys, and values:"]}, {"cell_type": "code", "execution_count": 4, "id": "f65c1f5d", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:58:07.923041Z", "iopub.status.busy": "2021-12-04T15:58:07.922459Z", "iopub.status.idle": "2021-12-04T15:58:07.924745Z", "shell.execute_reply": 
"2021-12-04T15:58:07.925122Z"}, "papermill": {"duration": 0.148521, "end_time": "2021-12-04T15:58:07.925250", "exception": false, "start_time": "2021-12-04T15:58:07.776729", "status": "completed"}, "tags": []}, "outputs": [], "source": ["def scaled_dot_product(q, k, v, mask=None):\n", " d_k = q.size()[-1]\n", " attn_logits = torch.matmul(q, k.transpose(-2, -1))\n", " attn_logits = attn_logits / math.sqrt(d_k)\n", " if mask is not None:\n", " attn_logits = attn_logits.masked_fill(mask == 0, -9e15)\n", " attention = F.softmax(attn_logits, dim=-1)\n", " values = torch.matmul(attention, v)\n", " return values, attention"]}, {"cell_type": "markdown", "id": "10dc2e7e", "metadata": {"papermill": {"duration": 0.139995, "end_time": "2021-12-04T15:58:08.204876", "exception": false, "start_time": "2021-12-04T15:58:08.064881", "status": "completed"}, "tags": []}, "source": ["Note that our code above supports any additional dimensionality in front of the sequence length\n", "so that we can also use it for batches.\n", "However, for a better understanding, let's generate a few random queries, keys, and value vectors,\n", "and calculate the attention outputs:"]}, {"cell_type": "code", "execution_count": 5, "id": "c417bca9", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:58:08.490138Z", "iopub.status.busy": "2021-12-04T15:58:08.489665Z", "iopub.status.idle": "2021-12-04T15:58:08.498288Z", "shell.execute_reply": "2021-12-04T15:58:08.497857Z"}, "papermill": {"duration": 0.15228, "end_time": "2021-12-04T15:58:08.498402", "exception": false, "start_time": "2021-12-04T15:58:08.346122", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["Global seed set to 42\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Q\n", " tensor([[ 0.3367, 0.1288],\n", " [ 0.2345, 0.2303],\n", " [-1.1229, -0.1863]])\n", "K\n", " tensor([[ 2.2082, -0.6380],\n", " [ 0.4617, 0.2674],\n", " [ 0.5349, 0.8094]])\n", "V\n", " tensor([[ 
1.1103, -1.6898],\n", " [-0.9890, 0.9580],\n", " [ 1.3221, 0.8172]])\n", "Values\n", " tensor([[ 0.5698, -0.1520],\n", " [ 0.5379, -0.0265],\n", " [ 0.2246, 0.5556]])\n", "Attention\n", " tensor([[0.4028, 0.2886, 0.3086],\n", " [0.3538, 0.3069, 0.3393],\n", " [0.1303, 0.4630, 0.4067]])\n"]}], "source": ["seq_len, d_k = 3, 2\n", "pl.seed_everything(42)\n", "q = torch.randn(seq_len, d_k)\n", "k = torch.randn(seq_len, d_k)\n", "v = torch.randn(seq_len, d_k)\n", "values, attention = scaled_dot_product(q, k, v)\n", "print(\"Q\\n\", q)\n", "print(\"K\\n\", k)\n", "print(\"V\\n\", v)\n", "print(\"Values\\n\", values)\n", "print(\"Attention\\n\", attention)"]}, {"cell_type": "markdown", "id": "a9d22885", "metadata": {"papermill": {"duration": 0.141388, "end_time": "2021-12-04T15:58:08.781187", "exception": false, "start_time": "2021-12-04T15:58:08.639799", "status": "completed"}, "tags": []}, "source": ["Before continuing, make sure you can follow the calculation of the specific values here, and also check it by hand.\n", "It is important to fully understand how the scaled dot product attention is calculated."]}, {"cell_type": "markdown", "id": "09bc5c7a", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.141201, "end_time": "2021-12-04T15:58:09.064542", "exception": false, "start_time": "2021-12-04T15:58:08.923341", "status": "completed"}, "tags": []}, "source": ["### Multi-Head Attention\n", "\n", "The scaled dot product attention allows a network to attend over a sequence.\n", "However, often there are multiple different aspects a sequence element wants to attend to,\n", "and a single weighted average is not a good option for it.\n", "This is why we extend the attention mechanisms to multiple heads,\n", "i.e. 
multiple different query-key-value triplets on the same features.\n", "Specifically, given a query, key, and value matrix, we transform those into $h$ sub-queries, sub-keys,\n", "and sub-values, which we pass through the scaled dot product attention independently.\n", "Afterward, we concatenate the heads and combine them with a final weight matrix.\n", "Mathematically, we can express this operation as:\n", "\n", "$$\n", "\\begin{split}\n", " \\text{Multihead}(Q,K,V) & = \\text{Concat}(\\text{head}_1,...,\\text{head}_h)W^{O}\\\\\n", " \\text{where } \\text{head}_i & = \\text{Attention}(QW_i^Q,KW_i^K, VW_i^V)\n", "\\end{split}\n", "$$\n", "\n", "We refer to this as Multi-Head Attention layer with the learnable parameters\n", "$W_{1...h}^{Q}\\in\\mathbb{R}^{D\\times d_k}$,\n", "$W_{1...h}^{K}\\in\\mathbb{R}^{D\\times d_k}$,\n", "$W_{1...h}^{V}\\in\\mathbb{R}^{D\\times d_v}$,\n", "and $W^{O}\\in\\mathbb{R}^{h\\cdot d_k\\times d_{out}}$ ($D$ being the input dimensionality).\n", "Expressed in a computational graph, we can visualize it as below\n", "(figure credit - [Vaswani et al., 2017](https://arxiv.org/abs/1706.03762)).\n", "\n", "
\n", "\n", "How are we applying a Multi-Head Attention layer in a neural network,\n", "where we don't have an arbitrary query, key, and value vector as input?\n", "Looking at the computation graph above, a simple but effective implementation is to set the current\n", "feature map in a NN, $X\\in\\mathbb{R}^{B\\times T\\times d_{\\text{model}}}$, as $Q$, $K$ and $V$\n", "($B$ being the batch size, $T$ the sequence length, $d_{\\text{model}}$ the hidden dimensionality of $X$).\n", "The consecutive weight matrices $W^{Q}$, $W^{K}$, and $W^{V}$ can transform $X$ to the corresponding\n", "feature vectors that represent the queries, keys, and values of the input.\n", "Using this approach, we can implement the Multi-Head Attention module below."]}, {"cell_type": "code", "execution_count": 6, "id": "9a857f4f", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:58:09.357800Z", "iopub.status.busy": "2021-12-04T15:58:09.357266Z", "iopub.status.idle": "2021-12-04T15:58:09.359052Z", "shell.execute_reply": "2021-12-04T15:58:09.358641Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 0.152505, "end_time": "2021-12-04T15:58:09.359159", "exception": false, "start_time": "2021-12-04T15:58:09.206654", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class MultiheadAttention(nn.Module):\n", " def __init__(self, input_dim, embed_dim, num_heads):\n", " super().__init__()\n", " assert embed_dim % num_heads == 0, \"Embedding dimension must be 0 modulo number of heads.\"\n", "\n", " self.embed_dim = embed_dim\n", " self.num_heads = num_heads\n", " self.head_dim = embed_dim // num_heads\n", "\n", " # Stack all weight matrices 1...h together for efficiency\n", " # Note that in many implementations you see \"bias=False\" which is optional\n", " self.qkv_proj = nn.Linear(input_dim, 3 * embed_dim)\n", " self.o_proj = nn.Linear(embed_dim, embed_dim)\n", "\n", " self._reset_parameters()\n", "\n", " def _reset_parameters(self):\n", " # Original Transformer 
initialization, see PyTorch documentation\n", " nn.init.xavier_uniform_(self.qkv_proj.weight)\n", " self.qkv_proj.bias.data.fill_(0)\n", " nn.init.xavier_uniform_(self.o_proj.weight)\n", " self.o_proj.bias.data.fill_(0)\n", "\n", " def forward(self, x, mask=None, return_attention=False):\n", " batch_size, seq_length, embed_dim = x.size()\n", " qkv = self.qkv_proj(x)\n", "\n", " # Separate Q, K, V from linear output\n", " qkv = qkv.reshape(batch_size, seq_length, self.num_heads, 3 * self.head_dim)\n", " qkv = qkv.permute(0, 2, 1, 3) # [Batch, Head, SeqLen, Dims]\n", " q, k, v = qkv.chunk(3, dim=-1)\n", "\n", " # Determine value outputs\n", " values, attention = scaled_dot_product(q, k, v, mask=mask)\n", " values = values.permute(0, 2, 1, 3) # [Batch, SeqLen, Head, Dims]\n", " values = values.reshape(batch_size, seq_length, embed_dim)\n", " o = self.o_proj(values)\n", "\n", " if return_attention:\n", " return o, attention\n", " else:\n", " return o"]}, {"cell_type": "markdown", "id": "b56973f7", "metadata": {"papermill": {"duration": 0.142069, "end_time": "2021-12-04T15:58:09.642785", "exception": false, "start_time": "2021-12-04T15:58:09.500716", "status": "completed"}, "tags": []}, "source": ["One crucial characteristic of the multi-head attention is that it is permutation-equivariant with respect to its inputs.\n", "This means that if we switch two input elements in the sequence, e.g. 
$X_1\\leftrightarrow X_2$\n", "(neglecting the batch dimension for now), the output is exactly the same besides the elements 1 and 2 switched.\n", "Hence, the multi-head attention is actually looking at the input not as a sequence, but as a set of elements.\n", "This property makes the multi-head attention block and the Transformer architecture so powerful and widely applicable!\n", "But what if the order of the input is actually important for solving the task, like language modeling?\n", "The answer is to encode the position in the input features, which we will take a closer look at later\n", "(topic _Positional encodings_ below).\n", "\n", "Before moving on to creating the Transformer architecture, we can compare the self-attention operation\n", "with our other common layer competitors for sequence data: convolutions and recurrent neural networks.\n", "Below you can find a table by [Vaswani et al.\n", "(2017)](https://arxiv.org/abs/1706.03762) on the complexity per layer, the number of sequential operations,\n", "and maximum path length.\n", "The complexity is measured by the upper bound of the number of operations to perform, while the maximum path\n", "length represents the maximum number of steps a forward or backward signal has to traverse to reach any other position.\n", "The lower this length, the better gradient signals can backpropagate for long-range dependencies.\n", "Let's take a look at the table below:\n", "\n", "\n", "
\n", "\n", "$n$ is the sequence length, $d$ is the representation dimension and $k$ is the kernel size of convolutions.\n", "In contrast to recurrent networks, the self-attention layer can parallelize all its operations making it much faster\n", "to execute for smaller sequence lengths.\n", "However, when the sequence length exceeds the hidden dimensionality, self-attention becomes more expensive than RNNs.\n", "One way of reducing the computational cost for long sequences is by restricting the self-attention to a neighborhood\n", "of inputs to attend over, denoted by $r$.\n", "Nevertheless, there has been recently a lot of work on more efficient Transformer architectures that still allow long\n", "dependencies, of which you can find an overview in the paper by [Tay et al.\n", "(2020)](https://arxiv.org/abs/2009.06732) if interested."]}, {"cell_type": "markdown", "id": "c9ea3bc6", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.142611, "end_time": "2021-12-04T15:58:09.927152", "exception": false, "start_time": "2021-12-04T15:58:09.784541", "status": "completed"}, "tags": []}, "source": ["### Transformer Encoder\n", "\n", "
\n", "\n", "Next, we will look at how to apply the multi-head attention block inside the Transformer architecture.\n", "Originally, the Transformer model was designed for machine translation.\n", "Hence, it got an encoder-decoder structure where the encoder takes as input the sentence in the original language\n", "and generates an attention-based representation.\n", "On the other hand, the decoder attends over the encoded information and generates the translated sentence\n", "in an autoregressive manner, as in a standard RNN.\n", "While this structure is extremely useful for Sequence-to-Sequence tasks with the necessity of autoregressive decoding,\n", "we will focus here on the encoder part.\n", "Many advances in NLP have been made using pure encoder-based Transformer models (if interested, models include the\n", "[BERT](https://arxiv.org/abs/1810.04805)-family,\n", "the [Vision Transformer](https://arxiv.org/abs/2010.11929), and more),\n", "and in our tutorial, we will also mainly focus on the encoder part.\n", "If you have understood the encoder architecture, the decoder is a very small step to implement as well.\n", "The full Transformer architecture looks as follows\n", "(figure credit - [Vaswani et al., 2017](https://arxiv.org/abs/1706.03762)):\n", "\n", "
\n", "\n", "The encoder consists of $N$ identical blocks that are applied in sequence.\n", "Taking as input $x$, it is first passed through a Multi-Head Attention block as we have implemented above.\n", "The output is added to the original input using a residual connection,\n", "and we apply a consecutive Layer Normalization on the sum.\n", "Overall, it calculates $\\text{LayerNorm}(x+\\text{Multihead}(x,x,x))$\n", "($x$ being $Q$, $K$ and $V$ input to the attention layer).\n", "The residual connection is crucial in the Transformer architecture for two reasons:\n", "\n", "1. Similar to ResNets, Transformers are designed to be very deep.\n", "Some models contain more than 24 blocks in the encoder.\n", "Hence, the residual connections are crucial for enabling a smooth gradient flow through the model.\n", "2. Without the residual connection, the information about the original sequence is lost.\n", "Remember that the Multi-Head Attention layer ignores the position of elements in a sequence,\n", "and can only learn it based on the input features.\n", "Removing the residual connections would mean that this information is lost after the first attention layer\n", "(after initialization), and with a randomly initialized query and key vector,\n", "the output vector for position $i$ has no relation to its original input.\n", "All outputs of the attention are likely to represent similar/same information,\n", "and there is no chance for the model to distinguish which information came from which input element.\n", "An alternative option to residual connection would be to fix at least one head to focus on its original input,\n", "but this is very inefficient and does not have the benefit of the improved gradient flow.\n", "\n", "The Layer Normalization also plays an important role in the Transformer architecture as it enables faster\n", "training and provides small regularization.\n", "Additionally, it ensures that the features are in a similar magnitude among the 
elements in the sequence.\n", "We are not using Batch Normalization because it depends on the batch size which is often small with Transformers\n", "(they require a lot of GPU memory), and BatchNorm has been shown to perform particularly badly in language\n", "as the features of words tend to have a much higher variance (there are many, very rare words\n", "which need to be considered for a good distribution estimate).\n", "\n", "In addition to the Multi-Head Attention, a small fully connected feed-forward network is added to the model,\n", "which is applied to each position separately and identically.\n", "Specifically, the model uses a Linear$\\to$ReLU$\\to$Linear MLP.\n", "The full transformation including the residual connection can be expressed as:\n", "\n", "$$\n", "\\begin{split}\n", " \\text{FFN}(x) & = \\max(0, xW_1+b_1)W_2 + b_2\\\\\n", " x & = \\text{LayerNorm}(x + \\text{FFN}(x))\n", "\\end{split}\n", "$$\n", "\n", "This MLP adds extra complexity to the model and allows transformations on each sequence element separately.\n", "You can imagine this as allowing the model to \"post-process\" the new information added\n", "by the previous Multi-Head Attention, and prepare it for the next attention block.\n", "Usually, the inner dimensionality of the MLP is 2-8$\\times$ larger than $d_{\\text{model}}$,\n", "i.e. 
the dimensionality of the original input $x$.\n", "The general advantage of a wider layer instead of a narrow, multi-layer MLP is the faster, parallelizable execution.\n", "\n", "Finally, after looking at all parts of the encoder architecture, we can start implementing it below.\n", "We first start by implementing a single encoder block.\n", "Additionally to the layers described above, we will add dropout layers in the MLP and on the output\n", "of the MLP and Multi-Head Attention for regularization."]}, {"cell_type": "code", "execution_count": 7, "id": "23103d12", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:58:10.224411Z", "iopub.status.busy": "2021-12-04T15:58:10.223932Z", "iopub.status.idle": "2021-12-04T15:58:10.225971Z", "shell.execute_reply": "2021-12-04T15:58:10.225565Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 0.157144, "end_time": "2021-12-04T15:58:10.226077", "exception": false, "start_time": "2021-12-04T15:58:10.068933", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class EncoderBlock(nn.Module):\n", " def __init__(self, input_dim, num_heads, dim_feedforward, dropout=0.0):\n", " \"\"\"\n", " Args:\n", " input_dim: Dimensionality of the input\n", " num_heads: Number of heads to use in the attention block\n", " dim_feedforward: Dimensionality of the hidden layer in the MLP\n", " dropout: Dropout probability to use in the dropout layers\n", " \"\"\"\n", " super().__init__()\n", "\n", " # Attention layer\n", " self.self_attn = MultiheadAttention(input_dim, input_dim, num_heads)\n", "\n", " # Two-layer MLP\n", " self.linear_net = nn.Sequential(\n", " nn.Linear(input_dim, dim_feedforward),\n", " nn.Dropout(dropout),\n", " nn.ReLU(inplace=True),\n", " nn.Linear(dim_feedforward, input_dim),\n", " )\n", "\n", " # Layers to apply in between the main layers\n", " self.norm1 = nn.LayerNorm(input_dim)\n", " self.norm2 = nn.LayerNorm(input_dim)\n", " self.dropout = nn.Dropout(dropout)\n", "\n", " def forward(self, x, 
mask=None):\n", " # Attention part\n", " attn_out = self.self_attn(x, mask=mask)\n", " x = x + self.dropout(attn_out)\n", " x = self.norm1(x)\n", "\n", " # MLP part\n", " linear_out = self.linear_net(x)\n", " x = x + self.dropout(linear_out)\n", " x = self.norm2(x)\n", "\n", " return x"]}, {"cell_type": "markdown", "id": "7820dae1", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.143711, "end_time": "2021-12-04T15:58:10.516987", "exception": false, "start_time": "2021-12-04T15:58:10.373276", "status": "completed"}, "tags": []}, "source": ["Based on this block, we can implement a module for the full Transformer encoder.\n", "Additionally to a forward function that iterates through the sequence of encoder blocks,\n", "we also provide a function called `get_attention_maps`.\n", "The idea of this function is to return the attention probabilities for all Multi-Head Attention blocks in the encoder.\n", "This helps us in understanding, and in a sense, explaining the model.\n", "However, the attention probabilities should be interpreted with a grain of salt as it does not necessarily\n", "reflect the true interpretation of the model (there is a series of papers about this,\n", "including [Attention is not Explanation](https://arxiv.org/abs/1902.10186)\n", "and [Attention is not not Explanation](https://arxiv.org/abs/1908.04626))."]}, {"cell_type": "code", "execution_count": 8, "id": "5619cdd3", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:58:10.816718Z", "iopub.status.busy": "2021-12-04T15:58:10.816231Z", "iopub.status.idle": "2021-12-04T15:58:10.818205Z", "shell.execute_reply": "2021-12-04T15:58:10.817797Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 0.158399, "end_time": "2021-12-04T15:58:10.818313", "exception": false, "start_time": "2021-12-04T15:58:10.659914", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class TransformerEncoder(nn.Module):\n", " def __init__(self, num_layers, **block_args):\n", " 
super().__init__()\n", " self.layers = nn.ModuleList([EncoderBlock(**block_args) for _ in range(num_layers)])\n", "\n", " def forward(self, x, mask=None):\n", " for layer in self.layers:\n", " x = layer(x, mask=mask)\n", " return x\n", "\n", " def get_attention_maps(self, x, mask=None):\n", " attention_maps = []\n", " for layer in self.layers:\n", " _, attn_map = layer.self_attn(x, mask=mask, return_attention=True)\n", " attention_maps.append(attn_map)\n", " x = layer(x)\n", " return attention_maps"]}, {"cell_type": "markdown", "id": "8a328d53", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.142344, "end_time": "2021-12-04T15:58:11.102765", "exception": false, "start_time": "2021-12-04T15:58:10.960421", "status": "completed"}, "tags": []}, "source": ["### Positional encoding\n", "\n", "We have discussed before that the Multi-Head Attention block is permutation-equivariant,\n", "and cannot distinguish whether an input comes before another one in the sequence or not.\n", "In tasks like language understanding, however, the position is important for interpreting the input words.\n", "The position information can therefore be added via the input features.\n", "We could learn an embedding for every possible position, but this would not generalize to a dynamic\n", "input sequence length.\n", "Hence, the better option is to use feature patterns that the network can identify from the features\n", "and potentially generalize to larger sequences.\n", "The specific pattern chosen by Vaswani et al.\n", "are sine and cosine functions of different frequencies, as follows:\n", "\n", "$$\n", "PE_{(pos,i)} = \\begin{cases}\n", " \\sin\\left(\\frac{pos}{10000^{i/d_{\\text{model}}}}\\right) & \\text{if}\\hspace{3mm} i \\text{ mod } 2=0\\\\\n", " \\cos\\left(\\frac{pos}{10000^{(i-1)/d_{\\text{model}}}}\\right) & \\text{otherwise}\\\\\n", "\\end{cases}\n", "$$\n", "\n", "$PE_{(pos,i)}$ represents the position encoding at position $pos$ in the sequence, and hidden
dimensionality $i$.\n", "These values, concatenated for all hidden dimensions, are added to the original input features\n", "(in the Transformer visualization above, see \"Positional encoding\"), and constitute the position information.\n", "We distinguish between even ($i \\text{ mod } 2=0$) and uneven ($i \\text{ mod } 2=1$)\n", "hidden dimensionalities where we apply a sine/cosine respectively.\n", "The intuition behind this encoding is that you can represent $PE_{(pos+k,:)}$ as a linear function\n", "of $PE_{(pos,:)}$, which might allow the model to easily attend to relative positions.\n", "The wavelengths in different dimensions range from $2\\pi$ to $10000\\cdot 2\\pi$.\n", "\n", "The positional encoding is implemented below.\n", "The code is taken from the [PyTorch tutorial](https://pytorch.org/tutorials/beginner/transformer_tutorial.html#define-the-model)\n", "about Transformers on NLP and adjusted for our purposes."]}, {"cell_type": "code", "execution_count": 9, "id": "9a4179be", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:58:11.394604Z", "iopub.status.busy": "2021-12-04T15:58:11.394124Z", "iopub.status.idle": "2021-12-04T15:58:11.395735Z", "shell.execute_reply": "2021-12-04T15:58:11.396116Z"}, "papermill": {"duration": 0.151358, "end_time": "2021-12-04T15:58:11.396243", "exception": false, "start_time": "2021-12-04T15:58:11.244885", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class PositionalEncoding(nn.Module):\n", " def __init__(self, d_model, max_len=5000):\n", " \"\"\"\n", " Args\n", " d_model: Hidden dimensionality of the input.\n", " max_len: Maximum length of a sequence to expect.\n", " \"\"\"\n", " super().__init__()\n", "\n", " # Create matrix of [SeqLen, HiddenDim] representing the positional encoding for max_len inputs\n", " pe = torch.zeros(max_len, d_model)\n", " position = torch.arange(0, max_len, dtype=torch.float).unsqueeze(1)\n", " div_term = torch.exp(torch.arange(0, d_model, 2).float() * 
(-math.log(10000.0) / d_model))\n", " pe[:, 0::2] = torch.sin(position * div_term)\n", " pe[:, 1::2] = torch.cos(position * div_term)\n", " pe = pe.unsqueeze(0)\n", "\n", " # register_buffer => Tensor which is not a parameter, but should be part of the modules state.\n", " # Used for tensors that need to be on the same device as the module.\n", " # persistent=False tells PyTorch to not add the buffer to the state dict (e.g. when we save the model)\n", " self.register_buffer(\"pe\", pe, persistent=False)\n", "\n", " def forward(self, x):\n", " x = x + self.pe[:, : x.size(1)]\n", " return x"]}, {"cell_type": "markdown", "id": "ab85f000", "metadata": {"papermill": {"duration": 0.143264, "end_time": "2021-12-04T15:58:11.687431", "exception": false, "start_time": "2021-12-04T15:58:11.544167", "status": "completed"}, "tags": []}, "source": ["To understand the positional encoding, we can visualize it below.\n", "We will generate an image of the positional encoding over hidden dimensionality and position in a sequence.\n", "Each pixel, therefore, represents the change of the input feature we perform to encode the specific position.\n", "Let's do it below."]}, {"cell_type": "code", "execution_count": 10, "id": "f3c3e710", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:58:11.979041Z", "iopub.status.busy": "2021-12-04T15:58:11.978542Z", "iopub.status.idle": "2021-12-04T15:58:12.357315Z", "shell.execute_reply": "2021-12-04T15:58:12.357708Z"}, "papermill": {"duration": 0.527144, "end_time": "2021-12-04T15:58:12.357871", "exception": false, "start_time": "2021-12-04T15:58:11.830727", "status": "completed"}, "tags": []}, "outputs": [{"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-12-04T16:58:12.126505\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}], "source": ["encod_block = PositionalEncoding(d_model=48, max_len=96)\n", "pe = encod_block.pe.squeeze().T.cpu().numpy()\n", "\n", "fig, ax = plt.subplots(nrows=1, ncols=1, figsize=(8, 3))\n", "pos = ax.imshow(pe, cmap=\"RdGy\", extent=(1, pe.shape[1] + 1, pe.shape[0] + 1, 1))\n", "fig.colorbar(pos, ax=ax)\n", "ax.set_xlabel(\"Position in sequence\")\n", "ax.set_ylabel(\"Hidden dimension\")\n", "ax.set_title(\"Positional encoding over hidden dimensions\")\n", "ax.set_xticks([1] + [i * 10 for i in range(1, 1 + pe.shape[1] // 10)])\n", "ax.set_yticks([1] + [i * 10 for i in range(1, 1 + pe.shape[0] // 10)])\n", "plt.show()"]}, {"cell_type": "markdown", "id": "d5cc9a34", "metadata": {"papermill": {"duration": 0.154874, "end_time": "2021-12-04T15:58:12.659676", "exception": false, "start_time": "2021-12-04T15:58:12.504802", "status": "completed"}, "tags": []}, "source": ["You can clearly see the sine and cosine waves with different wavelengths that encode the position\n", "in the hidden dimensions.\n", "Specifically, we can look at the sine/cosine wave for each hidden dimension separately,\n", "to get a better intuition of the pattern.\n", "Below we visualize the positional encoding for the hidden dimensions $1$, $2$, $3$ and $4$."]}, {"cell_type": "code", "execution_count": 11, "id": "a476a12e", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:58:12.994247Z", "iopub.status.busy": "2021-12-04T15:58:12.979090Z", "iopub.status.idle": "2021-12-04T15:58:14.181132Z", "shell.execute_reply": "2021-12-04T15:58:14.181526Z"}, "papermill": {"duration": 1.37322, "end_time": "2021-12-04T15:58:14.181688", "exception": false, "start_time": "2021-12-04T15:58:12.808468", "status": "completed"}, "tags": []}, "outputs": [{"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-12-04T16:58:13.463512\n", " image/svg+xml\n", " \n", " \n", " 
Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}], "source": ["sns.set_theme()\n", "fig, ax = plt.subplots(2, 2, figsize=(12, 4))\n", "ax = [a for a_list in ax for a in a_list]\n", "for i in range(len(ax)):\n", " ax[i].plot(np.arange(1, 17), pe[i, :16], color=\"C%i\" % i, marker=\"o\", markersize=6, markeredgecolor=\"black\")\n", " ax[i].set_title(\"Encoding in hidden dimension %i\" % (i + 1))\n", " ax[i].set_xlabel(\"Position in sequence\", fontsize=10)\n", " ax[i].set_ylabel(\"Positional encoding\", fontsize=10)\n", " ax[i].set_xticks(np.arange(1, 17))\n", " ax[i].tick_params(axis=\"both\", which=\"major\", labelsize=10)\n", " ax[i].tick_params(axis=\"both\", which=\"minor\", labelsize=8)\n", " ax[i].set_ylim(-1.2, 1.2)\n", "fig.subplots_adjust(hspace=0.8)\n", "sns.reset_orig()\n", "plt.show()"]}, {"cell_type": "markdown", "id": "323263e4", "metadata": {"papermill": {"duration": 0.162339, "end_time": "2021-12-04T15:58:14.500062", "exception": false, "start_time": "2021-12-04T15:58:14.337723", "status": "completed"}, "tags": []}, "source": ["As we can see, the patterns of hidden dimensions $1$ and $2$ differ only in the starting angle.\n", "The wavelength is $2\\pi$, hence the repetition after position $6$.\n", "The hidden dimensions $3$ and $4$ have a longer wavelength, about $1.5$ times that of dimensions $1$ and $2$."]}, {"cell_type": "markdown", "id": "2a423f6a", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.150745, "end_time": "2021-12-04T15:58:14.801934", "exception": false, "start_time": "2021-12-04T15:58:14.651189", "status": "completed"}, "tags": []}, "source": ["### Learning rate warm-up\n", "\n", "One commonly used technique for training a Transformer is learning rate warm-up.\n", "This means that we gradually increase the learning rate from 0 on to our originally specified\n", "learning rate in the first few iterations.\n", "Thus, we slowly start learning instead of taking very large steps from the beginning.\n", "In fact, training a deep Transformer without
learning rate warm-up can make the model diverge\n", "and achieve a much worse performance on training and testing.\n", "Take for instance the following plot by [Liu et al.\n", "(2019)](https://arxiv.org/pdf/1908.03265.pdf) comparing Adam-vanilla (i.e. Adam without warm-up)\n", "vs Adam with a warm-up:\n", "\n", "
\n", "\n", "Clearly, the warm-up is a crucial hyperparameter in the Transformer architecture.\n", "Why is it so important?\n", "There are currently two common explanations.\n", "Firstly, Adam uses the bias correction factors which however can lead to a higher variance in the adaptive\n", "learning rate during the first iterations.\n", "Improved optimizers like [RAdam](https://arxiv.org/abs/1908.03265) have been shown to overcome this issue,\n", "not requiring warm-up for training Transformers.\n", "Secondly, the iteratively applied Layer Normalization across layers can lead to very high gradients during\n", "the first iterations, which can be solved by using Pre-Layer Normalization\n", "(similar to Pre-Activation ResNet), or replacing Layer Normalization by other techniques\n", "(Adaptive Normalization,\n", "[Power Normalization](https://arxiv.org/abs/2003.07845)).\n", "\n", "Nevertheless, many applications and papers still use the original Transformer architecture with Adam,\n", "because warm-up is a simple, yet effective way of solving the gradient problem in the first iterations.\n", "There are many different schedulers we could use.\n", "For instance, the original Transformer paper used an inverse square-root decay scheduler with a linear warm-up.\n", "However, the currently most popular scheduler is the cosine warm-up scheduler,\n", "which combines warm-up with a cosine-shaped learning rate decay.\n", "We can implement it below, and visualize the learning rate factor over epochs."]}, {"cell_type": "code", "execution_count": 12, "id": "da5c81cf", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:58:15.111318Z", "iopub.status.busy": "2021-12-04T15:58:15.110838Z", "iopub.status.idle": "2021-12-04T15:58:15.112740Z", "shell.execute_reply": "2021-12-04T15:58:15.112354Z"}, "papermill": {"duration": 0.159462, "end_time": "2021-12-04T15:58:15.112851", "exception": false, "start_time": "2021-12-04T15:58:14.953389", "status": "completed"}, "tags": []}, "outputs": [],
"source": ["class CosineWarmupScheduler(optim.lr_scheduler._LRScheduler):\n", " def __init__(self, optimizer, warmup, max_iters):\n", " self.warmup = warmup\n", " self.max_num_iters = max_iters\n", " super().__init__(optimizer)\n", "\n", " def get_lr(self):\n", " lr_factor = self.get_lr_factor(epoch=self.last_epoch)\n", " return [base_lr * lr_factor for base_lr in self.base_lrs]\n", "\n", " def get_lr_factor(self, epoch):\n", " lr_factor = 0.5 * (1 + np.cos(np.pi * epoch / self.max_num_iters))\n", " if epoch <= self.warmup:\n", " lr_factor *= epoch * 1.0 / self.warmup\n", " return lr_factor"]}, {"cell_type": "code", "execution_count": 13, "id": "a0668690", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:58:15.442783Z", "iopub.status.busy": "2021-12-04T15:58:15.438778Z", "iopub.status.idle": "2021-12-04T15:58:15.738564Z", "shell.execute_reply": "2021-12-04T15:58:15.738973Z"}, "papermill": {"duration": 0.475589, "end_time": "2021-12-04T15:58:15.739126", "exception": false, "start_time": "2021-12-04T15:58:15.263537", "status": "completed"}, "tags": []}, "outputs": [{"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-12-04T16:58:15.545554\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}], "source": ["# Needed for initializing the lr scheduler\n", "p = nn.Parameter(torch.empty(4, 4))\n", "optimizer = optim.Adam([p], lr=1e-3)\n", "lr_scheduler = CosineWarmupScheduler(optimizer=optimizer, warmup=100, max_iters=2000)\n", "\n", "# Plotting\n", "epochs = list(range(2000))\n", "sns.set()\n", "plt.figure(figsize=(8, 3))\n", "plt.plot(epochs, [lr_scheduler.get_lr_factor(e) for e in epochs])\n", "plt.ylabel(\"Learning rate factor\")\n", "plt.xlabel(\"Iterations (in batches)\")\n", "plt.title(\"Cosine Warm-up Learning Rate Scheduler\")\n", "plt.show()\n", "sns.reset_orig()"]}, {"cell_type": "markdown", "id": "54af6807", "metadata": {"papermill": {"duration": 0.154142, "end_time": "2021-12-04T15:58:16.048540", "exception": false, "start_time": "2021-12-04T15:58:15.894398", "status": "completed"}, "tags": []}, "source": ["In the first 100 iterations, we increase the learning rate factor from 0 to 1,\n", "whereas for all later iterations, we decay it using the cosine wave.\n", "Pre-implementations of this scheduler can be found in the popular NLP Transformer library\n", "[huggingface](https://huggingface.co/transformers/main_classes/optimizer_schedules.html?highlight=cosine#transformers.get_cosine_schedule_with_warmup)."]}, {"cell_type": "markdown", "id": "a8c7d2a2", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.154296, "end_time": "2021-12-04T15:58:16.357362", "exception": false, "start_time": "2021-12-04T15:58:16.203066", "status": "completed"}, "tags": []}, "source": ["### PyTorch Lightning Module\n", "\n", "Finally, we can embed the Transformer architecture into a PyTorch lightning module.\n", "From Tutorial 5, you know that PyTorch Lightning simplifies our training and test code,\n", "as well as structures the code nicely in separate functions.\n", "We will implement a template for a classifier based on the Transformer encoder.\n", "Thereby, we have a prediction output per sequence 
element.\n", "If we needed a classifier over the whole sequence, the common approach is to add an additional\n", "`[CLS]` token to the sequence, representing the classifier token.\n", "However, here we focus on tasks where we have an output per element.\n", "\n", "In addition to the Transformer architecture, we add a small input network (maps input dimensions to model dimensions),\n", "the positional encoding, and an output network (transforms output encodings to predictions).\n", "We also add the learning rate scheduler, which takes a step each iteration instead of once per epoch.\n", "This is needed for the warmup and the smooth cosine decay.\n", "The training, validation, and test steps are left empty for now and will be filled in for our task-specific models."]}, {"cell_type": "code", "execution_count": 14, "id": "a392e677", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:58:16.678659Z", "iopub.status.busy": "2021-12-04T15:58:16.678143Z", "iopub.status.idle": "2021-12-04T15:58:16.680126Z", "shell.execute_reply": "2021-12-04T15:58:16.679738Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 0.168727, "end_time": "2021-12-04T15:58:16.680237", "exception": false, "start_time": "2021-12-04T15:58:16.511510", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class TransformerPredictor(pl.LightningModule):\n", " def __init__(\n", " self,\n", " input_dim,\n", " model_dim,\n", " num_classes,\n", " num_heads,\n", " num_layers,\n", " lr,\n", " warmup,\n", " max_iters,\n", " dropout=0.0,\n", " input_dropout=0.0,\n", " ):\n", " \"\"\"\n", " Args:\n", " input_dim: Hidden dimensionality of the input\n", " model_dim: Hidden dimensionality to use inside the Transformer\n", " num_classes: Number of classes to predict per sequence element\n", " num_heads: Number of heads to use in the Multi-Head Attention blocks\n", " num_layers: Number of encoder blocks to use.\n", " lr: Learning rate in the optimizer\n", " warmup: Number of warmup steps. 
Usually between 50 and 500\n", " max_iters: Number of maximum iterations the model is trained for. This is needed for the CosineWarmup scheduler\n", " dropout: Dropout to apply inside the model\n", " input_dropout: Dropout to apply on the input features\n", " \"\"\"\n", " super().__init__()\n", " self.save_hyperparameters()\n", " self._create_model()\n", "\n", " def _create_model(self):\n", " # Input dim -> Model dim\n", " self.input_net = nn.Sequential(\n", " nn.Dropout(self.hparams.input_dropout), nn.Linear(self.hparams.input_dim, self.hparams.model_dim)\n", " )\n", " # Positional encoding for sequences\n", " self.positional_encoding = PositionalEncoding(d_model=self.hparams.model_dim)\n", " # Transformer\n", " self.transformer = TransformerEncoder(\n", " num_layers=self.hparams.num_layers,\n", " input_dim=self.hparams.model_dim,\n", " dim_feedforward=2 * self.hparams.model_dim,\n", " num_heads=self.hparams.num_heads,\n", " dropout=self.hparams.dropout,\n", " )\n", " # Output classifier per sequence lement\n", " self.output_net = nn.Sequential(\n", " nn.Linear(self.hparams.model_dim, self.hparams.model_dim),\n", " nn.LayerNorm(self.hparams.model_dim),\n", " nn.ReLU(inplace=True),\n", " nn.Dropout(self.hparams.dropout),\n", " nn.Linear(self.hparams.model_dim, self.hparams.num_classes),\n", " )\n", "\n", " def forward(self, x, mask=None, add_positional_encoding=True):\n", " \"\"\"\n", " Args:\n", " x: Input features of shape [Batch, SeqLen, input_dim]\n", " mask: Mask to apply on the attention outputs (optional)\n", " add_positional_encoding: If True, we add the positional encoding to the input.\n", " Might not be desired for some tasks.\n", " \"\"\"\n", " x = self.input_net(x)\n", " if add_positional_encoding:\n", " x = self.positional_encoding(x)\n", " x = self.transformer(x, mask=mask)\n", " x = self.output_net(x)\n", " return x\n", "\n", " @torch.no_grad()\n", " def get_attention_maps(self, x, mask=None, add_positional_encoding=True):\n", " \"\"\"Function for 
extracting the attention matrices of the whole Transformer for a single batch.\n", "\n", " Input arguments same as the forward pass.\n", " \"\"\"\n", " x = self.input_net(x)\n", " if add_positional_encoding:\n", " x = self.positional_encoding(x)\n", " attention_maps = self.transformer.get_attention_maps(x, mask=mask)\n", " return attention_maps\n", "\n", " def configure_optimizers(self):\n", " optimizer = optim.Adam(self.parameters(), lr=self.hparams.lr)\n", "\n", " # We don't return the lr scheduler because we need to apply it per iteration, not per epoch\n", " self.lr_scheduler = CosineWarmupScheduler(\n", " optimizer, warmup=self.hparams.warmup, max_iters=self.hparams.max_iters\n", " )\n", " return optimizer\n", "\n", " def optimizer_step(self, *args, **kwargs):\n", " super().optimizer_step(*args, **kwargs)\n", " self.lr_scheduler.step() # Step per iteration\n", "\n", " def training_step(self, batch, batch_idx):\n", " raise NotImplementedError\n", "\n", " def validation_step(self, batch, batch_idx):\n", " raise NotImplementedError\n", "\n", " def test_step(self, batch, batch_idx):\n", " raise NotImplementedError"]}, {"cell_type": "markdown", "id": "2818f62b", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.154523, "end_time": "2021-12-04T15:58:16.990037", "exception": false, "start_time": "2021-12-04T15:58:16.835514", "status": "completed"}, "tags": []}, "source": ["## Experiments\n", "\n", "
\n", "\n", "After having finished the implementation of the Transformer architecture, we can start experimenting\n", "and apply it to various tasks.\n", "In this notebook, we will focus on two tasks: parallel Sequence-to-Sequence, and set anomaly detection.\n", "The two tasks focus on different properties of the Transformer architecture, and we go through them below.\n", "\n", "### Sequence to Sequence\n", "\n", "A Sequence-to-Sequence task represents a task where the input _and_ the output is a sequence,\n", "not necessarily of the same length.\n", "Popular tasks in this domain include machine translation and summarization.\n", "For this, we usually have a Transformer encoder for interpreting the input sequence,\n", "and a decoder for generating the output in an autoregressive manner.\n", "Here, however, we will go back to a much simpler example task and use only the encoder.\n", "Given a sequence of $N$ numbers between $0$ and $M$, the task is to reverse the input sequence.\n", "In NumPy notation, if our input is $x$, the output should be $x$[::-1].\n", "Although this task sounds very simple, RNNs can have issues with it because the task requires long-term dependencies.\n", "Transformers are built to support such dependencies, and hence, we expect them to perform very well.\n", "\n", "First, let's create a dataset class below."]}, {"cell_type": "code", "execution_count": 15, "id": "d73f1841", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:58:17.308123Z", "iopub.status.busy": "2021-12-04T15:58:17.307642Z", "iopub.status.idle": "2021-12-04T15:58:17.309563Z", "shell.execute_reply": "2021-12-04T15:58:17.309179Z"}, "papermill": {"duration": 0.163367, "end_time": "2021-12-04T15:58:17.309674", "exception": false, "start_time": "2021-12-04T15:58:17.146307", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class ReverseDataset(data.Dataset):\n", " def __init__(self, num_categories, seq_len, size):\n", " super().__init__()\n", " self.num_categories = 
num_categories\n", " self.seq_len = seq_len\n", " self.size = size\n", "\n", " self.data = torch.randint(self.num_categories, size=(self.size, self.seq_len))\n", "\n", " def __len__(self):\n", " return self.size\n", "\n", " def __getitem__(self, idx):\n", " inp_data = self.data[idx]\n", " labels = torch.flip(inp_data, dims=(0,))\n", " return inp_data, labels"]}, {"cell_type": "markdown", "id": "5640c756", "metadata": {"papermill": {"duration": 0.157285, "end_time": "2021-12-04T15:58:17.623302", "exception": false, "start_time": "2021-12-04T15:58:17.466017", "status": "completed"}, "tags": []}, "source": ["We create an arbitrary number of random sequences of numbers between 0 and `num_categories-1`.\n", "The label is simply the tensor flipped over the sequence dimension.\n", "We can create the corresponding data loaders below."]}, {"cell_type": "code", "execution_count": 16, "id": "8e1d16b7", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:58:17.940041Z", "iopub.status.busy": "2021-12-04T15:58:17.939564Z", "iopub.status.idle": "2021-12-04T15:58:17.956756Z", "shell.execute_reply": "2021-12-04T15:58:17.957137Z"}, "papermill": {"duration": 0.177314, "end_time": "2021-12-04T15:58:17.957279", "exception": false, "start_time": "2021-12-04T15:58:17.779965", "status": "completed"}, "tags": []}, "outputs": [], "source": ["dataset = partial(ReverseDataset, 10, 16)\n", "train_loader = data.DataLoader(dataset(50000), batch_size=128, shuffle=True, drop_last=True, pin_memory=True)\n", "val_loader = data.DataLoader(dataset(1000), batch_size=128)\n", "test_loader = data.DataLoader(dataset(10000), batch_size=128)"]}, {"cell_type": "markdown", "id": "7a21b9dc", "metadata": {"papermill": {"duration": 0.156233, "end_time": "2021-12-04T15:58:18.269306", "exception": false, "start_time": "2021-12-04T15:58:18.113073", "status": "completed"}, "tags": []}, "source": ["Let's look at an arbitrary sample of the dataset:"]}, {"cell_type": "code", "execution_count": 17, "id": 
"aeda9084", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:58:18.587916Z", "iopub.status.busy": "2021-12-04T15:58:18.587443Z", "iopub.status.idle": "2021-12-04T15:58:18.590343Z", "shell.execute_reply": "2021-12-04T15:58:18.590793Z"}, "papermill": {"duration": 0.16296, "end_time": "2021-12-04T15:58:18.590927", "exception": false, "start_time": "2021-12-04T15:58:18.427967", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Input data: tensor([9, 6, 2, 0, 6, 2, 7, 9, 7, 3, 3, 4, 3, 7, 0, 9])\n", "Labels: tensor([9, 0, 7, 3, 4, 3, 3, 7, 9, 7, 2, 6, 0, 2, 6, 9])\n"]}], "source": ["inp_data, labels = train_loader.dataset[0]\n", "print(\"Input data:\", inp_data)\n", "print(\"Labels: \", labels)"]}, {"cell_type": "markdown", "id": "e5c8430c", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.156663, "end_time": "2021-12-04T15:58:18.903232", "exception": false, "start_time": "2021-12-04T15:58:18.746569", "status": "completed"}, "tags": []}, "source": ["During training, we pass the input sequence through the Transformer encoder and predict the output for each input token.\n", "We use the standard Cross-Entropy loss to perform this.\n", "Every number is represented as a one-hot vector.\n", "Remember that representing the categories as single scalars decreases the expressiveness of the model extremely\n", "as $0$ and $1$ are not closer related than $0$ and $9$ in our example.\n", "An alternative to a one-hot vector is using a learned embedding vector as it is provided by the PyTorch module `nn.Embedding`.\n", "However, using a one-hot vector with an additional linear layer as in our case has the same effect\n", "as an embedding layer (`self.input_net` maps one-hot vector to a dense vector,\n", "where each row of the weight matrix represents the embedding for a specific category).\n", "\n", "To implement the training dynamic, we create a new class inheriting from `TransformerPredictor`\n", 
"and overwriting the training, validation and test step functions."]}, {"cell_type": "code", "execution_count": 18, "id": "9e00bf72", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:58:19.222837Z", "iopub.status.busy": "2021-12-04T15:58:19.222299Z", "iopub.status.idle": "2021-12-04T15:58:19.224262Z", "shell.execute_reply": "2021-12-04T15:58:19.223880Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 0.164853, "end_time": "2021-12-04T15:58:19.224372", "exception": false, "start_time": "2021-12-04T15:58:19.059519", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class ReversePredictor(TransformerPredictor):\n", " def _calculate_loss(self, batch, mode=\"train\"):\n", " # Fetch data and transform categories to one-hot vectors\n", " inp_data, labels = batch\n", " inp_data = F.one_hot(inp_data, num_classes=self.hparams.num_classes).float()\n", "\n", " # Perform prediction and calculate loss and accuracy\n", " preds = self.forward(inp_data, add_positional_encoding=True)\n", " loss = F.cross_entropy(preds.view(-1, preds.size(-1)), labels.view(-1))\n", " acc = (preds.argmax(dim=-1) == labels).float().mean()\n", "\n", " # Logging\n", " self.log(\"%s_loss\" % mode, loss)\n", " self.log(\"%s_acc\" % mode, acc)\n", " return loss, acc\n", "\n", " def training_step(self, batch, batch_idx):\n", " loss, _ = self._calculate_loss(batch, mode=\"train\")\n", " return loss\n", "\n", " def validation_step(self, batch, batch_idx):\n", " _ = self._calculate_loss(batch, mode=\"val\")\n", "\n", " def test_step(self, batch, batch_idx):\n", " _ = self._calculate_loss(batch, mode=\"test\")"]}, {"cell_type": "markdown", "id": "5bbaf3a6", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.155556, "end_time": "2021-12-04T15:58:19.534838", "exception": false, "start_time": "2021-12-04T15:58:19.379282", "status": "completed"}, "tags": []}, "source": ["Finally, we can create a training function similar to the one we have seen in Tutorial 5 for 
PyTorch Lightning.\n", "We create a `pl.Trainer` object, running for $N$ epochs, logging in TensorBoard, and saving our best model based on the validation.\n", "Afterward, we test our models on the test set.\n", "An additional parameter we pass to the trainer here is `gradient_clip_val`.\n", "This clips the norm of the gradients for all parameters before taking an optimizer step and prevents the model\n", "from diverging if we obtain very high gradients at, for instance, sharp loss surfaces (see many good blog posts\n", "on gradient clipping, like [DeepAI glossary](https://deepai.org/machine-learning-glossary-and-terms/gradient-clipping)).\n", "For Transformers, gradient clipping can help to further stabilize the training during the first few iterations, and also afterward.\n", "In plain PyTorch, you can apply gradient clipping via `torch.nn.utils.clip_grad_norm_(...)`\n", "(see [documentation](https://pytorch.org/docs/stable/generated/torch.nn.utils.clip_grad_norm_.html#torch.nn.utils.clip_grad_norm_)).\n", "The clip value is usually between 0.5 and 10, depending on how harsh you want to clip large gradients.\n", "After having explained this, let's implement the training function:"]}, {"cell_type": "code", "execution_count": 19, "id": "13fba27b", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:58:19.861262Z", "iopub.status.busy": "2021-12-04T15:58:19.860777Z", "iopub.status.idle": "2021-12-04T15:58:19.862292Z", "shell.execute_reply": "2021-12-04T15:58:19.862689Z"}, "papermill": {"duration": 0.170942, "end_time": "2021-12-04T15:58:19.862822", "exception": false, "start_time": "2021-12-04T15:58:19.691880", "status": "completed"}, "tags": []}, "outputs": [], "source": ["def train_reverse(**kwargs):\n", " # Create a PyTorch Lightning trainer with the generation callback\n", " root_dir = os.path.join(CHECKPOINT_PATH, \"ReverseTask\")\n", " os.makedirs(root_dir, exist_ok=True)\n", " trainer = pl.Trainer(\n", " default_root_dir=root_dir,\n", " 
callbacks=[ModelCheckpoint(save_weights_only=True, mode=\"max\", monitor=\"val_acc\")],\n", " gpus=1 if str(device).startswith(\"cuda\") else 0,\n", " max_epochs=10,\n", " gradient_clip_val=5,\n", " progress_bar_refresh_rate=1,\n", " )\n", " trainer.logger._default_hp_metric = None # Optional logging argument that we don't need\n", "\n", " # Check whether pretrained model exists. If yes, load it and skip training\n", " pretrained_filename = os.path.join(CHECKPOINT_PATH, \"ReverseTask.ckpt\")\n", " if os.path.isfile(pretrained_filename):\n", " print(\"Found pretrained model, loading...\")\n", " model = ReversePredictor.load_from_checkpoint(pretrained_filename)\n", " else:\n", " model = ReversePredictor(max_iters=trainer.max_epochs * len(train_loader), **kwargs)\n", " trainer.fit(model, train_loader, val_loader)\n", "\n", " # Test best model on validation and test set\n", " val_result = trainer.test(model, test_dataloaders=val_loader, verbose=False)\n", " test_result = trainer.test(model, test_dataloaders=test_loader, verbose=False)\n", " result = {\"test_acc\": test_result[0][\"test_acc\"], \"val_acc\": val_result[0][\"test_acc\"]}\n", "\n", " model = model.to(device)\n", " return model, result"]}, {"cell_type": "markdown", "id": "11c5e6ce", "metadata": {"papermill": {"duration": 0.157063, "end_time": "2021-12-04T15:58:20.175228", "exception": false, "start_time": "2021-12-04T15:58:20.018165", "status": "completed"}, "tags": []}, "source": ["Finally, we can train the model.\n", "In this setup, we will use a single encoder block and a single head in the Multi-Head Attention.\n", "This is chosen because of the simplicity of the task, and in this case, the attention can actually be interpreted\n", "as an \"explanation\" of the predictions (compared to the other papers above dealing with deep Transformers)."]}, {"cell_type": "code", "execution_count": 20, "id": "a41d7448", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:58:20.491778Z", 
"iopub.status.busy": "2021-12-04T15:58:20.491301Z", "iopub.status.idle": "2021-12-04T15:58:24.308685Z", "shell.execute_reply": "2021-12-04T15:58:24.308229Z"}, "papermill": {"duration": 3.977688, "end_time": "2021-12-04T15:58:24.308813", "exception": false, "start_time": "2021-12-04T15:58:20.331125", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/pytorch_lightning/trainer/connectors/callback_connector.py:90: LightningDeprecationWarning: Setting `Trainer(progress_bar_refresh_rate=1)` is deprecated in v1.5 and will be removed in v1.7. Please pass `pytorch_lightning.callbacks.progress.TQDMProgressBar` with `refresh_rate` directly to the Trainer's `callbacks` argument instead. Or, to disable the progress bar pass `enable_progress_bar = False` to the Trainer.\n", " rank_zero_deprecation(\n", "GPU available: True, used: True\n"]}, {"name": "stderr", "output_type": "stream", "text": ["TPU available: False, using: 0 TPU cores\n"]}, {"name": "stderr", "output_type": "stream", "text": ["IPU available: False, using: 0 IPUs\n"]}, {"name": "stderr", "output_type": "stream", "text": ["/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/pytorch_lightning/trainer/trainer.py:901: LightningDeprecationWarning: `trainer.test(test_dataloaders)` is deprecated in v1.4 and will be removed in v1.6. 
Use `trainer.test(dataloaders)` instead.\n", " rank_zero_deprecation(\n", "LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Found pretrained model, loading...\n"]}, {"name": "stderr", "output_type": "stream", "text": ["Missing logger folder: saved_models/Transformers/ReverseTask/lightning_logs\n"]}, {"name": "stderr", "output_type": "stream", "text": ["/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/pytorch_lightning/trainer/data_loading.py:111: UserWarning: The dataloader, test_dataloader 0, does not have many workers which may be a bottleneck. Consider increasing the value of the `num_workers` argument` (try 12 which is the number of cpus on this machine) in the `DataLoader` init to improve performance.\n", " rank_zero_warn(\n"]}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "b9ed1cfedbeb4586bab29909930e47b1", "version_major": 2, "version_minor": 0}, "text/plain": ["Testing: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"name": "stderr", "output_type": "stream", "text": ["LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n"]}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "89c0145b83d34648bacf9da6ad15d74d", "version_major": 2, "version_minor": 0}, "text/plain": ["Testing: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}], "source": ["reverse_model, reverse_result = train_reverse(\n", " input_dim=train_loader.dataset.num_categories,\n", " model_dim=32,\n", " num_heads=1,\n", " num_classes=train_loader.dataset.num_categories,\n", " num_layers=1,\n", " dropout=0.0,\n", " lr=5e-4,\n", " warmup=50,\n", ")"]}, {"cell_type": "markdown", "id": "ccc85090", "metadata": {"papermill": {"duration": 0.163772, "end_time": "2021-12-04T15:58:24.638088", "exception": false, "start_time": "2021-12-04T15:58:24.474316", "status": "completed"}, "tags": []}, "source": ["The warning of PyTorch Lightning regarding the number of workers 
can be ignored for now.\n", "As the data set is so simple and the `__getitem__` finishes in a negligible time, we don't need subprocesses\n", "to provide us with the data (in fact, more workers can slow down the training as we have communication overhead among processes/threads).\n", "First, let's print the results:"]}, {"cell_type": "code", "execution_count": 21, "id": "02e867c0", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:58:24.972467Z", "iopub.status.busy": "2021-12-04T15:58:24.971991Z", "iopub.status.idle": "2021-12-04T15:58:24.974029Z", "shell.execute_reply": "2021-12-04T15:58:24.974648Z"}, "papermill": {"duration": 0.171511, "end_time": "2021-12-04T15:58:24.974782", "exception": false, "start_time": "2021-12-04T15:58:24.803271", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Val accuracy: 100.00%\n", "Test accuracy: 100.00%\n"]}], "source": ["print(\"Val accuracy: %4.2f%%\" % (100.0 * reverse_result[\"val_acc\"]))\n", "print(\"Test accuracy: %4.2f%%\" % (100.0 * reverse_result[\"test_acc\"]))"]}, {"cell_type": "markdown", "id": "389ff9fb", "metadata": {"papermill": {"duration": 0.164894, "end_time": "2021-12-04T15:58:25.304480", "exception": false, "start_time": "2021-12-04T15:58:25.139586", "status": "completed"}, "tags": []}, "source": ["As we would have expected, the Transformer can correctly solve the task.\n", "However, what does the attention in the Multi-Head Attention block look like for an arbitrary input?\n", "Let's try to visualize it below."]}, {"cell_type": "code", "execution_count": 22, "id": "f740e35c", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:58:25.645172Z", "iopub.status.busy": "2021-12-04T15:58:25.644677Z", "iopub.status.idle": "2021-12-04T15:58:25.650646Z", "shell.execute_reply": "2021-12-04T15:58:25.650153Z"}, "papermill": {"duration": 0.178894, "end_time": "2021-12-04T15:58:25.650756", "exception": false, "start_time": 
"2021-12-04T15:58:25.471862", "status": "completed"}, "tags": []}, "outputs": [], "source": ["data_input, labels = next(iter(val_loader))\n", "inp_data = F.one_hot(data_input, num_classes=reverse_model.hparams.num_classes).float()\n", "inp_data = inp_data.to(device)\n", "attention_maps = reverse_model.get_attention_maps(inp_data)"]}, {"cell_type": "markdown", "id": "82e9b36d", "metadata": {"papermill": {"duration": 0.164929, "end_time": "2021-12-04T15:58:25.982199", "exception": false, "start_time": "2021-12-04T15:58:25.817270", "status": "completed"}, "tags": []}, "source": ["The object `attention_maps` is a list of length $N$ where $N$ is the number of layers.\n", "Each element is a tensor of shape [Batch, Heads, SeqLen, SeqLen], which we can verify below."]}, {"cell_type": "code", "execution_count": 23, "id": "ba03c69a", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:58:26.324791Z", "iopub.status.busy": "2021-12-04T15:58:26.324320Z", "iopub.status.idle": "2021-12-04T15:58:26.326971Z", "shell.execute_reply": "2021-12-04T15:58:26.326543Z"}, "papermill": {"duration": 0.178216, "end_time": "2021-12-04T15:58:26.327081", "exception": false, "start_time": "2021-12-04T15:58:26.148865", "status": "completed"}, "tags": []}, "outputs": [{"data": {"text/plain": ["torch.Size([128, 1, 16, 16])"]}, "execution_count": 23, "metadata": {}, "output_type": "execute_result"}], "source": ["attention_maps[0].shape"]}, {"cell_type": "markdown", "id": "1ff46b13", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.16452, "end_time": "2021-12-04T15:58:26.658828", "exception": false, "start_time": "2021-12-04T15:58:26.494308", "status": "completed"}, "tags": []}, "source": ["Next, we will write a plotting function that takes as input the sequences, attention maps, and an index\n", "indicating for which batch element we want to visualize the attention map.\n", "We will create a plot where over rows, we have different layers, while over columns, we show the 
different heads.\n", "Remember that the softmax has been applied for each row separately."]}, {"cell_type": "code", "execution_count": 24, "id": "f23fa88e", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:58:26.999173Z", "iopub.status.busy": "2021-12-04T15:58:26.998690Z", "iopub.status.idle": "2021-12-04T15:58:27.000240Z", "shell.execute_reply": "2021-12-04T15:58:27.000618Z"}, "papermill": {"duration": 0.176536, "end_time": "2021-12-04T15:58:27.000749", "exception": false, "start_time": "2021-12-04T15:58:26.824213", "status": "completed"}, "tags": []}, "outputs": [], "source": ["def plot_attention_maps(input_data, attn_maps, idx=0):\n", " if input_data is not None:\n", " input_data = input_data[idx].detach().cpu().numpy()\n", " else:\n", " input_data = np.arange(attn_maps[0][idx].shape[-1])\n", " attn_maps = [m[idx].detach().cpu().numpy() for m in attn_maps]\n", "\n", " num_heads = attn_maps[0].shape[0]\n", " num_layers = len(attn_maps)\n", " seq_len = input_data.shape[0]\n", " fig_size = 4 if num_heads == 1 else 3\n", " fig, ax = plt.subplots(num_layers, num_heads, figsize=(num_heads * fig_size, num_layers * fig_size))\n", " if num_layers == 1:\n", " ax = [ax]\n", " if num_heads == 1:\n", " ax = [[a] for a in ax]\n", " for row in range(num_layers):\n", " for column in range(num_heads):\n", " ax[row][column].imshow(attn_maps[row][column], origin=\"lower\", vmin=0)\n", " ax[row][column].set_xticks(list(range(seq_len)))\n", " ax[row][column].set_xticklabels(input_data.tolist())\n", " ax[row][column].set_yticks(list(range(seq_len)))\n", " ax[row][column].set_yticklabels(input_data.tolist())\n", " ax[row][column].set_title(\"Layer %i, Head %i\" % (row + 1, column + 1))\n", " fig.subplots_adjust(hspace=0.5)\n", " plt.show()"]}, {"cell_type": "markdown", "id": "5575de2c", "metadata": {"papermill": {"duration": 0.165585, "end_time": "2021-12-04T15:58:27.339327", "exception": false, "start_time": "2021-12-04T15:58:27.173742", "status": "completed"}, 
"tags": []}, "source": ["Finally, we can plot the attention map of our trained Transformer on the reverse task:"]}, {"cell_type": "code", "execution_count": 25, "id": "70711ff5", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:58:27.678174Z", "iopub.status.busy": "2021-12-04T15:58:27.677704Z", "iopub.status.idle": "2021-12-04T15:58:28.093751Z", "shell.execute_reply": "2021-12-04T15:58:28.094142Z"}, "papermill": {"duration": 0.587062, "end_time": "2021-12-04T15:58:28.094303", "exception": false, "start_time": "2021-12-04T15:58:27.507241", "status": "completed"}, "tags": []}, "outputs": [{"data": {"application/pdf": "JVBERi0xLjQKJazcIKu6CjEgMCBvYmoKPDwgL1BhZ2VzIDIgMCBSIC9UeXBlIC9DYXRhbG9nID4+CmVuZG9iago4IDAgb2JqCjw8IC9FeHRHU3RhdGUgNCAwIFIgL0ZvbnQgMyAwIFIgL1BhdHRlcm4gNSAwIFIKL1Byb2NTZXQgWyAvUERGIC9UZXh0IC9JbWFnZUIgL0ltYWdlQyAvSW1hZ2VJIF0gL1NoYWRpbmcgNiAwIFIKL1hPYmplY3QgNyAwIFIgPj4KZW5kb2JqCjExIDAgb2JqCjw8IC9Bbm5vdHMgMTAgMCBSIC9Db250ZW50cyA5IDAgUgovR3JvdXAgPDwgL0NTIC9EZXZpY2VSR0IgL1MgL1RyYW5zcGFyZW5jeSAvVHlwZSAvR3JvdXAgPj4KL01lZGlhQm94IFsgMCAwIDI0NS4xOTkzNzUgMjYzLjYzNjg3NSBdIC9QYXJlbnQgMiAwIFIgL1Jlc291cmNlcyA4IDAgUgovVHlwZSAvUGFnZSA+PgplbmRvYmoKOSAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDEyIDAgUiA+PgpzdHJlYW0KeJylmE1PGzEQhu/+FT62Ujvx+NtHEC0t6iVtpB6qHhCEtAioAKmo/77jQLCXWVu75ABJXu36eWfWnvEa5aVYHKDc3EslL+nvQaI8louj9d/fZ+uvx4fy7F4o0q+Ftg4wJRMc/byqf2pvwBsf6esVXTz4+UuIG0Hj0z3HNPRGCK3Aucf7DMSA+Toa3QRI6YV8NZAtgsGdXgapZaJdiFs5htAYwNrdx91afpc3cnGgc+hIoSOFrgahCwqdxsIocwLy59i4Z9dy8Rnl0R+5FEt5uxtSUch5WAXxaWBShA5gnGWxF1WB2YUuDilvD+KW/iv5XtFo2gIGu01sAh0i6owXhyu5+IgSlVxdbJ/V6lz8kG/SW/lTrk7Eh5VYiq0NYRUky/CV2sXTowh+Mt5yvLPgDMNXahfvMGdpKj5wvI+AmuErtYv3NmdpKl5xfEQIyPCV2sWHmLM0FW84PjkwiuErtYtPOmdpj+hRRYiJ8Wu5awCVy4ma6gBHHGgNNnIHldx3gCnnao9HgMaDCtxBJfcdGJ2TNdWBH3FgE3jPHVRy34H1OVl71ACk5qB5CazlvgOvcrL2mYnBQ+RVsJb7DoLJyZrqQI84SAosL4S13HcQQ07WVAeOO9DKguK1sJb7nUipnKw9nkLuw56Xw1ruO0CbkzXVQRxxYBA0r4i13HegY07WPg6etxNG0ZTyu4kI6qU62hFA01aLjM/bAxSotTSLGLSoLSjtF6yft+oL1AV4qh81
tKgtKO0S1Mx+X6ABaa4waFFbUE+T0c6c18/Q6Gh6MGhRW1DaEWgzr7EUaIq0fBi0qC1oshD1ayNF1LRkGLWSW9jc/i3O6+MVV9OeIHFukZtc3Qu2m2E0tA2IHFrkJtQ4cGlew664TkMKnFvkJpe6O728vHLBovfgeG2q5CbXawi96tSfVFEB8vJUyU0udXLTK1AjLbniJgOBV6hKbnJjgjS7ET+/USp6C+RFqpKbTUAZcK8uU5q+Jl6nKrnJpauxV6m6LU8beu/jpaqSm1zqi6G3fgdcLU8ejza2L+LDg43GUcT42YL4Nn5Icd08pMh3zDnsGF5fRuoS1Da+TXWGsakTRt2EVsvjdsaG3Z1V7vQwd19O/63vJL6Tn9an53JQfpfiP9UvoXUKZW5kc3RyZWFtCmVuZG9iagoxMiAwIG9iago4NTcKZW5kb2JqCjEwIDAgb2JqClsgXQplbmRvYmoKMTggMCBvYmoKPDwgL0ZpbHRlciAvRmxhdGVEZWNvZGUgL0xlbmd0aCA3OSA+PgpzdHJlYW0KeJwzNzVSMFCwtAASZqYmCuZGlgophlxAPoiVy2VoaQ5m5YBZJsYGQJapqSkSCyIL0wthweRgtLGJOdQEBAskB7Y2B2ZbDlcGVxoA1pQcDAplbmRzdHJlYW0KZW5kb2JqCjE5IDAgb2JqCjw8IC9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9MZW5ndGggNjEgPj4Kc3RyZWFtCnicMzU1VzBQsLQAEqamRgrmRpYKKYZcQD6IlctlaGkOZuWAWRbGQAZIGZxhAKTBmnNgenK4MrjSAMsVEMwKZW5kc3RyZWFtCmVuZG9iagoyMCAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDMwNyA+PgpzdHJlYW0KeJw9kktuAzEMQ/c+hS4QwPrZnvOkKLqY3n/bJyXpihzZFkVqlrpMWVMekDSThH/p8HCxnfI7bM9mZuBaopeJ5ZTn0BVi7qJ82cxGXVknxeqEZjq36FE5Fwc2Taqfqyyl3S54Dtcmnlv2ET+80KAe1DUuCTd0V6NlKTRjqvt/0nv8jDLgakxdbFKrex88XkRV6OgHR4kiY5cX5+NBCelKwmhaiJV3RQNB7vK0ynsJ7tveasiyB6mYzjspZrDrdFIubheHIR7I8qjw5aPYa0LP+LArJfRI2IYzcifuaMbm1MjikP7ejQRLj65oIfPgr27WLmC8UzpFYmROcqxpi1VO91AU07nDvQwQ9WxFQylzkdXqX8POC2uWbBZ4SvoFHqPdJksOVtnbqE7vrTzZ0PcfWtd0HwplbmRzdHJlYW0KZW5kb2JqCjIxIDAgb2JqCjw8IC9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9MZW5ndGggNjggPj4Kc3RyZWFtCnicMza0UDBQMDdX0DU0NFUwMjJQMDQyUUgx5DI0NAczc7lggjlglokBkGEIJMEacrhgWnPAOiCyUK05XBlcaQBxohJnCmVuZHN0cmVhbQplbmRvYmoKMjIgMCBvYmoKPDwgL0ZpbHRlciAvRmxhdGVEZWNvZGUgL0xlbmd0aCAyMzEgPj4Kc3RyZWFtCnicNU85kgQhDMt5hT4wVRjbQL+np7Y22Pl/upKZTpDwIcnTEx2ZeJkjI7Bmx9taZCBm4FNMxb/2tA8TqvfgHiKUiwthhpFw1qzjbp6OF/92lc9YB+82+IpZXhDYwkzWVxZnLtsFY2mcxDnJboxdE7GNda2nU1hHMKEMhHS2w5Qgc1Sk9MmOMuboOJEnnovv9tssdjl+DusLNo0hFef4KnqCNoOi7HnvAhpyQf9d3fgeRbvoJSAbCRbWUWLunOWEX712dB61KBJzQppBLhMhzekqphCaUKyzo6BSUXCpPqforJ9/5V9cLQplbmRzdHJlYW0KZW5kb2JqCjIzIDAgb2JqCjw8IC9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9MZW5n
dGggMjQ5ID4+CnN0cmVhbQp4nD1QO45EIQzrOYUv8CTyI3AeRqstZu/frgOaKVBMfrYzJNARgUcMMZSv4yWtoK6Bv4tC8W7i64PCIKtDUiDOeg+IdOymNpETOh2cMz9hN2OOwEUxBpzpdKY9ByY5+8IKhHMbZexWSCeJqiKO6jOOKZ4qe594FiztyDZbJ5I95CDhUlKJyaWflMo/bcqUCjpm0QQsErngZBNNOMu7SVKMGZQy6h6mdiJ9rDzIozroZE3OrCOZ2dNP25n4HHC3X9pkTpXHdB7M+Jy0zoM5Fbr344k2B02N2ujs9xNpKi9Sux1anX51EpXdGOcYEpdnfxnfZP/5B/6HWiIKZW5kc3RyZWFtCmVuZG9iagoyNCAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDM5NSA+PgpzdHJlYW0KeJw9UktuxUAI2+cUXKDS8JvPeVJV3bz7b2tDUqkqvIkxxjB9ypC55UtdEnGFybderls8pnwuW1qZeYi7i40lPrbcl+4htl10LrE4HUfyCzKdKkSozarRofhCloUHkE7woQvCfTn+4y+AwdewDbjhPTJBsCTmKULGblEZmhJBEWHnkRWopFCfWcLfUe7r9zIFam+MpQtjHPQJtAVCbUjEAupAAETslFStkI5nJBO/Fd1nYhxg59GyAa4ZVESWe+zHiKnOqIy8RMQ+T036KJZMLVbGblMZX/yUjNR8dAUqqTTylPLQVbPQC1iJeRL2OfxI+OfWbCGGOm7W8onlHzPFMhLOYEs5YKGX40fg21l1Ea4dubjOdIEfldZwTLTrfsj1T/5021rNdbxyCKJA5U1B8LsOrkaxxMQyPp2NKXqiLLAamrxGM8FhEBHW98PIAxr9crwQNKdrIrRYIpu1YkSNimxzPb0E1kzvxTnWwxPCbO+d1qGyMzMqIYLauoZq60B2s77zcLafPzPoom0KZW5kc3RyZWFtCmVuZG9iagoyNSAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDI0OSA+PgpzdHJlYW0KeJxNUUmKAzAMu+cV+kAhXpO8p0OZQ+f/18oOhTkECa+Sk5aYWAsPMYQfLD34kSFzN/0bfqLZu1l6ksnZ/5jnIlNR+FKoLmJCXYgbz6ER8D2haxJZsb3xOSyjmXO+Bx+FuAQzoQFjfUkyuajmlSETTgx1HA5apMK4a2LD4lrRPI3cbvtGZmUmhA2PZELcGICIIOsCshgslDY2EzJZzgPtDckNWmDXqRtRi4IrlNYJdKJWxKrM4LPm1nY3Qy3y4Kh98fpoVpdghdFL9Vh4X4U+mKmZdu6SQnrhTTsizB4KpDI7LSu1e8TqboH6P8tS8P3J9/gdrw/N/FycCmVuZHN0cmVhbQplbmRvYmoKMjYgMCBvYmoKPDwgL0ZpbHRlciAvRmxhdGVEZWNvZGUgL0xlbmd0aCA5NCA+PgpzdHJlYW0KeJxFjcERwCAIBP9UQQkKCtpPJpOH9v+NEDJ8YOcO7oQFC7Z5Rh8FlSZeFVgHSmPcUI9AveFyLcncBQ9wJ3/a0FScltN3aZFJVSncpBJ5/w5nJpCoedFjnfcLY/sjPAplbmRzdHJlYW0KZW5kb2JqCjI3IDAgb2JqCjw8IC9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9MZW5ndGggMzIyID4+CnN0cmVhbQp4nDVRu23FMAzsNQUXMCB+Jc3jIEiRt3+bO9qpSNO8H1VeMqVcLnXJKllh8qVDdYqmfJ5mpvwO9ZDjmB7ZIbpT1pZ7GBaWiXlKHbGaLPdwCza+AJoScwvx9wjwK4BRwESgbvH3D7pZEkAaFPwU6JqrllhiAg2Lha3ZFeJW3SlYuKv4diS5BwlyMVnoUw5Fiim3wHwZLNmRWpzrclkK/259AhphhTjss4tE4HnAA0wk/mSAbM8+W+zq6kU2doY46dCAi4CbzSQBQVM4qz64
Yftqu+bnmSgnODnWr6Ixvg1O5ktS3le5x8+gQd74Mzxnd45QDppQCPTdAiCH3cBGhD61z8AuA7ZJu3djSvmcZCm+BDYK9qhTHcrwYuzMVm/Y/MfoymZRbJCV9dHpDsrcoBNiHm9koVuytvs3D7N9/wFfGXtkCmVuZHN0cmVhbQplbmRvYmoKMjggMCBvYmoKPDwgL0ZpbHRlciAvRmxhdGVEZWNvZGUgL0xlbmd0aCA4MyA+PgpzdHJlYW0KeJxFjLsNwDAIRHumYAR+JvY+UZTC3r8NECVuuCfdPVwdCZkpbjPDQwaeDCyGXXGB9JYwC1xHUI6d7KNh1b7qBI31plLz7w+Unuys4obrAQJCGmYKZW5kc3RyZWFtCmVuZG9iagoyOSAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDE2MCA+PgpzdHJlYW0KeJxFkDkSAzEIBHO9gidIXIL3rMu1wfr/qQfWR6LpAjQcuhZNynoUaD7psUahutBr6CxKkkTBFpIdUKdjiDsoSExIY5JIth6DI5pYs12YmVQqs1LhtGnFwr/ZWtXIRI1wjfyJ6QZU/E/qXJTwTYOvkjH6GFS8O4OMSfheRdxaMe3+RDCxGfYJb0UmBYSJsanZvs9ghsz3Ctc4x/MNTII36wplbmRzdHJlYW0KZW5kb2JqCjMwIDAgb2JqCjw8IC9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9MZW5ndGggNzAgPj4Kc3RyZWFtCnicMzM2UzBQsDACEqamhgrmRpYKKYZcQD6IlcsFE8sBs8wszIEsIwuQlhwuQwtjMG1ibKRgZmIGZFkgMSC6MrjSAJiaEwMKZW5kc3RyZWFtCmVuZG9iagozMSAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDMyMCA+PgpzdHJlYW0KeJw1UktuBTEI288puECl8E/O86qqi777b2sTvRVMMGDjKS9Z0ku+1CXbpcPkWx/3JbFC3o/tmsxSxfcWsxTPLa9HzxG3LQoEURM9WJkvFSLUz/ToOqhwSp+BVwi3FBu8g0kAg2r4Bx6lMyBQ50DGu2IyUgOCJNhzaXEIiXImiX+kvJ7fJ62kofQ9WZnL35NLpdAdTU7oAcXKxUmgXUn5oJmYSkSSl+t9sUL0hsCSPD5HMcmA7DaJbaIFJucepSXMxBQ6sMcCvGaa1VXoYMIehymMVwuzqB5s8lsTlaQdreMZ2TDeyzBTYqHhsAXU5mJlgu7l4zWvwojtUZNdw3Duls13CNFo/hsWyuBjFZKAR6exEg1pOMCIwJ5eOMVe8xM5DsCIY52aLAxjaCaneo6JwNCes6VhxsceWvXzD1TpfIcKZW5kc3RyZWFtCmVuZG9iagozMiAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDE4ID4+CnN0cmVhbQp4nDM2tFAwgMMUQ640AB3mA1IKZW5kc3RyZWFtCmVuZG9iagozMyAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDM0MCA+PgpzdHJlYW0KeJw1UjluBDEM6/0KfSCAbtvv2SBIkfy/DanZFANxdFKUO1pUdsuHhVS17HT5tJXaEjfkd2WFxAnJqxLtUoZIqLxWIdXvmTKvtzVnBMhSpcLkpORxyYI/w6WnC8f5trGv5cgdjx5YFSOhRMAyxcToGpbO7rBmW36WacCPeIScK9Ytx1gFUhvdOO2K96F5LbIGiL2ZlooKHVaJFn5B8aBHjX32GFRYINHtHElwjIlQkYB2gdpIDDl7LHZRH/QzKDET6NobRdxBgSWSmDnFunT03/jQsaD+2Iw3vzoq6VtaWWPSPhvtlMYsMul6WPR089bHgws076L859UMEjRljZLGB63aOYaimVFWeLdDkw3NMcch8w6ewxkJSvo8FL+PJRMdlMjfDg2hf18e
o4ycNt4C5qI/bRUHDuKzw165gRVKF2uS9wGpTOiB6f+v8bW+19cfHe2AxgplbmRzdHJlYW0KZW5kb2JqCjM0IDAgb2JqCjw8IC9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9MZW5ndGggMjUxID4+CnN0cmVhbQp4nC1RSXIDQQi7zyv0hGan32OXK4fk/9cIygcGDYtAdFrioIyfICxXvOWRq2jD3zMxgt8Fh34r121Y5EBUIEljUDWhdvF69B7YcZgJzJPWsAxmrA/8jCnc6MXhMRlnt9dl1BDsXa89mUHJrFzEJRMXTNVhI2cOP5kyLrRzPTcg50ZYl2GQblYaMxKONIVIIYWqm6TOBEESjK5GjTZyFPulL490hlWNqDHscy1tX89NOGvQ7Fis8uSUHl1xLicXL6wc9PU2AxdRaazyQEjA/W4P9XOyk994S+fOFtPje83J8sJUYMWb125ANtXi37yI4/uMr+fn+fwDX2BbiAplbmRzdHJlYW0KZW5kb2JqCjM1IDAgb2JqCjw8IC9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9MZW5ndGggMTQxID4+CnN0cmVhbQp4nD2PwQ7DMAhD7/kK/0Ck2CmhfE+naofu/68jS7sLegJjjIXQ0BuqmsOGYJvjxdIlVGv4FMVAJTfImWAOpaTSHUeRemI4GFwetBuO4rHo+hG7kmZ90MZCuiVogHusU2ncpnETxB01Beop6pyjvBC5n6ln2DSS3TSzknO4Db97z1PX/6ervMv5Bb13Lv4KZW5kc3RyZWFtCmVuZG9iagozNiAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDIxNSA+PgpzdHJlYW0KeJw1UTkOAyEM7PcV/kAkjC94T6Iozf6/zYzRVh7BXIa0lCGZ8lKTqCHlUz56mS6cutzXzGo055a0LXOAuLa8L62SwIlmiIPBaZi4AZo8AUPX0ahRQxce0NSlUyiw3AQ+irduD91jtYGXtiHniSBiKBksQc2pRRMWbc8npDW/Xosb3pft3chTpcaWGIEGAVY4HNfo1/CVPU8m0XQVMtSrNcsYCRNFIjz5jqbVE+taNNIyEtTGEaxqA7w7/TBOAAATccsCZJ9KlLPkxG+x9LMGV/r+AZ9HVJYKZW5kc3RyZWFtCmVuZG9iagoxNiAwIG9iago8PCAvQmFzZUZvbnQgL0RlamFWdVNhbnMgL0NoYXJQcm9jcyAxNyAwIFIKL0VuY29kaW5nIDw8Ci9EaWZmZXJlbmNlcyBbIDMyIC9zcGFjZSA0NCAvY29tbWEgNDggL3plcm8gL29uZSAvdHdvIC90aHJlZSAvZm91ciAvZml2ZSAvc2l4IC9zZXZlbgovZWlnaHQgL25pbmUgNzIgL0ggNzYgL0wgOTcgL2EgMTAwIC9kIC9lIDExNCAvciAxMjEgL3kgXQovVHlwZSAvRW5jb2RpbmcgPj4KL0ZpcnN0Q2hhciAwIC9Gb250QkJveCBbIC0xMDIxIC00NjMgMTc5NCAxMjMzIF0gL0ZvbnREZXNjcmlwdG9yIDE1IDAgUgovRm9udE1hdHJpeCBbIDAuMDAxIDAgMCAwLjAwMSAwIDAgXSAvTGFzdENoYXIgMjU1IC9OYW1lIC9EZWphVnVTYW5zCi9TdWJ0eXBlIC9UeXBlMyAvVHlwZSAvRm9udCAvV2lkdGhzIDE0IDAgUiA+PgplbmRvYmoKMTUgMCBvYmoKPDwgL0FzY2VudCA5MjkgL0NhcEhlaWdodCAwIC9EZXNjZW50IC0yMzYgL0ZsYWdzIDMyCi9Gb250QkJveCBbIC0xMDIxIC00NjMgMTc5NCAxMjMzIF0gL0ZvbnROYW1lIC9EZWphVnVTYW5zIC9JdGFsaWNBbmdsZSAwCi9NYXhXaWR0aCAxMzQyIC9TdGVtViAwIC9UeXBlIC9Gb250RGVzY3JpcHRvciAvWEhlaWdodCAwID4+CmVu
ZG9iagoxNCAwIG9iagpbIDYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwCjYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwIDYwMCA2MDAgMzE4IDQwMSA0NjAgODM4IDYzNgo5NTAgNzgwIDI3NSAzOTAgMzkwIDUwMCA4MzggMzE4IDM2MSAzMTggMzM3IDYzNiA2MzYgNjM2IDYzNiA2MzYgNjM2IDYzNiA2MzYKNjM2IDYzNiAzMzcgMzM3IDgzOCA4MzggODM4IDUzMSAxMDAwIDY4NCA2ODYgNjk4IDc3MCA2MzIgNTc1IDc3NSA3NTIgMjk1CjI5NSA2NTYgNTU3IDg2MyA3NDggNzg3IDYwMyA3ODcgNjk1IDYzNSA2MTEgNzMyIDY4NCA5ODkgNjg1IDYxMSA2ODUgMzkwIDMzNwozOTAgODM4IDUwMCA1MDAgNjEzIDYzNSA1NTAgNjM1IDYxNSAzNTIgNjM1IDYzNCAyNzggMjc4IDU3OSAyNzggOTc0IDYzNCA2MTIKNjM1IDYzNSA0MTEgNTIxIDM5MiA2MzQgNTkyIDgxOCA1OTIgNTkyIDUyNSA2MzYgMzM3IDYzNiA4MzggNjAwIDYzNiA2MDAgMzE4CjM1MiA1MTggMTAwMCA1MDAgNTAwIDUwMCAxMzQyIDYzNSA0MDAgMTA3MCA2MDAgNjg1IDYwMCA2MDAgMzE4IDMxOCA1MTggNTE4CjU5MCA1MDAgMTAwMCA1MDAgMTAwMCA1MjEgNDAwIDEwMjMgNjAwIDUyNSA2MTEgMzE4IDQwMSA2MzYgNjM2IDYzNiA2MzYgMzM3CjUwMCA1MDAgMTAwMCA0NzEgNjEyIDgzOCAzNjEgMTAwMCA1MDAgNTAwIDgzOCA0MDEgNDAxIDUwMCA2MzYgNjM2IDMxOCA1MDAKNDAxIDQ3MSA2MTIgOTY5IDk2OSA5NjkgNTMxIDY4NCA2ODQgNjg0IDY4NCA2ODQgNjg0IDk3NCA2OTggNjMyIDYzMiA2MzIgNjMyCjI5NSAyOTUgMjk1IDI5NSA3NzUgNzQ4IDc4NyA3ODcgNzg3IDc4NyA3ODcgODM4IDc4NyA3MzIgNzMyIDczMiA3MzIgNjExIDYwNQo2MzAgNjEzIDYxMyA2MTMgNjEzIDYxMyA2MTMgOTgyIDU1MCA2MTUgNjE1IDYxNSA2MTUgMjc4IDI3OCAyNzggMjc4IDYxMiA2MzQKNjEyIDYxMiA2MTIgNjEyIDYxMiA4MzggNjEyIDYzNCA2MzQgNjM0IDYzNCA1OTIgNjM1IDU5MiBdCmVuZG9iagoxNyAwIG9iago8PCAvSCAxOCAwIFIgL0wgMTkgMCBSIC9hIDIwIDAgUiAvY29tbWEgMjEgMCBSIC9kIDIyIDAgUiAvZSAyMyAwIFIKL2VpZ2h0IDI0IDAgUiAvZml2ZSAyNSAwIFIgL2ZvdXIgMjYgMCBSIC9uaW5lIDI3IDAgUiAvb25lIDI4IDAgUiAvciAyOSAwIFIKL3NldmVuIDMwIDAgUiAvc2l4IDMxIDAgUiAvc3BhY2UgMzIgMCBSIC90aHJlZSAzMyAwIFIgL3R3byAzNCAwIFIgL3kgMzUgMCBSCi96ZXJvIDM2IDAgUiA+PgplbmRvYmoKMyAwIG9iago8PCAvRjEgMTYgMCBSID4+CmVuZG9iago0IDAgb2JqCjw8IC9BMSA8PCAvQ0EgMCAvVHlwZSAvRXh0R1N0YXRlIC9jYSAxID4+Ci9BMiA8PCAvQ0EgMSAvVHlwZSAvRXh0R1N0YXRlIC9jYSAxID4+ID4+CmVuZG9iago1IDAgb2JqCjw8ID4+CmVuZG9iago2IDAgb2JqCjw8ID4+CmVuZG9iago3IDAgb2JqCjw8IC9JMSAxMyAw
IFIgPj4KZW5kb2JqCjEzIDAgb2JqCjw8IC9CaXRzUGVyQ29tcG9uZW50IDgKL0NvbG9yU3BhY2UgWy9JbmRleGVkIC9EZXZpY2VSR0IgNDQgKP3nJOnkGbXdK5/ZOJfYPpXXP5DWQ43WRIjVR4PTS37STmnMW1PFZ0/DaVwoe45cKXiOL2mNMGiNMWSNMmKNM2CNNF+NNV2MNVxcjDZbjDZajDdZjDdYjDhXjDhWizlVizlUizpSiztRijxOij5IiD9Fh0YMX0YLXkYJXFxFCFtFBlpFBVhEAlVEAVQpXQovRGVjb2RlUGFybXMgPDwgL0NvbG9ycyAxIC9Db2x1bW5zIDIxOCAvUHJlZGljdG9yIDEwID4+Ci9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9IZWlnaHQgMjE4IC9MZW5ndGggMzcgMCBSIC9TdWJ0eXBlIC9JbWFnZQovVHlwZSAvWE9iamVjdCAvV2lkdGggMjE4ID4+CnN0cmVhbQp4nO3cyXITMRSGUUOY5yGMCTOBEPz+z0d5p98Ocky1OtfmfDsv2q3TK99qWYtF9LTtPFruWws0tEqhoZUKDa1UaGilOmTas+io7Xt00Xbdy75KaGilQkMrFRpaqdDQSrX4GX1qux8dt+3DUICGVio0tFKhoZUKDa1Uh0zLjzG5fItutr2LakLR0NDmCQ0NbZ7Q0NDm6f+hReG8+NB2J+pAZ4NshoaGNk9oaGjzhIaGNk89WhYr/hgl9LTtRzQQshnaEg1tltCWaGizhLZEQ5sltPVyj9Dz6HHbqygvm1ayEdp6aGhjQlsPDW1MaOuhoY3pH2nZWfS27WF0/Pcd9VOsI0Prh4Y2VWj90NCmCq0fGtpUofX7HYXzc3Q3et82/byD1g8NDW1raP3Q0NC2htYPbR9pWThzt8+L6FHby2iKeQdtl9DQ0C4JbZfQ0NAuCW2XDpjWKYaCs5O2OJP+6Gtb/h33yjdDmyg0tC2hTRQa2pbQJgoNbUtoQ4rJJQ/RudcWj+DkV9T5erQhoaFthDYkNLSN0IaEhrYR2vhyt8+bttvRl6jjRBsfGtoqtPGhoa1CGx8a2qoytCyGgvzl/yB63RZXnaPNHRpaqdDQSoWGVio0tLrliuPg+dNbbfneAO1aQ0MrFRpaqdDQSoW2j7QsN9Q/absRoRUKDa1UaGilQkMrFdpB0/4AI6M+hwplbmRzdHJlYW0KZW5kb2JqCjM3IDAgb2JqCjUyNAplbmRvYmoKMiAwIG9iago8PCAvQ291bnQgMSAvS2lkcyBbIDExIDAgUiBdIC9UeXBlIC9QYWdlcyA+PgplbmRvYmoKMzggMCBvYmoKPDwgL0NyZWF0aW9uRGF0ZSAoRDoyMDIxMTIwNDE2NTgyOCswMicwMCcpCi9DcmVhdG9yIChNYXRwbG90bGliIHYzLjQuMywgaHR0cHM6Ly9tYXRwbG90bGliLm9yZykKL1Byb2R1Y2VyIChNYXRwbG90bGliIHBkZiBiYWNrZW5kIHYzLjQuMykgPj4KZW5kb2JqCnhyZWYKMCAzOQowMDAwMDAwMDAwIDY1NTM1IGYgCjAwMDAwMDAwMTYgMDAwMDAgbiAKMDAwMDAwOTQ2MiAwMDAwMCBuIAowMDAwMDA4MzI4IDAwMDAwIG4gCjAwMDAwMDgzNjAgMDAwMDAgbiAKMDAwMDAwODQ1OSAwMDAwMCBuIAowMDAwMDA4NDgwIDAwMDAwIG4gCjAwMDAwMDg1MDEgMDAwMDAgbiAKMDAwMDAwMDA2NSAwMDAwMCBuIAowMDAwMDAwNDAyIDAwMDAwIG4gCjAwMDAwMDEzNTQgMDAwMDAgbiAKMDAwMDAwMDIwOCAwMDAwMCBuIAowMDAwMDAxMzM0IDAwMDAwIG4gCjAwMDAwMDg1MzMgMDAwMDAgbiAKMDAwMDAwNzAyNSAwMDAwMCBuIAowMDAwMDA2ODI1IDAwMDAwIG4gCjAwMDAwMDY0MDcg
MDAwMDAgbiAKMDAwMDAwODA3OCAwMDAwMCBuIAowMDAwMDAxMzc0IDAwMDAwIG4gCjAwMDAwMDE1MjUgMDAwMDAgbiAKMDAwMDAwMTY1OCAwMDAwMCBuIAowMDAwMDAyMDM4IDAwMDAwIG4gCjAwMDAwMDIxNzggMDAwMDAgbiAKMDAwMDAwMjQ4MiAwMDAwMCBuIAowMDAwMDAyODA0IDAwMDAwIG4gCjAwMDAwMDMyNzIgMDAwMDAgbiAKMDAwMDAwMzU5NCAwMDAwMCBuIAowMDAwMDAzNzYwIDAwMDAwIG4gCjAwMDAwMDQxNTUgMDAwMDAgbiAKMDAwMDAwNDMxMCAwMDAwMCBuIAowMDAwMDA0NTQzIDAwMDAwIG4gCjAwMDAwMDQ2ODUgMDAwMDAgbiAKMDAwMDAwNTA3OCAwMDAwMCBuIAowMDAwMDA1MTY4IDAwMDAwIG4gCjAwMDAwMDU1ODEgMDAwMDAgbiAKMDAwMDAwNTkwNSAwMDAwMCBuIAowMDAwMDA2MTE5IDAwMDAwIG4gCjAwMDAwMDk0NDIgMDAwMDAgbiAKMDAwMDAwOTUyMiAwMDAwMCBuIAp0cmFpbGVyCjw8IC9JbmZvIDM4IDAgUiAvUm9vdCAxIDAgUiAvU2l6ZSAzOSA+PgpzdGFydHhyZWYKOTY3OQolJUVPRgo=\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-12-04T16:58:27.918905\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}], "source": ["plot_attention_maps(data_input, attention_maps, idx=0)"]}, {"cell_type": "markdown", "id": "163001ca", "metadata": {"papermill": {"duration": 0.169201, "end_time": "2021-12-04T15:58:28.432387", "exception": false, "start_time": "2021-12-04T15:58:28.263186", "status": "completed"}, "tags": []}, "source": ["The model has learned to attend to the token that is on the flipped index of itself.\n", "Hence, it actually does what we intended it to do.\n", "We see that it however also pays some attention to values close to the flipped index.\n", "This is because the model doesn't need the perfect, hard attention to solve this problem,\n", "but is fine with this approximate, noisy attention map.\n", "The close-by indices are caused by the similarity of the positional encoding,\n", "which we also intended with the positional encoding."]}, {"cell_type": "markdown", "id": "d8ac4d91", "metadata": {"papermill": {"duration": 0.169547, "end_time": "2021-12-04T15:58:28.770515", "exception": false, "start_time": "2021-12-04T15:58:28.600968", "status": "completed"}, "tags": []}, "source": ["### Set Anomaly Detection\n", "\n", "Besides sequences, sets are another data structure that is relevant for many applications.\n", "In contrast to sequences, elements are unordered in a set.\n", "RNNs can only be applied on sets by assuming an order in the data, which however biases the model towards\n", "a non-existing order in the data.\n", "[Vinyals et al.\n", "(2015)](https://arxiv.org/abs/1511.06391) and other papers have shown that the assumed order can have a significant\n", "impact on the model's performance, and hence, we should try to not use RNNs on sets.\n", "Ideally, our model should be permutation-equivariant/invariant such that the output is the same no matter how we sort the elements in a set.\n", "\n", "Transformers offer the perfect architecture for this as the Multi-Head Attention is 
permutation-equivariant, and thus,\n", "outputs the same values no matter in what order we enter the inputs (inputs and outputs are permuted equally).\n", "The task we are looking at for sets is _Set Anomaly Detection_, which means that we try to find the element(s)\n", "in a set that do not fit the others.\n", "In the research community, the common application of anomaly detection is performed on a set of images,\n", "where $N-1$ images belong to the same category/have the same high-level features while one belongs to another category.\n", "Note that category does not necessarily have to relate to a class in a standard classification problem,\n", "but could be the combination of multiple features.\n", "For instance, on a face dataset, this could be people with glasses, male, beard, etc.\n", "An example of distinguishing different animals can be seen below.\n", "The first four images show foxes, while the last represents a different animal.\n", "We want to recognize that the last image shows a different animal, but it is not relevant which class of animal it is.\n", "\n", "
\n", "\n", "In this tutorial, we will use the CIFAR100 dataset.\n", "CIFAR100 has 600 images for each of its 100 classes, all with a resolution of 32x32, similar to CIFAR10.\n", "The larger number of classes requires the model to attend to specific features in the images instead\n", "of coarse features as in CIFAR10, therefore making the task harder.\n", "We will show the model a set of 9 images of one class, and 1 image from another class.\n", "The task is to find the image that is from a different class than the other images.\n", "Using the raw images directly as input to the Transformer is not a good idea, because the Transformer is not translation\n", "invariant like a CNN, and would need to learn to detect image features from high-dimensional input first of all.\n", "Instead, we will use a pre-trained ResNet34 model from the torchvision package to obtain high-level,\n", "low-dimensional features of the images.\n", "The ResNet model has been pre-trained on the [ImageNet](http://image-net.org/) dataset which contains\n", "1 million images of 1k classes and varying resolutions.\n", "However, during training and testing, the images are usually scaled to a resolution of 224x224,\n", "and hence we rescale our CIFAR images to this resolution as well.\n", "Below, we will load the dataset, and prepare the data for being processed by the ResNet model."]}, {"cell_type": "code", "execution_count": 26, "id": "5ff1954f", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:58:29.115622Z", "iopub.status.busy": "2021-12-04T15:58:29.115139Z", "iopub.status.idle": "2021-12-04T15:58:34.276229Z", "shell.execute_reply": "2021-12-04T15:58:34.275775Z"}, "papermill": {"duration": 5.338193, "end_time": "2021-12-04T15:58:34.276369", "exception": false, "start_time": "2021-12-04T15:58:28.938176", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Downloading https://www.cs.toronto.edu/~kriz/cifar-100-python.tar.gz to 
/__w/1/s/.datasets/cifar-100-python.tar.gz\n"]}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "efc763b5cd4e4ed9b3e3881bad434e2b", "version_major": 2, "version_minor": 0}, "text/plain": [" 0%| | 0/169001437 [00:00150MB free disk space.\n", "So it is recommended to run this only on a local computer if you have enough free disk and a GPU (GoogleColab is fine for this).\n", "If you do not have a GPU, you can download the features from the\n", "[GoogleDrive folder](https://drive.google.com/drive/folders/1DF7POc6j03pRiWQPWSl5QJX5iY-xK0sV?usp=sharing)."]}, {"cell_type": "code", "execution_count": 28, "id": "68fcd0ab", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:58:37.486821Z", "iopub.status.busy": "2021-12-04T15:58:37.484217Z", "iopub.status.idle": "2021-12-04T15:59:11.196064Z", "shell.execute_reply": "2021-12-04T15:59:11.196470Z"}, "papermill": {"duration": 33.893166, "end_time": "2021-12-04T15:59:11.196649", "exception": false, "start_time": "2021-12-04T15:58:37.303483", "status": "completed"}, "tags": []}, "outputs": [{"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "336b58f1c17b4c2998f77978c46f92b2", "version_major": 2, "version_minor": 0}, "text/plain": [" 0%| | 0/391 [00:00= anomaly_label:\n", " set_label += 1\n", "\n", " # Sample images from the class determined above\n", " img_indices = np.random.choice(self.img_idx_by_label.shape[1], size=self.set_size, replace=False)\n", " img_indices = self.img_idx_by_label[set_label, img_indices]\n", " return img_indices\n", "\n", " def __len__(self):\n", " return self.img_feats.shape[0]\n", "\n", " def __getitem__(self, idx):\n", " anomaly = self.img_feats[idx]\n", " if self.train: # If train => sample\n", " img_indices = self.sample_img_set(self.labels[idx])\n", " else: # If test => use pre-generated ones\n", " img_indices = self.test_sets[idx]\n", "\n", " # Concatenate images. 
The anomaly is always the last image for simplicity\n", " img_set = torch.cat([self.img_feats[img_indices], anomaly[None]], dim=0)\n", " indices = torch.cat([img_indices, torch.LongTensor([idx])], dim=0)\n", " label = img_set.shape[0] - 1\n", "\n", " # We return the indices of the images for visualization purpose. \"Label\" is the index of the anomaly\n", " return img_set, indices, label"]}, {"cell_type": "markdown", "id": "2fc781ed", "metadata": {"papermill": {"duration": 0.177543, "end_time": "2021-12-04T15:59:13.783170", "exception": false, "start_time": "2021-12-04T15:59:13.605627", "status": "completed"}, "tags": []}, "source": ["Next, we can set up our datasets and data loaders below.\n", "Here, we will use a set size of 10, i.e. 9 images from one category + 1 anomaly.\n", "Feel free to change it if you want to experiment with the sizes."]}, {"cell_type": "code", "execution_count": 32, "id": "d089f9e7", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:59:14.150564Z", "iopub.status.busy": "2021-12-04T15:59:14.150080Z", "iopub.status.idle": "2021-12-04T15:59:15.603980Z", "shell.execute_reply": "2021-12-04T15:59:15.603533Z"}, "papermill": {"duration": 1.641455, "end_time": "2021-12-04T15:59:15.604117", "exception": false, "start_time": "2021-12-04T15:59:13.962662", "status": "completed"}, "tags": []}, "outputs": [], "source": ["SET_SIZE = 10\n", "test_labels = torch.LongTensor(test_set.targets)\n", "\n", "train_anom_dataset = SetAnomalyDataset(train_feats, train_labels, set_size=SET_SIZE, train=True)\n", "val_anom_dataset = SetAnomalyDataset(val_feats, val_labels, set_size=SET_SIZE, train=False)\n", "test_anom_dataset = SetAnomalyDataset(test_feats, test_labels, set_size=SET_SIZE, train=False)\n", "\n", "train_anom_loader = data.DataLoader(\n", " train_anom_dataset, batch_size=64, shuffle=True, drop_last=True, num_workers=4, pin_memory=True\n", ")\n", "val_anom_loader = data.DataLoader(val_anom_dataset, batch_size=64, shuffle=False, 
drop_last=False, num_workers=4)\n", "test_anom_loader = data.DataLoader(test_anom_dataset, batch_size=64, shuffle=False, drop_last=False, num_workers=4)"]}, {"cell_type": "markdown", "id": "70f843f4", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.178644, "end_time": "2021-12-04T15:59:15.961336", "exception": false, "start_time": "2021-12-04T15:59:15.782692", "status": "completed"}, "tags": []}, "source": ["To understand the dataset a little better, we can plot below a few sets from the test dataset.\n", "Each row shows a different input set, where the first 9 are from the same class."]}, {"cell_type": "code", "execution_count": 33, "id": "cf7e1059", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:59:16.325926Z", "iopub.status.busy": "2021-12-04T15:59:16.325451Z", "iopub.status.idle": "2021-12-04T15:59:17.628117Z", "shell.execute_reply": "2021-12-04T15:59:17.628507Z"}, "papermill": {"duration": 1.488315, "end_time": "2021-12-04T15:59:17.628671", "exception": false, "start_time": "2021-12-04T15:59:16.140356", "status": "completed"}, "tags": []}, "outputs": [{"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-12-04T16:59:16.867016\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}], "source": ["def visualize_exmp(indices, orig_dataset):\n", " images = [orig_dataset[idx][0] for idx in indices.reshape(-1)]\n", " images = torch.stack(images, dim=0)\n", " images = images * TORCH_DATA_STD + TORCH_DATA_MEANS\n", "\n", " img_grid = torchvision.utils.make_grid(images, nrow=SET_SIZE, normalize=True, pad_value=0.5, padding=16)\n", " img_grid = img_grid.permute(1, 2, 0)\n", "\n", " plt.figure(figsize=(12, 8))\n", " plt.title(\"Anomaly examples on CIFAR100\")\n", " plt.imshow(img_grid)\n", " plt.axis(\"off\")\n", " plt.show()\n", " plt.close()\n", "\n", "\n", "_, indices, _ = next(iter(test_anom_loader))\n", "visualize_exmp(indices[:4], test_set)"]}, {"cell_type": "markdown", "id": "48c08ca7", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.1952, "end_time": "2021-12-04T15:59:18.016890", "exception": false, "start_time": "2021-12-04T15:59:17.821690", "status": "completed"}, "tags": []}, "source": ["We can already see that for some sets the task might be easier than for others.\n", "Difficulties can especially arise if the anomaly is in a different, but yet visually similar class\n", "(e.g. 
train vs bus, flour vs worm, etc.).\n", "\n", "After having prepared the data, we can look closer at the model.\n", "Here, we have a classification of the whole set.\n", "For the prediction to be permutation-equivariant, we will output one logit for each image.\n", "Over these logits, we apply a softmax and train the anomaly image to have the highest score/probability.\n", "This is a bit different than a standard classification layer as the softmax is applied over images,\n", "not over output classes in the classical sense.\n", "However, if we swap two images in their position, we effectively swap their position in the output softmax.\n", "Hence, the prediction is equivariant with respect to the input.\n", "We implement this idea below in a subclass of the Transformer Lightning module."]}, {"cell_type": "code", "execution_count": 34, "id": "cad86c76", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:59:18.412870Z", "iopub.status.busy": "2021-12-04T15:59:18.412388Z", "iopub.status.idle": "2021-12-04T15:59:18.414272Z", "shell.execute_reply": "2021-12-04T15:59:18.413887Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 0.20176, "end_time": "2021-12-04T15:59:18.414384", "exception": false, "start_time": "2021-12-04T15:59:18.212624", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class AnomalyPredictor(TransformerPredictor):\n", " def _calculate_loss(self, batch, mode=\"train\"):\n", " img_sets, _, labels = batch\n", " # No positional encodings as it is a set, not a sequence!\n", " preds = self.forward(img_sets, add_positional_encoding=False)\n", " preds = preds.squeeze(dim=-1) # Shape: [Batch_size, set_size]\n", " loss = F.cross_entropy(preds, labels) # Softmax/CE over set dimension\n", " acc = (preds.argmax(dim=-1) == labels).float().mean()\n", " self.log(\"%s_loss\" % mode, loss)\n", " self.log(\"%s_acc\" % mode, acc, on_step=False, on_epoch=True)\n", " return loss, acc\n", "\n", " def training_step(self, batch, 
batch_idx):\n", " loss, _ = self._calculate_loss(batch, mode=\"train\")\n", " return loss\n", "\n", " def validation_step(self, batch, batch_idx):\n", " _ = self._calculate_loss(batch, mode=\"val\")\n", "\n", " def test_step(self, batch, batch_idx):\n", " _ = self._calculate_loss(batch, mode=\"test\")"]}, {"cell_type": "markdown", "id": "d732d394", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.190651, "end_time": "2021-12-04T15:59:18.796683", "exception": false, "start_time": "2021-12-04T15:59:18.606032", "status": "completed"}, "tags": []}, "source": ["Finally, we write our train function below.\n", "It has the exact same structure as the reverse task one, hence not much of an explanation is needed here."]}, {"cell_type": "code", "execution_count": 35, "id": "261279ac", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:59:19.193945Z", "iopub.status.busy": "2021-12-04T15:59:19.193455Z", "iopub.status.idle": "2021-12-04T15:59:19.195328Z", "shell.execute_reply": "2021-12-04T15:59:19.194922Z"}, "papermill": {"duration": 0.207853, "end_time": "2021-12-04T15:59:19.195437", "exception": false, "start_time": "2021-12-04T15:59:18.987584", "status": "completed"}, "tags": []}, "outputs": [], "source": ["def train_anomaly(**kwargs):\n", " # Create a PyTorch Lightning trainer with the generation callback\n", " root_dir = os.path.join(CHECKPOINT_PATH, \"SetAnomalyTask\")\n", " os.makedirs(root_dir, exist_ok=True)\n", " trainer = pl.Trainer(\n", " default_root_dir=root_dir,\n", " callbacks=[ModelCheckpoint(save_weights_only=True, mode=\"max\", monitor=\"val_acc\")],\n", " gpus=1 if str(device).startswith(\"cuda\") else 0,\n", " max_epochs=100,\n", " gradient_clip_val=2,\n", " progress_bar_refresh_rate=1,\n", " )\n", " trainer.logger._default_hp_metric = None # Optional logging argument that we don't need\n", "\n", " # Check whether pretrained model exists. 
If yes, load it and skip training\n", " pretrained_filename = os.path.join(CHECKPOINT_PATH, \"SetAnomalyTask.ckpt\")\n", " if os.path.isfile(pretrained_filename):\n", " print(\"Found pretrained model, loading...\")\n", " model = AnomalyPredictor.load_from_checkpoint(pretrained_filename)\n", " else:\n", " model = AnomalyPredictor(max_iters=trainer.max_epochs * len(train_anom_loader), **kwargs)\n", " trainer.fit(model, train_anom_loader, val_anom_loader)\n", " model = AnomalyPredictor.load_from_checkpoint(trainer.checkpoint_callback.best_model_path)\n", "\n", " # Test best model on validation and test set\n", " train_result = trainer.test(model, test_dataloaders=train_anom_loader, verbose=False)\n", " val_result = trainer.test(model, test_dataloaders=val_anom_loader, verbose=False)\n", " test_result = trainer.test(model, test_dataloaders=test_anom_loader, verbose=False)\n", " result = {\n", " \"test_acc\": test_result[0][\"test_acc\"],\n", " \"val_acc\": val_result[0][\"test_acc\"],\n", " \"train_acc\": train_result[0][\"test_acc\"],\n", " }\n", "\n", " model = model.to(device)\n", " return model, result"]}, {"cell_type": "markdown", "id": "3a251275", "metadata": {"papermill": {"duration": 0.192005, "end_time": "2021-12-04T15:59:19.580159", "exception": false, "start_time": "2021-12-04T15:59:19.388154", "status": "completed"}, "tags": []}, "source": ["Let's finally train our model.\n", "We will use 4 layers with 4 attention heads each.\n", "The hidden dimensionality of the model is 256, and we use a dropout of 0.1 throughout the model for good regularization.\n", "Note that we also apply the dropout on the input features, as this makes the model more robust against\n", "image noise and helps it generalize better.\n", "Again, we use warmup to slowly start our model training."]}, {"cell_type": "code", "execution_count": 36, "id": "adc7b1bb", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:59:19.979138Z", "iopub.status.busy": "2021-12-04T15:59:19.978661Z", 
"iopub.status.idle": "2021-12-04T15:59:25.752247Z", "shell.execute_reply": "2021-12-04T15:59:25.752638Z"}, "papermill": {"duration": 5.981928, "end_time": "2021-12-04T15:59:25.752808", "exception": false, "start_time": "2021-12-04T15:59:19.770880", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/pytorch_lightning/trainer/connectors/callback_connector.py:90: LightningDeprecationWarning: Setting `Trainer(progress_bar_refresh_rate=1)` is deprecated in v1.5 and will be removed in v1.7. Please pass `pytorch_lightning.callbacks.progress.TQDMProgressBar` with `refresh_rate` directly to the Trainer's `callbacks` argument instead. Or, to disable the progress bar pass `enable_progress_bar = False` to the Trainer.\n", " rank_zero_deprecation(\n", "GPU available: True, used: True\n"]}, {"name": "stderr", "output_type": "stream", "text": ["TPU available: False, using: 0 TPU cores\n"]}, {"name": "stderr", "output_type": "stream", "text": ["IPU available: False, using: 0 IPUs\n"]}, {"name": "stderr", "output_type": "stream", "text": ["/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/pytorch_lightning/trainer/trainer.py:901: LightningDeprecationWarning: `trainer.test(test_dataloaders)` is deprecated in v1.4 and will be removed in v1.6. 
Use `trainer.test(dataloaders)` instead.\n", " rank_zero_deprecation(\n", "LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n"]}, {"name": "stderr", "output_type": "stream", "text": ["Missing logger folder: saved_models/Transformers/SetAnomalyTask/lightning_logs\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Found pretrained model, loading...\n"]}, {"name": "stderr", "output_type": "stream", "text": ["/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/pytorch_lightning/trainer/data_loading.py:453: UserWarning: Your `test_dataloader` has `shuffle=True`,it is strongly recommended that you turn this off for val/test/predict dataloaders.\n", " rank_zero_warn(\n"]}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "9c0f4106b2fa430d807e9c34f98e5bd2", "version_major": 2, "version_minor": 0}, "text/plain": ["Testing: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"name": "stderr", "output_type": "stream", "text": ["LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n"]}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "983722707bb64460bfbdc38056f7d32d", "version_major": 2, "version_minor": 0}, "text/plain": ["Testing: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"name": "stderr", "output_type": "stream", "text": ["LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n"]}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "ab0dc6637c5348a9839eded7ec182961", "version_major": 2, "version_minor": 0}, "text/plain": ["Testing: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}], "source": ["anomaly_model, anomaly_result = train_anomaly(\n", " input_dim=train_anom_dataset.img_feats.shape[-1],\n", " model_dim=256,\n", " num_heads=4,\n", " num_classes=1,\n", " num_layers=4,\n", " dropout=0.1,\n", " input_dropout=0.1,\n", " lr=5e-4,\n", " warmup=100,\n", ")"]}, {"cell_type": "markdown", "id": "b752953a", "metadata": {"papermill": {"duration": 0.212151, 
"end_time": "2021-12-04T15:59:26.177915", "exception": false, "start_time": "2021-12-04T15:59:25.965764", "status": "completed"}, "tags": []}, "source": ["We can print the achieved accuracy below."]}, {"cell_type": "code", "execution_count": 37, "id": "0c9ae3d1", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:59:26.590345Z", "iopub.status.busy": "2021-12-04T15:59:26.589872Z", "iopub.status.idle": "2021-12-04T15:59:26.592352Z", "shell.execute_reply": "2021-12-04T15:59:26.591950Z"}, "papermill": {"duration": 0.211453, "end_time": "2021-12-04T15:59:26.592461", "exception": false, "start_time": "2021-12-04T15:59:26.381008", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Train accuracy: 96.33%\n", "Val accuracy: 95.92%\n", "Test accuracy: 94.41%\n"]}], "source": ["print(\"Train accuracy: %4.2f%%\" % (100.0 * anomaly_result[\"train_acc\"]))\n", "print(\"Val accuracy: %4.2f%%\" % (100.0 * anomaly_result[\"val_acc\"]))\n", "print(\"Test accuracy: %4.2f%%\" % (100.0 * anomaly_result[\"test_acc\"]))"]}, {"cell_type": "markdown", "id": "93d2718b", "metadata": {"papermill": {"duration": 0.201663, "end_time": "2021-12-04T15:59:26.995547", "exception": false, "start_time": "2021-12-04T15:59:26.793884", "status": "completed"}, "tags": []}, "source": ["With ~94% validation and test accuracy, the model generalizes quite well.\n", "It should be noted that you might see slightly different scores depending on what computer/device you are running this notebook.\n", "This is because despite setting the seed before generating the test dataset, it is not the same across platforms and numpy versions.\n", "Nevertheless, we can conclude that the model performs quite well and can solve the task for most sets.\n", "Before trying to interpret the model, let's verify that our model is permutation-equivariant,\n", "and assigns the same predictions for different permutations of the input set.\n", "For this, we sample a batch 
from the test set and run it through the model to obtain the probabilities."]}, {"cell_type": "code", "execution_count": 38, "id": "dccefbde", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:59:27.411424Z", "iopub.status.busy": "2021-12-04T15:59:27.410941Z", "iopub.status.idle": "2021-12-04T15:59:27.581026Z", "shell.execute_reply": "2021-12-04T15:59:27.581442Z"}, "papermill": {"duration": 0.381038, "end_time": "2021-12-04T15:59:27.581610", "exception": false, "start_time": "2021-12-04T15:59:27.200572", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Preds\n", " [2.7691365e-05 1.8979923e-05 1.7386470e-05 2.7843047e-05 1.6143023e-05\n", " 1.7020926e-05 5.7294892e-05 9.9977750e-01 2.1365197e-05 1.8681889e-05]\n", "Permuted preds\n", " [2.7691472e-05 1.8979976e-05 1.7386521e-05 2.7843154e-05 1.6143069e-05\n", " 1.7020990e-05 5.7295114e-05 9.9977750e-01 2.1365277e-05 1.8681943e-05]\n"]}], "source": ["inp_data, indices, labels = next(iter(test_anom_loader))\n", "inp_data = inp_data.to(device)\n", "\n", "anomaly_model.eval()\n", "\n", "with torch.no_grad():\n", " preds = anomaly_model.forward(inp_data, add_positional_encoding=False)\n", " preds = F.softmax(preds.squeeze(dim=-1), dim=-1)\n", "\n", " # Permut input data\n", " permut = np.random.permutation(inp_data.shape[1])\n", " perm_inp_data = inp_data[:, permut]\n", " perm_preds = anomaly_model.forward(perm_inp_data, add_positional_encoding=False)\n", " perm_preds = F.softmax(perm_preds.squeeze(dim=-1), dim=-1)\n", "\n", "assert (preds[:, permut] - perm_preds).abs().max() < 1e-5, \"Predictions are not permutation equivariant\"\n", "\n", "print(\"Preds\\n\", preds[0, permut].cpu().numpy())\n", "print(\"Permuted preds\\n\", perm_preds[0].cpu().numpy())"]}, {"cell_type": "markdown", "id": "e44810c4", "metadata": {"papermill": {"duration": 0.202216, "end_time": "2021-12-04T15:59:27.986209", "exception": false, "start_time": "2021-12-04T15:59:27.783993", 
"status": "completed"}, "tags": []}, "source": ["You can see that the predictions are almost exactly the same, and only differ because of slight numerical\n", "differences inside the network operation.\n", "\n", "To interpret the model a little more, we can plot the attention maps inside the model.\n", "This will give us an idea of what information the model is sharing/communicating between images,\n", "and what each head might represent.\n", "First, we need to extract the attention maps for the test batch above, and determine the discrete predictions for simplicity."]}, {"cell_type": "code", "execution_count": 39, "id": "a3aa3c54", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:59:28.404309Z", "iopub.status.busy": "2021-12-04T15:59:28.403839Z", "iopub.status.idle": "2021-12-04T15:59:28.411125Z", "shell.execute_reply": "2021-12-04T15:59:28.410728Z"}, "papermill": {"duration": 0.214883, "end_time": "2021-12-04T15:59:28.411233", "exception": false, "start_time": "2021-12-04T15:59:28.196350", "status": "completed"}, "tags": []}, "outputs": [], "source": ["attention_maps = anomaly_model.get_attention_maps(inp_data, add_positional_encoding=False)\n", "predictions = preds.argmax(dim=-1)"]}, {"cell_type": "markdown", "id": "53fdeaca", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.203066, "end_time": "2021-12-04T15:59:28.821317", "exception": false, "start_time": "2021-12-04T15:59:28.618251", "status": "completed"}, "tags": []}, "source": ["Below we write a plot function which plots the images in the input set, the prediction of the model,\n", "and the attention maps of the different heads on layers of the transformer.\n", "Feel free to explore the attention maps for different input examples as well."]}, {"cell_type": "code", "execution_count": 40, "id": "73a6c7b3", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:59:29.243841Z", "iopub.status.busy": "2021-12-04T15:59:29.243370Z", "iopub.status.idle": 
"2021-12-04T15:59:32.280160Z", "shell.execute_reply": "2021-12-04T15:59:32.280550Z"}, "papermill": {"duration": 3.254644, "end_time": "2021-12-04T15:59:32.280702", "exception": false, "start_time": "2021-12-04T15:59:29.026058", "status": "completed"}, "tags": []}, "outputs": [{"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-12-04T16:59:29.364891\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}, {"name": "stdout", "output_type": "stream", "text": ["Prediction: 9\n"]}, {"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-12-04T16:59:30.887739\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}], "source": ["def visualize_prediction(idx):\n", " visualize_exmp(indices[idx : idx + 1], test_set)\n", " print(\"Prediction:\", predictions[idx].item())\n", " plot_attention_maps(input_data=None, attn_maps=attention_maps, idx=idx)\n", "\n", "\n", "visualize_prediction(0)"]}, {"cell_type": "markdown", "id": "c342c0bd", "metadata": {"papermill": {"duration": 0.217865, "end_time": "2021-12-04T15:59:32.717940", "exception": false, "start_time": "2021-12-04T15:59:32.500075", "status": "completed"}, "tags": []}, "source": ["Depending on the random seed, you might see a slightly different input set.\n", "For the version on the website, we compare 9 tree images with a volcano.\n", "We see that multiple heads, for instance, Layer 2 Head 1, Layer 2 Head 3, and Layer 3 Head 1 focus on the last image.\n", "Additionally, the heads in Layer 4 all seem to ignore the last image and assign a very low attention probability to it.\n", "This shows that the model has indeed recognized that the image doesn't fit the setting, and hence predicted it to be the anomaly.\n", "Layer 3 Heads 2-4 seem to take a slightly weighted average of all images.\n", "That might indicate that the model extracts the \"average\" information of all images, to compare it to the image features themselves.\n", "\n", "Let's try to find where the model actually makes a mistake.\n", "We can do this by identifying the sets where the model predicts something other than 9, as in the dataset,\n", "we ensured that the anomaly is always at the last position in the set."]}, {"cell_type": "code", "execution_count": 41, "id": "7d06d854", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:59:33.159783Z", "iopub.status.busy": "2021-12-04T15:59:33.159310Z", "iopub.status.idle": "2021-12-04T15:59:33.162672Z", "shell.execute_reply": "2021-12-04T15:59:33.162185Z"}, "papermill": {"duration": 0.227646, "end_time": "2021-12-04T15:59:33.162786", 
"exception": false, "start_time": "2021-12-04T15:59:32.935140", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Indices with mistake: [49]\n"]}], "source": ["mistakes = torch.where(predictions != 9)[0].cpu().numpy()\n", "print(\"Indices with mistake:\", mistakes)"]}, {"cell_type": "markdown", "id": "20752dd7", "metadata": {"papermill": {"duration": 0.217506, "end_time": "2021-12-04T15:59:33.599090", "exception": false, "start_time": "2021-12-04T15:59:33.381584", "status": "completed"}, "tags": []}, "source": ["As our model achieves ~94% accuracy, we only have very little number of mistakes in a batch of 64 sets.\n", "Still, let's visualize one of them, for example the last one:"]}, {"cell_type": "code", "execution_count": 42, "id": "aff3ca25", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T15:59:34.041610Z", "iopub.status.busy": "2021-12-04T15:59:34.041142Z", "iopub.status.idle": "2021-12-04T15:59:36.836836Z", "shell.execute_reply": "2021-12-04T15:59:36.836406Z"}, "papermill": {"duration": 3.018115, "end_time": "2021-12-04T15:59:36.836962", "exception": false, "start_time": "2021-12-04T15:59:33.818847", "status": "completed"}, "tags": []}, "outputs": [{"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-12-04T16:59:34.151133\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], 
"text/plain": ["
"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}, {"name": "stdout", "output_type": "stream", "text": ["Prediction: 7\n"]}, {"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-12-04T16:59:35.443130\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}, {"name": "stdout", "output_type": "stream", "text": ["Probabilities:\n", "Image 0: 0.07%\n", "Image 1: 0.11%\n", "Image 2: 0.07%\n", "Image 3: 0.11%\n", "Image 4: 0.17%\n", "Image 5: 23.27%\n", "Image 6: 0.16%\n", "Image 7: 48.91%\n", "Image 8: 0.10%\n", "Image 9: 27.03%\n"]}], "source": ["visualize_prediction(mistakes[-1])\n", "print(\"Probabilities:\")\n", "for i, p in enumerate(preds[mistakes[-1]].cpu().numpy()):\n", " print(\"Image %i: %4.2f%%\" % (i, 100.0 * p))"]}, {"cell_type": "markdown", "id": "fafec094", "metadata": {"papermill": {"duration": 0.236848, "end_time": "2021-12-04T15:59:37.319392", "exception": false, "start_time": "2021-12-04T15:59:37.082544", "status": "completed"}, "tags": []}, "source": ["In this example, the model confuses a palm tree with a building, giving a probability of ~90% to image 2, and 8% to the actual anomaly.\n", "However, the difficulty here is that the picture of the building has been taken at a similar angle as the palms.\n", "Meanwhile, image 2 shows a rather unusual palm with a different color palette, which is why the model fails here.\n", "Nevertheless, in general, the model performs quite well."]}, {"cell_type": "markdown", "id": "3ca49cba", "metadata": {"papermill": {"duration": 0.234811, "end_time": "2021-12-04T15:59:37.793046", "exception": false, "start_time": "2021-12-04T15:59:37.558235", "status": "completed"}, "tags": []}, "source": ["## Conclusion\n", "\n", "In this tutorial, we took a closer look at the Multi-Head Attention layer which uses a scaled dot product between\n", "queries and keys to find correlations and similarities between input elements.\n", "The Transformer architecture is based on the Multi-Head Attention layer and applies multiple of them in a ResNet-like block.\n", "The Transformer is a very important, recent architecture that can be applied to many tasks and datasets.\n", "Although it is best known for its 
success in NLP, there is so much more to it.\n", "We have seen its application on sequence-to-sequence tasks and set anomaly detection.\n", "Its property of being permutation-equivariant when no positional encodings are provided allows it to generalize to many settings.\n", "Hence, it is important to know the architecture, but also its possible issues such as the gradient problem during\n", "the first iterations solved by learning rate warm-up.\n", "If you are interested in continuing with the study of the Transformer architecture,\n", "please have a look at the blog posts listed at the beginning of the tutorial notebook."]}, {"cell_type": "markdown", "id": "88cdba30", "metadata": {"papermill": {"duration": 0.240818, "end_time": "2021-12-04T15:59:38.270965", "exception": false, "start_time": "2021-12-04T15:59:38.030147", "status": "completed"}, "tags": []}, "source": ["## Congratulations - Time to Join the Community!\n", "\n", "Congratulations on completing this notebook tutorial! If you enjoyed this and would like to join the Lightning\n", "movement, you can do so in the following ways!\n", "\n", "### Star [Lightning](https://github.com/PyTorchLightning/pytorch-lightning) on GitHub\n", "The easiest way to help our community is just by starring the GitHub repos! This helps raise awareness of the cool\n", "tools we're building.\n", "\n", "### Join our [Slack](https://join.slack.com/t/pytorch-lightning/shared_invite/zt-pw5v393p-qRaDgEk24~EjiZNBpSQFgQ)!\n", "The best way to keep up to date on the latest advancements is to join our community! Make sure to introduce yourself\n", "and share your interests in the `#general` channel.\n", "\n", "\n", "### Contributions !\n", "The best way to contribute to our community is to become a code contributor! 
At any time you can go to the\n", "[Lightning](https://github.com/PyTorchLightning/pytorch-lightning) or [Bolt](https://github.com/PyTorchLightning/lightning-bolts)\n", "GitHub Issues page and filter for \"good first issue\".\n", "\n", "* [Lightning good first issue](https://github.com/PyTorchLightning/pytorch-lightning/issues?q=is%3Aopen+is%3Aissue+label%3A%22good+first+issue%22)\n", "* [Bolt good first issue](https://github.com/PyTorchLightning/lightning-bolts/issues?q=is%3Aopen+is%3Aissue+label%3A%22good+first+issue%22)\n", "* You can also contribute your own notebooks with useful examples !\n", "\n", "### Great thanks from the entire PyTorch Lightning Team for your interest !\n", "\n", "[![PyTorch Lightning](){height=\"60px\" width=\"240px\"}](https://pytorchlightning.ai)"]}, {"cell_type": "raw", "metadata": {"raw_mimetype": "text/restructuredtext"}, "source": [".. customcarditem::\n", " :header: Tutorial 5: Transformers and Multi-Head Attention\n", " :card_description: In this tutorial, we will discuss one of the most impactful architectures of the last 2 years: the Transformer model. 
Since the paper Attention Is All You Need by Vaswani et...\n", " :tags: Text,GPU/TPU,UvA-DL-Course\n", " :image: _static/images/course_UvA-DL/05-transformers-and-MH-attention.jpg"]}], "metadata": {"jupytext": {"cell_metadata_filter": "id,colab,colab_type,-all", "formats": "ipynb,py:percent", "main_language": "python"}, "language_info": {"codemirror_mode": {"name": "ipython", "version": 3}, "file_extension": ".py", "mimetype": "text/x-python", "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.9.7"}, "papermill": {"default_parameters": {}, "duration": 100.878464, "end_time": "2021-12-04T15:59:39.519049", "environment_variables": {}, "exception": null, "input_path": "course_UvA-DL/05-transformers-and-MH-attention/Transformers_MHAttention.ipynb", "output_path": ".notebooks/course_UvA-DL/05-transformers-and-MH-attention.ipynb", "parameters": {}, "start_time": "2021-12-04T15:57:58.640585", "version": "2.3.3"}, "widgets": {"application/vnd.jupyter.widget-state+json": {"state": {"0b303c4195e64ef39fbeec6143263f98": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": 
null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "0b80c7deefb24e7ba07594e61433755d": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "0e657111ed994cd18ee73800d5175c7d": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, 
"grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "117e6a6b8bf847059db276d064c2b13e": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "13f1b84e24984ba0b79e6125f96f99f3": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": 
"StyleView", "description_width": ""}}, "169f7657723445bea5d0a4765d680159": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "178462769c7f44169c8ced0b55763811": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "236a5851e62d43d7b60a7d52dce28c1a": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", 
"_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_e3e6a9b6686f420f80e224eca063a19f", "IPY_MODEL_24d5d210a2b24f36a66613fa0ccb4233", "IPY_MODEL_e1bd4f10532642b8a15721a759eeb58b"], "layout": "IPY_MODEL_b49848bb32524b95a97c93ad92127987"}}, "24471f587ee94549b81ff8a94a6e0a78": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_512f768512c74743b343a6e8251d6ff1", "placeholder": "\u200b", "style": "IPY_MODEL_b7ff55f2178541fc99b01101431fd146", "value": " 79/79 [00:00<00:00, 147.56it/s]"}}, "248e84e3800948aaa5d4b99a97521525": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "24d5d210a2b24f36a66613fa0ccb4233": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_87fe3739fd654f94bc44066ccbb7f227", "max": 87306240.0, "min": 0.0, "orientation": "horizontal", "style": 
"IPY_MODEL_dd2bb7a927774638a5d1894442cb22b2", "value": 87306240.0}}, "29f9153bb21a44b487d35377cb438123": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "2b58bae07432436298a33aaaf21cd6e4": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "2bd4ea3a82024c858491e89acc4aa047": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "2ca1e45629ec4679a85bd781162d6b1c": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "2f853c9d6857487ea62b0226abe31f79": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], 
"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_178462769c7f44169c8ced0b55763811", "placeholder": "\u200b", "style": "IPY_MODEL_13f1b84e24984ba0b79e6125f96f99f3", "value": " 79/79 [00:05<00:00, 15.23it/s]"}}, "2f8d30ea351341eb8601ad7c4e38834c": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "301dc13411cd4b16957a001be48e9feb": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": 
null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "334865d5a9b24d738acc57ecf7793f00": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "336b58f1c17b4c2998f77978c46f92b2": {"model_module": "@jupyter-widgets/controls", 
"model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_b68f68938fb444f8bda9725eb32bac90", "IPY_MODEL_7aa0e6f3f2884d28b3ab91fbe177cdd1", "IPY_MODEL_5f2d0ce055ee405b923e0a374e5932c6"], "layout": "IPY_MODEL_e3bf53dac0194713bd220e0fe48fee33"}}, "344aba03213349f591500fe672e8afdf": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "35f58d761f794fdea716c3eeb2c6ec80": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, 
"_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_77e443eccd6342b989fbcb88945429d3", "placeholder": "\u200b", "style": "IPY_MODEL_a58d18832c084ab792d67eeb729c7635", "value": "100%"}}, "37ccf9ab76824da89ed0187799f2ea08": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "3a3f8db09b6d4cc5b53b747e2b7b9da6": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "3aa4aeee7b5f4eb5aee77dce65dcade9": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_35f58d761f794fdea716c3eeb2c6ec80", "IPY_MODEL_4fd7a34138db4283a966e6fb6a31b988", "IPY_MODEL_2f853c9d6857487ea62b0226abe31f79"], "layout": "IPY_MODEL_0e657111ed994cd18ee73800d5175c7d"}}, "3c5caa9157bc4baf9a570f8782e29475": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": 
"@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "4180b35ca339453686f92f651153f871": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_ce6b8e1c9e7346ff92a0fd9dd9816ef0", "placeholder": "\u200b", "style": "IPY_MODEL_2b58bae07432436298a33aaaf21cd6e4", "value": "Testing: 100%"}}, "45a9d84f4f2c4e7bb899ba0057f9745d": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_f48bac3019244c07803f84c2e6d95ea0", "max": 1.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_522def02fad0470a9d6abc40677772dc", "value": 1.0}}, "47a76bee08d74e2799d591493ecb37f2": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, 
"align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "4fd7a34138db4283a966e6fb6a31b988": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_b15347bd314048409dbc07933d388917", "max": 79.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_248e84e3800948aaa5d4b99a97521525", "value": 79.0}}, "4fe895cd281b4d2f91f744ffc6f1a0bd": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, 
"grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "5007ffc533144720b1d8aabfe6bc2ec6": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "508f4a8250ff41eab6f008a7094da94a": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "50e6daea1e294714a838e9a83f7f66ed": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": 
null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "512f768512c74743b343a6e8251d6ff1": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "522def02fad0470a9d6abc40677772dc": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": 
"@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "563fcf83e0ce41379f34ddca6f1339a0": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "575514ed749f42a997a2baa322b6efa5": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_d4079c1c7a0e419fb8aca46a9ecefa25", "placeholder": "\u200b", "style": "IPY_MODEL_7da963515d2c41e889a004ca662079e4", "value": " 79/79 [00:00<00:00, 288.13it/s]"}}, "5c105436e67d40e0b6da633b6a00ead8": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": 
null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "5f2d0ce055ee405b923e0a374e5932c6": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_d2f30746e64b4ebba654f67c9f23b32f", "placeholder": "\u200b", "style": "IPY_MODEL_bcf6aea6625647039795bd8c30585346", "value": " 391/391 [00:27<00:00, 14.99it/s]"}}, "60febcf280f34ad8849e28a112b83802": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": 
null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "65135f33d2c940b19ad2b625abb25376": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "6a189067bc0f406594c18d8e8f5640eb": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "71e812687f0749799bf97615573d22f9": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", 
"_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_50e6daea1e294714a838e9a83f7f66ed", "placeholder": "\u200b", "style": "IPY_MODEL_5007ffc533144720b1d8aabfe6bc2ec6", "value": ""}}, "73ef64d0e797442ab771d4e2728baaab": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "7428277b5ed04997b19990cc745ba65f": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": 
null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "767da7c44af140cdb3413c158988e913": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "77e443eccd6342b989fbcb88945429d3": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", 
"_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "7aa0e6f3f2884d28b3ab91fbe177cdd1": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_db005c58c17c46bc904b0e844c4c1dc8", "max": 391.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_e5dedb39aecd428ea3dd6d2e15dbb49d", "value": 391.0}}, "7c565ce6f14141dca6e213b4c0a463a0": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": 
null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "7da963515d2c41e889a004ca662079e4": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "7e7c9b0794174e2aaa68e3682517db1d": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_0b80c7deefb24e7ba07594e61433755d", "max": 1.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_8c3f67d4af6d4c9cae34014915f7cc58", "value": 1.0}}, "7f73079d25064959932573707f3e2c52": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": 
"@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "8474a73379874c7a9597a35a15c7e585": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_c8a127a3c7d8451f9a464af27ccec9b4", "max": 1.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_896c1b7cd27a4e46b437fdb3666edf55", "value": 1.0}}, "87fe3739fd654f94bc44066ccbb7f227": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": 
null, "right": null, "top": null, "visibility": null, "width": null}}, "896c1b7cd27a4e46b437fdb3666edf55": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "89c0145b83d34648bacf9da6ad15d74d": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_dd915efd78e44054a1826e4be665b035", "IPY_MODEL_8474a73379874c7a9597a35a15c7e585", "IPY_MODEL_575514ed749f42a997a2baa322b6efa5"], "layout": "IPY_MODEL_60febcf280f34ad8849e28a112b83802"}}, "8c3f67d4af6d4c9cae34014915f7cc58": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "983722707bb64460bfbdc38056f7d32d": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", 
"box_style": "", "children": ["IPY_MODEL_d83de3be21e04615a11e3659d3a83abc", "IPY_MODEL_7e7c9b0794174e2aaa68e3682517db1d", "IPY_MODEL_24471f587ee94549b81ff8a94a6e0a78"], "layout": "IPY_MODEL_334865d5a9b24d738acc57ecf7793f00"}}, "99532397f9914f338666889ca9cd1285": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "99f1cedd123941169dc16b83030bced1": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": 
null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "9c0f4106b2fa430d807e9c34f98e5bd2": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_f47589b9dfad41088d797c8ce2a9761a", "IPY_MODEL_d51b5e09340f4c24b51ac50bd1ef8c8f", "IPY_MODEL_cfc6b274acec498c870a3d5ef0252cf4"], "layout": "IPY_MODEL_65135f33d2c940b19ad2b625abb25376"}}, "9fe2ccea8542438f8b6f3adaf6a5e302": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "a58d18832c084ab792d67eeb729c7635": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, 
"aad913a268f3461a947ea946df80ce7d": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "ab0dc6637c5348a9839eded7ec182961": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_ce0141f331ad484189ed4500c2287b0d", "IPY_MODEL_aba0095cda6a462d94fe0e0979e1bd9a", "IPY_MODEL_c7741f8ad62e493a97a27ea1f32acc15"], "layout": "IPY_MODEL_0b303c4195e64ef39fbeec6143263f98"}}, "ab80d9dadcc34224ad525011c3a46c9f": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", 
"_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_117e6a6b8bf847059db276d064c2b13e", "max": 169001437.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_3c5caa9157bc4baf9a570f8782e29475", "value": 169001437.0}}, "aba0095cda6a462d94fe0e0979e1bd9a": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_47a76bee08d74e2799d591493ecb37f2", "max": 1.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_2bd4ea3a82024c858491e89acc4aa047", "value": 1.0}}, "b15347bd314048409dbc07933d388917": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": 
null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "b49848bb32524b95a97c93ad92127987": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "b68f68938fb444f8bda9725eb32bac90": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_344aba03213349f591500fe672e8afdf", "placeholder": "\u200b", "style": 
"IPY_MODEL_508f4a8250ff41eab6f008a7094da94a", "value": "100%"}}, "b7ff55f2178541fc99b01101431fd146": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "b9ed1cfedbeb4586bab29909930e47b1": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_4180b35ca339453686f92f651153f871", "IPY_MODEL_45a9d84f4f2c4e7bb899ba0057f9745d", "IPY_MODEL_d51f7aa60a654aae991f9b2ccd974311"], "layout": "IPY_MODEL_301dc13411cd4b16957a001be48e9feb"}}, "bacb5883fee34339abc34dd04428fd19": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, 
"max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "bcf6aea6625647039795bd8c30585346": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "c7741f8ad62e493a97a27ea1f32acc15": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_7428277b5ed04997b19990cc745ba65f", "placeholder": "\u200b", "style": "IPY_MODEL_2ca1e45629ec4679a85bd781162d6b1c", "value": " 157/157 [00:01<00:00, 163.00it/s]"}}, "c8a127a3c7d8451f9a464af27ccec9b4": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": 
null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "c9833783e4f24255a6dbfb6716d13e22": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "ce0141f331ad484189ed4500c2287b0d": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", 
"_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_767da7c44af140cdb3413c158988e913", "placeholder": "\u200b", "style": "IPY_MODEL_dc3260543b5f40d58b6b604961c71781", "value": "Testing: 100%"}}, "ce6b8e1c9e7346ff92a0fd9dd9816ef0": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "cfc6b274acec498c870a3d5ef0252cf4": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_c9833783e4f24255a6dbfb6716d13e22", "placeholder": "\u200b", "style": "IPY_MODEL_3a3f8db09b6d4cc5b53b747e2b7b9da6", "value": " 703/703 [00:03<00:00, 
197.32it/s]"}}, "d2f30746e64b4ebba654f67c9f23b32f": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "d4079c1c7a0e419fb8aca46a9ecefa25": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, 
"margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "d4443194a5e84e52a7f9e44f7e4d7e6b": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "d51b5e09340f4c24b51ac50bd1ef8c8f": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_7c565ce6f14141dca6e213b4c0a463a0", "max": 1.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_37ccf9ab76824da89ed0187799f2ea08", "value": 1.0}}, "d51f7aa60a654aae991f9b2ccd974311": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_2f8d30ea351341eb8601ad7c4e38834c", "placeholder": "\u200b", "style": "IPY_MODEL_d4443194a5e84e52a7f9e44f7e4d7e6b", 
"value": " 8/8 [00:00<00:00, 132.04it/s]"}}, "d83de3be21e04615a11e3659d3a83abc": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_aad913a268f3461a947ea946df80ce7d", "placeholder": "\u200b", "style": "IPY_MODEL_9fe2ccea8542438f8b6f3adaf6a5e302", "value": "Testing: 100%"}}, "db005c58c17c46bc904b0e844c4c1dc8": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "dc3260543b5f40d58b6b604961c71781": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": 
"@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "dd2bb7a927774638a5d1894442cb22b2": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "dd915efd78e44054a1826e4be665b035": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_bacb5883fee34339abc34dd04428fd19", "placeholder": "\u200b", "style": "IPY_MODEL_29f9153bb21a44b487d35377cb438123", "value": "Testing: 100%"}}, "e1bd4f10532642b8a15721a759eeb58b": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_73ef64d0e797442ab771d4e2728baaab", "placeholder": "\u200b", "style": "IPY_MODEL_7f73079d25064959932573707f3e2c52", "value": " 83.3M/83.3M [00:00<00:00, 116MB/s]"}}, "e3bf53dac0194713bd220e0fe48fee33": 
{"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "e3e6a9b6686f420f80e224eca063a19f": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_99f1cedd123941169dc16b83030bced1", "placeholder": "\u200b", "style": "IPY_MODEL_169f7657723445bea5d0a4765d680159", "value": "100%"}}, "e5dedb39aecd428ea3dd6d2e15dbb49d": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", 
"_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "efc763b5cd4e4ed9b3e3881bad434e2b": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_71e812687f0749799bf97615573d22f9", "IPY_MODEL_ab80d9dadcc34224ad525011c3a46c9f", "IPY_MODEL_f72acb891d864ee79f5d536286cc4667"], "layout": "IPY_MODEL_99532397f9914f338666889ca9cd1285"}}, "f47589b9dfad41088d797c8ce2a9761a": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_4fe895cd281b4d2f91f744ffc6f1a0bd", "placeholder": "\u200b", "style": "IPY_MODEL_6a189067bc0f406594c18d8e8f5640eb", "value": "Testing: 100%"}}, "f48bac3019244c07803f84c2e6d95ea0": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, 
"grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "f72acb891d864ee79f5d536286cc4667": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_5c105436e67d40e0b6da633b6a00ead8", "placeholder": "\u200b", "style": "IPY_MODEL_563fcf83e0ce41379f34ddca6f1339a0", "value": " 169001984/? 
[00:01<00:00, 103277285.22it/s]"}}}, "version_major": 2, "version_minor": 0}}}, "nbformat": 4, "nbformat_minor": 5} \ No newline at end of file diff --git a/source/notebooks/course_UvA-DL/06-graph-neural-networks.ipynb b/source/notebooks/course_UvA-DL/06-graph-neural-networks.ipynb deleted file mode 100644 index beccef6..0000000 --- a/source/notebooks/course_UvA-DL/06-graph-neural-networks.ipynb +++ /dev/null @@ -1 +0,0 @@ -{"cells": [{"cell_type": "markdown", "id": "c005cd13", "metadata": {"papermill": {"duration": 0.099647, "end_time": "2021-12-04T16:14:55.293606", "exception": false, "start_time": "2021-12-04T16:14:55.193959", "status": "completed"}, "tags": []}, "source": ["\n", "# Tutorial 6: Basics of Graph Neural Networks\n", "\n", "* **Author:** Phillip Lippe\n", "* **License:** CC BY-SA\n", "* **Generated:** 2021-12-04T16:52:52.769733\n", "\n", "In this tutorial, we will discuss the application of neural networks on graphs.\n", "Graph Neural Networks (GNNs) have recently gained increasing popularity in both applications and research,\n", "including domains such as social networks, knowledge graphs, recommender systems, and bioinformatics.\n", "While the theory and math behind GNNs might first seem complicated,\n", "the implementation of those models is quite simple and helps in understanding the methodology.\n", "Therefore, we will discuss the implementation of basic network layers of a GNN,\n", "namely graph convolutions, and attention layers.\n", "Finally, we will apply a GNN on semi-supervised node classification and molecule categorization.\n", "This notebook is part of a lecture series on Deep Learning at the University of Amsterdam.\n", "The full list of tutorials can be found at https://uvadlc-notebooks.rtfd.io.\n", "\n", "\n", "---\n", "Open in [![Open In Colab](){height=\"20px\" 
width=\"117px\"}](https://colab.research.google.com/github/PytorchLightning/lightning-tutorials/blob/publication/.notebooks/course_UvA-DL/06-graph-neural-networks.ipynb)\n", "\n", "Give us a \u2b50 [on Github](https://www.github.com/PytorchLightning/pytorch-lightning/)\n", "| Check out [the documentation](https://pytorch-lightning.readthedocs.io/en/latest/)\n", "| Join us [on Slack](https://join.slack.com/t/pytorch-lightning/shared_invite/zt-pw5v393p-qRaDgEk24~EjiZNBpSQFgQ)"]}, {"cell_type": "markdown", "id": "8f81ec41", "metadata": {"papermill": {"duration": 0.098016, "end_time": "2021-12-04T16:14:55.489441", "exception": false, "start_time": "2021-12-04T16:14:55.391425", "status": "completed"}, "tags": []}, "source": ["## Setup\n", "This notebook requires some packages besides pytorch-lightning."]}, {"cell_type": "code", "execution_count": 1, "id": "9f21578c", "metadata": {"colab": {}, "colab_type": "code", "execution": {"iopub.execute_input": "2021-12-04T16:14:55.691145Z", "iopub.status.busy": "2021-12-04T16:14:55.690666Z", "iopub.status.idle": "2021-12-04T16:14:58.205336Z", "shell.execute_reply": "2021-12-04T16:14:58.204782Z"}, "id": "LfrJLKPFyhsK", "lines_to_next_cell": 0, "papermill": {"duration": 2.618634, "end_time": "2021-12-04T16:14:58.205486", "exception": false, "start_time": "2021-12-04T16:14:55.586852", "status": "completed"}, "tags": []}, "outputs": [], "source": ["! pip install --quiet \"torch>=1.6, <1.9\" \"torch-sparse\" \"torch-cluster\" \"pytorch-lightning>=1.3\" \"torch-scatter\" \"torch-spline-conv\" \"torchmetrics>=0.3\" \"torch-geometric==2.0.2\""]}, {"cell_type": "markdown", "id": "5f4b1636", "metadata": {"papermill": {"duration": 0.097058, "end_time": "2021-12-04T16:14:58.401563", "exception": false, "start_time": "2021-12-04T16:14:58.304505", "status": "completed"}, "tags": []}, "source": ["
\n", "We start by importing our standard libraries below."]}, {"cell_type": "code", "execution_count": 2, "id": "1fa61214", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:14:58.603576Z", "iopub.status.busy": "2021-12-04T16:14:58.603090Z", "iopub.status.idle": "2021-12-04T16:15:00.563541Z", "shell.execute_reply": "2021-12-04T16:15:00.563928Z"}, "papermill": {"duration": 2.064677, "end_time": "2021-12-04T16:15:00.564089", "exception": false, "start_time": "2021-12-04T16:14:58.499412", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["Global seed set to 42\n"]}], "source": ["# Standard libraries\n", "import os\n", "\n", "# For downloading pre-trained models\n", "import urllib.request\n", "from urllib.error import HTTPError\n", "\n", "# PyTorch Lightning\n", "import pytorch_lightning as pl\n", "\n", "# PyTorch\n", "import torch\n", "import torch.nn as nn\n", "import torch.nn.functional as F\n", "import torch.optim as optim\n", "\n", "# PyTorch geometric\n", "import torch_geometric\n", "import torch_geometric.data as geom_data\n", "import torch_geometric.nn as geom_nn\n", "\n", "# PL callbacks\n", "from pytorch_lightning.callbacks import ModelCheckpoint\n", "\n", "AVAIL_GPUS = min(1, torch.cuda.device_count())\n", "BATCH_SIZE = 256 if AVAIL_GPUS else 64\n", "# Path to the folder where the datasets are/should be downloaded\n", "DATASET_PATH = os.environ.get(\"PATH_DATASETS\", \"data/\")\n", "# Path to the folder where the pretrained models are saved\n", "CHECKPOINT_PATH = os.environ.get(\"PATH_CHECKPOINT\", \"saved_models/GNNs/\")\n", "\n", "# Setting the seed\n", "pl.seed_everything(42)\n", "\n", "# Ensure that all operations are deterministic on GPU (if used) for reproducibility\n", "torch.backends.cudnn.determinstic = True\n", "torch.backends.cudnn.benchmark = False"]}, {"cell_type": "markdown", "id": "1a6c7487", "metadata": {"papermill": {"duration": 0.096843, "end_time": 
"2021-12-04T16:15:00.760797", "exception": false, "start_time": "2021-12-04T16:15:00.663954", "status": "completed"}, "tags": []}, "source": ["We also have a few pre-trained models we download below."]}, {"cell_type": "code", "execution_count": 3, "id": "e4661ab9", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:15:00.961509Z", "iopub.status.busy": "2021-12-04T16:15:00.961033Z", "iopub.status.idle": "2021-12-04T16:15:01.312867Z", "shell.execute_reply": "2021-12-04T16:15:01.312426Z"}, "papermill": {"duration": 0.455182, "end_time": "2021-12-04T16:15:01.313005", "exception": false, "start_time": "2021-12-04T16:15:00.857823", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Downloading https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial7/NodeLevelMLP.ckpt...\n", "Downloading https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial7/NodeLevelGNN.ckpt...\n", "Downloading https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial7/GraphLevelGraphConv.ckpt...\n"]}], "source": ["# Github URL where saved models are stored for this tutorial\n", "base_url = \"https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial7/\"\n", "# Files to download\n", "pretrained_files = [\"NodeLevelMLP.ckpt\", \"NodeLevelGNN.ckpt\", \"GraphLevelGraphConv.ckpt\"]\n", "\n", "# Create checkpoint path if it doesn't exist yet\n", "os.makedirs(CHECKPOINT_PATH, exist_ok=True)\n", "\n", "# For each file, check whether it already exists. 
If not, try downloading it.\n", "for file_name in pretrained_files:\n", " file_path = os.path.join(CHECKPOINT_PATH, file_name)\n", " if \"/\" in file_name:\n", " os.makedirs(file_path.rsplit(\"/\", 1)[0], exist_ok=True)\n", " if not os.path.isfile(file_path):\n", " file_url = base_url + file_name\n", " print(\"Downloading %s...\" % file_url)\n", " try:\n", " urllib.request.urlretrieve(file_url, file_path)\n", " except HTTPError as e:\n", " print(\n", " \"Something went wrong. Please try to download the file from the GDrive folder,\"\n", " \" or contact the author with the full output including the following error:\\n\",\n", " e,\n", " )"]}, {"cell_type": "markdown", "id": "2f0eab58", "metadata": {"papermill": {"duration": 0.097897, "end_time": "2021-12-04T16:15:01.509592", "exception": false, "start_time": "2021-12-04T16:15:01.411695", "status": "completed"}, "tags": []}, "source": ["## Graph Neural Networks"]}, {"cell_type": "markdown", "id": "3f505697", "metadata": {"papermill": {"duration": 0.102332, "end_time": "2021-12-04T16:15:01.708754", "exception": false, "start_time": "2021-12-04T16:15:01.606422", "status": "completed"}, "tags": []}, "source": ["### Graph representation\n", "\n", "Before starting the discussion of specific neural network operations on graphs, we should consider how to represent a graph.\n", "Mathematically, a graph $\\mathcal{G}$ is defined as a tuple of a set of nodes/vertices $V$, and a set of edges/links $E$: $\\mathcal{G}=(V,E)$.\n", "Each edge is a pair of two vertices, and represents a connection between them.\n", "For instance, let's look at the following graph:\n", "\n", "
\n", "\n", "The vertices are $V=\\{1,2,3,4\\}$, and edges $E=\\{(1,2), (2,3), (2,4), (3,4)\\}$.\n", "Note that for simplicity, we assume the graph to be undirected and hence don't add mirrored pairs like $(2,1)$.\n", "In application, vertices and edge can often have specific attributes, and edges can even be directed.\n", "The question is how we could represent this diversity in an efficient way for matrix operations.\n", "Usually, for the edges, we decide between two variants: an adjacency matrix, or a list of paired vertex indices.\n", "\n", "The **adjacency matrix** $A$ is a square matrix whose elements indicate whether pairs of vertices are adjacent,\n", "i.e. connected, or not.\n", "In the simplest case, $A_{ij}$ is 1 if there is a connection from node $i$ to $j$, and otherwise 0.\n", "If we have edge attributes or different categories of edges in a graph, this information can be added to the matrix as well.\n", "For an undirected graph, keep in mind that $A$ is a symmetric matrix ($A_{ij}=A_{ji}$).\n", "For the example graph above, we have the following adjacency matrix:\n", "\n", "$$\n", "A = \\begin{bmatrix}\n", " 0 & 1 & 0 & 0\\\\\n", " 1 & 0 & 1 & 1\\\\\n", " 0 & 1 & 0 & 1\\\\\n", " 0 & 1 & 1 & 0\n", "\\end{bmatrix}\n", "$$\n", "\n", "While expressing a graph as a list of edges is more efficient in terms of memory and (possibly) computation,\n", "using an adjacency matrix is more intuitive and simpler to implement.\n", "In our implementations below, we will rely on the adjacency matrix to keep the code simple.\n", "However, common libraries use edge lists, which we will discuss later more.\n", "Alternatively, we could also use the list of edges to define a sparse adjacency matrix with which we can work\n", "as if it was a dense matrix, but allows more memory-efficient operations.\n", "PyTorch supports this with the sub-package `torch.sparse`\n", "([documentation](https://pytorch.org/docs/stable/sparse.html)) which is however still in a beta-stage\n", 
"(API might change in future)."]}, {"cell_type": "markdown", "id": "9fea25df", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.097611, "end_time": "2021-12-04T16:15:01.904168", "exception": false, "start_time": "2021-12-04T16:15:01.806557", "status": "completed"}, "tags": []}, "source": ["### Graph Convolutions\n", "\n", "Graph Convolutional Networks have been introduced by [Kipf et al. ](https://openreview.net/pdf?id=SJU4ayYgl)\n", "in 2016 at the University of Amsterdam.\n", "He also wrote a great [blog post](https://tkipf.github.io/graph-convolutional-networks/) about this topic,\n", "which is recommended if you want to read about GCNs from a different perspective.\n", "GCNs are similar to convolutions in images in the sense that the \"filter\" parameters are typically shared over all locations in the graph.\n", "At the same time, GCNs rely on message passing methods, which means that vertices exchange information with the neighbors,\n", "and send \"messages\" to each other.\n", "Before looking at the math, we can try to visually understand how GCNs work.\n", "The first step is that each node creates a feature vector that represents the message it wants to send to all its neighbors.\n", "In the second step, the messages are sent to the neighbors, so that a node receives one message per adjacent node.\n", "Below we have visualized the two steps for our example graph.\n", "\n", "
\n", "\n", "If we want to formulate that in more mathematical terms, we need to first decide how to combine\n", "all the messages a node receives.\n", "As the number of messages vary across nodes, we need an operation that works for any number.\n", "Hence, the usual way to go is to sum or take the mean.\n", "Given the previous features of nodes $H^{(l)}$, the GCN layer is defined as follows:\n", "\n", "$$H^{(l+1)} = \\sigma\\left(\\hat{D}^{-1/2}\\hat{A}\\hat{D}^{-1/2}H^{(l)}W^{(l)}\\right)$$\n", "\n", "$W^{(l)}$ is the weight parameters with which we transform the input features into messages ($H^{(l)}W^{(l)}$).\n", "To the adjacency matrix $A$ we add the identity matrix so that each node sends its own message also to itself:\n", "$\\hat{A}=A+I$.\n", "Finally, to take the average instead of summing, we calculate the matrix $\\hat{D}$ which is a diagonal\n", "matrix with $D_{ii}$ denoting the number of neighbors node $i$ has.\n", "$\\sigma$ represents an arbitrary activation function, and not necessarily the sigmoid (usually a ReLU-based\n", "activation function is used in GNNs).\n", "\n", "When implementing the GCN layer in PyTorch, we can take advantage of the flexible operations on tensors.\n", "Instead of defining a matrix $\\hat{D}$, we can simply divide the summed messages by the number of neighbors afterward.\n", "Additionally, we replace the weight matrix with a linear layer, which additionally allows us to add a bias.\n", "Written as a PyTorch module, the GCN layer is defined as follows:"]}, {"cell_type": "code", "execution_count": 4, "id": "27e21d7b", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:15:02.104708Z", "iopub.status.busy": "2021-12-04T16:15:02.104230Z", "iopub.status.idle": "2021-12-04T16:15:02.106193Z", "shell.execute_reply": "2021-12-04T16:15:02.105814Z"}, "papermill": {"duration": 0.105512, "end_time": "2021-12-04T16:15:02.106302", "exception": false, "start_time": "2021-12-04T16:15:02.000790", "status": "completed"}, 
"tags": []}, "outputs": [], "source": ["class GCNLayer(nn.Module):\n", " def __init__(self, c_in, c_out):\n", " super().__init__()\n", " self.projection = nn.Linear(c_in, c_out)\n", "\n", " def forward(self, node_feats, adj_matrix):\n", " \"\"\"\n", " Args:\n", " node_feats: Tensor with node features of shape [batch_size, num_nodes, c_in]\n", " adj_matrix: Batch of adjacency matrices of the graph. If there is an edge from i to j,\n", " adj_matrix[b,i,j]=1 else 0. Supports directed edges by non-symmetric matrices.\n", " Assumes to already have added the identity connections.\n", " Shape: [batch_size, num_nodes, num_nodes]\n", " \"\"\"\n", " # Num neighbours = number of incoming edges\n", " num_neighbours = adj_matrix.sum(dim=-1, keepdims=True)\n", " node_feats = self.projection(node_feats)\n", " node_feats = torch.bmm(adj_matrix, node_feats)\n", " node_feats = node_feats / num_neighbours\n", " return node_feats"]}, {"cell_type": "markdown", "id": "e0c30193", "metadata": {"papermill": {"duration": 0.097045, "end_time": "2021-12-04T16:15:02.300782", "exception": false, "start_time": "2021-12-04T16:15:02.203737", "status": "completed"}, "tags": []}, "source": ["To further understand the GCN layer, we can apply it to our example graph above.\n", "First, let's specify some node features and the adjacency matrix with added self-connections:"]}, {"cell_type": "code", "execution_count": 5, "id": "1a809047", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:15:02.499953Z", "iopub.status.busy": "2021-12-04T16:15:02.499486Z", "iopub.status.idle": "2021-12-04T16:15:02.504131Z", "shell.execute_reply": "2021-12-04T16:15:02.504506Z"}, "papermill": {"duration": 0.106672, "end_time": "2021-12-04T16:15:02.504629", "exception": false, "start_time": "2021-12-04T16:15:02.397957", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Node features:\n", " tensor([[[0., 1.],\n", " [2., 3.],\n", " [4., 5.],\n", " [6., 
7.]]])\n", "\n", "Adjacency matrix:\n", " tensor([[[1., 1., 0., 0.],\n", " [1., 1., 1., 1.],\n", " [0., 1., 1., 1.],\n", " [0., 1., 1., 1.]]])\n"]}], "source": ["node_feats = torch.arange(8, dtype=torch.float32).view(1, 4, 2)\n", "adj_matrix = torch.Tensor([[[1, 1, 0, 0], [1, 1, 1, 1], [0, 1, 1, 1], [0, 1, 1, 1]]])\n", "\n", "print(\"Node features:\\n\", node_feats)\n", "print(\"\\nAdjacency matrix:\\n\", adj_matrix)"]}, {"cell_type": "markdown", "id": "e83b46bb", "metadata": {"papermill": {"duration": 0.09825, "end_time": "2021-12-04T16:15:02.700721", "exception": false, "start_time": "2021-12-04T16:15:02.602471", "status": "completed"}, "tags": []}, "source": ["Next, let's apply a GCN layer to it.\n", "For simplicity, we initialize the linear weight matrix as an identity matrix so that the input features are equal to the messages.\n", "This makes it easier for us to verify the message passing operation."]}, {"cell_type": "code", "execution_count": 6, "id": "74912306", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:15:02.902678Z", "iopub.status.busy": "2021-12-04T16:15:02.902191Z", "iopub.status.idle": "2021-12-04T16:15:02.907793Z", "shell.execute_reply": "2021-12-04T16:15:02.907388Z"}, "papermill": {"duration": 0.108228, "end_time": "2021-12-04T16:15:02.907895", "exception": false, "start_time": "2021-12-04T16:15:02.799667", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Adjacency matrix tensor([[[1., 1., 0., 0.],\n", " [1., 1., 1., 1.],\n", " [0., 1., 1., 1.],\n", " [0., 1., 1., 1.]]])\n", "Input features tensor([[[0., 1.],\n", " [2., 3.],\n", " [4., 5.],\n", " [6., 7.]]])\n", "Output features tensor([[[1., 2.],\n", " [3., 4.],\n", " [4., 5.],\n", " [4., 5.]]])\n"]}], "source": ["layer = GCNLayer(c_in=2, c_out=2)\n", "layer.projection.weight.data = torch.Tensor([[1.0, 0.0], [0.0, 1.0]])\n", "layer.projection.bias.data = torch.Tensor([0.0, 0.0])\n", "\n", "with torch.no_grad():\n", " 
out_feats = layer(node_feats, adj_matrix)\n", "\n", "print(\"Adjacency matrix\", adj_matrix)\n", "print(\"Input features\", node_feats)\n", "print(\"Output features\", out_feats)"]}, {"cell_type": "markdown", "id": "e60f06b6", "metadata": {"papermill": {"duration": 0.100382, "end_time": "2021-12-04T16:15:03.107772", "exception": false, "start_time": "2021-12-04T16:15:03.007390", "status": "completed"}, "tags": []}, "source": ["As we can see, the first node's output values are the average of itself and the second node.\n", "Similarly, we can verify all other nodes.\n", "However, in a GNN, we would also want to allow feature exchange between nodes beyond its neighbors.\n", "This can be achieved by applying multiple GCN layers, which gives us the final layout of a GNN.\n", "The GNN can be build up by a sequence of GCN layers and non-linearities such as ReLU.\n", "For a visualization, see below (figure credit - [Thomas Kipf, 2016](https://tkipf.github.io/graph-convolutional-networks/)).\n", "\n", "
\n", "\n", "However, one issue we can see from looking at the example above is that the output features for nodes 3 and 4 are\n", "the same because they have the same adjacent nodes (including itself).\n", "Therefore, GCN layers can make the network forget node-specific information if we just take a mean over all messages.\n", "Multiple possible improvements have been proposed.\n", "While the simplest option might be using residual connections, the more common approach is to either weigh\n", "the self-connections higher or define a separate weight matrix for the self-connections.\n", "Alternatively, we can use a well-known concept: attention."]}, {"cell_type": "markdown", "id": "fcca2c46", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.098504, "end_time": "2021-12-04T16:15:03.308884", "exception": false, "start_time": "2021-12-04T16:15:03.210380", "status": "completed"}, "tags": []}, "source": ["### Graph Attention\n", "\n", "Attention describes a weighted average of multiple elements with the weights dynamically computed based on an input\n", "query and elements' keys (if you don't know what attention is, it is recommended to at least go through\n", "the very first section called [What is Attention?](https://uvadlc-notebooks.readthedocs.io/en/latest/tutorial_notebooks/tutorial6/Transformers_and_MHAttention.html#What-is-Attention?)).\n", "This concept can be similarly applied to graphs, one of such is the Graph Attention Network\n", "(called GAT, proposed by [Velickovic et al., 2017](https://arxiv.org/abs/1710.10903)).\n", "Similarly to the GCN, the graph attention layer creates a message for each node using a linear layer/weight matrix.\n", "For the attention part, it uses the message from the node itself as a query, and the messages to average as both\n", "keys and values (note that this also includes the message to itself).\n", "The score function $f_{attn}$ is implemented as a one-layer MLP which maps the query and key to a single value.\n", 
"The MLP looks as follows (figure credit - [Velickovic et al. ](https://arxiv.org/abs/1710.10903)):\n", "\n", "
\n", "\n", "$h_i$ and $h_j$ are the original features from node $i$ and $j$ respectively, and represent the messages\n", "of the layer with $\\mathbf{W}$ as weight matrix.\n", "$\\mathbf{a}$ is the weight matrix of the MLP, which has the shape $[1,2\\times d_{\\text{message}}]$,\n", "and $\\alpha_{ij}$ the final attention weight from node $i$ to $j$.\n", "The calculation can be described as follows:\n", "\n", "$$\\alpha_{ij} = \\frac{\\exp\\left(\\text{LeakyReLU}\\left(\\mathbf{a}\\left[\\mathbf{W}h_i||\\mathbf{W}h_j\\right]\\right)\\right)}{\\sum_{k\\in\\mathcal{N}_i} \\exp\\left(\\text{LeakyReLU}\\left(\\mathbf{a}\\left[\\mathbf{W}h_i||\\mathbf{W}h_k\\right]\\right)\\right)}$$\n", "\n", "The operator $||$ represents the concatenation, and $\\mathcal{N}_i$ the indices of the neighbors of node $i$.\n", "Note that in contrast to usual practice, we apply a non-linearity (here LeakyReLU) before the softmax over elements.\n", "Although it seems like a minor change at first, it is crucial for the attention to depend on the original input.\n", "Specifically, let's remove the non-linearity for a second, and try to simplify the expression:\n", "\n", "$$\n", "\\begin{split}\n", " \\alpha_{ij} & = \\frac{\\exp\\left(\\mathbf{a}\\left[\\mathbf{W}h_i||\\mathbf{W}h_j\\right]\\right)}{\\sum_{k\\in\\mathcal{N}_i} \\exp\\left(\\mathbf{a}\\left[\\mathbf{W}h_i||\\mathbf{W}h_k\\right]\\right)}\\\\[5pt]\n", " & = \\frac{\\exp\\left(\\mathbf{a}_{:,:d/2}\\mathbf{W}h_i+\\mathbf{a}_{:,d/2:}\\mathbf{W}h_j\\right)}{\\sum_{k\\in\\mathcal{N}_i} \\exp\\left(\\mathbf{a}_{:,:d/2}\\mathbf{W}h_i+\\mathbf{a}_{:,d/2:}\\mathbf{W}h_k\\right)}\\\\[5pt]\n", " & = \\frac{\\exp\\left(\\mathbf{a}_{:,:d/2}\\mathbf{W}h_i\\right)\\cdot\\exp\\left(\\mathbf{a}_{:,d/2:}\\mathbf{W}h_j\\right)}{\\sum_{k\\in\\mathcal{N}_i} \\exp\\left(\\mathbf{a}_{:,:d/2}\\mathbf{W}h_i\\right)\\cdot\\exp\\left(\\mathbf{a}_{:,d/2:}\\mathbf{W}h_k\\right)}\\\\[5pt]\n", " & = 
\\frac{\\exp\\left(\\mathbf{a}_{:,d/2:}\\mathbf{W}h_j\\right)}{\\sum_{k\\in\\mathcal{N}_i} \\exp\\left(\\mathbf{a}_{:,d/2:}\\mathbf{W}h_k\\right)}\\\\\n", "\\end{split}\n", "$$\n", "\n", "We can see that without the non-linearity, the attention term with $h_i$ actually cancels itself out,\n", "resulting in the attention being independent of the node itself.\n", "Hence, we would have the same issue as the GCN of creating the same output features for nodes with the same neighbors.\n", "This is why the LeakyReLU is crucial and adds some dependency on $h_i$ to the attention.\n", "\n", "Once we obtain all attention factors, we can calculate the output features for each node by performing\n", "the weighted average:\n", "\n", "$$h_i'=\\sigma\\left(\\sum_{j\\in\\mathcal{N}_i}\\alpha_{ij}\\mathbf{W}h_j\\right)$$\n", "\n", "$\\sigma$ is yet another non-linearity, as in the GCN layer.\n", "Visually, we can represent the full message passing in an attention layer as follows\n", "(figure credit - [Velickovic et al. ](https://arxiv.org/abs/1710.10903)):\n", "\n", "
\n", "\n", "To increase the expressiveness of the graph attention network, [Velickovic et al. ](https://arxiv.org/abs/1710.10903)\n", "proposed to extend it to multiple heads similar to the Multi-Head Attention block in Transformers.\n", "This results in $N$ attention layers being applied in parallel.\n", "In the image above, it is visualized as three different colors of arrows (green, blue, and purple)\n", "that are afterward concatenated.\n", "The average is only applied for the very final prediction layer in a network.\n", "\n", "After having discussed the graph attention layer in detail, we can implement it below:"]}, {"cell_type": "code", "execution_count": 7, "id": "a5cd3c11", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:15:03.518254Z", "iopub.status.busy": "2021-12-04T16:15:03.517760Z", "iopub.status.idle": "2021-12-04T16:15:03.519768Z", "shell.execute_reply": "2021-12-04T16:15:03.519389Z"}, "papermill": {"duration": 0.112404, "end_time": "2021-12-04T16:15:03.519875", "exception": false, "start_time": "2021-12-04T16:15:03.407471", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class GATLayer(nn.Module):\n", " def __init__(self, c_in, c_out, num_heads=1, concat_heads=True, alpha=0.2):\n", " \"\"\"\n", " Args:\n", " c_in: Dimensionality of input features\n", " c_out: Dimensionality of output features\n", " num_heads: Number of heads, i.e. attention mechanisms to apply in parallel. 
The\n", " output features are equally split up over the heads if concat_heads=True.\n", " concat_heads: If True, the output of the different heads is concatenated instead of averaged.\n", " alpha: Negative slope of the LeakyReLU activation.\n", " \"\"\"\n", " super().__init__()\n", " self.num_heads = num_heads\n", " self.concat_heads = concat_heads\n", " if self.concat_heads:\n", " assert c_out % num_heads == 0, \"Number of output features must be a multiple of the count of heads.\"\n", " c_out = c_out // num_heads\n", "\n", " # Sub-modules and parameters needed in the layer\n", " self.projection = nn.Linear(c_in, c_out * num_heads)\n", " self.a = nn.Parameter(torch.Tensor(num_heads, 2 * c_out)) # One per head\n", " self.leakyrelu = nn.LeakyReLU(alpha)\n", "\n", " # Initialization from the original implementation\n", " nn.init.xavier_uniform_(self.projection.weight.data, gain=1.414)\n", " nn.init.xavier_uniform_(self.a.data, gain=1.414)\n", "\n", " def forward(self, node_feats, adj_matrix, print_attn_probs=False):\n", " \"\"\"\n", " Args:\n", " node_feats: Input features of the node. Shape: [batch_size, c_in]\n", " adj_matrix: Adjacency matrix including self-connections. 
Shape: [batch_size, num_nodes, num_nodes]\n", " print_attn_probs: If True, the attention weights are printed during the forward pass\n", " (for debugging purposes)\n", " \"\"\"\n", " batch_size, num_nodes = node_feats.size(0), node_feats.size(1)\n", "\n", " # Apply linear layer and sort nodes by head\n", " node_feats = self.projection(node_feats)\n", " node_feats = node_feats.view(batch_size, num_nodes, self.num_heads, -1)\n", "\n", " # We need to calculate the attention logits for every edge in the adjacency matrix\n", " # Doing this on all possible combinations of nodes is very expensive\n", " # => Create a tensor of [W*h_i||W*h_j] with i and j being the indices of all edges\n", " # Returns indices where the adjacency matrix is not 0 => edges\n", " edges = adj_matrix.nonzero(as_tuple=False)\n", " node_feats_flat = node_feats.view(batch_size * num_nodes, self.num_heads, -1)\n", " edge_indices_row = edges[:, 0] * num_nodes + edges[:, 1]\n", " edge_indices_col = edges[:, 0] * num_nodes + edges[:, 2]\n", " a_input = torch.cat(\n", " [\n", " torch.index_select(input=node_feats_flat, index=edge_indices_row, dim=0),\n", " torch.index_select(input=node_feats_flat, index=edge_indices_col, dim=0),\n", " ],\n", " dim=-1,\n", " ) # Index select returns a tensor with node_feats_flat being indexed at the desired positions\n", "\n", " # Calculate attention MLP output (independent for each head)\n", " attn_logits = torch.einsum(\"bhc,hc->bh\", a_input, self.a)\n", " attn_logits = self.leakyrelu(attn_logits)\n", "\n", " # Map list of attention values back into a matrix\n", " attn_matrix = attn_logits.new_zeros(adj_matrix.shape + (self.num_heads,)).fill_(-9e15)\n", " attn_matrix[adj_matrix[..., None].repeat(1, 1, 1, self.num_heads) == 1] = attn_logits.reshape(-1)\n", "\n", " # Weighted average of attention\n", " attn_probs = F.softmax(attn_matrix, dim=2)\n", " if print_attn_probs:\n", " print(\"Attention probs\\n\", attn_probs.permute(0, 3, 1, 2))\n", " node_feats = 
torch.einsum(\"bijh,bjhc->bihc\", attn_probs, node_feats)\n", "\n", " # If heads should be concatenated, we can do this by reshaping. Otherwise, take mean\n", " if self.concat_heads:\n", " node_feats = node_feats.reshape(batch_size, num_nodes, -1)\n", " else:\n", " node_feats = node_feats.mean(dim=2)\n", "\n", " return node_feats"]}, {"cell_type": "markdown", "id": "653c0d4e", "metadata": {"papermill": {"duration": 0.098839, "end_time": "2021-12-04T16:15:03.718323", "exception": false, "start_time": "2021-12-04T16:15:03.619484", "status": "completed"}, "tags": []}, "source": ["Again, we can apply the graph attention layer on our example graph above to understand the dynamics better.\n", "As before, the input layer is initialized as an identity matrix, but we set $\\mathbf{a}$\n", "to be a vector of arbitrary numbers to obtain different attention values.\n", "We use two heads to show the parallel, independent attention mechanisms working in the layer."]}, {"cell_type": "code", "execution_count": 8, "id": "18b9b0b5", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:15:03.921969Z", "iopub.status.busy": "2021-12-04T16:15:03.921496Z", "iopub.status.idle": "2021-12-04T16:15:03.929280Z", "shell.execute_reply": "2021-12-04T16:15:03.928808Z"}, "papermill": {"duration": 0.111598, "end_time": "2021-12-04T16:15:03.929387", "exception": false, "start_time": "2021-12-04T16:15:03.817789", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Attention probs\n", " tensor([[[[0.3543, 0.6457, 0.0000, 0.0000],\n", " [0.1096, 0.1450, 0.2642, 0.4813],\n", " [0.0000, 0.1858, 0.2885, 0.5257],\n", " [0.0000, 0.2391, 0.2696, 0.4913]],\n", "\n", " [[0.5100, 0.4900, 0.0000, 0.0000],\n", " [0.2975, 0.2436, 0.2340, 0.2249],\n", " [0.0000, 0.3838, 0.3142, 0.3019],\n", " [0.0000, 0.4018, 0.3289, 0.2693]]]])\n", "Adjacency matrix tensor([[[1., 1., 0., 0.],\n", " [1., 1., 1., 1.],\n", " [0., 1., 1., 1.],\n", " [0., 1., 1., 1.]]])\n", 
"Input features tensor([[[0., 1.],\n", " [2., 3.],\n", " [4., 5.],\n", " [6., 7.]]])\n", "Output features tensor([[[1.2913, 1.9800],\n", " [4.2344, 3.7725],\n", " [4.6798, 4.8362],\n", " [4.5043, 4.7351]]])\n"]}], "source": ["layer = GATLayer(2, 2, num_heads=2)\n", "layer.projection.weight.data = torch.Tensor([[1.0, 0.0], [0.0, 1.0]])\n", "layer.projection.bias.data = torch.Tensor([0.0, 0.0])\n", "layer.a.data = torch.Tensor([[-0.2, 0.3], [0.1, -0.1]])\n", "\n", "with torch.no_grad():\n", " out_feats = layer(node_feats, adj_matrix, print_attn_probs=True)\n", "\n", "print(\"Adjacency matrix\", adj_matrix)\n", "print(\"Input features\", node_feats)\n", "print(\"Output features\", out_feats)"]}, {"cell_type": "markdown", "id": "fdec7a34", "metadata": {"papermill": {"duration": 0.09994, "end_time": "2021-12-04T16:15:04.129204", "exception": false, "start_time": "2021-12-04T16:15:04.029264", "status": "completed"}, "tags": []}, "source": ["We recommend that you try to calculate the attention matrix at least for one head and one node for yourself.\n", "The entries are 0 where there does not exist an edge between $i$ and $j$.\n", "For the others, we see a diverse set of attention probabilities.\n", "Moreover, the output features of node 3 and 4 are now different although they have the same neighbors."]}, {"cell_type": "markdown", "id": "d4ac3429", "metadata": {"papermill": {"duration": 0.099386, "end_time": "2021-12-04T16:15:04.328973", "exception": false, "start_time": "2021-12-04T16:15:04.229587", "status": "completed"}, "tags": []}, "source": ["## PyTorch Geometric\n", "\n", "We had mentioned before that implementing graph networks with adjacency matrix is simple and straight-forward\n", "but can be computationally expensive for large graphs.\n", "Many real-world graphs can reach over 200k nodes, for which adjacency matrix-based implementations fail.\n", "There are a lot of optimizations possible when implementing GNNs, and luckily, there exist packages that provide 
such layers.\n", "The most popular packages for PyTorch are [PyTorch Geometric](https://pytorch-geometric.readthedocs.io/en/latest/)\n", "and the [Deep Graph Library](https://www.dgl.ai/) (the latter being actually framework agnostic).\n", "Which one to use depends on the project you are planning to do and personal taste.\n", "In this tutorial, we will look at PyTorch Geometric as part of the PyTorch family.\n", "\n", "PyTorch Geometric provides us a set of common graph layers, including the GCN and GAT layer we implemented above.\n", "Additionally, similar to PyTorch's torchvision, it provides the common graph datasets and transformations\n", "on those to simplify training.\n", "Compared to our implementation above, PyTorch Geometric uses a list of index pairs to represent the edges.\n", "The details of this library will be explored further in our experiments.\n", "\n", "In our tasks below, we want to allow us to pick from a multitude of graph layers.\n", "Thus, we define again below a dictionary to access those using a string:"]}, {"cell_type": "code", "execution_count": 9, "id": "bef53fb6", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:15:04.539895Z", "iopub.status.busy": "2021-12-04T16:15:04.539244Z", "iopub.status.idle": "2021-12-04T16:15:04.541427Z", "shell.execute_reply": "2021-12-04T16:15:04.540961Z"}, "papermill": {"duration": 0.109903, "end_time": "2021-12-04T16:15:04.541533", "exception": false, "start_time": "2021-12-04T16:15:04.431630", "status": "completed"}, "tags": []}, "outputs": [], "source": ["gnn_layer_by_name = {\"GCN\": geom_nn.GCNConv, \"GAT\": geom_nn.GATConv, \"GraphConv\": geom_nn.GraphConv}"]}, {"cell_type": "markdown", "id": "b62d2986", "metadata": {"papermill": {"duration": 0.101051, "end_time": "2021-12-04T16:15:04.742512", "exception": false, "start_time": "2021-12-04T16:15:04.641461", "status": "completed"}, "tags": []}, "source": ["Additionally to GCN and GAT, we added the layer `geom_nn.GraphConv`\n", 
"([documentation](https://pytorch-geometric.readthedocs.io/en/latest/modules/nn.html#torch_geometric.nn.conv.GraphConv)).\n", "GraphConv is a GCN with a separate weight matrix for the self-connections.\n", "Mathematically, this would be:\n", "\n", "$$\n", "\\mathbf{x}_i^{(l+1)} = \\mathbf{W}^{(l + 1)}_1 \\mathbf{x}_i^{(l)} + \\mathbf{W}^{(\\ell + 1)}_2 \\sum_{j \\in \\mathcal{N}_i} \\mathbf{x}_j^{(l)}\n", "$$\n", "\n", "In this formula, the neighbor's messages are added instead of averaged.\n", "However, PyTorch Geometric provides the argument `aggr` to switch between summing, averaging, and max pooling."]}, {"cell_type": "markdown", "id": "cd5a3c9a", "metadata": {"papermill": {"duration": 0.100612, "end_time": "2021-12-04T16:15:04.943942", "exception": false, "start_time": "2021-12-04T16:15:04.843330", "status": "completed"}, "tags": []}, "source": ["## Experiments on graph structures\n", "\n", "
\n", "\n", "Tasks on graph-structured data can be grouped into three groups: node-level, edge-level and graph-level.\n", "The different levels describe on which level we want to perform classification/regression.\n", "We will discuss all three types in more detail below."]}, {"cell_type": "markdown", "id": "4231c6c6", "metadata": {"papermill": {"duration": 0.101137, "end_time": "2021-12-04T16:15:05.148024", "exception": false, "start_time": "2021-12-04T16:15:05.046887", "status": "completed"}, "tags": []}, "source": ["### Node-level tasks: Semi-supervised node classification\n", "\n", "Node-level tasks have the goal to classify nodes in a graph.\n", "Usually, we are given a single, large graph with >1000 nodes of which only a certain number are labeled.\n", "We learn to classify those labeled examples during training and try to generalize to the unlabeled nodes.\n", "\n", "A popular example that we will use in this tutorial is the Cora dataset, a citation network among papers.\n", "The Cora dataset consists of 2708 scientific publications with links between each other representing\n", "the citation of one paper by another.\n", "The task is to classify each publication into one of seven classes.\n", "Each publication is represented by a bag-of-words vector.\n", "This means that we have a vector of 1433 elements for each publication, where a 1 at feature $i$ indicates\n", "that the $i$-th word of a pre-defined dictionary is in the article.\n", "Binary bag-of-words representations are commonly used when we need very simple encodings,\n", "and already have an intuition of what words to expect in a network.\n", "There exist much better approaches, but we will leave this to the NLP courses to discuss.\n", "\n", "We will load the dataset below:"]}, {"cell_type": "code", "execution_count": 10, "id": "4805971d", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:15:05.356051Z", "iopub.status.busy": "2021-12-04T16:15:05.355583Z", "iopub.status.idle": 
"2021-12-04T16:15:06.678721Z", "shell.execute_reply": "2021-12-04T16:15:06.679111Z"}, "papermill": {"duration": 1.427385, "end_time": "2021-12-04T16:15:06.679294", "exception": false, "start_time": "2021-12-04T16:15:05.251909", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["Downloading https://github.com/kimiyoung/planetoid/raw/master/data/ind.cora.x\n", "Downloading https://github.com/kimiyoung/planetoid/raw/master/data/ind.cora.tx\n"]}, {"name": "stderr", "output_type": "stream", "text": ["Downloading https://github.com/kimiyoung/planetoid/raw/master/data/ind.cora.allx\n", "Downloading https://github.com/kimiyoung/planetoid/raw/master/data/ind.cora.y\n"]}, {"name": "stderr", "output_type": "stream", "text": ["Downloading https://github.com/kimiyoung/planetoid/raw/master/data/ind.cora.ty\n", "Downloading https://github.com/kimiyoung/planetoid/raw/master/data/ind.cora.ally\n"]}, {"name": "stderr", "output_type": "stream", "text": ["Downloading https://github.com/kimiyoung/planetoid/raw/master/data/ind.cora.graph\n", "Downloading https://github.com/kimiyoung/planetoid/raw/master/data/ind.cora.test.index\n"]}, {"name": "stderr", "output_type": "stream", "text": ["Processing...\n", "Done!\n"]}], "source": ["cora_dataset = torch_geometric.datasets.Planetoid(root=DATASET_PATH, name=\"Cora\")"]}, {"cell_type": "markdown", "id": "c922d88d", "metadata": {"papermill": {"duration": 0.105227, "end_time": "2021-12-04T16:15:06.889432", "exception": false, "start_time": "2021-12-04T16:15:06.784205", "status": "completed"}, "tags": []}, "source": ["Let's look at how PyTorch Geometric represents the graph data.\n", "Note that although we have a single graph, PyTorch Geometric returns a dataset for compatibility to other datasets."]}, {"cell_type": "code", "execution_count": 11, "id": "a89178e2", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:15:07.109728Z", "iopub.status.busy": "2021-12-04T16:15:07.109256Z", 
"iopub.status.idle": "2021-12-04T16:15:07.112556Z", "shell.execute_reply": "2021-12-04T16:15:07.112172Z"}, "papermill": {"duration": 0.11818, "end_time": "2021-12-04T16:15:07.112667", "exception": false, "start_time": "2021-12-04T16:15:06.994487", "status": "completed"}, "tags": []}, "outputs": [{"data": {"text/plain": ["Data(x=[2708, 1433], edge_index=[2, 10556], y=[2708], train_mask=[2708], val_mask=[2708], test_mask=[2708])"]}, "execution_count": 11, "metadata": {}, "output_type": "execute_result"}], "source": ["cora_dataset[0]"]}, {"cell_type": "markdown", "id": "fbb76b54", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.104743, "end_time": "2021-12-04T16:15:07.323421", "exception": false, "start_time": "2021-12-04T16:15:07.218678", "status": "completed"}, "tags": []}, "source": ["The graph is represented by a `Data` object\n", "([documentation](https://pytorch-geometric.readthedocs.io/en/latest/modules/data.html#torch_geometric.data.Data))\n", "which we can access as a standard Python namespace.\n", "The edge index tensor is the list of edges in the graph and contains the mirrored version of each edge for undirected graphs.\n", "The `train_mask`, `val_mask`, and `test_mask` are boolean masks that indicate which nodes we should use for training,\n", "validation, and testing.\n", "The `x` tensor is the feature tensor of our 2708 publications, and `y` the labels for all nodes.\n", "\n", "After having seen the data, we can implement a simple graph neural network.\n", "The GNN applies a sequence of graph layers (GCN, GAT, or GraphConv), ReLU as activation function,\n", "and dropout for regularization.\n", "See below for the specific implementation."]}, {"cell_type": "code", "execution_count": 12, "id": "9a909772", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:15:07.543303Z", "iopub.status.busy": "2021-12-04T16:15:07.542816Z", "iopub.status.idle": "2021-12-04T16:15:07.544744Z", "shell.execute_reply": 
"2021-12-04T16:15:07.544369Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 0.115163, "end_time": "2021-12-04T16:15:07.544851", "exception": false, "start_time": "2021-12-04T16:15:07.429688", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class GNNModel(nn.Module):\n", " def __init__(\n", " self,\n", " c_in,\n", " c_hidden,\n", " c_out,\n", " num_layers=2,\n", " layer_name=\"GCN\",\n", " dp_rate=0.1,\n", " **kwargs,\n", " ):\n", " \"\"\"\n", " Args:\n", " c_in: Dimension of input features\n", " c_hidden: Dimension of hidden features\n", " c_out: Dimension of the output features. Usually number of classes in classification\n", " num_layers: Number of \"hidden\" graph layers\n", " layer_name: String of the graph layer to use\n", " dp_rate: Dropout rate to apply throughout the network\n", " kwargs: Additional arguments for the graph layer (e.g. number of heads for GAT)\n", " \"\"\"\n", " super().__init__()\n", " gnn_layer = gnn_layer_by_name[layer_name]\n", "\n", " layers = []\n", " in_channels, out_channels = c_in, c_hidden\n", " for l_idx in range(num_layers - 1):\n", " layers += [\n", " gnn_layer(in_channels=in_channels, out_channels=out_channels, **kwargs),\n", " nn.ReLU(inplace=True),\n", " nn.Dropout(dp_rate),\n", " ]\n", " in_channels = c_hidden\n", " layers += [gnn_layer(in_channels=in_channels, out_channels=c_out, **kwargs)]\n", " self.layers = nn.ModuleList(layers)\n", "\n", " def forward(self, x, edge_index):\n", " \"\"\"\n", " Args:\n", " x: Input features per node\n", " edge_index: List of vertex index pairs representing the edges in the graph (PyTorch geometric notation)\n", " \"\"\"\n", " for layer in self.layers:\n", " # For graph layers, we need to add the \"edge_index\" tensor as additional input\n", " # All PyTorch Geometric graph layer inherit the class \"MessagePassing\", hence\n", " # we can simply check the class type.\n", " if isinstance(layer, geom_nn.MessagePassing):\n", " x = layer(x, edge_index)\n", " else:\n", " x = 
layer(x)\n", " return x"]}, {"cell_type": "markdown", "id": "5645bafd", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.104054, "end_time": "2021-12-04T16:15:07.753237", "exception": false, "start_time": "2021-12-04T16:15:07.649183", "status": "completed"}, "tags": []}, "source": ["Good practice in node-level tasks is to create an MLP baseline that is applied to each node independently.\n", "This way we can verify whether adding the graph information to the model indeed improves the prediction, or not.\n", "It might also be that the features per node are already expressive enough to clearly point towards a specific class.\n", "To check this, we implement a simple MLP below."]}, {"cell_type": "code", "execution_count": 13, "id": "089e96c6", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:15:07.969616Z", "iopub.status.busy": "2021-12-04T16:15:07.969143Z", "iopub.status.idle": "2021-12-04T16:15:07.971505Z", "shell.execute_reply": "2021-12-04T16:15:07.971032Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 0.113096, "end_time": "2021-12-04T16:15:07.971610", "exception": false, "start_time": "2021-12-04T16:15:07.858514", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class MLPModel(nn.Module):\n", " def __init__(self, c_in, c_hidden, c_out, num_layers=2, dp_rate=0.1):\n", " \"\"\"\n", " Args:\n", " c_in: Dimension of input features\n", " c_hidden: Dimension of hidden features\n", " c_out: Dimension of the output features. 
Usually number of classes in classification\n", " num_layers: Number of hidden layers\n", " dp_rate: Dropout rate to apply throughout the network\n", " \"\"\"\n", " super().__init__()\n", " layers = []\n", " in_channels, out_channels = c_in, c_hidden\n", " for l_idx in range(num_layers - 1):\n", " layers += [nn.Linear(in_channels, out_channels), nn.ReLU(inplace=True), nn.Dropout(dp_rate)]\n", " in_channels = c_hidden\n", " layers += [nn.Linear(in_channels, c_out)]\n", " self.layers = nn.Sequential(*layers)\n", "\n", " def forward(self, x, *args, **kwargs):\n", " \"\"\"\n", " Args:\n", " x: Input features per node\n", " \"\"\"\n", " return self.layers(x)"]}, {"cell_type": "markdown", "id": "b76ef536", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.104726, "end_time": "2021-12-04T16:15:08.181306", "exception": false, "start_time": "2021-12-04T16:15:08.076580", "status": "completed"}, "tags": []}, "source": ["Finally, we can merge the models into a PyTorch Lightning module which handles the training,\n", "validation, and testing for us."]}, {"cell_type": "code", "execution_count": 14, "id": "505b841a", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:15:08.400501Z", "iopub.status.busy": "2021-12-04T16:15:08.400021Z", "iopub.status.idle": "2021-12-04T16:15:08.402029Z", "shell.execute_reply": "2021-12-04T16:15:08.401651Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 0.116664, "end_time": "2021-12-04T16:15:08.402137", "exception": false, "start_time": "2021-12-04T16:15:08.285473", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class NodeLevelGNN(pl.LightningModule):\n", " def __init__(self, model_name, **model_kwargs):\n", " super().__init__()\n", " # Saving hyperparameters\n", " self.save_hyperparameters()\n", "\n", " if model_name == \"MLP\":\n", " self.model = MLPModel(**model_kwargs)\n", " else:\n", " self.model = GNNModel(**model_kwargs)\n", " self.loss_module = nn.CrossEntropyLoss()\n", "\n", " def 
forward(self, data, mode=\"train\"):\n", " x, edge_index = data.x, data.edge_index\n", " x = self.model(x, edge_index)\n", "\n", " # Only calculate the loss on the nodes corresponding to the mask\n", " if mode == \"train\":\n", " mask = data.train_mask\n", " elif mode == \"val\":\n", " mask = data.val_mask\n", " elif mode == \"test\":\n", " mask = data.test_mask\n", " else:\n", " assert False, \"Unknown forward mode: %s\" % mode\n", "\n", " loss = self.loss_module(x[mask], data.y[mask])\n", " acc = (x[mask].argmax(dim=-1) == data.y[mask]).sum().float() / mask.sum()\n", " return loss, acc\n", "\n", " def configure_optimizers(self):\n", " # We use SGD here, but Adam works as well\n", " optimizer = optim.SGD(self.parameters(), lr=0.1, momentum=0.9, weight_decay=2e-3)\n", " return optimizer\n", "\n", " def training_step(self, batch, batch_idx):\n", " loss, acc = self.forward(batch, mode=\"train\")\n", " self.log(\"train_loss\", loss)\n", " self.log(\"train_acc\", acc)\n", " return loss\n", "\n", " def validation_step(self, batch, batch_idx):\n", " _, acc = self.forward(batch, mode=\"val\")\n", " self.log(\"val_acc\", acc)\n", "\n", " def test_step(self, batch, batch_idx):\n", " _, acc = self.forward(batch, mode=\"test\")\n", " self.log(\"test_acc\", acc)"]}, {"cell_type": "markdown", "id": "ca73bf4a", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.106691, "end_time": "2021-12-04T16:15:08.614156", "exception": false, "start_time": "2021-12-04T16:15:08.507465", "status": "completed"}, "tags": []}, "source": ["Additionally to the Lightning module, we define a training function below.\n", "As we have a single graph, we use a batch size of 1 for the data loader and share the same data loader for the train,\n", "validation, and test set (the mask is picked inside the Lightning module).\n", "Besides, we set the argument `progress_bar_refresh_rate` to zero as it usually shows the progress per epoch,\n", "but an epoch only consists of a single step.\n", "If 
you have downloaded the pre-trained models in the beginning of the tutorial, we load those instead of training from scratch.\n", "Finally, we test the model and return the results."]}, {"cell_type": "code", "execution_count": 15, "id": "43920ae6", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:15:08.833594Z", "iopub.status.busy": "2021-12-04T16:15:08.833097Z", "iopub.status.idle": "2021-12-04T16:15:08.835277Z", "shell.execute_reply": "2021-12-04T16:15:08.834895Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 0.115214, "end_time": "2021-12-04T16:15:08.835384", "exception": false, "start_time": "2021-12-04T16:15:08.720170", "status": "completed"}, "tags": []}, "outputs": [], "source": ["def train_node_classifier(model_name, dataset, **model_kwargs):\n", " pl.seed_everything(42)\n", " node_data_loader = geom_data.DataLoader(dataset, batch_size=1)\n", "\n", " # Create a PyTorch Lightning trainer\n", " root_dir = os.path.join(CHECKPOINT_PATH, \"NodeLevel\" + model_name)\n", " os.makedirs(root_dir, exist_ok=True)\n", " trainer = pl.Trainer(\n", " default_root_dir=root_dir,\n", " callbacks=[ModelCheckpoint(save_weights_only=True, mode=\"max\", monitor=\"val_acc\")],\n", " gpus=AVAIL_GPUS,\n", " max_epochs=200,\n", " progress_bar_refresh_rate=0,\n", " ) # 0 because epoch size is 1\n", " trainer.logger._default_hp_metric = None # Optional logging argument that we don't need\n", "\n", " # Check whether pretrained model exists. 
If yes, load it and skip training\n", " pretrained_filename = os.path.join(CHECKPOINT_PATH, \"NodeLevel%s.ckpt\" % model_name)\n", " if os.path.isfile(pretrained_filename):\n", " print(\"Found pretrained model, loading...\")\n", " model = NodeLevelGNN.load_from_checkpoint(pretrained_filename)\n", " else:\n", " pl.seed_everything()\n", " model = NodeLevelGNN(\n", " model_name=model_name, c_in=dataset.num_node_features, c_out=dataset.num_classes, **model_kwargs\n", " )\n", " trainer.fit(model, node_data_loader, node_data_loader)\n", " model = NodeLevelGNN.load_from_checkpoint(trainer.checkpoint_callback.best_model_path)\n", "\n", " # Test best model on the test set\n", " test_result = trainer.test(model, test_dataloaders=node_data_loader, verbose=False)\n", " batch = next(iter(node_data_loader))\n", " batch = batch.to(model.device)\n", " _, train_acc = model.forward(batch, mode=\"train\")\n", " _, val_acc = model.forward(batch, mode=\"val\")\n", " result = {\"train\": train_acc, \"val\": val_acc, \"test\": test_result[0][\"test_acc\"]}\n", " return model, result"]}, {"cell_type": "markdown", "id": "b36ea590", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.104889, "end_time": "2021-12-04T16:15:09.046049", "exception": false, "start_time": "2021-12-04T16:15:08.941160", "status": "completed"}, "tags": []}, "source": ["Now, we can train our models. 
First, let's train the simple MLP:"]}, {"cell_type": "code", "execution_count": 16, "id": "ad9c97ab", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:15:09.261430Z", "iopub.status.busy": "2021-12-04T16:15:09.260757Z", "iopub.status.idle": "2021-12-04T16:15:09.262448Z", "shell.execute_reply": "2021-12-04T16:15:09.262843Z"}, "papermill": {"duration": 0.11123, "end_time": "2021-12-04T16:15:09.262970", "exception": false, "start_time": "2021-12-04T16:15:09.151740", "status": "completed"}, "tags": []}, "outputs": [], "source": ["# Small function for printing the test scores\n", "def print_results(result_dict):\n", " if \"train\" in result_dict:\n", " print(\"Train accuracy: %4.2f%%\" % (100.0 * result_dict[\"train\"]))\n", " if \"val\" in result_dict:\n", " print(\"Val accuracy: %4.2f%%\" % (100.0 * result_dict[\"val\"]))\n", " print(\"Test accuracy: %4.2f%%\" % (100.0 * result_dict[\"test\"]))"]}, {"cell_type": "code", "execution_count": 17, "id": "8bd3817a", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:15:09.478007Z", "iopub.status.busy": "2021-12-04T16:15:09.477544Z", "iopub.status.idle": "2021-12-04T16:15:13.025779Z", "shell.execute_reply": "2021-12-04T16:15:13.026163Z"}, "papermill": {"duration": 3.657601, "end_time": "2021-12-04T16:15:13.026329", "exception": false, "start_time": "2021-12-04T16:15:09.368728", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["Global seed set to 42\n"]}, {"name": "stderr", "output_type": "stream", "text": ["/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/torch_geometric/deprecation.py:13: UserWarning: 'data.DataLoader' is deprecated, use 'loader.DataLoader' instead\n", " warnings.warn(out)\n", "/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/pytorch_lightning/trainer/connectors/callback_connector.py:90: LightningDeprecationWarning: Setting `Trainer(progress_bar_refresh_rate=0)` is deprecated in v1.5 and will be 
removed in v1.7. Please pass `pytorch_lightning.callbacks.progress.TQDMProgressBar` with `refresh_rate` directly to the Trainer's `callbacks` argument instead. Or, to disable the progress bar pass `enable_progress_bar = False` to the Trainer.\n", " rank_zero_deprecation(\n", "GPU available: True, used: True\n"]}, {"name": "stderr", "output_type": "stream", "text": ["TPU available: False, using: 0 TPU cores\n"]}, {"name": "stderr", "output_type": "stream", "text": ["IPU available: False, using: 0 IPUs\n"]}, {"name": "stderr", "output_type": "stream", "text": ["/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/pytorch_lightning/trainer/trainer.py:901: LightningDeprecationWarning: `trainer.test(test_dataloaders)` is deprecated in v1.4 and will be removed in v1.6. Use `trainer.test(dataloaders)` instead.\n", " rank_zero_deprecation(\n", "LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Found pretrained model, loading...\n"]}, {"name": "stderr", "output_type": "stream", "text": ["Missing logger folder: saved_models/GNNs/NodeLevelMLP/lightning_logs\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Train accuracy: 97.14%\n", "Val accuracy: 54.60%\n", "Test accuracy: 60.60%\n"]}, {"name": "stderr", "output_type": "stream", "text": ["/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/pytorch_lightning/trainer/data_loading.py:111: UserWarning: The dataloader, test_dataloader 0, does not have many workers which may be a bottleneck. Consider increasing the value of the `num_workers` argument` (try 12 which is the number of cpus on this machine) in the `DataLoader` init to improve performance.\n", " rank_zero_warn(\n", "/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/pytorch_lightning/utilities/data.py:59: UserWarning: Trying to infer the `batch_size` from an ambiguous collection. The batch size we found is 1. 
To avoid any miscalculations, use `self.log(..., batch_size=batch_size)`.\n", " warning_cache.warn(\n"]}], "source": ["node_mlp_model, node_mlp_result = train_node_classifier(\n", " model_name=\"MLP\", dataset=cora_dataset, c_hidden=16, num_layers=2, dp_rate=0.1\n", ")\n", "\n", "print_results(node_mlp_result)"]}, {"cell_type": "markdown", "id": "31d6a6c3", "metadata": {"papermill": {"duration": 0.111534, "end_time": "2021-12-04T16:15:13.251810", "exception": false, "start_time": "2021-12-04T16:15:13.140276", "status": "completed"}, "tags": []}, "source": ["Although the MLP can overfit on the training dataset because of the high-dimensional input features,\n", "it does not perform too well on the test set.\n", "Let's see if we can beat this score with our graph networks:"]}, {"cell_type": "code", "execution_count": 18, "id": "cdfebd3f", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:15:13.479708Z", "iopub.status.busy": "2021-12-04T16:15:13.479240Z", "iopub.status.idle": "2021-12-04T16:15:13.518967Z", "shell.execute_reply": "2021-12-04T16:15:13.518494Z"}, "papermill": {"duration": 0.155618, "end_time": "2021-12-04T16:15:13.519222", "exception": false, "start_time": "2021-12-04T16:15:13.363604", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["Global seed set to 42\n"]}, {"name": "stderr", "output_type": "stream", "text": ["GPU available: True, used: True\n"]}, {"name": "stderr", "output_type": "stream", "text": ["TPU available: False, using: 0 TPU cores\n"]}, {"name": "stderr", "output_type": "stream", "text": ["IPU available: False, using: 0 IPUs\n"]}, {"name": "stderr", "output_type": "stream", "text": ["LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n"]}, {"name": "stderr", "output_type": "stream", "text": ["Missing logger folder: saved_models/GNNs/NodeLevelGNN/lightning_logs\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Found pretrained model, loading...\n", "Train accuracy: 
100.00%\n", "Val accuracy: 78.60%\n", "Test accuracy: 82.40%\n"]}], "source": ["node_gnn_model, node_gnn_result = train_node_classifier(\n", " model_name=\"GNN\", layer_name=\"GCN\", dataset=cora_dataset, c_hidden=16, num_layers=2, dp_rate=0.1\n", ")\n", "print_results(node_gnn_result)"]}, {"cell_type": "markdown", "id": "ad396406", "metadata": {"papermill": {"duration": 0.117918, "end_time": "2021-12-04T16:15:13.755461", "exception": false, "start_time": "2021-12-04T16:15:13.637543", "status": "completed"}, "tags": []}, "source": ["As we would have hoped for, the GNN model outperforms the MLP by quite a margin.\n", "This shows that using the graph information indeed improves our predictions and lets us generalize better.\n", "\n", "The hyperparameters in the model have been chosen to create a relatively small network.\n", "This is because the first layer with an input dimension of 1433 can be relatively expensive to perform for large graphs.\n", "In general, GNNs can become relatively expensive for very big graphs.\n", "This is why such GNNs either have a small hidden size or use a special batching strategy\n", "where we sample a connected subgraph of the big, original graph."]}, {"cell_type": "markdown", "id": "088207b7", "metadata": {"papermill": {"duration": 0.118156, "end_time": "2021-12-04T16:15:13.991933", "exception": false, "start_time": "2021-12-04T16:15:13.873777", "status": "completed"}, "tags": []}, "source": ["### Edge-level tasks: Link prediction\n", "\n", "In some applications, we might have to predict on an edge-level instead of node-level.\n", "The most common edge-level task in GNNs is link prediction.\n", "Link prediction means that given a graph, we want to predict whether there will be/should be an edge between two nodes or not.\n", "For example, in a social network, this is used by Facebook and co to propose new friends to you.\n", "Again, graph level information can be crucial to perform this task.\n", "The output prediction is usually done 
by performing a similarity metric on the pair of node features,\n", "which should be 1 if there should be a link, and otherwise close to 0.\n", "To keep the tutorial short, we will not implement this task ourselves.\n", "Nevertheless, there are many good resources out there if you are interested in looking closer at this task.\n", "Tutorials and papers for this topic include:\n", "\n", "* [PyTorch Geometric example](https://github.com/rusty1s/pytorch_geometric/blob/master/examples/link_pred.py)\n", "* [Graph Neural Networks: A Review of Methods and Applications](https://arxiv.org/pdf/1812.08434.pdf), Zhou et al.\n", "2019\n", "* [Link Prediction Based on Graph Neural Networks](https://papers.nips.cc/paper/2018/file/53f0d7c537d99b3824f0f99d62ea2428-Paper.pdf), Zhang and Chen, 2018."]}, {"cell_type": "markdown", "id": "dcf6a450", "metadata": {"papermill": {"duration": 0.116763, "end_time": "2021-12-04T16:15:14.228118", "exception": false, "start_time": "2021-12-04T16:15:14.111355", "status": "completed"}, "tags": []}, "source": ["### Graph-level tasks: Graph classification\n", "\n", "Finally, in this part of the tutorial, we will have a closer look at how to apply GNNs to the task of graph classification.\n", "The goal is to classify an entire graph instead of single nodes or edges.\n", "Therefore, we are also given a dataset of multiple graphs that we need to classify based on some structural graph properties.\n", "The most common task for graph classification is molecular property prediction, in which molecules are represented as graphs.\n", "Each atom is linked to a node, and edges in the graph are the bonds between atoms.\n", "For example, look at the figure below.\n", "\n", "
\n", "\n", "On the left, we have an arbitrary, small molecule with different atoms, whereas the right part of the image shows the graph representation.\n", "The atom types are abstracted as node features (e.g. a one-hot vector), and the different bond types are used as edge features.\n", "For simplicity, we will neglect the edge attributes in this tutorial, but you can include them by using methods like the\n", "[Relational Graph Convolution](https://arxiv.org/abs/1703.06103) that uses a different weight matrix for each edge type.\n", "\n", "The dataset we will use below is called the MUTAG dataset.\n", "It is a common small benchmark for graph classification algorithms, and contains 188 graphs with 18 nodes\n", "and 20 edges on average for each graph.\n", "The graph nodes have 7 different labels/atom types, and the binary graph labels represent \"their mutagenic effect\n", "on a specific gram negative bacterium\" (the specific meaning of the labels is not too important here).\n", "The dataset is part of a large collection of different graph classification datasets, known as the\n", "[TUDatasets](https://chrsmrrs.github.io/datasets/), which is directly accessible\n", "via `torch_geometric.datasets.TUDataset` ([documentation](https://pytorch-geometric.readthedocs.io/en/latest/modules/datasets.html#torch_geometric.datasets.TUDataset)) in PyTorch Geometric.\n", "We can load the dataset below."]}, {"cell_type": "code", "execution_count": 19, "id": "4438474b", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:15:14.467759Z", "iopub.status.busy": "2021-12-04T16:15:14.467292Z", "iopub.status.idle": "2021-12-04T16:15:15.161679Z", "shell.execute_reply": "2021-12-04T16:15:15.162066Z"}, "papermill": {"duration": 0.81606, "end_time": "2021-12-04T16:15:15.162230", "exception": false, "start_time": "2021-12-04T16:15:14.346170", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["Downloading 
https://www.chrsmrrs.com/graphkerneldatasets/MUTAG.zip\n"]}, {"name": "stderr", "output_type": "stream", "text": ["Extracting /__w/1/s/.datasets/MUTAG/MUTAG.zip\n", "Processing...\n", "Done!\n"]}], "source": ["tu_dataset = torch_geometric.datasets.TUDataset(root=DATASET_PATH, name=\"MUTAG\")"]}, {"cell_type": "markdown", "id": "c86832d3", "metadata": {"papermill": {"duration": 0.118059, "end_time": "2021-12-04T16:15:15.401214", "exception": false, "start_time": "2021-12-04T16:15:15.283155", "status": "completed"}, "tags": []}, "source": ["Let's look at some statistics for the dataset:"]}, {"cell_type": "code", "execution_count": 20, "id": "e45b7974", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:15:15.655613Z", "iopub.status.busy": "2021-12-04T16:15:15.655131Z", "iopub.status.idle": "2021-12-04T16:15:15.657630Z", "shell.execute_reply": "2021-12-04T16:15:15.658011Z"}, "papermill": {"duration": 0.125603, "end_time": "2021-12-04T16:15:15.658142", "exception": false, "start_time": "2021-12-04T16:15:15.532539", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Data object: Data(x=[3371, 7], edge_index=[2, 7442], edge_attr=[7442, 4], y=[188])\n", "Length: 188\n", "Average label: 0.66\n"]}], "source": ["print(\"Data object:\", tu_dataset.data)\n", "print(\"Length:\", len(tu_dataset))\n", "print(\"Average label: %4.2f\" % (tu_dataset.data.y.float().mean().item()))"]}, {"cell_type": "markdown", "id": "e0d230ba", "metadata": {"papermill": {"duration": 0.11992, "end_time": "2021-12-04T16:15:15.897420", "exception": false, "start_time": "2021-12-04T16:15:15.777500", "status": "completed"}, "tags": []}, "source": ["The first line shows how the dataset stores different graphs.\n", "The nodes, edges, and labels of each graph are concatenated to one tensor, and the dataset stores the indices\n", "where to split the tensors correspondingly.\n", "The length of the dataset is the number of graphs we have, and the 
\"average label\"\n", "denotes the percentage of the graph with label 1.\n", "As long as the percentage is in the range of 0.5, we have a relatively balanced dataset.\n", "It happens quite often that graph datasets are very imbalanced, hence checking the class balance\n", "is always a good thing to do.\n", "\n", "Next, we will split our dataset into a training and test part.\n", "Note that we do not use a validation set this time because of the small size of the dataset.\n", "Therefore, our model might overfit slightly on the validation set due to the noise of the evaluation,\n", "but we still get an estimate of the performance on untrained data."]}, {"cell_type": "code", "execution_count": 21, "id": "39a5c558", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:15:16.156484Z", "iopub.status.busy": "2021-12-04T16:15:16.156008Z", "iopub.status.idle": "2021-12-04T16:15:16.157556Z", "shell.execute_reply": "2021-12-04T16:15:16.157962Z"}, "papermill": {"duration": 0.129586, "end_time": "2021-12-04T16:15:16.158089", "exception": false, "start_time": "2021-12-04T16:15:16.028503", "status": "completed"}, "tags": []}, "outputs": [], "source": ["torch.manual_seed(42)\n", "tu_dataset.shuffle()\n", "train_dataset = tu_dataset[:150]\n", "test_dataset = tu_dataset[150:]"]}, {"cell_type": "markdown", "id": "11db2e62", "metadata": {"papermill": {"duration": 0.121176, "end_time": "2021-12-04T16:15:16.398733", "exception": false, "start_time": "2021-12-04T16:15:16.277557", "status": "completed"}, "tags": []}, "source": ["When using a data loader, we encounter a problem with batching $N$ graphs.\n", "Each graph in the batch can have a different number of nodes and edges, and hence we would require a lot of padding to obtain a single tensor.\n", "Torch geometric uses a different, more efficient approach: we can view the $N$ graphs in a batch as a single large graph with concatenated node and edge list.\n", "As there is no edge between the $N$ graphs, running GNN layers 
on the large graph gives us the same output as running the GNN on each graph separately.\n", "This batching strategy is visualized below (figure credit - PyTorch Geometric team,\n", "[tutorial here](https://colab.research.google.com/drive/1I8a0DfQ3fI7Njc62__mVXUlcAleUclnb)).\n", "\n", "
\n", "\n", "The adjacency matrix is zero for any nodes that come from two different graphs, and otherwise according to the adjacency matrix of the individual graph.\n", "Luckily, this strategy is already implemented in torch geometric, and hence we can use the corresponding data loader:"]}, {"cell_type": "code", "execution_count": 22, "id": "5bb78c6b", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:15:16.644269Z", "iopub.status.busy": "2021-12-04T16:15:16.643796Z", "iopub.status.idle": "2021-12-04T16:15:16.645405Z", "shell.execute_reply": "2021-12-04T16:15:16.645784Z"}, "papermill": {"duration": 0.12704, "end_time": "2021-12-04T16:15:16.645907", "exception": false, "start_time": "2021-12-04T16:15:16.518867", "status": "completed"}, "tags": []}, "outputs": [], "source": ["graph_train_loader = geom_data.DataLoader(train_dataset, batch_size=BATCH_SIZE, shuffle=True)\n", "graph_val_loader = geom_data.DataLoader(test_dataset, batch_size=BATCH_SIZE) # Additional loader for a larger datasets\n", "graph_test_loader = geom_data.DataLoader(test_dataset, batch_size=BATCH_SIZE)"]}, {"cell_type": "markdown", "id": "2146847f", "metadata": {"papermill": {"duration": 0.121317, "end_time": "2021-12-04T16:15:16.886556", "exception": false, "start_time": "2021-12-04T16:15:16.765239", "status": "completed"}, "tags": []}, "source": ["Let's load a batch below to see the batching in action:"]}, {"cell_type": "code", "execution_count": 23, "id": "6bc7f675", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:15:17.130695Z", "iopub.status.busy": "2021-12-04T16:15:17.130205Z", "iopub.status.idle": "2021-12-04T16:15:17.140406Z", "shell.execute_reply": "2021-12-04T16:15:17.139998Z"}, "papermill": {"duration": 0.134013, "end_time": "2021-12-04T16:15:17.140515", "exception": false, "start_time": "2021-12-04T16:15:17.006502", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Batch: DataBatch(edge_index=[2, 1512], 
x=[687, 7], edge_attr=[1512, 4], y=[38], batch=[687], ptr=[39])\n", "Labels: tensor([1, 1, 1, 0, 0, 0, 1, 1, 1, 0])\n", "Batch indices: tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,\n", " 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 2, 2, 2, 2, 2, 2])\n"]}], "source": ["batch = next(iter(graph_test_loader))\n", "print(\"Batch:\", batch)\n", "print(\"Labels:\", batch.y[:10])\n", "print(\"Batch indices:\", batch.batch[:40])"]}, {"cell_type": "markdown", "id": "28b5c41f", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.119685, "end_time": "2021-12-04T16:15:17.380797", "exception": false, "start_time": "2021-12-04T16:15:17.261112", "status": "completed"}, "tags": []}, "source": ["We have 38 graphs stacked together for the test dataset.\n", "The batch indices, stored in `batch`, show that the first 12 nodes belong to the first graph,\n", "the next 22 to the second graph, and so on.\n", "These indices are important for performing the final prediction.\n", "To perform a prediction over a whole graph, we usually perform a pooling operation over all nodes after running the GNN model.\n", "In this case, we will use the average pooling.\n", "Hence, we need to know which nodes should be included in which average pool.\n", "Using this pooling, we can already create our graph network below.\n", "Specifically, we re-use our class `GNNModel` from before,\n", "and simply add an average pool and single linear layer for the graph prediction task."]}, {"cell_type": "code", "execution_count": 24, "id": "1c7e611b", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:15:17.629106Z", "iopub.status.busy": "2021-12-04T16:15:17.628629Z", "iopub.status.idle": "2021-12-04T16:15:17.630171Z", "shell.execute_reply": "2021-12-04T16:15:17.630568Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 0.127887, "end_time": "2021-12-04T16:15:17.630712", "exception": false, "start_time": "2021-12-04T16:15:17.502825", "status": "completed"}, "tags": []}, 
"outputs": [], "source": ["class GraphGNNModel(nn.Module):\n", " def __init__(self, c_in, c_hidden, c_out, dp_rate_linear=0.5, **kwargs):\n", " \"\"\"\n", " Args:\n", " c_in: Dimension of input features\n", " c_hidden: Dimension of hidden features\n", " c_out: Dimension of output features (usually number of classes)\n", " dp_rate_linear: Dropout rate before the linear layer (usually much higher than inside the GNN)\n", " kwargs: Additional arguments for the GNNModel object\n", " \"\"\"\n", " super().__init__()\n", " self.GNN = GNNModel(c_in=c_in, c_hidden=c_hidden, c_out=c_hidden, **kwargs) # Not our prediction output yet!\n", " self.head = nn.Sequential(nn.Dropout(dp_rate_linear), nn.Linear(c_hidden, c_out))\n", "\n", " def forward(self, x, edge_index, batch_idx):\n", " \"\"\"\n", " Args:\n", " x: Input features per node\n", " edge_index: List of vertex index pairs representing the edges in the graph (PyTorch geometric notation)\n", " batch_idx: Index of batch element for each node\n", " \"\"\"\n", " x = self.GNN(x, edge_index)\n", " x = geom_nn.global_mean_pool(x, batch_idx) # Average pooling\n", " x = self.head(x)\n", " return x"]}, {"cell_type": "markdown", "id": "99675752", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.119943, "end_time": "2021-12-04T16:15:17.871766", "exception": false, "start_time": "2021-12-04T16:15:17.751823", "status": "completed"}, "tags": []}, "source": ["Finally, we can create a PyTorch Lightning module to handle the training.\n", "It is similar to the modules we have seen before and does nothing surprising in terms of training.\n", "As we have a binary classification task, we use the Binary Cross Entropy loss."]}, {"cell_type": "code", "execution_count": 25, "id": "f954ef0e", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:15:18.121084Z", "iopub.status.busy": "2021-12-04T16:15:18.120606Z", "iopub.status.idle": "2021-12-04T16:15:18.122171Z", "shell.execute_reply": "2021-12-04T16:15:18.122544Z"}, 
"lines_to_next_cell": 2, "papermill": {"duration": 0.131105, "end_time": "2021-12-04T16:15:18.122688", "exception": false, "start_time": "2021-12-04T16:15:17.991583", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class GraphLevelGNN(pl.LightningModule):\n", " def __init__(self, **model_kwargs):\n", " super().__init__()\n", " # Saving hyperparameters\n", " self.save_hyperparameters()\n", "\n", " self.model = GraphGNNModel(**model_kwargs)\n", " self.loss_module = nn.BCEWithLogitsLoss() if self.hparams.c_out == 1 else nn.CrossEntropyLoss()\n", "\n", " def forward(self, data, mode=\"train\"):\n", " x, edge_index, batch_idx = data.x, data.edge_index, data.batch\n", " x = self.model(x, edge_index, batch_idx)\n", " x = x.squeeze(dim=-1)\n", "\n", " if self.hparams.c_out == 1:\n", " preds = (x > 0).float()\n", " data.y = data.y.float()\n", " else:\n", " preds = x.argmax(dim=-1)\n", " loss = self.loss_module(x, data.y)\n", " acc = (preds == data.y).sum().float() / preds.shape[0]\n", " return loss, acc\n", "\n", " def configure_optimizers(self):\n", " # High lr because of small dataset and small model\n", " optimizer = optim.AdamW(self.parameters(), lr=1e-2, weight_decay=0.0)\n", " return optimizer\n", "\n", " def training_step(self, batch, batch_idx):\n", " loss, acc = self.forward(batch, mode=\"train\")\n", " self.log(\"train_loss\", loss)\n", " self.log(\"train_acc\", acc)\n", " return loss\n", "\n", " def validation_step(self, batch, batch_idx):\n", " _, acc = self.forward(batch, mode=\"val\")\n", " self.log(\"val_acc\", acc)\n", "\n", " def test_step(self, batch, batch_idx):\n", " _, acc = self.forward(batch, mode=\"test\")\n", " self.log(\"test_acc\", acc)"]}, {"cell_type": "markdown", "id": "c09f6bca", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.120516, "end_time": "2021-12-04T16:15:18.365106", "exception": false, "start_time": "2021-12-04T16:15:18.244590", "status": "completed"}, "tags": []}, "source": ["Below we train the 
model on our dataset. It resembles the typical training functions we have seen so far."]}, {"cell_type": "code", "execution_count": 26, "id": "48f499d3", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:15:18.612530Z", "iopub.status.busy": "2021-12-04T16:15:18.612053Z", "iopub.status.idle": "2021-12-04T16:15:18.614039Z", "shell.execute_reply": "2021-12-04T16:15:18.613578Z"}, "papermill": {"duration": 0.128866, "end_time": "2021-12-04T16:15:18.614142", "exception": false, "start_time": "2021-12-04T16:15:18.485276", "status": "completed"}, "tags": []}, "outputs": [], "source": ["def train_graph_classifier(model_name, **model_kwargs):\n", " pl.seed_everything(42)\n", "\n", " # Create a PyTorch Lightning trainer with the generation callback\n", " root_dir = os.path.join(CHECKPOINT_PATH, \"GraphLevel\" + model_name)\n", " os.makedirs(root_dir, exist_ok=True)\n", " trainer = pl.Trainer(\n", " default_root_dir=root_dir,\n", " callbacks=[ModelCheckpoint(save_weights_only=True, mode=\"max\", monitor=\"val_acc\")],\n", " gpus=AVAIL_GPUS,\n", " max_epochs=500,\n", " progress_bar_refresh_rate=0,\n", " )\n", " trainer.logger._default_hp_metric = None\n", "\n", " # Check whether pretrained model exists. 
If yes, load it and skip training\n", " pretrained_filename = os.path.join(CHECKPOINT_PATH, \"GraphLevel%s.ckpt\" % model_name)\n", " if os.path.isfile(pretrained_filename):\n", " print(\"Found pretrained model, loading...\")\n", " model = GraphLevelGNN.load_from_checkpoint(pretrained_filename)\n", " else:\n", " pl.seed_everything(42)\n", " model = GraphLevelGNN(\n", " c_in=tu_dataset.num_node_features,\n", " c_out=1 if tu_dataset.num_classes == 2 else tu_dataset.num_classes,\n", " **model_kwargs,\n", " )\n", " trainer.fit(model, graph_train_loader, graph_val_loader)\n", " model = GraphLevelGNN.load_from_checkpoint(trainer.checkpoint_callback.best_model_path)\n", "\n", " # Test best model on validation and test set\n", " train_result = trainer.test(model, test_dataloaders=graph_train_loader, verbose=False)\n", " test_result = trainer.test(model, test_dataloaders=graph_test_loader, verbose=False)\n", " result = {\"test\": test_result[0][\"test_acc\"], \"train\": train_result[0][\"test_acc\"]}\n", " return model, result"]}, {"cell_type": "markdown", "id": "ca9673c3", "metadata": {"papermill": {"duration": 0.119315, "end_time": "2021-12-04T16:15:18.853469", "exception": false, "start_time": "2021-12-04T16:15:18.734154", "status": "completed"}, "tags": []}, "source": ["Finally, let's perform the training and testing.\n", "Feel free to experiment with different GNN layers, hyperparameters, etc."]}, {"cell_type": "code", "execution_count": 27, "id": "bc380c0d", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:15:19.098231Z", "iopub.status.busy": "2021-12-04T16:15:19.097768Z", "iopub.status.idle": "2021-12-04T16:15:19.155078Z", "shell.execute_reply": "2021-12-04T16:15:19.155459Z"}, "papermill": {"duration": 0.18191, "end_time": "2021-12-04T16:15:19.155600", "exception": false, "start_time": "2021-12-04T16:15:18.973690", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["Global seed set to 42\n"]}, 
{"name": "stderr", "output_type": "stream", "text": ["GPU available: True, used: True\n"]}, {"name": "stderr", "output_type": "stream", "text": ["TPU available: False, using: 0 TPU cores\n"]}, {"name": "stderr", "output_type": "stream", "text": ["IPU available: False, using: 0 IPUs\n"]}, {"name": "stderr", "output_type": "stream", "text": ["LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n"]}, {"name": "stderr", "output_type": "stream", "text": ["Missing logger folder: saved_models/GNNs/GraphLevelGraphConv/lightning_logs\n"]}, {"name": "stderr", "output_type": "stream", "text": ["/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/pytorch_lightning/trainer/data_loading.py:453: UserWarning: Your `test_dataloader` has `shuffle=True`,it is strongly recommended that you turn this off for val/test/predict dataloaders.\n", " rank_zero_warn(\n", "/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/pytorch_lightning/utilities/data.py:59: UserWarning: Trying to infer the `batch_size` from an ambiguous collection. The batch size we found is 10. 
To avoid any miscalculations, use `self.log(..., batch_size=batch_size)`.\n", " warning_cache.warn(\n", "LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Found pretrained model, loading...\n"]}], "source": ["model, result = train_graph_classifier(\n", " model_name=\"GraphConv\", c_hidden=256, layer_name=\"GraphConv\", num_layers=3, dp_rate_linear=0.5, dp_rate=0.0\n", ")"]}, {"cell_type": "code", "execution_count": 28, "id": "9db3f0a3", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:15:19.414152Z", "iopub.status.busy": "2021-12-04T16:15:19.413689Z", "iopub.status.idle": "2021-12-04T16:15:19.416116Z", "shell.execute_reply": "2021-12-04T16:15:19.415738Z"}, "papermill": {"duration": 0.133162, "end_time": "2021-12-04T16:15:19.416222", "exception": false, "start_time": "2021-12-04T16:15:19.283060", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Train performance: 92.67%\n", "Test performance: 92.11%\n"]}], "source": ["print(\"Train performance: %4.2f%%\" % (100.0 * result[\"train\"]))\n", "print(\"Test performance: %4.2f%%\" % (100.0 * result[\"test\"]))"]}, {"cell_type": "markdown", "id": "3737c725", "metadata": {"papermill": {"duration": 0.126889, "end_time": "2021-12-04T16:15:19.671142", "exception": false, "start_time": "2021-12-04T16:15:19.544253", "status": "completed"}, "tags": []}, "source": ["The test performance shows that we obtain quite good scores on an unseen part of the dataset.\n", "It should be noted that as we have been using the test set for validation as well, we might have overfitted slightly to this set.\n", "Nevertheless, the experiment shows us that GNNs can be indeed powerful to predict the properties of graphs and/or molecules."]}, {"cell_type": "markdown", "id": "df0d1c2e", "metadata": {"papermill": {"duration": 0.13482, "end_time": "2021-12-04T16:15:19.932515", "exception": false, "start_time": 
"2021-12-04T16:15:19.797695", "status": "completed"}, "tags": []}, "source": ["## Conclusion\n", "\n", "In this tutorial, we have seen the application of neural networks to graph structures.\n", "We looked at how a graph can be represented (adjacency matrix or edge list),\n", "and discussed the implementation of common graph layers: GCN and GAT.\n", "The implementations showed the practical side of the layers, which is often easier than the theory.\n", "Finally, we experimented with different tasks, on node-, edge- and graph-level.\n", "Overall, we have seen that including graph information in the predictions can be crucial for achieving high performance.\n", "There are a lot of applications that benefit from GNNs,\n", "and the importance of these networks will likely increase over the next years."]}, {"cell_type": "markdown", "id": "84b8f473", "metadata": {"papermill": {"duration": 0.135396, "end_time": "2021-12-04T16:15:20.206281", "exception": false, "start_time": "2021-12-04T16:15:20.070885", "status": "completed"}, "tags": []}, "source": ["## Congratulations - Time to Join the Community!\n", "\n", "Congratulations on completing this notebook tutorial! If you enjoyed this and would like to join the Lightning\n", "movement, you can do so in the following ways!\n", "\n", "### Star [Lightning](https://github.com/PyTorchLightning/pytorch-lightning) on GitHub\n", "The easiest way to help our community is just by starring the GitHub repos! This helps raise awareness of the cool\n", "tools we're building.\n", "\n", "### Join our [Slack](https://join.slack.com/t/pytorch-lightning/shared_invite/zt-pw5v393p-qRaDgEk24~EjiZNBpSQFgQ)!\n", "The best way to keep up to date on the latest advancements is to join our community! Make sure to introduce yourself\n", "and share your interests in `#general` channel\n", "\n", "\n", "### Contributions !\n", "The best way to contribute to our community is to become a code contributor! 
At any time you can go to\n", "[Lightning](https://github.com/PyTorchLightning/pytorch-lightning) or [Bolt](https://github.com/PyTorchLightning/lightning-bolts)\n", "GitHub Issues page and filter for \"good first issue\".\n", "\n", "* [Lightning good first issue](https://github.com/PyTorchLightning/pytorch-lightning/issues?q=is%3Aopen+is%3Aissue+label%3A%22good+first+issue%22)\n", "* [Bolt good first issue](https://github.com/PyTorchLightning/lightning-bolts/issues?q=is%3Aopen+is%3Aissue+label%3A%22good+first+issue%22)\n", "* You can also contribute your own notebooks with useful examples !\n", "\n", "### Great thanks from the entire Pytorch Lightning Team for your interest !\n", "\n", "[![Pytorch Lightning](){height=\"60px\" width=\"240px\"}](https://pytorchlightning.ai)"]}, {"cell_type": "raw", "metadata": {"raw_mimetype": "text/restructuredtext"}, "source": [".. customcarditem::\n", " :header: Tutorial 6: Basics of Graph Neural Networks\n", " :card_description: In this tutorial, we will discuss the application of neural networks on graphs. 
Graph Neural Networks (GNNs) have recently gained increasing popularity in both applications...\n", " :tags: Graph,GPU/TPU,UvA-DL-Course\n", " :image: _static/images/course_UvA-DL/06-graph-neural-networks.jpg"]}], "metadata": {"jupytext": {"cell_metadata_filter": "id,colab_type,colab,-all", "formats": "ipynb,py:percent", "main_language": "python"}, "language_info": {"codemirror_mode": {"name": "ipython", "version": 3}, "file_extension": ".py", "mimetype": "text/x-python", "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.9.7"}, "papermill": {"default_parameters": {}, "duration": 27.294729, "end_time": "2021-12-04T16:15:21.142769", "environment_variables": {}, "exception": null, "input_path": "course_UvA-DL/06-graph-neural-networks/GNN_overview.ipynb", "output_path": ".notebooks/course_UvA-DL/06-graph-neural-networks.ipynb", "parameters": {}, "start_time": "2021-12-04T16:14:53.848040", "version": "2.3.3"}}, "nbformat": 4, "nbformat_minor": 5} \ No newline at end of file diff --git a/source/notebooks/course_UvA-DL/07-deep-energy-based-generative-models.ipynb b/source/notebooks/course_UvA-DL/07-deep-energy-based-generative-models.ipynb deleted file mode 100644 index 7ebe824..0000000 --- a/source/notebooks/course_UvA-DL/07-deep-energy-based-generative-models.ipynb +++ /dev/null @@ -1 +0,0 @@ -{"cells": [{"cell_type": "markdown", "id": "7a37951c", "metadata": {"papermill": {"duration": 0.023386, "end_time": "2021-09-16T12:40:39.258673", "exception": false, "start_time": "2021-09-16T12:40:39.235287", "status": "completed"}, "tags": []}, "source": ["\n", "# Tutorial 7: Deep Energy-Based Generative Models\n", "\n", "* **Author:** Phillip Lippe\n", "* **License:** CC BY-SA\n", "* **Generated:** 2021-09-16T14:32:29.871712\n", "\n", "In this tutorial, we will look at energy-based deep learning models, and focus on their application as generative models.\n", "Energy models have been a popular tool before the huge deep learning hype 
around 2012 hit.\n", "However, in recent years, energy-based models have gained increasing attention because of improved training methods and tricks being proposed.\n", "Although they are still in a research stage, they have been shown to outperform strong Generative Adversarial Networks\n", "in certain cases which have been the state of the art of generating images\n", "([blog post](https://ajolicoeur.wordpress.com/the-new-contender-to-gans-score-matching-with-langevin-sampling/) about strong energy-based models,\n", "[blog post](https://medium.com/syncedreview/nvidia-open-sources-hyper-realistic-face-generator-stylegan-f346e1a73826) about the power of GANs).\n", "Hence, it is important to be aware of energy-based models, and as the theory can be abstract sometimes,\n", "we will show the idea of energy-based models with a lot of examples.\n", "This notebook is part of a lecture series on Deep Learning at the University of Amsterdam.\n", "The full list of tutorials can be found at https://uvadlc-notebooks.rtfd.io.\n", "\n", "\n", "---\n", "Open in [![Open In Colab](){height=\"20px\" width=\"117px\"}](https://colab.research.google.com/github/PytorchLightning/lightning-tutorials/blob/publication/.notebooks/course_UvA-DL/07-deep-energy-based-generative-models.ipynb)\n", "\n", "Give us a \u2b50 [on Github](https://www.github.com/PytorchLightning/pytorch-lightning/)\n", "| Check out [the documentation](https://pytorch-lightning.readthedocs.io/en/latest/)\n", "| Join us [on Slack](https://join.slack.com/t/pytorch-lightning/shared_invite/zt-pw5v393p-qRaDgEk24~EjiZNBpSQFgQ)"]}, {"cell_type": "markdown", "id": "7f00f90d", "metadata": {"papermill": {"duration": 0.021442, "end_time": "2021-09-16T12:40:39.301749", "exception": false, "start_time": "2021-09-16T12:40:39.280307", "status": "completed"}, "tags": []}, "source": ["## Setup\n", "This notebook requires some packages besides pytorch-lightning."]}, {"cell_type": "code", "execution_count": 1, "id": "33e8ad5c", "metadata": 
{"colab": {}, "colab_type": "code", "execution": {"iopub.execute_input": "2021-09-16T12:40:39.347844Z", "iopub.status.busy": "2021-09-16T12:40:39.347375Z", "iopub.status.idle": "2021-09-16T12:40:39.349918Z", "shell.execute_reply": "2021-09-16T12:40:39.349436Z"}, "id": "LfrJLKPFyhsK", "lines_to_next_cell": 0, "papermill": {"duration": 0.026972, "end_time": "2021-09-16T12:40:39.350031", "exception": false, "start_time": "2021-09-16T12:40:39.323059", "status": "completed"}, "tags": []}, "outputs": [], "source": ["# ! pip install --quiet \"torchvision\" \"torch>=1.6, <1.9\" \"tensorboard\" \"matplotlib\" \"pytorch-lightning>=1.3\" \"torchmetrics>=0.3\""]}, {"cell_type": "markdown", "id": "9eea4d0b", "metadata": {"papermill": {"duration": 0.022362, "end_time": "2021-09-16T12:40:39.394135", "exception": false, "start_time": "2021-09-16T12:40:39.371773", "status": "completed"}, "tags": []}, "source": ["
\n", "First, let's import our standard libraries below."]}, {"cell_type": "code", "execution_count": 2, "id": "8882a3d0", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:40:39.460040Z", "iopub.status.busy": "2021-09-16T12:40:39.459550Z", "iopub.status.idle": "2021-09-16T12:40:40.727064Z", "shell.execute_reply": "2021-09-16T12:40:40.726625Z"}, "papermill": {"duration": 1.298062, "end_time": "2021-09-16T12:40:40.727182", "exception": false, "start_time": "2021-09-16T12:40:39.429120", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["/tmp/ipykernel_1940/3480345581.py:30: DeprecationWarning: `set_matplotlib_formats` is deprecated since IPython 7.23, directly use `matplotlib_inline.backend_inline.set_matplotlib_formats()`\n", " set_matplotlib_formats(\"svg\", \"pdf\") # For export\n", "Global seed set to 42\n"]}], "source": ["# Standard libraries\n", "import os\n", "import random\n", "import urllib.request\n", "from urllib.error import HTTPError\n", "\n", "# Plotting\n", "import matplotlib\n", "import matplotlib.pyplot as plt\n", "import numpy as np\n", "\n", "# PyTorch Lightning\n", "import pytorch_lightning as pl\n", "\n", "# PyTorch\n", "import torch\n", "import torch.nn as nn\n", "import torch.optim as optim\n", "import torch.utils.data as data\n", "\n", "# Torchvision\n", "import torchvision\n", "\n", "# %matplotlib inline\n", "from IPython.display import set_matplotlib_formats\n", "from pytorch_lightning.callbacks import LearningRateMonitor, ModelCheckpoint\n", "from torchvision import transforms\n", "from torchvision.datasets import MNIST\n", "\n", "set_matplotlib_formats(\"svg\", \"pdf\") # For export\n", "matplotlib.rcParams[\"lines.linewidth\"] = 2.0\n", "\n", "# Path to the folder where the datasets are/should be downloaded (e.g. 
CIFAR10)\n", "DATASET_PATH = os.environ.get(\"PATH_DATASETS\", \"data\")\n", "# Path to the folder where the pretrained models are saved\n", "CHECKPOINT_PATH = os.environ.get(\"PATH_CHECKPOINT\", \"saved_models/tutorial8\")\n", "\n", "# Setting the seed\n", "pl.seed_everything(42)\n", "\n", "# Ensure that all operations are deterministic on GPU (if used) for reproducibility\n", "torch.backends.cudnn.determinstic = True\n", "torch.backends.cudnn.benchmark = False\n", "\n", "device = torch.device(\"cuda:0\") if torch.cuda.is_available() else torch.device(\"cpu\")"]}, {"cell_type": "markdown", "id": "8fa2ad82", "metadata": {"papermill": {"duration": 0.022316, "end_time": "2021-09-16T12:40:40.772238", "exception": false, "start_time": "2021-09-16T12:40:40.749922", "status": "completed"}, "tags": []}, "source": ["We also have pre-trained models that we download below."]}, {"cell_type": "code", "execution_count": 3, "id": "8ddb6202", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:40:40.823433Z", "iopub.status.busy": "2021-09-16T12:40:40.820802Z", "iopub.status.idle": "2021-09-16T12:40:41.030878Z", "shell.execute_reply": "2021-09-16T12:40:41.030402Z"}, "papermill": {"duration": 0.236743, "end_time": "2021-09-16T12:40:41.030985", "exception": false, "start_time": "2021-09-16T12:40:40.794242", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Downloading https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial8/MNIST.ckpt...\n", "Downloading https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial8/tensorboards/events.out.tfevents.MNIST...\n"]}], "source": ["# Github URL where saved models are stored for this tutorial\n", "base_url = \"https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial8/\"\n", "# Files to download\n", "pretrained_files = [\"MNIST.ckpt\", \"tensorboards/events.out.tfevents.MNIST\"]\n", "\n", "# Create checkpoint path if it doesn't exist yet\n", 
"os.makedirs(CHECKPOINT_PATH, exist_ok=True)\n", "\n", "# For each file, check whether it already exists. If not, try downloading it.\n", "for file_name in pretrained_files:\n", " file_path = os.path.join(CHECKPOINT_PATH, file_name)\n", " if \"/\" in file_name:\n", " os.makedirs(file_path.rsplit(\"/\", 1)[0], exist_ok=True)\n", " if not os.path.isfile(file_path):\n", " file_url = base_url + file_name\n", " print(\"Downloading %s...\" % file_url)\n", " try:\n", " urllib.request.urlretrieve(file_url, file_path)\n", " except HTTPError as e:\n", " print(\n", " \"Something went wrong. Please try to download the files manually,\"\n", " \" or contact the author with the full output including the following error:\\n\",\n", " e,\n", " )"]}, {"cell_type": "markdown", "id": "54b9725b", "metadata": {"papermill": {"duration": 0.02216, "end_time": "2021-09-16T12:40:41.075989", "exception": false, "start_time": "2021-09-16T12:40:41.053829", "status": "completed"}, "tags": []}, "source": ["## Energy Models\n", "\n", "In the first part of this tutorial, we will review the theory of the energy-based models\n", "(the same theory has been discussed in Lecture 8).\n", "While most of the previous models had the goal of classification or regression,\n", "energy-based models are motivated from a different perspective: density estimation.\n", "Given a dataset with a lot of elements, we want to estimate the probability distribution over the whole data space.\n", "As an example, if we model images from CIFAR10, our goal would be to have a probability distribution\n", "over all possible images of size $32\\times32\\times3$ where those images have a high likelihood\n", "that look realistic and are one of the 10 CIFAR classes.\n", "Simple methods like interpolation between images don't work because images are extremely high-dimensional\n", "(especially for large HD images).\n", "Hence, we turn to deep learning methods that have performed well on complex data.\n", "\n", "However, how do we 
predict a probability distribution $p(\\mathbf{x})$ over so many dimensions using a simple neural network?\n", "The problem is that we cannot just predict a score between 0 and 1,\n", "because a probability distribution over data needs to fulfill two properties:\n", "\n", "1.\n", "The probability distribution needs to assign any possible value of\n", "$\\mathbf{x}$ a non-negative value: $p(\\mathbf{x}) \\geq 0$.\n", "2.\n", "The probability density must sum/integrate to 1 over **all** possible inputs:\n", "$\\int_{\\mathbf{x}} p(\\mathbf{x}) d\\mathbf{x} = 1$.\n", "\n", "Luckily, there are actually many approaches for this, and energy-based models are one of them.\n", "The fundamental idea of energy-based models is that you can turn any function\n", "that predicts values larger than zero into a probability distribution by dividing by its volume.\n", "Imagine we have a neural network, which has as output a single neuron, like in regression.\n", "We can call this network $E_{\\theta}(\\mathbf{x})$, where $\\theta$ are our parameters of the network,\n", "and $\\mathbf{x}$ the input data (e.g. 
an image).\n", "The output of $E_{\\theta}$ is a scalar value between $-\\infty$ and $\\infty$.\n", "Now, we can use basic probability theory to *normalize* the scores of all possible inputs:\n", "\n", "$$\n", "q_{\\theta}(\\mathbf{x}) = \\frac{\\exp\\left(-E_{\\theta}(\\mathbf{x})\\right)}{Z_{\\theta}} \\hspace{5mm}\\text{where}\\hspace{5mm}\n", "Z_{\\theta} = \\begin{cases}\n", " \\int_{\\mathbf{x}}\\exp\\left(-E_{\\theta}(\\mathbf{x})\\right) d\\mathbf{x} & \\text{if }x\\text{ is continuous}\\\\\n", " \\sum_{\\mathbf{x}}\\exp\\left(-E_{\\theta}(\\mathbf{x})\\right) & \\text{if }x\\text{ is discrete}\n", "\\end{cases}\n", "$$\n", "\n", "The $\\exp$-function ensures that we assign a probability greater than zero to any possible input.\n", "We use a negative sign in front of $E$ because we call $E_{\\theta}$ the energy function:\n", "data points with high likelihood have a low energy, while data points with low likelihood have a high energy.\n", "$Z_{\\theta}$ is our normalization term that ensures that the density integrates/sums to 1.\n", "We can show this by integrating over $q_{\\theta}(\\mathbf{x})$:\n", "\n", "$$\n", "\\int_{\\mathbf{x}}q_{\\theta}(\\mathbf{x})d\\mathbf{x} =\n", "\\int_{\\mathbf{x}}\\frac{\\exp\\left(-E_{\\theta}(\\mathbf{x})\\right)}{\\int_{\\mathbf{\\tilde{x}}}\\exp\\left(-E_{\\theta}(\\mathbf{\\tilde{x}})\\right) d\\mathbf{\\tilde{x}}}d\\mathbf{x} =\n", "\\frac{\\int_{\\mathbf{x}}\\exp\\left(-E_{\\theta}(\\mathbf{x})\\right)d\\mathbf{x}}{\\int_{\\mathbf{\\tilde{x}}}\\exp\\left(-E_{\\theta}(\\mathbf{\\tilde{x}})\\right) d\\mathbf{\\tilde{x}}} = 1\n", "$$\n", "\n", "Note that we call the probability distribution $q_{\\theta}(\\mathbf{x})$ because this is the distribution learned by the model,\n", "and is trained to be as close as possible to the *true*, unknown distribution $p(\\mathbf{x})$.\n", "\n", "The main benefit of this formulation of the probability distribution is its great flexibility as we can choose\n", "$E_{\\theta}$ in 
whatever way we like, without any constraints.\n", "Nevertheless, when looking at the equation above, we can see a fundamental issue: How do we calculate $Z_{\\theta}$?\n", "There is no chance that we can calculate $Z_{\\theta}$ analytically for high-dimensional input\n", "and/or larger neural networks, but the task requires us to know $Z_{\\theta}$.\n", "Although we can't determine the exact likelihood of a point, there exist methods with which we can train energy-based models.\n", "Thus, we will look next at \"Contrastive Divergence\" for training the model."]}, {"cell_type": "markdown", "id": "5f67ccab", "metadata": {"papermill": {"duration": 0.022199, "end_time": "2021-09-16T12:40:41.120470", "exception": false, "start_time": "2021-09-16T12:40:41.098271", "status": "completed"}, "tags": []}, "source": ["### Contrastive Divergence\n", "\n", "When we train a model for generative modeling, it is usually done by maximum likelihood estimation.\n", "In other words, we try to maximize the likelihood of the examples in the training set.\n", "As the exact likelihood of a point cannot be determined due to the unknown normalization constant $Z_{\\theta}$,\n", "we need to train energy-based models slightly differently.\n", "We cannot just maximize the un-normalized probability $\\exp(-E_{\\theta}(\\mathbf{x}_{\\text{train}}))$\n", "because there is no guarantee that $Z_{\\theta}$ stays constant, or that $\\mathbf{x}_{\\text{train}}$\n", "is becoming more likely than the others.\n", "However, if we base our training on comparing the likelihood of points, we can create a stable objective.\n", "Namely, we can re-write our maximum likelihood objective where we maximize the probability\n", "of $\\mathbf{x}_{\\text{train}}$ compared to a randomly sampled data point of our model:\n", "\n", "$$\n", "\\begin{split}\n", " \\nabla_{\\theta}\\mathcal{L}_{\\text{MLE}}(\\mathbf{\\theta};p) & = -\\mathbb{E}_{p(\\mathbf{x})}\\left[\\nabla_{\\theta}\\log 
q_{\\theta}(\\mathbf{x})\\right]\\\\[5pt]\n", " & = \\mathbb{E}_{p(\\mathbf{x})}\\left[\\nabla_{\\theta}E_{\\theta}(\\mathbf{x})\\right] - \\mathbb{E}_{q_{\\theta}(\\mathbf{x})}\\left[\\nabla_{\\theta}E_{\\theta}(\\mathbf{x})\\right]\n", "\\end{split}\n", "$$\n", "\n", "Note that the loss is still an objective we want to minimize.\n", "Thus, we try to minimize the energy for data points from the dataset, while maximizing the energy for randomly\n", "sampled data points from our model (how we sample will be explained below).\n", "Although this objective sounds intuitive, how is it actually derived from our original distribution $q_{\\theta}(\\mathbf{x})$?\n", "The trick is that we approximate $Z_{\\theta}$ by a single Monte-Carlo sample.\n", "This gives us the exact same objective as written above.\n", "\n", "Visually, we can look at the objective as follows (figure credit\n", "- [Stefano Ermon and Aditya Grover](https://deepgenerativemodels.github.io/assets/slides/cs236_lecture11.pdf)):\n", "\n", "
\n", "\n", "$f_{\\theta}$ represents $\\exp(-E_{\\theta}(\\mathbf{x}))$ in our case.\n", "The point on the right, called \"correct answer\", represents a data point from the dataset\n", "(i.e. $x_{\\text{train}}$), and the left point, \"wrong answer\", a sample from our model (i.e. $x_{\\text{sample}}$).\n", "Thus, we try to \"pull up\" the probability of the data points in the dataset,\n", "while \"pushing down\" randomly sampled points.\n", "The two forces for pulling and pushing are in balance iff $q_{\\theta}(\\mathbf{x})=p(\\mathbf{x})$."]}, {"cell_type": "markdown", "id": "2b9dc4a8", "metadata": {"papermill": {"duration": 0.022022, "end_time": "2021-09-16T12:40:41.164700", "exception": false, "start_time": "2021-09-16T12:40:41.142678", "status": "completed"}, "tags": []}, "source": ["### Sampling from Energy-Based Models\n", "\n", "For sampling from an energy-based model, we can apply a Markov Chain Monte Carlo using Langevin Dynamics.\n", "The idea of the algorithm is to start from a random point, and slowly move towards the direction\n", "of higher probability using the gradients of $E_{\\theta}$.\n", "Nevertheless, this is not enough to fully capture the probability distribution.\n", "We need to add noise $\\omega$ at each gradient step to the current sample.\n", "Under certain conditions such as that we perform the gradient steps an infinite amount of times,\n", "we would be able to create an exact sample from our modeled distribution.\n", "However, as this is not practically possible, we usually limit the chain to $K$ steps\n", "($K$ a hyperparameter that needs to be finetuned).\n", "Overall, the sampling procedure can be summarized in the following algorithm:\n", "\n", "
"]}, {"cell_type": "markdown", "id": "c20bf67b", "metadata": {"papermill": {"duration": 0.02196, "end_time": "2021-09-16T12:40:41.209186", "exception": false, "start_time": "2021-09-16T12:40:41.187226", "status": "completed"}, "tags": []}, "source": ["### Applications of Energy-based models beyond generation\n", "\n", "Modeling the probability distribution for sampling new data is not the only application of energy-based models.\n", "Any application which requires us to compare two elements is much simpler to learn\n", "because we just need to go for the higher energy.\n", "A couple of examples are shown below (figure credit\n", "- [Stefano Ermon and Aditya Grover](https://deepgenerativemodels.github.io/assets/slides/cs236_lecture11.pdf)).\n", "A classification setup like object recognition or sequence labeling can be considered as an energy-based\n", "task as we just need to find the $Y$ input that minimizes the output $E(X, Y)$ (hence maximizes probability).\n", "Similarly, a popular application of energy-based models is denoising of images.\n", "Given an image $X$ with a lot of noise, we try to minimize the energy by finding the true input image $Y$.\n", "\n", "
\n", "\n", "Nonetheless, we will focus on generative modeling here as in the next couple of lectures,\n", "we will discuss more generative deep learning approaches."]}, {"cell_type": "markdown", "id": "89370a6d", "metadata": {"papermill": {"duration": 0.022103, "end_time": "2021-09-16T12:40:41.253274", "exception": false, "start_time": "2021-09-16T12:40:41.231171", "status": "completed"}, "tags": []}, "source": ["## Image generation\n", "\n", "
\n", "\n", "As an example for energy-based models, we will train a model on image generation.\n", "Specifically, we will look at how we can generate MNIST digits with a very simple CNN model.\n", "However, it should be noted that energy models are not easy to train and often diverge\n", "if the hyperparameters are not well tuned.\n", "We will rely on training tricks proposed in the paper\n", "[Implicit Generation and Generalization in Energy-Based Models](https://arxiv.org/abs/1903.08689)\n", "by Yilun Du and Igor Mordatch ([blog](https://openai.com/blog/energy-based-models/)).\n", "The important part of this notebook is however to see how the theory above can actually be used in a model.\n", "\n", "### Dataset\n", "\n", "First, we can load the MNIST dataset below.\n", "Note that we need to normalize the images between -1 and 1 instead of mean 0 and std 1 because during sampling,\n", "we have to limit the input space.\n", "Scaling between -1 and 1 makes it easier to implement it."]}, {"cell_type": "code", "execution_count": 4, "id": "d20babd4", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:40:41.303522Z", "iopub.status.busy": "2021-09-16T12:40:41.302963Z", "iopub.status.idle": "2021-09-16T12:40:41.332018Z", "shell.execute_reply": "2021-09-16T12:40:41.331579Z"}, "papermill": {"duration": 0.056251, "end_time": "2021-09-16T12:40:41.332136", "exception": false, "start_time": "2021-09-16T12:40:41.275885", "status": "completed"}, "tags": []}, "outputs": [], "source": ["# Transformations applied on each image => make them a tensor and normalize between -1 and 1\n", "transform = transforms.Compose([transforms.ToTensor(), transforms.Normalize((0.5,), (0.5,))])\n", "\n", "# Loading the training dataset. 
We need to split it into a training and validation part\n", "train_set = MNIST(root=DATASET_PATH, train=True, transform=transform, download=True)\n", "\n", "# Loading the test set\n", "test_set = MNIST(root=DATASET_PATH, train=False, transform=transform, download=True)\n", "\n", "# We define a set of data loaders that we can use for various purposes later.\n", "# Note that for actually training a model, we will use different data loaders\n", "# with a lower batch size.\n", "train_loader = data.DataLoader(train_set, batch_size=128, shuffle=True, drop_last=True, num_workers=4, pin_memory=True)\n", "test_loader = data.DataLoader(test_set, batch_size=256, shuffle=False, drop_last=False, num_workers=4)"]}, {"cell_type": "markdown", "id": "3e1b26e0", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.02242, "end_time": "2021-09-16T12:40:41.378644", "exception": false, "start_time": "2021-09-16T12:40:41.356224", "status": "completed"}, "tags": []}, "source": ["### CNN Model\n", "\n", "First, we implement our CNN model.\n", "The MNIST images are of size 28x28, hence we only need a small model.\n", "As an example, we will apply several convolutions with stride 2 that downscale the images.\n", "If you are interested, you can also use a deeper model such as a small ResNet, but for simplicity,\n", "we will stick with the tiny network.\n", "\n", "It is a good practice to use a smooth activation function like Swish instead of ReLU in the energy model.\n", "This is because we will rely on the gradients we get back with respect to the input image, which should not be sparse."]}, {"cell_type": "code", "execution_count": 5, "id": "38169d71", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:40:41.429707Z", "iopub.status.busy": "2021-09-16T12:40:41.429207Z", "iopub.status.idle": "2021-09-16T12:40:41.431319Z", "shell.execute_reply": "2021-09-16T12:40:41.430920Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 0.030493, "end_time": 
"2021-09-16T12:40:41.431417", "exception": false, "start_time": "2021-09-16T12:40:41.400924", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class CNNModel(nn.Module):\n", " def __init__(self, hidden_features=32, out_dim=1, **kwargs):\n", " super().__init__()\n", " # We increase the hidden dimension over layers. Here pre-calculated for simplicity.\n", " c_hid1 = hidden_features // 2\n", " c_hid2 = hidden_features\n", " c_hid3 = hidden_features * 2\n", "\n", " # Series of convolutions and Swish activation functions\n", " self.cnn_layers = nn.Sequential(\n", " nn.Conv2d(1, c_hid1, kernel_size=5, stride=2, padding=4), # [16x16] - Larger padding to get 32x32 image\n", " nn.SiLU(),\n", " nn.Conv2d(c_hid1, c_hid2, kernel_size=3, stride=2, padding=1), # [8x8]\n", " nn.SiLU(),\n", " nn.Conv2d(c_hid2, c_hid3, kernel_size=3, stride=2, padding=1), # [4x4]\n", " nn.SiLU(),\n", " nn.Conv2d(c_hid3, c_hid3, kernel_size=3, stride=2, padding=1), # [2x2]\n", " nn.SiLU(),\n", " nn.Flatten(),\n", " nn.Linear(c_hid3 * 4, c_hid3),\n", " nn.SiLU(),\n", " nn.Linear(c_hid3, out_dim),\n", " )\n", "\n", " def forward(self, x):\n", " x = self.cnn_layers(x).squeeze(dim=-1)\n", " return x"]}, {"cell_type": "markdown", "id": "86a8d447", "metadata": {"papermill": {"duration": 0.022437, "end_time": "2021-09-16T12:40:41.476079", "exception": false, "start_time": "2021-09-16T12:40:41.453642", "status": "completed"}, "tags": []}, "source": ["In the rest of the notebook, the output of the model will actually not represent\n", "$E_{\\theta}(\\mathbf{x})$, but $-E_{\\theta}(\\mathbf{x})$.\n", "This is a standard implementation practice for energy-based models, as some people also write the energy probability\n", "density as $q_{\\theta}(\\mathbf{x}) = \\frac{\\exp\\left(f_{\\theta}(\\mathbf{x})\\right)}{Z_{\\theta}}$.\n", "In that case, the model would actually represent $f_{\\theta}(\\mathbf{x})$.\n", "In the training loss etc., we need to be careful to not switch up the signs."]}, 
{"cell_type": "markdown", "id": "5321df9e", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.022306, "end_time": "2021-09-16T12:40:41.520797", "exception": false, "start_time": "2021-09-16T12:40:41.498491", "status": "completed"}, "tags": []}, "source": ["### Sampling buffer\n", "\n", "In the next part, we look at the training with sampled elements.\n", "To use the contrastive divergence objective, we need to generate samples during training.\n", "Previous work has shown that due to the high dimensionality of images, we need a lot of iterations\n", "inside the MCMC sampling to obtain reasonable samples.\n", "However, there is a training trick that significantly reduces the sampling cost: using a sampling buffer.\n", "The idea is that we store the samples of the last couple of batches in a buffer,\n", "and re-use those as the starting point of the MCMC algorithm for the next batches.\n", "This reduces the sampling cost because the model requires a significantly\n", "lower number of steps to converge to reasonable samples.\n", "However, to not solely rely on previous samples and allow novel samples as well,\n", "we re-initialize 5% of our samples from scratch (random noise between -1 and 1).\n", "\n", "Below, we implement the sampling buffer.\n", "The function `sample_new_exmps` returns a new batch of \"fake\" images.\n", "We refer to those as fake images because they have been generated, but are not actually part of the dataset.\n", "As mentioned before, we initialize 5% randomly, and 95% are randomly picked from our buffer.\n", "On this initial batch, we perform MCMC for 60 iterations to improve the image quality\n", "and come closer to samples from $q_{\\theta}(\\mathbf{x})$.\n", "In the function `generate_samples`, we implemented the MCMC for images.\n", "Note that the hyperparameters of `step_size`, `steps`, the noise standard deviation\n", "$\\sigma$ are specifically set for MNIST, and need to be finetuned for a different dataset if you 
want to use such."]}, {"cell_type": "code", "execution_count": 6, "id": "84649cbd", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:40:41.577495Z", "iopub.status.busy": "2021-09-16T12:40:41.576997Z", "iopub.status.idle": "2021-09-16T12:40:41.579100Z", "shell.execute_reply": "2021-09-16T12:40:41.578638Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 0.035877, "end_time": "2021-09-16T12:40:41.579195", "exception": false, "start_time": "2021-09-16T12:40:41.543318", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class Sampler:\n", " def __init__(self, model, img_shape, sample_size, max_len=8192):\n", " \"\"\"\n", " Args:\n", " model: Neural network to use for modeling E_theta\n", " img_shape: Shape of the images to model\n", " sample_size: Batch size of the samples\n", " max_len: Maximum number of data points to keep in the buffer\n", " \"\"\"\n", " super().__init__()\n", " self.model = model\n", " self.img_shape = img_shape\n", " self.sample_size = sample_size\n", " self.max_len = max_len\n", " self.examples = [(torch.rand((1,) + img_shape) * 2 - 1) for _ in range(self.sample_size)]\n", "\n", " def sample_new_exmps(self, steps=60, step_size=10):\n", " \"\"\"Function for getting a new batch of \"fake\" images.\n", "\n", " Args:\n", " steps: Number of iterations in the MCMC algorithm\n", " step_size: Learning rate nu in the algorithm above\n", " \"\"\"\n", " # Choose 95% of the batch from the buffer, 5% generate from scratch\n", " n_new = np.random.binomial(self.sample_size, 0.05)\n", " rand_imgs = torch.rand((n_new,) + self.img_shape) * 2 - 1\n", " old_imgs = torch.cat(random.choices(self.examples, k=self.sample_size - n_new), dim=0)\n", " inp_imgs = torch.cat([rand_imgs, old_imgs], dim=0).detach().to(device)\n", "\n", " # Perform MCMC sampling\n", " inp_imgs = Sampler.generate_samples(self.model, inp_imgs, steps=steps, step_size=step_size)\n", "\n", " # Add new images to the buffer and remove old ones if needed\n", " 
self.examples = list(inp_imgs.to(torch.device(\"cpu\")).chunk(self.sample_size, dim=0)) + self.examples\n", " self.examples = self.examples[: self.max_len]\n", " return inp_imgs\n", "\n", " @staticmethod\n", " def generate_samples(model, inp_imgs, steps=60, step_size=10, return_img_per_step=False):\n", " \"\"\"Function for sampling images for a given model.\n", "\n", " Args:\n", " model: Neural network to use for modeling E_theta\n", " inp_imgs: Images to start from for sampling. If you want to generate new images, enter noise between -1 and 1.\n", " steps: Number of iterations in the MCMC algorithm.\n", " step_size: Learning rate nu in the algorithm above\n", " return_img_per_step: If True, we return the sample at every iteration of the MCMC\n", " \"\"\"\n", " # Before MCMC: set model parameters to \"required_grad=False\"\n", " # because we are only interested in the gradients of the input.\n", " is_training = model.training\n", " model.eval()\n", " for p in model.parameters():\n", " p.requires_grad = False\n", " inp_imgs.requires_grad = True\n", "\n", " # Enable gradient calculation if not already the case\n", " had_gradients_enabled = torch.is_grad_enabled()\n", " torch.set_grad_enabled(True)\n", "\n", " # We use a buffer tensor in which we generate noise each loop iteration.\n", " # More efficient than creating a new tensor every iteration.\n", " noise = torch.randn(inp_imgs.shape, device=inp_imgs.device)\n", "\n", " # List for storing generations at each step (for later analysis)\n", " imgs_per_step = []\n", "\n", " # Loop over K (steps)\n", " for _ in range(steps):\n", " # Part 1: Add noise to the input.\n", " noise.normal_(0, 0.005)\n", " inp_imgs.data.add_(noise.data)\n", " inp_imgs.data.clamp_(min=-1.0, max=1.0)\n", "\n", " # Part 2: calculate gradients for the current input.\n", " out_imgs = -model(inp_imgs)\n", " out_imgs.sum().backward()\n", " inp_imgs.grad.data.clamp_(-0.03, 0.03) # For stabilizing and preventing too high gradients\n", "\n", " # Apply 
gradients to our current samples\n", " inp_imgs.data.add_(-step_size * inp_imgs.grad.data)\n", " inp_imgs.grad.detach_()\n", " inp_imgs.grad.zero_()\n", " inp_imgs.data.clamp_(min=-1.0, max=1.0)\n", "\n", " if return_img_per_step:\n", " imgs_per_step.append(inp_imgs.clone().detach())\n", "\n", " # Reactivate gradients for parameters for training\n", " for p in model.parameters():\n", " p.requires_grad = True\n", " model.train(is_training)\n", "\n", " # Reset gradient calculation to setting before this function\n", " torch.set_grad_enabled(had_gradients_enabled)\n", "\n", " if return_img_per_step:\n", " return torch.stack(imgs_per_step, dim=0)\n", " else:\n", " return inp_imgs"]}, {"cell_type": "markdown", "id": "da0da692", "metadata": {"papermill": {"duration": 0.022214, "end_time": "2021-09-16T12:40:41.623643", "exception": false, "start_time": "2021-09-16T12:40:41.601429", "status": "completed"}, "tags": []}, "source": ["The idea of the buffer becomes a bit clearer in the following algorithm."]}, {"cell_type": "markdown", "id": "a39ea7ee", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.022698, "end_time": "2021-09-16T12:40:41.668518", "exception": false, "start_time": "2021-09-16T12:40:41.645820", "status": "completed"}, "tags": []}, "source": ["### Training algorithm\n", "\n", "With the sampling buffer being ready, we can complete our training algorithm.\n", "Below is shown a summary of the full training algorithm of an energy model on image modeling:\n", "\n", "
\n", "\n", "The first few statements in each training iteration concern the sampling of the real and fake data,\n", "as we have seen above with the sample buffer.\n", "Next, we calculate the contrastive divergence objective using our energy model $E_{\\theta}$.\n", "However, one additional training trick we need is to add a regularization loss on the output of $E_{\\theta}$.\n", "As the output of the network is not constrained and adding a large bias or not to the output\n", "doesn't change the contrastive divergence loss, we need to ensure somehow else that the output values are in a reasonable range.\n", "Without the regularization loss, the output values will fluctuate in a very large range.\n", "With this, we ensure that the values for the real data are around 0, and the fake data likely slightly lower\n", "(for noise or outliers the score can be still significantly lower).\n", "As the regularization loss is less important than the Contrastive Divergence, we have a weight factor\n", "$\\alpha$ which is usually quite a bit smaller than 1.\n", "Finally, we perform an update step with an optimizer on the combined loss and add the new samples to the buffer.\n", "\n", "Below, we put this training dynamic into a PyTorch Lightning module:"]}, {"cell_type": "code", "execution_count": 7, "id": "5733f772", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:40:41.724998Z", "iopub.status.busy": "2021-09-16T12:40:41.717399Z", "iopub.status.idle": "2021-09-16T12:40:41.727028Z", "shell.execute_reply": "2021-09-16T12:40:41.726628Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 0.034742, "end_time": "2021-09-16T12:40:41.727126", "exception": false, "start_time": "2021-09-16T12:40:41.692384", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class DeepEnergyModel(pl.LightningModule):\n", " def __init__(self, img_shape, batch_size, alpha=0.1, lr=1e-4, beta1=0.0, **CNN_args):\n", " super().__init__()\n", " self.save_hyperparameters()\n", "\n", " 
self.cnn = CNNModel(**CNN_args)\n", " self.sampler = Sampler(self.cnn, img_shape=img_shape, sample_size=batch_size)\n", " self.example_input_array = torch.zeros(1, *img_shape)\n", "\n", " def forward(self, x):\n", " z = self.cnn(x)\n", " return z\n", "\n", " def configure_optimizers(self):\n", " # Energy models can have issues with momentum as the loss surfaces changes with its parameters.\n", " # Hence, we set it to 0 by default.\n", " optimizer = optim.Adam(self.parameters(), lr=self.hparams.lr, betas=(self.hparams.beta1, 0.999))\n", " scheduler = optim.lr_scheduler.StepLR(optimizer, 1, gamma=0.97) # Exponential decay over epochs\n", " return [optimizer], [scheduler]\n", "\n", " def training_step(self, batch, batch_idx):\n", " # We add minimal noise to the original images to prevent the model from focusing on purely \"clean\" inputs\n", " real_imgs, _ = batch\n", " small_noise = torch.randn_like(real_imgs) * 0.005\n", " real_imgs.add_(small_noise).clamp_(min=-1.0, max=1.0)\n", "\n", " # Obtain samples\n", " fake_imgs = self.sampler.sample_new_exmps(steps=60, step_size=10)\n", "\n", " # Predict energy score for all images\n", " inp_imgs = torch.cat([real_imgs, fake_imgs], dim=0)\n", " real_out, fake_out = self.cnn(inp_imgs).chunk(2, dim=0)\n", "\n", " # Calculate losses\n", " reg_loss = self.hparams.alpha * (real_out ** 2 + fake_out ** 2).mean()\n", " cdiv_loss = fake_out.mean() - real_out.mean()\n", " loss = reg_loss + cdiv_loss\n", "\n", " # Logging\n", " self.log(\"loss\", loss)\n", " self.log(\"loss_regularization\", reg_loss)\n", " self.log(\"loss_contrastive_divergence\", cdiv_loss)\n", " self.log(\"metrics_avg_real\", real_out.mean())\n", " self.log(\"metrics_avg_fake\", fake_out.mean())\n", " return loss\n", "\n", " def validation_step(self, batch, batch_idx):\n", " # For validating, we calculate the contrastive divergence between purely random images and unseen examples\n", " # Note that the validation/test step of energy-based models depends on what we 
are interested in the model\n", " real_imgs, _ = batch\n", " fake_imgs = torch.rand_like(real_imgs) * 2 - 1\n", "\n", " inp_imgs = torch.cat([real_imgs, fake_imgs], dim=0)\n", " real_out, fake_out = self.cnn(inp_imgs).chunk(2, dim=0)\n", "\n", " cdiv = fake_out.mean() - real_out.mean()\n", " self.log(\"val_contrastive_divergence\", cdiv)\n", " self.log(\"val_fake_out\", fake_out.mean())\n", " self.log(\"val_real_out\", real_out.mean())"]}, {"cell_type": "markdown", "id": "1ae0ae51", "metadata": {"papermill": {"duration": 0.022675, "end_time": "2021-09-16T12:40:41.772185", "exception": false, "start_time": "2021-09-16T12:40:41.749510", "status": "completed"}, "tags": []}, "source": ["We do not implement a test step because energy-based, generative models are usually not evaluated on a test set.\n", "The validation step however is used to get an idea of the difference between energy/likelihood\n", "of random images to unseen examples of the dataset."]}, {"cell_type": "markdown", "id": "6ae9a058", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.022224, "end_time": "2021-09-16T12:40:41.816602", "exception": false, "start_time": "2021-09-16T12:40:41.794378", "status": "completed"}, "tags": []}, "source": ["### Callbacks\n", "\n", "To track the performance of our model during training, we will make extensive use of PyTorch Lightning's callback framework.\n", "Remember that callbacks can be used for running small functions at any point of the training,\n", "for instance after finishing an epoch.\n", "Here, we will use three different callbacks we define ourselves.\n", "\n", "The first callback, called `GenerateCallback`, is used for adding image generations to the model during training.\n", "After every $N$ epochs (usually $N=5$ to reduce output to TensorBoard), we take a small batch\n", "of random images and perform many MCMC iterations until the model's generation converges.\n", "Compared to the training that used 60 iterations, we use 256 here 
because\n", "(1) we only have to do it once compared to the training that has to do it every iteration, and\n", "(2) we do not start from a buffer here, but from scratch.\n", "It is implemented as follows:"]}, {"cell_type": "code", "execution_count": 8, "id": "553fb562", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:40:41.868808Z", "iopub.status.busy": "2021-09-16T12:40:41.868332Z", "iopub.status.idle": "2021-09-16T12:40:41.870405Z", "shell.execute_reply": "2021-09-16T12:40:41.870008Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 0.031581, "end_time": "2021-09-16T12:40:41.870500", "exception": false, "start_time": "2021-09-16T12:40:41.838919", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class GenerateCallback(pl.Callback):\n", " def __init__(self, batch_size=8, vis_steps=8, num_steps=256, every_n_epochs=5):\n", " super().__init__()\n", " self.batch_size = batch_size # Number of images to generate\n", " self.vis_steps = vis_steps # Number of steps within generation to visualize\n", " self.num_steps = num_steps # Number of steps to take during generation\n", " # Only save those images every N epochs (otherwise tensorboard gets quite large)\n", " self.every_n_epochs = every_n_epochs\n", "\n", " def on_epoch_end(self, trainer, pl_module):\n", " # Skip for all other epochs\n", " if trainer.current_epoch % self.every_n_epochs == 0:\n", " # Generate images\n", " imgs_per_step = self.generate_imgs(pl_module)\n", " # Plot and add to tensorboard\n", " for i in range(imgs_per_step.shape[1]):\n", " step_size = self.num_steps // self.vis_steps\n", " imgs_to_plot = imgs_per_step[step_size - 1 :: step_size, i]\n", " grid = torchvision.utils.make_grid(\n", " imgs_to_plot, nrow=imgs_to_plot.shape[0], normalize=True, range=(-1, 1)\n", " )\n", " trainer.logger.experiment.add_image(\"generation_%i\" % i, grid, global_step=trainer.current_epoch)\n", "\n", " def generate_imgs(self, pl_module):\n", " pl_module.eval()\n", " start_imgs = 
torch.rand((self.batch_size,) + pl_module.hparams[\"img_shape\"]).to(pl_module.device)\n", " start_imgs = start_imgs * 2 - 1\n", " imgs_per_step = Sampler.generate_samples(\n", " pl_module.cnn, start_imgs, steps=self.num_steps, step_size=10, return_img_per_step=True\n", " )\n", " pl_module.train()\n", " return imgs_per_step"]}, {"cell_type": "markdown", "id": "10fb6c28", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.022491, "end_time": "2021-09-16T12:40:41.915420", "exception": false, "start_time": "2021-09-16T12:40:41.892929", "status": "completed"}, "tags": []}, "source": ["The second callback is called `SamplerCallback`, and simply adds a randomly picked subset of images\n", "in the sampling buffer to the TensorBoard.\n", "This helps to understand what images are currently shown to the model as \"fake\"."]}, {"cell_type": "code", "execution_count": 9, "id": "d973c3d0", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:40:41.965194Z", "iopub.status.busy": "2021-09-16T12:40:41.964725Z", "iopub.status.idle": "2021-09-16T12:40:41.966940Z", "shell.execute_reply": "2021-09-16T12:40:41.966479Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 0.029353, "end_time": "2021-09-16T12:40:41.967038", "exception": false, "start_time": "2021-09-16T12:40:41.937685", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class SamplerCallback(pl.Callback):\n", " def __init__(self, num_imgs=32, every_n_epochs=5):\n", " super().__init__()\n", " self.num_imgs = num_imgs # Number of images to plot\n", " # Only save those images every N epochs (otherwise tensorboard gets quite large)\n", " self.every_n_epochs = every_n_epochs\n", "\n", " def on_epoch_end(self, trainer, pl_module):\n", " if trainer.current_epoch % self.every_n_epochs == 0:\n", " exmp_imgs = torch.cat(random.choices(pl_module.sampler.examples, k=self.num_imgs), dim=0)\n", " grid = torchvision.utils.make_grid(exmp_imgs, nrow=4, normalize=True, range=(-1, 1))\n", " 
trainer.logger.experiment.add_image(\"sampler\", grid, global_step=trainer.current_epoch)"]}, {"cell_type": "markdown", "id": "adaa80d7", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.022387, "end_time": "2021-09-16T12:40:42.011824", "exception": false, "start_time": "2021-09-16T12:40:41.989437", "status": "completed"}, "tags": []}, "source": ["Finally, our last callback is `OutlierCallback`.\n", "This callback evaluates the model by recording the (negative) energy assigned to random noise.\n", "While our training loss is almost constant across iterations,\n", "this score is likely showing the progress of the model to detect \"outliers\"."]}, {"cell_type": "code", "execution_count": 10, "id": "9ac8745d", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:40:42.064684Z", "iopub.status.busy": "2021-09-16T12:40:42.064208Z", "iopub.status.idle": "2021-09-16T12:40:42.066806Z", "shell.execute_reply": "2021-09-16T12:40:42.066321Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 0.03245, "end_time": "2021-09-16T12:40:42.066912", "exception": false, "start_time": "2021-09-16T12:40:42.034462", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class OutlierCallback(pl.Callback):\n", " def __init__(self, batch_size=1024):\n", " super().__init__()\n", " self.batch_size = batch_size\n", "\n", " def on_epoch_end(self, trainer, pl_module):\n", " with torch.no_grad():\n", " pl_module.eval()\n", " rand_imgs = torch.rand((self.batch_size,) + pl_module.hparams[\"img_shape\"]).to(pl_module.device)\n", " rand_imgs = rand_imgs * 2 - 1.0\n", " rand_out = pl_module.cnn(rand_imgs).mean()\n", " pl_module.train()\n", "\n", " trainer.logger.experiment.add_scalar(\"rand_out\", rand_out, global_step=trainer.current_epoch)"]}, {"cell_type": "markdown", "id": "70834e47", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.022843, "end_time": "2021-09-16T12:40:42.112671", "exception": false, "start_time": 
"2021-09-16T12:40:42.089828", "status": "completed"}, "tags": []}, "source": ["### Running the model\n", "\n", "Finally, we can add everything together to create our final training function.\n", "The function is very similar to any other PyTorch Lightning training function we have seen so far.\n", "However, there is the small difference of that we do not test the model on a test set\n", "because we will analyse the model afterward by checking its prediction and ability to perform outlier detection."]}, {"cell_type": "code", "execution_count": 11, "id": "5561a42f", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:40:42.164214Z", "iopub.status.busy": "2021-09-16T12:40:42.163735Z", "iopub.status.idle": "2021-09-16T12:40:42.165765Z", "shell.execute_reply": "2021-09-16T12:40:42.165284Z"}, "papermill": {"duration": 0.030454, "end_time": "2021-09-16T12:40:42.165867", "exception": false, "start_time": "2021-09-16T12:40:42.135413", "status": "completed"}, "tags": []}, "outputs": [], "source": ["def train_model(**kwargs):\n", " # Create a PyTorch Lightning trainer with the generation callback\n", " trainer = pl.Trainer(\n", " default_root_dir=os.path.join(CHECKPOINT_PATH, \"MNIST\"),\n", " gpus=1 if str(device).startswith(\"cuda\") else 0,\n", " max_epochs=60,\n", " gradient_clip_val=0.1,\n", " callbacks=[\n", " ModelCheckpoint(save_weights_only=True, mode=\"min\", monitor=\"val_contrastive_divergence\"),\n", " GenerateCallback(every_n_epochs=5),\n", " SamplerCallback(every_n_epochs=5),\n", " OutlierCallback(),\n", " LearningRateMonitor(\"epoch\"),\n", " ],\n", " progress_bar_refresh_rate=1,\n", " )\n", " # Check whether pretrained model exists. 
If yes, load it and skip training\n", " pretrained_filename = os.path.join(CHECKPOINT_PATH, \"MNIST.ckpt\")\n", " if os.path.isfile(pretrained_filename):\n", " print(\"Found pretrained model, loading...\")\n", " model = DeepEnergyModel.load_from_checkpoint(pretrained_filename)\n", " else:\n", " pl.seed_everything(42)\n", " model = DeepEnergyModel(**kwargs)\n", " trainer.fit(model, train_loader, test_loader)\n", " model = DeepEnergyModel.load_from_checkpoint(trainer.checkpoint_callback.best_model_path)\n", " # No testing as we are more interested in other properties\n", " return model"]}, {"cell_type": "code", "execution_count": 12, "id": "0d734155", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:40:42.214793Z", "iopub.status.busy": "2021-09-16T12:40:42.214331Z", "iopub.status.idle": "2021-09-16T12:40:42.228657Z", "shell.execute_reply": "2021-09-16T12:40:42.229038Z"}, "papermill": {"duration": 0.040314, "end_time": "2021-09-16T12:40:42.229150", "exception": false, "start_time": "2021-09-16T12:40:42.188836", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["GPU available: True, used: True\n"]}, {"name": "stderr", "output_type": "stream", "text": ["TPU available: False, using: 0 TPU cores\n"]}, {"name": "stderr", "output_type": "stream", "text": ["IPU available: False, using: 0 IPUs\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Found pretrained model, loading...\n"]}], "source": ["model = train_model(img_shape=(1, 28, 28), batch_size=train_loader.batch_size, lr=1e-4, beta1=0.0)"]}, {"cell_type": "markdown", "id": "3de610c0", "metadata": {"papermill": {"duration": 0.023634, "end_time": "2021-09-16T12:40:42.276465", "exception": false, "start_time": "2021-09-16T12:40:42.252831", "status": "completed"}, "tags": []}, "source": ["## Analysis\n", "\n", "In the last part of the notebook, we will try to take the trained energy-based generative model,\n", "and analyse its properties."]}, 
{"cell_type": "markdown", "id": "879c2039", "metadata": {"papermill": {"duration": 0.023472, "end_time": "2021-09-16T12:40:42.323822", "exception": false, "start_time": "2021-09-16T12:40:42.300350", "status": "completed"}, "tags": []}, "source": ["### TensorBoard\n", "\n", "The first thing we can look at is the TensorBoard generated during training.\n", "This can help us to understand the training dynamics even better, and reveal potential issues.\n", "Let's load the TensorBoard below:"]}, {"cell_type": "code", "execution_count": 13, "id": "c4ffadfc", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:40:42.374084Z", "iopub.status.busy": "2021-09-16T12:40:42.373589Z", "iopub.status.idle": "2021-09-16T12:40:42.375710Z", "shell.execute_reply": "2021-09-16T12:40:42.375247Z"}, "papermill": {"duration": 0.028238, "end_time": "2021-09-16T12:40:42.375807", "exception": false, "start_time": "2021-09-16T12:40:42.347569", "status": "completed"}, "tags": []}, "outputs": [], "source": ["# Uncomment the following two lines to open a tensorboard in the notebook.\n", "# Adjust the path to your CHECKPOINT_PATH if needed.\n", "# %load_ext tensorboard\n", "# %tensorboard --logdir ../saved_models/tutorial8/tensorboards/"]}, {"cell_type": "markdown", "id": "c7b8f333", "metadata": {"papermill": {"duration": 0.023692, "end_time": "2021-09-16T12:40:42.423585", "exception": false, "start_time": "2021-09-16T12:40:42.399893", "status": "completed"}, "tags": []}, "source": ["
"]}, {"cell_type": "markdown", "id": "e608ca53", "metadata": {"papermill": {"duration": 0.023833, "end_time": "2021-09-16T12:40:42.471015", "exception": false, "start_time": "2021-09-16T12:40:42.447182", "status": "completed"}, "tags": []}, "source": ["We see that the contrastive divergence as well as the regularization converge quickly to 0.\n", "However, the training continues although the loss is always close to zero.\n", "This is because our \"training\" data changes with the model by sampling.\n", "The progress of training can be best measured by looking at the samples across iterations,\n", "and the score for random images that decreases constantly over time."]}, {"cell_type": "markdown", "id": "a1184e57", "metadata": {"papermill": {"duration": 0.023719, "end_time": "2021-09-16T12:40:42.518253", "exception": false, "start_time": "2021-09-16T12:40:42.494534", "status": "completed"}, "tags": []}, "source": ["### Image Generation\n", "\n", "Another way of evaluating generative models is by sampling a few generated images.\n", "Generative models need to be good at generating realistic images as this truly shows that they have modeled the true data distribution.\n", "Thus, let's sample a few images from the model below:"]}, {"cell_type": "code", "execution_count": 14, "id": "f84da507", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:40:42.570336Z", "iopub.status.busy": "2021-09-16T12:40:42.569866Z", "iopub.status.idle": "2021-09-16T12:40:45.522168Z", "shell.execute_reply": "2021-09-16T12:40:45.521632Z"}, "papermill": {"duration": 2.980431, "end_time": "2021-09-16T12:40:45.522288", "exception": false, "start_time": "2021-09-16T12:40:42.541857", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["Global seed set to 43\n"]}], "source": ["model.to(device)\n", "pl.seed_everything(43)\n", "callback = GenerateCallback(batch_size=4, vis_steps=8, num_steps=256)\n", "imgs_per_step = 
callback.generate_imgs(model)\n", "imgs_per_step = imgs_per_step.cpu()"]}, {"cell_type": "markdown", "id": "96a6dec4", "metadata": {"papermill": {"duration": 0.260591, "end_time": "2021-09-16T12:40:45.862389", "exception": false, "start_time": "2021-09-16T12:40:45.601798", "status": "completed"}, "tags": []}, "source": ["The characteristic of sampling with energy-based models is that they require the iterative MCMC algorithm.\n", "To gain an insight in how the images change over iterations, we plot a few intermediate samples in the MCMC as well:"]}, {"cell_type": "code", "execution_count": 15, "id": "8a53c31a", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:40:46.095876Z", "iopub.status.busy": "2021-09-16T12:40:46.095395Z", "iopub.status.idle": "2021-09-16T12:40:46.738218Z", "shell.execute_reply": "2021-09-16T12:40:46.738604Z"}, "papermill": {"duration": 0.675706, "end_time": "2021-09-16T12:40:46.738750", "exception": false, "start_time": "2021-09-16T12:40:46.063044", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["/usr/local/lib/python3.9/dist-packages/torchvision/utils.py:50: UserWarning: range will be deprecated, please use value_range instead.\n", " warnings.warn(warning)\n"]}, {"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:40:46.157923\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}, {"name": "stderr", "output_type": "stream", "text": ["/usr/local/lib/python3.9/dist-packages/torchvision/utils.py:50: UserWarning: range will be deprecated, please use value_range instead.\n", " warnings.warn(warning)\n"]}, {"data": {"application/pdf": "JVBERi0xLjQKJazcIKu6CjEgMCBvYmoKPDwgL1BhZ2VzIDIgMCBSIC9UeXBlIC9DYXRhbG9nID4+CmVuZG9iago4IDAgb2JqCjw8IC9FeHRHU3RhdGUgNCAwIFIgL0ZvbnQgMyAwIFIgL1BhdHRlcm4gNSAwIFIKL1Byb2NTZXQgWyAvUERGIC9UZXh0IC9JbWFnZUIgL0ltYWdlQyAvSW1hZ2VJIF0gL1NoYWRpbmcgNiAwIFIKL1hPYmplY3QgNyAwIFIgPj4KZW5kb2JqCjExIDAgb2JqCjw8IC9Bbm5vdHMgMTAgMCBSIC9Db250ZW50cyA5IDAgUgovR3JvdXAgPDwgL0NTIC9EZXZpY2VSR0IgL1MgL1RyYW5zcGFyZW5jeSAvVHlwZSAvR3JvdXAgPj4KL01lZGlhQm94IFsgMCAwIDQ2NC4zIDk3LjI2MTM5NzA1ODggXSAvUGFyZW50IDIgMCBSIC9SZXNvdXJjZXMgOCAwIFIKL1R5cGUgL1BhZ2UgPj4KZW5kb2JqCjkgMCBvYmoKPDwgL0ZpbHRlciAvRmxhdGVEZWNvZGUgL0xlbmd0aCAxMiAwIFIgPj4Kc3RyZWFtCnichVXLbtswELzzK/bYHkpzH+SSxxhpjebm1kAPRQ6Fq6QOYgdOgub3u7JlhLJV6WCBGpMzs+RoifDgZlcI9y8Q4MF+b4CwgNl183ezbr4t5rB+ccHwrZMknm302I2KekrIRQ0Jvbc/zu2ccdrkhdHdOwxegdVHYY0tVVSP78BjB5Tgw4njsKQGjPTO7aFPJZK8QCQfUZNoiDnDcwM/YAezK2qrQqsKrarQq8pZVXtbrdDWFvmMdr2F2VeE6ydYuiXsT1zBSmr5gs8doyGOk0fOxLGusALFh65KN7ddeXN7ewb4FIyLyZeYo6gWQaD2zcTdfAWzL2imYHV32P3Vb/cTPuBHuIXVjfu8ckt3MOFy9KwcqdTiFTgmrsUHFIwiiHlSnOlSHY0/hZxJavkaHdNHyp6kiGSzKpMGkgwYyOzz0X9toEJHDah6yaJClp3p7S/p0gAx+9AeHtUGanTMABHbmsBSWgfT5095wEEmz2jZTz0HFTrqQMmrxiTM7XlNOkjh0gEz+thPf4eMR58sfqG0/0/KloHwcbZv9hidWrpCR+UVLXyJGJO1jkkHRAPpE7b+RIemUze3Ch1zIBQsfRgp2rfK0w5iL351jC3ulBSzCRVPmpHGiBbNrnn+9bp52sHmtRvVzAQ3x7vg0OX6N8F5I7/o0u77eXPfDjR3mzV5JZzmvK/7D9PS/QMFFmA7CmVuZHN0cmVhbQplbmRvYmoKMTIgMCBvYmoKNTI3CmVuZG9iagoxMCAwIG9iagpbIF0KZW5kb2JqCjE4IDAgb2JqCjw8IC9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9MZW5ndGggMjQ3ID4+CnN0cmVhbQp4nE1RSW7EMAy7+xX8wACWrMV5T4pBD+3/ryUdFO3BECNLXOLuxEQWXrZQ10KH48NGXgmbge+D1pz4GrHiP9pGpJU/VFsgEzFRJHRRNxr3SDe8CtF+pIJXqvdY8xF3K81bOnaxv/fBtOaRKqtCPOTYHNlIWtdE0fE9tN5zQ3TKIIE+NyEHRGmOXoWkv/bDdW00u7U2syeqg0
emhPJJsxqa0ylmyGyox20qVjIKN6qMivtURloP8jbOMoCT44QyWk92rCai/NQnl5AXE3HCLjs7FmITCxuHtB+VPrH8fOvN+JtpraWQcUEiNMWl32e8x+d4/wCVT1wmCmVuZHN0cmVhbQplbmRvYmoKMTkgMCBvYmoKPDwgL0ZpbHRlciAvRmxhdGVEZWNvZGUgL0xlbmd0aCAzMDcgPj4Kc3RyZWFtCnicPZJLbgMxDEP3PoUuEMD62Z7zpCi6mN5/2ycl6Yoc2RZFapa6TFlTHpA0k4R/6fBwsZ3yO2zPZmbgWqKXieWU59AVYu6ifNnMRl1ZJ8XqhGY6t+hRORcHNk2qn6sspd0ueA7XJp5b9hE/vNCgHtQ1Lgk3dFejZSk0Y6r7f9J7/Iwy4GpMXWxSq3sfPF5EVejoB0eJImOXF+fjQQnpSsJoWoiVd0UDQe7ytMp7Ce7b3mrIsgepmM47KWaw63RSLm4XhyEeyPKo8OWj2GtCz/iwKyX0SNiGM3In7mjG5tTI4pD+3o0ES4+uaCHz4K9u1i5gvFM6RWJkTnKsaYtVTvdQFNO5w70MEPVsRUMpc5HV6l/DzgtrlmwWeEr6BR6j3SZLDlbZ26hO76082dD3H1rXdB8KZW5kc3RyZWFtCmVuZG9iagoyMCAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDI0OSA+PgpzdHJlYW0KeJw9UDuORCEM6zmFL/Ak8iNwHkarLWbv364DmilQTH62MyTQEYFHDDGUr+MlraCugb+LQvFu4uuDwiCrQ1IgznoPiHTspjaREzodnDM/YTdjjsBFMQac6XSmPQcmOfvCCoRzG2XsVkgniaoijuozjimeKnufeBYs7cg2WyeSPeQg4VJSicmln5TKP23KlAo6ZtEELBK54GQTTTjLu0lSjBmUMuoepnYifaw8yKM66GRNzqwjmdnTT9uZ+Bxwt1/aZE6Vx3QezPictM6DORW69+OJNgdNjdro7PcTaSovUrsdWp1+dRKV3RjnGBKXZ38Z32T/+Qf+h1oiCmVuZHN0cmVhbQplbmRvYmoKMjEgMCBvYmoKPDwgL0ZpbHRlciAvRmxhdGVEZWNvZGUgL0xlbmd0aCAzOTUgPj4Kc3RyZWFtCnicPVJLbsVACNvnFFyg0vCbz3lSVd28+29rQ1KpKryJMcYwfcqQueVLXRJxhcm3Xq5bPKZ8LltamXmIu4uNJT623JfuIbZddC6xOB1H8gsynSpEqM2q0aH4QpaFB5BO8KELwn05/uMvgMHXsA244T0yQbAk5ilCxm5RGZoSQRFh55EVqKRQn1nC31Hu6/cyBWpvjKULYxz0CbQFQm1IxALqQABE7JRUrZCOZyQTvxXdZ2IcYOfRsgGuGVRElnvsx4ipzqiMvETEPk9N+iiWTC1Wxm5TGV/8lIzUfHQFKqk08pTy0FWz0AtYiXkS9jn8SPjn1mwhhjpu1vKJ5R8zxTISzmBLOWChl+NH4NtZdRGuHbm4znSBH5XWcEy0637I9U/+dNtazXW8cgiiQOVNQfC7Dq5GscTEMj6djSl6oiywGpq8RjPBYRAR1vfDyAMa/XK8EDSnayK0WCKbtWJEjYpscz29BNZM78U51sMTwmzvndahsjMzKiGC2rqGautAdrO+83C2nz8z6KJtCmVuZHN0cmVhbQplbmRvYmoKMjIgMCBvYmoKPDwgL0ZpbHRlciAvRmxhdGVEZWNvZGUgL0xlbmd0aCAyNDkgPj4Kc3RyZWFtCnicTVFJigMwDLvnFfpAIV6TvKdDmUPn/9fKDoU5BAmvkpOWmFgLDzGEHyw9+JEhczf9G36i2btZepLJ2f+Y5yJTUfhSqC5iQl2IG8+hEfA9oWsSWbG98Tkso5lzvgcfhbgEM6EBY31JMrmo5pUhE04MdRwOWqTCuGtiw+Ja0TyN3G77RmZlJoQNj2RC3BiAiCDrArIYLJQ2NhMyWc4D7Q3JDV
pg16kbUYuCK5TWCXSiVsSqzOCz5tZ2N0Mt8uCoffH6aFaXYIXRS/VYeF+FPpipmXbukkJ64U07IsweCqQyOy0rtXvE6m6B+j/LUvD9yff4Ha8PzfxcnAplbmRzdHJlYW0KZW5kb2JqCjIzIDAgb2JqCjw8IC9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9MZW5ndGggOTQgPj4Kc3RyZWFtCnicRY3BEcAgCAT/VEEJCgraTyaTh/b/jRAyfGDnDu6EBQu2eUYfBZUmXhVYB0pj3FCPQL3hci3J3AUPcCd/2tBUnJbTd2mRSVUp3KQSef8OZyaQqHnRY533C2P7IzwKZW5kc3RyZWFtCmVuZG9iagoyNCAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDcyID4+CnN0cmVhbQp4nDMyt1AwULA0ARKGFiYK5mYGCimGXEC+qYm5Qi4XSAzEygGzDIC0JZyCiGeAmCBtEMUgFkSxmYkZRB2cAZHL4EoDACXbFskKZW5kc3RyZWFtCmVuZG9iagoyNSAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDE2MyA+PgpzdHJlYW0KeJxFkDsSAyEMQ3tOoSP4IwM+z2YyKTb3b2PYbFLA01ggg7sTgtTagonogoe2Jd0F760EZ2P86TZuNRLkBHWAVqTjaJRSfbnFaZV08Wg2cysLrRMdZg56lKMZoBA6Fd7touRypu7O+UNw9V/1v2LdOZuJgcnKHQjN6lPc+TY7orq6yf6kx9ys134r7FVhaVlLywm3nbtmQAncUznaqz0/Hwo69gplbmRzdHJlYW0KZW5kb2JqCjI2IDAgb2JqCjw8IC9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9MZW5ndGggMzIyID4+CnN0cmVhbQp4nDVRu23FMAzsNQUXMCB+Jc3jIEiRt3+bO9qpSNO8H1VeMqVcLnXJKllh8qVDdYqmfJ5mpvwO9ZDjmB7ZIbpT1pZ7GBaWiXlKHbGaLPdwCza+AJoScwvx9wjwK4BRwESgbvH3D7pZEkAaFPwU6JqrllhiAg2Lha3ZFeJW3SlYuKv4diS5BwlyMVnoUw5Fiim3wHwZLNmRWpzrclkK/259AhphhTjss4tE4HnAA0wk/mSAbM8+W+zq6kU2doY46dCAi4CbzSQBQVM4qz64Yftqu+bnmSgnODnWr6Ixvg1O5ktS3le5x8+gQd74Mzxnd45QDppQCPTdAiCH3cBGhD61z8AuA7ZJu3djSvmcZCm+BDYK9qhTHcrwYuzMVm/Y/MfoymZRbJCV9dHpDsrcoBNiHm9koVuytvs3D7N9/wFfGXtkCmVuZHN0cmVhbQplbmRvYmoKMjcgMCBvYmoKPDwgL0ZpbHRlciAvRmxhdGVEZWNvZGUgL0xlbmd0aCAyMTggPj4Kc3RyZWFtCnicPVC5jQQxDMtdhRpYwHrtqWcWi0um//RI+fYi0RZFUio1mZIpL3WUJVlT3jp8lsQOeYblbmQ2JSpFL5OwJffQCvF9ieYU993VlrNDNJdoOX4LMyqqGx3TSzaacCoTuqDcwzP6DW10A1aHHrFbINCkYNe2IHLHDxgMwZkTiyIMSk0G/65yj59eixs+w/FDFJGSDuY1/1j98nMNr1OPJ5Fub77iXpypDgMRHJKavCNdWLEuEhFpNUFNz8BaLYC7t17+G7QjugxA9onEcZpSjqG/a3Clzy/lJ1PYCmVuZHN0cmVhbQplbmRvYmoKMjggMCBvYmoKPDwgL0ZpbHRlciAvRmxhdGVEZWNvZGUgL0xlbmd0aCA4MyA+PgpzdHJlYW0KeJxFjLsNwDAIRHumYAR+JvY+UZTC3r8NECVuuCfdPVwdCZkpbjPDQwaeDCyGXXGB9JYwC1xHUI6d7KNh1b7qBI31plLz7w+Unuys4obrAQJCGmYKZW5kc3RyZWFtCmVuZG9iagoyOSAwIG9iag
o8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDE2MCA+PgpzdHJlYW0KeJxFkDkSAzEIBHO9gidIXIL3rMu1wfr/qQfWR6LpAjQcuhZNynoUaD7psUahutBr6CxKkkTBFpIdUKdjiDsoSExIY5JIth6DI5pYs12YmVQqs1LhtGnFwr/ZWtXIRI1wjfyJ6QZU/E/qXJTwTYOvkjH6GFS8O4OMSfheRdxaMe3+RDCxGfYJb0UmBYSJsanZvs9ghsz3Ctc4x/MNTII36wplbmRzdHJlYW0KZW5kb2JqCjMwIDAgb2JqCjw8IC9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9MZW5ndGggMzIwID4+CnN0cmVhbQp4nDVSS24FMQjbzym4QKXwT87zqqqLvvtvaxO9FUwwYOMpL1nSS77UJdulw+RbH/clsULej+2azFLF9xazFM8tr0fPEbctCgRREz1YmS8VItTP9Og6qHBKn4FXCLcUG7yDSQCDavgHHqUzIFDnQMa7YjJSA4Ik2HNpcQiJciaJf6S8nt8nraSh9D1Zmcvfk0ul0B1NTugBxcrFSaBdSfmgmZhKRJKX632xQvSGwJI8PkcxyYDsNoltogUm5x6lJczEFDqwxwK8ZprVVehgwh6HKYxXC7OoHmzyWxOVpB2t4xnZMN7LMFNioeGwBdTmYmWC7uXjNa/CiO1Rk13DcO6WzXcI0Wj+GxbK4GMVkoBHp7ESDWk4wIjAnl44xV7zEzkOwIhjnZosDGNoJqd6jonA0J6zpWHGxx5a9fMPVOl8hwplbmRzdHJlYW0KZW5kb2JqCjMxIDAgb2JqCjw8IC9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9MZW5ndGggMTggPj4Kc3RyZWFtCnicMza0UDCAwxRDrjQAHeYDUgplbmRzdHJlYW0KZW5kb2JqCjMyIDAgb2JqCjw8IC9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9MZW5ndGggMTMzID4+CnN0cmVhbQp4nEWPSw4EIQhE95yijsDHH+dxMumFc//tgJ1uE2M9hVSBuYKhPS5rA50VHyEZtvG3qZaORVk+VHpSVg/J4Iesxssh3KAs8IJJKoYhUIuYGpEtZW63gNs2DbKylVOljrCLozCP9rRsFR5folsidZI/g8QqL9zjuh3Ipda73qKLvn+kATEJCmVuZHN0cmVhbQplbmRvYmoKMzMgMCBvYmoKPDwgL0ZpbHRlciAvRmxhdGVEZWNvZGUgL0xlbmd0aCAzNDAgPj4Kc3RyZWFtCnicNVI5bgQxDOv9Cn0ggG7b79kgSJH8vw2p2RQDcXRSlDtaVHbLh4VUtex0+bSV2hI35HdlhcQJyasS7VKGSKi8ViHV75kyr7c1ZwTIUqXC5KTkccmCP8OlpwvH+baxr+XIHY8eWBUjoUTAMsXE6BqWzu6wZlt+lmnAj3iEnCvWLcdYBVIb3TjtiveheS2yBoi9mZaKCh1WiRZ+QfGgR4199hhUWCDR7RxJcIyJUJGAdoHaSAw5eyx2UR/0MygxE+jaG0XcQYElkpg5xbp09N/40LGg/tiMN786KulbWllj0j4b7ZTGLDLpelj0dPPWx4MLNO+i/OfVDBI0ZY2Sxget2jmGoplRVni3Q5MNzTHHIfMOnsMZCUr6PBS/jyUTHZTI3w4NoX9fHqOMnDbeAuaiP20VBw7is8NeuYEVShdrkvcBqUzogen/r/G1vtfXHx3tgMYKZW5kc3RyZWFtCmVuZG9iagozNCAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDI1MSA+PgpzdHJlYW0KeJwtUUlyA0EIu88r9IRmp99jlyuH5P/XCMoHBg2LQHRa4qCMnyAsV7zlkatow98zMYLfBYd+K9dtWORAVCBJY1A1oXbxevQe2HGYCcyT1rAMZqwP/Iwp3OjF4TEZZ7fXZdQQ7F2vPZlByaxcxCUTF0zVYSNnDj
+ZMi60cz03IOdGWJdhkG5WGjMSjjSFSCGFqpukzgRBEoyuRo02chT7pS+PdIZVjagx7HMtbV/PTThr0OxYrPLklB5dcS4nFy+sHPT1NgMXUWms8kBIwP1uD/VzspPfeEvnzhbT43vNyfLCVGDFm9duQDbV4t+8iOP7jK/n5/n8A19gW4gKZW5kc3RyZWFtCmVuZG9iagozNSAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDIxNSA+PgpzdHJlYW0KeJw1UTkOAyEM7PcV/kAkjC94T6Iozf6/zYzRVh7BXIa0lCGZ8lKTqCHlUz56mS6cutzXzGo055a0LXOAuLa8L62SwIlmiIPBaZi4AZo8AUPX0ahRQxce0NSlUyiw3AQ+irduD91jtYGXtiHniSBiKBksQc2pRRMWbc8npDW/Xosb3pft3chTpcaWGIEGAVY4HNfo1/CVPU8m0XQVMtSrNcsYCRNFIjz5jqbVE+taNNIyEtTGEaxqA7w7/TBOAAATccsCZJ9KlLPkxG+x9LMGV/r+AZ9HVJYKZW5kc3RyZWFtCmVuZG9iagoxNiAwIG9iago8PCAvQmFzZUZvbnQgL0RlamFWdVNhbnMgL0NoYXJQcm9jcyAxNyAwIFIKL0VuY29kaW5nIDw8Ci9EaWZmZXJlbmNlcyBbIDMyIC9zcGFjZSA0OCAvemVybyAvb25lIC90d28gL3RocmVlIC9mb3VyIC9maXZlIC9zaXggNTYgL2VpZ2h0IC9uaW5lIDcxCi9HIDk3IC9hIDEwMSAvZSAxMDUgL2kgMTEwIC9uIC9vIDExNCAvciAxMTYgL3QgXQovVHlwZSAvRW5jb2RpbmcgPj4KL0ZpcnN0Q2hhciAwIC9Gb250QkJveCBbIC0xMDIxIC00NjMgMTc5NCAxMjMzIF0gL0ZvbnREZXNjcmlwdG9yIDE1IDAgUgovRm9udE1hdHJpeCBbIDAuMDAxIDAgMCAwLjAwMSAwIDAgXSAvTGFzdENoYXIgMjU1IC9OYW1lIC9EZWphVnVTYW5zCi9TdWJ0eXBlIC9UeXBlMyAvVHlwZSAvRm9udCAvV2lkdGhzIDE0IDAgUiA+PgplbmRvYmoKMTUgMCBvYmoKPDwgL0FzY2VudCA5MjkgL0NhcEhlaWdodCAwIC9EZXNjZW50IC0yMzYgL0ZsYWdzIDMyCi9Gb250QkJveCBbIC0xMDIxIC00NjMgMTc5NCAxMjMzIF0gL0ZvbnROYW1lIC9EZWphVnVTYW5zIC9JdGFsaWNBbmdsZSAwCi9NYXhXaWR0aCAxMzQyIC9TdGVtViAwIC9UeXBlIC9Gb250RGVzY3JpcHRvciAvWEhlaWdodCAwID4+CmVuZG9iagoxNCAwIG9iagpbIDYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwCjYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwIDYwMCA2MDAgMzE4IDQwMSA0NjAgODM4IDYzNgo5NTAgNzgwIDI3NSAzOTAgMzkwIDUwMCA4MzggMzE4IDM2MSAzMTggMzM3IDYzNiA2MzYgNjM2IDYzNiA2MzYgNjM2IDYzNiA2MzYKNjM2IDYzNiAzMzcgMzM3IDgzOCA4MzggODM4IDUzMSAxMDAwIDY4NCA2ODYgNjk4IDc3MCA2MzIgNTc1IDc3NSA3NTIgMjk1CjI5NSA2NTYgNTU3IDg2MyA3NDggNzg3IDYwMyA3ODcgNjk1IDYzNSA2MTEgNzMyIDY4NCA5ODkgNjg1IDYxMSA2ODUgMzkwIDMzNwozOTAgODM4IDUwMCA1MDAgNjEzIDYzNSA1NTAgNjM1IDYxNSAzNTIgNjM1IDYzNCAyNzggMjc4IDU3OSAyNzggOT
c0IDYzNCA2MTIKNjM1IDYzNSA0MTEgNTIxIDM5MiA2MzQgNTkyIDgxOCA1OTIgNTkyIDUyNSA2MzYgMzM3IDYzNiA4MzggNjAwIDYzNiA2MDAgMzE4CjM1MiA1MTggMTAwMCA1MDAgNTAwIDUwMCAxMzQyIDYzNSA0MDAgMTA3MCA2MDAgNjg1IDYwMCA2MDAgMzE4IDMxOCA1MTggNTE4CjU5MCA1MDAgMTAwMCA1MDAgMTAwMCA1MjEgNDAwIDEwMjMgNjAwIDUyNSA2MTEgMzE4IDQwMSA2MzYgNjM2IDYzNiA2MzYgMzM3CjUwMCA1MDAgMTAwMCA0NzEgNjEyIDgzOCAzNjEgMTAwMCA1MDAgNTAwIDgzOCA0MDEgNDAxIDUwMCA2MzYgNjM2IDMxOCA1MDAKNDAxIDQ3MSA2MTIgOTY5IDk2OSA5NjkgNTMxIDY4NCA2ODQgNjg0IDY4NCA2ODQgNjg0IDk3NCA2OTggNjMyIDYzMiA2MzIgNjMyCjI5NSAyOTUgMjk1IDI5NSA3NzUgNzQ4IDc4NyA3ODcgNzg3IDc4NyA3ODcgODM4IDc4NyA3MzIgNzMyIDczMiA3MzIgNjExIDYwNQo2MzAgNjEzIDYxMyA2MTMgNjEzIDYxMyA2MTMgOTgyIDU1MCA2MTUgNjE1IDYxNSA2MTUgMjc4IDI3OCAyNzggMjc4IDYxMiA2MzQKNjEyIDYxMiA2MTIgNjEyIDYxMiA4MzggNjEyIDYzNCA2MzQgNjM0IDYzNCA1OTIgNjM1IDU5MiBdCmVuZG9iagoxNyAwIG9iago8PCAvRyAxOCAwIFIgL2EgMTkgMCBSIC9lIDIwIDAgUiAvZWlnaHQgMjEgMCBSIC9maXZlIDIyIDAgUiAvZm91ciAyMyAwIFIKL2kgMjQgMCBSIC9uIDI1IDAgUiAvbmluZSAyNiAwIFIgL28gMjcgMCBSIC9vbmUgMjggMCBSIC9yIDI5IDAgUgovc2l4IDMwIDAgUiAvc3BhY2UgMzEgMCBSIC90IDMyIDAgUiAvdGhyZWUgMzMgMCBSIC90d28gMzQgMCBSIC96ZXJvIDM1IDAgUgo+PgplbmRvYmoKMyAwIG9iago8PCAvRjEgMTYgMCBSID4+CmVuZG9iago0IDAgb2JqCjw8IC9BMSA8PCAvQ0EgMCAvVHlwZSAvRXh0R1N0YXRlIC9jYSAxID4+Ci9BMiA8PCAvQ0EgMSAvVHlwZSAvRXh0R1N0YXRlIC9jYSAxID4+ID4+CmVuZG9iago1IDAgb2JqCjw8ID4+CmVuZG9iago2IDAgb2JqCjw8ID4+CmVuZG9iago3IDAgb2JqCjw8IC9JMSAxMyAwIFIgPj4KZW5kb2JqCjEzIDAgb2JqCjw8IC9CaXRzUGVyQ29tcG9uZW50IDgKL0NvbG9yU3BhY2UgWy9JbmRleGVkIC9EZXZpY2VSR0IgMjU1ICj////+/v79/f38/Pz7+/v6+vr5+fn4+Pj39/f29vb19fX09PTz8/Py8vLx8fHw8PDv7+/u7u7t7e3s7Ozr6+vq6urp6eno6Ojn5+fm5ubl5eXk5OTj4+Pi4uLh4eHg4ODf39/e3t7d3d3c3Nzb29va2trZ2dnY2NjX19fW1tbV1dXU1NTT09PS0tLR0dHQ0NDPz8/Ozs7Nzc3MzMzLy8vKysrJycnIyMjHx8fGxsbFxcXExMTDw8PCwsLBwcHAwMC/v7++vr69vb28vLy7u7u6urq5ubm4uLi3t7e2tra1tbW0tLSzs7OysrKxsbGwsLCvr6+urq6tra2srKyrq6uqqqqpqamoqKinp6empqalpaWkpKSjo6OioqKhoaGgoKCfn5+enp6dnZ2cnJybm5uampqZmZmYmJiXl5eWlpaVlZWUlJSTk5OSkpKRkZGQkJCPj4+Ojo6NjY2MjIyLi4uKioqJiYmIiIiHh4eGhoaFhYWEhISDg4OCgoKBgYGAgIB/f39+fn
59fX18fHx7e3t6enp5eXl4eHh3d3d2dnZ1dXV0dHRzc3NycnJxcXFwcHBvb29ubm5tbW1sbGxra2tqamppaWloaGhnZ2dmZmZlZWVkZGRjY2NiYmJhYWFgYGBfX19eXl5dXV1cXFxcXFxbW1taWlpZWVlYWFhXV1dWVlZVVVVUVFRTU1NSUlJRUVFQUFBPT09OTk5NTU1MTExLS0tKSkpJSUlISEhHR0dGRkZFRUVERERDQ0NCQkJBQUFAQEA/Pz8+Pj49PT08PDw7Ozs6Ojo5OTk4ODg3Nzc2NjY1NTU0NDQzMzMyMjIxMTEwMDAvLy8uLi4tLS0sLCwrKysqKipcKVwpXClcKFwoXCgnJycmJiYlJSUkJCQjIyMiIiIhISEgICAfHx8eHh4dHR0cHBwbGxsaGhoZGRkYGBgXFxcWFhYVFRUUFBQTExMSEhIREREQEBAPDw8ODg5cclxyXHIMDAwLCwtcblxuXG4JCQkICAgHBwcGBgYFBQUEBAQDAwMCAgIBAQEAAAApXQovRGVjb2RlUGFybXMgPDwgL0NvbG9ycyAxIC9Db2x1bW5zIDQ0NyAvUHJlZGljdG9yIDEwID4+Ci9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9IZWlnaHQgNTMgL0xlbmd0aCAzNiAwIFIgL1N1YnR5cGUgL0ltYWdlCi9UeXBlIC9YT2JqZWN0IC9XaWR0aCA0NDcgPj4Kc3RyZWFtCnic7ZwJNFVf28CdcyfzPIuMkRQqZCikookMlQwpUyGUMYmuIVJK5gwlQ2VqQkQZylSKiNAgSYUGlDLf6zsXdzqXv/retd73/b7Vs8q6+9z9nL3P/u3n2Xs/e59Lh/0r/5eF7j9dgb/yLwndf7oCf+VfEjrov6PlBg1l/3B7bGJSUrzj9uQb94+bObm4JmWFH1APjbFKbH1aElrQ5OPkfL3hQpCDDxZ7pe1PJB+LjWj+E4XHwdjAqj9RaI3BYq//UZ1ysNjYVkgRkt+5f2tbZQA2uG728+9otDWfxWILpj8R/8AykD8RKgH9S8dik2m+halM17d15lPb/Vl+hyxWrZALv+QYlnXjRqbL5oziWv/dbq72aUUXD8mHRm9N+Pz1+YnKfjdbr4c9SScsPLHYwqk/kSdYbNzEnyh8PYkN/PAnCviLWOzDP6pTBRabgv8ThfeB2JBvf6IwDvWp+pmPCxY0k6EAi82aTc+vQflN+yy/0sfYjJcDg62PS1++bmhuCnQyTqz+WGRzLHqw477L9qVaFk0V8n4FZscHShPs9hgc+S/n91tYyPzwuN8qgswPN/ZbGmR++JHx+TJRgSLzGxmmzTmHctssv7KnIYnFpfeuJ5+7ev12WnxKPDa36kGas53z9dwMCz1TG9fiAqdTCevNChNP+R6x9v4v5vcPHZdaiPxw45M0NOYkSuI3OjoOKwSHm5yjXBK/seHxSXgBY3O1B5Hf5PDIGExhYmxsjicj2t+diuCjzlbmFvraRlb+esuaPrVW5h/18t+qrGbgqLP16tW0+IzmNG9RiS12PhlJAdj/Yn64ibkAznFtlh9+4geNNeEn4YAI0j3LD//tO1xhfGxknBY5id/AZ9jtIBoDP+eoJpHfcO8oTGPy5/fvc/QRIr+L2fnHVZwcRfenx2K3amtdruiJd/KMqXXZvGOz1plrRWf27jDYecjvgPVen/MtT26c+8/ym5zLk5D8J82Xk2M/f83RuiT7g+PDTwx96/sxQqNA5Dc1BqOLn+zvfdc7QFME2f7gN8MPfGjvHBiDK5D4TfyC2evEj3etzX0/5uUXHlfkI+3rx2VblHNeV2fjqezOICPPxBdehnb68pcf3PFWVVZStg4KO255Mr25vihyPn7jQ58/9/X0fh78Sd1g8/KbHO3t6fnU2z8Cq9m8/CZHPnV1dn0Y+AW7Pu/8BffrU2vzi46+n/BnJ/KD+0r8UN+zupqmjp/wCpP4wcwA/+trfdW9qvrBUZgCiR+Ougj8eP
/zsvySuk80YxyRH9yJ4L6+vncrt7J9GN5HiPysjPft3l5as3uTRlhqvs1yr+BTXs5Hj3oYG+ceV3by9VmH0XW5d+3ClQCZ1NdmFr7+8/CbeJ3tcMDGxNIx9nor1UxtXn69j8xNjPX3hFTC/MW8/HpqjBTXqK8Ph5c/Jz88Ho8bLLbhkJJb5ZkD91dE/wl3VMNFwez8opLbr3fBFLrnnH/iJ0cqIyXYufmk0uphX1HMP6k0Rl5H67CysnFgK+CzGvL8hUomvl+wYWFhYTWsgJdP5LfXYLve+qJSzQ36praBbrbme8yO+JqZ7bc4WBKmczJ8mxyHR0SC114PT5eiVyEh8aGU/MZ+tFRfv5YaF5cQF+m/T0VltexqTRNr/2t1A+T+SMuv/2luclxsTIib/DJZaXl9j9hbjym/puWHH2zJSoyJOXlkKY/AIlFDl7SyFsqnn4vfz9tpMdFnHJUQrJy82nap97upjHau9UNVbmxUxMHNIIaZdenBmII+KoW5+L25kxQd4WrIAqIxbDYhd3qovpyL3/f712Ij/A3FABBEGvgVtlJ/Owc/3NPCuKjwnUoAJCt8ch5TO1YiP2ujtUoKmTn8G934WJUCbyuLSxw6o6C0wzm4Nn7nzWxeAambBeZyTPI2z5ubG59Wx1LyG+yM91CXE0WimJF0M0LPjgQZ9LAUJkjDD/8iSI0bCQIzgmBiYt3gT9mYtPzGX8UpsgJEYeAQs73wg/KGtPzw3boSUAkgiIAUUEzye0s+UX49B7/JI2sQxBJQHMu3PqZSmIMfPlufa0YDKoV76fZqqhvOxe/N3hWo6fwAiOCRMk2mrsEc/MaCDVHEdmISMfSjHkqJ/AoLlmz0qa7z2a2qo7XSJVpaxsjRNznUUm/H7XOmx4K8HfdqKgiISmtsNDyZ/eXHYDolvzteGjLszAxQfYBZfgiohggeGceLpDwwfn1NztuWsKNBEg4EAsm1KqCBnIOGX9EZEyUWJFkBxSC65nozRUvC+b27fsyMh5HQrkgkAmotJIvoplv9FM0F5zdSe/nwUjYoP4hkYmRAIlGsAqYXKO9Iw6+3MWg7LwaqO5qNg50BiWEVNAujHNJo+E0MpXuKsiEAEMMlyMtBz8AstCn0LWUGWn51scqCUJ0YOcWFeOnpGUVUImsovybyq2+U1gusrL90aJ2pkZzd6TXaHg6OORectdRjg2ycfS6e91+EAAQVjAx13ONfvOu9TOaHH4nX42cikqMQEKPqRZrZUfPDN2Up8M10WwQSBAkYIQVuvSsfSc4Bxm/s69mdImwEBTQjBg0JRATNFXhrgORC4fxG605oi0N3RqDZ2ViYGJkwSICe/0zjMNn9wPn9SDusxAIASAwbJz8vNwcrGomWcemhmJPQ8GvK3boEcoMYdoHFoiL83AwYzHKTdxTDLA2/wdfuG+mRIIpZWHr5EnEhNgaUuGH1EEUGOL/Jb9es+VAA1FllVeWXCvMyswhYZVBOYoj8sq+brhXHpuYWP/DUZ7WIv15c76goa5q5R1neMjE84nZJ2RougGd55uOe3BMrtA77kvn9bDi0CAXMwQ9q6g1viB6Oih9u2H8FZsb2QA5uBnoMGknQB9GKZl/m4fcyTJWVABxEi6yRFhUSWcyCgVpaYmv863n4TTw/L8tKwEfPb7hBebmC5hIuFAKU39VEKoGG36dtS+kh02DmMzLT09E00BFjAZAyB5vm54cP1WeBfAhacLPrboNN5tZyAgCDUEDxP/B7cFSGDQEiBNWCXPeZ7vfaJIOk5wkoohjR4Pz6Io0EoCI4l5wIdrO38bVV40Tx2dVQjBtEfj7ex4+6Z2fbOLkbaQpvsvMLDNmtud27zHq9V/D5gOCriWedzLQsvTKKGu8krdW2pIh/fjiziQ1BwIVk4l21ydVSa6uuhBA3BvKlAKjzkehNqPh9ubOTF/oezapq7O7r5+3laWuqIcUJNZ3oht65+Q2VGoqiARSLtrlHUNSp4ICgoAOGUm
wgh5IvqXlh/H5esBNjRjLJWxw5kZoQGX4uLsRTZTEgtCavbT5+TTlaEmimRXtdT6ReTboQl5JwUl+WXlCneJCUB8bv8xNXHWYG5h0HA5LzMlISr+accZDnYt+dMi+/8c7MgxJszGq2/tFleVnpWYWJAUqijHvCKaZhMH5D7Vg9HmbR/Z6h98ryc7OLc6O3yLBsjKAYlYn8tFSvPuzouotBMUjKrVwmraYsrW0SkP7C0fDFnROubrGuWzLzIwqbLsRl3i+zNDQkxz/xjaoC04aEYBRY5Z4y1nQ+K3WHpjwHhmBRGweJVaPkh2+2kSZ4TjZxYl99/SB051LIoLhXfpyTH+59MhcGQLCKRD2edR34tpvG4gC4eG/tPPy+Gq5axMa8yPEJ0TtNDHhuABgEz5bPxy/eWkWckV+z8TPpyuW9bCyLLr4heSsYv8ZwUw0OTqH8btKV+kMSaNlA8j1h/IaKwi0leRYFvp1uFUK2fk9tYNkeiiETxq+72m09P//m9gHSlchdaHF9ikkrkd/tsuggNwfz5VvsJaV2m+zOjtPbuC0u9aqxZpqz6Go1JTnp9Pyws2f3+T332lr8pCWRyA9fEc6JIfDbERSXU9/Ri//54XNvS3We6SoCP6G9D2aLoeA3WXpGmh0A5E/nPX7XP3NpZPB94RlhNIDmuUAcnKn4DZ82ZWPmD7n66CPJcwz31ZmzgIwi2cSHp+b3ttxEU8EvvfrVD6Jzwk92JDCiGZSDSHmo+eFSPXZ4ZFY0/iRbQ2+tEAajd5TUvDB+rYlHDucW13wlj5BDr/VAVq1T74hpGL+fpcnHb5VXd5JjFROvgwGWpRfJeWD8OmvP59RUPx8mTx26CpmYBFOaSHcg8qtp8TnsqKVq6HhCTcP9sFteirmRSeSlTCfzRHvhNesUlDVz8jyPY03cnx3Sqv/0K4PID5fphgKhBYOg371n78nP0R1mtZiVjo5Z5vrsFQp+44kHODBIKcvKrxQVneoo1hSG5sceubNpSn5jnw9t4JXTLe+kVJgc8pdFI+hj3hMtkopfe7GtuVneG+poxX0pVgS/0wjxIoxf3lnP9PfUEZQvKzmBpSak+QWMX+etyPgPsIiWFTtKxrKFmILxG6nLS/4wShX8m0xhxfAdKyGl4fb3PLeNOsAw2cbHQB9yn/RgRH4njiz2+Ki65G70oaScklupSpongoPMIkdHv1fdTEhJy6zqbM0Wd8087BqSUXD5+uM4Ir/JRFsQsjSZ0EYcZTH4iY+X9ejoUGzpsxco+I3sVUQhuGp6YSGlsYJjhBnPqdk0Jb+OsgMGa4pGcbDFWm08NwBYJs6aBzW/gXfZVWPwMGlHxGqQbdez77NJmP/88mkUrvDz5HZASIdk8zB++MkJeKgcF22CEdYlLYPg8xfcJI3C3a28HPtySGkYPzweXiV81wYxhONlGn5u+7iMc/TUT4cGXUm2T34QevJCXIT5+eGO+huFD/wcDme+e35Vwi7ew8EyvjD+XHAAyf7SD4HQTFOtsg9Wr/6K3XR0GIFrs2lKfnvkkGzSr+ChP9zTcwAd/c7Y2SQlv84H9hY2T6bg0nqdj47O/e5sEBjG70NzN43Ch2trQRbLj0Qbg/Ebpt0P+JVkCfBrzsdvDsFnODEIaD4lJueJn1HIZIX1IrZdV0npeeJnFPJx1zLQKoY0ZSXyO2jEpHjAfJfh0UtZQZiAtx9bb15Ltor4evdyXPHHnTJywa+fpMqaB/rYrgnJO++q7kTid8Mb4gdug5cyOvjaho6OSZroDin57ZZFLFrbB9fAdVwE6BidicAp+XXX2jtFv4YrTL0rhWZO5zpmHwXGD2be0/K5WAdksSclF95/H77uCPBq/AG/qXx/Rr41dcTUwvwmHnmLsWy/TEovzK/HXgk0CaPhdypgy6GLtxKl3Uq2KChqGaadVk58Guu17WLF/ZRjCacX+768dMbP51jGnSe3UmK9dZxJ889v+Qg6kHPXd+pALL7q4hYxOj
rpEOL0npKf3dpF66zh7TD8SV8CoON4RBwUKfn96rtV0klrHUGyaACRRrQman6Tc2x3T96TZUPwuZDSC/Kb+KTGD0jqzzf+0cr4oK0wQtyYtKZZkB/ua6IQA7dzPunCgvz6H4mxII5co/GfgVj3c/lNRdIuBbpqVurSIa68YZWhtkoXa/PjPa9f5ndrOBccc8ypoGnkcfZZLyM38vqvhhkJcuk9bHrV/Y3c5XGXXYWY6ehW3SaG8Cn4jR43ktCxaf86QmUh7+4vpqND8JGcHiW/iV819b3wvZlf7aZ0dGhO4gRp4fMvuLZIgA4l60u6sCC/zmIeAFCxJ8WwF+T3+aEWAK44/JKYXpDf6AN3ACF4upJ0YUF+T5KZEJiwCpr555YtTxuf/OgwtvdPK+o8LG5rKr7biVf9TEmFQ1z77VNMplknA6IsNCo/To31OjpQ7r83LOcCAIZFa7Z5ZPwgTXPHtwsQpjUb+4k7lJTrh4cRkoqagRkvKKPPUzFKDHR0LNJzr/8mastKeqeopUFbkI6Ob2M5Mb0gvyF9SYCO6cAV0oUF+XlLoADAJYe0y7ogv3wxJgDc8WCAmF6QX88KTgC9lGJ5tyA/U06QnqeW3PWJ/HYYPbmJLby9Y+M6S0c/XUl3GzG1jct0XM9G2/tdrsph13R3dzIxNqttvNvQlpfgcZzMr2WjCAAgmQUkVQ2PXsibdVvj65gAOgC5hWRjFPzw77NEhUV1zdxPRcfefkns3MH8SDo68U2kYZGK33h+4rHY1KRLGVfySI66ejEzAMgcf07MA+M3/qym/FZWZs7Nz8T1xYASO4DiyyKHvGH8Bj5C69bruTeJARrc6AE2EMUa2zbf+n0K39Nekp97g2gM+JFrrGgkjwN5EULDb/hLXdmt2wVEjzzcLkwP8Gn1kX0LnB9uuKM67+btztnk2MBWepB3ZSM5A5GfuVVdhIZ/iIEMml9IYLFs8BFxMcn1m3fsP+jg4NjawLd0vY2piKHfo7tu6dW/qu2Pkvm92r8MmN1AAZVt+mcmyKMrCRE1JiNSMVTxswcizCAHF5eYjNz+Gx9neOA8CQHTNQ6k5qHiN5p6VGO9zpp1m7favPk2c3YBd4+wM6SeR8oD4/frUrjfPmODnXsbZ08CjPeKAiCjVC+ZGIxfx6Orp2zMTPdmj06fLMKPfdsDLUgXUYQzYfxwY09uuNuamp/4NTo+PdX/mgiAmKWB5BxwfpN9TVHH9u0/+G50OrCP/1zLAYDL9lDsCMH44UZ7Ck/ZWO4vma3T9zdaICi5gxwDJPErafv5qelpWViwn6Y0g35QQlzo3vVc/LLmPrcL7z69q2e4zz+2tqE+wN2tqP3c8UPHyPyGnuxnhpqSiR0B/eFR834MucWeR0shfhivXFIxVPyaraQAJBKFoWfgltjsRnBP38ugwQxEhb2fe/9h4sl5SQFOZhY2Nm65jTZvCA9WGggCCKH9g/PtPwzYbVrKz8HBySWrtu/2FB43WhUDDWZL9PvJWWD80o+oSvNwcXKJr9oVBC1mf7VHqwCAqNlTcg4Yv+fnjVX4uTm5BBX1rHvwk/1vz5sCILsDeTEH5/f9ylFdKQFubp7l6jtL8FPD3ZdcGBFou6R545/4yksmyot4uLmlVhuexk9Nvr/jKorgNEiiGEuI/J59a29tfdt4OsDHTBOpH5p2JQNrzSiwwepIQkFzTb7n/h1uMR+flx22c0wp8jjs6UfmN9Z9iAXiJ7dJQ1meDWTSibpbU3MjSoTAzzu19f0XHC2/FhtpAORRV1ddKQIIaZbX1NTcDV0HzV4YQt/0E/0pNb8HwXzMzMpqaspyCB6FjOqamsoQM8L+g/1nkuuh5tffsmkpu5yKitJKZoblvjVVleVnrVkBQN6sl9xYVPxG+/x1+cRVlJUUBEAJg8rqqvuX90sCCBnH+fYfcP23zGWFV61erSAF8MrfqK68c3XvGgDNd7xoPn4/X7vricivXqUgR88oEVRVfT/70A
Y0mtUzl2JjlIrf+Pd4J6llKxUVVnAjF++qqn6YhdXmQgla3KDoRER+j5p2mzu9emsuxxAVCi7Vv16SV17AtaH4sC7n4cH7hV3uSOV9D3x13V2M16m6B5wLJvMbeW2HAUBU9JfxvkeakEtDolAo5Mx+0GIF/RNXh2n51WnwA/RmExMjrf6QAoqggADp6FCc2gfyiMMTFb9ffptBhHDvxMSn+0wzJUAaEL9lO9M75+Z3x58VBDO/fu1+sZJCAaFs1UDuu1T8OlJXgoDNp57uZw6kOgEgs7wLaYCF8fuVZw8CS9redTVcRIIIyJsQHgJgX3Ly/nz8GlI40Kgbr1/W3xMl7D9DAimwSvrfnI9fT60SA+DSXF9XZYICETPNBNJL2czFLznJUN+wsj3R0+Soo/S+c0VZx67k8it4r5NWPPn9nNcFIxb7M/cCTKxsDhw5nhlOsf8wNTngSg8KmBSPTo307OEhBGOIm4EAK6+E+q6ZeD4Vv0cqPPRG0YQuHC+AIWWH7E9EwfRQWDstv59O6sAae8gx/2qSIB+hoAO5l+7wiUyvnYNf4h4GoU2VI6NDnzdzkRQAUFDeNSQtv2qSlt8j+8X0yqd+/Bz6HMCDmrk9HQDS86/yiL1V+nSIlt8393WAuH53/1BfsRAzOL0JDf1n4l1nn1jwsO3LHPxiLOh55Mp7v/S8UeUkVYlRQNMsJb/27ec5+JW7LGJcHNT58dMHV0EkML3LDYBowdU7o3KfdM4eQSXy83Ay2bI+99mzOwlWBpvOPqxI3nbuiri4BheLUfzng+tNVQSibheFWBlaHLtU9DxaxJry/IQ3AygXN93qzksQ8E14zpn5HBW/2lXcLJHTOxPZcsyUG74ggplb7A6eht/QXkXALp0wzHeqCFAqIBlFFQxi5+B3Uh2tGNA+CU0AzMTIpzRAELVIwcD57Cgtv0Ildjbba6M4/GSUFD2RH4BCAmIqB08kfqLl92ntIkDr8JeRqcn6FTyQXRAOaiBADD0gpH341I1WWn54GwlQ0uDp4Mj4r22LQWKFMKwY9u0ukfeaZ07CUfFLFqdnUY/pGRmfCFqGAWfPK6DYmOnX708ofTtGxW+jzpPq2yd80oofbV8upWXR/ORMWnao285lMmHephGxtmY7r1eU2Mgkp2Ijog9YUK7fJwc8ORHC1lWE6IM5FwjfhGe7+ISGX52mAKNrFmE6FUWPoMRBcL+YhI84OL+fB1UBk3BoaPxWzYWiUkBgmLicp+e81PxC16KXuUGNOPhKFU22PwSIYGQXFFv/k4Yf/g6BXxZ+aqzDffZoANT5EJDDYuGRkF7xhIYf/qOaILD5+DBuqvsGO/2MxRLcKApg5FuqsCpmDn4WguAK21eT+G+tKxhnT26B9PT0CBSvpJLK/pnWoeJ3QQjDbX5jDD/SZcOImTn0hGBiYUCDnCJrNTe+peKnsrKmNMPV8VJmru6qdbomOTdj0q4Ge1htN0rx1jgZf8LPLz75go3WxaQj7kd2GFG+f/Sjeh8bgks7orzi3m1tZsjCJWT5FsusVhSatiwE58yOHiU/XPUqboz+sfLy0jxHQh4uGeHFCirqi2ccHXj+9SSc35DZCkDDrqi8/GYEwTYYZCRFV6lpLxNEEXo9av/PSRp+x1egRI1SystvX1pCuKeolKjCWq01EuzQpJeJZcW3STg/3C1pZubtARXlxZcNCbXgkRKX1VqvtUyYgYmZjZ3zIQ7OD9clzwWo7rtXXnbVDxr6QCZJSal1OhtWy7Ays3Dzcs1s4lLxw5lwAUuMMisqbiYJI5EgUlxKSmW9nqYiHwsLpwD3hjFafrFcKA79Mw8r7mZsQkCeQFBaZuWGLZuVJNhYOUUXibTiKfktFzxsoWHmdtNrrbZpcrjvCu1T8bFaW13S75WGbdjhUNNQryu78mj2EXOtZRIGu/Z4kPm1GUnO9Ax6NGJ6UArNMPNKeFJ2YAWBDZNw9EM4v5ECegTB0hAIxLS5brl4xLv4xc
ejejN98mTDBJzfgCwjoQSCAuHgnWjiad/aLtw1W67pTrnr3TANP/MZc0BOawAov0jfe1/G2wJU2TDQQCL++gec3/jlGWOYnoRA0y/DiKCM0Ymh5IPCbPRQFyn6Bec32gaNYSh6RgxyugSE7Nmw84M4XFmUojAT9HTe06tUSn64kQ0AQM/BwoRGTg+VLIHnw9twuI5sE3keJgBQGsbD+eHDodGOi4eHHoWYPuJlHRdfisMN3fVTEedHI5kaxin5LWPXsI0K9tLfpLl2d1ZC6BpFjS07Pc/kNHZ1X93ll/A6083c/FBYSkqMr9PBC75rSfsPU8N1OsIzzowAAymgvLek5W5Vy+cPZRf9FQQA3pXVH+H8+m+woWe8JWSt7BIHL754WP2+/1f17aidsmh6/rQ+PJzfoDov0QWiOMQcI1vqa3uHpl6VJvho8yGFD3+foOF3gIM46iGZpUzDaxpru0fxA4+zI3evRgho9Y7R8EuHXBrUPwgo0OJaEQXP6tpxUxMvyi+5GbPxLKkaJ/Ijxtcn3nCDhFOP08XwywemN9Q3Qpk+NF07c1CSTSJseoFOyQ8/AfFDMaCnz3KyKjrF1TU2DEBrwteFl4/psoruGJqcgx+AZGVmJHQQ5ArDyPvPm6EWmeh6lBXuzC0g0zBMyU+RU8ixIfUok9R69V03UyM3yyE5liQVNvb8xJc5XL73IUzBAZsYfb60NPfypeeJsnYkfoMPVflnZ5CEw32ye9O7ZsMJPzotFABx3ZmZGGX8rC+Xl2F29EYgRLRLyAcgE42YOVfeo52//NgqQZjcQQaFZhFfV0bee2rxWcGscXrmtlT83MSQ0xEhSEFoc8oQKQT2K8GKabXVEB7ObyKTh37mqC+aiXO9F8X7KQ+iROW2NE7f4D0FP/w7QfTMI6AxTKvMSXHbqamugg0SuskjhN1m6vFvM2rGI6DQjGKWZWSFkTpfMS3nmcAglf88h4bGO8jAkRgGDtMYssLU2/ylq/Wahij5Zd103rdrn72HmbaukXtUdkW0lOLag+Zr9Wz731VcifP18dq0O//QGofIN5XFQ/cp3t/ENWotIvNDcOiEvZt9dtxYTSjCMHwIzm9q4uEKbkKfYmAVlpDd4dVPXlEPtq81zp7ZgqBe/3lsYscgmdgF1uhZHE/vIZ+3G/sSZl33kZYfLn43OxqAJrNqpp7nGnrINPCDD9wfzqap5p8Pdy8CQUZe0RUWR2NfkI8wQQ7mQ9St7pkJKyW/qc/QnBhEC4hIGh5KqflEsYSbGCrI7BqYriP1+iFgIwqJ4RaU3GCbVvqJ4mA+fqT1VnvfTBej4pe/ixtEsgmIrbKLLe4aoKjTeH9Vc/co1fiXlJGMtTQysjbVt7LeF3qtvcjMfK+PmciSjX2NqTdvRMYlunjf2b/E5WxR6cO2fGeK+FmnhzorhoFzkcQyOVlZ2ZXWV0nWgf+QweV2Z8Yaqc6fNZkricgqqG42srJ1DE2n3Kn7Ye3TNDj9iTr+meKlpqGpb2LuFRSdW0d53nUqL+bLTONSv39bfFpTXdtgt7V3ZFbpN6oT552ZRFuh4td6Tl9JZ/ue/c4xuVXUW40j5cRwIxW/7zEHVq3farHP7kxaA2wzuu05bop2/jKV46+iuW2XhR02qRH2Zs63l8QqUvGrj9isqmtkbu2WXNVN/dbDRB+xjkR+GusG2jK3LQFV3S6c3e4W/fZDa3F2WQC3wJoPcZKP8ZO9Lb0dOaZiGbHrLjZgw7LPkvnhhk8r8otp2/knJcdHR8U+oCymVp24M0m1fhioDrGJyXnaT/s24mhOxewn2PndrvTq1xNzvVn74xsx+k8d/xwprPky9s+v4hL4UexB1t4dGMX/owb8/FL+F/w/K8DPD5a8xMMP8cAEFv+sezyBw/1jGaT998T+3naX3SeO7N+uo+iaUnnNLKfRfweH3NYHMQbPBwormz9U7zIwiI9183Jbb3yM8v2xycasgNM3Kx4VVrxoaW6heuGj7+
Yc+7eQ1+ttqGjp+EL79uIUroOoD+M39Kr3+5xPMT73/vvU5Pte6g1iWoHFr/u6F3qpHcZvqIv2FU9Y5aj5TXwYXEABvv/wuW+hl8FJv1/Q1tXzNcS3McpQjH+xQ2p+INOlLhMVES2zjEiPls6wa4867yzWdYhKTDRbKbUG9vsTuIYXE/iJp7QnVMjy/+L3J37j/Au1LHz+BS6z/H6/WqTzu/lbtu8Ji48y4g/ELlfd3lrt4OTsfbEj9ohpQHFKSlWw3rPHO+TFn7ytNRKpKaOMXxNkjDCGzfk+PlH+8vs9Wfj8EkyI/NKu2Jub+ITnYE3zbh2wtqssj7Ha6HhxoCA+MPbWcZ870YcLs7Yt4cl/dH/Xshd1MSH/xb9f8Nvy/4pfcNSbguPGDtOG9OlZyenktp0c63xaO3vwdUFaav4VE4GmKxdx2PnF7DeoKIo8+Zff78i/kZ/boQMRD2Kjyouun7nwMmy7roHNMnb1AzmxSWNdJZmpyRdiEpIvexpvsb3i65h3N//8X36/I/9Gfi6W0t7vC6+lh3vomNdasi2WWCIkqHcwzv7gcN/Tly03Q21yq16meW4wv3LK91rBg5i//H5H/o38buTbuZ8+HPg9auW6LfZGWmJrT/v6vWyvNtYcylbTMr3z/GtbifM2jVtJ6vbYoJOhgX/5/Y78r/hlzvXrNvMKkV9Gtof3CVf/5+GbjM3s95lp74oICX1cnb/PsD5ug55ZRllL2VWHXfrZF/QOYU+cwBIUXvyJ5GGx557/icKjYGxg5Z8otERjsbl/VCfC7w+2/InCwwBs8OM/UXh+FovN/6M6pWOxSc1/Uql72L+///l/Xej+0xX4K/+S0P2nK/BX/iX5H3oVbwQKZW5kc3RyZWFtCmVuZG9iagozNiAwIG9iago5MTAzCmVuZG9iagoyIDAgb2JqCjw8IC9Db3VudCAxIC9LaWRzIFsgMTEgMCBSIF0gL1R5cGUgL1BhZ2VzID4+CmVuZG9iagozNyAwIG9iago8PCAvQ3JlYXRpb25EYXRlIChEOjIwMjEwOTE2MTQ0MDQ2KzAyJzAwJykKL0NyZWF0b3IgKE1hdHBsb3RsaWIgdjMuNC4zLCBodHRwczovL21hdHBsb3RsaWIub3JnKQovUHJvZHVjZXIgKE1hdHBsb3RsaWIgcGRmIGJhY2tlbmQgdjMuNC4zKSA+PgplbmRvYmoKeHJlZgowIDM4CjAwMDAwMDAwMDAgNjU1MzUgZiAKMDAwMDAwMDAxNiAwMDAwMCBuIAowMDAwMDE4NDQzIDAwMDAwIG4gCjAwMDAwMDgwODUgMDAwMDAgbiAKMDAwMDAwODExNyAwMDAwMCBuIAowMDAwMDA4MjE2IDAwMDAwIG4gCjAwMDAwMDgyMzcgMDAwMDAgbiAKMDAwMDAwODI1OCAwMDAwMCBuIAowMDAwMDAwMDY1IDAwMDAwIG4gCjAwMDAwMDA0MDAgMDAwMDAgbiAKMDAwMDAwMTAyMiAwMDAwMCBuIAowMDAwMDAwMjA4IDAwMDAwIG4gCjAwMDAwMDEwMDIgMDAwMDAgbiAKMDAwMDAwODI5MCAwMDAwMCBuIAowMDAwMDA2ODAwIDAwMDAwIG4gCjAwMDAwMDY2MDAgMDAwMDAgbiAKMDAwMDAwNjE4OCAwMDAwMCBuIAowMDAwMDA3ODUzIDAwMDAwIG4gCjAwMDAwMDEwNDIgMDAwMDAgbiAKMDAwMDAwMTM2MiAwMDAwMCBuIAowMDAwMDAxNzQyIDAwMDAwIG4gCjAwMDAwMDIwNjQgMDAwMDAgbiAKMDAwMDAwMjUzMiAwMDAwMCBuIAowMDAwMDAyODU0IDAwMDAwIG4gCjAwMDAwMDMwMjAgMDAwMDAgbiAKMDAwMDAwMzE2NCAwMDAwMCBuIAowMDAwMDAzNDAwIDAwMDAwIG4gCjAwMDAwMDM3OTUgMDAwMDAgbiAKMDAwMDAwNDA4NiAwMDAwMCBuIA
owMDAwMDA0MjQxIDAwMDAwIG4gCjAwMDAwMDQ0NzQgMDAwMDAgbiAKMDAwMDAwNDg2NyAwMDAwMCBuIAowMDAwMDA0OTU3IDAwMDAwIG4gCjAwMDAwMDUxNjMgMDAwMDAgbiAKMDAwMDAwNTU3NiAwMDAwMCBuIAowMDAwMDA1OTAwIDAwMDAwIG4gCjAwMDAwMTg0MjIgMDAwMDAgbiAKMDAwMDAxODUwMyAwMDAwMCBuIAp0cmFpbGVyCjw8IC9JbmZvIDM3IDAgUiAvUm9vdCAxIDAgUiAvU2l6ZSAzOCA+PgpzdGFydHhyZWYKMTg2NjAKJSVFT0YK\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:40:46.343108\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}, {"name": "stderr", "output_type": "stream", "text": ["/usr/local/lib/python3.9/dist-packages/torchvision/utils.py:50: UserWarning: range will be deprecated, please use value_range instead.\n", " warnings.warn(warning)\n"]}, {"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:40:46.488312\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}, {"name": "stderr", "output_type": "stream", "text": ["/usr/local/lib/python3.9/dist-packages/torchvision/utils.py:50: UserWarning: range will be deprecated, please use value_range instead.\n", " warnings.warn(warning)\n"]}, {"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:40:46.639358\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}], "source": ["for i in range(imgs_per_step.shape[1]):\n", " step_size = callback.num_steps // callback.vis_steps\n", " imgs_to_plot = imgs_per_step[step_size - 1 :: step_size, i]\n", " imgs_to_plot = torch.cat([imgs_per_step[0:1, i], imgs_to_plot], dim=0)\n", " grid = torchvision.utils.make_grid(\n", " imgs_to_plot, nrow=imgs_to_plot.shape[0], normalize=True, range=(-1, 1), pad_value=0.5, padding=2\n", " )\n", " grid = grid.permute(1, 2, 0)\n", " plt.figure(figsize=(8, 8))\n", " plt.imshow(grid)\n", " plt.xlabel(\"Generation iteration\")\n", " plt.xticks(\n", " [(imgs_per_step.shape[-1] + 2) * (0.5 + j) for j in range(callback.vis_steps + 1)],\n", " labels=[1] + list(range(step_size, imgs_per_step.shape[0] + 1, step_size)),\n", " )\n", " plt.yticks([])\n", " plt.show()"]}, {"cell_type": "markdown", "id": "d85bacf3", "metadata": {"papermill": {"duration": 0.032666, "end_time": "2021-09-16T12:40:46.804930", "exception": false, "start_time": "2021-09-16T12:40:46.772264", "status": "completed"}, "tags": []}, "source": ["We see that although starting from noise in the very first step, the sampling algorithm obtains reasonable shapes after only 32 steps.\n", "Over the next 200 steps, the shapes become clearer and changed towards realistic digits.\n", "The specific samples can differ when you run the code on Colab, hence the following description is specific to the plots shown on the website.\n", "The first row shows an 8, where we remove unnecessary white parts over iterations.\n", "The transformation across iterations can be seen at best for the second sample, which creates a digit of 2.\n", "While the first sample after 32 iterations looks a bit like a digit, but not really,\n", "the sample is transformed more and more to a typical image of the digit 2."]}, {"cell_type": "markdown", "id": "9b5682ed", "metadata": {"papermill": {"duration": 0.03313, "end_time": "2021-09-16T12:40:46.870416", 
"exception": false, "start_time": "2021-09-16T12:40:46.837286", "status": "completed"}, "tags": []}, "source": ["### Out-of-distribution detection\n", "\n", "A very common and strong application of energy-based models is out-of-distribution detection\n", "(sometimes referred to as \"anomaly\" detection).\n", "As more and more deep learning models are applied in production and applications,\n", "a crucial aspect of these models is to know what the models don't know.\n", "Deep learning models are usually overconfident, meaning that they classify even random images sometimes with 100% probability.\n", "Clearly, this is not something that we want to see in applications.\n", "Energy-based models can help with this problem because they are trained to detect images that do not fit the training dataset distribution.\n", "Thus, in those applications, you could train an energy-based model along with the classifier,\n", "and only output predictions if the energy-based models assign a (unnormalized) probability higher than $\\delta$ to the image.\n", "You can actually combine classifiers and energy-based objectives in a single model,\n", "as proposed in this [paper](https://arxiv.org/abs/1912.03263).\n", "\n", "In this part of the analysis, we want to test the out-of-distribution capability of our energy-based model.\n", "Remember that a lower output of the model denotes a low probability.\n", "Thus, we hope to see low scores if we enter random noise to the model:"]}, {"cell_type": "code", "execution_count": 16, "id": "303c00f7", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:40:46.941073Z", "iopub.status.busy": "2021-09-16T12:40:46.940608Z", "iopub.status.idle": "2021-09-16T12:40:46.945276Z", "shell.execute_reply": "2021-09-16T12:40:46.944875Z"}, "papermill": {"duration": 0.041937, "end_time": "2021-09-16T12:40:46.945424", "exception": false, "start_time": "2021-09-16T12:40:46.903487", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", 
"output_type": "stream", "text": ["Average score for random images: -17.88\n"]}], "source": ["with torch.no_grad():\n", " rand_imgs = torch.rand((128,) + model.hparams.img_shape).to(model.device)\n", " rand_imgs = rand_imgs * 2 - 1.0\n", " rand_out = model.cnn(rand_imgs).mean()\n", " print(\"Average score for random images: %4.2f\" % (rand_out.item()))"]}, {"cell_type": "markdown", "id": "0a485fdb", "metadata": {"papermill": {"duration": 0.032686, "end_time": "2021-09-16T12:40:47.012111", "exception": false, "start_time": "2021-09-16T12:40:46.979425", "status": "completed"}, "tags": []}, "source": ["As we hoped, the model assigns very low probability to those noisy images.\n", "As another reference, let's look at predictions for a batch of images from the training set:"]}, {"cell_type": "code", "execution_count": 17, "id": "2bcb1282", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:40:47.081066Z", "iopub.status.busy": "2021-09-16T12:40:47.080584Z", "iopub.status.idle": "2021-09-16T12:40:47.233910Z", "shell.execute_reply": "2021-09-16T12:40:47.233401Z"}, "papermill": {"duration": 0.189477, "end_time": "2021-09-16T12:40:47.234026", "exception": false, "start_time": "2021-09-16T12:40:47.044549", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Average score for training images: -0.00\n"]}], "source": ["with torch.no_grad():\n", " train_imgs, _ = next(iter(train_loader))\n", " train_imgs = train_imgs.to(model.device)\n", " train_out = model.cnn(train_imgs).mean()\n", " print(\"Average score for training images: %4.2f\" % (train_out.item()))"]}, {"cell_type": "markdown", "id": "a559009f", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.032727, "end_time": "2021-09-16T12:40:47.300644", "exception": false, "start_time": "2021-09-16T12:40:47.267917", "status": "completed"}, "tags": []}, "source": ["The scores are close to 0 because of the regularization objective that was added to the 
training.\n", "So clearly, the model can distinguish between noise and real digits.\n", "However, what happens if we change the training images a little, and see which ones gets a very low score?"]}, {"cell_type": "code", "execution_count": 18, "id": "edff6bb0", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:40:47.372822Z", "iopub.status.busy": "2021-09-16T12:40:47.372352Z", "iopub.status.idle": "2021-09-16T12:40:47.374505Z", "shell.execute_reply": "2021-09-16T12:40:47.374110Z"}, "papermill": {"duration": 0.041215, "end_time": "2021-09-16T12:40:47.374604", "exception": false, "start_time": "2021-09-16T12:40:47.333389", "status": "completed"}, "tags": []}, "outputs": [], "source": ["@torch.no_grad()\n", "def compare_images(img1, img2):\n", " imgs = torch.stack([img1, img2], dim=0).to(model.device)\n", " score1, score2 = model.cnn(imgs).cpu().chunk(2, dim=0)\n", " grid = torchvision.utils.make_grid(\n", " [img1.cpu(), img2.cpu()], nrow=2, normalize=True, range=(-1, 1), pad_value=0.5, padding=2\n", " )\n", " grid = grid.permute(1, 2, 0)\n", " plt.figure(figsize=(4, 4))\n", " plt.imshow(grid)\n", " plt.xticks([(img1.shape[2] + 2) * (0.5 + j) for j in range(2)], labels=[\"Original image\", \"Transformed image\"])\n", " plt.yticks([])\n", " plt.show()\n", " print(\"Score original image: %4.2f\" % score1)\n", " print(\"Score transformed image: %4.2f\" % score2)"]}, {"cell_type": "markdown", "id": "7c540cbd", "metadata": {"papermill": {"duration": 0.033108, "end_time": "2021-09-16T12:40:47.440512", "exception": false, "start_time": "2021-09-16T12:40:47.407404", "status": "completed"}, "tags": []}, "source": ["We use a random test image for this. 
Feel free to change it to experiment with the model yourself."]}, {"cell_type": "code", "execution_count": 19, "id": "befba0f4", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:40:47.509319Z", "iopub.status.busy": "2021-09-16T12:40:47.508856Z", "iopub.status.idle": "2021-09-16T12:40:47.685776Z", "shell.execute_reply": "2021-09-16T12:40:47.686151Z"}, "papermill": {"duration": 0.212897, "end_time": "2021-09-16T12:40:47.686303", "exception": false, "start_time": "2021-09-16T12:40:47.473406", "status": "completed"}, "tags": []}, "outputs": [], "source": ["test_imgs, _ = next(iter(test_loader))\n", "exmp_img = test_imgs[0].to(model.device)"]}, {"cell_type": "markdown", "id": "12364d29", "metadata": {"papermill": {"duration": 0.033603, "end_time": "2021-09-16T12:40:47.754499", "exception": false, "start_time": "2021-09-16T12:40:47.720896", "status": "completed"}, "tags": []}, "source": ["The first transformation is to add some random noise to the image:"]}, {"cell_type": "code", "execution_count": 20, "id": "bc21923d", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:40:47.824609Z", "iopub.status.busy": "2021-09-16T12:40:47.824143Z", "iopub.status.idle": "2021-09-16T12:40:47.919759Z", "shell.execute_reply": "2021-09-16T12:40:47.919292Z"}, "papermill": {"duration": 0.132328, "end_time": "2021-09-16T12:40:47.919863", "exception": false, "start_time": "2021-09-16T12:40:47.787535", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["/usr/local/lib/python3.9/dist-packages/torchvision/utils.py:50: UserWarning: range will be deprecated, please use value_range instead.\n", " warnings.warn(warning)\n"]}, {"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:40:47.862252\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}, {"name": "stdout", "output_type": "stream", "text": ["Score original image: 0.03\n", "Score transformed image: -0.07\n"]}], "source": ["img_noisy = exmp_img + torch.randn_like(exmp_img) * 0.3\n", "img_noisy.clamp_(min=-1.0, max=1.0)\n", "compare_images(exmp_img, img_noisy)"]}, {"cell_type": "markdown", "id": "2544f964", "metadata": {"papermill": {"duration": 0.03459, "end_time": "2021-09-16T12:40:47.989386", "exception": false, "start_time": "2021-09-16T12:40:47.954796", "status": "completed"}, "tags": []}, "source": ["We can see that the score considerably drops.\n", "Hence, the model can detect random Gaussian noise on the image.\n", "This is also to expect as initially, the \"fake\" samples are pure noise images.\n", "\n", "Next, we flip an image and check how this influences the score:"]}, {"cell_type": "code", "execution_count": 21, "id": "cc6e4e18", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:40:48.060789Z", "iopub.status.busy": "2021-09-16T12:40:48.060321Z", "iopub.status.idle": "2021-09-16T12:40:48.147462Z", "shell.execute_reply": "2021-09-16T12:40:48.147064Z"}, "papermill": {"duration": 0.12397, "end_time": "2021-09-16T12:40:48.147562", "exception": false, "start_time": "2021-09-16T12:40:48.023592", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["/usr/local/lib/python3.9/dist-packages/torchvision/utils.py:50: UserWarning: range will be deprecated, please use value_range instead.\n", " warnings.warn(warning)\n"]}, {"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:40:48.094457\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}, {"name": "stdout", "output_type": "stream", "text": ["Score original image: 0.03\n", "Score transformed image: -0.00\n"]}], "source": ["img_flipped = exmp_img.flip(dims=(1, 2))\n", "compare_images(exmp_img, img_flipped)"]}, {"cell_type": "markdown", "id": "d6f1c7b3", "metadata": {"papermill": {"duration": 0.036128, "end_time": "2021-09-16T12:40:48.219851", "exception": false, "start_time": "2021-09-16T12:40:48.183723", "status": "completed"}, "tags": []}, "source": ["If the digit can only be read in this way, for example, the 7, then we can see that the score drops.\n", "However, the score only drops slightly.\n", "This is likely because of the small size of our model.\n", "Keep in mind that generative modeling is a much harder task than classification,\n", "as we do not only need to distinguish between classes but learn **all** details/characteristics of the digits.\n", "With a deeper model, this could eventually be captured better (but at the cost of greater training instability).\n", "\n", "Finally, we check what happens if we reduce the digit significantly in size:"]}, {"cell_type": "code", "execution_count": 22, "id": "799ea05d", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:40:48.296476Z", "iopub.status.busy": "2021-09-16T12:40:48.296010Z", "iopub.status.idle": "2021-09-16T12:40:48.386691Z", "shell.execute_reply": "2021-09-16T12:40:48.387068Z"}, "papermill": {"duration": 0.131568, "end_time": "2021-09-16T12:40:48.387188", "exception": false, "start_time": "2021-09-16T12:40:48.255620", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["/usr/local/lib/python3.9/dist-packages/torchvision/utils.py:50: UserWarning: range will be deprecated, please use value_range instead.\n", " warnings.warn(warning)\n"]}, {"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 
2021-09-16T14:40:48.333827\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}, {"name": "stdout", "output_type": "stream", "text": ["Score original image: 0.03\n", "Score transformed image: -0.02\n"]}], "source": ["img_tiny = torch.zeros_like(exmp_img) - 1\n", "img_tiny[:, exmp_img.shape[1] // 2 :, exmp_img.shape[2] // 2 :] = exmp_img[:, ::2, ::2]\n", "compare_images(exmp_img, img_tiny)"]}, {"cell_type": "markdown", "id": "abbe7583", "metadata": {"papermill": {"duration": 0.037748, "end_time": "2021-09-16T12:40:48.462802", "exception": false, "start_time": "2021-09-16T12:40:48.425054", "status": "completed"}, "tags": []}, "source": ["The score again drops but not by a large margin, although digits in the MNIST dataset usually are much larger.\n", "\n", "Overall, we can conclude that our model is good for detecting Gaussian noise and smaller transformations to existing digits.\n", "Nonetheless, to obtain a very good out-of-distribution model, we would need to train deeper models and for more iterations."]}, {"cell_type": "markdown", "id": "714313c8", "metadata": {"papermill": {"duration": 0.037582, "end_time": "2021-09-16T12:40:48.538109", "exception": false, "start_time": "2021-09-16T12:40:48.500527", "status": "completed"}, "tags": []}, "source": ["### Instability\n", "\n", "Finally, we should discuss the possible instabilities of energy-based models,\n", "in particular for the example of image generation that we have implemented in this notebook.\n", "In the process of hyperparameter search for this notebook, there have been several models that diverged.\n", "Divergence in energy-based models means that the models assign a high probability to examples of the training set which is a good thing.\n", "However, at the same time, the sampling algorithm fails and only generates noise images that obtain minimal probability scores.\n", "This happens because the model has created many local maxima in which the generated noise images fall.\n", "The energy surface over 
which we calculate the gradients to reach data points with high probability has \"diverged\" and is not useful for our MCMC sampling.\n", "\n", "Besides finding the optimal hyperparameters, a common trick in energy-based models is to reload stable checkpoints.\n", "If we detect that the model is diverging, we stop the training, load the model from one epoch ago where it did not diverge yet.\n", "Afterward, we continue training and hope that with a different seed the model is not diverging again.\n", "Nevertheless, this should be considered as the \"last hope\" for stabilizing the models,\n", "and careful hyperparameter tuning is the better way to do so.\n", "Sensitive hyperparameters include `step_size`, `steps` and the noise standard deviation in the sampler,\n", "and the learning rate and feature dimensionality in the CNN model."]}, {"cell_type": "markdown", "id": "a34043a7", "metadata": {"papermill": {"duration": 0.037416, "end_time": "2021-09-16T12:40:48.621320", "exception": false, "start_time": "2021-09-16T12:40:48.583904", "status": "completed"}, "tags": []}, "source": ["## Conclusion\n", "\n", "In this tutorial, we have discussed energy-based models for generative modeling.\n", "The concept relies on the idea that any strictly positive function can be turned into a probability\n", "distribution by normalizing over the whole dataset.\n", "As this is not reasonable to calculate for high dimensional data like images,\n", "we train the model using contrastive divergence and sampling via MCMC.\n", "While the idea allows us to turn any neural network into an energy-based model,\n", "we have seen that there are multiple training tricks needed to stabilize the training.\n", "Furthermore, the training time of these models is relatively long as, during every training iteration,\n", "we need to sample new \"fake\" images, even with a sampling buffer.\n", "In the next lectures and assignment, we will see different generative models (e.g. 
VAE, GAN, NF)\n", "that allow us to do generative modeling more stably, but with the cost of more parameters."]}, {"cell_type": "markdown", "id": "6ca06d61", "metadata": {"papermill": {"duration": 0.038052, "end_time": "2021-09-16T12:40:48.697258", "exception": false, "start_time": "2021-09-16T12:40:48.659206", "status": "completed"}, "tags": []}, "source": ["## Congratulations - Time to Join the Community!\n", "\n", "Congratulations on completing this notebook tutorial! If you enjoyed this and would like to join the Lightning\n", "movement, you can do so in the following ways!\n", "\n", "### Star [Lightning](https://github.com/PyTorchLightning/pytorch-lightning) on GitHub\n", "The easiest way to help our community is just by starring the GitHub repos! This helps raise awareness of the cool\n", "tools we're building.\n", "\n", "### Join our [Slack](https://join.slack.com/t/pytorch-lightning/shared_invite/zt-pw5v393p-qRaDgEk24~EjiZNBpSQFgQ)!\n", "The best way to keep up to date on the latest advancements is to join our community! Make sure to introduce yourself\n", "and share your interests in `#general` channel\n", "\n", "\n", "### Contributions !\n", "The best way to contribute to our community is to become a code contributor! 
At any time you can go to\n", "[Lightning](https://github.com/PyTorchLightning/pytorch-lightning) or [Bolt](https://github.com/PyTorchLightning/lightning-bolts)\n", "GitHub Issues page and filter for \"good first issue\".\n", "\n", "* [Lightning good first issue](https://github.com/PyTorchLightning/pytorch-lightning/issues?q=is%3Aopen+is%3Aissue+label%3A%22good+first+issue%22)\n", "* [Bolt good first issue](https://github.com/PyTorchLightning/lightning-bolts/issues?q=is%3Aopen+is%3Aissue+label%3A%22good+first+issue%22)\n", "* You can also contribute your own notebooks with useful examples !\n", "\n", "### Great thanks from the entire Pytorch Lightning Team for your interest !\n", "\n", "![Pytorch Lightning](){height=\"60px\" width=\"240px\"}"]}, {"cell_type": "raw", "metadata": {"raw_mimetype": "text/restructuredtext"}, "source": [".. customcarditem::\n", " :header: Tutorial 7: Deep Energy-Based Generative Models\n", " :card_description: In this tutorial, we will look at energy-based deep learning models, and focus on their application as generative models. 
Energy models have been a popular tool before the...\n", " :tags: Image,GPU/TPU,UvA-DL-Course\n", " :image: _static/images/course_UvA-DL/07-deep-energy-based-generative-models.jpg"]}], "metadata": {"jupytext": {"cell_metadata_filter": "colab_type,id,colab,-all", "formats": "ipynb,py:percent", "main_language": "python"}, "language_info": {"codemirror_mode": {"name": "ipython", "version": 3}, "file_extension": ".py", "mimetype": "text/x-python", "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.9.7"}, "papermill": {"default_parameters": {}, "duration": 11.264697, "end_time": "2021-09-16T12:40:49.242921", "environment_variables": {}, "exception": null, "input_path": "course_UvA-DL/07-deep-energy-based-generative-models/Deep_Energy_Models.ipynb", "output_path": ".notebooks/course_UvA-DL/07-deep-energy-based-generative-models.ipynb", "parameters": {}, "start_time": "2021-09-16T12:40:37.978224", "version": "2.3.3"}}, "nbformat": 4, "nbformat_minor": 5} \ No newline at end of file diff --git a/source/notebooks/course_UvA-DL/08-deep-autoencoders.ipynb b/source/notebooks/course_UvA-DL/08-deep-autoencoders.ipynb deleted file mode 100644 index f3e2f32..0000000 --- a/source/notebooks/course_UvA-DL/08-deep-autoencoders.ipynb +++ /dev/null @@ -1 +0,0 @@ -{"cells": [{"cell_type": "markdown", "id": "37d6e7ea", "metadata": {"papermill": {"duration": 0.02405, "end_time": "2021-09-16T12:40:58.041596", "exception": false, "start_time": "2021-09-16T12:40:58.017546", "status": "completed"}, "tags": []}, "source": ["\n", "# Tutorial 8: Deep Autoencoders\n", "\n", "* **Author:** Phillip Lippe\n", "* **License:** CC BY-SA\n", "* **Generated:** 2021-09-16T14:32:32.123712\n", "\n", "In this tutorial, we will take a closer look at autoencoders (AE).\n", "Autoencoders are trained on encoding input data such as images into a smaller feature vector,\n", "and afterward, reconstruct it by a second neural network, called a decoder.\n", "The feature vector 
is called the \"bottleneck\" of the network as we aim to compress the input data into a smaller amount of features.\n", "This property is useful in many applications, in particular in compressing data or comparing images on a metric beyond pixel-level comparisons.\n", "Besides learning about the autoencoder framework, we will also see the \"deconvolution\"\n", "(or transposed convolution) operator in action for scaling up feature maps in height and width.\n", "Such deconvolution networks are necessary wherever we start from a small feature vector\n", "and need to output an image of full size (e.g. in VAE, GANs, or super-resolution applications).\n", "This notebook is part of a lecture series on Deep Learning at the University of Amsterdam.\n", "The full list of tutorials can be found at https://uvadlc-notebooks.rtfd.io.\n", "\n", "\n", "---\n", "Open in [![Open In Colab](){height=\"20px\" width=\"117px\"}](https://colab.research.google.com/github/PytorchLightning/lightning-tutorials/blob/publication/.notebooks/course_UvA-DL/08-deep-autoencoders.ipynb)\n", "\n", "Give us a \u2b50 [on Github](https://www.github.com/PytorchLightning/pytorch-lightning/)\n", "| Check out [the documentation](https://pytorch-lightning.readthedocs.io/en/latest/)\n", "| Join us [on Slack](https://join.slack.com/t/pytorch-lightning/shared_invite/zt-pw5v393p-qRaDgEk24~EjiZNBpSQFgQ)"]}, {"cell_type": "markdown", "id": "858d9128", "metadata": {"papermill": {"duration": 0.021931, "end_time": "2021-09-16T12:40:58.085647", "exception": false, "start_time": "2021-09-16T12:40:58.063716", "status": "completed"}, "tags": []}, "source": ["## Setup\n", "This notebook requires some packages besides pytorch-lightning."]}, {"cell_type": "code", "execution_count": 1, "id": "7358cb32", "metadata": {"colab": {}, "colab_type": "code", "execution": {"iopub.execute_input": "2021-09-16T12:40:58.133268Z", "iopub.status.busy": "2021-09-16T12:40:58.132753Z", "iopub.status.idle": "2021-09-16T12:40:58.135280Z", 
"shell.execute_reply": "2021-09-16T12:40:58.134801Z"}, "id": "LfrJLKPFyhsK", "lines_to_next_cell": 0, "papermill": {"duration": 0.02804, "end_time": "2021-09-16T12:40:58.135398", "exception": false, "start_time": "2021-09-16T12:40:58.107358", "status": "completed"}, "tags": []}, "outputs": [], "source": ["# ! pip install --quiet \"torch>=1.6, <1.9\" \"pytorch-lightning>=1.3\" \"torchvision\" \"seaborn\" \"torchmetrics>=0.3\" \"matplotlib\""]}, {"cell_type": "markdown", "id": "33e2dd60", "metadata": {"papermill": {"duration": 0.021405, "end_time": "2021-09-16T12:40:58.179525", "exception": false, "start_time": "2021-09-16T12:40:58.158120", "status": "completed"}, "tags": []}, "source": ["
"]}, {"cell_type": "code", "execution_count": 2, "id": "52180301", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:40:58.232432Z", "iopub.status.busy": "2021-09-16T12:40:58.231957Z", "iopub.status.idle": "2021-09-16T12:40:59.951493Z", "shell.execute_reply": "2021-09-16T12:40:59.951078Z"}, "papermill": {"duration": 1.749593, "end_time": "2021-09-16T12:40:59.951608", "exception": false, "start_time": "2021-09-16T12:40:58.202015", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["/tmp/ipykernel_2146/3711936426.py:23: DeprecationWarning: `set_matplotlib_formats` is deprecated since IPython 7.23, directly use `matplotlib_inline.backend_inline.set_matplotlib_formats()`\n", " set_matplotlib_formats(\"svg\", \"pdf\") # For export\n", "Global seed set to 42\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Device: cuda:0\n"]}], "source": ["import os\n", "import urllib.request\n", "from urllib.error import HTTPError\n", "\n", "import matplotlib\n", "import matplotlib.pyplot as plt\n", "import pytorch_lightning as pl\n", "import seaborn as sns\n", "import torch\n", "import torch.nn as nn\n", "import torch.nn.functional as F\n", "import torch.optim as optim\n", "import torch.utils.data as data\n", "import torchvision\n", "from IPython.display import set_matplotlib_formats\n", "from pytorch_lightning.callbacks import LearningRateMonitor, ModelCheckpoint\n", "from torch.utils.tensorboard import SummaryWriter\n", "from torchvision import transforms\n", "from torchvision.datasets import CIFAR10\n", "from tqdm.notebook import tqdm\n", "\n", "# %matplotlib inline\n", "set_matplotlib_formats(\"svg\", \"pdf\") # For export\n", "matplotlib.rcParams[\"lines.linewidth\"] = 2.0\n", "sns.reset_orig()\n", "sns.set()\n", "\n", "# Tensorboard extension (for visualization purposes later)\n", "# %load_ext tensorboard\n", "\n", "# Path to the folder where the datasets are/should be downloaded (e.g. 
CIFAR10)\n", "DATASET_PATH = os.environ.get(\"PATH_DATASETS\", \"data\")\n", "# Path to the folder where the pretrained models are saved\n", "CHECKPOINT_PATH = os.environ.get(\"PATH_CHECKPOINT\", \"saved_models/tutorial9\")\n", "\n", "# Setting the seed\n", "pl.seed_everything(42)\n", "\n", "# Ensure that all operations are deterministic on GPU (if used) for reproducibility\n", "torch.backends.cudnn.determinstic = True\n", "torch.backends.cudnn.benchmark = False\n", "\n", "device = torch.device(\"cuda:0\") if torch.cuda.is_available() else torch.device(\"cpu\")\n", "print(\"Device:\", device)"]}, {"cell_type": "markdown", "id": "28912006", "metadata": {"papermill": {"duration": 0.021859, "end_time": "2021-09-16T12:40:59.996263", "exception": false, "start_time": "2021-09-16T12:40:59.974404", "status": "completed"}, "tags": []}, "source": ["We have 4 pretrained models that we have to download.\n", "Remember the adjust the variables `DATASET_PATH` and `CHECKPOINT_PATH` if needed."]}, {"cell_type": "code", "execution_count": 3, "id": "4a75be18", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:41:00.045043Z", "iopub.status.busy": "2021-09-16T12:41:00.044569Z", "iopub.status.idle": "2021-09-16T12:41:00.679694Z", "shell.execute_reply": "2021-09-16T12:41:00.679188Z"}, "papermill": {"duration": 0.661412, "end_time": "2021-09-16T12:41:00.679814", "exception": false, "start_time": "2021-09-16T12:41:00.018402", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Downloading https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial9/cifar10_64.ckpt...\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Downloading https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial9/cifar10_128.ckpt...\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Downloading https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial9/cifar10_256.ckpt...\n"]}, {"name": "stdout", 
"output_type": "stream", "text": ["Downloading https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial9/cifar10_384.ckpt...\n"]}], "source": ["# Github URL where saved models are stored for this tutorial\n", "base_url = \"https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial9/\"\n", "# Files to download\n", "pretrained_files = [\"cifar10_64.ckpt\", \"cifar10_128.ckpt\", \"cifar10_256.ckpt\", \"cifar10_384.ckpt\"]\n", "# Create checkpoint path if it doesn't exist yet\n", "os.makedirs(CHECKPOINT_PATH, exist_ok=True)\n", "\n", "# For each file, check whether it already exists. If not, try downloading it.\n", "for file_name in pretrained_files:\n", " file_path = os.path.join(CHECKPOINT_PATH, file_name)\n", " if not os.path.isfile(file_path):\n", " file_url = base_url + file_name\n", " print(\"Downloading %s...\" % file_url)\n", " try:\n", " urllib.request.urlretrieve(file_url, file_path)\n", " except HTTPError as e:\n", " print(\n", " \"Something went wrong. Please try to download the files manually,\"\n", " \" or contact the author with the full output including the following error:\\n\",\n", " e,\n", " )"]}, {"cell_type": "markdown", "id": "c8fc2858", "metadata": {"papermill": {"duration": 0.023053, "end_time": "2021-09-16T12:41:00.726214", "exception": false, "start_time": "2021-09-16T12:41:00.703161", "status": "completed"}, "tags": []}, "source": ["In this tutorial, we work with the CIFAR10 dataset.\n", "In CIFAR10, each image has 3 color channels and is 32x32 pixels large.\n", "As autoencoders do not have the constrain of modeling images probabilistic, we can work on more complex image data\n", "(i.e. 
3 color channels instead of black-and-white) much easier than for VAEs.\n", "In case you have downloaded CIFAR10 already in a different directory, make sure to set DATASET_PATH\n", "accordingly to prevent another download.\n", "\n", "In contrast to previous tutorials on CIFAR10 like\n", "[Tutorial 5](https://uvadlc-notebooks.readthedocs.io/en/latest/tutorial_notebooks/tutorial5/Inception_ResNet_DenseNet.html)\n", "(CNN classification), we do not normalize the data explicitly with a mean of 0 and std of 1,\n", "but roughly estimate it scaling the data between -1 and 1.\n", "This is because limiting the range will make our task of predicting/reconstructing images easier."]}, {"cell_type": "code", "execution_count": 4, "id": "e7a54614", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:41:00.777942Z", "iopub.status.busy": "2021-09-16T12:41:00.777448Z", "iopub.status.idle": "2021-09-16T12:41:02.307895Z", "shell.execute_reply": "2021-09-16T12:41:02.307448Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 1.558951, "end_time": "2021-09-16T12:41:02.308015", "exception": false, "start_time": "2021-09-16T12:41:00.749064", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Files already downloaded and verified\n"]}, {"name": "stderr", "output_type": "stream", "text": ["Global seed set to 42\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Files already downloaded and verified\n"]}], "source": ["# Transformations applied on each image => only make them a tensor\n", "transform = transforms.Compose([transforms.ToTensor(), transforms.Normalize((0.5,), (0.5,))])\n", "\n", "# Loading the training dataset. 
We need to split it into a training and validation part\n", "train_dataset = CIFAR10(root=DATASET_PATH, train=True, transform=transform, download=True)\n", "pl.seed_everything(42)\n", "train_set, val_set = torch.utils.data.random_split(train_dataset, [45000, 5000])\n", "\n", "# Loading the test set\n", "test_set = CIFAR10(root=DATASET_PATH, train=False, transform=transform, download=True)\n", "\n", "# We define a set of data loaders that we can use for various purposes later.\n", "train_loader = data.DataLoader(train_set, batch_size=256, shuffle=True, drop_last=True, pin_memory=True, num_workers=4)\n", "val_loader = data.DataLoader(val_set, batch_size=256, shuffle=False, drop_last=False, num_workers=4)\n", "test_loader = data.DataLoader(test_set, batch_size=256, shuffle=False, drop_last=False, num_workers=4)\n", "\n", "\n", "def get_train_images(num):\n", " return torch.stack([train_dataset[i][0] for i in range(num)], dim=0)"]}, {"cell_type": "markdown", "id": "ac14f5b0", "metadata": {"papermill": {"duration": 0.023214, "end_time": "2021-09-16T12:41:02.355175", "exception": false, "start_time": "2021-09-16T12:41:02.331961", "status": "completed"}, "tags": []}, "source": ["## Building the autoencoder\n", "\n", "In general, an autoencoder consists of an **encoder** that maps the input $x$ to a lower-dimensional feature vector $z$,\n", "and a **decoder** that reconstructs the input $\\hat{x}$ from $z$.\n", "We train the model by comparing $x$ to $\\hat{x}$ and optimizing the parameters to increase the similarity between $x$ and $\\hat{x}$.\n", "See below for a small illustration of the autoencoder framework."]}, {"cell_type": "markdown", "id": "8aa77f09", "metadata": {"papermill": {"duration": 0.023251, "end_time": "2021-09-16T12:41:02.401674", "exception": false, "start_time": "2021-09-16T12:41:02.378423", "status": "completed"}, "tags": []}, "source": ["
"]}, {"cell_type": "markdown", "id": "b4e16e51", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.023141, "end_time": "2021-09-16T12:41:02.447908", "exception": false, "start_time": "2021-09-16T12:41:02.424767", "status": "completed"}, "tags": []}, "source": ["We first start by implementing the encoder.\n", "The encoder effectively consists of a deep convolutional network, where we scale down the image layer-by-layer using strided convolutions.\n", "After downscaling the image three times, we flatten the features and apply linear layers.\n", "The latent representation $z$ is therefore a vector of size *d* which can be flexibly selected."]}, {"cell_type": "code", "execution_count": 5, "id": "7a89bc88", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:41:02.501193Z", "iopub.status.busy": "2021-09-16T12:41:02.500706Z", "iopub.status.idle": "2021-09-16T12:41:02.502735Z", "shell.execute_reply": "2021-09-16T12:41:02.502267Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 0.031646, "end_time": "2021-09-16T12:41:02.502835", "exception": false, "start_time": "2021-09-16T12:41:02.471189", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class Encoder(nn.Module):\n", " def __init__(self, num_input_channels: int, base_channel_size: int, latent_dim: int, act_fn: object = nn.GELU):\n", " \"\"\"\n", " Args:\n", " num_input_channels : Number of input channels of the image. For CIFAR, this parameter is 3\n", " base_channel_size : Number of channels we use in the first convolutional layers. 
Deeper layers might use a duplicate of it.\n", " latent_dim : Dimensionality of latent representation z\n", " act_fn : Activation function used throughout the encoder network\n", " \"\"\"\n", " super().__init__()\n", " c_hid = base_channel_size\n", " self.net = nn.Sequential(\n", " nn.Conv2d(num_input_channels, c_hid, kernel_size=3, padding=1, stride=2), # 32x32 => 16x16\n", " act_fn(),\n", " nn.Conv2d(c_hid, c_hid, kernel_size=3, padding=1),\n", " act_fn(),\n", " nn.Conv2d(c_hid, 2 * c_hid, kernel_size=3, padding=1, stride=2), # 16x16 => 8x8\n", " act_fn(),\n", " nn.Conv2d(2 * c_hid, 2 * c_hid, kernel_size=3, padding=1),\n", " act_fn(),\n", " nn.Conv2d(2 * c_hid, 2 * c_hid, kernel_size=3, padding=1, stride=2), # 8x8 => 4x4\n", " act_fn(),\n", " nn.Flatten(), # Image grid to single feature vector\n", " nn.Linear(2 * 16 * c_hid, latent_dim),\n", " )\n", "\n", " def forward(self, x):\n", " return self.net(x)"]}, {"cell_type": "markdown", "id": "76a60820", "metadata": {"papermill": {"duration": 0.023574, "end_time": "2021-09-16T12:41:02.549985", "exception": false, "start_time": "2021-09-16T12:41:02.526411", "status": "completed"}, "tags": []}, "source": ["Note that we do not apply Batch Normalization here.\n", "This is because we want the encoding of each image to be independent of all the other images.\n", "Otherwise, we might introduce correlations into the encoding or decoding that we do not want to have.\n", "In some implementations, you still can see Batch Normalization being used, because it can also serve as a form of regularization.\n", "Nevertheless, the better practice is to go with other normalization techniques if necessary like Instance Normalization or Layer Normalization.\n", "Given the small size of the model, we can neglect normalization for now."]}, {"cell_type": "markdown", "id": "56b7a01a", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.023466, "end_time": "2021-09-16T12:41:02.596962", "exception": false, "start_time": 
"2021-09-16T12:41:02.573496", "status": "completed"}, "tags": []}, "source": ["The decoder is a mirrored, flipped version of the encoder.\n", "The only difference is that we replace strided convolutions by transposed convolutions\n", "(i.e. deconvolutions) to upscale the features.\n", "Transposed convolutions can be imagined as adding the stride to the input instead of the output,\n", "and can thus upscale the input.\n", "For an illustration of a `nn.ConvTranspose2d` layer with kernel size 3, stride 2, and padding 1,\n", "see below (figure credit - [Vincent Dumoulin and Francesco Visin](https://arxiv.org/abs/1603.07285)):\n", "\n", "
\n", "\n", "You see that for an input of size $3\\times3$, we obtain an output of $5\\times5$.\n", "However, to truly have a reverse operation of the convolution,\n", "we need to ensure that the layer scales the input shape by a factor of 2 (e.g. $4\\times4\\to8\\times8$).\n", "For this, we can specify the parameter `output_padding` which adds additional values to the output shape.\n", "Note that we do not perform zero-padding with this, but rather increase the output shape for calculation.\n", "\n", "Overall, the decoder can be implemented as follows:"]}, {"cell_type": "code", "execution_count": 6, "id": "8197fb2e", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:41:02.650981Z", "iopub.status.busy": "2021-09-16T12:41:02.650503Z", "iopub.status.idle": "2021-09-16T12:41:02.652477Z", "shell.execute_reply": "2021-09-16T12:41:02.652080Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 0.032082, "end_time": "2021-09-16T12:41:02.652576", "exception": false, "start_time": "2021-09-16T12:41:02.620494", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class Decoder(nn.Module):\n", " def __init__(self, num_input_channels: int, base_channel_size: int, latent_dim: int, act_fn: object = nn.GELU):\n", " \"\"\"\n", " Args:\n", " num_input_channels : Number of channels of the image to reconstruct. For CIFAR, this parameter is 3\n", " base_channel_size : Number of channels we use in the last convolutional layers. 
Early layers might use a duplicate of it.\n", " latent_dim : Dimensionality of latent representation z\n", " act_fn : Activation function used throughout the decoder network\n", " \"\"\"\n", " super().__init__()\n", " c_hid = base_channel_size\n", " self.linear = nn.Sequential(nn.Linear(latent_dim, 2 * 16 * c_hid), act_fn())\n", " self.net = nn.Sequential(\n", " nn.ConvTranspose2d(\n", " 2 * c_hid, 2 * c_hid, kernel_size=3, output_padding=1, padding=1, stride=2\n", " ), # 4x4 => 8x8\n", " act_fn(),\n", " nn.Conv2d(2 * c_hid, 2 * c_hid, kernel_size=3, padding=1),\n", " act_fn(),\n", " nn.ConvTranspose2d(2 * c_hid, c_hid, kernel_size=3, output_padding=1, padding=1, stride=2), # 8x8 => 16x16\n", " act_fn(),\n", " nn.Conv2d(c_hid, c_hid, kernel_size=3, padding=1),\n", " act_fn(),\n", " nn.ConvTranspose2d(\n", " c_hid, num_input_channels, kernel_size=3, output_padding=1, padding=1, stride=2\n", " ), # 16x16 => 32x32\n", " nn.Tanh(), # The input images is scaled between -1 and 1, hence the output has to be bounded as well\n", " )\n", "\n", " def forward(self, x):\n", " x = self.linear(x)\n", " x = x.reshape(x.shape[0], -1, 4, 4)\n", " x = self.net(x)\n", " return x"]}, {"cell_type": "markdown", "id": "d2ea7d77", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.023491, "end_time": "2021-09-16T12:41:02.699586", "exception": false, "start_time": "2021-09-16T12:41:02.676095", "status": "completed"}, "tags": []}, "source": ["The encoder and decoder networks we chose here are relatively simple.\n", "Usually, more complex networks are applied, especially when using a ResNet-based architecture.\n", "For example, see [VQ-VAE](https://arxiv.org/abs/1711.00937) and\n", "[NVAE](https://arxiv.org/abs/2007.03898) (although the papers discuss architectures for VAEs,\n", "they can equally be applied to standard autoencoders).\n", "\n", "In a final step, we add the encoder and decoder together into the autoencoder architecture.\n", "We define the autoencoder as PyTorch 
Lightning Module to simplify the needed training code:"]}, {"cell_type": "code", "execution_count": 7, "id": "3addaf83", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:41:02.755000Z", "iopub.status.busy": "2021-09-16T12:41:02.748144Z", "iopub.status.idle": "2021-09-16T12:41:02.756989Z", "shell.execute_reply": "2021-09-16T12:41:02.756529Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 0.034085, "end_time": "2021-09-16T12:41:02.757086", "exception": false, "start_time": "2021-09-16T12:41:02.723001", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class Autoencoder(pl.LightningModule):\n", " def __init__(\n", " self,\n", " base_channel_size: int,\n", " latent_dim: int,\n", " encoder_class: object = Encoder,\n", " decoder_class: object = Decoder,\n", " num_input_channels: int = 3,\n", " width: int = 32,\n", " height: int = 32,\n", " ):\n", " super().__init__()\n", " # Saving hyperparameters of autoencoder\n", " self.save_hyperparameters()\n", " # Creating encoder and decoder\n", " self.encoder = encoder_class(num_input_channels, base_channel_size, latent_dim)\n", " self.decoder = decoder_class(num_input_channels, base_channel_size, latent_dim)\n", " # Example input array needed for visualizing the graph of the network\n", " self.example_input_array = torch.zeros(2, num_input_channels, width, height)\n", "\n", " def forward(self, x):\n", " \"\"\"The forward function takes in an image and returns the reconstructed image.\"\"\"\n", " z = self.encoder(x)\n", " x_hat = self.decoder(z)\n", " return x_hat\n", "\n", " def _get_reconstruction_loss(self, batch):\n", " \"\"\"Given a batch of images, this function returns the reconstruction loss (MSE in our case)\"\"\"\n", " x, _ = batch # We do not need the labels\n", " x_hat = self.forward(x)\n", " loss = F.mse_loss(x, x_hat, reduction=\"none\")\n", " loss = loss.sum(dim=[1, 2, 3]).mean(dim=[0])\n", " return loss\n", "\n", " def configure_optimizers(self):\n", " optimizer = 
optim.Adam(self.parameters(), lr=1e-3)\n", " # Using a scheduler is optional but can be helpful.\n", " # The scheduler reduces the LR if the validation performance hasn't improved for the last N epochs\n", " scheduler = optim.lr_scheduler.ReduceLROnPlateau(optimizer, mode=\"min\", factor=0.2, patience=20, min_lr=5e-5)\n", " return {\"optimizer\": optimizer, \"lr_scheduler\": scheduler, \"monitor\": \"val_loss\"}\n", "\n", " def training_step(self, batch, batch_idx):\n", " loss = self._get_reconstruction_loss(batch)\n", " self.log(\"train_loss\", loss)\n", " return loss\n", "\n", " def validation_step(self, batch, batch_idx):\n", " loss = self._get_reconstruction_loss(batch)\n", " self.log(\"val_loss\", loss)\n", "\n", " def test_step(self, batch, batch_idx):\n", " loss = self._get_reconstruction_loss(batch)\n", " self.log(\"test_loss\", loss)"]}, {"cell_type": "markdown", "id": "5ce14e90", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.02353, "end_time": "2021-09-16T12:41:02.804310", "exception": false, "start_time": "2021-09-16T12:41:02.780780", "status": "completed"}, "tags": []}, "source": ["For the loss function, we use the mean squared error (MSE).\n", "The mean squared error pushes the network to pay special attention to those pixel values its estimate is far away.\n", "Predicting 127 instead of 128 is not important when reconstructing, but confusing 0 with 128 is much worse.\n", "Note that in contrast to VAEs, we do not predict the probability per pixel value, but instead use a distance measure.\n", "This saves a lot of parameters and simplifies training.\n", "To get a better intuition per pixel, we report the summed squared error averaged over the batch dimension\n", "(any other mean/sum leads to the same result/parameters).\n", "\n", "However, MSE has also some considerable disadvantages.\n", "Usually, MSE leads to blurry images where small noise/high-frequent patterns are removed as those cause a very low error.\n", "To ensure realistic 
images to be reconstructed, one could combine Generative Adversarial Networks\n", "(lecture 10) with autoencoders as done in several works (e.g. see [here](https://arxiv.org/abs/1704.02304),\n", "[here](https://arxiv.org/abs/1511.05644) or these [slides](http://elarosca.net/slides/iccv_autoencoder_gans.pdf)).\n", "Additionally, comparing two images using MSE does not necessarily reflect their visual similarity.\n", "For instance, suppose the autoencoder reconstructs an image shifted by one pixel to the right and bottom.\n", "Although the images are almost identical, we can get a higher loss than predicting a constant pixel value for half of the image (see code below).\n", "An example solution for this issue includes using a separate, pre-trained CNN,\n", "and use a distance of visual features in lower layers as a distance measure instead of the original pixel-level comparison."]}, {"cell_type": "code", "execution_count": 8, "id": "031f9cd6", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:41:02.857901Z", "iopub.status.busy": "2021-09-16T12:41:02.852996Z", "iopub.status.idle": "2021-09-16T12:41:03.403790Z", "shell.execute_reply": "2021-09-16T12:41:03.403315Z"}, "papermill": {"duration": 0.576043, "end_time": "2021-09-16T12:41:03.403902", "exception": false, "start_time": "2021-09-16T12:41:02.827859", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["/usr/local/lib/python3.9/dist-packages/torchvision/utils.py:50: UserWarning: range will be deprecated, please use value_range instead.\n", " warnings.warn(warning)\n"]}, {"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:41:02.925215\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}, {"name": "stderr", "output_type": "stream", "text": ["/usr/local/lib/python3.9/dist-packages/torchvision/utils.py:50: UserWarning: range will be deprecated, please use value_range instead.\n", " warnings.warn(warning)\n"]}, {"data": {"application/pdf": "JVBERi0xLjQKJazcIKu6CjEgMCBvYmoKPDwgL1BhZ2VzIDIgMCBSIC9UeXBlIC9DYXRhbG9nID4+CmVuZG9iago4IDAgb2JqCjw8IC9FeHRHU3RhdGUgNCAwIFIgL0ZvbnQgMyAwIFIgL1BhdHRlcm4gNSAwIFIKL1Byb2NTZXQgWyAvUERGIC9UZXh0IC9JbWFnZUIgL0ltYWdlQyAvSW1hZ2VJIF0gL1NoYWRpbmcgNiAwIFIKL1hPYmplY3QgNyAwIFIgPj4KZW5kb2JqCjExIDAgb2JqCjw8IC9Bbm5vdHMgMTAgMCBSIC9Db250ZW50cyA5IDAgUgovR3JvdXAgPDwgL0NTIC9EZXZpY2VSR0IgL1MgL1RyYW5zcGFyZW5jeSAvVHlwZSAvR3JvdXAgPj4KL01lZGlhQm94IFsgMCAwIDIyNS44IDEzOC4yNDUgXSAvUGFyZW50IDIgMCBSIC9SZXNvdXJjZXMgOCAwIFIgL1R5cGUgL1BhZ2UKPj4KZW5kb2JqCjkgMCBvYmoKPDwgL0ZpbHRlciAvRmxhdGVEZWNvZGUgL0xlbmd0aCAxMiAwIFIgPj4Kc3RyZWFtCnicTY9BT8MwDIXv/hXv2B6WxG7TZtw2DSoQHIYicUAcUNcBhTGVSOzv44wxEelF71nxZ4cxkl0wXhL0gsOoOqjvcianaUci3gR1HyfHVTBSe83un38l2tKE1shRwmxqsAumFXwNeMAn7EJ+J42qgxI72NXw/dYP990SfdJ2YUGeym5+RvU72GvGao81rTH9YZxhrzufaTl2pypNxEqZKQh1Y1xTu0Y8WNjMM5CWEfaKtYC4PX4zbugRxd1zei9ReYXk98WwwQy3JbjRvtaFKh8U+5QuwD6YOpR4Qryhy0i6HP0AtdVHYAplbmRzdHJlYW0KZW5kb2JqCjEyIDAgb2JqCjIzMQplbmRvYmoKMTAgMCBvYmoKWyBdCmVuZG9iagoxOCAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDYxID4+CnN0cmVhbQp4nDM1NVcwULC0ABKmpkYK5kaWCimGXEA+iJXLZWhpDmblgFkWxkAGSBmcYQCkwZpzYHpyuDK40gDLFRDMCmVuZHN0cmVhbQplbmRvYmoKMTkgMCBvYmoKPDwgL0ZpbHRlciAvRmxhdGVEZWNvZGUgL0xlbmd0aCA5MCA+PgpzdHJlYW0KeJw9jssNwDAIQ+9MwQjhUwL7VFUPyf7Xhnx6wQ9byLgJFgwfo9qFlQNvgrEndWBdXgMVQhYZZOTbOxeLSmYWv5omqRPSJHHeRKE7TUqdD7TT2+CF5wP16R3sCmVuZHN0cmVhbQplbmRvYmoKMjAgMCBvYmoKPDwgL0ZpbHRlciAvRmxhdGVEZWNvZGUgL0xlbmd0aCAzMDcgPj4Kc3RyZWFtCnicPZJLbgMxDEP3PoUuEMD62Z7zpCi6mN5/2ycl6Yoc2RZFapa6TFlTHpA0k4R/6fBwsZ3yO2zPZmbgWqKXieWU59AVYu6ifNnMRl1ZJ8XqhGY6t+hRORcHNk2qn6sspd0ueA7XJp5b9hE/vNCgHtQ1Lgk3dFejZSk0Y6r7f9J7/Iwy4GpMXWxSq3sfPF5EVejoB0eJImOXF+fjQQnpSsJoWoiVd0UDQe7ytMp7Ce7b3mrIs
gepmM47KWaw63RSLm4XhyEeyPKo8OWj2GtCz/iwKyX0SNiGM3In7mjG5tTI4pD+3o0ES4+uaCHz4K9u1i5gvFM6RWJkTnKsaYtVTvdQFNO5w70MEPVsRUMpc5HV6l/DzgtrlmwWeEr6BR6j3SZLDlbZ26hO76082dD3H1rXdB8KZW5kc3RyZWFtCmVuZG9iagoyMSAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDczID4+CnN0cmVhbQp4nDM2NlcwUDA0BJFGRgYKpkBWiiEXSMDQyEQhlwskCGLlgFkGQBqiOAeuJocrA8wGaYWoB7Eg6o0tjaEqESyIbAZXGgCnyBevCmVuZHN0cmVhbQplbmRvYmoKMjIgMCBvYmoKPDwgL0ZpbHRlciAvRmxhdGVEZWNvZGUgL0xlbmd0aCAyMzEgPj4Kc3RyZWFtCnicNU85kgQhDMt5hT4wVRjbQL+np7Y22Pl/upKZTpDwIcnTEx2ZeJkjI7Bmx9taZCBm4FNMxb/2tA8TqvfgHiKUiwthhpFw1qzjbp6OF/92lc9YB+82+IpZXhDYwkzWVxZnLtsFY2mcxDnJboxdE7GNda2nU1hHMKEMhHS2w5Qgc1Sk9MmOMuboOJEnnovv9tssdjl+DusLNo0hFef4KnqCNoOi7HnvAhpyQf9d3fgeRbvoJSAbCRbWUWLunOWEX712dB61KBJzQppBLhMhzekqphCaUKyzo6BSUXCpPqforJ9/5V9cLQplbmRzdHJlYW0KZW5kb2JqCjIzIDAgb2JqCjw8IC9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9MZW5ndGggMjQ5ID4+CnN0cmVhbQp4nD1QO45EIQzrOYUv8CTyI3AeRqstZu/frgOaKVBMfrYzJNARgUcMMZSv4yWtoK6Bv4tC8W7i64PCIKtDUiDOeg+IdOymNpETOh2cMz9hN2OOwEUxBpzpdKY9ByY5+8IKhHMbZexWSCeJqiKO6jOOKZ4qe594FiztyDZbJ5I95CDhUlKJyaWflMo/bcqUCjpm0QQsErngZBNNOMu7SVKMGZQy6h6mdiJ9rDzIozroZE3OrCOZ2dNP25n4HHC3X9pkTpXHdB7M+Jy0zoM5Fbr344k2B02N2ujs9xNpKi9Sux1anX51EpXdGOcYEpdnfxnfZP/5B/6HWiIKZW5kc3RyZWFtCmVuZG9iagoyNCAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDM5NSA+PgpzdHJlYW0KeJw9UktuxUAI2+cUXKDS8JvPeVJV3bz7b2tDUqkqvIkxxjB9ypC55UtdEnGFybderls8pnwuW1qZeYi7i40lPrbcl+4htl10LrE4HUfyCzKdKkSozarRofhCloUHkE7woQvCfTn+4y+AwdewDbjhPTJBsCTmKULGblEZmhJBEWHnkRWopFCfWcLfUe7r9zIFam+MpQtjHPQJtAVCbUjEAupAAETslFStkI5nJBO/Fd1nYhxg59GyAa4ZVESWe+zHiKnOqIy8RMQ+T036KJZMLVbGblMZX/yUjNR8dAUqqTTylPLQVbPQC1iJeRL2OfxI+OfWbCGGOm7W8onlHzPFMhLOYEs5YKGX40fg21l1Ea4dubjOdIEfldZwTLTrfsj1T/5021rNdbxyCKJA5U1B8LsOrkaxxMQyPp2NKXqiLLAamrxGM8FhEBHW98PIAxr9crwQNKdrIrRYIpu1YkSNimxzPb0E1kzvxTnWwxPCbO+d1qGyMzMqIYLauoZq60B2s77zcLafPzPoom0KZW5kc3RyZWFtCmVuZG9iagoyNSAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDI0OSA+PgpzdHJlYW0KeJxNUUmKAzAMu+cV+kAhXpO8p0OZQ+f/18oOhTkECa+Sk5aYWAsPMYQfLD34kSFzN/0bfqLZu1l6ksnZ/
5jnIlNR+FKoLmJCXYgbz6ER8D2haxJZsb3xOSyjmXO+Bx+FuAQzoQFjfUkyuajmlSETTgx1HA5apMK4a2LD4lrRPI3cbvtGZmUmhA2PZELcGICIIOsCshgslDY2EzJZzgPtDckNWmDXqRtRi4IrlNYJdKJWxKrM4LPm1nY3Qy3y4Kh98fpoVpdghdFL9Vh4X4U+mKmZdu6SQnrhTTsizB4KpDI7LSu1e8TqboH6P8tS8P3J9/gdrw/N/FycCmVuZHN0cmVhbQplbmRvYmoKMjYgMCBvYmoKPDwgL0ZpbHRlciAvRmxhdGVEZWNvZGUgL0xlbmd0aCA5NCA+PgpzdHJlYW0KeJxFjcERwCAIBP9UQQkKCtpPJpOH9v+NEDJ8YOcO7oQFC7Z5Rh8FlSZeFVgHSmPcUI9AveFyLcncBQ9wJ3/a0FScltN3aZFJVSncpBJ5/w5nJpCoedFjnfcLY/sjPAplbmRzdHJlYW0KZW5kb2JqCjI3IDAgb2JqCjw8IC9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9MZW5ndGggNTQgPj4Kc3RyZWFtCnicMzYzVDBQMLFUMDI2UTA2NAJiE4UUQy6gCIiVywUTywGzQKpyuKDKc2CqcrgyuNIABRgOMgplbmRzdHJlYW0KZW5kb2JqCjI4IDAgb2JqCjw8IC9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9MZW5ndGggODMgPj4Kc3RyZWFtCnicPcw5EoAwCAXQnlP8I4TIIvdxHIt4/1Yw0QYeq3qgITiDusGt4WDKunQT71Pj1cacEgmoeEpNlroLetS0vtS+aOC76+ZL1Yk/zc8XnQ+7HRndCmVuZHN0cmVhbQplbmRvYmoKMjkgMCBvYmoKPDwgL0ZpbHRlciAvRmxhdGVEZWNvZGUgL0xlbmd0aCAyMTggPj4Kc3RyZWFtCnicPVC5jQQxDMtdhRpYwHrtqWcWi0um//RI+fYi0RZFUio1mZIpL3WUJVlT3jp8lsQOeYblbmQ2JSpFL5OwJffQCvF9ieYU993VlrNDNJdoOX4LMyqqGx3TSzaacCoTuqDcwzP6DW10A1aHHrFbINCkYNe2IHLHDxgMwZkTiyIMSk0G/65yj59eixs+w/FDFJGSDuY1/1j98nMNr1OPJ5Fub77iXpypDgMRHJKavCNdWLEuEhFpNUFNz8BaLYC7t17+G7QjugxA9onEcZpSjqG/a3Clzy/lJ1PYCmVuZHN0cmVhbQplbmRvYmoKMzAgMCBvYmoKPDwgL0ZpbHRlciAvRmxhdGVEZWNvZGUgL0xlbmd0aCA4MyA+PgpzdHJlYW0KeJxFjLsNwDAIRHumYAR+JvY+UZTC3r8NECVuuCfdPVwdCZkpbjPDQwaeDCyGXXGB9JYwC1xHUI6d7KNh1b7qBI31plLz7w+Unuys4obrAQJCGmYKZW5kc3RyZWFtCmVuZG9iagozMSAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDUxID4+CnN0cmVhbQp4nDM2tFAwUDA0MAeSRoZAlpGJQoohF0gAxMzlggnmgFkGQBqiOAeuJocrgysNAOG0DZgKZW5kc3RyZWFtCmVuZG9iagozMiAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDMzNCA+PgpzdHJlYW0KeJwtUktyxSAM23MKXaAz+AfkPOl0uni9/7aSk0VGDmD0MeWGiUp8WSC3o9bEt43MQIXhr6vMhc9I28g6iMuQi7iSLYV7RCzkMcQ8xILvq/EeHvmszMmzB8Yv2XcPK/bUhGUh48UZ2mEVx2EV5FiwdSGqe3hTpMOpJNjji/8+xXMtBC18RtCAX+Sfr47g+ZIWafeYbdOuerBMO6qksBxsT3NeJl9aZ7k6Hs8Hyfau2BFSuwIUhbkzznPhKNNWRrQWdjZIalxsb479WErQhW5cRoojkJ+pIjygpMnMJgrij
5wecioDYeqarnRyG1Vxp57MNZuLtzNJZuu+SLGZwnldOLP+DFNmtXknz3Ki1KkI77FnS9DQOa6evZZZaHSbE7ykhM/GTk9Ovlcz6yE5FQmpYlpXwWkUmWIJ2xJfU1FTmnoZ/vvy7vE7fv4BLHN8cwplbmRzdHJlYW0KZW5kb2JqCjMzIDAgb2JqCjw8IC9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9MZW5ndGggMTggPj4Kc3RyZWFtCnicMza0UDCAwxRDrjQAHeYDUgplbmRzdHJlYW0KZW5kb2JqCjE2IDAgb2JqCjw8IC9CYXNlRm9udCAvRGVqYVZ1U2FucyAvQ2hhclByb2NzIDE3IDAgUgovRW5jb2RpbmcgPDwKL0RpZmZlcmVuY2VzIFsgMzIgL3NwYWNlIDQ1IC9oeXBoZW4gL3BlcmlvZCA0OSAvb25lIDUyIC9mb3VyIC9maXZlIDU2IC9laWdodCA1OCAvY29sb24KNzYgL0wgL00gOTcgL2EgMTAwIC9kIC9lIDEwNyAvayAxMTEgL28gMTE1IC9zIF0KL1R5cGUgL0VuY29kaW5nID4+Ci9GaXJzdENoYXIgMCAvRm9udEJCb3ggWyAtMTAyMSAtNDYzIDE3OTQgMTIzMyBdIC9Gb250RGVzY3JpcHRvciAxNSAwIFIKL0ZvbnRNYXRyaXggWyAwLjAwMSAwIDAgMC4wMDEgMCAwIF0gL0xhc3RDaGFyIDI1NSAvTmFtZSAvRGVqYVZ1U2FucwovU3VidHlwZSAvVHlwZTMgL1R5cGUgL0ZvbnQgL1dpZHRocyAxNCAwIFIgPj4KZW5kb2JqCjE1IDAgb2JqCjw8IC9Bc2NlbnQgOTI5IC9DYXBIZWlnaHQgMCAvRGVzY2VudCAtMjM2IC9GbGFncyAzMgovRm9udEJCb3ggWyAtMTAyMSAtNDYzIDE3OTQgMTIzMyBdIC9Gb250TmFtZSAvRGVqYVZ1U2FucyAvSXRhbGljQW5nbGUgMAovTWF4V2lkdGggMTM0MiAvU3RlbVYgMCAvVHlwZSAvRm9udERlc2NyaXB0b3IgL1hIZWlnaHQgMCA+PgplbmRvYmoKMTQgMCBvYmoKWyA2MDAgNjAwIDYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwIDYwMAo2MDAgNjAwIDYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwIDMxOCA0MDEgNDYwIDgzOCA2MzYKOTUwIDc4MCAyNzUgMzkwIDM5MCA1MDAgODM4IDMxOCAzNjEgMzE4IDMzNyA2MzYgNjM2IDYzNiA2MzYgNjM2IDYzNiA2MzYgNjM2CjYzNiA2MzYgMzM3IDMzNyA4MzggODM4IDgzOCA1MzEgMTAwMCA2ODQgNjg2IDY5OCA3NzAgNjMyIDU3NSA3NzUgNzUyIDI5NQoyOTUgNjU2IDU1NyA4NjMgNzQ4IDc4NyA2MDMgNzg3IDY5NSA2MzUgNjExIDczMiA2ODQgOTg5IDY4NSA2MTEgNjg1IDM5MCAzMzcKMzkwIDgzOCA1MDAgNTAwIDYxMyA2MzUgNTUwIDYzNSA2MTUgMzUyIDYzNSA2MzQgMjc4IDI3OCA1NzkgMjc4IDk3NCA2MzQgNjEyCjYzNSA2MzUgNDExIDUyMSAzOTIgNjM0IDU5MiA4MTggNTkyIDU5MiA1MjUgNjM2IDMzNyA2MzYgODM4IDYwMCA2MzYgNjAwIDMxOAozNTIgNTE4IDEwMDAgNTAwIDUwMCA1MDAgMTM0MiA2MzUgNDAwIDEwNzAgNjAwIDY4NSA2MDAgNjAwIDMxOCAzMTggNTE4IDUxOAo1OTAgNTAwIDEwMDAgNTAwIDEwMDAgNTIxIDQwMCAxMDIzIDYwMCA1MjUgNjExIDMxOCA0MDEgNjM2I
DYzNiA2MzYgNjM2IDMzNwo1MDAgNTAwIDEwMDAgNDcxIDYxMiA4MzggMzYxIDEwMDAgNTAwIDUwMCA4MzggNDAxIDQwMSA1MDAgNjM2IDYzNiAzMTggNTAwCjQwMSA0NzEgNjEyIDk2OSA5NjkgOTY5IDUzMSA2ODQgNjg0IDY4NCA2ODQgNjg0IDY4NCA5NzQgNjk4IDYzMiA2MzIgNjMyIDYzMgoyOTUgMjk1IDI5NSAyOTUgNzc1IDc0OCA3ODcgNzg3IDc4NyA3ODcgNzg3IDgzOCA3ODcgNzMyIDczMiA3MzIgNzMyIDYxMSA2MDUKNjMwIDYxMyA2MTMgNjEzIDYxMyA2MTMgNjEzIDk4MiA1NTAgNjE1IDYxNSA2MTUgNjE1IDI3OCAyNzggMjc4IDI3OCA2MTIgNjM0CjYxMiA2MTIgNjEyIDYxMiA2MTIgODM4IDYxMiA2MzQgNjM0IDYzNCA2MzQgNTkyIDYzNSA1OTIgXQplbmRvYmoKMTcgMCBvYmoKPDwgL0wgMTggMCBSIC9NIDE5IDAgUiAvYSAyMCAwIFIgL2NvbG9uIDIxIDAgUiAvZCAyMiAwIFIgL2UgMjMgMCBSCi9laWdodCAyNCAwIFIgL2ZpdmUgMjUgMCBSIC9mb3VyIDI2IDAgUiAvaHlwaGVuIDI3IDAgUiAvayAyOCAwIFIgL28gMjkgMCBSCi9vbmUgMzAgMCBSIC9wZXJpb2QgMzEgMCBSIC9zIDMyIDAgUiAvc3BhY2UgMzMgMCBSID4+CmVuZG9iagozIDAgb2JqCjw8IC9GMSAxNiAwIFIgPj4KZW5kb2JqCjQgMCBvYmoKPDwgL0ExIDw8IC9DQSAwIC9UeXBlIC9FeHRHU3RhdGUgL2NhIDEgPj4KL0EyIDw8IC9DQSAxIC9UeXBlIC9FeHRHU3RhdGUgL2NhIDEgPj4gPj4KZW5kb2JqCjUgMCBvYmoKPDwgPj4KZW5kb2JqCjYgMCBvYmoKPDwgPj4KZW5kb2JqCjcgMCBvYmoKPDwgL0kxIDEzIDAgUiA+PgplbmRvYmoKMTMgMCBvYmoKPDwgL0JpdHNQZXJDb21wb25lbnQgOCAvQ29sb3JTcGFjZSAvRGV2aWNlUkdCCi9EZWNvZGVQYXJtcyA8PCAvQ29sb3JzIDMgL0NvbHVtbnMgMjEyIC9QcmVkaWN0b3IgMTAgPj4KL0ZpbHRlciAvRmxhdGVEZWNvZGUgL0hlaWdodCAxMDkgL0xlbmd0aCAzNCAwIFIgL1N1YnR5cGUgL0ltYWdlCi9UeXBlIC9YT2JqZWN0IC9XaWR0aCAyMTIgPj4Kc3RyZWFtCnic7V3JjyRXXn6xZkbulVWVtXZ3ubvdjd243TMej4ZmGHmYy3BhERck/gIkbvwLXDkjODBC4ogAjdBIiGWsQXgksGXLjPdeXVvXlhlVGRmRGUsGh/d9UT3tLIQ0BZFCv+9SP0W8ePHq6eX74rc+pQQCgUAgEAgEAoFAIPj/BuOrl+7/2ne04Pt9LVTMqRYW3VwLV5dqWlju1rWw1GlqwbUcLdgVDz1atv7bH/haiFP0s9Bpa8HMEi1MJhMtjMfjYkhVr6qFTGVaCKNAC+1OC41y3IonMV6rMBLLsrTQbDS0UK9j2I6DniM+lRsmOjTtFzpMc0zXH/7xn6mfx5/8wVtK8N/ij/707ReumLOaCQT/F5DFJygN9lcvffTxR1o4PTnRwkIFt4xFSEsZSNbweloYTcHRQQZKzQ1XC+EYtBVGoNQkA48fWyCyqo2n0hS3LPN8bJVKhV2N0GyKPo3xohZMUKtKSNyeDUoNyJv9LNVCrQbaNUxQs8GvBWWafBe+BNIEgmVzIgSXAdn5BKVBFp+gNMygXc+mCgzaVNfIti+tQDnt9bpoXPCXgaeiCbTUcQL6y3nL9aj/UtvNp2jT7kJ9ThPcch02ViqDIqssFyOZxHhLkqLzGm/ZdTxY5ZXUAFmbOTg9pZpP2
lcN6r/BaMSewbYm2wzPTpXg8iA7n6A0yOITlIYZtFs1oBI2m1Agb28saGHRwxVnCtYL+lAksynWcTTC4yZVw1YHpl2bPOifDnGF7+82QbvDM7BeTMVWKRVR8cxJlwVLJnGE12Xoy6FqnNFwbZNcJxNccR18UphTjHYSQFtX1NYrVJ/TKcj6NJgoweVBdj5BaZDFJygNM2h3oYKLHvmr3YD+uNyCJTabQv+kGqosmyxFI+1kStYjudpUNrMJuDK30Pjw0MetBF0Ow7AYUpiB3BsePbkTNLMU+jQN0KVFn3I0wltqTpsDQJsx7d5RAtqdKtzyA3xR+COMPwjRZpzIb/UyIbMpKA2y+ASlYQbt9jpwiTYdMGm1CsG0wE0ezcVJCvqbUg/NczBaETeVxeCvaU6llTSa29A6hzF02yzDu0L6f9VzDt9hgB52J2jvMNyrFWAAybMjLUQ+iPvq8sv413pXtGA0YS6eDI61EATo8PQMtHt8CtZ+vH2GsTE0S3ApkJ1PUBpk8QlKwwzaXe/BfttyoeU1aiBHg7ypqBsaVGAnETjOJP8uNqFj1uvg8bNTcFy7BaV1SOvx0x3S3wTU5p6zrtqoUV92QIVPTnwtjHPavantdloI97p/5028dx/fBnmINu0lqO2TED0HAX6HFQe3rqyin15vRQsHZOSnH24rwS8M2fkEpUEWn6A0zKDdbhOarB37Wqg4aFarwAM7iUCXCX2jnQ78vzkNuXGGlZ0kYKsa83f2juAkffgEWufhEP3QoKu2vHPV8re/8zUtbK6hh79+76EWfvrFMy0Usc22iQEM/UP0OcTrmk2GK2eMoK7iikuNvmbgSsqw56vr63i8D5f0vwjtXgZk5xOUBll8gtIwy8jcXdJC1AddmgZVwhBsG8WgJNugTZg+2WI5Rwl4sLMA3TZmtNKj7T0tnJxRD6W12aK3t1Ut/MaqZ8PMW+WQXm6taWG/i/YHJNlJiPe+/9nnGBJt1EmDruE2FNgiObfdxhdFc0r/L23jeYy3by3XleDyIDufoDTI4hOUhlkhVUvLEBhJZTK51T8baCEZQe8zs8K3C2rLqRo3GrAtJwr9fPLwMy0E9MxWq4ja8lzGcdVBfwsW9V6l3ntwoIU0RrNJe1ULy128xVCg1CQFNYcMch7RthwzgMrgJ0FRL8RhmlDOBGCHkWApE4FzfjYILgWy8wlKgyw+QWmYQbuqqCBBL2eBCk2yNcWcIC5fkwHMCfm34sG3e/wMHB0eg7VvkCuZ46uqZNvbNzfQ4eS8SlXKWhZn5H3bgnW66UIDXVy4ic5fvqqFx1/+uxY+/WxXC65DAs1R5CpNMQMm1W3HxbumzBsqosUMQ36rlwmZTUFpkMUnKA0zaLdIkjWSiNegJI5GILuYqTSpCU02CGGJPQtBshtX0Hme4ta1JfDXjQ1QWzjGlY1b97Tg5mDbwWkRvqW8Duze6gSq6JVV+Ft9Vre4/ksIV24t1Ci8iq6OMKSBj/E7JGszh7qdMCWKZKsyqsZFuYzCbS24FMjOJygNsvgEpWEG7WYG/a2MKSroxquC0RqsbrF3VGTZIG3Hdlhm6gA65pgZPS+vgG2/9xYo8uEuilQ0N2DZXlqE9fjw6KAYUqdDlpwyAoqm4MMjvMWu+lo48ve1sLsPldZxMNpOG5waRSyTZePnZ5Bcp+Rfk8W1DCryYmO+XMjOJygNsvgEpWEG7XZYVCq1QbsBK0jkjJs6HfpaePr0gG3AcV4VC3r/EZTclSrstxsb1/CK9etacIbULWm+3nz9m7jwbLcYkpeCuDOFkYxGENZq4OuYeb5GHePfrDMCuQMqH54g7PnwAPlKCQtHj1ltUjEQul6BJTzmsQuF/VlwKZCdT1AaZPEJSsMM2h36OAHBjmGbdQqfJnN6bBaOCAOYbReaUEg7jKSK+qDd3gZOK9i4+5YWfraDiKbPH0C4v4Yiz76PKys3Xi+GZCokBccT8G+H+cJnhxitx8DjtS67ymBAd
u4iuSmiIvxvP/qhFna2Ef9snVMqi0tTt00K/3VybvcW/OKQnU9QGmTxCUrDDNotTgfIItBuUQnZpJM3Y95Qn0Rkn9Fsy+N+1mgZfvO7v66Fzdvf0sLf/OAvtLBKzdRi1PHuIyTkrl5/tRhSdRHhUvWc0Vl90KU3BaXGrNdxPITQWX5JC4urW1qIAkQ7m0wkylwouYWROWGQs8ECXAaPFCzirwSXAtn5BKVBFp+gNMzgEVZ7UhmVu8K5SUeoylkug6UZVXcR/tPVOqj569+4rYVX7oNtB4ew1lZSXwvXN1GtcWqgo9UejMbp+DyBKPSLgpO4mEQYecaY6oe7O1r4z5+9q4X738JTi6tQt8+GIGs6e9XSFr4NpoUDNybJ8vvh9AijnQz52FdQrSFsOz5+qoVi0iqctJMA/+M/fYChLi0iVGyTk/YGJ+3bv/v7Whgc4oPkX//qz9HmDiatyriyzrW7Wli59Q0tmPVuMbY45ZlKEatcsib2gwefauG5SYOR/9V7OHb5YB8HQb79o7/UQv8UFobnJg0h4il7/p9Mmux8gtIgi09QGmTxCUrDjG++KU0M0QTfKC4NInZRUcUEx99cg6Wj6mEdb11D8tjr3/6uFtZu44vkg5/+QAtXr+CLZPXOa3jF8g28gh9P4TgohhSdwcJysIfaZIMDfDZlCQwrXhOelSVWHd3ee18LK2vIiEtD9Jnz2GljhHS4LOfRIPzm9SqMHVxl7lyFVqivYN4mrZgxNceTJjufoDTI4hOUhhm061i4OKCrIGOOmVdDrprFoLceLSzbe74WbvzO97Ww+dr32SVYJhlC52+zVvgyk9ZGNjjlo/f/QwuT6PzUybMzdH68+yUGwJM8qlWMduMl0MTdW3CHpFad/1EHgssTucbgi/ApogYL3kz5ewwYPFFbRD8r64vqAszbpBUzpuZ40mTnE5QGWXyC0jCDdicR63fz+EmDxbIdk/lsTGzzGrj1m7/3W1q4/xvf00JricdXPPpECxYf94eIAjx6gqJpe0Ns4G//3d9qoeGdx6yPJ1C4VldAPa0mdMnHO+CUmJ1317e0cOu1N/A8A/v6PtS9cIxf3SBi0bQc/+w4groaMGcvZxbBKx11EeZt0ooZU3M8abLzCUqDLD5BaZhlZOaxkYrp0wYLaqc8/sqgUbFaQWTcvTewXRfHR338AcyVgz2E6E1Y9Ww4gGd6+8HHWghyqIROhjaN4vRopVpVqE7LCx0t7B8gID5l9EM4BNFsP/6Sz8EjHgSwuFZtDDut9LRwkmL8ngdza43HkHg2eGfIMjTp9DzW4QXM26QVM6bmeNJk5xOUBll8gtIwMy6cFTlTHijF8LeMRsWY8fQrbdg5/+GHf6+F7gr27d4aws7ikIXJHOzJjTr0L5slV+rkndUeTwEZ9osBeRYePDlC9lrCqLtmFRt+TJr4ghbX/U9xDsckZa03Hl+dFe/dJD3V8c+aFVBYlXyxwILmr9y5zhG9r17EfE1aMWNqjidNdj5BaZDFJygNs7TdKZySLlWnqs1g+eKwCnoAp0zVPj6GJhUcQfCSX0Yb5pp3F+Dm66wzVj5DlM7uHqqo5DxG2jTPx1ZEz1s8ErLOYm3UKZVVSFQqM56aafI/OmN0UFwBpzTXMYCRh8ZDnl45HuGXudgCcSz1LnRTztukFTOm5njSZOcTlAZZfILSMIN2TQOKUrUChSWnmlb3sG/Xm6CAkAc5LzZd9ojG8Smqp01N3AodbPIrK0jnnsbYrm/f3dTCOz/+Zzyen4dUOSwSGgUIWGo1Yed0bXCKxYKqwRhDeryPgFt/gCFNDPS5fBu/uo0O9b4cgxwc4xXumGzFWjNReH4Q5guYt0krZkzN86RddEMg+N+GLD5BaZhBuy5Tw0OetmjRUTil6TJkBorF8t8VF+TiOGjsMqul3cKVZ6zxHW6AL3pXEEC7e4hSoXfe/FUtBEd7xZAefQ4b7CjwMW4Lmle7jZ3foJl3fxcPfvkEdlqzg
gG0VjHI5S4IyCDdGH20WRgwyrcHU/BmB4bfBx8/Uxdg3iatmDE1x5MmO5+gNMjiE5SGGbS7sszzI08QwxOx1jaPmlK5CRXG5onIrRbciy4djtEIQTUej39WPKr53Xfe0cL12+CUnR1sziZNsrXKeSSzRebyPOzzowAMEkUQUjpVGx4a3//6LS1UmXqTWrDuFomr0TYYxBwiOqhXa2rha7dg7+11EF383v4jdQHmbdKs53y7cztpsvMJSoMsPkFpmEG7V69AFWob2FQfbGO/PTiCmhYzu6TRQA+j0NdCNkWUjsWV3T+CUjYMYLccJ1CprBxPNRvQkg6egbZ2eNKGUmqag1ZWlsFTxhRcMPARRFSpY0idNijAZQ7pJKajk5UrRgwPjgMaRacY7c0ra1pYZ2G17R3Q3MlRqC7AvE1aMWNqjidNdj5BaZDFJygNM2i3tUDNixvmQo+5PHXYG48PYEod089ou7BAxkUmDc/KShgCdBrBb1inbjUOsZNHY0TbxnwqS859gnmOAQRnUB1bLZ7o3IJSFhUFwU/wlkYDWl5RJNRIeSKmDe8kj7hSrotXbN3cQochGv/kJzDYfvjZoboA8zZpxYypOZ402fkEpUEWn6A0zKBdmyWMqi2oOd0GC4KzPKDj8fQpOvVUhjZeFdbFjLFA2QRbultDY6eol2iBCCY8zirmMRj5c/paUaM859mQTFQ970q5YCV/gNdFDBhud8BuNqnEZHppyFimg2PomwNql8MRtMt//DGqZh9cqLfN3aQVM6bmeNJk5xOUBll8gtIwg3YDmhCVhaJGjTr2a8d78SDkdpvlic4iCnA4BgxhTcZMF3VhgazSlZkyAMlmSJLLn4NTOdfXDB57WaN5tsguSjPQhMsCTa0OWKnfBykMSU+tLgYQpnjvF09gnv3kQxQuXmHg0EqRncrDRpZoiX3SPzeA45+ds0krZkzN8aTJzicoDbL4BKVhBu3u4PwmNfFBE81l6DJVj6oQuEV1u+ghGEGr8X0IgxNml2CTVtYUpDBlCcEsoyWZxZ2KX0NxDKRSymIMUkT1MKfj0aG/Mg3hr8xoOM2YJuMzg4blIlSffPf4CwzOP2GbERqttle18Oo1FC7mQ+rdx/yXiHmbtGLG1BxPmux8gtIgi09QGmbQbuYgAidx39TCZAo1x0wR51NtY3vvLINlForqviHUHL8PV6B/DOKIRjwqMqWRM8fqn7Juw5jFjV2XbZSyWINiOEaziCV/HVZlbPIA56kJO2eS4HWVOqsyOhhtx8V/dEN1tHD3HtS023fvaWHrJvJ0vvkrIJedPRY6fvex+nnM26RZz5XWnNtJk51PUBpk8QkEAoFAIBAIBAKBQCAQXBr+C7mW3JsKZW5kc3RyZWFtCmVuZG9iagozNCAwIG9iago0NTE5CmVuZG9iagoyIDAgb2JqCjw8IC9Db3VudCAxIC9LaWRzIFsgMTEgMCBSIF0gL1R5cGUgL1BhZ2VzID4+CmVuZG9iagozNSAwIG9iago8PCAvQ3JlYXRpb25EYXRlIChEOjIwMjEwOTE2MTQ0MTAzKzAyJzAwJykKL0NyZWF0b3IgKE1hdHBsb3RsaWIgdjMuNC4zLCBodHRwczovL21hdHBsb3RsaWIub3JnKQovUHJvZHVjZXIgKE1hdHBsb3RsaWIgcGRmIGJhY2tlbmQgdjMuNC4zKSA+PgplbmRvYmoKeHJlZgowIDM2CjAwMDAwMDAwMDAgNjU1MzUgZiAKMDAwMDAwMDAxNiAwMDAwMCBuIAowMDAwMDExMzM5IDAwMDAwIG4gCjAwMDAwMDYzNjUgMDAwMDAgbiAKMDAwMDAwNjM5NyAwMDAwMCBuIAowMDAwMDA2NDk2IDAwMDAwIG4gCjAwMDAwMDY1MTcgMDAwMDAgbiAKMDAwMDAwNjUzOCAwMDAwMCBuIAowMDAwMDAwMDY1IDAwMDAwIG4gCjAwMDAwMDAzOTQgMDAwMDAgbiAKMDAwM
DAwMDcyMCAwMDAwMCBuIAowMDAwMDAwMjA4IDAwMDAwIG4gCjAwMDAwMDA3MDAgMDAwMDAgbiAKMDAwMDAwNjU3MCAwMDAwMCBuIAowMDAwMDA1MTAwIDAwMDAwIG4gCjAwMDAwMDQ5MDAgMDAwMDAgbiAKMDAwMDAwNDQ4OSAwMDAwMCBuIAowMDAwMDA2MTUzIDAwMDAwIG4gCjAwMDAwMDA3NDAgMDAwMDAgbiAKMDAwMDAwMDg3MyAwMDAwMCBuIAowMDAwMDAxMDM1IDAwMDAwIG4gCjAwMDAwMDE0MTUgMDAwMDAgbiAKMDAwMDAwMTU2MCAwMDAwMCBuIAowMDAwMDAxODY0IDAwMDAwIG4gCjAwMDAwMDIxODYgMDAwMDAgbiAKMDAwMDAwMjY1NCAwMDAwMCBuIAowMDAwMDAyOTc2IDAwMDAwIG4gCjAwMDAwMDMxNDIgMDAwMDAgbiAKMDAwMDAwMzI2OCAwMDAwMCBuIAowMDAwMDAzNDIzIDAwMDAwIG4gCjAwMDAwMDM3MTQgMDAwMDAgbiAKMDAwMDAwMzg2OSAwMDAwMCBuIAowMDAwMDAzOTkyIDAwMDAwIG4gCjAwMDAwMDQzOTkgMDAwMDAgbiAKMDAwMDAxMTMxOCAwMDAwMCBuIAowMDAwMDExMzk5IDAwMDAwIG4gCnRyYWlsZXIKPDwgL0luZm8gMzUgMCBSIC9Sb290IDEgMCBSIC9TaXplIDM2ID4+CnN0YXJ0eHJlZgoxMTU1NgolJUVPRgo=\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:41:03.075694\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}, {"name": "stderr", "output_type": "stream", "text": ["/usr/local/lib/python3.9/dist-packages/torchvision/utils.py:50: UserWarning: range will be deprecated, please use value_range instead.\n", " warnings.warn(warning)\n"]}, {"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:41:03.202620\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}, {"name": "stderr", "output_type": "stream", "text": ["/usr/local/lib/python3.9/dist-packages/torchvision/utils.py:50: UserWarning: range will be deprecated, please use value_range instead.\n", " warnings.warn(warning)\n"]}, {"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:41:03.332269\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}], "source": ["def compare_imgs(img1, img2, title_prefix=\"\"):\n", " # Calculate MSE loss between both images\n", " loss = F.mse_loss(img1, img2, reduction=\"sum\")\n", " # Plot images for visual comparison\n", " grid = torchvision.utils.make_grid(torch.stack([img1, img2], dim=0), nrow=2, normalize=True, range=(-1, 1))\n", " grid = grid.permute(1, 2, 0)\n", " plt.figure(figsize=(4, 2))\n", " plt.title(f\"{title_prefix} Loss: {loss.item():4.2f}\")\n", " plt.imshow(grid)\n", " plt.axis(\"off\")\n", " plt.show()\n", "\n", "\n", "for i in range(2):\n", " # Load example image\n", " img, _ = train_dataset[i]\n", " img_mean = img.mean(dim=[1, 2], keepdims=True)\n", "\n", " # Shift image by one pixel\n", " SHIFT = 1\n", " img_shifted = torch.roll(img, shifts=SHIFT, dims=1)\n", " img_shifted = torch.roll(img_shifted, shifts=SHIFT, dims=2)\n", " img_shifted[:, :1, :] = img_mean\n", " img_shifted[:, :, :1] = img_mean\n", " compare_imgs(img, img_shifted, \"Shifted -\")\n", "\n", " # Set half of the image to zero\n", " img_masked = img.clone()\n", " img_masked[:, : img_masked.shape[1] // 2, :] = img_mean\n", " compare_imgs(img, img_masked, \"Masked -\")"]}, {"cell_type": "markdown", "id": "7bfc9b9f", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.028564, "end_time": "2021-09-16T12:41:03.462047", "exception": false, "start_time": "2021-09-16T12:41:03.433483", "status": "completed"}, "tags": []}, "source": ["### Training the model\n", "\n", "During the training, we want to keep track of the learning progress by seeing reconstructions made by our model.\n", "For this, we implement a callback object in PyTorch Lightning which will add reconstructions every $N$ epochs to our tensorboard:"]}, {"cell_type": "code", "execution_count": 9, "id": "e6e82979", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:41:03.525671Z", "iopub.status.busy": "2021-09-16T12:41:03.525205Z", "iopub.status.idle": 
"2021-09-16T12:41:03.527269Z", "shell.execute_reply": "2021-09-16T12:41:03.526813Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 0.036008, "end_time": "2021-09-16T12:41:03.527366", "exception": false, "start_time": "2021-09-16T12:41:03.491358", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class GenerateCallback(pl.Callback):\n", " def __init__(self, input_imgs, every_n_epochs=1):\n", " super().__init__()\n", " self.input_imgs = input_imgs # Images to reconstruct during training\n", " # Only save those images every N epochs (otherwise tensorboard gets quite large)\n", " self.every_n_epochs = every_n_epochs\n", "\n", " def on_epoch_end(self, trainer, pl_module):\n", " if trainer.current_epoch % self.every_n_epochs == 0:\n", " # Reconstruct images\n", " input_imgs = self.input_imgs.to(pl_module.device)\n", " with torch.no_grad():\n", " pl_module.eval()\n", " reconst_imgs = pl_module(input_imgs)\n", " pl_module.train()\n", " # Plot and add to tensorboard\n", " imgs = torch.stack([input_imgs, reconst_imgs], dim=1).flatten(0, 1)\n", " grid = torchvision.utils.make_grid(imgs, nrow=2, normalize=True, range=(-1, 1))\n", " trainer.logger.experiment.add_image(\"Reconstructions\", grid, global_step=trainer.global_step)"]}, {"cell_type": "markdown", "id": "0825de1a", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.028704, "end_time": "2021-09-16T12:41:03.584828", "exception": false, "start_time": "2021-09-16T12:41:03.556124", "status": "completed"}, "tags": []}, "source": ["We will now write a training function that allows us to train the autoencoder with different latent dimensionality\n", "and returns both the test and validation score.\n", "We provide pre-trained models and recommend you using those, especially when you work on a computer without GPU.\n", "Of course, feel free to train your own models on Lisa."]}, {"cell_type": "code", "execution_count": 10, "id": "da4ec41c", "metadata": {"execution": {"iopub.execute_input": 
"2021-09-16T12:41:03.648305Z", "iopub.status.busy": "2021-09-16T12:41:03.647832Z", "iopub.status.idle": "2021-09-16T12:41:03.649849Z", "shell.execute_reply": "2021-09-16T12:41:03.649433Z"}, "papermill": {"duration": 0.036319, "end_time": "2021-09-16T12:41:03.649948", "exception": false, "start_time": "2021-09-16T12:41:03.613629", "status": "completed"}, "tags": []}, "outputs": [], "source": ["def train_cifar(latent_dim):\n", " # Create a PyTorch Lightning trainer with the generation callback\n", " trainer = pl.Trainer(\n", " default_root_dir=os.path.join(CHECKPOINT_PATH, \"cifar10_%i\" % latent_dim),\n", " gpus=1 if str(device).startswith(\"cuda\") else 0,\n", " max_epochs=500,\n", " callbacks=[\n", " ModelCheckpoint(save_weights_only=True),\n", " GenerateCallback(get_train_images(8), every_n_epochs=10),\n", " LearningRateMonitor(\"epoch\"),\n", " ],\n", " )\n", " trainer.logger._log_graph = True # If True, we plot the computation graph in tensorboard\n", " trainer.logger._default_hp_metric = None # Optional logging argument that we don't need\n", "\n", " # Check whether pretrained model exists. 
If yes, load it and skip training\n", " pretrained_filename = os.path.join(CHECKPOINT_PATH, \"cifar10_%i.ckpt\" % latent_dim)\n", " if os.path.isfile(pretrained_filename):\n", " print(\"Found pretrained model, loading...\")\n", " model = Autoencoder.load_from_checkpoint(pretrained_filename)\n", " else:\n", " model = Autoencoder(base_channel_size=32, latent_dim=latent_dim)\n", " trainer.fit(model, train_loader, val_loader)\n", " # Test best model on validation and test set\n", " val_result = trainer.test(model, test_dataloaders=val_loader, verbose=False)\n", " test_result = trainer.test(model, test_dataloaders=test_loader, verbose=False)\n", " result = {\"test\": test_result, \"val\": val_result}\n", " return model, result"]}, {"cell_type": "markdown", "id": "f9c30a4b", "metadata": {"papermill": {"duration": 0.028762, "end_time": "2021-09-16T12:41:03.707706", "exception": false, "start_time": "2021-09-16T12:41:03.678944", "status": "completed"}, "tags": []}, "source": ["### Comparing latent dimensionality\n", "\n", "
\n", "\n", "When training an autoencoder, we need to choose a dimensionality for the latent representation $z$.\n", "The higher the latent dimensionality, the better we expect the reconstruction to be.\n", "However, the idea of autoencoders is to *compress* data.\n", "Hence, we are also interested in keeping the dimensionality low.\n", "To find the best tradeoff, we can train multiple models with different latent dimensionalities.\n", "The original input has $32\\times 32\\times 3 = 3072$ pixels.\n", "Keeping this in mind, a reasonable choice for the latent dimensionality might be between 64 and 384:"]}, {"cell_type": "code", "execution_count": 11, "id": "af2a8f9a", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:41:03.768726Z", "iopub.status.busy": "2021-09-16T12:41:03.768265Z", "iopub.status.idle": "2021-09-16T12:41:12.482167Z", "shell.execute_reply": "2021-09-16T12:41:12.482555Z"}, "papermill": {"duration": 8.746282, "end_time": "2021-09-16T12:41:12.482697", "exception": false, "start_time": "2021-09-16T12:41:03.736415", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["GPU available: True, used: True\n"]}, {"name": "stderr", "output_type": "stream", "text": ["TPU available: False, using: 0 TPU cores\n"]}, {"name": "stderr", "output_type": "stream", "text": ["IPU available: False, using: 0 IPUs\n"]}, {"name": "stderr", "output_type": "stream", "text": ["/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/pytorch_lightning/trainer/trainer.py:678: LightningDeprecationWarning: `trainer.test(test_dataloaders)` is deprecated in v1.4 and will be removed in v1.6. 
Use `trainer.test(dataloaders)` instead.\n", " rank_zero_deprecation(\n", "LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Found pretrained model, loading...\n"]}, {"name": "stderr", "output_type": "stream", "text": ["/usr/local/lib/python3.9/dist-packages/torch/_jit_internal.py:603: LightningDeprecationWarning: The `LightningModule.datamodule` property is deprecated in v1.3 and will be removed in v1.5. Access the datamodule through using `self.trainer.datamodule` instead.\n", " if hasattr(mod, name):\n", "/usr/local/lib/python3.9/dist-packages/torch/_jit_internal.py:603: LightningDeprecationWarning: The `LightningModule.loaded_optimizer_states_dict` property is deprecated in v1.4 and will be removed in v1.6.\n", " if hasattr(mod, name):\n"]}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "0f11cd1f8ebc4c9cbc69478f55dac457", "version_major": 2, "version_minor": 0}, "text/plain": ["Testing: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"name": "stderr", "output_type": "stream", "text": ["/usr/local/lib/python3.9/dist-packages/torchvision/utils.py:50: UserWarning: range will be deprecated, please use value_range instead.\n", " warnings.warn(warning)\n", "LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n"]}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "1eeadd6528c746868701b83f54b200dc", "version_major": 2, "version_minor": 0}, "text/plain": ["Testing: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"name": "stderr", "output_type": "stream", "text": ["GPU available: True, used: True\n"]}, {"name": "stderr", "output_type": "stream", "text": ["TPU available: False, using: 0 TPU cores\n"]}, {"name": "stderr", "output_type": "stream", "text": ["IPU available: False, using: 0 IPUs\n"]}, {"name": "stderr", "output_type": "stream", "text": ["LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n"]}, {"name": "stdout", "output_type": "stream", 
"text": ["Found pretrained model, loading...\n"]}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "47c8df90b5414d1e8ee6e8afc2057c52", "version_major": 2, "version_minor": 0}, "text/plain": ["Testing: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"name": "stderr", "output_type": "stream", "text": ["LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n"]}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "0cdd717c36684008add2d6d3f93caa65", "version_major": 2, "version_minor": 0}, "text/plain": ["Testing: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"name": "stderr", "output_type": "stream", "text": ["GPU available: True, used: True\n"]}, {"name": "stderr", "output_type": "stream", "text": ["TPU available: False, using: 0 TPU cores\n"]}, {"name": "stderr", "output_type": "stream", "text": ["IPU available: False, using: 0 IPUs\n"]}, {"name": "stderr", "output_type": "stream", "text": ["LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Found pretrained model, loading...\n"]}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "8bedc95274e84f799bbef9fc04ca9934", "version_major": 2, "version_minor": 0}, "text/plain": ["Testing: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"name": "stderr", "output_type": "stream", "text": ["LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n"]}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "213f1af06c854f0fa5ac9c7f42e86b8b", "version_major": 2, "version_minor": 0}, "text/plain": ["Testing: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"name": "stderr", "output_type": "stream", "text": ["GPU available: True, used: True\n"]}, {"name": "stderr", "output_type": "stream", "text": ["TPU available: False, using: 0 TPU cores\n"]}, {"name": "stderr", "output_type": "stream", "text": ["IPU available: False, using: 0 IPUs\n"]}, 
{"name": "stderr", "output_type": "stream", "text": ["LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Found pretrained model, loading...\n"]}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "07a7fcadf97f442ca3088a5bbbcba662", "version_major": 2, "version_minor": 0}, "text/plain": ["Testing: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"name": "stderr", "output_type": "stream", "text": ["LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n"]}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "5cf0706e7c07460880d2fe93a1e1d4c4", "version_major": 2, "version_minor": 0}, "text/plain": ["Testing: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}], "source": ["model_dict = {}\n", "for latent_dim in [64, 128, 256, 384]:\n", " model_ld, result_ld = train_cifar(latent_dim)\n", " model_dict[latent_dim] = {\"model\": model_ld, \"result\": result_ld}"]}, {"cell_type": "markdown", "id": "e6e59925", "metadata": {"papermill": {"duration": 0.036287, "end_time": "2021-09-16T12:41:12.556351", "exception": false, "start_time": "2021-09-16T12:41:12.520064", "status": "completed"}, "tags": []}, "source": ["After training the models, we can plot the reconstruction loss over the latent dimensionality to get an intuition\n", "how these two properties are correlated:"]}, {"cell_type": "code", "execution_count": 12, "id": "1b5b80aa", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:41:12.655386Z", "iopub.status.busy": "2021-09-16T12:41:12.644902Z", "iopub.status.idle": "2021-09-16T12:41:12.911585Z", "shell.execute_reply": "2021-09-16T12:41:12.911109Z"}, "papermill": {"duration": 0.318993, "end_time": "2021-09-16T12:41:12.911693", "exception": false, "start_time": "2021-09-16T12:41:12.592700", "status": "completed"}, "tags": []}, "outputs": [{"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 
2021-09-16T14:41:12.740985\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}], "source": ["latent_dims = sorted(k for k in model_dict)\n", "val_scores = [model_dict[k][\"result\"][\"val\"][0][\"test_loss\"] for k in latent_dims]\n", "\n", "fig = plt.figure(figsize=(6, 4))\n", "plt.plot(\n", " latent_dims, val_scores, \"--\", color=\"#000\", marker=\"*\", markeredgecolor=\"#000\", markerfacecolor=\"y\", markersize=16\n", ")\n", "plt.xscale(\"log\")\n", "plt.xticks(latent_dims, labels=latent_dims)\n", "plt.title(\"Reconstruction error over latent dimensionality\", fontsize=14)\n", "plt.xlabel(\"Latent dimensionality\")\n", "plt.ylabel(\"Reconstruction error\")\n", "plt.minorticks_off()\n", "plt.ylim(0, 100)\n", "plt.show()"]}, {"cell_type": "markdown", "id": "e03a327e", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.037468, "end_time": "2021-09-16T12:41:12.988817", "exception": false, "start_time": "2021-09-16T12:41:12.951349", "status": "completed"}, "tags": []}, "source": ["As we initially expected, the reconstruction loss goes down with increasing latent dimensionality.\n", "For our model and setup, the two properties seem to be exponentially (or double exponentially) correlated.\n", "To understand what these differences in reconstruction error mean, we can visualize example reconstructions of the four models:"]}, {"cell_type": "code", "execution_count": 13, "id": "24dd2b64", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:41:13.069820Z", "iopub.status.busy": "2021-09-16T12:41:13.069333Z", "iopub.status.idle": "2021-09-16T12:41:13.071023Z", "shell.execute_reply": "2021-09-16T12:41:13.071399Z"}, "papermill": {"duration": 0.045096, "end_time": "2021-09-16T12:41:13.071514", "exception": false, "start_time": "2021-09-16T12:41:13.026418", "status": "completed"}, "tags": []}, "outputs": [], "source": ["def visualize_reconstructions(model, input_imgs):\n", " # Reconstruct images\n", " model.eval()\n", " with torch.no_grad():\n", " reconst_imgs = 
model(input_imgs.to(model.device))\n", " reconst_imgs = reconst_imgs.cpu()\n", "\n", " # Plotting\n", " imgs = torch.stack([input_imgs, reconst_imgs], dim=1).flatten(0, 1)\n", " grid = torchvision.utils.make_grid(imgs, nrow=4, normalize=True, range=(-1, 1))\n", " grid = grid.permute(1, 2, 0)\n", " plt.figure(figsize=(7, 4.5))\n", " plt.title(\"Reconstructed from %i latents\" % (model.hparams.latent_dim))\n", " plt.imshow(grid)\n", " plt.axis(\"off\")\n", " plt.show()"]}, {"cell_type": "code", "execution_count": 14, "id": "2b81b994", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:41:13.150447Z", "iopub.status.busy": "2021-09-16T12:41:13.149978Z", "iopub.status.idle": "2021-09-16T12:41:14.196317Z", "shell.execute_reply": "2021-09-16T12:41:14.196704Z"}, "papermill": {"duration": 1.087391, "end_time": "2021-09-16T12:41:14.196840", "exception": false, "start_time": "2021-09-16T12:41:13.109449", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["/usr/local/lib/python3.9/dist-packages/torchvision/utils.py:50: UserWarning: range will be deprecated, please use value_range instead.\n", " warnings.warn(warning)\n"]}, {"data": {"application/pdf": 
"JVBERi0xLjQKJazcIKu6CjEgMCBvYmoKPDwgL1BhZ2VzIDIgMCBSIC9UeXBlIC9DYXRhbG9nID4+CmVuZG9iago4IDAgb2JqCjw8IC9FeHRHU3RhdGUgNCAwIFIgL0ZvbnQgMyAwIFIgL1BhdHRlcm4gNSAwIFIKL1Byb2NTZXQgWyAvUERGIC9UZXh0IC9JbWFnZUIgL0ltYWdlQyAvSW1hZ2VJIF0gL1NoYWRpbmcgNiAwIFIKL1hPYmplY3QgNyAwIFIgPj4KZW5kb2JqCjExIDAgb2JqCjw8IC9Bbm5vdHMgMTAgMCBSIC9Db250ZW50cyA5IDAgUgovR3JvdXAgPDwgL0NTIC9EZXZpY2VSR0IgL1MgL1RyYW5zcGFyZW5jeSAvVHlwZSAvR3JvdXAgPj4KL01lZGlhQm94IFsgMCAwIDQwNSAyMjcuNjU1NDM0NzgyNiBdIC9QYXJlbnQgMiAwIFIgL1Jlc291cmNlcyA4IDAgUgovVHlwZSAvUGFnZSA+PgplbmRvYmoKOSAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDEyIDAgUiA+PgpzdHJlYW0KeJxVj01PwzAMhu/+Fe9xPZDGSfp13DSo4LapEgfEYcpSoFo79QP293HLGCKSY7+29dhmNBSvGW8j5INGI3aRuJw1aVEtOZ2IPy3emEylSeJsIgn9X74T1dQjU2YxW2iVgotcsdXOuiw3KYaAZ3SI1+ZnZiN2EXqJeBu+PnzYlxv4UTC2YMzzuShuSN8ifmRsz9jRDv0vRitOZPsbbZblNUs9zZw7AYGZldGWjdwhof1by7e0qRA/SI9BVS+HV0d6wWofwTllMp3b5WEV/Lkbp+HTT+GIeohgtLoWl/q5RepwOkyhm8YIr6ie6L4i2Zi+AR1UUP8KZW5kc3RyZWFtCmVuZG9iagoxMiAwIG9iagoyNDUKZW5kb2JqCjEwIDAgb2JqClsgXQplbmRvYmoKMTggMCBvYmoKPDwgL0ZpbHRlciAvRmxhdGVEZWNvZGUgL0xlbmd0aCAyMzIgPj4Kc3RyZWFtCnicPZBLcgQhDEP3nEJHAH/hPJ1KzaLn/tvI7plskKrA8hNxHBNn84gIpBz8rGFmUBO8h4VD1WA7oOvAZ0BO4BoudClwo9qEc3ydw5sKmriHx2y1SKyd5Uwh6jAmSWzoScg2zmhy45zcqlTeTGu9xuKbcne7ymvalsK9h8r6OONUOasqa5E2EZlFaxvBRh7ssM+jq2jLWSrcN4xNXROVw5vF7lndyeKK769c49Uswcz3w7e/HB9X3egqx9jKhNlSk+bSOfWvltH6cLSLhXrhR3smSHB1qyBVpdbO2lN6/VPcJPr9A/TBVx0KZW5kc3RyZWFtCmVuZG9iagoxOSAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDMwNyA+PgpzdHJlYW0KeJw9kktuAzEMQ/c+hS4QwPrZnvOkKLqY3n/bJyXpihzZFkVqlrpMWVMekDSThH/p8HCxnfI7bM9mZuBaopeJ5ZTn0BVi7qJ82cxGXVknxeqEZjq36FE5Fwc2Taqfqyyl3S54Dtcmnlv2ET+80KAe1DUuCTd0V6NlKTRjqvt/0nv8jDLgakxdbFKrex88XkRV6OgHR4kiY5cX5+NBCelKwmhaiJV3RQNB7vK0ynsJ7tveasiyB6mYzjspZrDrdFIubheHIR7I8qjw5aPYa0LP+LArJfRI2IYzcifuaMbm1MjikP7ejQRLj65oIfPgr27WLmC8UzpFYmROcqxpi1VO91AU07nDvQwQ9WxFQylzkdXqX8POC2uWbBZ4SvoFHqPdJksOVtnbqE7vrTzZ0PcfWtd0HwplbmRzdHJlYW0KZW5kb2JqCjIwIDAgb2JqCjw8IC9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9MZW5ndGggMjMyID4+CnN0cmVhbQp
4nDVRSW7EMAy7+xX8wADW7rwnxaCH9v/XUsoUCEAltrglYmMjAi8x+DmI3PiSNaMmfmdyV/wsT4VHwq3gSRSBl+FedoLLG8ZlPw4zH7yXVs6kxpMMyEU2PTwRMtglEDowuwZ12Gbaib4h4bMjUs1GltPXEvTSKgTKU7bf6YISbav6c/usC2372hNOdnvqSeUTiOeWrMBl4xWTxVgGPVG5SzF9kOpsoSehvCifg2w+aohElyhn4InBwSjQDuy57WfiVSFoXd2nbWOoRkrH078NTU2SCPlECWe2NO4W/n/Pvb7X+w9OIVQRCmVuZHN0cmVhbQplbmRvYmoKMjEgMCBvYmoKPDwgL0ZpbHRlciAvRmxhdGVEZWNvZGUgL0xlbmd0aCAyMzEgPj4Kc3RyZWFtCnicNU85kgQhDMt5hT4wVRjbQL+np7Y22Pl/upKZTpDwIcnTEx2ZeJkjI7Bmx9taZCBm4FNMxb/2tA8TqvfgHiKUiwthhpFw1qzjbp6OF/92lc9YB+82+IpZXhDYwkzWVxZnLtsFY2mcxDnJboxdE7GNda2nU1hHMKEMhHS2w5Qgc1Sk9MmOMuboOJEnnovv9tssdjl+DusLNo0hFef4KnqCNoOi7HnvAhpyQf9d3fgeRbvoJSAbCRbWUWLunOWEX712dB61KBJzQppBLhMhzekqphCaUKyzo6BSUXCpPqforJ9/5V9cLQplbmRzdHJlYW0KZW5kb2JqCjIyIDAgb2JqCjw8IC9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9MZW5ndGggMjQ5ID4+CnN0cmVhbQp4nD1QO45EIQzrOYUv8CTyI3AeRqstZu/frgOaKVBMfrYzJNARgUcMMZSv4yWtoK6Bv4tC8W7i64PCIKtDUiDOeg+IdOymNpETOh2cMz9hN2OOwEUxBpzpdKY9ByY5+8IKhHMbZexWSCeJqiKO6jOOKZ4qe594FiztyDZbJ5I95CDhUlKJyaWflMo/bcqUCjpm0QQsErngZBNNOMu7SVKMGZQy6h6mdiJ9rDzIozroZE3OrCOZ2dNP25n4HHC3X9pkTpXHdB7M+Jy0zoM5Fbr344k2B02N2ujs9xNpKi9Sux1anX51EpXdGOcYEpdnfxnfZP/5B/6HWiIKZW5kc3RyZWFtCmVuZG9iagoyMyAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDEzNiA+PgpzdHJlYW0KeJxNj0EOAzEIA+95hZ9AIEB4z1ZVD9v/X0vYdtMLHsmAbFEGgSWHeIcb4dHbD99FNhVn45xfUiliIZhPcJ8wUxyNKXfyY4+AcZRqLKdoeF5Lzk3DFy13Ey2lrZeTGW+47pf3R5VtkQ1Fzy0LQtdskvkygQd8GJhHdeNppcfd9myv9vwAzmw0SQplbmRzdHJlYW0KZW5kb2JqCjI0IDAgb2JqCjw8IC9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9MZW5ndGggOTQgPj4Kc3RyZWFtCnicRY3BEcAgCAT/VEEJCgraTyaTh/b/jRAyfGDnDu6EBQu2eUYfBZUmXhVYB0pj3FCPQL3hci3J3AUPcCd/2tBUnJbTd2mRSVUp3KQSef8OZyaQqHnRY533C2P7IzwKZW5kc3RyZWFtCmVuZG9iagoyNSAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDQ3ID4+CnN0cmVhbQp4nDMyt1AwULA0ARKGFiYK5mYGCimGXJYQVi4XTCwHzALRlnAKIp7BlQYAuWcNJwplbmRzdHJlYW0KZW5kb2JqCjI2IDAgb2JqCjw8IC9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9MZW5ndGggMjU4ID4+CnN0cmVhbQp4nEWRS3IEIAhE956CI4D85DyTSmUxuf82Dc5kNnaXqP2ESiOmEiznFHkwfcnyzWS26Xc5VjsbBRRFKJjJVeixAqs7U8SZa4lq62N
l5LjTOwbFG85dOalkcaOMdVR1KnBMz5X1Ud35dlmUfUcOZQrYrHMcbODKbcMYJ0abre4O94kgTydTR8XtINnwByeNfZWrK3CdbPbRSzAOBP1CE5jki0DrDIHGzVP05BLs4+N254Fgb3kRSNkQyJEhGB2Cdp1c/+LW+b3/cYY7z7UZrhzv4neY1nbHX2KSFXMBi9wpqOdrLlrXGTrekzPH5Kb7hs65YJe7g0zv+T/Wz/r+Ax4pZvoKZW5kc3RyZWFtCmVuZG9iagoyNyAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDE2MyA+PgpzdHJlYW0KeJxFkDsSAyEMQ3tOoSP4IwM+z2YyKTb3b2PYbFLA01ggg7sTgtTagonogoe2Jd0F760EZ2P86TZuNRLkBHWAVqTjaJRSfbnFaZV08Wg2cysLrRMdZg56lKMZoBA6Fd7touRypu7O+UNw9V/1v2LdOZuJgcnKHQjN6lPc+TY7orq6yf6kx9ys134r7FVhaVlLywm3nbtmQAncUznaqz0/Hwo69gplbmRzdHJlYW0KZW5kb2JqCjI4IDAgb2JqCjw8IC9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9MZW5ndGggMjE4ID4+CnN0cmVhbQp4nD1QuY0EMQzLXYUaWMB67alnFotLpv/0SPn2ItEWRVIqNZmSKS91lCVZU946fJbEDnmG5W5kNiUqRS+TsCX30ArxfYnmFPfd1ZazQzSXaDl+CzMqqhsd00s2mnAqE7qg3MMz+g1tdANWhx6xWyDQpGDXtiByxw8YDMGZE4siDEpNBv+uco+fXosbPsPxQxSRkg7mNf9Y/fJzDa9TjyeRbm++4l6cqQ4DERySmrwjXVixLhIRaTVBTc/AWi2Au7de/hu0I7oMQPaJxHGaUo6hv2twpc8v5SdT2AplbmRzdHJlYW0KZW5kb2JqCjI5IDAgb2JqCjw8IC9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9MZW5ndGggMTYwID4+CnN0cmVhbQp4nEWQORIDMQgEc72CJ0hcgvesy7XB+v+pB9ZHoukCNBy6Fk3KehRoPumxRqG60GvoLEqSRMEWkh1Qp2OIOyhITEhjkki2HoMjmlizXZiZVCqzUuG0acXCv9la1chEjXCN/InpBlT8T+pclPBNg6+SMfoYVLw7g4xJ+F5F3Fox7f5EMLEZ9glvRSYFhImxqdm+z2CGzPcK1zjH8w1MgjfrCmVuZHN0cmVhbQplbmRvYmoKMzAgMCBvYmoKPDwgL0ZpbHRlciAvRmxhdGVEZWNvZGUgL0xlbmd0aCAzMzQgPj4Kc3RyZWFtCnicLVJLcsUgDNtzCl2gM/gH5DzpdLp4vf+2kpNFRg5g9DHlholKfFkgt6PWxLeNzECF4a+rzIXPSNvIOojLkIu4ki2Fe0Qs5DHEPMSC76vxHh75rMzJswfGL9l3Dyv21IRlIePFGdphFcdhFeRYsHUhqnt4U6TDqSTY44v/PsVzLQQtfEbQgF/kn6+O4PmSFmn3mG3TrnqwTDuqpLAcbE9zXiZfWme5Oh7PB8n2rtgRUrsCFIW5M85z4SjTVka0FnY2SGpcbG+O/VhK0IVuXEaKI5CfqSI8oKTJzCYK4o+cHnIqA2Hqmq50chtVcaeezDWbi7czSWbrvkixmcJ5XTiz/gxTZrV5J89yotSpCO+xZ0vQ0Dmunr2WWWh0mxO8pITPxk5PTr5XM+shORUJqWJaV8FpFJliCdsSX1NRU5p6Gf778u7xO37+ASxzfHMKZW5kc3RyZWFtCmVuZG9iagozMSAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDMyMCA+PgpzdHJlYW0KeJw1UktuBTEI288puECl8E/O86qqi777b2sTvRVMMGDjKS9Z0ku+1CXbpcPkWx/3JbFC3o/tmsxSxfcWsxTPLa9HzxG3LQoEURM9WJk
vFSLUz/ToOqhwSp+BVwi3FBu8g0kAg2r4Bx6lMyBQ50DGu2IyUgOCJNhzaXEIiXImiX+kvJ7fJ62kofQ9WZnL35NLpdAdTU7oAcXKxUmgXUn5oJmYSkSSl+t9sUL0hsCSPD5HMcmA7DaJbaIFJucepSXMxBQ6sMcCvGaa1VXoYMIehymMVwuzqB5s8lsTlaQdreMZ2TDeyzBTYqHhsAXU5mJlgu7l4zWvwojtUZNdw3Duls13CNFo/hsWyuBjFZKAR6exEg1pOMCIwJ5eOMVe8xM5DsCIY52aLAxjaCaneo6JwNCes6VhxsceWvXzD1TpfIcKZW5kc3RyZWFtCmVuZG9iagozMiAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDE4ID4+CnN0cmVhbQp4nDM2tFAwgMMUQ640AB3mA1IKZW5kc3RyZWFtCmVuZG9iagozMyAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDEzMyA+PgpzdHJlYW0KeJxFj0sOBCEIRPecoo7Axx/ncTLphXP/7YCdbhNjPYVUgbmCoT0uawOdFR8hGbbxt6mWjkVZPlR6UlYPyeCHrMbLIdygLPCCSSqGIVCLmBqRLWVut4DbNg2yspVTpY6wi6Mwj/a0bBUeX6JbInWSP4PEKi/c47odyKXWu96ii75/pAExCQplbmRzdHJlYW0KZW5kb2JqCjM0IDAgb2JqCjw8IC9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9MZW5ndGggMTc0ID4+CnN0cmVhbQp4nE2QSQ5DIQxD95zCF6iEM8DnPL+qumjvv61DB3WB/OQgcDw80HEkLnRk6IyOK5sc48CzIGPi0Tj/ybg+xDFB3aItWJd2x9nMEnPCMjECtkbJ2TyiwA/HXAgSZJcfvsAgIl2P+VbzWZP0z7c73Y+6tGZfPaLAiewIxbABV4D9useBS8L5XtPklyolYxOH8oHqIlI2O6EQtVTscqqKs92bK3AV9PzRQ+7tBbUjPN8KZW5kc3RyZWFtCmVuZG9iagoxNiAwIG9iago8PCAvQmFzZUZvbnQgL0RlamFWdVNhbnMgL0NoYXJQcm9jcyAxNyAwIFIKL0VuY29kaW5nIDw8Ci9EaWZmZXJlbmNlcyBbIDMyIC9zcGFjZSA1MiAvZm91ciA1NCAvc2l4IDgyIC9SIDk3IC9hIDk5IC9jIC9kIC9lIC9mIDEwOCAvbCAvbSAvbiAvbwoxMTQgL3IgL3MgL3QgL3UgXQovVHlwZSAvRW5jb2RpbmcgPj4KL0ZpcnN0Q2hhciAwIC9Gb250QkJveCBbIC0xMDIxIC00NjMgMTc5NCAxMjMzIF0gL0ZvbnREZXNjcmlwdG9yIDE1IDAgUgovRm9udE1hdHJpeCBbIDAuMDAxIDAgMCAwLjAwMSAwIDAgXSAvTGFzdENoYXIgMjU1IC9OYW1lIC9EZWphVnVTYW5zCi9TdWJ0eXBlIC9UeXBlMyAvVHlwZSAvRm9udCAvV2lkdGhzIDE0IDAgUiA+PgplbmRvYmoKMTUgMCBvYmoKPDwgL0FzY2VudCA5MjkgL0NhcEhlaWdodCAwIC9EZXNjZW50IC0yMzYgL0ZsYWdzIDMyCi9Gb250QkJveCBbIC0xMDIxIC00NjMgMTc5NCAxMjMzIF0gL0ZvbnROYW1lIC9EZWphVnVTYW5zIC9JdGFsaWNBbmdsZSAwCi9NYXhXaWR0aCAxMzQyIC9TdGVtViAwIC9UeXBlIC9Gb250RGVzY3JpcHRvciAvWEhlaWdodCAwID4+CmVuZG9iagoxNCAwIG9iagpbIDYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwCjYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwIDYwMCA2MDAgNjA
wIDYwMCA2MDAgNjAwIDYwMCA2MDAgMzE4IDQwMSA0NjAgODM4IDYzNgo5NTAgNzgwIDI3NSAzOTAgMzkwIDUwMCA4MzggMzE4IDM2MSAzMTggMzM3IDYzNiA2MzYgNjM2IDYzNiA2MzYgNjM2IDYzNiA2MzYKNjM2IDYzNiAzMzcgMzM3IDgzOCA4MzggODM4IDUzMSAxMDAwIDY4NCA2ODYgNjk4IDc3MCA2MzIgNTc1IDc3NSA3NTIgMjk1CjI5NSA2NTYgNTU3IDg2MyA3NDggNzg3IDYwMyA3ODcgNjk1IDYzNSA2MTEgNzMyIDY4NCA5ODkgNjg1IDYxMSA2ODUgMzkwIDMzNwozOTAgODM4IDUwMCA1MDAgNjEzIDYzNSA1NTAgNjM1IDYxNSAzNTIgNjM1IDYzNCAyNzggMjc4IDU3OSAyNzggOTc0IDYzNCA2MTIKNjM1IDYzNSA0MTEgNTIxIDM5MiA2MzQgNTkyIDgxOCA1OTIgNTkyIDUyNSA2MzYgMzM3IDYzNiA4MzggNjAwIDYzNiA2MDAgMzE4CjM1MiA1MTggMTAwMCA1MDAgNTAwIDUwMCAxMzQyIDYzNSA0MDAgMTA3MCA2MDAgNjg1IDYwMCA2MDAgMzE4IDMxOCA1MTggNTE4CjU5MCA1MDAgMTAwMCA1MDAgMTAwMCA1MjEgNDAwIDEwMjMgNjAwIDUyNSA2MTEgMzE4IDQwMSA2MzYgNjM2IDYzNiA2MzYgMzM3CjUwMCA1MDAgMTAwMCA0NzEgNjEyIDgzOCAzNjEgMTAwMCA1MDAgNTAwIDgzOCA0MDEgNDAxIDUwMCA2MzYgNjM2IDMxOCA1MDAKNDAxIDQ3MSA2MTIgOTY5IDk2OSA5NjkgNTMxIDY4NCA2ODQgNjg0IDY4NCA2ODQgNjg0IDk3NCA2OTggNjMyIDYzMiA2MzIgNjMyCjI5NSAyOTUgMjk1IDI5NSA3NzUgNzQ4IDc4NyA3ODcgNzg3IDc4NyA3ODcgODM4IDc4NyA3MzIgNzMyIDczMiA3MzIgNjExIDYwNQo2MzAgNjEzIDYxMyA2MTMgNjEzIDYxMyA2MTMgOTgyIDU1MCA2MTUgNjE1IDYxNSA2MTUgMjc4IDI3OCAyNzggMjc4IDYxMiA2MzQKNjEyIDYxMiA2MTIgNjEyIDYxMiA4MzggNjEyIDYzNCA2MzQgNjM0IDYzNCA1OTIgNjM1IDU5MiBdCmVuZG9iagoxNyAwIG9iago8PCAvUiAxOCAwIFIgL2EgMTkgMCBSIC9jIDIwIDAgUiAvZCAyMSAwIFIgL2UgMjIgMCBSIC9mIDIzIDAgUgovZm91ciAyNCAwIFIgL2wgMjUgMCBSIC9tIDI2IDAgUiAvbiAyNyAwIFIgL28gMjggMCBSIC9yIDI5IDAgUiAvcyAzMCAwIFIKL3NpeCAzMSAwIFIgL3NwYWNlIDMyIDAgUiAvdCAzMyAwIFIgL3UgMzQgMCBSID4+CmVuZG9iagozIDAgb2JqCjw8IC9GMSAxNiAwIFIgPj4KZW5kb2JqCjQgMCBvYmoKPDwgL0ExIDw8IC9DQSAwIC9UeXBlIC9FeHRHU3RhdGUgL2NhIDEgPj4KL0EyIDw8IC9DQSAxIC9UeXBlIC9FeHRHU3RhdGUgL2NhIDEgPj4gPj4KZW5kb2JqCjUgMCBvYmoKPDwgPj4KZW5kb2JqCjYgMCBvYmoKPDwgPj4KZW5kb2JqCjcgMCBvYmoKPDwgL0kxIDEzIDAgUiA+PgplbmRvYmoKMTMgMCBvYmoKPDwgL0JpdHNQZXJDb21wb25lbnQgOCAvQ29sb3JTcGFjZSAvRGV2aWNlUkdCCi9EZWNvZGVQYXJtcyA8PCAvQ29sb3JzIDMgL0NvbHVtbnMgMzkxIC9QcmVkaWN0b3IgMTAgPj4KL0ZpbHRlciAvRmxhdGVEZWNvZGUgL0hlaWdodCAxOTkgL0xlbmd0aCAzNSAwIFI
gL1N1YnR5cGUgL0ltYWdlCi9UeXBlIC9YT2JqZWN0IC9XaWR0aCAzOTEgPj4Kc3RyZWFtCnic7P1JkyRLkiaI8Saiqmbm7hHvvVxqJ9DM4IYbQDjh0IQfjjPOIAINGjQzmOru6qrKfEssbqaqwgsOLKJm7vEyq5oGhFNqRsazcLdFTYSF+eOPN4C/XH+5/nL95frL9ZfrL9dfrr9cf7n+cv3l+sv1l+sv11+uv1x/uf7bL/y1nyECRMSvPxUfnvfvfkt4/2bfPO3bJ/yZ69/52m/u5PjBv//Twr9ZiH/jQ/7Eov6bz/j/z/W/5ZN/bSHiG0lBJCQEABi/CIjH1+IbwcG8pV/Z0vv7Rrz9dIRfkb6Ht0XA/hZv3u/Xv8Lbj/p3XfHfso7frg/inzg6/5sufPvXf/v17ZH/t3/z/4vrT6qa41pOp8vlQkRmZmYAgBCEgACCQBhMWIWYkIlEiBCZSZgQEaEvNyIB4VgiDHc1c/eILhnMzMyp/LrQhkdEBHh4RCAgESGmFEUARLi7AwAxMXN+nf6d8pWAKeA4/keERIyIREREeWN5h+7ub0QL83V5F/nWEbA3/cd//sO//vGXY9kK03kpRe43gID5wURIiIAohESICEz5JSCXBx8kcvzn4VDi2814lK/++E+JHD4+7Vd1B/bn0dif++3Aw+0cBzSiq5K+GmONIyLC84EBRMSPv1z/+ccvap4fVKfpH/67/+F3f/N3EL6vV22bq+q2umkAQCAAcqmlzkhU61ymiZC4VJYCCISIhNr29fbVdFfdt/XmbuEeZhC5SYCIzExMgIhIiFRqPT89lVJLKfM8E3G4uWm4r+tt3dYI73IEXdhU9Xa7qqqbmen4jg4AERgOAaDqbh4B5n6sAUQwsxRO+RJmQADwAINDogPcIQK2dfv550/bto+twt/9/vd///d/V2t92DeEt6r2vfl8kJNDTN5ptrHFeJyAB1G7X/BgJPKBR37HiAh3jwg3c1OP0Larqru3fTfVgAj3iECM+z0MwflTV3zz2xhfIQBM7aefP3/+fH18grz5YoiXy9Nf/83fSCn7vu3bBhCMQRCMMHMUgknoeSlVqBY+zYWZpirLVAmRiQgJAVGEiAERkABRVW/rZqbuYAEQUGuZpokQIRzDIcLMzC08chWIiIWJKCDyj5k2bQBRa61Txf6lIiJMzd0REIH7ZhAiYClSSiEkKVJEEImIidgj1MwTBPV1xXzg7maW2tMDP79e/2//9//HH376FN5Xthb+4eV0XsohMkTAiIgoTIWJCKYitRAh1sLCxIRVmBCJkIn6MTq0OA5BuotTClkM2eoC+O4J8EY6v9FVATjkYSggIOL85FxbQMxtQkAkAoSudwDCDzHt9sLMPXxsUFhE81CP/+f//C8/fb4eWmleTv+H/+P/+f/0f/kPbu3Lj/+8vn7W7Xb95ce23QDIHQFoPj+fnj6K1Mvzh8vzRxaZzk91PiOhCBHhevv60x//83r7ert++fzzv2rbvTXfW0RQEAYhYp2nUgoSkQgSXy5Pf/W3f39+ejqfzx8+fl9K8bbrtprpzz/98eeff3S3CMsvY64Rfrte//jHP9xuN237vt3czdxy993RDd1jXXXf1CNaUzUPCHcFiFrLsswiXKtMc0WEgBbRAMK96yNt4Q4///xpXbdHrfQP//D3/+H/+h+enp773uf/+y/7Rh+7fBzoRw0DAIT4IAkwZATSBqdk8dhiIkJEZmKifmaGpQEIVdv35u6mZto8om1r21Yzu76+3m431fb65dO23tzdrEU4AiAGIgAGUgLToXzwvQ7yb0BqpHIMCIB13f/H/9c/fvlye0RM8u4tiEiKlCJmSkyplRiDESpDJZgKLVUmoWmS81KFaZ5kmSoRMhIhIyKxIDMAAqVWYqFQZY8w71ppnishYRimoFgKRKiSm+dtpFZy8IBQJVUIiGmq01wREMDT7Jl9o5Wwa6VaKhGVUqQIIjHJoZXMPZVB6pY89OZ
m6hDhgPnutfA7xS1MRbivKwARMiECFOEiRIRL5SrMhFOVQysxIRHKoZWIEAA7vAJEABrYEu+7ezdwD5J7h1XxTk+lfA5lFMMqdaWExExISMgslPiNuGtxolzQ1NXuHu4R+SAiQs3Cw91bYw83h+ah7lOVR38EkZbz5eXjd25KtlXBtlayrVWGQHcCoOXyfH75IKU+vXz39PKRpSyXl7qch4ah23V2e71NXARdr23foqm3Bh4ERMFENC1znSoiUSnEcnl6/s1vf3N5er5cLh+//6GWavum22rWSiERfKOVrHn46+vc2lYKt31bBczU3dUsItzRjdwDsTGpeRArm0W4O0f4NNV5mYV5msq8FEQM4ACKALfoWknCDGqtidOP/anT9Pzy8vLykivf9/bQOnek89ZnRTiw9qHM7tpqaCUae5ooARGJOT0GZmYmADj8gYS9qrpvzd1VVbW5e9vWfb2ZaREuRbTtYI0RPNyUwz1VEmIAAtHhpx/KJ467hgB/7x9jDIWbtl7kzRF7r5UiYt3Wn3/+mVnW9batK4JXgkIgBFDJBaFwg8qFJCrIDMGOrLAhokLqTURiII4AD3AAU9u2Xc0iwDwCYBNeixAigRMERJh7d/E8IoKIRIQIPVzdItzczBoggM5oEyICBOIdKxEgoyBiDL+jEW1EiFhKESmI6dBxHBvTFT5EgDkEgLslmgUkALpe17atbxHogBAHPolDOwRCEAACEPY/TMAIjEFd8/UnYDgAgkekQGE3Ntj37L6vj5bzURCjb/vx/0cepv+u260h5WRpNgnE3QiJiDy9TSICwBg0WldGEJ6ed1/kSIvq7hagHmYeZu8Moba2byuGC/MyzQLhy0kIAThAAGm5PJ+fXkRKqTUgIhzCMBQcwQACoq22rbauvm/RFNQKkUwzIU51mcrCwuen83xamGVaTqWU5XT+4be/XZbTNM3n88IsXsgmdnNhfLqcvKM+8wjT5u6fPv2yrRui3PDr7bZ6WAARQycDAJGgVkQUd2dhNXO31nZ3YCFhYiEkCAiEQEQEDgh1VTV3MA13cLN3vAkefx4tzl0r9f/gXdmP/UtMm1iJDqjdn9/RNxGTJFBi7hAhH4gIEx0C20UZwtT2WXNnVTXc921t86ymAQRI27bx61dYMT16D08JhwDE95zQW78SAwMThN+90X500hvuvtDb6z1WWtf1p59/RsTtdttuN4SYBSaGysiLQCWs0rBy5QJTTI4gHth8HJS008gA7BEt+SSPvanb4Q0AUV9doWBK0ig8YuwFEaGwEJG6qjYP9zB3Q0TUGW0mxH7KIzydPiQgIaBh8ZKpDgCQUooURARk7JqTh0eEAGAebQB0TzaNGJFf171t6+P6DG7l8Pc7j5C/xHcqCYPzMQAj0F0lBQDhg3WJoUKO9437w0fi4dBQCaXg8Tbur4/+S7x7cMnFeGe6gokYCYMlLXYwpWpMWsW9a15Pc5GA1Nw8VC09OAtQc3d/VEoRYdr2bWVEJpZ5FoSulbAEVUQ+PX04P78wFyKKiAiDUAxFgDAPC99X2266rrZtoQqqUqfzNDPz0+Xl6fJBijx/fDk/X6SUp6fneZ5rrZen51oqMQsLIroX9ynCn55O7r+JCHdzTzze3O2Pf/zx558/m4F7AH4y76gRAQAp96BUZgF3Z21mbqaAbgYixELMSAk+EuwSu4d7a00julYy1/fEyoHnh2dOcIc+j5joOOV5YwAdZUNqpe56I+bPGdPuCgsSMokIIxKLMEvXSszYHaghMgHm3ppFuJmpWrjv+9q2RVXNwwGQhaXkeYkAj6AUsbtZHuTk/RveZTMiEDG62D9CKng4SW+u91opgQAgRiJRCAzAAAwiDEIgCBwn7c51BXRWwvODMRAiaTSL4Q74caTd+ylzBIrhQXf4ggiRQZSDXx1nbtCuHo5AAEDfhE9wHMvxRAAId3frGg899zL5+Hy1e7iZJ93nnu+AGK6a9Of76wCt7yie8XdKXP9
AHDx8N5LRoW1+6cO2PH6Rw03H459dN0W+9L7Lx3vBARLvWCk/tK9r2nNwRHQCcAQEdERCcvREnv2jUi/1EIOPpfSDaLqj2m/FqhPiBHR3NTutRSKIQpy2IfGheXrMnX/whB5ExExFZKqTMy11XuZFRE6n8+l0liLLcprnRYrM8zzNcymlSD+H1E9rri0eDhQRRlB4IKK711JLqaVUZkFMLPsWFaeLDQgI7ASQ5wuGOgm8706kgbxffpfc957YmwsPwfhz1+HdDU31gKGHTz+Uav9//5sSEuObmM94oy5AGAHulLo4IsIN3BEx18dUiRiJ0P3Xb3T8MB58ycdfPkj82/X9E9c3vBKCJAZhBAZCuFQ6VapCL6d6nmQqcjnNU5V5rrVUEUY6fAq3MAiwDn3AIxwgEIkZmTHSywyEAHBAkEJTYUy94MnVMSEBdJebnJE5DZ25AgCieCQPw8NeCEcQUrI3ZuZI7g4RHAEIgORjudLikDBzJ5iSLrHwIwAHkFyV7nvztx5K9/cOZRIHHgFCQAIiYAIhYEImYAZGYDro7UEY3NVsvs3AOo/R9DfiPPa6S/GjMOcLh1qL/mp8kPWUX6ZICWWLjEwQB3V+ifEB27/FShERqj1CoM09wiLUQz0yRPVG1jzjT+BmYG7qqt6a1YmW5cxSSYqqgnmEBwQzT3OdvCAiQQCCFH5+fl6mivAB43eIcZpOl9OZWU6np9NyISZZqlRh5nmZaylMJFL6Mkdk/ES1pV61jN6O01lJAOF0enp5/s4NVaPIH3cyxED0AEhpA0Bm4SLuTgTuhBjbHmYGQNAjN12Tt2bu5u773rQlOZV22t5hpc7JPNh0wPu+p2PUocwdL40n4515GhouDjyNHVQRUUaqZdBJQv0BI2ACrSFE6BEidxsUETZNqrupQmAt9fXr108//XG9vjbcW9tgwDlAAIpOycIdMz1qLoxxfw8CMgxrJPX5rXr6Riulr4EABMhACKdKl5mr8NNSzlOpRU7LXIvUSaQUZjrOS5h2CXY3H2gt8ShTB1WY628QgQAsXKeCCG7gHgchHSP2RhHoHBHmhsap4tyBCAPoANwpc7n6gYYOiI5waBl8AB4QuUMi6J5+W+I3j2Ndwc1aU21q7u8WDd+t8tig4btlRgJSKqbjnx034cA7XQf1UPMAOgf6eHDIHtwwGBL4+ACgO+l3xRSQu/74VESjSAaUIzoTKpEpGBke65H3pA+8B4JTUjUDBB6q7h4OoR7mYe5vxCqZAvdACHNIY6Km6nWmaZpLnS1QLV9q5ioiTRd3JcRgREBhOp/PMU+1yOlUhfm8nJ/Oz8w8TadpOgGCcwQGElURZkIABsAYZiMDKNrcw9wsLb8UYCIkkULE87xfLi9m8fp6ZZmIdkAHSLFxswQLXEqJcCQ3Aw9CDOh8qScMzTVX1dZaZLROR4pANzPvjx32hR6bM6Q03R3ASG/h0Q4dauTuJ72VSRh+XzczlEqYiJmZEImJR6IMpz+YaiwCXIZtTJ/O1FXNNDyEhYnm+VRKjQhEBtCuAwkAA8kfWNFfuXDwEXdhheio9J5j8OZ6r5UOPdiZWsIiNAkXocIkhJLB/1QvKXxjaT2txch66LDkEWV6PJIQSdH1VKcIiOHp5En1gxqKVGGEGAcvGGNX475Xh3M0lvsNdIahULD7GB7uEB3PQX854MOxtMFMvbsiHmDqeNDBEA7c9GBRHhTZ0DOd6btrpU4zv9FKd6YIc0Ef3DcY93DcYbqex2l4+Lx8B0AIz8VxB0jHDSl9Ouw2rGOl6BTg4bB555fiQMExfPJvVyfCu5nsin5sbOq4hJUERCxIIlJrLbUQojASYhghRLjWIlKLEAGzBYQDmkdrAOjkTgEAN1gRgBEnZkZioiqS53ugzxheOZg5UVo1V9VuMFmYhUXC0wjFOOA4BHB8+6GCk8tJ2/NmTw/z8ihz38pP9wa70N2Bd+AgiCNi6KEIQByIKqUah98ImJQzInSBRyJ
HAjRHckJwc6MgdBv8eJ48wHSyU65wnL6UMUJmABAppZTMApNS3C0zfx6/17H9cRAKB4aD9/+NIZldxP8EsfQtVgpBZ8QiAECF8MO5fjzXwnSZZBZiRgHjiFBvqxkNIBagzVUNAoICAJCw1EIdLTAiqlp4ODhkZibCVHiZCgC0ZhYWEOGaQq89r62LNhEVltR+4Y6I6Ng5ok79YURkcl/qhTT2AdEzhKArU/Bw3cDTFXGIwAjGbtRymdRta7o1s/dQ6c4pHVLXIRL23KVMCmJEpk5791jfXRn1AIQP/qazbg9ZnP6tWhlO20F4PzhwB1C6a7O3mA4RwLv9xIjMEKCQSOvqRjgO3ADzkaAnFUlLZjtANVUWKID1/IG36+PmTZEQLJM6gIhZCjjs62pqUqYyFyKeT/N8mqXI04fn8+XcU2uIwD20RThiEAECNIufrmsARKwpXkYe6Nra18+ftvW21On75+elTk+X82+/+66W4oPGVNVt39zD1M0CEYULEa3rZobMcy3LcnrywG277tcv7h6ALAXyC7Y9wrbtprabKoATgwhNUxHhEdpLfQvjUdwxCx6kIsChuO6ncWi0h60KAPS+3R6AgB5BMRTTAw47/kJEIkVAZhU1QhKxoo6EIkXUkJK06FG5pJsSRB1c1DhIAMIwUiulFGJ6/vBhvV2v19fr9atqg7fmMDFEqv4Dnj9+50e24lDaKTxdzt5e77USAhAEAxABCRam8ySXpQrhUqh2r8QRANytmXUhxghQDW0OAMgAlKxUMAESMBMgppzhiCwSoTDVzFYwB4IOTxzc3fXxfhFH/oVbRusCgiAi+acBa+M4kNCNh8MdsBw2KcLCHT0CfHzrzvZkElS4R7MM7v0axPzmSjuUm3rE4HCow0NBDBqpc+gPVPIbDALJ/R6c97EG8KCV7t957LofZgggwxT3bR3mKwIRDQKdDuMRjkGOA01H55U6VsqTZuYpRjYApB93+8aBy9dYAIJ7EvKElCF3bc3Nk/RmpvNpfnp5liKn56flfEoSBJEgAtwS5WTG437dvu6bmatCaxEQjubo27r+8V/++evnT0+n0/6b315OJzf/+PQsLDEoHzPTpua23tq+KyImS9DUwoFIWGqts6q1tlvXKQMFJS1l2nRX3d0tIIiQmURIhM2itQEsA2KkUMIbwAWPC/QGI+D9YHdBzHAG4tA8HSAnDooR7Xiw2P0dMvGNzS2AEC3CAQnJI2OE6OJsjoQcQMREDmmogIQ7u5AVF3lYXGIOJyI3XU6n5XQyNxbuAanhl+SnDx5yiHomBOTjboxjkBYdMaVoHQL/eP0KryRZMwHIQIVRiIRIGAtTYRw+F9xtwGDiCIMYA6DH1Q7+bXA/mLDAI8NC6fu3ZgigZmYeadA83KO5pc1J2jupUXzABHf/CBGJIKtVACCQkPMZjP5IKx9HKPlyD1D3cLAI9cNrC3dYd92bN/0WCvTPPTag+2vjQcI2Gvc98M2DSMKgu+LuBfmgtfoP+nMOwAuD8EnI1XNAehDoEOyhxfDBNMEhOz1IBAAQHkAegREIjn6nvPqbjYgb9BKEDufuUdT7N3lHmkRXJgHUbSYSi0BEnabldBKR+XQ5PT2JyLIspVZiMvN12w8nONzDNBWCWnP363X9+vXmHu5ojhDgaI623W4//fzLp59/3i/783JGwKfz2QMyxoeIBCTCpRRyVg2zPEvoHqZ2W9d9b9u2RyTc6MVMiAhIABCZvDa+IyKKcMQR18tMkpZ6+K5qME84MTMxv1NMb7DSr/kvQyVhAFDEA11w930OkBEPJAMCEhOrEaE0K8WRqLQiRRFJhIUZkbg4ExNz8az9AsRAAoohqmlQPYiZJRPLap3msm8jGyLgEJaUwXueC769057Ne3ghQ/jHt//3eHBMOAsWJg6W8CK0VJlrEcZTpUmOG3q8FYyhHJAjAizpQOqcGyJynoskS80QAQjDYVtbajDrEQzfMwctvJl5BDEXroiJo7x
7wJEAd2QgMpOIe3iDCCdgIUJAwp0GreDmg7u92yjz2JqpuXps6u6hFk09AvYWu8babG/+7twlHXa4SNTzaFEQhYgJhZAJmXAgpmOHUtV0DNKVoHsE2IhlRQdn4YfMdkGHg/DsWn4YgxSM+9kZQoqdeTgwPvhgKgCCErNGdOeX8DB80UOifYnSqVTLzEpIrBoIATgM3eMChZtqa8Bcsg5QAKbFS326PP3ww2+mOp2enp9ePrJwEAeTR7zu2y/XT+7RzLLoR7fNzZq2dbuZ+/W6fX29uQfzJDIBAqAG+uuXL//T//j//uO//PMPH7/jwB8+fpzqZA5ATBAMHuHTRKVM5o4ohJt77Lua+u22/uGPP379et32m3sQC5da6sTeS44iU5zCI7xXgxLxNKXGQYxMqrzebu4OzhF0aDciqrWWUqZ6e5PbncbYzdwye+FRsh62eRRsBg3Tn/8c25HZRNELG6L72f3TETDVyShsqIRYpGTxYK0TcxHheVlEpJRyWhIlZfYaZaAGGABAWNzt8vyyrptDlGmim0QHCQEUeHcyuu07VOgASoEPLOohoX1lf425/bXMAEQhFEABKkzCJEyFsQgXyaXpXs2RyYNJwBJSek2BRxHXHcUOKJBJTUkNmVlrnQcND3NXNTWz8ObmEAzA5IlI0eNwxO7eBg7LhgFg0ZkmRkBABqTIIoo7aXmcpDCPbW9q3izWZuahGntzD1BHc9ibf8srPWSNRAYiEisRvvlzcIt35TH4pAMj+cj5GanUg2CK99VDuYAdOicdiocJHfbm/ne8eXCch8OD9JR2dO/I3wHxIV2na6XOfEHAcOXGqYiAwF+BSp1iMHPELEoGIpZCwdM8P10u8zxfnp+fP7wQ8+6+R6iZ3m7X22buW2uqZqbb7Waqe9tv601Nr7ft69fVHaZpqdOCiIEK4F8/f/nDjz/9y7/8ISw+ff4y12ld90wDyNRCQBBiADC3fTdtbmYImUtp19fbly9fPTQi+Uli4TSq+Z3vq5tBDMpcROoCHWFuWaWBAMd5TFJJhEU6lfNOhDpWQod4VFgBQXdZSYjkPlBAQHeU3CP21jM1dBQQZ6Cpe/aIzCJcEKnUUooSUiktM5ObhhQrUoCkOACSWmQMCMahJSKAYBEkLKXUOk3zXKeJWNIv6fwl9vKRkTz3BivlMcMHFvX+3YaSiuH8PF5vq3MBmLAUrowFRRAKY+nUWH5ZAICet979KRgOG3RyORnljBYc0CDtuRt0y5PvFVlQAgCprDxCR7WSRzgERqgFuQP6roaICE7ghFmMgkiApsjg5m1r7l6ozFKYCKEgIqIza6BmbWmAxSB01Dz/NPW9mXlsu62rWoA7WuBmrmZvlggzESnVTTKD1CESkxAyY08IyMjpo0o6/Ov7wtyPeiZJD9o7t/CulFIHxRGmPOT4Dbp/eMU3HHSC6Yjh9z+aLRhh7hjOn4/b9A6548Ht6LLyhqK9/xwpc/cpkAM5IIwwwhvIzcLV7Lqu8AmJdvVNTc1+/vzl8/XVPTQLW8y07R0r7ZuZt02teZ6FZD7MzHx3bRQhhATgatp02/frequ3ShRJnXRMiSRFpnlyd2I2NXU7XeZmbd9vbu6uTFBrNbfWbG/W3QvvlVPhEYBpNJB7wCqVXyD2RLxRu8PcS8G/VUm5xeaOcf9lDOkai5j/HMB4iI95lknH3lpTdY+mzSzzlZMb6SCa2YQNkUStiCFRERZiYq7qIkVKccBS1N1FxEOEs/TvEKqeN95rY2vNyi0RMTc36xjp0RN9A5pTRR3S80YZwV2ifsWFe4+VhOk08VS4EhUkYZomkUJMQJwtAJCJETEirH8UjlxCS9VnQ5P2Ao6AAEcI0xau4A5MqdU1LMwA0APDwSOau3rkm/ev4o4AGtoMItkrDEKYdigSgOjogGTmujVXn+vpeV565eScWbs7wu5hFmuGSZq5mTe1bdNmvje7bmrmr9f2+etuHg7kiOqw7fq4aoRYGKtQp5A
AimBGGudCU2EmLEzCg/YeW9O37uFLpRJPMGaWpg4GlDssDxwCiuk29jA7Ditx5xQOaXjUgw9CAhE9Uyo6NgLPrID+dvmc4cFFRByU9nHjg7sETDP5TcJJlvEzMwNVI/EIxeoQN6yfmpdodvtkP372iHVr26pq9vnL16/XG4wWGUl3ZapJsxYRTa3tiog4RWGCCG1b2151vTL4xCyI2tq2rq+v159++cXc57ksy5QxvSyCnpd5mqd0kyGgzPLLl19Q4PrF2/az6VYKUF3c4+vrurbNM2kklyBre8NDydkRek125itioI3iylqLiBARcyFizOYZD5d7NLWmhoiA/mavMKET3t3zgcryTKtaU/fwdd9bU3Pf92aqHqHaC+4SITKNQhMWkXzATETEdZpESin1tu611vP5hMS1FkJapkoIwP3zCQgRSpF5nk+nZV2XaZ6naW66mzVP0siH2ATc7VQXlyRQ7rb4oL0DIs+7jajzn9NKhChMwihEhSBTsgeJC4D3kGcEjiLVnqKJnfU5AMIhxd7TvI8eN9Fx30hgQneMQI+wPAaDKImRt6QWu3nEoZUw/cEAdAQHd3Nd1c0pvDFCUCkEIAhA5IAG3gnoAAzvToqNv22ApqwjdqQgsiPV5fHYDb4/9457Dhf2ZO7Dg4NHQzhA+NiqAzbB3WjAAZ2gn/zHV993DnvG7HE/kCTSANPwoKreXgmVHmJ3Q2PeiamDUhkQ6cBKb975z1yH1x5IABzYy0kUaDc3xNZs3dXd11tb16ZqX75+vV5XgOChbHnULGlWrpm5GSJBeIpWuLm2UCUAJiJME+iquu37um3EWKeaKDOFk6gHmJJdmNapTmWaZF8J0QGMkFDYIzA7fhyGfexNzwnqMd6+xXRU0McIxQ46dZyJb7ch48jfuNrYnYojgjT2vm+DmqXj1tR2VTffW8t66fz5gFdIFMxBiMah5oSo2TKC2ANY3DxKrR5QSmmqRDTYjei7mGLVmXvOerrO39tI6I7htn6LlfKbHszNXdphxIr7b7595VuthCCC88RL5UpeyZlwKlwKMwJSvF3fTnZn6ThAgAeGU2C27yCiKiLC4ehmAUEIIkKRLjVEpji5RYQ5uWNEJL2IEIJBAIhBaIC+K+6tZfeRXLTaUDgZSAEiQb6cLoxccBIs6AzWa9BJkIkcQ5msZ7V2wji56iK8zJlcV5irebQIdWgeX32D1o7vTAhVaCpMqZUQqmAVIsJJeBImxMokRNj5piFV7w72/bQPV+lw6gbCPTYlFfcR+DscN3zw4MZhe3T7HsFWf4DwVlXFEYT+BmD9iv55Yw3f8O3HRyASFZEZSdTZApv7dd/V7HZdb69fidDcm0VE7Htrm5r57Xrb1mzmlfgvABQi1K1p8whV3VURcdfrbXsFiLavpptuey31+en5tJyYCNy22+2nH/+43a7n82nbLiI8z/M0T4QkhUVGGgkCERahUlgYMBS9eZCFWoCpmrqbWzPbW7hp9vBCgKCIcHfVnoMmIkRBvRlMGux0EgwAzN/3DLCOlfRQPR1oHLruAe+Ow9+vpt7UPHzbdVdz9109M8jUMrkp3cKgCA5HRA7jAEQUinSsDYnNzYOlVPMi0nYlYrUsdHgLsu/RSeGeVVndDQfBO3Q04aPoBA5NdECjTpgeCuq9vD9c77FSEb4s5TRJ5a6VapFaGCEYsqYNRi+CYfnvrfwAAAhJuCIXIqylsJCbbh7mRoRTLQ6o5s3cI9ZNr+tmHs1QnSCCHAigIFwKCSFiECsA+m7r6urhgB4EAExAAEQ4TZMIX+bzh6cP5/nsG7QrhgEqQANgEEER8gATciO0DKIhAjJxsgC1MgCeT/HyAu5xbXZrvjX7ZXe8tmPZiHAqdKpMI829ClUhIpiEa+EDbKY0pWbwQzt0w3B4Qvd9iYOU7+kN4yWDCIK74B4SgaPmNh5w6oNOeQvXjshD/xNDBXTK6sCnBwCHA7kdqjUX7uDav0ECyDwVuQTSprB
rrLv/8vm27jtCA1ihO48IAKbuZuG+b7vuDQAoKRo3tS3Cmuq6b+7etO17C4T50zItCxJKsnkA83S61NM81UIEbrfXL//1n/5LreVyeXr58FJKefnw8vLyIsIzTEQFMRgJCZixVp4mLgIEO/rqgRpkEW3X1tTNdN913SHMvXkoBHlhyoKktMSItdQAMEPxLHMNd0fE7F94OFYPWsk31dL00D7Hat+10iPYRez0Hgyt5LHubU9eqWnWlWdqC2APwqA7ESAgebAFIjBmBQqJOROVogFUSyPm520HpOwREEFdj9wDhMjc9VGt8zTNZgbAEQaAlODVEYHuhje6XxQjrHP4AXHIVGdR/x1ZlIQgPe4GkrWmPCpLjxZib67xCXHPm0LE3laBOhfYjwECQi9bjsDwMMtuJ7AbqgUGMAAFCBMFMnQsA9nPLZIPBu2dAAIxOFjMiDAChKRKUQ0FDz84ksiSOYCeTHSg3DulgtmMMb0OjABDNVAf1P79zKWnxsijPILp/iCrcHmkDkAPmx6oZRz6d6s3HhyyeSCrOOiiX3t0SO4jGoID0jxCW/xm395uYgdef/7CexrfXV1++ywkJAagjFabRWva9haxu28A1rPgAUKzm5Xr3qwpQDhGj7jr5mFN275t5t5Um7aAQMIgIKIoswgiErNUoiKCAOHZj3d1UxGZ1snMln3RphFRirgz9VB7j6kxERMyAiOMsAscjvYDmoVjK/Nyd4CggZGCKDK76Oil0BPk3wdxoyeC+1HiMyw6jpBEPu3RqPQbSv4xE0p6bnQPDR293B4QcX6CR9YUJV2XmV4RQORmqoSWyQU+EqC6QLwVM0QY3Qqpt5yFznA+wPQh6UPeh3Ad7nD/Zzx+p18Ru29icEy18FS4YAgEZrEuIwEyEeezOkjCLAoi4loHDogOQZIK7lkU4RlibAbawD1um7/edjV/XfV1dQ9oRs2BARbCijCV8tcfnl6WWoTnmRHxn7+s0y+3tdmXTb+s2tO7EzV0z8W0bW3jtrs2dw0RdEvLYxCO4ESR7fiYkRgBUYIwWTsMAChFpNYALLWVrdVNq/DjIjPiUuUyF0IojJjkN2PmqRemVFuU8OZO73WBplw8hNFJBGgkWLzb1eNHd4U+np/HavRiGTmch2Qc+ugQqsPk9XyFnnc+/pnOLOSxGJ+M2Gsc8NBEaYojBspKI/OWOEFEkTLNszn49bq3fdvW2+vX6+2GoARbbxsTFhGmu7YdIkw1evZNtiGwXfc8KuoW0BsLISEKS6nMMp+ep/lckC7MMxG67vu6r1ezJhyllH4zpZjZum6lyMvL8+VyEuHTeZmmikTLPIUt2J7it99v6/K6ts/XXc1N2ZTNRMOMIcIjJMAy3k+Mqi17EhERZa4vUfZURFTNHuXZwsfsXdjBI1mhe+XIPdni7tA9bEU/wg4AGTJ2D82a44is6vGACBzFh4nhOncbEZxhBMpmNZh9EdSsqQJg21vbd2HS1kzVEIzRnbC3sffsE5utftIMEAtL8bvjHxBHiW50FwGpZ93hYfDwruihx9wfGnX8Ca0EAEI0V5mrsBu5Y+YuESX5woTuYa37GZlkI0wi9Vg8ALTA5N0iS8oBmJmFbXM1VYPrzX75vKn6ddfb7h7QHNRJEKRgIZjP5e8+fvf7D+d5kudLIab/z49fkH953fWfP13XdrWBCdOjJQQI17ZuCLZ52zUsrJAbIeIov01iiwCBhdgRnSR5gs7AxTLx+bIA4rRKLVylveuQy4yniS+zdIgEKJzqCZiOzP0eHMsgTgA4AkQQdjyZyaAU/UiPBIJupd6BFup/J8sG1CtsjpSou8G6g6bH/8QdMyXqRDjyPIZHN15wqMgeOuyA77DkeX/R/TfCQS7dL0QspUzzqal5vO77vt1ur1++vL6+MlphRYim+9ZWD2/7te23iMjaFHPf9r2pqfvamnkAITEBwjTPy+nEyMQsdZJSl6eP5/PHQvgitDBu16+f/vXTfv1qbWf
yWouZqTszX6+3T5+/lFJa21VfpqlKKaVUQjrNE6NP8LzEb3S//fzplfDL3sw0aWVTCq+Z8lYjSUp0ADAzVTVTImZxRKpTTVV4ACXVfprfnTp3b81a04HJjsArDt0Eo5Xeg2GJCAizSC+rac/vtKwx75VSONAIQEodBEf30SEgiAIB3QOAzFpTiGhtT63UWlNVQjAhd8bMTPSulSzZ9MzpEpFSAsBDwyEgNSKMhMroWgpToHCAwqEjBqTslYPw/vqmDg6Bs0gyHsMHx8OOiRzG5x+/vncze5d8Pt4XIQDMQS3M3DTUshXGyAiJXgMNAIxYmSbhWWgWJsZZeBJRh0IsxJlydL8hiAjXlBV1NQ0Lc7JgCPSegHlwK0ngIWQOsB9qKQvZARGFsQgJI79x4AChl+8xghBiluAS0mii9OgrdQbontgFg1iOQxW8A0cDssTxW3iAS/D44FEfvYNL8CAGh1N3X4D7M48P6c96e0tDmhEewnujUP1PeoUBEdmlxFQ1id1m2gANXRFCLYPZmfPiGEHUm3Q1IqKgXjLihEQsiJh5fMwyTXOdZpFayiSlCiJzb8xoZq21ptJaAwCSXVpzDxEVMx5je+xIV4cj3AHUe/hgYQqHWqIWMCK0XZ0iAznj2B9+nSe1ZE5090R6/PHher8+WS8yGi50HdQJFxyswzuA1T/2yO0+jt5b2XzYxdw+uLPXB6MzuJ137ub7f8ABZ2LkbnZw1CkPzE1K1YOE2D1GOEQRY5DvR4u88W3gICv/LQ8OAEVkmebTUmKP2A0QMjsJAlObZNHICBghAFhgrysbTos6mEd2siG+j1XYTb+8btuur7d23dw81BEwXaTkoUAkJoaJbeF2om0KLrsj4snhQzlVsOuM142a2aZb0z2hkDVbbf/JPglJqPvuEbCTeBEx8lJBKyBYZMEPlCJI4BHFumdu5gAgDOgNEScBISGIKqOYHgAAiHAufKpMBEKECExwz07CROARGajvdFsgAGUXEQDEzD8PiCxRBgwkQoreODfNZmeHsuUmdsWHqTczdj6UYA9Bw1srMuTy2P1UPomNem34UFGPuiyzPLqNw77J2eN0pHNExHACA+gYsQUAAO52vX765Zf/ujf76ecff/789fp6+/Llj9frFd3IFcJzMAYgTFWm0zMzXc6X0zybxeutbU139a9r29WllmmemPl0OT89P7PIfH6azxckRpqAK7uz3cCaNrt+ff36+fO2rdu+ceGnp5cXw1LrNC+n5VRKQaDWlCgL/SEcwB3Mtuv153/9l+36NbA8T5NXnCa6PFFT/eVn//J5M/d1U9U9Bjvb9qbN1LJRcC5jkTIBwvBLsjm/qqo/HLwAMPemtjU9mm14PNJZbz24OxYNAHAHjyEhmdyUqLtbIDwoyYyR9VzCwACwJOMfwhTuYdSbZPU/ZsakZqoGCKbmbtvetr1tW2ujLjRrGwMCgtwJIBTVkAZX5BGJyTzQASAwM3Fw6MwBae4U2p/TSiDM8zQtU9FoZgIQ1G0J9OkPHm1U7ad9M4DeWqQb2N71jSDbmjP0rDzYDb7etuutrZuvu7uDEwT2SW0EQASFozJM7Au1EzYJk90QcHZ+KXPF+DrBlwmbae+YDBHm5mGxb2uDgIRGAOBccJ5KMCiyCd5H1JEUzr7xaRMs279FMAJ4A8QqIrVAZMjlrpcy6DZ3rdSxElNHKyk9HZcGQFbjAzimsx2EEdG5IQcgRMbw0Qsl9ZA/nPJUdvm5jAAAnCsFic4A8IhF4FsElPI9RGBI7XDhukYbrNL4uNHzByJrNYelxfB4yDuIdCmzJcob+Ynw2+3zp0//ujX75fOPP3/6ut7WL19/Wm8rqPrewL1UqVNhpno6vzyfaqm/+eE3H18+mMWXa1s335r98rqv6tM0nS9nLuXp6en544tIqcupLqcIeN103RW18U3B1Myv19vXL19vK79uN2LeWyDXaZq//y7meSmlIJI2YxpOVfT2Bvvt+ssf/rB
+/XR5/u7luzNJPWF9xmlvzdrXdf0EDTI5ISIy4NV6ZUzCc0PEUufZDRGTSY0INW3azCzeNll2j11Nst9gdsL2R32U55ViwA0ckgBDhY3UtJSMg9V+iMF2sJ02ErMdhGVgjYA8Jao3EvE7fT4Uk3GWNKiqqe1723fd99aadaWEJCwAAEGRrTu6N3QALs8fxkgRSDdvyPbh6L2P/vyaVkJApGypCVJABACICzEH5OGNLCyDdy97YFQj2XqKDEQCUNZ2ZI1bny4wogXYzxggogMWylZzAYhqvqs5eL7lrpgvQ0RhCqBsZhDfhLNjcCneF6lXcfRu/Xevp8fDo7faiOgVAAF3t+i9l4LQw21HZunRumk4rocKO1apn+SR+xjHR3T8khMy8A6OYrwOx9MGJIYD4tAghWgw1iOz7Ru/6hDWobT6K++qdPwHDwWMR9dW7B3BDh+0dxLEu5Z7+KiI1vb19rqrq2qeDhaWIp0p96i1LPPEwufT+Xw611qWeZnqrBa1iYc5mBQqYCITS5V8PVeRwlyIxAMQHAbWyG3vVTuGoIYeu+relFh9TEUVkSyYQKJeFuURFtZ0X7fttk7TZvsOAVhLEQqgWrnWghi8MlIOCfPufXUHMMkO6o5K13V9bEGvm/pmP8Y1COK7b/hwXqE3pBy79+CQ45Ec2s8aBBANIxSBSU5mw+G+RQMxD20Q8XhqHyzZgWEenbrh2w05QSLioHHzd9QzGk4hhAdCBip7OiMRuQdlm9guTL9KAnyDlUTm5bScpyjsUwWAzJp3973tWaZk2JKexAPT96Fq3Y1g6AMXgIsBb9o+fblu+/71dV3bvps6IDNyDyIjYu/7UBAu7DM6Iv70ZQ01DERnALzh9BWXBgQIp5nVEaByZrRl95Gsn47IoTcR4BDmjpatWu1grXAwx4GJcoEwesDYI3IIXxyhkTfrgwSlUK10NE5Klwpg7CTctzfuf493GXI3ptAluY1MkHFlh8R5A4UfoTeCMY+3t8sX7g/GuIscKPfA/xxJtPcvkS4m0h0rPZyVR2yVAox3WzYKvztbcbDdhG/Ukqn+/OMf/vP/+j8HyeaVhOs8P3/4ztTRnZsjxOVyfvnwVEr57uPl48cLM09lqTw1C8Amm0nVHW7cVKQwT0RMtCAtiBJQ3cUjWot9VzRDdbJM0g8PUDU1D0SUVymfl72pWq3TPM2Xp/PptIhwqVPCP9tV13b9/PrzP//h6y8/tusezcs0n37zu9PTZYry3ccLcVu31WMPsH1v623dWwsHZmGGUrqOr7UiQISr7vu+m3lrm6raN5OXoudYeoxkmzdYaVjMEUjo7tbhyGWMgXvv0N63AQIdetOjQ6WNvhPRyYOsNU36xzvKPViiLs53imkUQlmHhH0WLCIzhUit1Y2JgCggm+pan5CWs45NW2pnbS0RGCFGuGr/mGzcjg9f7de1EgIQc5mmOs3ABLVA9DQFdwskaDu4k4eDda3UVW4ecIw+pVOIOJs1BZKavl7367re1m3Xln2pmAWyXIMRCUthFhGEGb2iA+KXtYVaOLpRBFpFnUqmE9XK7GgmOHLWMnujoZuDAVg3LtkmCCMc3YBooIYjqyAJHgDMhkwQ6K4PpUl3HTOW6GFK5WirNNoc/Wo44TjjD+j8+BUOZJ5keQRAICbFgAAxkh5GO3DsTh8iHtMxD63U2x4ecumH4RtkOw54c/BKfdejL4x3nrIDu9Q+Y4OTtR/v1jttvAdm7v71y6cf//DPWCY6/4DTRQrzZYpA9igWBPjhw/MPv/mu1vLdx6ePHy+E5Eph2DSatkADbpNKUCNmZkEixEpYEAVAPDjLK7Xd9VGMmGyzuLkFQKnb9HrzQLM8RNP5dH56fsoJvbkh1lx33V7XLz99+vLTz+hYuNRlmT+8TBUD+elpBr5cb/z56+fbtmYHktYaIREXwuzoKIiYGeKRLeLanr3i3M3jfWZAx2hHbssb0chOyD1A2gUOBjky/n9kZARAr4E
ZoxiHCYp+NAPc1A/11EXRw0dgtQd/Ujbu9+MDLHnvMNSrf9P7Z+IiEkTMmANbLeenR5ipmUa4NRrKCNxIEcHdPdMNzDMCNcI7f04rDSHF4SoMH2Zo1IyVUB9pGJ1GO3qCU/Ir2YKTI9Ad3cEMzNxV0b0QEmcKJQCAcFZX01yl1CIIM1iFKILIEkwOYA7ZmywjaUjBAQBYi+T95seqta3d1LQ1B1D3EM6kAcfs/R5DJ933984mxiN79CtrEsejHGSCI29ooOzxrNzdvum/pqbGEgMgYhBgpi910TzmPsRw3FJtUVdG3MeC91Dp3ZXrkxU6QR2Qg1xxQJy7B9g3+BEoDQ/hgS9/WI8Ynubgu7sgU28Y/XgFhKm1vTEUJpEyQRCIQBBHVA8CnOZTrVOpBYnNwSF0V2ugFq11o/uokceBOUJH/vZPp76QmEk06VWAQMpqcsD3Qn987TxgwlykFMnUl3QrIpu71MLLXAHicj6buTC/fr2a9bhFBDCSiBxdZxExOxa5WwIB+dVOJu8l7bAPx4nDIZo4XO6+8B0iEWFO07s3raTx1gEAIxscLAjc7uNEInoH6/CHGzkEYgxkyL3snMjhuXWnNQiJOEZGMSCgYSAGRJrPCCcAs3xsSXO7MSBQEBoROh0a8Zvr22kC2I9d8LjvrpeYEYDBsUQh9xEDgGP9ureIKFKJi3u0m+nubfd23fbrjTCeKyGgO5ohAIoQSxHhl6fz+TwTQHGl8ILIwk6oavu+hwewAa2AxMAVGQDn6RzAInJ5Os1z3dv185c/bO16ve6/fHptzUoBYWNyxBY5AiMoAwE9k7uf5e6Nd7flkXv5ZsmQQARLoeG23l22lOU43LNjxki+6yGGGNgnIwAi0vi9ZUSd0A879dC+hjk7jUH2BcVe19IHFh7WFXsRVopjtl6M7CQ5NvchBncch7g7mhk5HCC7g6N3J6q/FaH3GNzDbz322/766Tqd5fzb5fL0PYIQLYhcAGYEBrhc5ueXEwsRwbqpW1w/77drc4etkTqqm7shOBISBVIAWoBFgAeCg3m4tVDtLSg8CKmUuc5nM4PWIgJ4QqlIFZAejlZ0SBBAQIVLyLRMp5fLk+g+z3NhFAwCRdiZ+Pl5fqJp33Wa6uvr+sunz6ou8rnttq6ZdlBPpyciAvJ0wdObc7dt21S17U7M7xZw8DA48HsXuej4p2dKDM9tjHJ7cLmIqSc133ekh2VwxMGSANshmrdwMPDe9NsdAYERuoTm+zMOVOGAGaXMmaHDR0RI0lmk84/hIlQK08BgEGGu6cFp283UTTdhM22tEaKZ7YidYw9w70N3/i2t1EWVhjEcP0klCUQI7AzYhzPddTgAQu+STVKIa8/WdTd1a+pNWXCuRIRuoPnxQlxYhJ+W+nKZMQKNwZ0BkcgBHZpZcwwkzzJdRBRkQGSpRFOdynfffTifl237ynxdN2eCbVuZnAiYgjDbYhj01NK0vH1c3xvVE3f/fRzZb7QS9NkIB57BzmcOajrur+/nvb9Xl8Oh58fbHfwjHKDaoYOmexFPQqSjHggRijCPuc79/4QI6NEHnY+aOiQPPzpkHF+bDozYhflx+w+H78GkJy13dDYbAOpdPCBAm+1r42JMtdYTURG5EEkBOBEw4ulU5mUiQrdddTf1621//bJFoAYHkMaouITAtMHdq8DRfs57d/CDec7ZbVIICSwiAogBs5HI21mmQzshIBEzSZW6TLNPcy2Fe8GQIygiznPhKqoeQcvSEOl8+sO6bhBtXTUiiLiWSsIB2bqLEEGEszSXmUtZ6X2c8s1JG5NsAQD7fJO+oXSPSuRAlTuGQmHJKoUhXgN3DFLFrbdYd0VDcAyCsLTJnoxhF+K7QcP0CnNsI0BPGc+JENBbN/VRl5xdlkWopJGEHh9xZw8PN0YwIzOKMFNEAFNFRDPLlnJE9499d73RSmPzw9yxzxo8GgN4cl7Wo4mjuC0VM3gAmLuFIVEgC2ZWiIYroleBKDA
VOC/IhGagCgBY56nOZxG+nKe5cqYVhDkhigghRQMORfdSSpkmQLRgA0LiaZ5KPZUi50tdlkJSL7qU6u7w5fMty3+OUUO9MjHIc6p2n92Kh6DG8KDers+veGBvF/IIZdyPcLfMjx6Gdy3hY0xeh85dS/Rq4c4rZVA+odLAN8JUCiFmR1AiRBGWO+I7NERWF2b1hlMfhDX6Ah9fgY4vgAeBdtR8x0OIB+4KFt98ySPy9351sne0EAv13tdh1syCGA0JEA2yMxeYgzm49wk2EcjBKXEWCIFjDi4MLgQo+GEcmx8ODRCRVCkTo5IBuSMX5AIkPR5BAOgB2Q6lg9TuGmFOpMEsiiNGwAi3cNSWbXsDwQvhMpWPH56J6HrdiKamNs8Ll0qEHuG9gSik6WNiYOiDId/ID3Q2JKFgKqORJRDxaCz77WVD8fvd5u4nBDvMaE986VlyjmgQgT7y2rqti4EWo1cedBXfZ7ebB1mM7skPDvLhSRISEQQwQ0QGN3upAAAAuKOHhxNCkBEp9Ul/Ednmycz6qBULRMc3VEK/3mOlTJJs6ugK1qATw+7u+76ZqTuogzsgUnahz4zqiNi1NWtIdLngjBjmbjt4E2xPcywIp5k+XKgwqqEqAPLp5fn8/AMRVYFCEG7b5qpOLGWaiYVaw0Luvszz5XQmok1tN2Pm5w8vp6dnEV7OU62lNZyX7/f9XOSX69f1Sqiq+76DAyIzV0SK4My96m0NR7FQxGg/9UiU3P3pt6cugUYPaqRv5jDCrYf2yWKlbMftno2kenHAYRoPlMOIjBQQhuiPMbMx4bJWnqZCRLVIrUKIRWT05cDDBQAAM1fV8GhmrfVWsJkj+vjOD98wPODevvRQPwe/MJ6cv4wBr7L0+F0MDgBZSqmnUmYmJgB329vNA6MIT5MglfDmYQBmYQruCCxlxgCQwAg0d7CwDFAkbQFu3gIoQ7cBAWiIBmiAEEjIReZzddhbk7iFO5eFZKEyg5RgCsZAD2yR5TRZoJHGn7OBjUjlMjEXJgy3PUBVLcABSXCSKvR8xn/4u23XT59v//yvn7ZNvbc8DLMMvRgCggcCJldVS33XtztLySRLMXtbVzrQ4NBKedApxyIIC2ctMva2sLUUEb6j7sEUZvIFRFjThuDu1qgxIoBGuOX06UAANwxr4RjWwpobuzbTRuiGQRiQxz7zeIbYZ95QUB87W0uKZdYpAgCEZ0DcdRczNVUiMFUWAQAzQ4SeFOXRmo35rX9WK0HXoRF+NGnLWURHmtWRFdBJ7hyO6hF7010bEanlfFXPFn4IXji44FzgNGEVUoUmCIiXU708nYiIQxnMDMwwAEmIq5CUQDBVNK9TneeJiLA1aMAiy1Ivl5mZpiUbpYvZJALXeaoijTmyue2Anpglxkn1ZUfYfjQPYi8g7p7Mn2C+YVDGSQfBiMf2lwyasCOmzKjz+9T57m4kRjno58NfDqI+AwwBkuROFkmkFGGmqZZahZBKEWE++OtDn5gZEbo7KEL2fQZEtOTAR67DG4U7UBLi+DIPnNOxEo+iM6pzI97ZOQQgTPvJhN33cjPzMMI0Z5Z19AEWYA6RWEmORYPITPcRVoKBlSCyWUZ6GI49HphhGSIWkkIOyA3BkQQpc1QYMEnsGHV+cXg6AHgv/e2DJzEFHtwt1EMRuZRCDFDk+enSNADK16tLaVln6+4R5IGP5D9nq9xvmuRijtTO4cUJb6P7TYPMO8xVMiVIPcSRY2+JELMW7WFbOoaCiJ4x51lg27tuZC+oEYbLGig/JHWEMC0R4jE+JTrZONx8vDv/QYAQNLASDT0VjllRAyOzWqQgQPbhTUc7h2N3fXSnTO4S+V4rBUBgeKZhxcGBRgQgESc5FRSA7qiG7rA3u667u6upuRHHtu3MFObtdrO9kW+FgxCfL+U335+mytvut80C+fQ0nc4TMVdGITIzuV33trNInRcWMTU9n8JjnqbzPCOg7BvvKxKVKZB3IFJrBtj2dtu
2tu97sxRzZi9igIBIZoCdjU4IQGP3BuNzJ8f+JAtwF6vhzSDcD3F/elfp2eIyE+KzUgeG1OUhylONqVeySx4AUF/rLq/MVAoT0TzV02km5qmWOtX04Lp3cKCVAIAwc20a7k2ttZYN57OVR+9j2LFbHNVNmXsPyXY/KqRUngdweliPrIo+gkOPi1NqnU/naTllyByywNNDTbem6sGlVIcc72rZRC378/RBR+4OlpkNmH2x0YkDKZCRmUUoolaJxuhQAMl6h/te5dqpEqJH/yIx8WEdYATGe5IdBIJHqGlQuFsnDXt1dJg217BADBLEZSrffXzam63bfr1tanZbd9UAD1PTpgCY2ZVu7xNGOjmT6oVGaTb23kwRkRC56xNiABxDkzBbQRJSLUVEHiDyIJh6eDvQHYzNgJm4Z5Yll97zUTIDLltLZuQRoGdSBZNblmyMXizvMfM7HD0cS4Cg0e6VOQ9ckZIeXGsFAZVFODvEMv+J1ua/gpVGs+Yxvzh6kJopB9QRUEGkdfddTd1vm376clWzJCbTvIe3MNOvV9u2Sfwy+yT8w8f5H/7uw+lUv173X76uHjQ9LdPTmViW+TTVycxer6/bvgnzvFRmzqQACBBiYYaI2+31ujIg1CVYtoDY1Lz5tumXr9u+6W1tgcycvSwAIAg5O//17Mm+qtgriqDb/kRV/TUD9by/sCPrbpSi967J3c5TYZ0xiaZH5WDOUut2h7jX/WO3fBnaONwxQCRhRsJSZJoqMy+n5XK5MHOdpjpNOABJF4nUHtlgy816vzFte/PwtrW27+HR9l2buntrmmkorakPb9yz0cUARoesHCW7ONK9I7Cz0Hh8er+IaF5Ol5ePdT5JrYAYkH1rLSAciZihVFbIgb3mDBGADBzh3qzlZCeLTCMk7GvEjgLEKLVME4RDKxIChggMzYlpaP/kZpEo4/1CTGNSaEQmHIcjUESMPP1ek+3he9s52E3THWDoi9L21Q0AmWQmkqfzdDqdHfDzl9efP33ZWwO/rdcId226b3sHBcg5L/qNBBFRIS5Mw4NLGBQRacN6HggkchNAFMqBJSiSTbhpmkqRgmObDoMHERAGEQxBbkbYhHYmhAziOXSdB0xYhEvJbt6QXTfc1DBMoXtw5j4mO6XB7qnTAz/FCDl377KD/0heiYmMGDzMBAFN3UhNfZdGQIV9Z2NywrcV8L8eg+uqd2ip8fed6yKCTETIxGrz1kzNiIEoAtDUlBHMTJurAgURCONUeFnq6VQ1YlI1x5JVBCJ1nqZpMbPmFjlTd67ChIEYnPwsI0aEmhRjQGAGpMQl2W3GNBNQE2oQUzhzyhV15XNvZZW8YOd6D57n/r1/jcm9/6qjqqMk5H5192j4a+7gvUc4xGhKCdmGDkfcDtONyNaBhMPM55yfWgsz16nWaWLhOs21jyRj6h30huGKnHlnyhzuOVDQ3VN0fQx1TSHLaAORd3L2wafsNHB+HXxU43APw3VeKb4xdMmaFGbBIW1pc9H73FF1VwdG8EDrBH8AYOa192mPh3pMnDP+JLUBgcwEggEIjGH4SN3g0JSDn8FRTTb8F4C7V3L/ezi4neLtv8Fk+jzziDNFK4RRuADSvu+1CkAklknM4R6YxY94hAjh7f0d5gf6bVL3KdN97/COemX+6ANOSYIhZZoVHVZsUJZ37sCIsooqz6v78AqPoFt3V2nEwrplg4flHz7cfZG+kfWHU4FHcAY6kiaKiKw4ZWImitE0ztNlxlFa/vb6phclUy2lTiXIgrK/iluOK4WACLcwbQF4u7XX121vdr3d9tbcjQKZIAjWm/tOGE5qBCDEyzyfZ1rOT9PpaTrVYsybhwMWASEsMl2ezs/fmSlMS9lWppgkmB6gY6e6oix84jkAUBAZPSKYyR0oTjGXFlI3pKq7mu7ZviedKQB0okCCAM/GJTDK4hAZGSCJws7EJA/6Lbw83G18q7t7tNrDLFTd/N7PNLESQDcsjMQeBHdqk5m
lMCKx5BwKqqUSU611OS0sspxO58sTs5Q6lammgHZput+YdxDuGYMzU4vwrK10s31d27672bZt2tRU13VVVVWznKI+UlPeebF3RyGV+fjhr6juoWozTTmNVrqQAMjFIMBNtW1uZGqeNd86Yvym4Q59PAwwc61MzDKVOhViOlVZKmOQLsWphpmhhUD49HQ5EQKvezNo5pUJQ8E5Ewg8ianoyX7JVHRvSrhMtU4TkRM5EQOgh7MjCTGhE4A7IwSiRzaos4z4TOLfPc9qhfBFBLZtD/d93dy9bS0itm1/P5CiMzld3AATtHf9xJBIuSTXRZxYqQiX7IheSslO07WUtBOAyfvCyFPqhUzYM80n06aq4Zqh1yxamqfpfD7N03xalrnWqZZapHC6VZhJQRnUOfTno6gddGzHTT18OPZ+1HYCYTDnrId05bSUUoQQN27pwv0bHhwCcA4smqqTB0U2Bo7Mms+BZe6tuXvcrtvnz69b03Xb923zCBEARgfwzfcIBjgzMWGhcj6dn871/PS0PH1IrUSrkgGWAsJYyvzy8ek3f+VmfPq8byuFlrhSKIA7KECoWmsOEbVIXRggMu0w55hpAE2AE5ljO7dpuViztt329dXNbrdtvW2JoRw4vSwfmUt52nJ5XMM8QQwiH5Mqvrni+Cvty2DhMoFCXdXNfG/WmrlHHjrAkV4JkDxCDC+lT50mqrWwCAtP0yQidZpOlwuLzMt5uTwzs5RJau2G9OAV8IG0H1R29FLJsLbpvrvbfru2bTPV9XZt+972HQna3va9NU3638AgDtqgo6Sujh60cAdXb9jduxjlyUfvNIVpa21viBhWA8G07fuKSNmCKV1Ly6ZIkDF14sJMWFlOk4hImcu0FGI+LWWZC4I7Va8WpkpmOxDa9flchFjWvfmuVgkxDEzBtfO40THQIE17KwYWmabJlxlCIzQre8Ii0Bm5iEQEAziHeay7ujkQBW2AOJfpcl4CYJ74cjrdbuv6evv8y6cw2Ldtb7qtm9sbrTQQdHT+HQ/9fhQ2cuWSXc6IjulJlRBLLbUUIppqHVqpo3Y96mjdITxJfndzsxiVHyKCAGn45ml6ujwt83Q+nZZ5mmqZenp7x0+JYuNAbAMKPpQtjHQmgGzEk0JCXcx7cSlKuFNE1FpMSYtOtSpp2ZMaZfrzWgkOq5hU7K8Yw3v9Xlb6ZLHPyOwcTIRHjwBwulIkUqVUlhoogRJAEQmEEisQMpMUQOIySQQFsSsFBhgGBDj1meuBPhwhD4ug7PMNgE6OWV5C3tAku6m7qTZ12hpERLz/PgHHmcsj+PY8/okrfu13D0GL7FTQhzv1B3GQyeNsQNcoI7CRGbZJaLIkwykiIiyFpfTRNyLE8qiVxq1H75Iwbi16D7H+UW7uauGBRKK5GsEsLk7Wy7nx/tquhP6MI3uoqT+3TPe4WkAEYlDvHZqKK4AwIDy7rkUm7wb31hEghMIojDktlZlydgMCRkiguCFpcQhVnaZiZk19qgWRapHMOB3ZNPjmvvDufR8+UgSBH5jgzoYHYJYyJKeSxPT4fQhDAFaRqRY3r0WqFAhE3IeZ+HZlBufez1lf6nTJuBvEFAdCRMl0BaTCnHojpyAdTLcD9N5m2S8gMDxC2A2FpYgkSMnyWmEixJrgKOUr/asBv99K1j0eeARWcuPxjXMXh0z03yJAdux5iHBGd91o/BlV4m+v91mUZtq2dS8AuoHuKdmUvSeThqEcgAUQodra3jBiEgGEKlSEACD2FqrCtCzTUuX0fD5///vL8xlP5fO2vBr9/Jl/+sXd44V5Oc8CkyttqwFhWZ7L8kygFCuFejT3LcCKxeQWHtbU9gYB7O7ugDSLALMFbcYW6IreMBx0u+63r6btx3/9V4d/VbV1U8+pk300CCT3EQAW4AgeYEcsw4/Q2fuzBsmo9H8dQAndIQzcIjvkqXrTyI5U0b01QEyqO5nWPtCxllKnSszzPEkpLDLPM4vUaa7LmaWUaZE
yE3HmzY/o1yEk0BHAIADzzhgwIkiqlxbuLLVMzU2lzLrv+74BcNs3llUViHRve86eOYgXgl5MNqKVA2+M8/xeb0W2JvPMh6EwRi8UIDAXuFQoBc8nfn6emLNzFUJE74wf6esaQBe5UmmenMTPZ3p6nqTI+XK+XM6IALGEa5jtt5vt+/W6LtNyva5fX9eXl697s2mW06mWKj98/2FZ5lqkFCFi7DMBO2gCAkxEVMQdwjyTgnAcMMKcJOkBjgR1koCeaRwQ4K3tAYBCeF5qYfzrv/rtNNXbbf0v//Vff/n05bZt7/KVIr+vWbinVc4wGyHVQswsLKd5EhZmLqWmi5kPioiUnhfCIti3AKLzcblBBhHaMgLr81TOy+xue9tba4iQblMt8vx0nmqZp+lyPonIVCV9q1TSXXcTOiETCZMxcbYP8p56T9mraPzB0dITAKL3MURkiCBgNxEDVCm1FEKsIkWKiL5bn/daCXKkzL7tG5DtZHtAZJnjqA+DUX0HEW7atG0skh8zFZkKR/RelIV5nqdlqafnp8t3v7t8eAmIT5vHGr984Z8/ebgvFxacBCc32nZnKcvTpcwTgiPsCO62mV0jtFP/Hu227tc1ok+YROKyLFyLBq3OGoRYCGYE0u2q21fddwu4vX7d931vbrYDIvBRNR8wJh9CgANYHreAzs7+iq1Lirpn9kSyxZGNIiB5JVNXi9Zib+4B6u5+dCMJ6eUO1Gf/MZdSa63MMs2L1CIi07yIlDLN03xmKVJnLjMSEZdsGjvctwPQ9soMgKwLulMB4ebu4C5lMVU3LXXWtu/bCgH7tgLKuirgrh4AbZC+/bvm/L6jI+exHvcbeKeWIlIlYTiCM3hloIBF4FKxVng5yffPNYdDFxboPVgg3PdtNW3hpm11NxYqNZj95UTffZhKKU/Pp6fny+FUuNt+W7W1221d5vl23b6+ri/Pr61ZnXmaRQp//92HZZ6KsIhk4na/zXTgEYCIRbgUtMiB4YTdC6WeBt/XlgilCBKq2d6SrGq6NwBkns/ztFQh/M2Hl+cvX19v67a39nq9Eb9ZpN751PxITujRGcZKmH2knqZaSilSpmki4lJKrRMijRgckjATAY65FSORNzpllYyHhfs+T+20RISamhn2GatYhM+nSYRrKcs8MbNwVhrn7WBEbzWf1U69RxWREceopXtURqPLcAe8kQmiWdsVASzGQytJwZ5lKoWF/x0xuANvZ0J69EMY8K5bd/SJ6YDpWiL6YBERehZorXWapzrPMi0yLdpa21Yz05YjvnvRB0a4mTbNCkMiGWPOHAiDLEIwAt2DHNlRLEtcAByZADmAuz8ORFiZllSeWc3ERXqjtpGthsM5OZSOw72b0HBIx/f81evPAvORW3GYr7vLlh7bcN/7ZueOd+ctUxC5o+rMAB6u/cFw41ALXUWMexr8Z/6wu6WEafTJiQMBjIXD2YRFxIp0Bz+DejjQX2YwYcBIs8SHQYR/wm9DRBGeaim1zFOZptoYw1UZ56nMU6lFlqksUy1FqkiVggNxuXvl0EbuphLuxsxSCjFNk+S01Cpcku9jwkxDLoIQreWKQhGepyLCdZL5VKTwVMtI6qSxRvD4PXI58zYePNIH7Rv3J78l+d/wixmWFKFaS61lmuo01ZyU/bhECXlyVFRuzlRrrSXbwNZSipR5mkoRkTJNlYmllFoKdjMmgMg02mshIkLEOJwRj80hwwMhCMHd2cjdsOdv4kEPHP7bvScOHozifW1wdKcghDErODLRiY6g5wOvlIuWRT3RKXaKyKYCxOPPrzK3v5IZMMKbFronT9FbEfYQT/flLGzzuDlwA3IgDFcPRUKoSHUqp9P8w+9/9/H7D5fnl4+//dvz08vPf/zjz//00+36Cm0twZRMkilo216/bobTcjo9fSCZiYirIFNEC79BmGuztoU5xyqwRLirZlH8Hhg7ABWqF+YqZZnmJyLR9lW3qe236V9POCEGRHFnBchUuLt
h6RVoMIqDIDKL2HxU3v6pa1DMI94UORZ8b2YezaK5R+8HANRLvWmayrJUEb6cl/PlJMLny3leFmau8ywlUwFmFpEySak56AZJsjK4V4cfDvlQFdmStPc37HlxI/TM3H/Nxd0A0W0iKaZa6hqI67bJJuZ+W9dQ0OxKlrauU/84pqP2WvODintcD2b+/uPL3//NX03L8vL97+bLc2v7169fW2vLXF+ez7Xyy/Pz9999LKXM07RMc3dpAd1t21ZrzcNUd3fLtCxEXE7L+Xxm5mWZ5kkydSJHwFKYErR9Dd+0XYvwD99dEPB0WS4vZxae5jLNlRCZs+dXVt5EtgsCHM2rRmv0wQz2PtOIEDyUGY3GRgi90AEGBxMWvkJgFSQWxOV3v/++zBWIpul/uR8ugPNp+e1vfrg8PTMncUTLPM21ivBpWWopwnKaZ2FmkSxYSaOVwVo6mreOvc13HqmOPaifmTIRkb3DIftIux8AmwiTdBPmWiRZpceR5xBBCEH9mUU4lKowGIdFFioWgoJB6IIgCNQD412PJDOZ6UIMji5mCFZcizK2vbRd2i45ou/xjP3KjJPcqXCH7HAKAD1LxTuCCHJAA98ddgcEIAcEQA4yY8JpwqnIPM8fvv/+h7/67en8/PTxd8v56dMv18+f1q+fviyiZ+GCJAHoFtba7aatMxJElUrh5URSABrEDmC6rXF7DTOOElHD3bi5qrm3vamZFJn5xLLU6bScP7KItqITtL2W00QVwADYgwwAoZMLHmAjzJnl1H44Kvdc4XdLBABvCi1ixCLSp4wc2qUW6q52gEwMgBRDEZ6nWoTnZTqdZhZZlmVeFmKu08SlEHGpE3HOPivUM3AZe8+gY1R43/foiUbpcMPoP3KvJ4ceV2QIoHBEdFcksrapsLnPyysRrtuW2SSR44CG0uuyOroXDqN4LMf9IqLnp/Pvf/v9vJw+/va356fnfd8/f573fV/m+vy0lMIvL10rnZbTeVmyggoD3H3bVtUWYWrNwwbLiiIy1YpEtdRS8nxmeyYCKzt4YQxvpus0LZfTLFKfXi4v378ws/fMdTxAT25qLz3HQfL13OcxxsQDPBAzR2nUM2Nf+0zFdPeBXgGykxmgSBUSRPj+uw9lml9f11LL4wGbpunjh5fnlw+lSJFCROdlXqaJhc/LUmsVpqnUdJpKKT0HnEZ1UcclQzBHADZgZGJ1cq/XYJqP9Au3HnM58m2yqQ7d6/6P7gb3SFSPRaEwOVNhCiYHpMjcZmAMQmAIhiCMrOjE/uYHZ44EDMZG6CpaRBE2kVWkivC/ySuNu+2O3PFF8fA/4s0aQGQ7JiREZmTGwjhNMi+ynKb5vMznc5lnoOzk6eAGboxQCpc+kxmwjzMaBOjhPh6sToAbhKMHRlD2WlcDVVez27rtbS8VqGwVyb2kBgLoXdIBHAiQgQS50pGDAYG9U+DhlVpk9ZwHRqCPSXJvVNDggnEknoyoZG+wEaP5w2CFu9wyUxHuCH+qRbhOtdSa07VYCjFlw7yugzIZHw8PetxoKqEYpcE90hPDxcYe0ALCe1+le4Q0tVUXOO6uIguz5ef2xLYe53RAAuqDiu/HAO4g4Y1aQoRayrJMyzKfT/PltOxFwK21Mk31cllEeJnnUmqvmBkhspQD6bNnGD07xHQXQrIJwVEDenxoX/cAABEutXSuQogy/34I8pDXPMJdMT346A/HEQdWytnWMD5wuM6HL2F6yCiWUkop6Yl2eiLnTr+NeyNAET7N8/m01FJKKUx0WuapTsK0LHMP/EsZBqx0tyn7oYzwwjtjeRzKQ1z71nQnoIefR/3vw7GGoAdV97BQcM81uRMQkO82Gir1uRgEQRgEkV0iCIfUP8gLIzAhRO/OEERMKExyD/jdr2+00uhZ1k1/+LEVBIEI3SExCPU8fMI01cKEZ4mLQCn0mx+ePryczs8vv/u7v/7+r/8GgQFoa7vqTr6Kb4vUj5elFFmmAhRAME2Vl1OZF0Z
ydQzX1VCwzz4OdwVrFA7m4hAW9nV9vb7e9n378ec/vr5+OZ8vv3M7n84B7XQ5MYTZbd9f9/1m0UhAKkwXCSlxjP6JcKOIADe3gHDdtW17eJiKm6ipu71foUw2GRySW1hz99DmrXl6cJrqCfF++Ak7WBD+8HL5/vvnUsr5cj5dzkxc57mUikQikqohWwVlEkC3BR5B3kPXd33QndB+Z3CwAYCY+X8jWnd/RRcaYpZSEKHqPi0LEdXrysLmHpjdUAAR0Hu7b+iuXLpuBMhd9h6Eiok+PF/++ne/OZ3Pv/n9755ePqrqtt1UtdYyn+Y8aaUWJBJmoMyIIQRiDhSGh1SC46bv7P5oAATuGOCZKmqNCJ6ez6WQSJ3KRMwiYLq7Yw8ep7Ie/X6h651+3BzBEccw08hEKsRwEw9Lg4wjlRoB3WJfte1tvW236w0Avvv+w3ffvRBGTiKEMCEvAsLvo5RP5/Pf/P533//ww1TrNE2ZOlRLIcJSJKt5R+esg3c5uK6BiQfiGbqiO553IeXMVgM3MqeIcDPPNoDDAcgX3VOsu40FOGKtPjKDEya4UziFR5YtAghGxSDCglAIEEMI5aiDuqcHADEBkyO4kAkrRquitWgthekt1fcnsNJQkT6+6JE1l5OlIqzjAQRgpFqYCafik8RU6XKZXj5ezi+X5+8+PH33UZvfXlV3dVd0pWiV6zLXWkVKHxKeGYNSCyK6OUKEejatU/eIcAPP4iTnxFJbi9d1X9f1518+ff7yy9b2p+ezsNd5imgA4t5Ud7UtQImDBMtEThIwevpmsMizr3eEh4GFtqxjNwdzfZcZEAMfHeapF1pn6C1z1kaaUuQxok4mlsLLXGuR03k+X861lOV8Xk5nYi6lihRAHG2qqdOZdBfqjo3iLpDDOo62XBCQz0kZ6/3SBhAHSJZyGFNEQhIGDC6l1BLh0vkFgjE6cbyuD+/Eh0kqPf7z6M0BENGyzB+eL6fz5bsPz08vz+7e2uJuUkqdp96745BYGPYfEZEKycGaxtu3HoA0U7/SkI8KY3dEnOdKBExSJDtqg7tC4J2GA4D7JKODG37AyumuQmbDmhP2KY197Q7GBcLDmulu63X7/MsXALiclw4cIucEOGHI6O94vxCnqX58ef7uw8syz/M8E1HG23AooeNTAOFetTOAUNebb6iFB/gz1A1hGCIAGAI6RoTBodD6sU5JuicNxf3Hd/j/mHHWC+FGpUcioMzfxmAMRBQEfoOVxrI5BqEDKlFhwsjmMVzk35FFCTDuOjrHkn0eHsQoAAMxhHgu4gFTocrAjLXIPOE0ldPlcnl5OT2/TOdLPZ3jumm7butmupeCMUldpno61Vr4dObTE0mRaeZSiDMZxMEU2h6W81BXd7e26X6L8DANUzPdt1u4QhhziCCRq962Dad9afuNCEx3Nw1LYiEzag1MD8IlURKEIzihB7lweEGnntDCDen9ih1e1KGYHmUbU3yJEAIkCDGYaZqEmJZlOp3mWstyOs3LqRSp81ymiZBEeryfmOEIhMAQIsg6eoMs4jzcWhjR0sd7Ok5PJ0vgwP8I1GvOhhfTT0pXnt1XSOOc75szBPIF7tGTQt5g7vcLhL3amHuQBQFA3LEX02QiTH9m/+sgZx48s/t/Ee5A4NHt6nTq0HHEwhJZaXq0Axnn9N1NfuvrJKl0fPLIQOunEal7zN1xYEdyJEfUgOYR4Jvq1ogZhITIs74W3s/Lw5wHQSQja/GhCu1BBed3ivsXfLitAzS8sZf9N2M9hu4ZVtTvUfW7Vupv3DvzZntP6GrJIyDccgpyVlGFabjGPe0jKJAAGLB7cENDAQA+mL+Mj6QIZn5sEAqhEAnhv0MrRSdHzLypAwAjIwohOlJOdkU0wpiKfzi3pZoUroWY6eU8vVzmeZ5+8zd/8/u/+av58vzx93/79MPv4qefbv/4Xz7/9FPbvp5Pssjy8t3L029/W+rEp2c+vSALT2euC7I4RGubA9q2eeC
+r7fXL6ratut2/epuYRreOluAHrbXAuczlaK39Ue1X5D98vRsem771ffN2+atQVNoCm3D/ZYkt2cX0N7UF7KPPGOIUDjsG7UNdwAu7xcIBg+ecGLA2xj+U28QQQHMGAClyPk818JPz5ff/Pa7aapPz88v330UKWWaap0PZQB3Z7xvaES4OaCje3ZuG7wPHFppQNrOcQwZH0QlYgZhIR/g0UM6HjoyIwmTZ+IeExtgzsXpwju6DlFAsgPQtck3SZSAyCKllFJLKWUqEhG9zTkRCnWOq6vw+5e+8zpD1T96JNjF/O5j4B0cIgAic6kTiRzp+wHk95SksZwDvwIM/ifbfiA7cVDOhoxBgEIqpgwnZF46BVKgKFZFUOQt4KtGxP5pfZ2/SpXT82k6Fwa8ErYemXpzMVGtZaq1FhHhbGMztPIhYl1fdKx6+CwjX+U+k+6NaMLQRNk/xgMgK04iwk3D7MGIdh1HOFwH721CRnO0sGbazFRtu9m++rbFvkXbCJzBEKMAVwTCw4O7Y6WDg0t1S+RA7uDOoEKM0Cpr47WI8L+llQ6NHGMYJQISUAAGcmTkGQHAmXgqQojMJIJEOFWZ5zov8+lyOT+/zJen+Xypy5nL16ZtvV1RWxECLHWe6ulUpomXCy1PyEwyoRQkjpziEtAM3GNfb7frq7a23V7X189uFt7CFRBKFS6cWKkUIoqmqwds+2vbb0xsurvrUbaf45vBFcIDGoSNQvJAJspOR5wTYcEd3YAFvsnwOsDsHdwOsxTHcaWHLh9FaJ6k1rIs9XSap3lazsu8nFiklElKvauigCF1Dw+y4yV2VxJ79XfKaXY9tf7xbtATRBIgda0UFMAdQzk+fNr90A/vYZQG5Ncck+kGDxO9bPf+svdr07EAMQ+3FYFyeFlSo0k5vMEvb8/j/fzdby/ulS93VyvFFAduAiSWXgwSEdH5BojjYOODL579Do63y2A/Pvw+IByCBuPb26ZhADliADlk5hwZQAtws011beABlxAip+jezbdLREcu2uj89pbwHcgXDsgYj6vS/+33SMbDS4cyH6sQA2WkEXU/sD08fEZ0PDPA1NBKkRrNzE0PrASe7fOdIigzE+9VRMAYDAlVR7FuxoO7ixeEIIQQKMl287+D7T5cfPdoahFAoOhZQQqM5Dn2AAMYS6G0fKrGDFxPp5ffLqfT6fm3y/Pv6ulEcgaoEBIWoQYRzEIIZVrq+blMM0xPOJ0CcFXV7RUAgW+AbB5Nzdy32+31yydtTfdbu10jci6AIyHGhFgQfJnKPBESsiASztOFeSIsgAZYAJ0Cc6xK7Ltd12x+csxGBoAgch7lUoQAyMTTLJNC9mx/e8UDNLlTgeOMZcc5AMgs2sxOmqe5LqfTcj5P81znk9SJWUgEiRG7IN110cAE3UcEiKMLCgx6IO8AAB4GVENE3kDyi9lSi0VcBJHCI7MoE0h5H0dhB1+ee0/DnYneSxMCwLx7OTk+Os9yvF8ZAADiHlLM1KrhYQYYQM7YyPZmw1F4/No+cjF6UkY+elj3bFkTAdnbzN3XfW2qw32NowsIo/Qd7UOO81PufT5h1OhksEyEjNC7s9CzkXJ3x7HJ0JOnByuMIVSrLEt1d2EyN3KM3u0eMgVEvmk74e498Tp2M0+DcI9IdO7HOx/wGG28o6GOlXB4wcfzAobkjNrsQysl/fmIQtMq96xI6CNaIXlxtwjXXU3VVL1trlvYjq4URhgMTl0HOUFG1gKz2UP2EKVhHvtXCzdCwMKuLIheRKaeGYAD+/4prYSQaZ7mvu7NPUIB2BGpFGfmfngwUGCZxT1ua1tvjTjK8uHj7/+70+Xy4a/+h5ff/y2XWuYngCW8eDPbd/EQKYwyPb2cv/tdmU8qi/Kial9//MPnT7+Eh5lmofm2b2a2366vnz+ZNjANawjABMTIzOhngkWqvDyd56UGcpAA8rJ8KHJmmoiA2dmhAJEq7rt9vbbPn5MhhYjRUQ4AMYgAgav
IJMhUpklO1YBKeRsgiF5ZEh5ukVMWxqDErtNL745HmZc8L/OHj8/zMj09P7989312kppPl3uEJcZxzCb2qevM0iBmMEzd1SzuRjJlzgGyU3L0O4Mg7CWdLCzChCilSilIlAXSiOkGUri67amY0qgNxMQA6B7WC4yBIlPhcqwFYOQBHbzxG/lBKaVOpzrNJALEEabW24ikgu2TYyO0aXZ8t4w1BGSrZRhdGd2zLSSMUGxoNuWIUG2WD9w8nJjLVKkH+CoRl0JToT6ShriDvzhSxzI05wDOBLUKmGw7tswNcdW2A7B5i6gPqqHn2xJ6rcwIeprs5ezmVNhaQ4wcIYsQRWQOqkXoLbdk5tvWtnXbcADPGLTRwIcxmp/8Ch82tFICwiOwfs+pHRo9HijqroLj/rzj3amrxWNYdLipa4vwtu3amqva+tW3NayxbwhNACoBIRSEgkiIBTGT9IWCKQAyrYUAkYABgTAwxN0xIhzMPCYFt9tWhN+7cO87mcBwCSOgl0xiDwQiZcE+9JwiBGYidKK+nCy1Lpe6PJX5UuYnYkGqvTvFMTElO+yycJ24TkYVqIRDU1/Xzd2sNTdVs227mel+u91eP1trGI5hCN2sBbNpcRNwLMxTTa00BVKRiVAQGJARKZDGNJkIVW9tyPvR5zJzMKgPQ+mTQ0CEWOgd3R2DWIrhKmRZTsR97brnlO1HhYtwKVJrKVMttZZaM107CxEQszc+3mfG9cMbPb5k5hFmpmrjZwaZJnfg7V7J17WS90RsxhAfHDYFOTGSYcZ1sjFjxyYjtwBHbtVwprxDynyMY0TLqIrEXyW7O1sfI7PUzC0VeTa6N885121vrbXIVlBuXSvdcdS9m30uRES01lTV3du+qbYY2UosPIWziHnv5YwoQkF08M1vPLjHP4jQ+5/dndsEwPgmKnDv895fEoQiXIsYOzDGAJepsTu9+FYn9VXNFo8DsmT7TejI9GCHBh3wCIXGr/v9HTNKYZD/KZEwVrBDokRVMbLCHwINAEEIiQc7dA3PSaHuqZ7cNKyl74bh1IuaM1mpO2X5lqPbMByO6cjpwMDobVqIMm0y54PKCDv+Sa10GDIzggghdIRM3kRCoaD+DXO9nAUgSKan5+9/kDL99T/87e/+9q/n0/ny4UOZFwSwtuu+7us1XLM1VdNm6Pt2XV8/q7bNX9eQfd//+E//6Q//8l/DHcAx3Mz2fbXktm2ncEbISTNmdrsZMVFFx5hMT9tTmZGlTPMLyyRlYZ6QxNtuLdruTUMN1KAZbJbapFuOrClxQEMICLJgd2I4S9AE6sOzv6/RwW1nXPowS93Jx4gMwBFTKSyZPzNN0zzVWll66cDdMUklN/qQumkeRdOWDUv31jyiNd3GAR6pukdI5ajz7Km6ItnHkrUKIVm1YkZEZiFmSJTCkJvd31LNzUx7P09LnXfI9lCYj2Hrt1GjfpnZjz/98o//6b9M0/wvf/xUp8VMt7b28da2j55PCXy0NY2Ibd9aaxGQGApzNMBg6iFJoIiI0H1vezOz6/Xrut7cXc3cXWo5PV1KKSwstRJxLdNcT0Q8z9M8TdSnxlNW1YkwhZE1DCdwIQwmF7Zawqg3lszAVDgiATgCBWYjIeRK86m6BxIAhbtnEiEJ1UmQgABLEWQoRd40yowws33b1nXdVVtrZn67rdu2uUdrLQfJjQU+NHxnA4egHblWvcw843o4ku+7jiAEAB7R1ezohqOVGGSkGIEQvaeG9jCOq7q1cNd9t6STtGHGuwkAUDJBNP2qg5A8NiwHK3GyE5g9EaC3MY9AdmDODs3hdZr47RTP91oJAMLDVE0JIYQpmeD86ozRE808hwgiMiLh+ePH5x/+appPf/+//+//7r//35VpOT19nE9n03b99NN+e91fP4c1RI+wXTcIu12/Xj/9JGX62uLaYF3Xf/pf/uM//ad/hIAspHU31d3DauHTUphJilQRAPiyXV9fb0Bk6Ju2+XQ+v3xfFph
5Wk7fT8sTghAUAGx+2zfbN9v3aA2bwqaxttRJlA3XVcE9DGCHcEDcHTYlpiheTtAM7BvuJGmH6Bn9w3u/E7i9HoSZpyq1lmWuy2leTss0T3lsiO4TcrwLWb6ba2tu7m7Zp6013bbN3Le93bbN3Q+vJ2/icACwl0wAM2U/ilKkToUIa62lTsRUVUudkKiUyizRh6l6cgeq2lSbWsuxEH3w38Huj+//Pmr25lLVf/mXf/2P//F/IilYZiBRbev6qtpU97Zd0yNLNk81J/D49fV1XdeDqBaR+XQSKVLLvCzExIBEBBFt3XTdm7aff/7xy5fP5rbtu5pN0/T88aVOU1Y8I1Ip0zSdmPn56fL8/CTCl8tpOc2llg8vl+U0CcLMIBgIXhlJCKvAVMMMpOe4p68E6COzGoERAIS51oKAZZaylIiwJJwI6lyywf3EUqAPJnqzRE1vt9v1en293l6v19b0xx9//vTps5ldr9e2tzQt0OduEUI2Fu8hiLjTbo7ZiQmRiUqRo2wZsyVTEUQszGml5qlmrmYWY6eoZAIrpwr06E2WtblqhGcDwwgH3dGUwIkCsZdwEIFwr7AlPlrQC/WuBqVHfpER0d2RJSJQDKX3sUaCed1zKNOf00rwQNGnVwEjHb2nfwzvIolhJCylnM6naTkvp2VaZqkTMafPZKra0v/P/tBunlAo/XbQFm2Ptq37ettuN4SAwsHo7mp7uDkVBCYAAj9Cw+YKQXmQVFUTb0YAMKFAUJb7dJzcfYKjLXRidgTo/eN6IzlAB8ghuwRgfiTnv12dY4EeMFJ3awZh3COiNPyCdw2Socd6jzlIg6E8cJd3LZXN3NO9Uc1BANq0aYMHrJSblrYRESKoA3sC0vxcI9YIMjYiRWIig87/Jmecf/yAgdEj0w/Xt0kA+TXf/sgjtm3/+vpKUoI1Uivdvqq21tbt9upm2V4KcvCBuZm/vn693W4xXJhSajOXUupULYKFc4ISBOi+27artm3d1nU161rJPeo8ufcRb4BYpO2bMfcAYCmcbnzVclpqqQwEgRQEg5LNDoUcAEB9xEjfqWPLDqKfgIAQkIWlSngguEfkW+RaUQ+Fvme7oxshy3EPe2vrul6vV1V9fb3u25Z30hEQ0+FgwvDsUrrzfrhPPeJaSyaIZVQrU+8IMYTdhXuTBaARYR3h2QRKAADYGdPMAtdEKJHjXsKPksHRMgDuDtrxDe8/ofHbPscFqXdtzNENAEGc00z/HTNOAqJ3GTr4kmQ5H5tY9ByfjtZO5/P3P/wwny6Xy0WYMeL2+vXL56u1/fXTj/v16/XzL/u2mZlp020D1+vr16+ffpZSbkab4r5t0TZyRQRBLMjAUIgDaJ7KMlURdrd9W91D2+7mgKCq1Bpv+/X1laVqAyk/rbfmFmYRHt5utl+tbbuB0ezkO8yrVwDgrHRNGUrZAQqATFNBRiQaecTv1FLmmvmgPLI5f3IvgJnORZ1aYkIRvE+2CXdrTgDO2d49RtC9N9v2MG2piFprZtqa7vtu5tu+b/vm5q2pJjV2RP6SOxiCwkTZRie9MURqqntrRFSbJRNcp0lEMsMDIPZtv91WVV3Xfdt1b2p2d0khM7BGPDsbPGbYP77RVWb208+f/vE//1cuE89PVGb31vabu16/fv700x+0bbXUudbRx4XM/HpdX19fD6ZumlXmCYUz2osQqrvvDQAv0/zhu+8g/OlyXrebu+9t1GafTiLSTLdtNzdVX9fXCLjdXn/88Q/EdD4vyzydTsve/va77z4uVabLqVRBB8pWOKXK6QwRQehExChSEQVG4xvvJGQueCACCHLliCDgXl4pQNQDaPRQ7/ogQdlI3lV1b7pt++v1+uXr19ba1y9ftnU7TjVny4TRdK0zQuP459oLc6bqMgIwAyEBUx81aTlBFyIcO2IhInBzZiIM7yozc/eyWRBEZKJyQIAbugOEZK+pntlPTJCEGT5MW6ceo8hYyNF56dD53EcpU/SBAAC
BWJeduyj+aa0EEBAWQdEVJ2C2UBp5OalUk7zPdi/ny+WH3/x2OV8uT0/C4gHXL1+/vq7a9tvnH9v6ur1+3vfVTLW1bVvD2u3rly+//CSl7MF7yL7v3lYKJcACVJNuJgGEeaqnaWKh27rets3M2q7uBhjWVLntuF2/vkLwvjnieZo3Nd33PdwJg9HdbDdwXpxhh3mNCQAKSkLPwiU7GFViQGzadt0Bg5BH1e07kYKEMT7m4h4u3MBKHZoSQZYrM+Mx2SZMHQHQghwPNNIJa3cP02aqZtb23VRb033bzWzf923rWqkNrXS8Ho4gBQAzqREhqrKqIKLsu4gQUd1bqZWYZ21S+mQqRNi27Xa9qeq6bvuu+25q3hN8Rp+PUcPbJ4gxETF5bwf3qJX8x59++V//0z9JnefnVuZzhIXvEfbpp1/++T//l+12u5xPz09PwjLP8zJPZn59vX39co3eTj3UfX66cBSC7u9tbd9eXwnw4/nyw3ffMVMMnr+pmhsOJ+J6u/7y6fPe9s9fvl6vr6q6bdu6rYg4z3Wq5enpSQpDwNNp/lAriGBO5QskqXwiAHBCQ8oZYzCc1Vxr71rJnRyBQDATUxMYBGbypuPg0ukbONnZbndV2/e2bfv1ev385Uvb98+fP623WxoXyGmA/1/2/qRJliRJDwR5EVFVM3d/S0ZkVVYVUAN0zYahnhsuPf8ARCDqOeOHAmccBoQ5zFyGqIn6AOpGVeUSGRHvPXc3M1UV4WUOLKKm5u4vMqsKVchDarxwN7dFTReRT5g/Zv44JSJk5ijrj/JkBNzqmj3whZkR3Q2iYbGTg/bmNuRqRFjA3YSRwFplNBo7IYBja7QQqARRQg/gBEbg0JK240og9iERXkFYMXRN/W+CS5vSBF6zbQgAgQHJ3VtGxngpnF5mKr9VcXKFp/awpeIHf9HmJgC0+Lc7qKqqSCnrurhDKWstq0rtc0y2yY29A7I3qjVWICcE7nYfNJlA7GkMza/p1snVom7i4bXWUojWdbmAo4iUupoZIyQCMxWRaE0P1BTOe4obQmp0YpRkMCA7IiEnSsycjF4vdje+zfZwd4Y9UovbkPZue4eDBAhmcK1p31jznlqye6p7Uy2nZw+U3vEoshwCRGKyAoKakSoSoiKimjupggibV67bISKAVBFRCd54x5K1wHMvCNml/HXzvJ/mdUNonZfiXx7A1Q3chShFzYBtBmgfUJ3LvrIHFPp3oUmWeMs5HIZ8PEzM0VEPNlTqgU9EwiqSa1azUoqIUKj9AeSUogYGIsu7p3cEza/aVCkAXAwUDAjSwGSECK0lJ0CPVCP0HMGm7N3cGPQWftycGn8FS9t9b7PNvQdRgslrlxQBnIgiXd+MqFXr98mObcKHlEJLgO1NCDr9fA2qQhsn22xCswjNRQy3Cwq4gymYYU+hwBctb5qJAhAcKzqiq7b7SKpEho7BiCAStTyMHp2D1k6xBaqb0ODN9pat1MLfQVsAtlW9HXGAKoAzDmkYU86X8+Wv/7f/PQ3j8eHT4f47JHZgBzKVOp+krloKRkYr55wHJ0ycWws+IkAGt8M03N0doiTNtNJGkoms84KEpZYY0ASUGQERzbVWV3v+9OP8fMppvHx5ymlUkyrV3eKU3f0yn9d1rlIgQ37IgE4ZkB3JMCmSIRCDIWAynywh4Yef3X345n54LtP0A9ymeG0jqofMwXbTeKMo2lCIARdRLqnSjDgiShuS+Q6Y2vyIBndbfmOnjQDQEoXYoMNujfBdPDkoJ0QXN3NEEFaqjIilaHQrGJY18vyjBqnUOs+Lis2XpVYRUQDnvr4xITONAwdTnxMzIydOTObwArVzyr/4s7/4v/7f/sc0HPLDt2m6N6taL2Yy5OHT99+Z2jTd3d29S4lDzF5VUxpSGt0NXc1tnMb3H98/fHg3TOPh/o5TqnfzepwY6Z/98z//q7/8FznniKa5WxFRC30vdIRaZVkXMVvW5TJfVPUyL/NlNrNSRKq
M4/jtN39ymB4S87oIyrw8np9/+CLricxIxd0vpV5qpcQffvH+/md3KfHhMOac+/LgzQZGJGtBfYTOumKbzGFlMN2kJHToBmhkdlchTYk3p76lrwFAYjboXf+QKPUctJxTTk1+OzoLTNOYOCXmYUgbBY7YiTCIPESMwmsHMwMxCRMeTBEcoyt569rk0OSDoRkCCN4dL4Br+60Y6C0HAilnTakQUR4isEND1KNx4gEjUwfC+Sfd4nQvgOlNzYCWVBGletAvemfavLMtmFLOeZjn+fK3fwvEh+Pn6e49cz7eP0yHO3fTsphWlQoARAzMkDIQJk6tUjm4L+dxGI6HSVWkLCbqLeGUTKWsBghV1cQcgAAzEwComVk1kHMRBCLiS/7MlMxVrLp79NUBQEMwQDWBDPkuORlkheSIgEmBkDxsWUxACZiJ3n+YPn58QF7HcXhtgfef16D5Zjxut2pbo7pFp8qiUsHNiInikm7A1K+saOe5e8541yaLwcmE0PyXnl4QpSBhInnQVwDgZoCogEiCiIKISBJBlyGvibeEEqii61LUbF1KNIdzD1SC6CwSjcVz4sSYEm0SvthQ6XqFOKWf/8mf/su/+j+n8ZDuvqHx3rTU9aRayjIfDnfrvIzj4Xi4C/1pRASgxDnxYG7gFV2HcXh4d//h4/s8jYeHO0os01jHISP/4hd/8pf//C+GYYj+pmErSdSU9lhMRD7URVTM7DIvl8siVR4fT+fTBZGHYUopM1hZ1KBens6PX57q8gyipGJmj+f58XJJQ/IBecrDkA/TgTk3otodiSGIHvLWeieWcGh2GOI1P/fNaGWsX9zpOk6JRCHcCAuyEojQPAVQNe+NOadMhOMY8nA0DjmibNM4BriNQ24I0czoqG6DTle3PqVxtTTcN1OEOBHDrrgJANAbPsB17exdRM32lntrwYCYk0beyTgOKSdmNvWUmDMAZeToN8sOgMyo9EpU4U1Uas5aj7nFfMBgAMEdqF3pq8NsquKOSIUXpJxSHnLWlMDNpJoJtC5MTCnzMIJxSjm6TbiD9QQcuGbC7AAgclWg24Ax95to7y6vDQwc3dQaz9ObfzkCNolwc0UySu7kng3YANHZnNAczQgdHRMhESOnvi699uDaUcBuuPn+1W66Q4+wtShXBNYQowBdWxc5aAZX917MN6zqZ7uHuUjec0CP+jgAN9zUvfbH4/2hxRzoArroqGFCN4IcRFS15Y/EWREiEwJ2JXnCFsRpRe4t3vdyjQOATcCPokW1WGRBRd/OlyRdjPP2fExU6mFMAG/S8Nb6mil6rWVZF1OtwpTIzItUbbnp3SyJiH7LAjapVWoj8CONOex0V13LWrXOl3mZl7qsoIoiZjbPy3xZWNL5NE+nyzAMeciNeYBwMDVpJto6oLdUvrCVuppMd8Remko99gkdx3rsCiDuYh8K4dQBerPG22XC8Nh6vCDMrYj3x49w3agRYNB8/R7vtRZQa5nugUrgTuDswXMEi4TgBkwQswvBzbUFkjwabURXMeipIoiYWKPfVa2ackqJVT0lTqMZcou7ZQSAcH3MbkZ7bG9U5241jWHDJwKmWJIDbymaACRiMHfRWteliAOUeV7yY0qJ6oXqe2g47Yg+pIw58TSmhyOBx5x3BFnreV1UVKQ6RDkfIhIAWrAjEYRFRGxtncxb6Td56HFtUQlzK2E1gDmCRwqmgRuZsTkaDPOQxMkkr8biADWMbUMRJEfmI+e7gWE65uPdYRVKLwIEsdyEKUc7Mmmz3DfyZeM1VWut3dBllpbU2nmzvhI0si1qLyywlDBaRUBKmJ3cXTkZRyUlBq6ZRgGTozYrqXNQbcTA9SJJjB+pMW7bVFA1UXUDE2F0JKBEmTFCPImZGEPMnwiHxMRITJyaB7df6hqiMbrr+flx1WfVsi7PqvXx8VFE4vhUFQGCzzE1EQkznpEgkFeq1hXRVgIkWk+X+elEAL/61S+zORNJS/e2tayiQr2+hzjlISM
SMVJCBz+dzufTxR0QE2FUr2GitF7mH3/163J6Xp5/e/7tr2U9uxmImtmX8+XL5UKJzyrfPT6O4/izbz/e3R+JKFQuQw4shFrCUcqMKaRD2SMImxIRJTN+YSype1Wv6mpNWBWxN6wFCsSKbDEFEEIiZUKTjBwwRoicOA95ZOZpGoecEqfDYYyeEENOhMFhOzioiipC5EaauZtIBdWYH9DlYQOVKGylYE/6YTk0tkLVSqmRqlJEzV3UoqtYGPYxWwmImKZhiKqGh/tpSGk6Hu7fvw+NrfF4QCQ1NdNSRNThFrnf8uA6eLUcZerNMEN2FRGIHTAhtWlUa1lmM1NeKqWc8zHzxLFkEQAyU5oGZhoYpxxUl5qrWTSXLioi2iUfO6toLVQJtuWwhw/TSF8Au3YlacDg4t21dwc3FS0GZizqAuyYajqYk1oWpxp9ktwdFcwQHaeUeDhygjzxOA3D4q8TT5uFQE3pG/Gax7IZc7jRDJFuKSokRKg1uRmZezP92gp59eNadZsFyAUAAiE7pkTuTgqGO+/RQcHJzPDGz8ZW1bTLIIemv4LR+AWgmyTofckycwTg9j8iYtSXElGQSszIqZeWEbVE9heXh4AJBGyZL6dVRRoqXeaz7ex/QxSRUmqneFt2CyAShrKPaI0yLVyXeb6c0f3z508jECIu67rWaq06tzLzOE3MnIdhmg7EnAYeBg5Uen4+IdLd8WEaj+EzEJKKPH76cvr8Yzn9MP/4WcscWkLm/uV8/nK+INOK/rQswzTORe8f7hPTOOXEnHMeDzVsk5QTIQ6Zxhzlh9ibzmHCrqayn14OaqDqXTaRek1rq9zog8YQVYWMPCezcDi6uHGEFBLzkIdhGFIKt5SZaQh0bLaWAwSJ5H2AuVYxqW7qUlw1OH9wJ7fo0hl5TwjQ296EPesiuiyriFXVtYiaVfW1w5NEi+DoWEV0GIaceBzSh/vDOKTj/Z0oDMMw3R3NkYKFQK/SW3b8JCo1czKs3J10H1xdCEqRFRDzidCZwuYHJqdAB60A6EgOSMBmjAjOHOnu5gSGiJ6GaTIQkbIWwNXBvbkaPULlgGYAu4BCP0xC2Gl8tHqrKHtWBQeoVosVB4dBgRTcEzkxWLghhGhoBuZOhmAQ0nZEiZixicFcUe96gXoMCrqLe/3pu/gJXOnnljan3H0NRAsFh9ue2N3G3tAvUI+afYYO0aQjmrfGcPdWTmfhkWHgQoMowCZ50hNir98UMNpCd82ZaOyVd48RgFsxVzR0xe3KbRVPr7fQ6hOB8/Pp6bxUqfP8JFKenx5LWVWllPUyz0zUUmDNay1VBMCRDNCWZT09n9ydEqdxAEQt1dQZyYFiUKmjGoj6WiIbS4ooIXFKeViJGMmJ3d2fnp9Pz89I+O7hw93xYRwmxiFxlloul/Pp9FzPl2Wu0ag+wpBztaIO7rSInstQHdN5Xo2ZpiExY8ppHMcIFKacEHHMNGQiwjzmlDml4eFhnCaqSi8cFDMT6UHPsBZ74DN8oWgY0W40YOcfI0jnZo5dtzbUahtZ0eeLRX+eng0raiJqHlUB1VW1FJUKZlZL6Py4CbhT60cbRSqRMKVE5DtUmpeqqlV0rapmVa2ImUM00e5DCQlRzDPzWsXBhsSLunPKw3AUre7MHJUh87yq6ItJ9lrJhBASQXJKKWVwA0IAA8Qm/s4p5QNRMgJzAzNGPwwM0ekJjUlJFl0YEB3YkSClym4ppTTRMHJKEJmO4HfD3fQeai212uWyuKNBjbzj1rHVXYsAeEqZWnoixqJh1ILn0UyyVH2+rFVUxNfiZq4uFQqgD+9gZCfCY6LhQIagQI5sDiIuaqRIlcjRx5SHw5BHwCTiUs3s9QVqaQSdhg5HvSWStXEVgOFmhqoqUgNymEmZOZlZi6q00sQAgaA6AaA1/YmkJ3I3RwKMpE1SxUDhVt/p7mCI0Wwrwm/mjhgKhIAbJbk7iQa2G+pu5GbUDEdFEyIMKSUmJMyZokAh0TW
kGxI3N5DkJmVdL6fLvP7qv/71b77/VEp5Pj+VutZlXk6PJmJSy+WChL022GNqbgGsZV1LLcOYiTgaA9wd7969e885GWTlEQCKy6pSqjyd1/lyVrMS6bUQvC2UOi/rRVUenz4/PX1m5j/5+Z98fP/x/fsP//f/Ecaczs9fvvvNr3/89a+0XOT87FKqWRU199VkVXe0p0+zP1Uiyr8+U0qMMCanzpFGkhRxQuqoxHx3f384Ho539//iXx6/+fbdeWHRm0skovNlyfkyz+u8rLXWUptbBIhIjI5EBpGGjQhAUeTsaKJaVQy8ioR+i6iyMpLFIgrgqIYIURfgZuu6lmUx03VZaimmKusStlKgkre0Y8ewwkPkD3stLaK7B3CK6LKUMIvCRKpqVd3co3zSIRopACKGyCQTjpmY8O4wffjxy5Dzw/3d+w8PKfE4DcM4fHk+XeblBQq9GYNrtSSE5I1S9j4biSMKwEnBqomZEUJmhK2LJhq4mBRAdEwAaOimCUPHkpg4OZICIcCQEqZUS0nDAMQRyvZOdUKwnWbuTmTuPY8LEJoFgdapFDVdSl2K1OrLEkViIlCR3Q6IDgkQKFOi5v06BXml4maQWlspIk7ECYBMu17EzaXZc88I0HpyRiDVO+/Uoh99gYtkayLSSJkFjCQidO9x3xYw6XTqxtu2bBgKtiWMpUglj2K+pnyACE4EBhFBQI+yPtwOqpMbu7NpRPsWNOjYiABbfQxzt5V6Rgz3WgJCDMnYFxaTqWgtdZ2fv3z6/P13a1m/PD+WsoIbakVwULVSNqvXW1DoarKpiJqGTmNiRiT4Fh/u3kMiQDZkADAgMRSFtci81lrr5XKptbqBiLv5ZX5+Pj2KlMfHT49Pn1LidV7mby7rslz+5UmllLKeT8+Pj48uqy2rq1SzVcTABVwADFykCogDAqyASOADWwgJcXTnIMKUEHHINGTilN69X+/u7x/e+Tc/17t3VAXtNgxhZiJVat0VTG26Uj3BqLEn2/QDc0drxAciRnY4GTXJlzCMoIVLECCM81BJK1VUdV1rWYup1nVVqa5qUqJjiKu4e0vianpUrYA3RtCGSvPaUKloOG5emkWmwQ/1pIJu4AMkckS4W0oRG1JaSlHTnNPheDgcp/P5IlVe+COvUKnb5wZgsXxRAwFHAiQHNOiqFK2iDB2D/cAtL4lCgY1TePFm6tVVBjVjdyQe0hDFvgZgyMN0d//+g4rUYZCyupvKGraYqrsZURPlAQBmbkQOuLvFarOssszrUlQURMAcgCEkYVOiIXNKQNizVZXBnMS5ZK+UgAfMTHRMhylNQxpdYD6X+Vykvugn0JMJHamBUThH0Ya+ozp0YIrhZKaqRCjCHGkVYY04uQc3bpFbBQ3NetRks4l3ob+oBwwFFMDuc3czraHo5r+9YDXoCkwbTG3mTt9Zk8TFFoNr/H5z3FoVRTMUX28ppXEYq9hxOhwPByZay0qI4EaewJ2J0hagipKFnp/TeCWmPOYILUWj8/cffv7xmz+dpunh/cfD8QEcTBGhdVwIvnyel1JKtF8EQHVo/BwiMjniUsrz+TSM0+l8Pp3PcymeBj7ea8lmEGXDCcABGD0jRFWuYQQT1czQFXVBVwerVZvDJYYApUYhjjgt4glomlcrglXxZl1zCCmIcN9ayWEUb6UU4lBmBkhuht1ijTLXiKaYuaKH64cIolKFAEFUwtOJhEYVqcG7XS7LfFG1ZZ7LWtxU1iUkAaxWt55L2nnKztVQG+uADiHx4KK2iou6mlcFcxBHNXAAdTRoOk7ehyGGco0BIqxqlyrVgdeSlzWLCKESntdS5WUboZeoRAhMyIjiphqKqwmZ3ckxObEBVTP0GrG4ju0Jg5GhREhpOHAeiWgYc+IkKvO6iGpOqYogp+FwmO4eAGle13UtRnT38dvhcKdSy+VZ13Vd56fHT2VdzLVWNVWILFYiRExRZIzB2OhyuZznZVnl8csyrwLIjgkQE1HOiRJ
OU747DJwgo6I4GuKSoCIJjzNnsSnn+2lKiT8OH95P7xPn+aKfvpw+f1mWub4wlrAn0DX8QIcoFMRNWLEnKsXxAUitYU4DOBKnnFIUfDNzCkVtQuvOXCO/vflYLb/WqDWpc+wcUNeGal/ZPk5XhGr7w5bz5oZdxWnLt+g03S5RGXolOiImDkFNTBRtTroq8waRt5hNSNM4PdzfE6WP7z8sc5nXxcHmdcEIn2PIqjZIClMwGPBIE6SAGk5INI7T3f19TvnP/+LP/+W/+JfjNB6m6TBO7jbmQxkvp+H5+9/+Rqosy/rl8fFyuQzj4XB8YGYBEEdxdE6YsgM8Xy5rLWL+3Q/f37/7cDpdfLofPsCyLpUOqpJSHoehcaqMiMg5MbOqrpfnWhat63r+onWttSzrqqoGoL0FigMwp/uZjnd6WdNfPtcPMywr6C0JEJGsshapEuYMEaecHXA8HBzR1FKWjTsISjGKDtRd1BxgrRWZVDml5A5qSkxJpafAeSllXVZVmy/ny/lsqsuylrWYm9XVoxWPyJaGFAO23cwWh2k/vDfmNfMiFhGisBDMQR0dMHQPvU3LGInWjWEHACkquDLXxX1xT4nvqtwVPc+XudQXyQFf6egdRxOVVgRbcwdvLLRFU4So/cWm9hyq9Sl0DSJIkzilxL4FoiJH0B0QOQ1IBFXNqwOmPBKiqZCrEDk4UQoz0HtF++as9ZNtw1kkik6kllqLIjmm6JcXhQsUoRLiaOesoAhCWAEFuTopZc4jDpnSSMPAA3O6mJZFyip6O6Y21h87T9055giq+cZ7t18t3m8AUSLP5K6EqNpSfgyx09g9MAf70+zm0tUPa/znzlTZO2rbOzdzCfaDzXev3pxUYEoYvBET6qz+Lp1m+wfbDl4Y373iJGeNfmcGPgyDmkUDDNwQcB+86G5tSgMSAxFQAqRhOkyH+5zz8e7d3cP7aZqGlIac3dSHimpRYR+Dq5SyrCtQGt0Q2AG2WCYSuXtVUdVlXZalyRs5JxwnNPAshgLDyNPUq4YZCfOQOCXTCq6IIAh1SabigKF2IOahzmsA5kjklCtQPSyyFgtVr9sZ15jQPcfd5g5bDNQoe6FuP8YUg97KzsDR3dxDXTckg0kxWALoRUu11rXUCHKv66qqy7qWUt3MpIbLBqLNcYOtPGAbKBvd2ULeDmAGVS0CRA2nvEn9OIB11sFbq23c77Kakyq7c5VcajLjXDnXpYq+5G5faVEmhnHEaQJfVblY40vcnVXJoyYnfDoCUsQQY+tdGoLtMTXFCs6amBAt+okolrk+fvrM+XRcVlFFotP5cjrPZuZaoyTJ6urStK9CLoY5xVxQMSNHqNY6gqmZiUpIQU1j/viO78WRE+URiXjANBEyHDInJzSHEskZCAtBhehrgQh3+fDh/t0w5HfHh+N4QKQnW8tSy1LshXkZGMwIQM7uFsaCReYcXO9vDyKCm0fKWVj7QkTNrUBKKQAeOTGFJR9OjW/2kkdUt8mMeBMy2JIue4TPfROWtJZ3CztlQ9h+XpFuhyzdqmqDcQdG1JkmxK7L3z67RY1uYclBq5S1mNrd3f2330KRevfwUKVGxgB2smyD9+1UESlWNe9tRFPO4zgy82HMss6rihJVJDddzucyz8/PT6en0+n5dJ7Pl3me1wU4jaqZWAGAGNiRGSiFeriBF7FPj4/H734r4gJEw5SRD5jULKc85IEicZ1joQUkFHM1r1VMLcI9ZjYMo6iAmooBQKIBOSMx8qjGa/XPX06/+e7HT58fa60vYGmjK8NX4hSdu3GaJiQys1SlKcv0hP24PdQrAqkXvDXGhaLVOwJQwIy16lQtImspqlZqLbW6dX0Sc1eDDknbLb0OBNzozjY6wtRvJMCGpwAeskag7Tb2+HkfHtHhhiFkA5AMyBy1/7PbEfQSlQAgJ7w74N0RfKmSZjNXcHV3IxFATAAO5L5JUiHmDIiZWlSZwNFUxdWNlYkATMIVpvk8P5/OjvD
w/t0yn4jodDo/ny5hQEbeTyIgBKk11k5iTSkjkrvVKgAgVXAFAOgJhw5uQ0pDpoe7EZAppTSMSATsTg7okBVdXVyLaEghrIxCjDgkYsT348OffPj2cBiPx/v7w4M7oJ2W07KcVqk3YUsMD5eZ0DByPMxB43gcGy40YApUQDMRRPRo7kmEpJ7MkTBrSmaImCxT4iB0+vLUR3BvhqO90VODH+ultNZVrTtpuqsG2PIMur20P5dtvEFPKWgsZwOOCFKH43bFow5KV62b2ylXSpnPMxB//PDx/uFj1JDHgEnpypRv5lI7OPdw0jHyHpqDYObq4IxYLqcKgGpo7mrz5bIu6/Pp6dOPP37+9OmyzE/PT5dlceJJxJkVwCPXjDNwhrhArkutv/7tD2v1IU93D9/k4xEd0l3QSZSJY9hlYgBXC31YF/FlLejKrVsSRsNlKFK9GkCe7vN4j0juWA0vq/36t5+q0Xe/+X5Zyy1uQyen44wh52wOSRWAhqFGFN+86ZC1ZUcVALbmKK1wuf3NPZOH3AKRIPpxiMi6lnlZVbWspVZp3LY1beWWjbCBUgPLVmjS2gUjbMaaRwTMwxuA5iq4A1ljbLvmURMdaUPMiQmJgdCADUiBxLEaqIFfwy1fQSUk4ASJMbEzG0JUIUTXBHM3QG8hIG9Fg20qbOUTkY5ngIimZtSUg9xcTVcp5jaMuSwjMZd1ruvs3hpv9MwtNNVre2pqWkfeZmkzS3rxKsSaRsQ5JwyvccxIZOiGBtFPz83BVREUwBAFUBAZGTgRZk5jHsZhzCkzkVkoLVnwkfDyGjVnps/kyCTamJ3NStom6mayeEtYjwvjqGSoRoRqBoaICNZKkLZb6+28/QozVzNl2/rM3kbW9t6+r1fMtO9w6fUpXgFr9/5tjHWb/tW1aSyFWWu9mXomG0W0KrjbnfRAr8vxVuBKCOjmqpEG0UoaLRR/3F0MRE1NSqml1NIjWU3vwLaCnZ5v2LIOgcDNwNEcSinzvJjzAUL2EaNynbvVEYIFzfLEyOd18+DFGr8ZeYBbhQwRpzQAYm+eDKXIPK9reZ1dcr1yG7UcaUHxpdiO0xQjq8MQQCP+Sj1n7LrR5mMDEqB1oG/Yp+ba1Q+3ha3P6EZvX00l3w4QAJD6MkRbel5bobwzlBg5d+1rQ1+scwSN/YkTbcdJnbZv/+wVJMEbtlLG+zt6uCdWzsAqeF5tqWJGVUjVPBQKIFq3ASIQWZVKKO7mLthrRgRJayVKKjYvVdREpejqYEyaSIhZqrKHGyyqCluphGpZq5qie0oDJg//ziNHzwQdiNHBI/0+wtZhVSEGgeSAEK0OFFAV3VEFTQgc2IAAB+KHwzgM/O7ueHd3mKYBAOZ5EbH5si6zrEsQmtfrhhhybuQAwODuiJErBIjWmv1pq0zbDPVwuawtSkjspI6ESS0lRaSUjVNCBO6CktBo7wAXaLAcKGXuTenb3DfJ7zCYYGcq7Zo1XZNBr2mx3knvzmleTzLSWfeI2soFoZtVgNBa9bjvrw8gE+XESGRqbl6rXJZZVFLmccxMlHIac0bEnjTqVURVAACtKW2AGrhTojQkJBwR0gDoUKTUurqa1VVqNZOc8/F45JyN4F7qeLg7Hg6ccuwWHIdhQnA3LetSa3GnUnVeCmCWWnOSNla6m4uAQAzE4K4WcuOCSJwyATEAgYqqObQCPiQEzMN0uHsApFAEHMeR+c20m45JcYcR0IGJmnjb4Exk7sIh4aVE5OatD01vF0qEeRiHnDnxkMdhyCmnYZhSTqaqwuaGvDqQOahZ12SPDISW53ZdWnbHBVfKsVnMsGWIEGEPpTiEsGScBzpEkDzqAzpxYdEdq8elmSglQqSUKWViAs5OyYlf91y8vXAIw4AP9/zuHY+YjimJKD05XKoI1Qoi7IBq7EDMEJ3HBBVxRULzajvxTHA0ZTdS9bWYqqtVscXdXBewmZlyGlIa3GBd53UtZl6qiBr0KT02PR0CN3R197W
s6xrMAxMBEU3jGPIOoZLuYRa6Q/RTAq9KoOiOVAmF0AGjvoTzu+PxcBjePdw93B3GabjM9XSaS9Hzeblc6jJXkZdsNxNyVItFRMBQG/WD3WqEJjOpLfO2aZ6YRpMYFIpeI9zUtzAPmZNia3vVJz1sZFC3e/z6oyn+O1hPd9GelBhA4Z0yv5pL3dDpdFJfxzrb3Idmt7YQbKuPdmtJBRY5Dwju2mmv/QUKgQFAKmpuWpb5xx++n5d5GPLd3ZQST9NoxyMRWt+WZS2lgDuIgBqCoyu6T8fp/v1dzmkc8v2Y0eE0FytnV7MikXs4DMPx7n4wHe4O4kaceYgyK+dSwGEcD+OQVcUdVA2AStV5XhGT1KKhfucA0CYwOnigEoC6mbvWiogNlRAIGEVaUrSDAwFRHg/H+3dIITqgOecmR/2WRXmNP7Qrxh7zGNDYzJ1TOG3KnHoet0I3VIhoGMZhzMxpGKdhGFJOwzSlxKqKLKZKvDiiAbbWihp9IlqbnGZN2k1ux44kxBaLjaZVhJgyRXfpCPR0amwD2MYnREuoeM1aLnCcJSWOGkJKGfOATJiyU3bKr0UVXrLdUVqZGJVBGdyB2YmB3JE8ROTaLLn6D2bxikNoLxGEQgtGkU2LVqibi6mG86VS0dmIfWNxTU09rh/07svu25qCiITuN6RE5yg2dwBDD3AXS7hyd80HRojqcgQmSinlnEKqMbzRUmRdpdZoOGb2yoPr33TdOyFGyC0yPb3Vhmz08L6pUuOborAc1QCREFUNMGIorSliv1HNLb7+1+1s62bKrhNJN218c4v6TrZh15Me+3FAxA1byGSLH8ZzHpEO6H5W30nLSbiC3n4IbTkK4bNGick8z2ZC5CkRuIVLF7fczJdlKWtHJVMESGAIkAZCOEZEJZoZMgGBYUxT02AKiCgRGgGDA0VPEWIipoTNuk2qWpalICNGBWzzz7rD1xxs0CZ2bP0EYhhSL7FCV9xfzzYQo/QkEzGhqFJU8G/JqC+G0O6y9QUiEuDI3YFaZyd3dyJy2PIvfEOlK92926K6DFFDHmTnZ+/9+X739yNjf2B92rQR3nN/gvluvKMj9vhOKFJED1Pwm/Bdr3LaQhuNmG97g10Y+3Z7la/EmEcaJtLVJVUHHSacAETdOKUKKrCsEYU0czNFoEQtIzSk4kHd0dFbIx0Q1VVqVC4jGSGAa2tdaFiruUMp1aKvhlrnrdABVawWMTZuNdmYUgIfPWSe3Nx8LbXWStTkRLeb0RKJAAGQKZkbM5hH5JsQYTxOD+/v7+8P42FwJ6n+9Lj86lef57n8+run3346P1/qst4knmLv8+XdcYvR4811Indnajm3SC1ipq0l69Uji9oIcydzQBT16Da/jeFrAP5mOYPNAOpbT4x2sB7b2dBiR2/5/nf33SJbCEIjAoIW6LLUbsFjIhkitBQjjCUnRhljVJm+HEIIHC0trajIPD//9re/+vzlS2gzEcI0DNM0UkT0zdyslFKrgHt4cDnxYRpz4m/x22//7GfT3Xh3nD7cHRHAlnV9PpmbaLks61qrg3PiRDTmCYlUoQqYw/10nIYJEI/H6e5urLX+zX/937+z3xBS5kzA6GRqVsVbfX5rX4cAwMkpOqdjxO2Pd3fjNJgWWZ5MfGNziDhlQE739/ff/OwjMUduWkrpw/uH4zTOlyOnmwLv7vX0dRf6KkmODhwBdSRrgv+NqPMIKjaUpXEcx3FgTuM0RUevPAycWATVzEFjcDZ2ySD6+vUhEdQnXnuYd8utjT1qCnHEiRMjEiVmZoCW1ekt4gXmTg4eXQgpLPfgEcCijXDP/uDWauUaRbzyBq9syZeoxAzDSMNINTuxMGgeaURMBp4gCdTqBl5rOEoIwb5bL5sAw9Yrwd1dHdxdRIrMosJMAwZwBJFsqu4o4NBb/VyT5xtzoS5VTAkHBs6AEP3UPLqnKrhbLdXcmNm8lfj34I6hNcAnZERiAmPY3OTxMN4/3D+8OxKTO9X
qz8/Lb37z+Xwu3/1w/uHzfFllWeXWQ2lw723RaAsRQHThdHdXcmvlNdFOCVDNHKGZ4btTNAQ0BBBSpFaABj1NsYfFrmvPzdjuCHW1nrqUjt/e5v2dxx2yIXpgdBhK8RXuvv0CBLBWVILWKf5t7XPSnpWw/zpE5yhRtKpaluX04w+/+e0P34MZmAD4kNKYEyKqhYiARa0qtOJHnMbh/Yf30zRODxNlmo7j3f3h3bt7BF+enk4JRUFULusSRWER4ZiOh5S4FD1fiqqPw8h5ZOZvvv34s28+rOu6nC+nx2dwYBpaM1cxq9FIRjyIQDMEgOTAFgVWiIRMh+GAdKhlPstsKtAj8aGdwCkf744fP34gZqlFpeaU3j/cH6bh6XFKL5vCd7XKpm2B3qGeousjAJiRhy5ZyxUG47C+I/Y9DOMwDsxpGMZhyJw45SGAo1V+hMiUu3kP+YVIdMDE1Y1/sWHwMkRblR8TNhWnjkq4DSHqno6Tk5G7G5KhuQNFDVSDBQiVlatZFzP01pbftjcqTlqiCoUUHhIDJwADNjcEA+cMHq1wBcCh5RO2ocrt1IJ7iAhWm2T7UHRLgul2zXV23Uyq7iZulgZ0Fm47Uge0JoyBGtjcV/U4HQgPpN0J7Her21oADmjmJubu6yqXS7nMZV7qWqVU1a95cLHz8IIghlRoSYEbAKE7kFP4UtQjlFFoiz1ksN2QHhqPHDnwbv+2JQ2g6UG3z1wv0B6V+lDZdrxbCm8f4XU33oFqI7wxvAgAQAfrD1rihnc9G9raKLzBmnSLMC4S5SEPwwiuHt1PE3EK3yq4OMKWE9CUtNIwpJw5ZWJ2R3UQ9SqK4KLRR31TTYNoFuLuuJIIi5iKmjmnnCKLl7d4OhFRGw7tMPs5bG7cdgIAEVuIowo9KbfKzMrhrmVAAHWRcJLMTBFhC3aZiSmb6VuXqEOSXy97T1IOP4hgLxyH5NSUHGgLAe5OqqfiY7dN3vrXlhW/ClxsuLBDKLxG9Bolcn118866D+h93kN3/zdSGfp61/kX6BzL7hrAm+PnjcyAqNQgzpxGRvMxERiqIVYTlVqB2KWCCpRCbojojAhIiYfEI4R0XiSbaEUTBOdE3pLTmBCJEmJCJG+HhmqiVxMCoMdEwB1C/o7cpLcDbbEsRgY1KKvVWoVV1ELbOHLSsI/B8PwdQMAqsJlpVTOjoV5WG4qZm6iq2m9++/S//fWPp9P6eJHHi6zV1nrjorRhwdRGVGfYYAevhG4WhbehJgik5u5qzhr137Al7Hdvy6Me5ea7+iCJH2+LYu6+f8OkK8f9YiLsnm+Hfx1ybXTFoKFW2rvPomzDjba3UiuAuD0oV9Uq1Zsngofj4S/+2V++//iNm7oWcGcEjjHbGNKGMggQhR4pp8PxkFK6e/9xNTwtVcXWZQX35+fLc9VVXAAhJVV5Pp2fTk/uripuntIwjkfmlIfx7nDMQ84pBa9JgJnZWt2OgqmKVhZoAUfcdB9aOiAAuaNbxjQejtNhKHOS9YKInFIekqk+nk7rlyeTusyn0+OPSCS1qEhihrqWaTg/P4YZeL1AQb9GMWxz4giC8mjzuflHiL0QhBydMdgyIiaaxmkaR2YOWylyw3tJFiMBUgLKSIaUQv7uaqI10qzdxj6IOlMLeC3FJupIA5u7eUWmK8I4ROcyv75siNCTh6D1rdsEbB0gmGR9E7VfoRJGRStRIsoExjkhOKgjVK9qLA7oUkEqIkHI3EEkd1JmngAwcgvRTcEMDIEwEWmHeSQkRkyBqZs9ZHtU2k7PHUwhvMKIozX+EJ0QgGO9E1FQE3MMqWMmRsbNDwQEJAMwJAE397WaiIyrrlWLuIiutYjo5y+X7377/HxazhUuFcS81Jelg9FHIlycFre4UtIxtBwtPLiWzIUUKk5NZIQMUJuH25vTeuRe9VV6s/Wua82NQdPXresC349gZyzd3u0OR9DB7/bdMS7bQLPr+gZdy76ttg2VCNwp+uvuvyaYBVU
NWwAQhnH69tufv/vw0U0CldAM1RBgy3EOdhcgFCSJiNKQiXm6m8RgLipFlssM7stlWcSKuSACswFelvXp+SS1Xs7nKvXu+PDx47fjMLr7NI3DMKQo7DZDByZGMIgead5agEIjXwGAvPUqvWrokZkj5HE8HI+EMJ8nM805TWN2tyKK8KhqdV0u5yciipZZKXECtTrOl0skPWzDB0JD13e8Up97COadYm5vDveo1UJj84KYcx5yHqI/R0oZcZsXUUPtPUWGWyM25AintInlVxap+RD9mcZKhzREl9HqBZjQFt+2VDnsCiHDNOq2tW9cd5xNg6TNQWpsmb1mAOANhVxHMzAL6TWKuR/ZPxwaawCami1oCqytgw2AIaqDQLhULfe4JbUREGDq6s9xot6B169uxdb1HFtFOrWMUIxkiX49wZuP7eRNdgMQryeqBgAMzbONYzDzKrYWUdHLpdRSh5wvlzINq0acUNU2NxmRGbcmOPut27bd2NhuSX8QnHBrKgXo7hSxSUBiw87iROC9mcHWb7K3SFnD5R2l1A5kb9tsmBsrYbfNb+9o/4H7GQA3f/jud9gNPbeOHKzb45stjxBZu5su6m5XPejl0BahlHicRhJ2S6Yc3Y2il8b2UW+9altPN0RMiZFoyEOEzBoQghNnHsZEOgw2CohKyplTcnfixO6tFyuiu4lUJERyVFAVxEjKRwd3i6FhFi0zgnFotZauPTIeThKgi4iaiWoVrSKmYrKaaSnFmqZaKctM1PKVotXD1TO8ve5++6A935eM6x3Z3OBbF+vFE3Hfu9PZR3D40H77FXCzWO0ebO/CLY4CYc84IjgZekPMzk31I9i+92ata6u19+rQ/VmF77iRNb+HB6eKpXAtrJYBByRJbEhmDpRC2RMzkyqKQJnADERMSnQln02tS6m5m4uImSFAwgEZiVpGPwK42ubtkgMHiQJIDH34IwIyYx6QEBvoI4B7a/VJQERAPIwJaFC1UkXFYhkiojQM4ciZmSGI2tNpebysZZUvP54u5+XpqdwfpuWypAGHiQBdtIYiSUbGlKr603JjK8WiREytGc31BlxvcxcLcm2SNc7cEFONQoBd1B0g8oDdXXpWci9x20wa3EHfNhr95rnu3G9m5uaqNW2B3TPbkW4j5GaAeqO1GuQ2o6mdOexYirhtFu71/voAcKI8MCCNDsg2QBqOkzUbqoI7OXCT4CEMgpsZmAExZW7SQq7NjEYHc+REzAAw3A1pvBO1Olzosg6n6dOXT0tZa60AWGudpkMaMycWldP5idc0TeOog9SKDMfjZGYmYqZMaF5VXdVV1Tzc+BpWlLsiIKWEzIfD8e7+kMd8WZan0/lyPpV1Xk5PKjLPl3W5uMP58TOaEnHOQ0qJLJscQDO86r7cb01/3OqUri9s1qx397zfYej2DPXcaLBWrwtmAOhqFr279NreuU39KwXZEeS6GPUVNeQoGNCh6X8hhZyTEfVapJgGO+/tZif9XDpOefcArVEe1nlgMjR8LWEGb9lKoIqiaE4QQmkkyG4QSrdujARkipqAyM1AKhQ0My8uFqor1lBJ1dyAkJgzUyQ6cgCLu4ADXOPNV1vQe+/iCJZx6pw9bZPOAXr2A1DK5MAADsXdTCX6FCESpTwAubkrmKgtq5wvdV3q58f59DQj4pfHc044Hhg5I4GaxO1mQkIGNKaXiaeIXYAxmg75big1AyfykzFqu50QFdzdCLDlPXo0qtPof+YO6oqNXAqO28I63t323czvQHE1z2K9vI6uZm9tVujOGnpjpzto2miqZhbtV1EA2PJwKWiYF6ndAC1zAgEp5RC7oczZIztJ1c0ZIMXNjfQjRMg5esByTsQIbl5XNxWRUlYzQyCgRIjEAAOy2cFJMZn7OB3GcUKkOgoSpzxEb191XdYlKSM5EagKEeYhu5lgr7wEVQ2RfAm0EiluZlpNBQApZWR2t3Vdq0ipMpdyWdZ1nk9Pz1KLSpFaEWBdZkIgSsf
jkWAyRLctVePVdmWUtju5/d3pyW1i93t2pVz7zd8jzLYidjC6sZm2vV4Zk21h6wC1+V2GnfoC2IqyPeIue/p6z1zvR9gVnrwt3Ai+jcmNpbg5vpvtBpUcQBXWFdYFdEFdyUN8YquVcUCARMEVASKaQw3hFwt2LHIUIkbjAG7qhEAUltHWerw7kxYhxNuZ0OE43IYIvkXCAexvngCQm6mLRMGhA4SSXPRnRVGqFZGqgxhUtXlel8uyrlLXWqtqNRM3dXTMnJlxGsbjOIKhejJIiMYtAaAPH+wLBUJ0Mm3H070e2L3TDCgGHGG3VSMPNSiLcI0s6h1v5M96reFuFDbku6ka2o1Th65IgbC3jLEZzL1HUDOddtjkN7t6gbDe/MProGt+qzkCafPgbg7JrZjOgNQ4MyQEQyQzlSoW7TGqggMjMzAQYh4gpRC95sQETqAhthaNSxkhN00rBAQUADczcVdmzJmJMvikmnsI21TqMs/EBABEaKphuQc4BuiAmAOqalmrxfHV6t5QCRFRMnEiwsvlPJ4P83zRiPcB5pwJAXI6TCMhHg7H6XBk5uPhbpymnPL9/f00HqbTM90sbMEg9vpGAGhlDJ3JuIpPuHsTvd0uclSAA7iKCqmzi2jLJSFEhFq1VhWRWnUzmlp/Qd0ijrafbte7j71MF9FjmDckQgbvUmotBt1tpf67D6696bRxCp3Y76ZfYImZhbLvK9y+tZUcygrPj5ANdSVdEyKkg6XREZ3YQmQiZWgLNgIA1uqlihmsq5QVVSEvVFYyhYVcKiA49UYOcfAbfdMmc8Aq7E4To6MJAoI69UpdAAB0J3cAJ6joYmZai6m4oQEYUdRegXs1EDUAXEXXalX0y6f589NSq56f12Wu67FKUS1GRz4Ox5zTx7vzzz+8uwylGlbFueiQXvQ4QSJqTam6Vtbeqd6eAG8GkXuE5OKBuwObh4JfMjcnd9g8ON9kSjZJ7W5st6KrDQXMe1Fze9eVDXCEnj53PSjAJvONQL4fPH3NbbaV71DNrz9uCatYRjcRst1mIqe6/oDMkZmIzggDALvWcllrtcvz5enLydQSJqaESDSO0UTlcJzykDLTccqZyQFixc4MhzERcQzrSoIgUmezMg50fz+B+7uHIwDUWpd1NdNlLc/nJwB89+5B9AHcl2UNdqjUVWs198jdF5F1WQOVtHZ7WwUQiTNyWtfj4e6uikgty7yoKBIdDgfwaRryYRqY+Xg4Ho5H5nQ83k3TgYjH4ZBSntcl53xzgQDUXDrSuDfxhZ2VsbMjzNw9lJABIGjfEE5XAyZyw5qsxWgRylou8yIil0tZllpKLdF4VFVEQoGgAdPV6L4uSLHikBkRbfEOBORNqqipCGAT0Yeeu7BNj93CGZhERC3FJYwvMzVFREdggCBzb6fYG7wS1AKlgK6oKyIRJEKOonwABww1wkgii6bQFOZ5Oz9WMGU3UAKuEDocLVP41rzrF6TNge3kmoEYtlin17Z7GPQ1upkrRddqDYVthNYAQ6M2GkUFCQDKKmuRKrYu67oUqVarqFybZqNTojykPOZhGgZXYAFEUAN+EZBvXFi35mAXZu0W6vWdrVYDe33uNgaa7WkYEWEHhF4gTs1Wwg2oO9L0j780c9qAcrfYWbOae3feOIa4+jdqBh2Ybqyvq/PQETZesCuO9TeSqcELTHIH96q2ELA3n5zD3XUTratWXebz6elRxZhSooREXCYaBk7sLoNkzWlgJ+dtWSaEaFPtDuZgiKF/7a7EIUXQ+rItC5S6mpmqLMsKAOM4jOME3joshq0UbXVrFVWTKqWsGo+kupmbePPgFDkj0bLMwzyrVG3C+8gpI/h0ONzfHVPi4+F4PN4x8/F4P04HIko8MKdhHOgFCbBLs/Z2yXeoFE9Gu5AelbauR2xoiIRgKoaoTiCssMscqaJSNRqoiNjWCfLq2QG0Ojhs97QbOE3SETyk4QFgM4sAwKOFBoXx1DMGEFszlqtV/2I
8XMdeH1mbB2duaK+tbXiFSgjIjoPj6HRv9BFRDaq5gJt5BVdyBE4R3E8DISGrsZo78ABpdFXknPJKqsAJawF3As3gob6UEDrFtVuI44ohQhP2wZZFamGt76r+EIzCqnciYDMzJ1BVR0d2R0AjSuBOnCglAEwuAyqyHY54b1nVx9FE/Ntv7t9//Pjw/v7+/f3dw/txyA/vl5/97HleyrzasjqvNefTy+gVUivVCA+urTh716o5ddsdaZrc7gTu4bOGYxe3KjjmbljFfcNr9pJDS+1vvl+7ZrfpTe5u1PA97nqLo4J7yx0CcrNQBoKOkQawOXfw8kT7yWxc03VViWjvPgq5m3Ot20aElNEwSm0ZNJE7uqzz45cfy1qbAg8i5YFyzkP+8PH98Xg4TEOG9zAO3rRfYF3Ol9MTEkYBQBX5zQ8/fvryuKzrjz/+cDqd+2yGUuuyLKoq6kUcEc/ncxiS6+Vc1llVy3IJ9JFoBqkq0iSHmACJmAbGEQlTnjgPwzjd3x2P0wQw0N0E7oyQGQhgGofDNDLzOI7jMBLxOE05j4jIlIg4ShFuLpBbzybvqLTNzVDKd3eP5IWofnCMDrcIZBrVXm4mmpjITVrLQgIALKVcLhdVmS+XdZmr1FJWETHr3ZE3Mmezsrdx7W3FM7OeIxKmD4aRhgjgFPYOUEANbdQltEF/c7J7j2/n93WwgUbfv9hesd2YjA/GR2M3HgFNURCUXNFmhwKRpZUgDTwdOeREwjWuFWp1M1zmVFZWwfmCtaAZamGLTqHGAJH/0OYSGLh7dHoADHmlULxBRBSDom4OKipV0Z1cCYzABpCEaqaOK6iooyupIwFw1HYSJ04IAKyUNam/g4mGAojMiZA/frj7xV/82ccPd+/f3X/85pthSD+f8XTWZVlPZzlf6nRZD7/+gtfqWmhkN/FNT+bmWwHA7SII7aVm//R2gegAXfAh3o4eZaHgPbEyHLpt2DhcmaZAka4t19/QldKuY84ctKHcBlTt2KjLoURS0dXXd+h5OtAXjigst81PbABFSOwO3kR4dkMo1A6d2pgEI0V0Tq4jGpGtl6fvfvU3l9COXFYHQE5IaTqMf/Znv/jw4f3D/d0A1e7vRKSUYlteC3gVFdWq+sPnL4+n01rKp8+fz+ezmbVaaoeQcMA0UJoQaS3l+fnkbut8qetipmWZVepmDQK02FNmHjIT0XEaD4eRicfD3TAc8jA+vP8wHe9z4rvDlFIaEk9DYkImzkwt5yDiy6HB1shgyjn3ZKi2NQJLapMsBHBtfvtmNbkrdLsuhgN2KbFIoUi1qU0kTtS7OwCEdNSsqqfT8+n0JCLLMtdagspXFWgsgcMOQbZkgy0TpYk2X0tD/Go09UcIiE2Jer+fG+jp0pBXULqBQsLXkPQGKpmDKIqiGItlREclFyMUB2FyA2BFJ0Aj9eQeQlMGCBAhX0DgBMzg0SIDERGYGhgB95j6ZtU1ssNQEcExeSQfEYXDEaJz6q6NGIvu7mRIMVfNOZr3KZBG+TsgRpFMqIhh40GQEydHwiEPnHicRs6ZOCNnwASYiHPKOaunjJycuJWnXadcqPxpdM5qUxV24BDI0rmgPtO73RpDTr0rzDceB5ordA2pQOf4r997E+26Ik1/4lr92zgmM1DfLvD2BuhkRaBkPy53aAVT0O9KA9i2ivt2GM0OjJy/lwU5kdRahZgUmmY2ACFZSHyYqtSyLPM8Xy7n+XyZHQCJgbjW6d3D3ZA5EazrMgxJal2WJbJkRcTcq4ioVpHT6el8vpRSLpfzPF9MNVp6AASuAg+QIIXgrKK2ONq6mmktawTOtqkRepvOCMgYYiwpMfMw5HHMUbdCiMw8DMOQ85D4MA7EyEiMCBj13rgt/R3xrqT2/gqJVJXaIxvdD9j5coFKYcd5Y542VEIEDKFXRFQSImrLG3otdV0XVS1lrbUEl9TTBNS2Ws1YezoPEUeLGDesQVAcbbTzMdy+GW5QqZMuCJ2s6LJ
z8R4D641uwdww4iRo2P5/o7nZS1Ry97/5zY//8f/zvxzHQbWYVABPyYgNwZgLohBBHqI4DtPQ4+ZoHjr95mYolUTIDWsBlSa35i3a2FMhmy/Splc4vdj64m2hx0BJdwBrAsmtwycCJFQGN7eqoq7ieDGsgATeO9O1xsQapb/uS5EiioDR+/AwDb/89Hw4jIdpfHg4JubHx+dPn77Uquuqa9F5rT88nvZX7fPT/P/+//3yv/76sQ+DDTSuv6+X+frBq0sNbapfIQk6BsHG4/h1J91G2Xa2keA7kNrhyPYdG0jtnus2m18f+/4zu33DZhl1PLo5tUhPBPjVD+e9BNVa5H/9L38TPctaMBgJmRFJxUoxVfvuN99///lzWctaapEKAIAKhAr62x++f76cDtP4+fHzNI16DZyF9ChoFz85z/O8FlU5X+ZSikfFSVsBEACoKq8FgpVCBPeoBQlQMLu2jnSMZB8M34oQVWVeFyLKz+eUBuI0Tp+i/HUah6isy6FhduV7W9gcehgofv744w/Pz8/7+/Tph+/+1//l/zsM0zZArsvY9WZ4x7S2KHSbrn1FK32DncoEgEe5T61mtq5rwJNIrbW4u5n41o9jt+L1ffYj7ozExu7C7hxp/wQ2l2a/n45dfWdXG6ntBLEBOBEhUa316enxBTC9tJ+GnA5jjrvoHT8aDbZxKFeHcDubPpfaT7w+buP7LUNtG+ybUXFziXav7zio3XFvoXjf3KbdTAbogL2d84bL8Txha8GIPWE/UryhEYLuDkVkX+qVGA9j7lXgLzH+1Wn97mf9xbNf2eXvt0N/+eir+/bbP76y+au3XreWnylqVa4GEyJOYx6ichXA4TpAN1yMnjQ989n764CITNy1D3l/7zYA34aBNXHOrcPlixFyzanZnc4NBr9xSrifSS8eXf2Q/s7d5Nv/vt1UdV1XtWsubjR9u7p1uzN7uflXnt8O9w1W77oAbfbX9fp87WZe9/n6ZPDFG95+6atXAa+/8ObJHjv2iBH+5GH9cfvj9sftj9sftz9uf9z+uP1x++P2x+2P2x+3P9DtpRt4PB4fHh6iA8x/lwO6bp0n6OTcPuK4Z/7gay79P3wzs+fn58vlsj0zDMPDw8MwDP8I3/YV+ub1+9z3v19FeXAjHHah33+sS3S5XJ6fn23XXOiNhF94gwF5vfn1XK6HuyXCXLebcPb1dBuLdKVR3uBQ9hGEl4fUqhX2YaZeTLZ/1y1XtV38HRV1841mLnKj9oK4VX++Pog3n/h7bfjyj9+9W/zKsbzx/H+zzd1FX6rj38TgiOhf/+t//W/+zb95//49fJ0U/Efd4gpYS3FzFSm1mFlOKQ8Zox2dGSLQxlQjtUJZgE68N571H3g1Hx8f//2///f/6T/9p23W/fN//s//5//n//xXf/VXP/m5nwwowC3BeRN22X2+x7pirG+vWYvLuLbkdNuThQ7AxJyaABhzQoQQLUKISoWv8pg/vd0Qu/0wRfU//b/+03/4D//h6empHy5MI49DS+FBuqbGI17Z5NjZdcZ34rPWqmrYpSm7TgSqm5g6ABIBI4YwGSJiC6cSUc6ZiFS01mJurm56o90Tl253StcMmggtpeiARDjmNAzZ3Zd1LbV6dFVz6N/C7q04zbT1jBpHnsbUI37YrjbA6VJ++ZvH8+XaqHIc8nEadhcGdqvItWzgxYK7nceLSXkNOL1OX9z22oMJnal/+fHboNs1VLBFzwChx9z+jktN//5rJPc29CRqP/z4/OXpsv/ES1T6V//qX/27f/fvfvGLX/x0tOIfadtA2cykVDMrZb3MF1Udx/FwmAjRTF0FEVPO3LLMW5+cAKJ9JO4fiEq//vWv/8t/+S//+T//5w2V/vQXf/pv/+2//Z/+p//HFTbg9Wx1355DeMsG2uIhWzKlvWiH2YCpj3CAFtlsGbpmta5Sq5quyxJdhSOalVIahoGifUsakDD6rCK2eDLsR/DvfYFeo5KD11rd/D/
+x/+4QyUcBzoeEyHlnK4y6gANa/A6P9y910AhIKjasmKtlZASMgEy4oCEgFWlKDoAJsbESJg69g458onSNE3MXGuNNEIT1ao7wxICxK/n0TN1Q0sLEYbEY07MdHcY7w6TuT2fz5d5NveirubMaRwPzMndTSN+VGtdAOD+fni4H5CwNzaJFET64dP5x8/nPSrlxPfHkbuYdwsGbzZmA8prwH0/gl5abts7tkym3ZOb0Yoto2q/RkD/2o5BcVvoaikihoAkAkCPQALtMwEAEPb1kS+jdf039oPvqOTuXVN8XWWey+PzZX9et52XoolNSlFP+E8KSbchXVUFM1XgSBEDB1OT6ogmEqoUKaVmE6Qc4juhH95SGABwa5H3991i+d0/Q0iJU84Zt4N+c2LvMyDhJ4DJe/nHfhnHzZTqa1tHJQBWUrv2XQDdDZSeFRcTI21dJVIKnWxiauPuTdPnJ7evfaCVO+zf2TRmru/2q0BeZJu8XvcDgHuuBlCKRkKh5N2Vtr2LVsaEidPkqOwgZCIm0u7IYavBaknJ7oBIHErqkUaIcUGiNRkTYk6cExNhzinnZO5DzhI5iKAO1vobhd3Z7pK6MwLkxNGUkPbQ/1Y5Bb4wZF6YSG3yXwFju3Lh2b6BSv2TcGM6bZDU82DoBpU2ELuxj/qqEcZj6PZBtyWx4/huKPxu766vQPHuEHzrY8HgZqD07SvtPXe7+yfaXpobplJUalkuy/OXKgXM3dXda5Vaa0r557/4xceffRNq4WHp49VWwjf3+nc+qH6zXxzqbrnw3Zf4/pM3B/CGMdVHnVP3z3bwhxusXT24ljSGiIiOGNVUUusyX5Z5jrN2wHEYCJwTI0THF2fn/aoJHZb+jmvOTa5dmHIvs8valGsrq7ub6ZbZSURIrellLPndpeuH5D4kSpyZaEyZiENUEMzJ3V0BnJBjAR8S55SIaEg5mn0OiROxIYBqdC5xFwfYurKlNDCzmZVSoposui4PQz4epqj+TYSEeHec7o6Tu1PiYZpE5ek0QylMnBiZAcM7BhBBqQjod8fxOI6BmAjo7mLaeh69upDtxu7wIu7LlkFMe1jCbk8DXPN2b3fWMeYKTNTTGTfbtKVdbp/YXLN+b7fRTt0JbSqvAN2GgqYl8PoI/PbPF2ZGe6L769hsLER/C5R+EpX+O27eO1lqXctyqWWVWmpZzWwtdV3rMIz3Dw8P794lvM5xuF7hf7INv/K48/Evt1gyELfENuySyft3+GtYa7rdG0x6r5OqZV3XBQDMW8HAOCSAZMxu6tDSWjuYXhe6F8Pp9zzRbZl3fAuWwkRto7on8fUyFsMmjBCe1JaZuFkCzMQAiXkYMhOZqLr2Ur2QbvFApcSUmYkoMTFRIg4BZgIEM48OFNCqNKJhzzBwzoOZuSuAIWFOTEzjmI/HKSVuJQEE4zSO4xgWL6dUal2KiOpmKzFTHhgRmZ3JEX0c8pDz5t7EOcbVf+sSNwjptkxDBOprx4ZTeyP4Sqm8tfw1u+iKSogbGdT3eeMW7taoF8RTx9aQTtz53Li959VCi1dzCLa12m+Gje8xtePgm2PtDxWVzAKG1vkyn57LuojUWlY3q2JVDQFUqqka9X6+AHEZvP38RwSnrxka+ObDN95ya2Hd2uUIL/TjYIOSjciHEAESqVLXZVnmS0jOOiAB1GEAd+akagDYm1a93QXsxVe9CVV/pyu5uSHbGKfeCzpGeG9oAleIbR+EcDlTL+yQUlcVA2emnNgBhiEPQyaiHLVp0YEIkQgZKRElpsTsqeujIeQUvZFxGHLOWVVF2F2ZOQ+ZmYYhpUQpEVzp8EA0JCY2Tu4550GUiFJO4TYyIyFCK3/CMGk87AskMyMkRyd8OfU6kdwcIoieqU28f+fBbZ/rd2jzgfY3aFtkNrToELO5XY0/6vu8eoUb8l3NsgCfq8l2RaV2u+jGf9ttfWy9GGX93d6aMbe1tS+9W9O2m+0PBZWu9VXoAKBS59PTfDk
//vjDd7/86/VyUa1aq7sDZeAk02E9n2VdwM31ADdLSJz8PxYoNZQH+Ao0/Z772AYX9jt6S5FvaHEd1DtZdvday7rMyzx/+fzp8cuXIG0Rqd4dGWEYBjdgzokTc7bsRO5dhbg3mYPdqH4xzvfLMewP7MV1eH1mhNA7RmCYP8MwMneFXPcoh/SdvEHsmZGO0zSMOad0fzzklObL/OQiFYCAmADhcHc8HA/RYoKAmn1BlIjGnBKzST6MQ2ZyMEcDhHEY8jCEp5ZSVhUiywlTSoe7Q0opJR5zJsIoZXUAczUwREwpccpJVNRzyiHgQ4hIEAR5YhJKAM7Uen4yc07JzMBcHBMlvKU3EaH1ctswaCt76tOeaXcFXwy1PULFnboi09UKRgwKETYoarGGDknbmrBzozfw2buWHZWu9tSNT7BxhPtz3D25GY9BoF5tbSAIAdvX5vYfBCrdGDvNEtBa1rLM63y+PD/O57OpWBUAp2GiPDGRSFURYm4qVgAAUZ/s0H5d79M/1fZ384puLRV88cItWuyecHf3ECmrtSzLMl8uEahApMRUS0GELKOKIpD5VpP5O49kR/T0isEX5/b6bF8+2dWTYwwz0ZBTSklUPGRRvSlzuoN1sX0EIISceMh5GPI0jTklU0lMppgSBQ81DnkaB0JCi/nYviZahTFRYsopIbhjqFnAMORxHMLMSSmp4lCSt+5JQx4yRUsVaHK0AHG1HBGIEYABcBiGuETEzeeiiK90W4mgyT1ThBqjvxgxIeFb16eltFBzlHrYrs3SXnp7RYN2719Z0BsncL0dfdncAKWZZvv4GV5/IOxve7eJYicbt337axsXG3fy1sjaIKm95fqdzalBj8bMf5i2EjbhsQZI4KYqZV2WeZZaIzgChM4EDk5sbmCqtZRlAQDbl/Z1TwXgzaX8H3t7fXfwKyD1Ao9ee1Gv9tzUjppoWFnXeb7Ml3me52WZo3MiEZeaS1kBPeUhxInyOJgpEW+mCb7tzN1+XV/k/k5XEQGYOIU6JBEi5pynaUwpVWFAUOttUxxURUUh2j0Tc+JxHIecc0rR7jblNE4jMzlE3x8cx3HICZHIMITu+/SOGedMNA45JQL0aLY55JyHjBHdQ3CElNgtcU4hlgMAQcAhAKdoaAbmahr9VkOvsopIMEqISBQ9WVDBwMkd2FuHMHdvzZfMoqH7a7q7t4BslkcwZRshTZ0DuqLSG/zLK3cAbx5e7Z2N9t5c6+t79lgE1yc2VOrv36DrhTuK2KTHrpx83/nrQe/9l2+/d9I9++0PApUA2nm4h2CYlnU5n56fH7+U+ZKIMGdGjAGzFF2qgNQ6X+bTk6ncv38PrYcB/j4T7r/R5je/3v7Om7XirVf91V9fOfQuKhJ0ktRyPp++fPk8Xy5Pj49Pj0/EPI4TMxPDPI+qFQCJUso5DcM4HZhDK+cm3+T3PtPf982ImHKaxjFSN4gp53x3d5dzXkuhmdWUiJgYwMtaaimIeJgO0zAQUR6YmVLiIaeU2D37u6OqMXNKaW8NsHN4cCET6O4hV5MTPdwdHADIgRwQOMVnN3UBnMacExFF5lNkMjmAI+IwZABAAlFxgxo6SOa1qqqnTMMwMCMzpoyIwMiCDgZkRMYAAOqi1dy1huzKy2lHiL0bN3aBhE24oj2TqDlzjZKDHXL0K+03vvV+JG1xkc1uamzRLajsAAdu7vDViLpaUtvX9v+brdQ6EPoWoOnYhIA7H2gzQfuf3nVy3goHvI1K+AY2/7ffXuZDBTBB6zNZa621qCp2yZHEBA5EITJiIR2Tcu06xNvk/wqt+09yUl/ftm//OlH+conpGphdFgYaFdO6BJW1lFJKqbVWdmcWAAjQIkZRERFAtMbm/C4Vi/9GW9eHoQjYp76pGScGBWZOzABgaqaKiEOOzE9MTMStoXTYDiklIks9s996dULwSoTRJJ5UzUyDMEvRAILcOVwt6imLrmqIEK0quyHQwoQAV/oZOoSpqEjkh5k
3mT/H5oUhEniQNQThi2x3qG32liXQiX/a5IoQcHPlNs8ON3sK3hq8e4ZoFwa59cY2t+vqmF2hHbcd3Oz8+uwOj66gdMOJXG0l7w96UsvXxtqeAP5aQuQfiq3UpVtNag0Fwsv5cjqddV3qZTaVzCTMAL6uRdbiqpenp5RyKevDx2+Gw5GIaZhwS+q74tQ/9pH/XV957a+9irn1j2Pvi41dtcrMRbTU+vT8/OOnT8uyPJ9O53nhlAwxmWKmcZmriSMhpZzzdDzc1eKeiImaIh42xcGXX9vh/HWMZ2ec/9TVQEw5j+MYvTzDt4o1hBDHcXD3Zvg4ECIBEOJhnA7ThLgFZVxqEQE3i75+zZqAUK92AKBd8DuOTq1V3rTpxnE8YE7RIDe6EMFVgshUFHqaJSAGpMQ7RdUdTF8snSFPiC6uZhjgpeYOIIiCvtN7ajpQrzpWIwagQuuVE6ZTGE3NVqLEtEcl7NCC+728unMv17QrCbT76wWqvLijLywnfPmW6xh44QDEU5GkczWeus5a31ezoPpw7/t+eS5/IKjUXJfIcCvrcjmfH5+evnx5tLLK5eKqOdHAjAClllpWYn78/KnWery8e/eznw+HY8rDmHLkDQLAdo3+O1lIv2Pybma2dyD4mpt3Y7M7qGqpdVnWT5+//Oo335WyPj0+LfMl5azoKSdD54GHmkVNDXLOh+NxfXjInjlxStwHKL0N3K9h6noUcdhX1/W19RVO0PF43Cx8omja58h8OByQMHHKKQFAjr5LSHd3x+N0AHCz6mZqsqyLmkTwnkIMjggBnMA1+vkA48asA0ATw75eMEP0Pp0R3T1QCZukHLmrirhFikBEyjyk0tZS1rW4A1Mi5H0sJqS0TdSsNgvLARysuFYHAzU1NaSmsau3hacxNakjETfN7yb5nZqRiA2VKBq3NNsKtmnciIHdkHnLDn7h4oWRBi+HJu44xL2bBjePff/u3dO49ZDvuee7N4cRtUUzEBEip95bo+zdWdxsfyCoFJs7dN5ERarUWrWKVHFTcIp+UiEaDwBSaykllyK1SK2I1INxe5vzn4hk+qfZHHp6nlmtdV3X5r+JAqKoAjXHDRGSVJGKAKJipqrUZaRxgyMHx98NoC+P4Sfsc2gC8oQtfad7NQDYGxpvNRlETRKfr7nMaO0DpqrB+ngLrDfGog/8K3mKO7fpeoweHVwiK8YBwNzcDJCcPDyPpgnQXQ9o+hRRAG7uQJGXGus+XgVVvfdxQmjBpcjcBPfQyKavuyfX4NrGZ7e+5j26d+PiXVnqhkg7x+s6vLdOr1eQuN65vfv11p19C4zeesvu+l+ffoVXL/68fT7Wh5dPvvzaPwRU2kaSm+kyL+fT6fR8ejqdnp5PZVnmpycTGVKaciLERM7oRLRcLmrm5p9/+AGIp+Md5QFaQDY1bP5HRKQ35+bv/3349rj9yozvyT0mIuu6Lst8Pp2fnp5qKafn53Vd8pANLA/ZVIggpVSLSNUhD4fj8Xg8DsPAzDllpFiuom/cq5HaF8G3xs1Lgh++crCteZmpmyuCuyEggTkBUrQpFABQlbhFKlJxdXd3ATc1MTVwlyqqCoiJOeeMgOgOBgggJgq6hZfMFMiJEVo7TwfvbZxbDKT3CAVziyofJySglmTY86ciHxuJEgAwJyIGByYHACLKzMRR7gMW/YxEwR2N0Qk2hCPinFIeONWXcaue+96yAJqnBt04aq7c1YPrTh/ANULfb8rNjfmquXR99XeNz5399ZMk5OuR8LsGxc23XAfYmwf0h4BK0Jc+N5V5vjw/Pz8/Pz89PT8+Pc/ny+Onz1LrlNNxGJjwfsp3UyIig3MpRUU//fC9mN+/+3B8+MBp4AytCdc/upH0D/yCFytNHxB7c3ofxYhZK3Vdl2WeT6fT4+NTLeV8OpV1yUN2sDxkkeJgKfG6lLLWnPPheLi7O47jNE7T4XAgD1OFXjpwN/GZ3+Ps/O3RG2WxYe6YGkBUTQN5Co0SVZK
4PeYdleqq2s0bV9cwe0WliLh7znkcBkJKSCk66Jq+aG9IiJwomGvvit5xXtiK8lo3KycLK4cJw7aLwLY5aFMDB+KEiFHQ0t0uCCqdiETU1EWslLquKzhkHhIN3ZBBJOI85HFIrzovQUefnrXUOKaNV6KeTnl9w5UX74Pjdni/iUovkOOtV/H2iRuMu4UzgOaNvV5Kg6R7+bVvfefmLm5U6dvb11Dpd6Hd6yF7Pfnf8dnXaNGDid18tgjOqJiJSq0itZIDAzLTmFAUGRxVEUlF6lrKstRplVpVBIkcfH9N8fotN4f+4n79YXh6bxlL3Tfxrffrq42URAQJuVKt1d0ZS2F291JKWUtcq5C1D7fl7w/bv3N0vPEBbH1VWiYlIiBdqc52918u/Q6t/i28KjRHjOq2Fw17eqBqG+ptHW53v6NT/OxdkgCREK557t0ihf7c1XUi3ALl3fXd/hmAe5iB2Dnd5hDe9C7th7p7sGPrO1nUTwc7D7QtUttL/X3X24dX5mJ3xbfX4vftzHxx77dy8Zfv3MMHbu/rl/j1dvPszih6a2B/bfz9tK30AjT/HpuD3169r7+zefPW5l0RLVXmtZ7mpawlUzkzMZHUUW1KzIcDjA6Ay9OPP5Rlqcty//DOpE7395wTDtgbzwHAq9Hx9oG8aQL/421fsX93B+ewCxipRvLk5XKZ58tallpriXLBWsQVEqTKa81FKjOPOY/jmFNKmYnxcDiM0zhOU0q5CS0hto6ru0yT6zFcbfnf9yR2H3aIupOXQgjmjpHPjQgZmYkRvBEojXJxBBdFB0QkZkYgAFQ1BPDotA3QUg+hl7RuvLdimGqRWQl9rSPoPb+JUkpMBOCIwRu4mjbgi/ZrLVaPRC3XCS16/4GpuqKKmYArojNTBoA8TOMYzZQ8OH41L6VWkdcZMNvBRoIC9T+3n3TznvYMdLSCLR53jaFu2Ht7W3bz76cJwZu7jbf3vv/1Yg+9eqm95ebdDs34vxZ/+XWRuL7xbZfm9/Hg/O8JTD1du4Pby6PaHV2feuDREl3NRLWKrqWe53VdVgYgBEZCUGKIenFGcvPnL1+W88VEP377LSI4+t37dwAJAHtruLZYv/zal6f5tdP/fZ75u16iN77uK4uPO0BDbNVay7LMy7KUUiIWUKSutbKpk3OiVFOpNepXx5xSSnnMKfPxePzw4Wfv3r3PwzAMg6VMiBjeyRvBuBfm5tdO8qughc2PuZ5E2D1gaG6uhgCcYBPsoWbFAAI6OiEZWMj7QGOpDN1NDdQQkYbEKSEhIzeqhloOrat7S5viluLkBgCZU0oJEVNOkcYZqCQiVrpBFtRTHA0SMTFzm3lm4Raag6m5gRmCE2EGhJSGPI4IGA0hAUDdVUT0paeJsAOdncVEu3/9gsCWx4F9BgcYXS2sbjS9tpXiy/xWZeAVML05bnvCNgB0djo+6XjTZe3FjvZG2U0WZUeCvo/r0b759T+BSr59y/5E/MV+XviTr/247Zy2NNA3rNrriW15dzFeHbDlsAEQoJMVsVLFHaqamgGoiSigllKWpcyXejiIVJaElJAoFBTCJX5ZEtvw/KWL99bZ/fT2D4Mkf/3UWx+4fVv3RK7GSJv35hGNJlNRBMRa61oKcyp1rbUgYsSPDCLV+2uZXf76j7eH/u22+RZ7lhcRndAQ+31sNlpbLfpdiIRnQCAlcnJwcgBwciBsfhOYY4TyUo9QUXetMHqTsrsHRQObG9ZoZexiJBElU7i+gwIRHGO8bAv8/nwDubZ27teoPW0mW7co1MzdVF/mK91cq5/2or3J5cUl8i0Qvw+2vXFbXu3mxa36/V0g3M+Vf9iGLdMyPMKf3uffw1b6+iW4AlEbww4WABWjpjv5L29Fz7sC4nS8uwOAy7xMh0MeR2KuqmsRQGgZsPNSwYbEAESOiYnUIfFM8OlXf7s8P9ayHN/dq9zn8ZAP99jCyxsaAUDEjNu1uRqaP3lS/422bndsv3cZd7ff1iz
hfRg15EoAGYlTHsZxBNiofXQAMwd0qIrooVjJok/PZ06f58P68dOnw+E4TYc8jCmnSJIBgN2c3r78KzC1TTpvB/8GjbiFsWN5pNZy0hCU2sebtoZB66QICAREOI3TkHORauhFWN3A1RyYMCEhgFUxEiQcjmOaBnDXLU0REZtAcAZAMPBwFcEiwM+cIlMpcWJm90h6VwRkSoSOBMjgAFVdrEO8GgKgGbi11gAWVHtQUmF+IXMmTgCxJLiaresqUud12beo3G5tZ4yuc6HxVG2oXqdQeykCmzsIb5/r9ehxBXZGwk2gBK5v2t9N3M8K3z/o9y9e7uaPb7vB12B3fW+3iV64jgghZ/I759TvGYP7PTyUl5C0Le0xfrcEGXxzwAMAABLROE0AcDgc8jByykAsarXV3yIg+griNqR0N4x3ORvR4M7ChfD0+ce6znkalvMzMSJxOhhCLLdd06Xtpx1irIWbb/xPs72oBvoK8l1f6D8bgsTCzswpZ1UNfWhowmgRGDfEFjpgonlZ0umsas/Pz8+nZ1Vdy3KQIzMw285/2q2hvgsFXm20tlZfJ8wrUOrwhuFKg4ftwkTUEpGwFYIBgFcF1W2IIOKQ8zSOxLRqDWkoNSSARJQ5IYACqgMS5mEYptHda60isn09MQ15QEStplXdnLrcIYcQEzVRJjdUEHcIhcXw3JDRAQxUWhY4mDkCkBlCbzwfAsXeg2MU+gCJiHoGPphbqRFmKG/V58IrO2kH+bDNouYG+dUbQoCWh9h31df6/cC6GWy+Ycmb0/itZ/ZT5Xpwjm9/Rfue/Wd2a+meCOgw+Dtw6fdEpd2Rv9zf7Zf0lb8bAB4ChHjDXfwExiETp5SHYTwe7+4fHk7P52EYy1rVTNUiS00ECbRUWUodmIVIEEmsrAWI1ss8n85IhDQMR4WE5IghcuL4Ys5dj/krDtxXLt/vAdNvfeqK2DFKfDPvr6NsG7O3zzcqmBMP4zDKeHd39/7dw5zT5XIRqc302+jPHiEyB1Gtta7M58v5+elJVef5cjgcU8phxfR0mL2tBD1n8MVq6JtYTG9L9HK5FLMqihg9RdwcgFpY1Kn1ejBrMyncnsQ8MKeUohsLUqNaEJAJvaESIiDnFPxwCAuYWXVz00Z7Bw1iCs1W1C6DCQjoZk3Km9QBQgIJInUhrm+L9YFba+7g5k2oLFxlZnA0A3CoRRScCEKyl1tYr2GuEyUmjRK8/Ujp57VZp5uNunm+twNmv1q0By3XDN74wP5GvPGHu7/wrG8O7eZTt7ffX7/tjfdv8oUdmOB2ZO8fbw9en8NPoNJXgePlE3tI6qDUYqamgUrMjK3yym8M0e2jiOBEBMMwMqd37z78+V/8s2k6IvBvfv09AM3zfDqdzcydVExYH2lGsTEnfgeIgy6rf/mSThkxTceHw/39xz/T4XCXxwmIkVM4tt3i8FvPHAxebb/D0nx9B3/Hm7vXs10hiOtzhbjm+uB2TzfIb7SH0/Fw+Pjh/WEa/vKf/3lOcD6diGAYuIpe1kVUHLDpBKEjgZnPazH3eV2HX/9qni8PD+/GaQS0aTwg4jg6ESVOuG9/cg1fbg9uhmKTU1G56WUE4O7LWp/OS6xD7s7MWZ2JKREPKSZZ5AslJ0JKRMdpvJsyMY1jShkEkAgIAQkZGBAG5jEnQmIaExIgeiJgqlKXs8qyENM4DEQELlqjStmkGHhLD2owVNEJRcUp1FG8UTRBy5toFXNXcauOiOqOSkzIA+cAnpEQ8HJZyrK6WeY0TgMRUuZ2/TIbY2J0G5mwFOfbhhRhSLYCt5663UVNXqxGzfMJzw63ed3slnaf+mx6MQhvuIG9Rb6xVZulcMWIWyLD30KUzUGDNlLbOHlhGW2O/u08b3vqzsnb6Sk/bSu9QMO3nnoFSXv/ZFtLvakfvu0pdWMVEYlTIuJpmt69f2/mnz59mabDPC5rqc3PF3NzN1/WckEws1LHmpOB4LwI18vz8+nLF61yePigVZi
FMt18W7v2N1fkDQB6Vbr699pe3OaOSZG5sylY+7ZWEkZcveVe7w8HkXDI6TBNRPD+/bta5nHIP376cZ4va6mrVDHbgi6R6YMAVdTdRfXp6TmEdU+np3fv7gHgTmrKGQCMnMyuiRRt0dslAG2n083NiAr6FmltJwiitlbZniFzR2IGBqAESM2Ii4kRGmk5p3HMRJQSIkUXk/6PEBFzoiExIQ55GFIGBEEwAG8Z1oLACJGy3bIlTd3MwIEwOWL4QgZAhlFLAojeKj3i8sbtUDM3hVDKs5ByAyLYWqpkRKylRuYlEeZExAy8+Ymtzj8nBm9KUy/GxBZT6zx8O4C3ZkZPRQr/d+dX+47E+eq467FteL3IdnTZmWo33lYbcw77qNmLD71hW235TTtz6fVxdQzDW1Rs21dQ6cZeu/kN/f69/sBWWVRqEanmrlrNNKU0TVOKEXcVPHh5MB3W0AE45fv7B3D82c8ev/3258wJAE/P5+aiGxh4FVuKOMClVE6ckxGSG5SlXB5PVuzu/dP89KxVprs7Zm7uQ/uOBpJxWdStZaxc6WcAgLUs8oqqfAuqXq0T+8vSfaoY9O6uaqri7qYSknWtoSMip4TILW9nD0mR2QJIzClndz8e7x7evUfiDx8+1CrneZ5LFTNVMxHr5iq2tGZS88u8IhIRf/nyZZrGu+M6DgczzXmYxgMxRzAc2oSJKBW+AOdAITVVkWiQ+WIsmENQ2NG6jogdkFmTJ2QkIoxmLIBMnogdPQo33BFQ0UikbiYYuiM4GJoIUKiQZHeXWlfVWiu4M1HoxiVmc2s1oAkYGRyjSxM4ogXPBYmDSEKNMySMwB/2nnFuzR8mbH0rm6nlACCE5G6t6J9bba2BR4fcpvfWXQQifglKeINHzYnb8iav5tJ1DDWfueHeLtt04/neRKbrjbn1w67m2BVhNsO4vYAd0cIYa71pboDpJ7bd4tboRWyxXt+OYTu6v5MH9/XNb37tXzAwNT2dns/ns5lWqWY6TdPHn/1sQiRyxn3nlp2p4uhADkG0+DAe/vQXf/bNzyoCPX05ffn8Oaf8+cfPs7mrmZqjX6BWkbGmlFNxm1IGoyn55cv5k/5mGEbm4fjwfry7e/8nP8+HEYEEXDFqslrslwERQFRWKeoalU0NXN2f5sci6+vT31u2uH/h5rx8j0cAoCoi0XqzrMtiZipVpSLCME45Z2IefOIELX7dfaiwdInIHYc8IuKQh2+//fnhcLicz1X0eH//5cvjeV1rNIGRVdSIkLi1LouqWBU7X+bzZT4cD+fz6f279wj47t276XD0h4/R9ZM5bZ2TANt/Owc0zh9EZC1rWVeRehPtATB3CWN2WatUJs5VmCnnpKrERB72EFDOKQG6qxSpBgilOiBIy/kAdMfQNDJTrY6IiRO6ui/ny+P5EmbzkHJKacg5JTZTFXBwyokoIyBAr1ATdTFESIRMoAZF3cAJiDkBwbquUouamTEYA1EiGtKA6GAqZohIxohoJkwACYfM48BIVESqqIdfawqAgZVDri8qTrCru7VWItjV+ztU3cwMb/R5c+Taa/3WxO1AfGEl+P6n+0szqePC9lU9ORNuvhy3hq+hH+OA12Vqr43/wmJq2TbXb2mgGomru66H0N77CpbeRqU3gPClbfQKhmO2uptblbqsi6qKlKiu7IX+SOS7qfzaAAQAdHfmdDgcbBgf3r17/+F9mAbMiYha9q27qIahuIqkygioogpUsa7n2VZZTpflfAEkqcXdwNHAFGxbkKjbmOYq1qQDQ/HezNw8mom/eYmu5/yGZ7w/r3a08Sg6HobaQXRNklp6Ag2yuyUj30y6q72+uXjExJ4QcRynIEXu7+/XspYq0VMTEbfQdduJRYKhrYhuRoin02nMTESX+TwMmYjlEEWkYSsZALXsieZENEO4nw+oqapIt/VenS+Yu6iKqJEDkTkDYhZhYw+iBNE41qCWzw8ABmah5d1D0dhC35EW3ggVBI8qZQB
IiULopOc6uRO6AxOlnBAIPP6BeXOLmSDEllFblnnHA28NkxwBCEMBigjBoxvdlXx2J0L3DV8QoKVgxskgImLi1jPg9bjprsst891fuhlJG9XT8/2uwLBZUa9n9u1S8TVb/vaYbs20vgjB1aEPm/2qj9Q/dgsOuP+1YVNLwLk+jW8fOMDvsJVen0tnLNq6ufNF3aH2UOgPP/zw/Q/fq2opRVXu7u7M7Hh/d5wO7959SDkREBLtrmkb8t4iUwAAzInJ7+/v//QXf3p3d/f0+PirX/7J6fl0eno+PZ7cPTp+gehpLQquYnc0oCE6DVAg2fnx6dN3vx2fTzTmfHegnDShMYG7q4WwIAOQw6rlXM5qKipRRGZmpvbjl+/n5fJWFpzvH35NUj0QzUylipku63J6fqoil8v5+fnZTMHUTZno/uHd8XhMOYcZt0kxtuu7X/sg3A3POQc/9e7hfaTV3N/dLcsSBbHhbqgZ7ITrqxISrrU+nc5IqAbvHn5Y1/LwsCClcZzGYbTJqAuO9PNo/SYDqmOBKaWcL+d1WU+nZ9s5uYiYE49DNlOpDKbENCRiJo7Z7QrIkXtDXVqoVe2Dh/ukjqZgcVkJEWAchsOYmSilHM26VSMNFIlztKsEIHdsDVTAkZhTQiRXBEM3J2KPPPAwlT0sGzMwcQUEU02cCEmN1LoSuMc1jFUfg6rrKSyeh4GYAdHMazDlqmZKzBmZOBGlF7AUNxappaO3NEzaOLSe7tkxKz6ycU/9KdhN/+trgZjtM76RzbgfnVcTqZ0TbOJNW+cD71aPb5cArkC1AUOHqrdnRn/TznbaDmjr1fdWatxPodLmqGHjjOJPb0XZfQH3hqC2rMvpdLrM81//7d/89d/8tYqs61qlvnv3cFnmh3cP3/zsm2GcDnQAbkvENVus/Qsi2wkx5USIHz5+/B/+6n9YlqWW8umHH58en375N7+8nM6iru6mJm52ns/rug7jHQ2g4NVzRSN+/O0PgpAPkyWg48BjxuMIYzYzWYuKIDi7o/siy2l9EpNSy1pWNxcVVf30w+fT5emF7XNde3YLQfy1t5T7THaROs8XEXl6evzut9+ty/L49Pjpy4+qmhASYUrpm2++ff/+wzhOxAmJItmPIfkLi95bWjMiDsPEnBKnb7/99nA4EPHP3v9SStGq4K4iBhDhvW6KRa68m/uPnx8v8/J8noHo/u7um599g8jH4+F4uLs346YpzWE8uIO7hVqxiqzLLCrzPD8+Pc3L+unzj7ozlxBwHNLdYVBVrSuaMvMwRPoiIFhYYEhI6MyYU0tOCAtLxcTUHMXQvNfpEx2m4zcf3zPRsq7rslYRERNxTpTSOI4ToAPG4Am9bkdOKWdCMnSVTmQiAgJhFPm6qJQqXsFDuwt8yNkBqgAINIo8riIjYrRjcHPnlO6OB2o+GIXTupSqrdO6J0AkTnnktHzdg9vO7yqJ21CpE03QWacGG1dQ2tCqvRgNX67kjbcPeOdwwvHDDl8Im9u4Q6VrQ5aGPsFN9vTcYPs2b+7WT8CNkdpPlg3nms/pALErQnT3lx1gAOAnUGmXFHW1kLbZ1qbg5jS6NyXpWtayzvPldD6ryLIsIpWIzpczJ7473jVSuTsp3r9qZyjFyy1emnM+HA7MfHd3d3d/p6rDOCAhGjo01QlRdbDCqYoKm4IqKTnUtSzni5ou87wuS3LDhJjQ1UoIxYGzGQKssixlEa1x/NErW0SXdRaVlybQLfpsIqA3gATdm3UzU5EaIm3z5TLP8/l8Op1OqpKJMmNOeb1bymFBRBEx1eAXvYd/b29v+9ZIFDDmnIdxlHEYhiHnmOXtejaSDgABCDB8C1KzUishppQul5kQj4fjui7MlNIgUsHdiIgdAFpOklktNXixZV1U6jzPl8slyvFubEkECilF8EQkIbzPxHz10Pt8awLYV+LX3R2sybK3SxvnTUQ5ZWaKri2h3u0OEMlLxNH8pdvdsM1lbMVm22UghF7JH5p
LkZ8UEUdGInJAIt+nSUCfvf3eboLi5C3hKZLQrYmnxGK7D7Ddbju2G69/bl+0ET37OX7FpZ39c7PPfk13OQS+YUWHpP7Jq8UFe4C77rcbR1eu+jYz0q9m0P7ub9Pg9hjxegui7gS7nC7gyzP5vevgwMFFaqdFiptBv+CiUkVE9cdPP/74+dNlnn/13a+///RDQ6Va53XJQ35+fgbAP/nTP42+F4BDS5ABdHBVEzUzq2sVlcyJ+UCQONPhOOUh/emf/fz/9H/5Pz4/PYmsz8+fl3V9upzLOquhq5Fjgvp8Waya5mGYyDjJ5VLI+ZLTL+9s4DQN0zcfxvf35rYuSxUBMzcBs2LrLCd1EZFai3XBkHk9i9abi9KZcHgFRt6Ru62oqqWsInWZ5x9//GGZ589fvvzq179a5uW8nE/nk5lmokSYc+aU1PRwOEyHIyLmPCBRyh6u1H5wXjE9km0QUkpDHqZperi/X5ZlnsswDKXWKlpV3B2MDC3oVXA31RlRq5japyHPl4upjeN4PBzfPVykFE6JmZnZHUKpwFTnea611Fov51OVuizr8/m8ruX56WlPvSEAE2TChAx3h8OYiaMvyKbMiypqRQEAwcyN3KNlnJqBqLs6ILbq1PbPzGutKrgu6zIvRVREzALCwndz0aCEWi1uEhERQpRqUg0cGImAAN3AEcyijSUEtgFEDWYOKwc5AQKmlBIzEuaEzLTd9OiVgIil1KUUbbWY157ZyKzmVVReSORC6+KZ+Goc7W2lsB2aWveGyi+wzQHQvVk8exTo86k/sUOJ67s2bpua5YhEgYfh214/ZFtauTUL6cYbeMmYdSDa+4q71idXKOs01R5/99vvo2QCAOhupZZai4osy6wi0JF+XpfzfKm1/vq7737z29/My/K3v/rlb7//XkTXeZZSj6eTud8dj5zSX/4f/jLlNPnIqXnWhGTuIYerqsuy1FqnIRp/ccqc0uTmf/4XvyCC8/l8mZ9/+8NvzufzbGtdFBw0iiQVv8ClcNVRD5g0GZjAeqHEleFU53QYP8x/+rB+Y25zWauImda6mql6FZgdNEhcj7XP/Tw/Vym3N7ZBDvRl8+Z5dwCIikwVuZyfy7o+Pz//6m//+nR6/vz58Ze/+vW8LKK1anX3xJSJUmJwK+tyPN4dDkdEGKdDStk9Ys+8X3MD9SJdKL4upQTjeDgc3r97LyKXyzyNQymrmYZcawj0U5j3akLoqitTWQuYDuNQ1kJEh8P08f2HWtZAyZSSu9dSVWqtcjo9r8tayno6PZVSapXLutYqXx6/6C3hzYQ5ISFNwxHCzBkG7s4OACyX5aznKHJ1EycmpjwMqIprdRcHQuBuVSEAmlpZCyEu83q5zFW1FFWF1uANyNxqNVUNownQq2iqlQhL0VoEEYc05PBKwQDMQONBN4UwMQ/DgEjZUS1yuQmRmHAYU+rFwPtbvqxlXhZRrWoQSQ+9aZKalyoiLxsSYBPtptZNADoq9V61ANDzwXfx89vJ28ln7/YkXomnXSWa7z64GU1Xop2a+9a15ZoHt50jhv+ODVQMOmZds5I2I20HGfjiWzcTbHMotzN7zdgC/LSt5N59086SWPDBpVSp0BeOyzJfLpda62W+XOZ5Wde1FtFoWqOiKiKllMS8RgOwWjiRSI6SJENydxGpVVSj4VJlIlVRY4DWaJUYx3EQrcM4DGMukombOLJ7o0tErbpKUlFjNEBHUXMr67pcLtm1zEtdF3MXqcEc1VrV1KAqioOGc+AdYV43qIAta+DqgHbCvjFuTU++CY/XUsu6rsuyLOu6rGUtZVVTMYm7jmQAUKvUWkrNpZRSViSutUZpVXBJ2P2eHmhoEZ/utWCUm+WcY3mPLml4HSlXn44MTA0BVLSKIGJkKhDiOq3ruppp0hw90mop0XVmXZZlWaJVby2liJS1VhEV2c2cZpHTVd0ViTm3FiVhrYEwM7VeuM3A9FZLbOaRmN7izs3JaxSBR58Sjc5v19v
kPVbiuxviLSCGsW903FS6cUtcw51MP+426C2YmkN15Zuh5+/0rdXFQQvPXX2zjSp9Ma/ilDYRpU5yY/M5+5wOD+VqJL1gCX5y61ZWixfC1TbZQxtu7lMLBb504mAbP9v4w+4fv8xk2z7y6hDx9vEVZfeQe7u9QKW4kgqgAJHXCl0sXaqs67pcLpfvv/9+nucqdVlXNZ3X5bzMIvrl+fHL05OILFIgEyGzZHAAwrUUQPjy+Pir3/zqfDkf7w7vHu4jx4yIzPxyWZa5RHBHVQ/TqFoO4xialG62rkvR2aBM9+lnv3g/nPjT6XN6RtOIxqGoXbwIKgCOaR5TGjKNTsQ0Pz6KS54GyuSuTqQZjVDNVl3VzEHDJHZHN3JomcFa4bagAsytlnVd5uDlAaAnhFxznWst0Wv7y5cv83w5nZ4/ffr+dDqdzudaF9WioSIFoKGC5n6+XMxsWcswjvN8nqbjfFmm8ZgSR6M0Qor8Rng5unyD0Wmc7g5398e7h/t7NyeAWouohlHSoEwNEAUgZv8yryqSmD9Nn8fzWWoxqSmnYRiHYQTwEqgkcjqd1mWtUi/nc5UqImsRUSllfcErJYJM0b8vtVrYlIiQOaU8IGJGZHBTAzdwE7Hn02lZLma+rrWKIRJSRiTMTDkToYqeT2cAP5/P8+Ui5qWiCiBSKZW5uLcMp039QVXXdUUAERcxBARzIUEEZkcCcxuGlBLBNiVbka65txRWV7VmZ5oa9dyIuJDm5su6xk1HooQNamN2x6KCxC9clGh7l3izlbAVI+IOlbYJvH1jm/MvJjL2haCBHTQv6TrnW5dybACJm0vYNTmJIDqp8LWlSuPNN+AXNUULojOSRSNTFncotJlvVyzZjrE5m4GyV/avY/1LH+61rWQbKvlmYyGYS63rWubz5fn7H3779PR0WebH56cqspT1sq5qupQy19Xd1QwTIQJLAgdEKrWY6ePz03fffXc+n+8f7ublXacv2NSeny/n8+LuKmpmx8MEoIdpEqm1LBb6WuiGMt7njz9/SBNO3w2cERDUABzUbBYpoAA45jQqHy0RMivqky7rJY0DjxkQMDPeH2DK6rZakZbJ2xMqgDqfAr3y4Lq5WS2lrHPosPVBbOBBdqqZrctSyrqW8unHH07n8/l8+vz5x8vlvCxrrYtqtHl2AFckczSz8zyXWod1IcLL+Xkaj2WVcTwMOR8OU/R8bIolfehShHAAQ2EaHMY83h2O98e7h+Odq5nK5TIToICKdfMBrNXuG4D7SqjChJgT55waKqU0HaZpmsAheqioyvl0XksRkXmeIw8pbNsXbDeGB8eUmKKAFhGDgsk5j9NERBmRAzWWZV0XMzufFrOomEXz6H0ChJyiGh9Jpc5rMdP5clmWWQ2KJTEG1Fprb7e1ZWgggImoQwWAuI8AoKhhBOWMERLMQ2rTGREA1Fy9rTLN1gJzdzQEUDbyLv5tLacgyNBALmLM1+sQodJ2k25mHSKmiADQZk6GababodvUDvfJwFp8aSs1aeZYn/ZbEkEHgZ1o1g6YfHOloqFeOI9hyvZOUBABW2hFymGCKiHG8odxabrV5O14d7Lze3ja+PBuJmG85O2Qf3dmQPgsIrVK2Q4ndlZrFanStioioSVWay1aNRL1g9pCYEoE4GpQHQ3ifCpoKeUyz0iI5My4oZKqn86X+bKau4mam5kMA5eyqtRaVneLNsqqqiaUkDPlgYchC5pXU3BvgXBQt6KKCAODKoATqaKAEsm61nkBYUgYw3Wxqm4NitrldXdQFVVdlyr6svo0evaCR7lUQyWH1l3ezKqUKjX6QYWUuLXO8xv31C8teAyapgosVGst64pA8+Vi6pKzm7YCLEqxoMeqyn0QccrELCLQU2lyjkTnnBI3rw231JWNmmoC+4aoqtGsqVYptZgbMzOxA9QWyRDpAuE7LQ/baR5cJx0hJabmQ4aN10+A40+mlIgQLLFpMtOi0rpCtoQjRPz/t/emzbEkO5b
YAeAekSRvLf16Vo2N9EHS//9Hkslk3bO8flV3IZkZ4Q5AHwD3iEyyumc+yLRYRdXlksyMxRfg4GAzEEVUK8PhRsPJkMAmZyojX8+rm/I2POOBhLJcS4a4p1RiokgBDkPYJ/M6lz0BFv7vwRoOi9HzM55iJr6eclvnTvvcgptWW94YDb5qcNw0NmTs7/tsxPR/I0M685/ffXaKr5QF6c2fqGpy7dGcLsAdF8miw2HAGpkFVcCuAGBsDDYYjIYgGpogM0vGKz7cgY/kN+58eneDNY5HrHS9vf/tt79KmfRZciu997e3t23fXt9e32/X2357v12/v73u+07CKCKFl8qMSkS1LqVWbXr7/t6ue/Th6G0nQtBDT5f1+SUgAEdv1dvWWwu0oWYqzJe1ioSXRgGsl/r0tIL87foqF6xefv3LT//2/e+3W/v9v76+t43gClfgXTvd3guzdilWC3PVWrWg69s//da23Su3L4uupcOv0A5nI3YO6iEii0P6vr+9v36/i6Lsvb39+Pbt939yN1dNcO3mIVnMzGzft73tbW9vb6/hPu9dU8gHqDYfkYeD1HA35hAN1+u1yOuP79dSliJcSxnFDhnITU7My7rUWkXK8/NzXZbeW9s3uC1Ffvn551qKw2/71lq73bYb9snAxA3EcPVGpsZE7+Ua/WwJKEW2p/2ybRRVK03DGkp/xL1oeuD8melyWX7+8jI4X4jIuqxhrUeFNF6q+MXNn9ZFVVvvf/3rX9+/39wRIkmkLBUihaFvpIWpCtYCgpci67qo+b4Zurr6druqtshoYWFmFCEiLpXqIswUHgUijuFioaWyFIY71OC+bfv721W7kkRsONS8B2sHc1MjkPLoSxfGQ8hHZ0It4oBDnDgwVkRaeqhqfWS7zxZcktzCk906ZJEjYcnZKjrU2iDpActqmLmgJq0ckohPWCQE13D8cS3MTIWlVmGmKlKrZAQtJ3iMHbG33lXVbNuzphApZi89z7umc9C3T7F10oYn6ZQ25SdI6SOvtG/bt+9fl7WEhnOfY6vX2621dr29b23be7vt2/v1fdv35emyrpWEChVmMPPT88tlvWjrxWXj25Xo69ffr9drpCLUWpYq61oHAcru6Opm0WCrm0YAYIcbDxfx88vTTz8/iwgvLCtVyJefn/7uL79c37b3r9uNNgfUAWAztV2FULy8kC1MBCtwU719+7Ftmxa+vZe2cCe8k3c4m7AWcop8AffAhv12vV7f7/LgTPX6/vb247u7ufYRi+4Jd83cfGt7b21v7Xa7brdbJJdMPTuwyoRLREB3d6Ku6m63mzDJq1zD7M+chUwYokCXzBzdAWqpP//y89PlydzNFW61yJfn5yK87fvz6+smJZqAhyi0KJySTdO4kzLbzrzd9l50wHhRNVXLmBJ3M2ut9dZjRaZM8keRFHe41Pp8uTBTwP9SyuWylGhkBAbAtXCgRSIHbdv+T3/727Y3M3dngIoYk8DRnG7ehQmrLFLCp74spavx7gFXI0u3FGFeiUrk5DDTUmRdCzMv9VLLhUXWda3Lwkx14VI4nsrN3l7f99tmakLEYAccypGj5MPuTfI5vFSEkUYfICOqxjjYAXWNJryjQpM9kLqDwSE+ud7OsgMjlCevexA1A6blGgpw58yHMXUnBgZnzj4cdZiXAzMVZmEqhSP9aCmy1BrwNrFS4GEzZurKvauZsYIoubeJGM/RS3669iGM8g4SIY1SBJ8KpQcLDmi9v1/f397fUhAPmJwLblnW1i/rk6q/37YwX0OBc5rIYOYiUmshR5HSs3uyq1nrfds21W4qsJ7po1GW0MnA7g5XIgOMyAAXztIQpZIIc6FSQtHh6eny5cszE1+elutaVL01C+9SRKB206YdzqKmZkzwrtS6GWkxdVaCMzyG2AjOqtpbt6hw2Hrbmt5bcGa679ttu7q7p+EYoaoY8YbeWzr45tYFcF6ahy1wesVA7G7RW4hMSSMj3NxiMiPsn1kCYwK
karW2Uorb7MoBApZaAb9c1ufLk4hY1753M2vq0LRACMPv6wj3Kin1rq2ruZfWSon6uVnJXzUt1OGCHFboBz/KxPCU/ubh30o2C/BsAxfORebBeNyf47ykmanWIkylFjPr5g3NWUEQERYuRS6XtRSR4MeZpMTO53VZni7PIrJeLsu6ElOtxEKuqkVMrbdeSlE1S5dHUsIMYibBDLtOVjwiewAwuznMArAct56iP8nDh47eYzTGWTGaC3wcxWCFh12ZL/hpl+cPI2qJMLz7FI1+0x4dzYdzZkYjTF5qEeZSZKmFmWuRJWI6coEh59sivIQIFFVhHRD2WUYvubhxh4f1eZ7GWbsk254kLhym691xj5Ucr28//uE//cP79c1Uoxh9+Aoul8u///f/wy+//Pp0uanL2/tNnf/hP/9VdWOSdblIke6mUBF5fnr68vKl125vnRr2sne12966trZfmbEKr5WFSJZSaiEmKRcplQgsxuIsXiuEUVJ+87quT08LC5daZCluzs6//vTz64/3/bqDbLu1339/7bqbkzkYeId8Q69EThBmViZ3bk0Z+w17gTH1KibMVI1BJNv19v5+VbV9by1KnF7vfEx7a799/e2//PW/YDh70mcxlok7Bg/ae2/uGhAG8EjHCseTqw6xFHwEObk5QG5uRC6j+EPsE1Xr3ZG5qRE/LcJSa/n1lx9Pl6e6lC9fXmqtDPz680/mJsyFeNv335evC3Pv/f16vW03j4DDEClqZtShOzdlDRHFLBHVQKPXtru13gMi9SFtZ4j1w5IKlQ6CcAQGhMVJrmY95bhQliB3ggiBkk4CcUgDms4adzitS/nl55daS621LIuZ//7aXq8NoFLCzSeXy1KKULafRe/73m5M9Pe//vr3/+rf1lKeX75cni4gEBvgqn2/vlvvv9VyfbsyUeu2tR5mBbM7sJZCwWEfMMDdQSmyqbW+NzV3IXKi5CSt+4zc0P7gMSFCESqjISVlBTg+U92xNKJMpk0C2bPVDVITRoRBpP2BASES5jSTo2PCacsPWTjUvPC6VBEuRdaAkKXUGr05ozvNSJs2W/a9RxwJU2+9qTK1CFqNKNHgxTEZ01TEh9qaKb3k4DAtHeZHiNYfSyX4bdu+fvvqsL61vjcC1VKLlJ9++ln+g7w8vxCX961LWX//9o2IzQBwkSoi8A5ARJZSL+vawEtdtHRm0cws8753InSGFmKiuta6VmZZnoBoIlqcGCJYVi6FSuHLWkSk1rKshZnLUkst7mCXl4vXWn/6+fnt9Q3k9N3Mw4yDgXazW9POvPb+pMruDLeuxujNVFyFfS0uYgyu1Ql9a7e3m6puW0Rltd7uQgRV9f36/uP1+yTeOFv+UCpCR1gudsJKnnmO03wbiGNoMwYbO4HU3DHIaSLz6FAWbVrVPSKTPTU5qNYCs/1pu1zWWoQAKfJ0uRBRpBrv+963fXu/NpHeWm9sFq6lsWw86qaps4WEHSxHNC9iEfZMOs3Hipsf/z4TSvDBqNJp2SW6jGidlOWcOciehO0M6cbU9eRehC9P67rUp6eny9OTOXjZl/dw8wszlSLrZRFJVzeA6/UN3ojo5fnpL7/+Uuvy5aefnp6fATd0c9XetirhWl7Wpfdu3tEyVSvurhRhCSw/9phlVqlIide7RrohYTSpgGcrgpDyDwMUYzLb5GI0yD08cJQfcvJAZUqDwPTjT0MLBnCliUyjTkF4F5KGB8KgiTcFpVVE1qUW4VJmyb1SozUCExM5oKbmampE6KLC3HuPVByNly3rqFDGFQad5J4BTTRtfB+RCozk5MzBhs+E0gcLTjXb2Ldba9tORE/rEy2kszgZqLe+723b9ggM3LZt3zZR6d67qYhs6/uVRffeb5u2ZhloRyK01oswLoVfqginVCJiLgtJYUYtLgWl0vMqpRKzFGEmCGWrVXZwGLBSpPrlsv7880/brZVSv39/713dPDpUmKOZO6yp7qrsXoAibAawk7kwERc
XkVJlWYhkL9tYVeqmWcH2dATDsm37cGREnebDrZELBR6+IZtogujYqHSEpeQ6nTY/HVwDEJ2DEM4k4TARc3oHrkZkyZTCpmpRwIiJmWutl/XCzJfL5XK5cGu37ca7ADYXQix1Mlc1d2K2qD3Crcf+rs5u4piE2/AlYkaX34klB6LGSJgGzGxmAIkIzBBSKR8McHZnNSXKdkkZNslcitRSCnsVE8aylMtlWZe6rnVZipmvS42+UomVhNelSDqTAMB6aVIQGYDdjHOLEYOjrwBci8Ct1nJZFusKEjUys269m4aIlyGVUq5GwCRzlHMztc5s7iAGi5l3YVEGPMRtrYXvtx0NU4oGvZ3LYgilSQUzyAZfM5xoacO5Y6TaZsBqLVJEapF1XTgb2cmIDUVEY0WZ5RBbIrIuJXwQ61KHb7TQOBzOSuakFCXzESxhoCFVYSWiqLzkRq4WGjfr+Q4png2G0pcZWSzD3LM7MPcHUgmO27Z9/fq1675dt/26CckvP//iz35Zn4i4lAW0vV+3799fv397/fb7t6/fvwG+lFKKdOtqnZlpb+37m6lvr61tvd12cwdhWddff35eqnxZ6y+XpQgvl6Wu1R3brq0pMy5PVCqWRb78XOoiZqbd3F0I4mCHeFQ85WUptEqV+h//x//wyy+//u1vv79fb0TYt/32dtNuzekdXoxKa0ybMD8tC1CcQOTsYKFSVl5rWS71+QtY+r59hcG69aZts9b9vr6Sqr69vX///n0wAyTMQ0XfVf8wi4ieqEA0/y7iMHZmNR8V+zMSGkQB7ONsBCIfhjsKEcjNNShHd+1Nm6r29yJmCvf9y60ISeFaREp9eXYialkEybZta71ve7KWROk3HPsARGRmaspHrAAttZTwMQ1wZWPFZZS73RFkZvZ+vX779l2EI1eYWZalMXMhWrJDm0eArjM7c2+dmOq6uLqqu6GIPD1dLktl0sqdCV++PP3l15/WdYnYdXOQ1HWNeo9ZWmlZCg8SC0CBetsBiEP3nd113bVUKbwutSyinWFNhV+en375+adlWa63VsqmZnvbW99ByAIsSAvL3V3No3KDMADO8pVOUkmKu5MrwwhUShHh66ZSBPcHZWngySsNtptOliI5ojkVRq/KwNrDLHK4MzOhMC2lPF/WdSnLsrw8X0SkSAKfWFAAOF19UVEQzFxqCWFUS8n1KTwCnzIIJuhEYWpNShcz3YVL78E2dtUW4NkyjHWEv2ASp2bHDSPjaNyHWg1z8ghh+EQqRWzbvpWbbNfbdr0Jy/PlWVe1rNnGAHrv+962fd+2wEr7vu2motbUOhNvzKzuhraZtuEcJRLhdV3WpT5fli8vaxFe1nW5LGZOuMEaM5ZCtWCp8rQudeHedbdmFgYLomBllHUWEeaCFV9+emEurfXLZV3WatlAAwrv7u7U1HbV4r6Epuc02RlUc1LqslSwRLJ7AOXASg8I3N1ba/u+D5wLESmWmPk0qTS7k0/mZWqhI3js9I9m3Y7Bh07KMtwXzuxwSxLLY02A0HvvjXstkUYLdyIW5lrLaqtIWdc1OsfFPnGXvIVAPAAMREZESkAHM1E/KN6hsIbc8UG5Oj4acB5lKrddhOEwMREDwMwQLlKQho75dKWoASQs2XENRkylSK3CICEXxlLLelku6xIeSHd04yCAgu1mplI4cE3ccytSi7iBAVc1YtcIfKVwyJBbEYFprWVZFjM3o9Zd1RwWDSwzVYaIwUzsZkqZXBJEkIgUpngAEnH3cTu01CIiy0esNFDSAE10gKZ8R474fH3Q3QOY+vEDpWqkWqSWsi5lXZdSpEqppU43fwij0HXJZzGVUpiJWUoRyjhvPk83EUjJSFVKCJuSkNa1cBDfBmd3JSNi95mMM106ICYfNl0KnxCtNMqpfDgepZKb9QiY1K6qscdYmJii4u2+77fb9f363toeiVdCBDUnQA1qTtbft9umpra9t7bb+/Zu+w7Tp3X9d//m37y8PD0Vfqn
MwK7terup6tuP6/vrTYR0o1qpLuyt1IVjOwIwaspERL3oXhoz19qlLG641Ev5svbd/u2//XdLvXz9+n2/9c1usJTTu9qtdWEWKcTiBnVXRm/d9yaEKkLaIyU8+qGUKotV4lSJZ6kUCeJExDwaZLkTkYizS86ow9xaaxF+GGHQgXJGCKKfZokIUQ324FM4FaRH1XwaTozxhiHP3CPkZ2/ttm3hfLrsu0eBlwFkBiN/uP+ycGIahZSbOeTUcH5nJp0Dp9UzcRMyyPdRLkUJOiAqzMA82owwQ4LZRviN3M2g5OZWa3l6fupdTW+9eyDEYECWuhTGelnXdQn6Q5jMsVqwPxQWPjNH0M3EStaWdruENg753fZ9L8VMpAKoZh1usUUlDB6xUgqRdZ1+wdz/yQExM87xfxCiwmLkxASGGQqTygiVfgjrnoIp4U8qJx6C6Hjzaa5jq+fNJD2Q/i3OISrrurw8P10u6+WyfvnyXEopUqrU1CyBRjhKA4wWoQcq5zFwOXQDCafW8Cji6elmESJjHtZy3hMTGbmfsJKNMGwf5Gqckt3DD9zBgMl/C9utvbd9azdue2u9OwAmqYWFu/Zt295v799+fP/67ffb7ZbuWBbv6mbeO2l399vbdlPTrq+v1+3Wdu9Nb+T6y5cv/+v/8j//5e9+JW2su2n/z//1v/zt62/73r7/9cfr71dhPF+kViqVXp9JCq3L5eXli0gxM/OGUEpMxHx5elmXi9Tlp59+Xdbn5/XFunx/ffuH//Mfv3196928WVcl92sz67swg8SInNAVxi7Afr2K9hVEl1WqmSsLS5UViwi31r7XuyEy87CDYokSoahZESJQZ+YOZIWgkEpRCWTbdzOLqPjwsnt0n8+V4GRO4hRVOUDB+1MWRx7ecbgPkhuzvabb3log2dfX997NnJbL07JEqHTEy2CAo3TijHgji5jRsDcJpGysRATt2rswk2nVGiL4yPYFpiC1xzodQISAmLEDIsbMas7M7NVrIRJH+BvdzDpghnVdf/552fd9uzXVzdyIIIy6lC/PpVb+8uX55eVpXSqTM8EcIlg6AJTCQe3WWhLXMOAQd+pQNQf3fbPetyJwl8pOvfdCBGETRilca1EzNXSFqjXdaM+kbwAEDukT04CEqubulcVKNXfniMOFFSYXUPDZeGgHN0USp7sx3fmEu7cNwROOyeSSKRh0s8GtExNdan26LC/Pl7/7u19enp8ul8uXn38qpQhL4UkSHSKPpsw7AbR8xzC6ouE7LBzI5kfJGC9Jozp5MbMmGQU9CdTMpgpL14Z4QvyQJl74yEhNs+HCvyCVAgxM2yPTYCgJeevae+ClfVftlDF+kbFHYVzGdnTV3vp+vW23vZM5KciLyPPz85cvX7xtvpN2BiHOt932/bYxQVy8szbASQqgvBZFYTNoFFSW5PeEK0MAZnAtdV3W55cXc748PUkpxBLNMRxQ9+5wWDdr5iD0SK5Vo67GVEzNjEwdnkhWXCDmxo+CPNNwKYJUiBRGFgg5YnrTS+pm2keGe1jnOnFSKo4TVAf5geonIPIRrfdhYR/QxcyUKBCTRPRnV2aNdWcnOHMC/uMepjEW+MVyiSoRlNxJxViNmDzh23ATxabxx5tLF6M5UWbdOcBm8BlP6KNQzzAFPbJkaNb2nTfMRKVILRJUbilMAJPzcHARUebAcqS5HJswLBoiU0VXN8R0dBD31oidmahCEicmZ8wxixOljAcOURIzRKPjnmEUwHJPkXSUJaGsCgA8iqWTgDj/f7zRk++mETk15sfHGGN4TzJSvJay1Losy7Iu67qUUpmlcEGWasLpg/M8OV0I5TgGPZflQNQpBwOgnSO5iMAkThYO4yz0jgxySdDtg47MNsruiCIYDmcOD94nA/TBgvMoZhypTx3k77f37z++d9V//Md/uN1u//Tb7//4j//wt7/99vb+3m436727X7sR0G+3tt1gDlWoqdrttrXWTYCFmGm/3f7213/
Sttt+s/2qvf/1r//0++9f297fXq/X684E61SEpODSRArtG/UmIqLdWzc4pLBUJqLXepVSpdTff39f1qet9R+vt6317baXUpf10tGaAeZm6O4Gupl7UxBU4OTMqq0LgG0v2020qFldCkvkYfpe9lILnXpIJIwOdiQBtZmPejMeJp5GQnnrLUIPe+/mFiGa2QZDFeeyF2MdsBpBR/L5ES8eZqOPVBgzy8w0wNy4q7uX17JtezdjlrosAXDM/cfr69vb+x66JEteH3Zcpkfk3vR06AIAzKL1NjGTyNwNFO+nYU487Ldw9wBkFt7McLVllLARRd8roljBDgBurjDt2lrb9ybc294rM8nz03q51KenpRQqQpHX7oAUXmywSBHQMOiyuH8psq6lqO97CubWu942wH+8vzl7LfLyspYib2/X9/dt39v11t7et0g5tkihjDreRDIyOpgDw0IJ8VSdOxmcyAkMoijEhDRhaPQgPu2x3GkHw/uhb9qpUOOJhKIxvMlRchW+LPV5XZ4vy8vz08vL83pZL5enUs7hUFPUzTiooRUy/NwDUKt27epurbW+d3NLgymi1dTMtPVu5+ItQMQQgBEjlEmhERwR7pBxJXJ2jxLG5k4GS2YJj8ejVDK3qIzUtTXdzeX17Ye7v72/mfl//etff//69f/43/+3375+84ixdd8B9SvMrz9ebz9e3Y0jTNvRTc0dVUhWYdne3//Lf/pPP759tXbr21W1/fW33/7p97/13fbvvb0aATd2Ji+VLzcplUvprz+UiVvr29bgvq5lXQsAAzsAEqorSSUWKiuxXK+3UpfL88tGW+9wNYM3Mwbeu+/eQXAhMBhaty7mKszv76UUNV3WxdMXT7fbVpd6P0LRzWy4ZwEd7EMiIre2967dzCN7JgS9j0RzH2gU2Ykst7mzCLtIV4yQeWIzj4/0rlmsPgqJmbXeW+uIItPA3pqqSZHrtvWutdZRT9K//3j98eOttbZtt9ZbRGmHMLUzlMLBV7mLucfdRahbASRqRI5oJhqQ/5FZirzXaLXiJgITZ4rQUSW4CKK+JkVIOkUYhWmWpbjtjH3b1kJMl5++PL08X16e1qVSEYqcYxAZikM8o8NsuAcjABIAamU8LaoO9KjTsLfWW+/a395ft/12uax/+cvP67rebtvr2621/v6+vb69q6r6rt6Zgr0I0h0Mj5QXYnanKCHgZr2zJXkPMFUpoGpme2u9K+OzI/EIEg17SiYa8gojCGCYewOkDOEoRMy0Fnm51J+eL19enn768vLlpy/Luj69PIuUAGsJtQOwJAiN/jdDnUZVBHN3763v22Zm+y3KbNm+tz5bJGSAmp31UOwkJwrXw+C94A4dJzaKCPgsuUPjDewedBxwyOfPpRLdfYNH7dremfh2uxLR+/t7pHeR5/soIhDMtbXempuLY3RpN3cESg5mLIKGdW+679HncORVRU8LVzUjB0FVwA4YoRNz2/u+tTS2EeIA5gCxNwPvLKUsICm9d4weaEHCOBlAUaKFLJBkaovoJuDZjtcwPL6hi6QIfTB6B1by8UtOhGaAkocN5W5Bb2NE9rhF3IenIQcETQpyM+Yohm/O7DBzYrDPj/qwCvNE4/dhfkGJWm/m1vay7buZR/iJR/ZM71msNWB53vJA8KfdglzGc4RiafF4IYtQ/HHP1oB/zEfJjaOq2fld51U2QMG4l9iT7kQownV0MIp0CpHQ0OwQh5NGCIwHa5/QKfzf4iAPJhcOM+/uveu27ddtA3C7NYD2re+t96Yh6M3MI04ozkPzrAFg04QdoUYnXmb8YZR+xsPoPi6jTPQfGHS8d5aiPY8YjTce1810fxbhEkGTwjPjPeysXKeBgZkyFYsGc3BM+6gwHw1UW297M/OBlTJaLYzWFKDzJEe6y7g/x2gDmzGTBD+8ztOwODsY749HqcQiy7qsl8UoUnvIYXvbVZUc7z9ev3//8fr71/fvP3JkQAIICO7aNOoi02GFEuD
C5XJ5kqf15fn5ab1clks321sj5+fLS/8Zvdm7txt1N9O+myoJm6ws0oCuBPXWbO8O9656u+00isI7WHl3Yic2enXQ1vr1tqlmYKAz4EHaQAeedgcM4lRZIIVLrctaJ7E9xsnMRD4GmwRTmdb/AEC2b9HlzbZt3/fm7qp9sEhZcj4g0qQVJVjkqIwgGn5ZjQaTbMSc1Lh7a31v3cx779q6ubW2995HhBpYWbUzc++9mxaR8H+743q7XW9b77rdbq01G7WBfCjJY4FmqB6MHFFLxMyM3MHiRMbE2Zv9QX0dg0PLsrw8vQRdD0CY11pFeClc16j3O1rVRYsL8iK+FPcqPz2taM/PT8vTsqy1PC315Wl9eV6f1rIULoWXwkspIFIqhuJwkywj07q5GY2K2sTGQmq+NfWrG+zW7b3Zvrfff1zf39+X2raGpdZ979f3m3bb9+223QC/PMnTU2WmpUqNgCV1uJL7qByAwZFBhGkQumG+IrJPBn77IJsOqT/W2cEt0ZBXGFQ3hgeWgQAmRKjCRWQtclnq01IzkItn0c9BRY0rhtV9l9MfPLRpb33fdlO7Xq9vP95U+/vb7e39amb73lvXgx1nMGeURDat4dkgBQfXSYATUyx6InLOrNxBFTxQaR/E0qNUkpRKqwETFu9tJ6f2fmOnHz9ef3z9+v7jdSQVUmEuEWpjHlFycMUpP6qwPD89Ly9PL08vl/Vyqeve1WQn8NPlC8nSu0Fv5pt21Rt134mLyepS1LSnreu9ubuRBhkeaosd6MQKUvNbz4A2sADU1R3sRM5TJWXKfGDZCjgJceGylGWtS6WTEnC4mp0CI8eQR4EoYAQSUsC9bWvX66amt+tt2/cwWOyoV3kIIxpzIyOyzdVMos80STEiZjEmsoy69tanVGq9NfNo7tCHAeUANSIA275t+42TAmYAkTmjZrfb1ls3T/J9ovjzfsmFY0YEiwpHRMwwMyaK+jqTYEpFeFpVRLTW9fnpWZiLZKj6UgoTSaFao9yjmau7E0PgBK9CLoTKPz2vYn5Z69NS11Kelvr8tH55Xp/WuggXoaXIUgXEnYpSQbDjiOBS1iGVmNmLycJm/vbeoinTrfUft75t++/fb68/3kuRt3etpbTWt9umamZNdSdCXZ6XepG4XGH3KE4aujaDBsIMoUwrC6Ttp2XpAyPbR6F0ijlw92GVjTptQTLm1nWHg0eMnYDATqBFuBa+VLks5WldLksNh4AwcwIpvxdMOVWBZyapaGq99/229d7ffrx9+/qtt/799frj9d3Utq69K0a1TBGqi0hEky05pyKcQVMjB5hGF1J22NhQKaSGP8enSPrseJBKFBE6HHpWxd2hgFEsJVc31WiyTBjDOYngHMmQ8xi1U9InHV4Ybdqlx2710WAiPwryKBcQ1laENhjUPMLaDHCn8L8gaU43oMPUoUEAm1MQb2dRnFBpyvxpfU32OlZRGm4guNtx83cjNDZfCIPTXz2ovvBDqtlwZmLILwBDoc7/DUDEeiiZA2oGTQvAmZLt9qS9zY/ygONIa4zgGpS1auvMZCGYAATDHSbqyBY57vnhmJaZPxRmPj0/HavrQSjl2PAoxMixafmwv4juNov7+AiTMNdSl8WWUXycj9Jxw8edkRRpOjk8YGsaWkw0unKCiDM7PVenqu6tR4X/bgal3hWOKMynY4ij8XSsBEpP1/RPJZ9oQ5xPUi4lDEYAz3l+PhvkeHMawxH3Fvj/POaTKQh7DVnybrgLg9DOwc3w3WlY3Yukz4/xMOkiVm0t/u/73tVsb9rViKDOTGROmfxFJGoQJkNE7R0waK4GP/12mu4cNB+/fHabn1hw9bIuzxfUIuvi5r6rN7Ou7Xbtt0Z7f+bCyxoZYAhfQ4QqTGSefCYyzYVk21o0MCLwUgvDxbPg1nXfmtrttt96U7XdvDlUzW47t/SFpQ0U9XncRYCo1m2hA1tTM0dzNwcXKjNIJOM6EsOdUmQjpBm9Kwh1r9v
eHCil1CXTweE28rXujtPmgAMuTmoReBTSs6vuXd2s967JK/l5oQQTQcDYrtSLRo1rNZci0RqAmKeR1SbbHaLXXc3UHED4+zCgWGNtEeQ5QnUHve3hvBu7Zeirxy71PtvQhepPUT3q7kTRuVkYiz8MkYewJmaJCEfKjBwhFhDB1c3VQ9+Yu6NIYSq1LIUW/dmK8POlVOGnp4uUyhyYMlMhLcGhYnjcQkBaZRFnjkafiCa6DC+Rseb++vb2T7/9aE1fr7etqSrIW5Fw/alF6eCoY0ACkrDFgvAJX5oDpt2V1LyFKxMZ/D8q5cJNnaCmvfeQdngc3lRdCO7HkS7XXB+HlZVJgYAwlwJ3MLsYM9Gy1KXW6AAYIjwlqPskf3AoXzr9Q34fXrje+3bbW2uvb9dvP972vX/78f7t9d3MWzc1I6JaAqhQNy3CtYoDIlRKlCoIKIOprU5CfLqmfYJzNfcsrRd5H4+C+6NU4rLUui5UioRPmptRU6emZtuOrpcklkMqUVPdWw+oGlQUhCgZMWIQiPe9JQuvVkSean1ZKkD7rd22vavte9+7mlkz74CqN+8nhpQI4GhgFd7q4Rfoare97607KNlOMhcfzYmHtqPJPk65bU5QVRBa621XgImlZhZwiKSDQZnTeVC3RARY0qrJc0XoWXD4rfekt2dyvQNp+sbGtXDemkkEBJtD1Ji5iMXeCo0SdHWoNR3oKQ4dLhVVcwcTNe4plUa2cECkPjwp58fx8/fESsc7kso9BNNAQkMqffQGTAaYs9VKIB2wEAsRIcqopEfHHEBk8gL0tDzDWdirgAnruhYZIinSDKcMpcwESrcGUAqbOUuYGwDInQgm2TXYr9fb12/fovqCqhuBvSu7mfVu7s4EoShawIQIzD5x0JG0re5A77q1PtyUqZuj3kO2vbToWDfjVI/DsxipE0euD/FQEsOsOI8leTTFjNa1FqFRvNSy1DLakmYy2bHCTxDtzGzToH9GpJxHYlUU7bletx9vt31v399u315vY7/6SP3lIuzkVdjcmVmMHZgFBuL0sTEGgh9wcoD6iBuIp1Bz0+jh/riCPkRRpmlB4ADKIAKDRuUxZyAaVgAMEoCimX2g6KleJy6J8TZ1kPWubWsmyupFnYBt29ve1ByOIqLBp0y87J4GQZ4uiiVEYgY8vH/B2w1yZUwlMbGRRVbb5IqmlCMfMTMDbnc1UpVu2sOCOnb+4xB9PDJEe6YQ3B0+kf+wVA0UgdpkSZ6aO5k5s5jFQkzEPsy+4ZX1e/sNs0vAtOYMGQfkOYHTpMAESI+PdCJB6f5L/jgl+5B26Wm6p74xp23SKpzzQlkm3EGnsgNTaeTZ0ta1dC6miM+w4bHXJkWHEe1yyhd0JENMuSyyJxKIYJn6Y6re1cHoU5BEbBGPEM/0KsMsajQEzUNzX/WoMxVjTAAwak15XnKsm0+ok+H6jGcA3Py8nenhY9PpBhAz3O7s2RjxRGBmPNy7cZlhV4W8Gp2+fQ4XnS3OEKFqGagdIsncI3NLyYlc1Zk8el9R5npySO8YCg/+IwdiCqMZf5CL9VjPn1maH6USQciFEpoGxc4JM0VdnJayggPTcozr1jrIwVGMhogFxDDXW/NurmZ7905t69v7zoSF+I2FgGvbr20nkeWnn3768kXN+P0aoTfhLWLmKK4aVePhMCKj4u5K3mHq1My7zjBYoEBYRArIRuGEXCCUysjI3D26CsLdW9PrddtbmjiR7USMbX+sRTkl7VwuIAIzfFTkZGHJnhUYkU1Duo3lPYoFOBE7xY5V5vDliBoxa7GzcaSa2yAiewIZmauHtZu4YzDXw68dx5z3CH07hBNSHp3B0UlODG4lUo9nIwAZ3mcRRNb6/c7z6ILUsVM3s+h4IMyq1kyR7Xi7O5iFM69diNjN99a1KxNUwITb3ra9RZa/GoEJ6j77SsJoZt6TZ912dzdQeA/Dyw+rwsLU2vb6+kPNu7I6CXFnm02PYp8ykTt1RWt
mSi7W2YfFTea+qanZvre326aqEaMAZNQggOA/o3/kTIh9GB8zNzUwRblROJxHWD1GiOmUJqMA02mGqNYSMMnhOro0MrObEnmY7jSg0SCiCWdrPcbOGRTFya2pba1ve9+abk0tSBIPoprEXN1pR1dWB3EXYTXxSI4rUgyD9HJkbQW4ex8hehGZ0tV6N3Nvql0jeuZflkpwJmcEe55xB0FVurM7AbXUCGY1Yge23sMbQ8JUCohICligpru6mxl6M2d0992MgN2xO5Fj037TJrWsX36+XC5do0IrCNr2nmKRhSJ/ITrWEhlFhhIZSJ3UoaEBKKc1d81wI/pwaSRRADZymA8PKsU649FBJz5MjN77nYtqCKa7H6baSvrRhuV6UOwHXBow0A53S7yF3N2IATXJRCEezi5Ed0abdFJahXavdk4BTKHaw3w+ME8a+Cee8ePsj3V8PNYUTyOXc4yQsLs/JDF5Uv5GFA1m3OHhEzMzszaJewDMZSSJCIFDW3fVDK9hRJp469rNzKMoFlyNIkJhwPoRwmaDUiEEJNNu5uQeHTu19+126wZFMYjAiCEUmbQlfY4OcjJD1LlwNyULR7gQFOjmXW1Xve1NdSrDUdgBg4MiVBnB1Q9SO3OSgIGRKAgDyjyeQTdN5J2zMAFVJOVK1B0JkKOmqto7wVWImZ0gAYc4y21g8E6xaEc+C2FMmZq1bk2tq7XMN4NH8d8oHdwtoiCIKSopp2HO41wUUGVIXoe7j8Dh0KM+Si27amKuj9bIh9huc9WI7jbtBnNWI3MgugxWUqC5w1Vtt67u27633tUdRaJRecQzRJPy6PAQuQdwp+ytAzaCew+7W713bdE+oY+7dndzCsKf2YmHL4RDozlxzH94IzDUPGhA2hPpF61icsOFry2KOIhQ1p/PUI/8bNKbn3ihxtYevw3jKdflCWVg3A+GCLsLv5wlvOYPcHMnc2OKoLWxjJOJyFub1MGUd3knGAbfuDfKCwyX4R2ZmnJoGFgYxEByDymTeFhudKDN3C751vvBidAhdXehLGJhbqowN/PMXmMWEBykZuOibmrRo4oJRg5DU71tOzHWRa7bWnqADzBTRS1UnBEkRyZsabiknYDsr5ulBUCjHlBXv3XtRoXZZakszFwlFUthyYTOkEqmREpExVyZu1mLXnhRNysp64nSYzgsgwZh7NEhwu9HaKSwzjmwCDeMdEOKbDEaQZbT1DoY0aSxLLDG3jpx224b3LUUd2NmIdKIXuasUpJCIyOfaPKSp5U5l/OHNQ8PT5a5UxDVag4wk6jyKFo+DHwPZ9QJK2FipWxI4UgL8SFiDsCn9ZVut11q0W7aFI7aIApEJjqqtr7/uGnv1719f3tvvb/39tp2I1pqrVKImUohKQB1ohZSyShKnVjvMBdDUwdc3RXGbrfrhtd3M79F+1Qz7wnVK1cRcfPeGXASoSjLKGqmLuBS5byzibrqTMYBYB7kZqRQEULvg1l4KQszS611WUYj3wQ0QW9+lEoZBY4MELcpRXMzM7GwFCclFmIjMxAnO5tUQqCjCLWdjuGpzJzcEC69edEJkUaY7XBOD7g0vk72aiKzQ8uO9TfflPd8gKRJ8px6cIckIE61yJys9dgvD4t3b+39dqtRYEQY5nvrTGRQsw54rXVZFyL07ntTZEYhhn9Ag59kwvv19rev39Z36X2HeykinEVgv/z08uTEwuQoAu3Q3Xo3YpiCiEx7YCWYFyIh0tZv19u269f39r71tdRfnl6WUquUy2LC7EsRYge1Zq0Zkbs380aEiFBQs601Nd/2dt2z+rnPnkfRYgDGZAC4KZPftk1PhQM9LVzvmpWCCR4FIyYmIkrFS4NSHZJvxJ4CTdOP9/Z+66rb1lQ9IirWtQpzKVxFiMBSiIUIFMFMYJICkoAtQ9sFwYokajE2wFgiNtZrU1MnhxKRMKmZuTKRiJTCGFWaArXHeuzmIYjDIa3qLYo+m3XVvan+ixacmWdPwqbajRy
sAUiplEqrkNNOe/i/r7dtb+1m2qwbUXGfqxbMYB6hmNHsDx7aLPz53Y9dT9aayt7MXdvY5YG1hjl29CBNHsfBHLFJEGaXePRYH2nTIGDI1AnOoX8oqQhmzkZGUTos445z5t0PGHLadRhgxCe6OfTL8FWPRXXHf/vASpPoGZPuHkkxWU/UCdDoTDEw2HBXpQttPpGPAJAzb3W+15OOfTQlMG7mjlqdrAZNA4RGjAcNNuJM6j9acN2stU6z1A4QsaQx8YAXIIYavZ38iYnTw9uuBjD13m+3m6qsS3l/WmspQllIYLmsixqcTNwoMtuhGiSDA5l2GG0c4tYjTXpv/f16e7u1XvrKFQYvXkhcRIQTqxpUncjV1LwDYGciUvO9J1ZqpqoDgGa+mhGBYdE3x6CAfYKVgGB/Y/SD/UgLDsPup+isEBzGNPYTVztcw/ogtKZE5IYiN+2lFoFpeM08WgOIihQQsRhHZzQnkjBfcsH4oaswoYvfT687jFwdbuAEPsFbIGrLJLLL1EkMwTTjDb2b+anXXphysQAe1uXHSiaAMpRH2CIcHHupwwE04g3UiG6gzbE7NkczOHnrxnsnYTZAzKJ9WD5kwr9YqeSuYYTENBLtqth395x1BGPq6KZ7axIujwExMjSV0udcrIZ3NfZoDH3YalF+gimdRZT1rYhGH9XxztAVPgDDNOo/sALpIbIUWO7Z5sFSDg4zccgnoqnqApOMKTi+DT4h0Y1FIG+2thhvO4zEg8/KzP1hXtHozHFaToMmuhMiGXl4XnSDuJ9k1DRC+WSK0pjHMDhOa3eOjntr7bbdzMqyFA6mAVmrWwqY2AFVA1HX3LRZNSidNUCktZvvvb9drTSuRZ7WtRQxVVdlltvWXl+v0QKzlNJa+/HjR2t7qhyiy1qeL5WZtAuc4S5MtZRu0SPAiLmr7mhw7NREjZlaLe7eu/auRN5N1RSIypQwR7Ngam0EWdCdXDY3V7gSUNj5zo9w2t7u6s5TJCEVZrAUwUEEVZtdyRhsp/USbDK5ur/T3rqW0ruaiFSRZYmi6byUQpwNBCOpMxRwWTpL9TGDPWsu29QiZ2EQv4bKDF4P8Ag1YhApqIMzUs8neeEjfeIslYLWDpzoDjXtf9Am54NUMkJndEYHeohPMbCTRcO0neSVeAe/On647+a7+q7uBN+alVtgJWZWtb33lrgCCAPOoohUcr/Z4hzQfb9FLaTk7tPA8NZwu7HIsMTp8LoyS60cvVYDS5v52VcdGyoYc49vOWojjoZJSvTQyvWS1GlIFKaTF2zOUz7FgCuW7cx9JHGEYOLhKIhNzpQiJtsdngirtIMiF8rcyeKvdwXDff4Xv1I+VnS/TifggPingwZdejBAPugpuJvzQVtg0G1pwck5iDhF0jArfa7aezjp7tfb7dsPin5ZQSS5dndbL8uXL08k4k6tKxz73ratpVQaDgkk9DNy79t+2xqT92gCJnJ9e7++35jw/Pz8dFlFZF0vtdbb7fbbb7/dbtuc+X/37/7uf/qP/2ZdKlllWwCvtTxdVmdeblqNyLFHemHp1q2wuJsIa5FtL7e9EHnT1nV3WBTyyIoERKrWNAIdUu8M4GrammljwtMiVXja0ccOg3e3bk6UBR4taihk5DYxYBZBbQNvp1KNRWOREwQnItz2xiNNlyji4wszVeGlSPD0RQozLUsptYjI08tLXRZi5lKI6bZt4XxWt+wLNuTR/D8KpTo5yC1sOSImUnN1C2tO+NBnc2HYDAtwRNRpFJILaRDh4/8NPjgnisRcm7FWyZApkYE6UQca0EHN0dw7POpyq7l2JXZiN+bMvUhkF7tgSNAphYdN5lEk6L7mavhij7setLENviRCZjhBgpulwTY/jyPoau66IXECJXFmeN8bMoM4f9CEGLce+8Z8jPtx14GV5mnGbUyZQDmiTvOafuzGGd6WCH/eyiSrfYxXgjo6Lkc4IBBOtzHwWrzHk089w8JxY3Q6MPAehmExBgB
nZPcRK6lqa40IURDH3aInWlEZp4r6hLFAbWKlscEpVU92hGoE27Z925uwvr9vrz/eiKh327YmLJdLr7Ver9fffv9+u95imJjp5WXdW2fmAol2VTwq4ab7ylybuaOrKiscUfWBCJkqRJi9OZv2bkZMJAVRpMXcZoLIWHVB66qqMJmJ8ydYCckM5GyOiQdFjHdYbambYhWGNQfMpT3sdQCkmV4WmkeYi3QmqsJ7FSYqIqUIM/Ve61KkFCrFAWIpcBI2y3YAgw6IGzrPbJgoHgQTkZOTWjpBWUHk7uyI0AA/SyV313DJAdEEJRnunP1Jht4dHyqZxJYFW8ISaDih1fbWtfW99U11N2tuRuSRFREuB3dVI8sEfhvlNnI7UBTbrTgxshIhTilsyRGFmXyq91hDw8UGABFAAyCIFqJET5QMyaBbAjycEpqPqSPKwv0TVWFGfvGQOMbM/oHuPthlSxtTR1r/THg97n/u8LHXkNngmLc1RcXc1SFveECHlGDHhk2RkJMeJiXS6f9xgseszkWdF4i38pD4ObbE2UZqUHlZO4xPCtDdLbMEP71imHhmvvcurYUjk8L86epAlEOAQ83DJIwxnBYvYAQFGUMFAKib33Zlsh9vt69f3wC8v7d12YhIpArz3trr62vbGygbOP94vX7//rZf2kK9km633V1L4cX5si4N7N3UdnSb2kdNt23rKs9tCWCURXqybI67wq07aKZNAOak6UCJdg9RcstJ3btBPwhuQxaeHZoS7ogGyWwYkChGwzO/LZQpxr4JS8NwklNzpkmIQCRMZaCnSEdZFqlFSikvm66XpZSyXhYpsm3ttu299b1pN+shR5LsOshJDE4r6xmQWSwJEBGJu/rRgMzHPfpk0IdXLiJjMYqOfhYY8BErgTnaoI+Sddqz9MVt36Oj7HvvTfvmrkwm7G5hIQWbOHejuXcdidRAsDpS5NDIY/UDWbvYxzgPo2ckeg5hghN97CMkLL3okbmbNJvlKE4D5pARmCJvtFKmsVlnJ6JoCzNMsodVFStyCiPNUiaqFv64MY2UBpGDonpSEKJhf6XBkgsq/1HWpYp6tANjnWVqwr0DzPlYq0MWj9PdnToVeXqkfbqFLcp1javwSA9hCefy8cMcKEvhDfyRVPI0Ura9ARDmpYoEVdy6msWcAmTRdtOh6q0rhlKEG7w5rDCWAmZu3d9vjRy/fX3/61+/uflSl1JKAJwwRiOligQizEIvXy6//vbtaa1P5empPN325tbXyk7l+Zm9Wt/ade/aFcheAE27XbsIv7ysajlL5uRGZuiGyHCymTZxoEWqS621JM/ogHl4mfsj2Z1US/jgYg2wgzjFUEyt8d2CPaTSULgZJ+0YqjDL2I6pnuh86F9QLVyES5Wff7pe1nVZypcvz3Uprett76oeZW66mUZJh0HzTZhNDjMQgS2+QzI+D8wsbLmEQrHkyhz/O45zmt8ZHP8yrzSW86EYR9yb5v8eXJ1P8yGXUmrg80nycebfhwyKlQ8CpyUFIKnbGHj65JgXOVlI8X56eGEYRANdhHTAFE95V0NFTjPldPVj/h8G5uzSO9I/xuvjPff38nh3p9+H/YQPRVI9dNNhng2hzMdSPcjShErHb8e3YV+4G3k0GBuDQMRH+Q0AGAXaxlXGuJxuOeDNkZmBD0calRR7h4a5DcDcyKalOUqDDPbhpJVsKNo8v7mrOhy9675nrnGmU/WZSeVAkB/GTq3p3hozFfQFPTTHqA3EYuSiTKR0hGSFfYGhk4hnzCHmzJqNZK6o0T6gsc/HHJsiscaH4Znj5p4zbECUPsnyByMHhfKVURMbQ8/4rM48isR79FgehOEx96nYGFDjIlzMlqUFN7Kszcm7HpGNNj9Ox+TmGPgoizweIcwj8niGLFQCm9bm8XEHnXZKXmL++nEFfYgMUG2t7W1vu7bW3b21U5vD1ntXcyMCMy3LoqJSRLp4JOyxYGyY0PfZO4sZIzqYhj6Oxc+D1hl
OrfjtEEMHSKJhB53Mh7juVNrxAw17Ls2gIZU46xLmwUxSZJCFh8SiaE8YOvdRpmSgkGV94MiBTiwa6/UQ1sxRaYcoyuE5PNofHzDm+EoDYCFvmE7f+TSGSSveP8sJuAxZNJXVyEca8A9kOkCT+0FgpR0CQsRuUwTW5yDw8AjBfHYTeLRxiajWerlcRGRd11qLjL5jTthbD/wlUgijUH3kjpsRRtQBKHSVUzjjsHe7bg3mW7Mezn4pXFdmunAJ08mzhYa5K8jV6fV9a01pJVl5azqL8BRBdWYTfVqKcJW6Lqswm6r1DsK+7z9+/BDhepG6LGbWHa4d5GoUPoJhophaJ4CF18tCgDC0FDiYEJEtDwrHI0wvAlcICJcrgwZrE6A6GFEeepOHxs5dYqlsJiU0oxZ9IBGbKwAAUTFjptKNZNu7La0707IUG26yphoOjfBvMDlsBtsk+AotOov6Gk1KIoRskDAPKxtDm+P+L7hbOqfjY7yStb212rat7Xtzi2rHauYZwj0QF4vUpYqJqUmRCTEwJAoQCXFRq7QMeZTSIRoK8gjLPpNen4rPw/waUmnSODZCHjwNfZ+dPWLljGT34wbyEXhmdaURHrNKGRVWusiDG85HCJyNemxmWQdZjyC0NFiJGFHjh5kcHmkuhLPH/2FiJvQMgUgpypEpNIOvTXHFwwige2tqCKf4fbp9bZSgNBOfVv1cu3dSkFMqsgRTkU1CgyOKih1HDP3dNJW6rJenUmRZl3ADRZ0N1b733d1FJBKTTDN3L+qbB5sW0zwqc0TvPrSusN0NW9MejTqllmWVIs/Pz8uyuGdNq97bvt/MrTv/eLttwqxcXfau2ju5MagIL8SKgqdFi1Spa12YuO9ttyiws33/0UuRX5efa72YW3c4mMh6JCsh15ZaizxVEb6sCxGJsHYNEOdqTo+1TN2hHuXeR1gkEWXdxnQrcPrjfMJiTuJ7qO8DKw0LLvdCbtCJoXxYYXESEVNQ3XVdRAlLLUTho6Zdw88+7DHPFM2Y2NPtHws36rqdVrHziPiLD034nvgIA9Kf1OfH47EfXG6zUUw7sq3yx1NAw7HDg59x9sMCG8bFAEUzhWoaY0fS87Dp6A7NjVs+LfiJlSabcoZIdnKjD9Jl3stBZB2Sbdzm5Jwm3/vHb5+DNHHaCY2Pux2TGOtrgrxYYzhrTbqflgnTMFik+xuZTMMgnwfMPJ5zFp6dAQIOTPzvPupfOZFHJCqZ5Y2Mpx+74IM34PH4+Mr5j3QM1bQBh108ZdnQn1nAFadZGD+ms3J6l/2EfklmSl62+GF3diYRjth4gzLm0iVCpLOxM4OdnZmdR0V7gJhEwm0W3XbDLqOxpijRwsFvzIE4VjUzGxuMiNxHhaaH5ZPr5CANxlmS5Du9co84DrN8bO15Jx+taT/EhccsGJzS/DQ1VjUVI8qwquNhaTztqUzmOGVApQM93S8Fevg+HoDSiXd+7eGdp+NOKrmj93693UAUgWRm3sNqi/y4cEOmzUNc2N1VlTsfWOm8z0976SBQgthgCsUyurBPhDq2+NkaGbzKMJMnf+t+X8wMALsb0zGX9ChqMLDSlHM58EREYCkAScScyaMF58gQOPNTccgw5Sa1Q+PZmaNuOItgcuonJXmHlQYjEfclGTc0k2LjZjBKM6dRd2fCjSU7beHESmREGcnFHFiJ457JZqq759ylC44ynPJUCPIOsFI8hD8sK3eo6t6aGgPeVaqIXNZM7JVC7CDq0SCeWMJLTa5RPGHUWZMSitooygA49+5mcCIuwsxlrctlYWEUMjKHG5u7o5BAHMyVIeLBsu9d3S/r+ne/0qbuV+PmnbvvLQJ0Wt8AWkr9+eefiKj3W+83ZKpbkLMEsJtF0wGPbCjAgSKFhZdaahWAeu8pIKQQE0n9QCwmps55GvKIRswacNQ49dNHDrhyvyB9tFd2p6ykG5BgmA5DeqZ2c4I51L2poSuxR9U5jykBlSLlWNI5r1PRuR9
MbKZ9DBwSVMPJ2hyWPobSAcDwoMrHisOH45M8uG3biEkzLtt715EvY2Y2lQKQ2LT3HlqFBv1Oo7ToSUOmLEhbl5NXZeFSBIfRd7Y+7oyDefd0vw0CJakqhk2Hgd0wegfMk5+HwAenfj4bUdpHMo7HQMpZdif8FGnDpZN2ChgiJhpjBTCnVEq/5p1Uik9MPzEhwj8laaQs5MgiRQhZvxjDLL2fvZNMmio06rnHmlNyNncntaxzeaT8jvYXMVApiYKJ46EWTxb6WFR4vAPvo3cuuamy13pZlzgnU4mL9q4Aai1cCkCgbHETLDlzNC/wbPwYmfsWCQEUVndZS73U8J3ZwIEOh0C4AM6VweJM3dB6d9C6Lr+s66a2YzfuO2EvbEaRTgzD02X98tMXZn790bdNgdESdqoSR2/aWh8YkKRwVIKsIrUIgJ2zajWxAEJSPio2z2IzuRJS6E0JP+S+n5fJ3NunVeODUPcEwO4IoeDkWXiAhw2Su5HJRwXqKBPMHvlEWQyAssCMTGvguOxAVHS6xwPdnrZ+IPJ8h59iIMb6GQ90+H/Px8culZMcPz39+YPDHsNYlCzMxvdSKdcXHk2AmfuTwpYmYOTxzmFP3JU1GiAifz5tBh424ERPCF/PqAUxq7t9IpIGap2fnKIwTbRP03PT+jjA8T0mHU+ReMaJmDjbVDiPKuX3unBS+CdgxwOazB9o+gsTXp8HBXe6d16CQvHOEcig0rHcjzPwAReHXp0PRJhuSjpdkAbEOk1T3hdhlhOb7/E5CfMqx0id18vxdbzTD5PlMIqjngTIk9CjzDKMgHJz0uyF6GbuFGKReCRrCpMIF+HuYLKoAxgpSSwJSZGqDj6YmxP+Hs6HhNTkGbsczUOjpxZ95vj+cIwtcqISxtyMCTim0k9ufx9tMnKQAoKk8xmY3tI5p0hQwWMJne4hV1uU/AjhNaXSICbGD37cctbiGJN7r+jjZuYqjy6oIJ8evU/B0keplKVafFilIYXcXSSt5xKFkeey6kQc+3xq77nnKNj5QQ8SWVgIxOH0GjVoImjvGIBo03bM58lSmPb8GIllWeJz2QPS0ynmdOzSB5E0pM8QPUTdQSCRLCUfKj0Kgt+NT4YIYqbNpPPMQ004kIwNs7O4g4idwIe4x9jLJ7k/pPNYIbF0MMij5N94AtX82z1+9Nmm1ccy9flXGq/HIiVO1MbpR3Y7ro0pFjHiTTEX/pzfoT7uFxWRiNSlElFEX1lW/NIhbog4K0dNjQIM3l5S2Yv4KLMfOmQMHgWSpLJwXQXw3lVNiShQZe/W+uZmRIW4FubF0SKpV6SWYrCl9EWJXfRp6VXa3m9wM1sq18rC/HRZ4E/xxPu2OdA1KrpqbHEWLnUl5lJlWUqkCUSLx9v79f26AezUQeV228weNOy024kwQmR5Qg4Ao+7wad8G2z2ZZB9Ii6Ij7VxU8/sUG2NipnIrozyWpH81ptqZUQq5p8HwQFeNdQIcu+q0IlJoHpee7KEdK9/ciUPXDzwlD55kAJ9IJSRTMh+LCMxkRrGUWESKzCCjuImoyTFUXmo2RPGOGLssl5D20GRsD+p2OpQwKMZT1t5Z20wQcKhdCk3lIpJmZrjHBjX5ESUNW4/co5LGlPeHWReGhj8uqSnM5oSddBtNxBH1coQjcagM29V9zO4JJQ2ldZJKx3OlfMr6IakYQrIPWUtT1pwWCOY/okz+RGYFjEKYDoRwoiOWYsz6dNFP3XeGSDERH5UcADCLSEno4O4ONZPITxgx+uniGKCbeQTEMiFSzdizW0MUSMq1HTog4yPKwmYGMzNlcFBxUFftqsoMETb2Bu5kDAZR9IMqQoWZil/W2oUZ0NZUIYWLsAjXpZqtMYDBE3WHe9IFcf+lVhGpVZa1EBNR6y1K2+/bFlLJQVFS9Q4szez82MZ02mipb5D49DCOcJqFAy0R/Ei05uHjmLHDwVTzOM/IsSIRHq6C6USJiYOA3GOcJgQ9OIEzSTEshdO
/8UNC1rnM3d0pE1Tc3WA8Vs/Abw9L6EM3gagBXwTOCY4txR4zW/bbKpQFsXNJs/CA/2e8fTgOw5RxD74HM3BprnD36UDK38/zeGKcJlbykC9xY/H7KeVjgO6P9tfJTMOY2pjM+dfz10/g99lWO36ms3kSa4UtdBAsqsb7sLGHmYjj036emRA6h20zx2pMoR/XP/0+7256Z+7v93TPNDF/wun52mFX3X1qorLzt48H5aaleFx4ergiKJGCs50rEuMejrFLGSvCRICZM+DZTjkqtmeIAs7phyGXyZHZpW6uaq2rsXViFTF3qKKRmsGMYSDPXt2FdS2mVgTmDcoEK5H/FIUWHWxugAgvaxFlKbXWEdQV1mpWCXciknRukOOhuO3jYNEcssMiAp1267CGj7NMOy1Fl92f7Tg5zSUZZzjCxXksqtMn4n2Rq+0jug5+iBgA8FOY9IHICKct5LlBj4ISU6cNbuCY90mkPByPUqmU8vT09PT8ROBhd0RwvWfk3dgbloZeliuK0Uqp5CkpzTByZ2iIU4cP6E5EhJGIarAJ7M7P/firu5udIh6SkaWPFpy5G+5I3PjxLJUSj2RRVYybT5GnnxUS9OlDmWYSjfFlhs9Oyg4Kv9C44YRJeZX5QLh77PzhLgHqWE1z4wKjFM9nw+RTMXz4O07SNG3PkzS6/zplIsZGOSHicZ37RUUkwiVqO0IAZ6LotMRO7kxEs2NwuINAM+6KwABBRJalirD1riA3MwGxuoPEWZzFDdo0iutQOBNMQYB2aPfeYdr3vQnT8oyLlMzzxhZpuBXmBKnwwlbry5O4uxla+wGgEIfbMFC9wclM3SrJc6lMBMo2Um4jMSvSjdwLl+eVHVl19fohDncom0PX8KjMPcTF8YbB/+QP/jDmDuKp4u5WaqrG02ePclkpnxjDUgmvWZSEg4PczXlyyyctPfX0veGG+Q7Y/OGOJgFZGJ3u5DTths+6UeBRKhGYuda61IXAUZ1omJejPHgWOnAycriZMR3d18ZaHRcN08FjRfpY26cjTSp45BzcEyUniHSCkCc4dIABAj7EVRoyIY7orqPJ4xLJDTEv51Ny3aGqccxrTsEWBD4IMaspndyzu7lnxp77SZjiBHhP5xujdBIBTEjThu5kxulmHu7vjJzOuu3+zWM50YzYPUHpsxzHScPNneTj2T9oOsrGcQcU8FEviQAm8hGhmSbzSYvG2ZhJShERArmqZYoSslc2OzjMKTtw1nDCmcF0xChBmWlftJkzISuywgEI4AThUROGxIHbtr+/b+5elrWWZZjkzNHM20mE18sSTd7jJnq31jw2QpCxTMyFHYhGcML0YYRiVMd2HKBoYqQUhlNlni1pn4MFhPvEpuw4lbEZog0B1jil0jjr+dTDgAqs5PDozjvZ3bmMJv3opyV4qKcQP6DRsA+TljL4CF6nEBsHwJv78u64k0qUUdfhhGaAj1M7QNMdkdclImYyB2eU+Ti9Id0l59IaCUUwvw0i4+Dj554876xJEJ90wjFWIETRiUMYudvoWHvGRGf54oNISk537K8JBOIH/gR/Bz6agPuAqT43bkji8DemYHM/DM8xADkG4/cTt4VDKk1Jfb6TcfUpGo5BHd8mZPpUcp3u+wg6+nT3fHz4+xN89h4K5c8jXD5uhYk+pMr4GKIArPFpmJp2BaC9995dVW30Wc4YLkLWkPYoyuYGN4VBuwLEJBQJb0RSwjlDPvxpICCaewyOOaJuRLgUDlGSrgUpzEXdVXc3sIQPws1hqj4y5mJSmQWD8wkR7z6D1O+HiCZkOiTI/dcQTfeGPM7YeAhy9nHNu502z3womEMAHULw/In4U+y+MR3nWR3b9EMRr2NpZBzAXbxwLOkgFB3OHNzmUImfrbrHjt6RvnRZLyOtMteKR9ndqB3XGyIanYkiJUgmInOcgtBlFK8Ll1ga37ke/QA5DxvqM6NpbPC8z2GhHAmyfuKVJp002RofIUXjOo5w5pTUJTK
nH0iQy6xS7gMV48Ocxd/nvZPDwRgFBD0vMIPPfcDM8fCe+3E88wR+ExhOhPKwos4jdljoyDmaACxPNan1iZim8wbps03t66eVRBicxrTeThe+x2ofZTZTFJ3gUmr0QYmDCRzDPkjFnKvjGcLTDXOnRqyirfVtM1VYtEA1EZSSnjtVg8O6ubmp9y261xKBhaUsVFcRprqukALAeiS2ODiMx0zribJ/DpiJWTX3mq2LZV3Xuly6GXai3jI/isyj7YV57966waPZRpmbc2qFpT4uoSl3MlI1HaxEBJnVv0aKFJ/mYeCjuyk4a+sxjjQm0U8oCycRmELLT+biUIlj3c21eSzS2Xv8tOjmQ3nKYURlqMQOM/XTR1OXqOs7sA7os0zTT+orUfgMc4VHtTyHO2TcDQ24QIRhF9J5w8+Z8WOWkLuAHtexz90xQcTxNx8jMzbXxFKnt06RNItB3kt5Orb7af7m5+fU8NiBEyU9ZPN+OFIpueMIYj3bLYgnxpinlAkpkSkN2LjHHMDhDj/BasxfP17943GIpTvb917wn+8/Ve2Ro4uTMTUv88kN0N3FjpeHxcEc7RvCdRXMnZ2Vd97kWVWko8ZUDRjcpVlUQo2TR1wnxqqI/F5V672bekTmEpGwRKNrEQn9MC6WaygEKDNFWX8HRKI9gYeU4JEOSWaiIm7IcNTQhiMNy9wdEXB77P9xPZny5OPkDRKbxqBNIXIPnA7lNObmccCB2Kr3fth52rkox2KaC/1ECxyrLn4fu+Z4fQilQ1EdczgNBcwed6kzp3k+FOyd8/bhqnF8UslkLsgASVE+0txHWb7I8JzO9LG1iWwkzJtnSbZZKXzAnbvL0MehGNel089+/iGrs6VvdWxvAEi1MhKX755kTOUw7FJiYsDViTomDnED2Gw2PPnkoNOG/OQx6BQIOp0Bce902O0n9yKldz9MDDqf6G5sDlzhj3+Y+9snlpwSfXw5MNkJfOYsjdXkD1f9/DhG+e6xmbhkhd1Y9XlNDt8rAPgM4fEMqU2gyiLgqN0qzEJeqC5u6qroHXCRZVkqEclSRQoAIcDgBYtY9KdkEgBSSWqGnQRQD/cxCCjpG4ugOSdyJgeVQivEHYWiV49IfIczC7OCnMhAxAwRSa4vHPBSuAhOmP7If/4ALE6wHENoTER0kkXjXYchfxYboCGZc9aSBpmzMkTQlJV3+PfQDYe0mopxXuM813QK4XxQ7DSX1fhx7DHcXSSlAWU5VPdPF9pHqUTn3Qz4yG001R4lqlW7muWSQ+LMoYnih6yYkZzj1PtjWI8ZGWOTRteJdZmSMV8Zu/ewSwJFTTWALF99DBfNn49l4UmuE0aK9giOndVj8j6y8OCnUul+Qx5WzvmmKepq0phCP4TCEAeHUDgeaRQkwpSl85H8WDF+jn2fgn8Oy5BCg9M5Lhf4widsuAOOac/dCds7JTGf7xTFcXcQSJirFMnSWccCZ6YiTITee9fuI5TEASEKH3tZKg8yiJmdyYKmbnuHw31Z6rJUImh0zgXJIgyGE0PGKgEAJ3M2wDkHwlmylwRXJuG5P52gsXykygI4SeSqEEmpzOKAiBQUdwcUMGapRdxRCi/hOAxHcBTnz/6cWaPhg1CaG2B8HTIkkeDYF1Ntj6CjqfyOBXfSKse/mMXTJstvU/pNKRiL7DTFUy/fz/j8lnLvwYRITHXAqLFM6SSy4s7TbPQD0HxYRH9U9W1cLC+ZJWGPwlDD7vig0QdjEjc2KaETO3F86h7J343F8eh+ktJnaDxRkgeySN/8eXSHgPNpYM7zzTnJTXeW/J7ABaA52f/scYCm+8vHvvuETL4Hgz5NW89I/PO7fZ7/MOlPMnZIpHHfD3LmTnYkXDo/6sNZ/thaffzDP4OmaNaOm5pofJ1GyWRDMLZaHJxJxzOQnSJ410esu4jUwDvw2CVMEi3rBJIZqQ7AFWbeAQ8HYOQfDcIwWs+PBz+BiCgPxk7Raum0oYloFl+LYm1EBAf
DZRI0ONXzmfPxBwtogqFjdCa8GW+h4+YwEf35Y7nQcrnmWpmyYF4EdLIR50sPE/pHt5n77HiFHv56aCsaavPuA/M3+vQ6HxfSZ1LJJ1Pj7j6qmniUotRR5+QEaoZOt3h5tFcKXnM2P/pnnn7qUxqiePx2QiCDghk1nkNUEp0n7O6IUKGINTE7YquJRuwGjchpeKR+HkOeO+ITUmDCtwOS3oOJ+QuPiOsUTbEVo+jMWN4nBnGM5VlPjddDVN69+w7FHVx6IqXcDz6A0xTlGKrjUR/e7YgY1DkNea+ntw4D8jO45AxnnJtuE7LjzByik5kATGkRGM7M0DsxBZ1EEVRZK8GLpNuME6pPXR99a8RThwZK92Af4EaA0JBLwswRoKTuDiYu0ekgWsPDHRpVDWBRCgWZmcARVOBDBJmRAW6u2RHWe/YbmxzBJ9J7Spo7sf0wlrmy/BB0J95oagU/Pn83n6lsp8o7Bj1ll4fpSedzne2pE4y/n1w/XeV08SmL0vdMA57Eeh+5uAMqHRf5RCJ87HGSR5SjBqBRj9ozkD+ygZJbSkfrsUHOmgWzGWEuukwuuyOej91Bc0MMpXpWoodgUlVAHW4URTEHMh3H3C6afQRTtp6ml0RONZ8AwE2jqUsC38jV/zRJZ97xaUHc4cDjZz8MT8qxpSFjsh2pD/znA/ndLWMiH6VHfVhw8+oPbLYPpHRo6WHBDfF2LIKTUDiegzAlEZiOqTjND/kht/zTRcVARBRxSAvcRYLmmcaujDsMXjlOOQowKBRCFNJChIkqgJwRQlQKhUeVbBAgpRQpoTo96lH2IaMsk9eCB2IWjuQkVTNnpsKFmLulPAn6lEAM4azncVqJBB+OZod7h5nvre8tukhlU55RBucPAOh5rIFYe3fSKWSLp84c7xq+pIGpE8kAj+7QE4K6m+mT2svaWjQIaBrXnjLjboFhXuYBPI3l8PCeeU0fwNYjgG/c+DlJ6u74mAd3aFTkbvHBR+T/E/D7sNgTxYw0/XGjJwA6rJKQNGf5P0yqqVWO+6TTcX7xQIRnxurusvAP6W/z693ZkGYhDaVxvolPzn6+0Hn9xIOd/gSczfC8IUymncYouI85nivkASx9WAHHcRJJfv8CPnzoj85xB8/yqncDhH9mDD6eCzghhJDJh8IZv9Bp+k/TMfpzUTbDG+rstHjuH2eI2xS+Z8WeI3968WGEBuDMBZ2LZlgJEWQAspFemsgryj/4gFQRlGDupqpdbYhBOi3yh4E/r9nTrvwXhvjBvJ7i4sBR5yd3fL5sUkwd1/OHH/zDjZzf/XilD2/79Df/g9f/eF1/rBmQLnZVGxVgj5ZC8R5OTTqCssfl6E6MEIBo6XcoazoK1MZxMo/Dbsf4SjhGHBMBhRARkTnxPsKUPsVWUa/yjKHmR+KvsT+YWI5yB4RZ4ftzAH6PZuZ4j/fyBALnyTiqhYbW8BFnB8p+zu4PQmlA37kwTn95AEnnH46vx4L9oPQI58c4TGAaumTCvhOEPa6SQzpc4eczC3GN2k+PN5ZTEw2mMeYiJpSiKU5vM2AS8MLsQX4DJWbDOFzPGoLDU2iYOZyEo2VjckYPSC46SjNcjMnI1LqaqjLIWYh5b31r3cz73nTrIFrqpdTF3G66d+tEEAExop4THHvTfVMz31rbW/N07hERlVJYpH9schKW4BEfCSK6lzkD/4+JOqGkU3Aj5dDSHNs52nQ3wTRn+P4i8+SntThcpkOufZDodIYtp2843CwToMfJhyngDgeZj/j6qIPA+hFNfmLBjQq5WfbtnPIKDEQOZ4kwuONJZ3TPlAvOufiOYg4Pd+AIj+ZRPeDYDHdIZxg6IRNTco0q1HdCkzI9EvMkx/2cBFNIpzCumSOa8gHn4fzKPM5K++FhJoHJj1poaGIQguQ4xBDg2coCJ1fpmceeQQDzcmmLHct98LaH9YYZCTfl4ZR4J5R3Iujn6j6N2MGzjWeZ/2i2/7ofn4ip5qMwwxyccEd
QKSI4nOhztOHeemutxZKBexWhWmPGOUMMo1sU1L1HpQp3OJgMaiEL1rrQpC4OSJUwRuBFs7dz76qq7GTUiXnb2/u2m1q7bfttJ/DlYsti6nbdr7u2qPXBQsGaumPf+vXWTW3vfW8NhFqqSObci7l+lEqJFfkkFuhkTozxpnyIAWXvg63POiqX02RhH10mszbzNCPgeRvAWT2ONyY1dJp5P8/8WFg4vetYg/Bxq36AzFyC8UPWNaJgd+UjTnyokOt7a2+vb6b533nPa2And7UBanEMDQGj6tsxxj5GYZDN8xlHyaWBnpmi6iOdJuhhOJIvmUt5BE1mhdz5FDPXwUfgd2+t937I1lNHbyvCxJ2p8xGCOyYX2+3Wez8PkZlu1+v17fUj9pzaaDzAsSWGhhlS8ZCip28PL4x5Hk618xvvPjHn7vzD/NR4Zb58t5ZOld+BKYUHCYQ5C3foLxdwlB9pbb9Dd8De+vt1p1HKZI4ACXNTHJW5fExpCkE1jXaJjnAHeGPTFrwPLQO9xo11J50bxpEUNpFI2aoy8a5B9ETJi+DmDHBh3rvX0rvqtu+qyqLcDMRba7e9qVrf9nZrRKQue4e5XdvWtFNIJSZEGDpo3/pt62beem+9A1CFiDFxqWDWbe8PlUy067Y1+PCUEeQuF4eIiEn5QDhD+B9a7gSjxvxM/ZBDftYW842ndwRpeGgl+vCGuT3nKsaBP/1h1R1vGX8aVU5P9U7dMcuo5x3f9tZVcX88Sqm/+8uv/+pf/6tSit9VBLoXB2ORPwJTnOX18bqf7v540e8fgojuBuZxgD4MwbG97nXy3fzEq2GTzo+czTxON9uso3k3Lqr69fevrz9+zNcvT09/+Vf/en16fnic0wp5BMrAh5l91DKPMuX8uTtldC+lH2fgjK8+Off40/j0Rxg4H+G0ph+/T+USmvztx4/v377ZWFgi/Pe/vPzycgllfhZYIcke4eXcIIC7d1WbFpyDmSS8c5FPj2N12CTDfN4PUdYZFyLYpJ0nf4CUgNHWJuOJstiDgKBmQQ1Z1+CVokqyu3fTyPTmUa8oQK2p925JkJvjVKUnvm97//b9urdDt315Xn/+6Ulkip3BE9yrhHuZcvx+ggHnabmTQp8fJ7F2d2r8wVLA3eL7gxfOa9s/vjiY5/mWIUnGY6na12/vP95u93f68eb/xcf7f9nxGWz5wz8lYP3szZ+f/MM8/P9gfP6Z47/32T6OD4D/p0fon5v/03v+2YE5Qft/4fDPT/RBBNz/6f9ji+j/xuOzFfTn8efx5/Hn8efx5/Hn8efx5/Hn8efx5/Hn8efx5/Hn8efx5/Hff/xfTVGNHAplbmRzdHJlYW0KZW5kb2JqCjM1IDAgb2JqCjgzNDU0CmVuZG9iagoyIDAgb2JqCjw8IC9Db3VudCAxIC9LaWRzIFsgMTEgMCBSIF0gL1R5cGUgL1BhZ2VzID4+CmVuZG9iagozNiAwIG9iago8PCAvQ3JlYXRpb25EYXRlIChEOjIwMjEwOTE2MTQ0MTEzKzAyJzAwJykKL0NyZWF0b3IgKE1hdHBsb3RsaWIgdjMuNC4zLCBodHRwczovL21hdHBsb3RsaWIub3JnKQovUHJvZHVjZXIgKE1hdHBsb3RsaWIgcGRmIGJhY2tlbmQgdjMuNC4zKSA+PgplbmRvYmoKeHJlZgowIDM3CjAwMDAwMDAwMDAgNjU1MzUgZiAKMDAwMDAwMDAxNiAwMDAwMCBuIAowMDAwMDkxMDQ2IDAwMDAwIG4gCjAwMDAwMDcxMzYgMDAwMDAgbiAKMDAwMDAwNzE2OCAwMDAwMCBuIAowMDAwMDA3MjY3IDAwMDAwIG4gCjAwMDAwMDcyODggMDAwMDAgbiAKMDAwMDAwNzMwOSAwMDAwMCBuIAowMDAwMDAwMDY1IDAwMDAwIG4gCjAwMDAwMDAzOTkgMDAwMDAgbiAKMDAwMDAwMDczOSAwMDAwMCBuIAowMDAwMDA
wMjA4IDAwMDAwIG4gCjAwMDAwMDA3MTkgMDAwMDAgbiAKMDAwMDAwNzM0MSAwMDAwMCBuIAowMDAwMDA1ODgyIDAwMDAwIG4gCjAwMDAwMDU2ODIgMDAwMDAgbiAKMDAwMDAwNTMwMyAwMDAwMCBuIAowMDAwMDA2OTM1IDAwMDAwIG4gCjAwMDAwMDA3NTkgMDAwMDAgbiAKMDAwMDAwMTA2NCAwMDAwMCBuIAowMDAwMDAxNDQ0IDAwMDAwIG4gCjAwMDAwMDE3NDkgMDAwMDAgbiAKMDAwMDAwMjA1MyAwMDAwMCBuIAowMDAwMDAyMzc1IDAwMDAwIG4gCjAwMDAwMDI1ODQgMDAwMDAgbiAKMDAwMDAwMjc1MCAwMDAwMCBuIAowMDAwMDAyODY5IDAwMDAwIG4gCjAwMDAwMDMyMDAgMDAwMDAgbiAKMDAwMDAwMzQzNiAwMDAwMCBuIAowMDAwMDAzNzI3IDAwMDAwIG4gCjAwMDAwMDM5NjAgMDAwMDAgbiAKMDAwMDAwNDM2NyAwMDAwMCBuIAowMDAwMDA0NzYwIDAwMDAwIG4gCjAwMDAwMDQ4NTAgMDAwMDAgbiAKMDAwMDAwNTA1NiAwMDAwMCBuIAowMDAwMDkxMDI0IDAwMDAwIG4gCjAwMDAwOTExMDYgMDAwMDAgbiAKdHJhaWxlcgo8PCAvSW5mbyAzNiAwIFIgL1Jvb3QgMSAwIFIgL1NpemUgMzcgPj4Kc3RhcnR4cmVmCjkxMjYzCiUlRU9GCg==\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:41:13.259063\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}, {"name": "stderr", "output_type": "stream", "text": ["/usr/local/lib/python3.9/dist-packages/torchvision/utils.py:50: UserWarning: range will be deprecated, please use value_range instead.\n", " warnings.warn(warning)\n"]}, {"data": {"application/pdf": "JVBERi0xLjQKJazcIKu6CjEgMCBvYmoKPDwgL1BhZ2VzIDIgMCBSIC9UeXBlIC9DYXRhbG9nID4+CmVuZG9iago4IDAgb2JqCjw8IC9FeHRHU3RhdGUgNCAwIFIgL0ZvbnQgMyAwIFIgL1BhdHRlcm4gNSAwIFIKL1Byb2NTZXQgWyAvUERGIC9UZXh0IC9JbWFnZUIgL0ltYWdlQyAvSW1hZ2VJIF0gL1NoYWRpbmcgNiAwIFIKL1hPYmplY3QgNyAwIFIgPj4KZW5kb2JqCjExIDAgb2JqCjw8IC9Bbm5vdHMgMTAgMCBSIC9Db250ZW50cyA5IDAgUgovR3JvdXAgPDwgL0NTIC9EZXZpY2VSR0IgL1MgL1RyYW5zcGFyZW5jeSAvVHlwZSAvR3JvdXAgPj4KL01lZGlhQm94IFsgMCAwIDQwNSAyMjcuNjU1NDM0NzgyNiBdIC9QYXJlbnQgMiAwIFIgL1Jlc291cmNlcyA4IDAgUgovVHlwZSAvUGFnZSA+PgplbmRvYmoKOSAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDEyIDAgUiA+PgpzdHJlYW0KeJxVj01PwzAMhu/+Fe9xPZDGSfp13DSo4LapEgfEYcpSoFo79QP293HLGCKS47x29Pg1o6F4zXgbIRc0GomLvMtZkxbVktOJ5NOSjclUmiTOJlLQ/+U7UU09MmWWsIVWKbjIFVvtrMtyk2IIeEaHeG1+ZjYSF6GXiLfh68OHfbmBHwVjC8Y8n4vihvQt4kfG9owd7dD/YrTiRNzfaLMsr1XqaebcCQisM2Vzk7ORRZiV/fPlW9pUiB/kk0FVL5tXR3rBah/BOWUyndvlYBX8uRun4dNP4Yh6iGC0ujaX/rkVSI7TYQrdNEZ4RfVE9xWJZ/oGwipRdQplbmRzdHJlYW0KZW5kb2JqCjEyIDAgb2JqCjI0NwplbmRvYmoKMTAgMCBvYmoKWyBdCmVuZG9iagoxOCAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDIzMiA+PgpzdHJlYW0KeJw9kEtyBCEMQ/ecQkcAf+E8nUrNouf+28jumWyQqsDyE3EcE2fziAikHPysYWZQE7yHhUPVYDug68BnQE7gGi50KXCj2oRzfJ3DmwqauIfHbLVIrJ3lTCHqMCZJbOhJyDbOaHLjnNyqVN5Ma73G4ptyd7vKa9qWwr2Hyvo441Q5qyprkTYRmUVrG8FGHuywz6OraMtZKtw3jE1dE5XDm8XuWd3J4orvr1zj1SzBzPfDt78cH1fd6CrH2MqE2VKT5tI59a+W0fpwtIuFeuFHeyZIcHWrIFWl1s7aU3r9U9wk+v0D9MFXHQplbmRzdHJlYW0KZW5kb2JqCjE5IDAgb2JqCjw8IC9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9MZW5ndGggMzA3ID4+CnN0cmVhbQp4nD2SS24DMQxD9z6FLhDA+tme86Qoupjef9snJemKHNkWRWqWukxZUx6QNJOEf+nwcLGd8jtsz2Zm4Fqil4nllOfQFWLuonzZzEZdWSfF6oRmOrfoUTkXBzZNqp+rLKXdLngO1yaeW/YRP7zQoB7UNS4JN3RXo2UpNGOq+3/Se/yMMuBqTF1sUqt7HzxeRFXo6AdHi
SJjlxfn40EJ6UrCaFqIlXdFA0Hu8rTKewnu295qyLIHqZjOOylmsOt0Ui5uF4chHsjyqPDlo9hrQs/4sCsl9EjYhjNyJ+5oxubUyOKQ/t6NBEuPrmgh8+CvbtYuYLxTOkViZE5yrGmLVU73UBTTucO9DBD1bEVDKXOR1epfw84La5ZsFnhK+gUeo90mSw5W2duoTu+tPNnQ9x9a13QfCmVuZHN0cmVhbQplbmRvYmoKMjAgMCBvYmoKPDwgL0ZpbHRlciAvRmxhdGVEZWNvZGUgL0xlbmd0aCAyMzIgPj4Kc3RyZWFtCnicNVFJbsQwDLv7FfzAANbuvCfFoIf2/9dSyhQIQCW2uCViYyMCLzH4OYjc+JI1oyZ+Z3JX/CxPhUfCreBJFIGX4V52gssbxmU/DjMfvJdWzqTGkwzIRTY9PBEy2CUQOjC7BnXYZtqJviHhsyNSzUaW09cS9NIqBMpTtt/pghJtq/pz+6wLbfvaE052e+pJ5ROI55aswGXjFZPFWAY9UblLMX2Q6myhJ6G8KJ+DbD5qiESXKGfgicHBKNAO7LntZ+JVIWhd3adtY6hGSsfTvw1NTZII+UQJZ7Y07hb+f8+9vtf7D04hVBEKZW5kc3RyZWFtCmVuZG9iagoyMSAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDIzMSA+PgpzdHJlYW0KeJw1TzmSBCEMy3mFPjBVGNtAv6entjbY+X+6kplOkPAhydMTHZl4mSMjsGbH21pkIGbgU0zFv/a0DxOq9+AeIpSLC2GGkXDWrONuno4X/3aVz1gH7zb4illeENjCTNZXFmcu2wVjaZzEOclujF0TsY11radTWEcwoQyEdLbDlCBzVKT0yY4y5ug4kSeei+/22yx2OX4O6ws2jSEV5/gqeoI2g6Lsee8CGnJB/13d+B5Fu+glIBsJFtZRYu6c5YRfvXZ0HrUoEnNCmkEuEyHN6SqmEJpQrLOjoFJRcKk+p+isn3/lX1wtCmVuZHN0cmVhbQplbmRvYmoKMjIgMCBvYmoKPDwgL0ZpbHRlciAvRmxhdGVEZWNvZGUgL0xlbmd0aCAyNDkgPj4Kc3RyZWFtCnicPVA7jkQhDOs5hS/wJPIjcB5Gqy1m79+uA5opUEx+tjMk0BGBRwwxlK/jJa2groG/i0LxbuLrg8Igq0NSIM56D4h07KY2kRM6HZwzP2E3Y47ARTEGnOl0pj0HJjn7wgqEcxtl7FZIJ4mqIo7qM44pnip7n3gWLO3INlsnkj3kIOFSUonJpZ+Uyj9typQKOmbRBCwSueBkE004y7tJUowZlDLqHqZ2In2sPMijOuhkTc6sI5nZ00/bmfgccLdf2mROlcd0Hsz4nLTOgzkVuvfjiTYHTY3a6Oz3E2kqL1K7HVqdfnUSld0Y5xgSl2d/Gd9k//kH/odaIgplbmRzdHJlYW0KZW5kb2JqCjIzIDAgb2JqCjw8IC9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9MZW5ndGggMzk1ID4+CnN0cmVhbQp4nD1SS27FQAjb5xRcoNLwm895UlXdvPtva0NSqSq8iTHGMH3KkLnlS10ScYXJt16uWzymfC5bWpl5iLuLjSU+ttyX7iG2XXQusTgdR/ILMp0qRKjNqtGh+EKWhQeQTvChC8J9Of7jL4DB17ANuOE9MkGwJOYpQsZuURmaEkERYeeRFaikUJ9Zwt9R7uv3MgVqb4ylC2Mc9Am0BUJtSMQC6kAAROyUVK2QjmckE78V3WdiHGDn0bIBrhlURJZ77MeIqc6ojLxExD5PTfoolkwtVsZuUxlf/JSM1Hx0BSqpNPKU8tBVs9ALWIl5EvY5/Ej459ZsIYY6btbyieUfM8UyEs5gSzlgoZfjR+DbWXURrh25uM50gR+V1nBMtOt+yPVP/nTbWs11vHIIokDlTUHwuw6uRrHExDI+nY0peqIssBqavEYzwWEQEdb3w8gDGv1yv
BA0p2sitFgim7ViRI2KbHM9vQTWTO/FOdbDE8Js753WobIzMyohgtq6hmrrQHazvvNwtp8/M+iibQplbmRzdHJlYW0KZW5kb2JqCjI0IDAgb2JqCjw8IC9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9MZW5ndGggMTM2ID4+CnN0cmVhbQp4nE2PQQ4DMQgD73mFn0AgQHjPVlUP2/9fS9h20wseyYBsUQaBJYd4hxvh0dsP30U2FWfjnF9SKWIhmE9wnzBTHI0pd/Jjj4BxlGosp2h4XkvOTcMXLXcTLaWtl5MZb7jul/dHlW2RDUXPLQtC12yS+TKBB3wYmEd142mlx932bK/2/ADObDRJCmVuZHN0cmVhbQplbmRvYmoKMjUgMCBvYmoKPDwgL0ZpbHRlciAvRmxhdGVEZWNvZGUgL0xlbmd0aCA0NyA+PgpzdHJlYW0KeJwzMrdQMFCwNAEShhYmCuZmBgophlyWEFYuF0wsB8wC0ZZwCiKewZUGALlnDScKZW5kc3RyZWFtCmVuZG9iagoyNiAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDI1OCA+PgpzdHJlYW0KeJxFkUtyBCAIRPeegiOA/OQ8k0plMbn/Ng3OZDZ2l6j9hEojphIs5xR5MH3J8s1ktul3OVY7GwUURSiYyVXosQKrO1PEmWuJautjZeS40zsGxRvOXTmpZHGjjHVUdSpwTM+V9VHd+XZZlH1HDmUK2KxzHGzgym3DGCdGm63uDveJIE8nU0fF7SDZ8AcnjX2VqytwnWz20UswDgT9QhOY5ItA6wyBxs1T9OQS7OPjdueBYG95EUjZEMiRIRgdgnadXP/i1vm9/3GGO8+1Ga4c7+J3mNZ2x19ikhVzAYvcKajnay5a1xk63pMzx+Sm+4bOuWCXu4NM7/k/1s/6/gMeKWb6CmVuZHN0cmVhbQplbmRvYmoKMjcgMCBvYmoKPDwgL0ZpbHRlciAvRmxhdGVEZWNvZGUgL0xlbmd0aCAxNjMgPj4Kc3RyZWFtCnicRZA7EgMhDEN7TqEj+CMDPs9mMik2929j2GxSwNNYIIO7E4LU2oKJ6IKHtiXdBe+tBGdj/Ok2bjUS5AR1gFak42iUUn25xWmVdPFoNnMrC60THWYOepSjGaAQOhXe7aLkcqbuzvlDcPVf9b9i3TmbiYHJyh0IzepT3Pk2O6K6usn+pMfcrNd+K+xVYWlZS8sJt527ZkAJ3FM52qs9Px8KOvYKZW5kc3RyZWFtCmVuZG9iagoyOCAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDIxOCA+PgpzdHJlYW0KeJw9ULmNBDEMy12FGljAeu2pZxaLS6b/9Ej59iLRFkVSKjWZkikvdZQlWVPeOnyWxA55huVuZDYlKkUvk7Al99AK8X2J5hT33dWWs0M0l2g5fgszKqobHdNLNppwKhO6oNzDM/oNbXQDVocesVsg0KRg17YgcscPGAzBmROLIgxKTQb/rnKPn16LGz7D8UMUkZIO5jX/WP3ycw2vU48nkW5vvuJenKkOAxEckpq8I11YsS4SEWk1QU3PwFotgLu3Xv4btCO6DED2icRxmlKOob9rcKXPL+UnU9gKZW5kc3RyZWFtCmVuZG9iagoyOSAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDgzID4+CnN0cmVhbQp4nEWMuw3AMAhEe6ZgBH4m9j5RlMLevw0QJW64J909XB0JmSluM8NDBp4MLIZdcYH0ljALXEdQjp3so2HVvuoEjfWmUvPvD5Se7KzihusBAkIaZgplbmRzdHJlYW0KZW5kb2JqCjMwIDAgb2JqCjw8IC9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9MZW5ndGggMTYwID4+CnN0cmVhbQp4nEWQORIDMQgEc72CJ0hcgvesy7XB+v+pB9ZHo
ukCNBy6Fk3KehRoPumxRqG60GvoLEqSRMEWkh1Qp2OIOyhITEhjkki2HoMjmlizXZiZVCqzUuG0acXCv9la1chEjXCN/InpBlT8T+pclPBNg6+SMfoYVLw7g4xJ+F5F3Fox7f5EMLEZ9glvRSYFhImxqdm+z2CGzPcK1zjH8w1MgjfrCmVuZHN0cmVhbQplbmRvYmoKMzEgMCBvYmoKPDwgL0ZpbHRlciAvRmxhdGVEZWNvZGUgL0xlbmd0aCAzMzQgPj4Kc3RyZWFtCnicLVJLcsUgDNtzCl2gM/gH5DzpdLp4vf+2kpNFRg5g9DHlholKfFkgt6PWxLeNzECF4a+rzIXPSNvIOojLkIu4ki2Fe0Qs5DHEPMSC76vxHh75rMzJswfGL9l3Dyv21IRlIePFGdphFcdhFeRYsHUhqnt4U6TDqSTY44v/PsVzLQQtfEbQgF/kn6+O4PmSFmn3mG3TrnqwTDuqpLAcbE9zXiZfWme5Oh7PB8n2rtgRUrsCFIW5M85z4SjTVka0FnY2SGpcbG+O/VhK0IVuXEaKI5CfqSI8oKTJzCYK4o+cHnIqA2Hqmq50chtVcaeezDWbi7czSWbrvkixmcJ5XTiz/gxTZrV5J89yotSpCO+xZ0vQ0Dmunr2WWWh0mxO8pITPxk5PTr5XM+shORUJqWJaV8FpFJliCdsSX1NRU5p6Gf778u7xO37+ASxzfHMKZW5kc3RyZWFtCmVuZG9iagozMiAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDE4ID4+CnN0cmVhbQp4nDM2tFAwgMMUQ640AB3mA1IKZW5kc3RyZWFtCmVuZG9iagozMyAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDEzMyA+PgpzdHJlYW0KeJxFj0sOBCEIRPecoo7Axx/ncTLphXP/7YCdbhNjPYVUgbmCoT0uawOdFR8hGbbxt6mWjkVZPlR6UlYPyeCHrMbLIdygLPCCSSqGIVCLmBqRLWVut4DbNg2yspVTpY6wi6Mwj/a0bBUeX6JbInWSP4PEKi/c47odyKXWu96ii75/pAExCQplbmRzdHJlYW0KZW5kb2JqCjM0IDAgb2JqCjw8IC9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9MZW5ndGggMjUxID4+CnN0cmVhbQp4nC1RSXIDQQi7zyv0hGan32OXK4fk/9cIygcGDYtAdFrioIyfICxXvOWRq2jD3zMxgt8Fh34r121Y5EBUIEljUDWhdvF69B7YcZgJzJPWsAxmrA/8jCnc6MXhMRlnt9dl1BDsXa89mUHJrFzEJRMXTNVhI2cOP5kyLrRzPTcg50ZYl2GQblYaMxKONIVIIYWqm6TOBEESjK5GjTZyFPulL490hlWNqDHscy1tX89NOGvQ7Fis8uSUHl1xLicXL6wc9PU2AxdRaazyQEjA/W4P9XOyk994S+fOFtPje83J8sJUYMWb125ANtXi37yI4/uMr+fn+fwDX2BbiAplbmRzdHJlYW0KZW5kb2JqCjM1IDAgb2JqCjw8IC9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9MZW5ndGggMTc0ID4+CnN0cmVhbQp4nE2QSQ5DIQxD95zCF6iEM8DnPL+qumjvv61DB3WB/OQgcDw80HEkLnRk6IyOK5sc48CzIGPi0Tj/ybg+xDFB3aItWJd2x9nMEnPCMjECtkbJ2TyiwA/HXAgSZJcfvsAgIl2P+VbzWZP0z7c73Y+6tGZfPaLAiewIxbABV4D9useBS8L5XtPklyolYxOH8oHqIlI2O6EQtVTscqqKs92bK3AV9PzRQ+7tBbUjPN8KZW5kc3RyZWFtCmVuZG9iagoxNiAwIG9iago8PCAvQmFzZUZvbnQgL0RlamFWdVNhbnMgL0NoYXJQcm9jcyAxNyAwIFIKL0VuY29kaW5nIDw8Ci9EaWZmZXJlbmNlc
yBbIDMyIC9zcGFjZSA0OSAvb25lIC90d28gNTYgL2VpZ2h0IDgyIC9SIDk3IC9hIDk5IC9jIC9kIC9lIC9mIDEwOCAvbCAvbSAvbgovbyAxMTQgL3IgL3MgL3QgL3UgXQovVHlwZSAvRW5jb2RpbmcgPj4KL0ZpcnN0Q2hhciAwIC9Gb250QkJveCBbIC0xMDIxIC00NjMgMTc5NCAxMjMzIF0gL0ZvbnREZXNjcmlwdG9yIDE1IDAgUgovRm9udE1hdHJpeCBbIDAuMDAxIDAgMCAwLjAwMSAwIDAgXSAvTGFzdENoYXIgMjU1IC9OYW1lIC9EZWphVnVTYW5zCi9TdWJ0eXBlIC9UeXBlMyAvVHlwZSAvRm9udCAvV2lkdGhzIDE0IDAgUiA+PgplbmRvYmoKMTUgMCBvYmoKPDwgL0FzY2VudCA5MjkgL0NhcEhlaWdodCAwIC9EZXNjZW50IC0yMzYgL0ZsYWdzIDMyCi9Gb250QkJveCBbIC0xMDIxIC00NjMgMTc5NCAxMjMzIF0gL0ZvbnROYW1lIC9EZWphVnVTYW5zIC9JdGFsaWNBbmdsZSAwCi9NYXhXaWR0aCAxMzQyIC9TdGVtViAwIC9UeXBlIC9Gb250RGVzY3JpcHRvciAvWEhlaWdodCAwID4+CmVuZG9iagoxNCAwIG9iagpbIDYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwCjYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwIDYwMCA2MDAgMzE4IDQwMSA0NjAgODM4IDYzNgo5NTAgNzgwIDI3NSAzOTAgMzkwIDUwMCA4MzggMzE4IDM2MSAzMTggMzM3IDYzNiA2MzYgNjM2IDYzNiA2MzYgNjM2IDYzNiA2MzYKNjM2IDYzNiAzMzcgMzM3IDgzOCA4MzggODM4IDUzMSAxMDAwIDY4NCA2ODYgNjk4IDc3MCA2MzIgNTc1IDc3NSA3NTIgMjk1CjI5NSA2NTYgNTU3IDg2MyA3NDggNzg3IDYwMyA3ODcgNjk1IDYzNSA2MTEgNzMyIDY4NCA5ODkgNjg1IDYxMSA2ODUgMzkwIDMzNwozOTAgODM4IDUwMCA1MDAgNjEzIDYzNSA1NTAgNjM1IDYxNSAzNTIgNjM1IDYzNCAyNzggMjc4IDU3OSAyNzggOTc0IDYzNCA2MTIKNjM1IDYzNSA0MTEgNTIxIDM5MiA2MzQgNTkyIDgxOCA1OTIgNTkyIDUyNSA2MzYgMzM3IDYzNiA4MzggNjAwIDYzNiA2MDAgMzE4CjM1MiA1MTggMTAwMCA1MDAgNTAwIDUwMCAxMzQyIDYzNSA0MDAgMTA3MCA2MDAgNjg1IDYwMCA2MDAgMzE4IDMxOCA1MTggNTE4CjU5MCA1MDAgMTAwMCA1MDAgMTAwMCA1MjEgNDAwIDEwMjMgNjAwIDUyNSA2MTEgMzE4IDQwMSA2MzYgNjM2IDYzNiA2MzYgMzM3CjUwMCA1MDAgMTAwMCA0NzEgNjEyIDgzOCAzNjEgMTAwMCA1MDAgNTAwIDgzOCA0MDEgNDAxIDUwMCA2MzYgNjM2IDMxOCA1MDAKNDAxIDQ3MSA2MTIgOTY5IDk2OSA5NjkgNTMxIDY4NCA2ODQgNjg0IDY4NCA2ODQgNjg0IDk3NCA2OTggNjMyIDYzMiA2MzIgNjMyCjI5NSAyOTUgMjk1IDI5NSA3NzUgNzQ4IDc4NyA3ODcgNzg3IDc4NyA3ODcgODM4IDc4NyA3MzIgNzMyIDczMiA3MzIgNjExIDYwNQo2MzAgNjEzIDYxMyA2MTMgNjEzIDYxMyA2MTMgOTgyIDU1MCA2MTUgNjE1IDYxNSA2MTUgMjc4IDI3OCAyNzggMjc4IDYxMiA2MzQKNjEyI
DYxMiA2MTIgNjEyIDYxMiA4MzggNjEyIDYzNCA2MzQgNjM0IDYzNCA1OTIgNjM1IDU5MiBdCmVuZG9iagoxNyAwIG9iago8PCAvUiAxOCAwIFIgL2EgMTkgMCBSIC9jIDIwIDAgUiAvZCAyMSAwIFIgL2UgMjIgMCBSIC9laWdodCAyMyAwIFIKL2YgMjQgMCBSIC9sIDI1IDAgUiAvbSAyNiAwIFIgL24gMjcgMCBSIC9vIDI4IDAgUiAvb25lIDI5IDAgUiAvciAzMCAwIFIKL3MgMzEgMCBSIC9zcGFjZSAzMiAwIFIgL3QgMzMgMCBSIC90d28gMzQgMCBSIC91IDM1IDAgUiA+PgplbmRvYmoKMyAwIG9iago8PCAvRjEgMTYgMCBSID4+CmVuZG9iago0IDAgb2JqCjw8IC9BMSA8PCAvQ0EgMCAvVHlwZSAvRXh0R1N0YXRlIC9jYSAxID4+Ci9BMiA8PCAvQ0EgMSAvVHlwZSAvRXh0R1N0YXRlIC9jYSAxID4+ID4+CmVuZG9iago1IDAgb2JqCjw8ID4+CmVuZG9iago2IDAgb2JqCjw8ID4+CmVuZG9iago3IDAgb2JqCjw8IC9JMSAxMyAwIFIgPj4KZW5kb2JqCjEzIDAgb2JqCjw8IC9CaXRzUGVyQ29tcG9uZW50IDggL0NvbG9yU3BhY2UgL0RldmljZVJHQgovRGVjb2RlUGFybXMgPDwgL0NvbG9ycyAzIC9Db2x1bW5zIDM5MSAvUHJlZGljdG9yIDEwID4+Ci9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9IZWlnaHQgMTk5IC9MZW5ndGggMzYgMCBSIC9TdWJ0eXBlIC9JbWFnZQovVHlwZSAvWE9iamVjdCAvV2lkdGggMzkxID4+CnN0cmVhbQp4nOz9S5MkSZImiPFLRFTt5RGRj6rq6upZ0M5iaQ+4LQgHEECEX44rcMIBF9AszS52Zrunuior4+VupqoizIwDi6iZe0T19BwGp9L0jPBwN1MzkwfLxx8zfwzwt+tv19+uv11/u/52/e362/W362/X366/XX+7/nb97frb9bfrb9d/+YXf+xkigLt//6H48Lh/9S3h7c2+edi3D/gXrn/lc795J/sP/vWv5vbNQPz1680Q4ffH4v+P13/913d/u1QQCQn77+Ix4I8jjq8WTh+k70zp/bbu8GrOEL6z+h5ui4D9Fq/uB9+d+Ncv9a+6/L9kZL/ZSYiIf2Xv/Ne9/rWv+jjcb+buv8b1V03Nfs2Hw+l0IiJVVVUAQHBCQABBIHQmzEJMyEQiRIjMJEyIiNBHG5GAsN8c0c2aqpm595XBzMwcxq9/cDd3dwdzc3cEJCLEGBB3AHczMwAgJmaOj9M/UzwTMBY4jv+IkIgRkYiIKN5YvEMzs1dLC+N58S7i1u6w1fYf/vjnP/3yaR82JpxyYqbx6oDYX5g5hgWnIiUxEZXELITQx+WvLH+/v4Xxt7/aga/nKD6ig98//6u74Pg/RqD/6LVB9vu34/vHx/Txi9tQTCwR3Se3Pxvd/T/96eP/+o+/bLXFD3Mp/+a//e9+8/s/gNu2XFtdrbW2LqbNAcARADnllCckynlKpRASp8ySAIEQkbDVbbk9a9ta29blZqZu5qrgMUmAiMxMTICISIiUcj6ezynllNI0TUTspqbNzZbltqyLu/V1BH2xtdZut2trzVRV21hHBgDu6AYO0JqZmjuo2VhnDu7MLIljfQkzIACYg8K+oh3MwB3WZf348fO6bvv8/PjTz7/5/R9STn5faw8GHMbgIwAg4X0yxn+Paydu4ft/iEA0ltyYQSJEwLHpMKVMzDGGSNhf211VW6vuvi7Luq2mtqy3Wjd3b9qsj4COY8jH4uvvfxiX3YrdjeDrv19ZIVX79OnL8/P18WPJqwWPeDqd/+73v5eUtm3d1hXAGZ3AGWFiTwRF6DKnLJQTH6bETCXLXDIhMhEhISCKEDEgAhIgt
tZuy6razEAdwCHnVEohRHBDtxgRNXXz1pqZERELE5HH5wVXbbVVAM8555KxT6G7uzY1MwRE4JjPmMyUJKVESJIkiSASEROxuTdVCxCEOEwSAqCZqWpYT3P88nL9v/8//99//vWzWx9IEb4cS8kCYykRAhEQYkk8JU5CP7ybn04lJb4cy1QSIjBSmKVY03dbcJ9Av0OG3RLD4zJEePjOASzGZaA5B4hbEGKcEURETGGbYoH4sEPjdAD310AF0Xdj1G8ixEwY08GISMh9rADU7P/x//qf/vjL590qTfPh//A//p/+j/+X/5tp/fqXPy4vX9p6u376S11vAGSGADQdL4fze5F8urw7Xd6zSDme83REQhEiwuX2/Osv/9tye75dv375+KdWN6vVturu5IROiJinklJCIhJB4tPp/Lu//4fj+Xw8Ht+9/yGlZHVr66LaPv76y8ePfzFTdw17pNbc7Xa9/vLLn2+3W6vbtt7MVE1j9s3QFM18Wdq2NnOvtTU1BzdrAJ5zmudJhHOWMmVEcKjuFcDNuj1q1c3g48fPy7LuVokQf/uHf/gf/8//1+PpbHHQOnRjN3Z6jHusYmZGAEJionj6jkMxbJJZP9HNwJ2ZJCwOEhOF6RFiIiql5JREZD6eci7MlHMmZghb7L6t63K7qrZPnz59/vxpq9unz78+P39R1XVdWq3mWq2aa4cRw77H3xaG/A4RulnCAWv7IvRXVmlZt//53//Hl5fb409fWSUAICJJkpKoNmIKq8TojJAZMkFJNGcpQqXIcc7CNBWZSyZCRiJkRCQWZAZAoLBKLOStsbmrdas0TZmQ0BVjoWgsCG+NTC3eRlglA3Pw1qg1cPBScpkyAgJYDIfqN1YJu1XKKRNRSkmSIBKT7FZJzWLEHACAYhjVVJuBuwHG3XPiV4YbgImE6dEqxZmdhXKiLDwXOc4pCZ8PeS4Jw0wEBuom6cGzcAD0b04VcLtbpW45HvC3A5hhrAEbVgkAHZAImIgQiJiZoGPGYZXG8h8IazeDfeEAjiEkQkBmIRZEFBFmBkQiQUAHcERVO0yZHt4YIs3H09P7D6aNdM2Cdcmka80MjmYEQPPpcnx6Jymfnz6cn96zpPn0lOfjsDB0u06mL7fCSdDatW6r12a1gjkBkTMRlXnKJSMSpUQsp/Plp59/Op0vp9Pp/Q8/5pR1W9u6qNaUSARfWSWt5vbyMtW6psR1WxcB1WZmTdXdzdCUzByxMjU1J26s6m5m7G6l5GmehLmUNM0JER3YgdzB1LtVEleFnHPg9P1KOZ8ul+P5Ytbhv7vvgKUPYlglChPTrdLjAQNuCO4OASTDlwB3JhLhgAhMjIjCkpiJaJrmkrOIHE/nXAozx5/gFlZpXZbb7aqtMjMRbXV1V0TX1kSo1s3cqq7W3RpzgG4Tu3UydwBzj7MOu+9CMP61r95HC4TI/Gp83lold1/W5ePHj8yyLLd1WRAsEyQCIYBMJgiJK2ROJJ5BJnA25AYrIjZAgjhoGYjdwRwMQJuu69ZU3UHNHWAVXpIQIoEROLirWXfxzN2diESECM2tmbqbmqpWQIA2oZZwiRDvWIkAGQURdzBZiVYiREwpiSTEcOh4DF2HBrEY1GKrq6m5OyAB0PW61HV541fveOcOuzvQicnoyNbda1MmxDjidlPgr0xBOKljyvyV4fFvUfD9meYdLtndE+gohwkJkZiYBRGIcGyMYRQfvNT99t2uDe+vg05iREZEln5XYg4nzhGb+rZtr3kBb7Vu64JuwjyXScBtPgghADsIIM2ny/H8JJJSzg5xUCt6A0NQAAevi66LLottq9cGTRORlIkQS55Lmln4eD5Oh5lZynxIKc2H448//zzPh1Km43FmFkukhU1NGM+ng3VMoeaurZrZ58+f1mVFlBs+326LuToQMdxPeoKcEVHMjIWbqpnWupkBCwkTCyGBg2MAHGAHb9ZaUzPQ5mZgqm95N+hAFgbshd0qxQMIw6AwcxLpJ
ob5tVXqsMTM/MG0MVEKXoU4MSNiyTnnzMyHw2EqRVjm4yFspaREREGOgHcvRFtzRGJet7VpVWu1buoKAGrNUNG0IzNwA3S9v3FE8AHuB1DqHxnua7mP78Pae8sjvcVKy7L8+vEjIq6323q7IfgkUBgyI88CmTBLxcyZExQvhiDmWK17CP0oRgZgc6/BJ5lvtZnuWDP2CSKAkDOFoXdzH/40EaGwEFGz1lo1N3M1U0TENqFOhBj4xt0tnD4kICGgceKFb+MAICklSYgIyNgtZ3dDYkTUvA6AbsGmESPyy7LVdXkzRDsGxbsfhh2CxPAHQWbWmm5BpfhYgfsT8W4KsPMl8B2rdJ8yfDRJ7ncPTmNYxxpAROYB3cWCaCAaxFZ/F/6KFXh8TdxfJewThT9MxEgYeBMJAdAJ1byur6ySu2ur27owIhPLNAlCt0qYnDIiH87vjpcn5kREQVWAN/SGAK7m6rYtut7asui6emvQmuRyLBMzn09P59M7SXJ5/3S8nCSl8/kyTVPO+XS+5JSJWVgQ0SyZFXc7nw9mP7m7mZoFHq9m+ssvf/n48YsqmDngZ7Xd9wdAimlJmVnAzLhVVVNtgKYKIsRCzEgEAOYQq5bN3KzW2ty7VVJrb+jigKGEBBTrwGHMw+CQSJiRUFhySmGShIWw03wYPkL4UZ0i7RcTJmZCEOYsQojzPM/zzMyn4zG+maYppYSEQTN10+beWq3bpGrELJLWdVnW27at27bWVs0MDQ1VDcwMcPBssbDw/ukeqYb9777bANz3k9b9kZh4uN5ape6gIvpAhuiADuhE6IRA4IhACLRzMt0NgUA6AOCAjuDmZmrazXkAvM4oWt9DhkADaECHL7vBDXe7//mK2jY3BAIAejS5DyMxnmhBXpqZabd4aDG5wcfHs83cVM37JMcdEN1aC/rze9fgaPoufqSL+y/c3Gy3So+LL2bIx7ABoo/PPG6yW7w7D/rwGx+GCcAtRrZbRkJytICBfSrBfPcSH4YRAPb1vCO3EXLEPqng4eMSdb7DCTAwJqKaq+mbKYhxdwIaVhpisYaHhtLRFqKDg6uFxwwG/R05ghMRMyWRkosxzXmap1lEDofj4XCUJPN8mKZZkkzTVKYppZRERDgomZjhsNS7A0WE7uTmiGhmOeWUckqZWRAJgGKeHicYCQkQENgIwGNHYT/Lht/t4OCIe9zFB1EzPLPXK3SMB95JQxw4e5zJxERIQRKFHydyx0oI4E6BjszMzffVx4jCRIjCFI6YiIT3zSIswkwszExIGKeVjROKiU0cUSVJSslMUzzFNOJFDjQst4cX/2hQENDhzkXsg3i3V/2D7zQCfndo4Du8EoIEBmEEBkI4ZTpkykJPh3wsUpKcDlPJMk05pyzCSIPHAlNXcNAOfcDcDSAAITKjOxi4O4IDGCBIopIYwy5YHCNMSHGiAAAZI3McdGoNABDFHBGAgPvcorA7IQkzIamqIQUo5djlSBYnf9jmeCh3gsnNzUzd9gAcQHBVbduqqb4ZO3xlHmBfTfvoO4AbGHrTbuCCAdsjiogQOwV3cIR98+Mb2wN3O+av1sADVtJuYzpeIjQlRDCxOJiIO1d6dxT3z/nG+wKwcfM4gc0HIw5jUSHvW1MdbrfV3tzDIv4Epgpq2qw1q1VzoXk+smSS1FrrGA+cmcuUiyVEDPQgiS+Xy1wywjv03yD6oRxOhyOzHA7nw3wiJpmzZGHmaZ4CUIikTtG7P0SUzMw0oreDrckkgHA4nJ8uH0yxNU/yy0aK6IidLlE1AGQWTmJmRGBGiL5urqoABD1yE1E5qFXN1My2rbY6fBwHN32LlQiFmZnJycn3ZdBtKQITp/6JZCqZiBJz6hQE0qt97xEZQ8SI1xFgJw0IGZEQp2mapomZSyk5J2YWERZG7H4iuRuhu8fgmNncDmYuKZ1Op9v1ZRVZbtdWKxmaNzJUxeaOZt4Xvscx9or73HfL4G7hjQ3uK/JbqPStVQLggBEEy
EAIh0ynibPweU7HknKSwzzlJLmIpBTOQh8hbTFGEU6FfUMF3wsdQLgDgMZiZ+FcEiKYgpnvhLSP2Bu5o7G7qykqh4kzAyJ0oB1wx5pjFkJ0VDRADDpwP/nhvt8R4+hAs/DbhoPu+4NMtdbWatNHfPw41Heb8QBeA+k5mDsaqDrEoan90AxsRgREj1TU7sT11dljMa9YcdxRWf+J94hH8GA7NYGIzt1hi6Xq7sC7NziA6YBcj9y7DS9czYMPUXPTIDEHVOgYCIHQHNa1vrJsQVaZOYKrQRwmTVuzPFEpU8qTOjbVcMnVmojUNps1QnRGBBSm4/HoU8lJDocszMf5eD5emLmUQykHQDB2R0eiLMJMCMAAPZIZSFlVWzVzNVUzREySgImQRBIRT9N2Oj2p+svLlaUQbYAGEMvGVA0RU+KUkrshmSqYE2IMhgFYYO349K21WqtHtK6NFIHveMmDnGPu0zbcjpENg8xccmamLDKVwkzCkoOHDddvUH/g0NNtECPqHU5M4BYCR8RSylQKMeecU0qBvMJ3i5dzd3QEd0MKq1TK5O7MPM/Hw+FAhDlnEUEDNUb0eLBFJkffgPfd8GBmdq5iUEvxSMSwY/4Gbo3rrVWK54WPxgRMmISKcBJKTEIoEfwP8xKLr+9TtzgthpvaYQncc1+gBw/3XXwPY8cmQ9xX1Qh4W8fBCECI3qHvq226ByHx7nRADPfj54KBRLD7GOZmPQCx8zsA/b24m7kOZurxNgPA9yMixmqgtvESMFakw+6H3rOvHMB2XrBbh+Geuw8j+sZk+Ku/Hr73fQfsrJODo9NOa8er4zfP7MfW/os7TPN9Frq1VhtkGnjMAhCZhwP2egmFAxM+YH/OmFhzM3OIcBIQsSCJSM455USIwkiIroTgbi0nkZyECJjDwqOa1wqARmbkAHCDBQEYsTBHODyLYCz58eGHVw6qRhSnmrXW+oHJwiws4haHkN9PGBhR9+BvbCwVBKQIbo7B3IHTGPX7mnt7DWS9U4Zje0csX5iEWZjD9yIiEZZuR/rb2ukbjA2Cg3Hazxo3NUcEVYuTdSQc+c4r3o9Uh9127mFYImSmyHLqHpwjEZnH2xjR2gdH7K8Ymcdf7fD/9Z+vr2+xkgsaIyYBAEqE7475/TEnplORSYgZBZTdvVldVAndI0QNrVprCg4dlxKmnCg8fWJEbE3d3MAgMjMRSuK5JACoVTUQhbXAGq2NIQR3ACJKLGH93AwR0bBzRH2ugn9TGMxXj1iCd8oWujEFc2srWLVIVXBHd0Yfm9EBoJmuta1V9TVUQgQmFO4sA4BzrE6ExBRf3K12OP3hFzncPwq4g+Ggp7tjBMMeP5w745W/63wPm+Y4hql7XwgOBoCGaGQ41q9Dp1zGRMP99HqYfQNwQIMItLg23aq5e9WegmCOwxiTua9rfZP97qZWGxKCRlIHEDFLAoNtWbSppJKmRMTTYZoOkyQ5v7scT0ckiuUPZt6quyF6gMqq/ut1cQD3JZaXkjlaq/X5y+d1uc25/HC5zLmcT8efP3zIKdmgMVtr67aauTZTdUQUTkS0LKsqMk85zfPhbI7ret2uX83MAVkSAKi51c1d1/XWdNPWAIwYRKiUJMIjtBf2FsZ3vlsQenTu+/xAoB6AfiZIj26SiDBxEpnnIixJpESwTDiJ4N0U9f8iqGKDzAWAQZCatta2DQBq09Yai1C3MUSR4YGEaGgB93oUz4eJC4o95zxNMziUlHNKjcC8EnoDMFZDBDcjdKegY3Gcj30luCOgP8Sc7yt6YPXvXm+tEgIQOIeXIZiYjkVOcxbCOVEmYEJGQwAw06ravXh0h9a8VQMAZAAKVsqZAAmYCRBjnaEb9uRDFKYsDACgBgQdnhiYmYU7ON5XjBQimkbEycGp8ybwEHQM3ydmDuPQ3iHM8GbdXd0MLRifvlD6cWHQgVLVCO69HTne/VEHAIh8bkQQQiZkAsJBb5sb7gMEnfmMuYr0bBxvnAbMG
7O3B/j8tW16iLcOqNiprD3doQ8EGQUP6nFw4OD2xyGN93HrP7GxrsY9e0aGmddmqm4AHRsND661V7xbhIXc1AHBrHusSBFyb7WaWpDezHQ8TOeniyQ5XM7z8RDOCyKBO5gGyomMx+26Pm+rqrUGtbqDG6qhrcvyyz//8fnL5/PhsP308+lwMLX354uwjBhJeHJNTZdb3baGiMES1KZuQCQsOeepNa11025TBgoKWkpbbVtrm5k6eIAIERJhVa/V98oEHymUA0fvE/xqj+1U93DcMMxxkhQGqOSShEWkpHxnux/CsTFn7q5qnQsbAChAXa1tXbcxmSCq0zQ1VQdIZm5kZOhIgHdEPUByR4IYQcCsrYkkYQHwxgxg7sZEAB7BdDfwwWLjeGM7fN958e+A/b9yfYdXEkQhDFopMQqREAljYkqMw+eC+xkwLDihE0fAJvbKwHhjJ6F7RIxif4TvX6siQFNVNY8DzdzMq2mcOUF7BzWKO3/iw5mKyScKIxBGiZDjEYx2j94NlwoAgi83h2bmBurebPfa3AyWrW3VarM3QAARiVEYd7eYCSNxXxgTozARdRd4N4X3cfKeBBAONz1423217Tbom292sD08g/0M7ksC92c47iGh+HcMuYMDjbm4uxDjTp2MAHtgAfYZM/PINRtWaTBI3xDmYUz6K8WAiYB7LmU+HERkOpwO57OIzPOcciYmVVvWDfpuRTdzbWEQmlYzu16X5+ebmZuhGoKDoRrqerv9+vHT548ft9N2mY8IeD4ezSFifIhIQCKcUiLj1ly1m1wz16a3Zdm2uq5b94GoFzMFeQwAnbTbHV5EEQ5HJj6tmanWsMP7Vow1H9AkajtebzKEcR4MtoSCIg3aCHejtQ+nm47km8f/zHsthI2aGG2tbquZ1XVdl8Xdt7qVraSUJCUWDqcQEcl3GDfWyXDxgjDBnunWKXbcg0X3Pb8zFoOaGOtvLIWxYod5evXv/R/f2Km3VokJJ8HExM7iloTmLFNOwnjIVIQGVIzdEDdEH8YB2d1Bgw6kXoGGiBwr2cxbM1VEAEI3WJcaFkx7BMO2yEFzq6rmTsyJM2LgKBsgw2KLd8PETCJmbhXcjYAlEmFxo0ErmFo/xW28ZQA1X6s2tWa+NjPzpl6bucNWfWu+VN3qK96ECEqiqTBAhx7MJIxEeMg8F2HCwiT0yiRR+GtjOz/Y0753H7b0OLkGjTl+s5sK7MVtfZ04IRk49ZOuM1kOgOANnRDcnQO0gVMYr0h9cdhDOjislAFgf1gEt0HN1bw1qxr0RHBF6EgGrvomc8JNW6sVmBMTEaEAlNlSPp/OP/74U8nlcL6cn96zsBM7k7m/bOun62czr6pR9NPW1VRrq8t6U7PrdX1+uZk5cxEpgADYHO3l69d////5n3755z/++P4DO/74/n3JRQ2AmMAZzN1KoZSKmiEK4Wrm29a02e22/PmXvzw/X9ftZubEwimnXNh0jySYqbm5W68GJeJSsGeEeSRVXm83MwNjd9qtGxEFu1zy7U1u99gqOL6JQE3kAwhHgV8PJoKrGbmbaWsAEHvE3VuMk/m2bk1VVbdazazWbbldTXVd1/V2c/dSyjSVlPNtW9e65Zwd7ODOTO6pB2fv9GOHfPF5mSglaVWYiYnciQANkAAJydEJkBwi/eR++vfQzt1KDWjeMdNOao0n/OesEmHHSgIoQIlJmIQpMSbhJN13jRvt67GDNOoRH+sOwxj9WPL9nVokNQU1pKq1Yt+E5mrWmjZVdaumBs4ATEaI6o6R+9N39TC1OE42dAD1zjQxAgJyDFrQIYO07EdaRJrWrTa1qr5UVfPWfKtmDs1QDbZqb3klQCZMfEc/zJiYiGJ8KPy7noQHgN4NE6LjOBd2Y0TB78AjE9gXib+au7ttevDgHryAbr46Zd7Jy4A54clijw7cQ7KdHBrjt5/nDtZPwIFuO1zynnsflVuIjpFf/npRxYNVLRg4RCBiSeRcpul8Ok3Td
LpcLu+eiHkz29ybarvdrrdVzdZaW1PVtt5u2tpWt9tya9qut/X5eTGDUuZcZkR0bAD2/OXrn//y6z//859d/fOXr1Muy7JFGkAEuwBBiAFATbdNWzVVRYhcSr2+3L5+fTZvHqwbEQvHoQrxUftsdGBAFJU3hANiqGmLDMM+/DExSIQ9PegNVhrodDdJESftUIlwsJQDV7iDwc5I7oVZfZzMlmVtrTXVdd1UddvW2/VZVbdlud1u4F5KLqXkUo7n83Q4qNm2HXJuAGxE91mH4QS6w1gpURVAA1s88FqPQOnunMGdOwUfI9epijBJPQR1X9Xf9edeV+dGbmjizJhQBCExJqGeij2yEbi73DDKjWnwWb04ZqeaBt/vnQkzhX7y9HM+CkoAIIyVubdRrRTFOeje1MkM0LamiIhgBEYYxSiIBKgNGUytrtXMEqVJEhMhJERENObm2NzcvDmod9/bm1p81WZbVTVfN12Wpg5mqI6rWlN9HCIiyIlL5jE3wMOxzYniVTu1NGYLI5buu6vUmf6BlcbQ7dMaeV7mu6O/kxQjauN4h0qI6IS4nxA+LEUU+uE4xhDDrXVCNCQg6OGjAJ37EkMgvy/AcZzAmEvwe17p94gCBKS+mh3ZkR1cCd2tgtzUralelwU+I9HWbG3aVD9++frl+mLmTZuauWqrW8dK26pqdW1aI5sZGBEQVFVts1bJXQgJwJq22tZtuy63fMtETtRZRUAAJElSpmJmxKxNm+nhNFWt23YzNbPGBDlnNa1Vt6ph2XtpT0RrAXvGKvcjIYyfY0eWAZQAkLmXgn/LK+0WZ0xsgDIDgFqbmauqu/VkUNzP7Kjga53mqzUg0rKukb+y1U3VWt3W21VN67aFB1db22rN2/bp02eWNE9TyQkAUxKcQcT3RbjjnD1Y15fubjofCMlhWwa8v1/3pTwgO+DASwPPj1XV/35rmt5iJWE6FC6JM1FCEqZSRBIxAXFIAPTkK3fXvlAj/RsiC8khaor7aWMa/zIE11bdGpgBUwCe5uqqAGiObmDu1ayZx83HJjAEaN6qggd7hU4IZYMkDoiGBkiq1tZqzaZ8uExzr5ycImt3Q9jMVX2JMElVU7XadF1bVduqXtemai/X+uV5U3MDMsRmsG7tccyY6DDJ+ZDxbpUimxYSUxZExETI1HMdABDBueOSPTi5Z1H2RWt+T7ENN7PpwCa7USFCABcSQOy2LzxDMggY3Q+CHiYwUwRAYCViCk6EzSNHBQiB0JEx5C8AAHsmjLtH6juNw2wgr0BCsT0Rie7n4cOmi5gRMwNlJTH3htnAb5g/V0te9fZZ//LF3Je1rktrql++Pj9fb4HAoANMi1STqtXda9O6NUTE4okJ3Ftd6/rSliuDFWZBbLWuy/Lycv310yc1m6Y0zyVieuGoTvNUpuLQ8V6a5NPXTyhw/Wp1/ahtTQkoz2b+/LIsdbVIGglAGLW9bt7I2BAixgEURbCOOoorc04iQkTMiYgxxDPeGO7IjR+7MQC8qbamYUXDSR85Nq6t1drcrLXWajW3utXamqku6xp5Uk2bBzG/bcHQa60OID2pOzWFr88vh8PBzde1TqXAO48sTWFCHHxt0IL9w3uQSvtXh3e7JRm8V1BfMGA+vGWXRtJOX0s7oB9r9V+2StTTJVCIEkGkZNOeLoX3kKc7ehcp2k/jHaiNN9CPe+tp3rvGzTCdI4EJzdAdzV2DQB021EfeUlPf1Nx3qxQOqjmgIRiYqbWlmRq5VUZwSokABAGIDFDBgjhHB3SLbHLX8acO0BR1xIbkRLqnuuwrCkGYktArq0QUbDcTxcnTSZqBlTrx1gFPrEjc4ZKP3/rASmFZYpWPfBSIJ5p127a/wn7bvuRhP6/imbESDBFHmgCaIwWn6bAvF4SHP+/ZKPfL73cey+2evfA4RP1yJAB27OUkDWhTU8RaddmamS23uiy1Nf36/Hy9LgDOAwPyqFlqUbmmaqqIBG79WDe1Vr01gq6R4
Gam1lpbt21ZV2LMJcNeGxGlfPfwApal5JJKkW0JrKmEhMLmHgbX9/O+n44eJnvEeDvgp1F/06dp8Ep9rN/apDFK92H1V4TMfcO6qauqubda61bNrNUaDuO2ba01VV2WNUSRNHI5VFutUQqh2sBBmVplTvpyvXJKZn693eblgACtNRWOQyhOzUdcvPNB/ZePZPdYAW9JhzfQxwez0CNxAxnel9BY8a+v11YJQQSnwnPmTJbJmLAkTikKlv31+Hay2zySehzM0Y0cJfg6oiwiwm5oqg5OCCJC7t51QqDVvuzUyAw9cr/MEVzQCQDRCRXQtoZbrT0pAgARc8VeG8QCRIJ8OpwYOWERTGgM2mvQSZCJDL0x6V2FDXCcAEl4niK5LjFnNa/uzaCaP9sKte6fmQhz4qmkByYbhREhMgNiRw33zRDQcaTlYyfFRhHeA1YK+xEl7U1dzbYWFU5xroewjiOgJ4y3wew80NgwgrDXxUcaq7sCApHHQWIA4h5qesbE5ITAjrEsAR9q5fa1tVuYfeHi90zRvoIQiZLIhCTNWB2r2XXbmurtutxenolQzaq6u29brWtTtdv1ti4h5jUildDAvZnWViPStLWGiFu73tYXAK/bom1t65ZTvpwvh/nARGC63m6//uWX9XY9Hg/rehLhaZrKVAhJEouMNBIEIkxCKbEwoDe0ak7qTR20NW1malpVt+qmLTS8Au+6m1lrHuMhIjHCu9paPCBEE8NYPO7kgBXhiAXu3PMbW2TDWEjNea8ztztWUm3amrm1WuOb8OTG/AO4IzM6IzGywKiFdcB13Z6fX1Tt48dP4LAeD3PJbpaSAAT3cKcXOyccXmiEEomNuVeQ9j+9r+hO2DwAobvVeXPdTdeOzL590FuslIRPczoUydytUk6SEyM4Q9S0DY5kQCG/S/kBABCScEZORJhTYiHTtpqrKRGWnAywqVU1c1/Wdl1WNa+KzQjcyYAAEsIpkRAiOnEDQNt0WayZG6A5AQATEAARllJE+DQd353fHaejrVCv6ArYACoAgwiKkDmokCmhhiONCMjEwQLkzAB4PPjTE5j5teqt2lr102Z4rfvIMdE0peMh414+0s1Qd3kG4uiRUHdEcNqxEmBEN4YDdz96IvWhqm/V1GxZe7wlilWoewwYWJKJhN0Ed2gDPS8K1KBqf6K6AyChxcndzIKYN+NAxITuRMweCDgyVXayso9R/GIApw6Hg1h4heb7emYuSU6OtDbYmi+bffpyW7YNoQIsALYDCG1mqm62rVvbKkSwEsFMm67uWltbIs7d6rZVR5g+z2WekVBIiJgApnI45cNUciIC09vL1//0T/+Yczqdzk/vnlJKT++enp6eRHiCQpQQnZGQgBlz5lI4CRBsaIs5Nid1r1urtZlq27a2bOBqVs0bOFliioKkOIkRc8oOoIpi2EGuGSJGzL61t0om7ta0tdZa09bU3Lat1trUbF1rhKADGYVpCwUxbc3dzTRKgSxSQscmJ6IkEcZjEcEeWQOITF5VB7jelmXdrtdbYrm93C6X81yKqZaSCQ4mEgKzsMNJRCYOxj5KfM109+coDkkgMHRDMPAosxls0huvdSDyTlLADkW/58J9LwbX424gBETA3HPZ8V6Z/HqQocOw8XEAo4KzxxSGvGGnzWiQF+jmqqF2AptiU0cHBiAHYSJHhqGjETvfDRzMoXUlAEd0dhZVInQHIcmSWvMG5gHGvCcjB59Hw7kYcaf7X0i9Fp4A3UGxKTQb1P59dBGYkJlwkPphlWLo6JVJcn+wROPZI2vj7bT1oQxqVQ0CNPkooYuDBXGUMe+U4oPn5T3zcb9PeNjuhG6IiGyuGASum5khmUUG3H6mYK++853YvPsh2A/H+zv/vm+ChMQA5GNH1NrqVt03sxVAd17NW6hZWduq1gbg1pUOtLbVXGur27qqWW2tturgSOgERORpEkFEYpZMlEQQIJiXdVlMm4iUpajqvM2tNndPScx4jzshh
q0nJmQERhhhFxixJB98Q7jC/viRzYJ26RjJiRxCmGVwxZ0WepOGu5OlUQeoZlZr22pVtbX7ZbZtW2gAabdBqrEahpKHtWamYxbQAdgpjslwIAP39LCHdwbHrDHxuq3Lmsqaa621NmE2c3JzJwdHH6Hd++6gV5nqw0/F4QXsFNndffPvLY7dU92R0l+5vonBMeXEJXFCF3CMYl1GAmQijkf1fYJRFETEOT/woohR14sIMS/gxiJIWBVaBTO/rfZy25ray9JeFjOHqlQNGGAmzAglpb97d36acxKeJkbEP35dyqfbUvXr2r4uzUZZ2aBpAFxbXevKdbNWzZqLoCkCgLuCG4IReQjfMSMxAqI4oXnfjQApieTsgCnXtNa8tizcKZ++lLHzSsMfppGO9MCmDSMxRvXRfQuEsQczYszC7VLz2mxr1tTWZq0rRrsP3VvqGwkdyKKcfzez1msOcRDSe94jRYFLkE/uFNnTRGbOCE5kFrkpCBTlcwARGEZgxiSEhqF/YO4twlCAgGAOESp6MEkokso0qYFdr1vd1nW5vTxfbzeERrB22RhXd9e2tbqBu7YW+YqqLfybrW0hBNhMA+/1ZD5hSZlZpsOlTMeEdGKeiNDati3bclWtwp5S6m8mpSBfUpKnp8vpdBDhw3EuJSPRPBXXGevZf/5hXeaXpX65bk1NG2tjVWmuyuBu7uKgEe8nxtZqrREpI7Ku8SISGZithUZ5qIzoW6UXNV23mtZt3bZ121QtJHTNbN1qJEWGw2jupuoAphoJdz2xphPMYR4ieYg5TZEvWqZpRPMZAEybhcxm3VqrALAsKzgy0ZcvXxHQzKapAAJI1GCM0LBHiaBEUR6ziJhIMrMwTlGE0Wo10nA2++r3/Qy+L/LdMt3ZVv+O4fqOVQIAIZqyTFnYlMwwcpeIgnxhQjPXGg5xKP+DMInk4dU6AKqj9fTi0JAAZmZhXa1pawrXm376srZm163dNjOHatCMBEESJoLpmP7w/sNv3x2nIpdTIqb/71++In962dofP1+XetUxNYDBfwO4tbqsCLpa3ZqrayJTQsRRfhvEFgECC7EhGknwBD2a7nPh42kGxLJITpylvlXIRRCJKhmPtBbsOUdR/9H5vM5gD4JmYKgeitgPmDB28bcZqHlVX5u1ZksdVqn7iaE9DETGjEFCxVuicXLhiJrF0Ngg/KwfcAgAPmJwyiZKDG5EIoQRbWFG7pxuwEdhSsJkpsoIYAG8AkMAuju/QeqIKaUyHWpT85dt29bb7eXr15eXF0ZN3BC8tm2ti7nV7Vq3m7tHbYqardtWmzazpVY1D2lYQCjTNB8OHC5FLpLyfH5/PL5PhE9CM+N6ff78p8/b9VnrxmQ5J1VtZsx8vd4+f/maUqp1a+2plCwppZQJ6TAVRitwmf2ntt0+fn4h/LpV1dYiBt/ILUfKW/YgKdEAQFVba6qNiFkMkXLJYQp3oNQidG9vPbimtq4bp/V2W27LomrX621dVzPfarDbuw5EqESGgev6Ux2QWGQB9RodpCR5SinlnKfDgYWFWVJCAG3NtKnq9eWr39wBlttS14oAnz9/DVB4Oh0wsnOFcaAj6GpzkQ6ehMXMkiR3F1YhMjc3a21TpdaUECNk7KPuYjdJo2gY3qwV6P7Tf84qIQJHkaQ/hg/w0fD5XfJiD/zgHn3bS7hegbgRT1SDpq5q2oLW9Sjh7Hqv2FMMGDEzFeFJaBImxkm4iDSDRCzEkXJ0f0Pg7tZirTRr2lxdjdQZHK0nYO4k3h5nB2KCPdbVC9kDEGESEsZvNIXjfEIIEOJ7wuTDAIxHeoCw/o/96Q9uN454S3ezu9zt+LM7EXuKAfmuSzZuF/dEHLoF/fM9Cph5BIf6fsGeSGYQQVR7VWkQ1OU+YzCcLWRCo1CQu8+vjcymx8vBvXsnrbXatLZWtVVARWsI3jSYWjVVcEN3oi7SVYmInHrJiBFSqIanlHMpzFLKlMskklMqkrIgMkN4F6oaH
kmtFQBINqnVzEWaqPJo26N6F9LCUbdNXcMHE5Mb5OQ5gRKhbs3Ivdckj3LGOyUC4KBGdGdte3Tg4XqzgLzjYtO9gUGIrZjbw1u7L7d+12irQ/eDrtcAdzqJWIiFRu6miCRJseC7yiZ12jNo9tZaba1Gm4SRMh5v8J69tr+BfqztNCMBMzkGjAJ37jFHwiETCN2HhN06vdobj99+c72xSigic5kOc/LNfVNAiOwkcAxrEkUjFkvYEQDUsdeVQS+2agZqHko2xNTnEGDT9vVlXbf2cqvX1dS8GQKGixTjBiJeGArrzPVAa3FOmyHiweBdOmTQ64TXlarq2tbatoBCWnXR7Vf9LCTezDZzh43EkoiSpQwtA4I6OhIQpCRIYO5Ju78TlRPCgFYRsQgICYFnoVejiZGgtCdKOwKMSL2PdIZuS0IzBf0uw4N3JnC4/QgwAmcaMTjz5tAcdFjLuP1uknYRhshIYI4F51mIEBy8KpEG/X2Pw4b5CH7U3NFdDVQB3BC5KXCsxpGWSaEGkZkZ1ZwIWiN1qw11ZMubQ5JXh52ZXq+fP336T1vVXz/+5eOX5+vL7evXX67XK5qStdB6DltespTDhZlOx9NhmlT95VbX2rZmz0vdmklOZSrMfDgdz5cLi0zH83Q8ITFSAc5sxnoDra3q9fnl+cuXdV3WbeXE5/PTk2LKuUzzYT6klBCo1kYUhf7QS41V1+v145/+eb0+O6ZLKZaxFDqdqbb26aN9/bKq2bK21rbAoO5et9qqNlV3Heg3SSqAvXWYubVxvUl/V/OtNakhStHUrEVBFCByYg5/9a5dG4YM9jM40LhZlEeIJGJOKR3Px5RyzulwODBzSlJyAkStVVtttW7LuuJiZttazZSJP3/+omrMdH13gag2Kwk8hJ+CqOnlEKpmI7eTo/cZFwAQIgJv2hDQzdW01da0PViUO6KJs9FG7D5+OlIo/iWrBMI8lTKX1LyqCoDTUJLq3R/M66jaj/NNAbq0SN9iXfWNgAQRmSG4BIdN4fm2Xm91WW3ZzAyMAm0AIhEAEST2zFDYZqoHrOIqmyLgZPyUpoz+XOBrwaqtKyaDu5qaq2/rUsEhoBEAGCecSnKGhqxyz+NHksShG++dDwx3yRkBrAJiFpGcwCPkgo/YJChSgE7udQ/O71bJd90S62gW9NVJcQ8aYIeUg4HuVik4Jh28dUzhUDfoEYCgaSO/jAgBqFsl9yoR5rUYCfdHZBUpCAaGABHGQURg7VPNbgC9WjRWDTOaOxM0MTXbGANhxZtMTI+Lyt1uty+fP/9prfrpy18+fn5ebsvX51+X2wKt2VbBLGXJJTFTPhyfLoec8k8//vT+6Z2qf73WZbW16qeXbWlWSjmejpzS+Xy+vH8SSXk+5PngDi9rW7aGrfKtgbbwg56/Pt8WfllvxLxVR86lTD988GmaU0qI1KoyDafKu7zBdrt++vOfl+fPp8uHpw9HknzAfMGy1ar1eVk+Q4VITnD38LDqqPhoqq0pIqY8TaaIGEyquzdttdVI1L6PD4CZVdW1ta3p1jTyJDT2KUskXrIkIh4eXKfewy2KfEc3vVsl4pTzfDyGTFWIc+ckU8mI2Oqmtda6PX/5Gun929Za3Zj4y9dnNSslLcvCRDmJW8BBfMzXtqHnae7RbSWJlJIIkREQrLVmzVrkKOwVAAM+0rBL4UhR9wp6CCVQ8r9olRAQQ+dJQBKIAABxIg4pQ7VIv3sr7jG8KIDwWDBq94gisTpqO6LGTR+xYvekYtehASYKqTkHxKa2NTWwuOXWMJ4WfLMDhZjBjk9gQJT4Z1jlcbhFsQCEf4kDkEYCo3epDb/ndsAeMfzG6x1xid153aHuCCwgDkTU423u/R8713c/PnrmhvvbADv05KD+DkZybRdO2b8C1DCROwSRr+bRGMr7YRCViQ/e695n6sGYwI7xfMDeMErQ1faYQnKPzF3RenIi+r2UanygWrfl9rI1a605OCCwsCTp4M085
zRPhYWPh+PxcMw5zdNc8tTUcxVzNVBJlEBFCkuWeD5nkcSciMQcEAx8jzk6dILfQBGaovnW2lYbcbPRFVVERFIPnHuXQ3B1rW1b1vW2lLLqtoED5pSEHChnzjkhOi+MnVHreWTQHcAgO2hfEu73tgWdlH59jXnpXx1D95uFbt3dKtGOu0NBf1glCKxE0RqLo4tPaN9SlNIy08jptZ7OE15nd61DPLNGUsLYlQ/8QN8JvocjrR+3sXeYmJiSSBIhhNRbLqJqM0V3jBhl50sAoAdw0XaC9Z7E9/b6BiuJTPNhPhZPbCUDRHMLNrOtblGmpFiDnsS9uqU3VesBZAaKzADgpMBrq5+/Xtdte35Zlrpt2gyQGbv2VPBrzMScEE5sExoi/vp18aboiMYAeMPyjHMFAoTDxM0QIHNktIX6iPdE2Gh64w4GrmaoIdWqO2uFEPmZIQEfVmnsLnN3iznsfNNrC4wAxMiMndWGkTAxtnUApohTdSrA8VV3t4eZ2JdmpAJYwHhAROBQPBsvKl1PDqcsc5HEPJc0lUTYCxXNLDGoWkmcmNSsNlub2Shh6bzVYOVxT7DyISsaA+PuDgRO0MtK9libmam7NIx7NnM1S0KPlltb+/iXP/9v/+v/7CSrZRLO03R590GboRlXQ/DT6fj07pxS+vD+9P79iZlLmjOXqg5YZVXJbYMb1yaSmAsRE81IM6I4ZDMx91p92xqqYjMK2GYeek9NzRFRXiR9mbfamuZcpjKdzsfDYRbhlAuEx7G1ttTrl5ePf/zz86e/1Ovm1VKZDj/95nA+FU8f3p+I67Iu5puDbltdbstWqxsEo5JSN/Y55/DFW9sirl/rGunXb6glNd+aUdXavBm4gQEhJySWPEeuZykzizwg6h6xwj3aG7sPgZgJMYkcDpMkFuaSE0Vfa+7qEnHYaNNtq61ut9t1W25uOk1529Z5zrfllpK0lsFtlL4BAoANK7bVbd0iX8o9svaKiGTGnEi1xX5orb1QUF4W1XkY7Qh7YI8QQEeZd5zIRN8yk99kBhBzKiWXCZggJ3CIQ9pMHQnqBmZkbqB9XHriQWxw9C48LEQcYk2O1LS9XLfrstyWdWtVTR2IWQBC1xGRMKVI/4IJLaMB4telelM3NCV31IytpEgnypnZUFVw5KyF4kRFUwMF0D6PXRfQ3dAUiPYzYGQVIPTKq6hcBUez1g+3e/LFg2XCrupLnYPeVX0B3AnMAAEMB9R5eNq+vMZBMU7WKIIDs4FB43whpP3miEKUmJgwC5ckKRI4hIlQhJjIzAjBzISNMXpJWWrauVUNvm9U/I9Dj3avznujBw8V554uC+HKOYS2Z7hykYNubKaK8tqDM7Pnr5//8uc/Yip0/BHLSRLzqbgjmyd1Anz37vLjTx9yTh/en9+/PxGSNXLF2ry26qjAtTRxqsTMLEiEmAkTogCIOUd5Zat3e7SHy6v6zdQBUl7Ly80cVV0k51yOh+P5ckZCkeA6Qau1ra0vy9dfP3/99SMaJk55nqd3TyWjI5/PE/DpeuMvz19u66KmalprJSTiFBX+zIKIkSHeK9Fqr0QzU/NvesBYLwvXrq8DHtuWmFKWlEVSno8ssmuowv0we6WN0/c8gjBPUxLh6AeHgaOJYMcNvb1Cq7Vu67osCwC8vLyo6vV62bZaW32UqB9JSB2CNtVWG4z2IISUU85JlCAxmKnWqrXWVrVV7VpE5h4pJxEgCiE9JDcNnGrubt9hlb6j2333XfDuw3SHp5u9nqTVrRLAzrqH3BkicXQEQDM0A1VQNWsNzRIhcaRQAgAIR3U1TVlSToIwgWbwJIgszmQAauAINiJpSM4OAJiTxPuNl21a13pr2mo1gGbmwpE0YBja737HpXdqZwzKm/jZN2PyaGEig+xuZ/qw9rZgvlsd9PHNSGgbj+/EM9yDmDHATkPoMjgi7JmfkJiKcFilLCTMiYmZdoIJAZ3IEMBBmQm7dlsXbGN3cNYe3dMWZYkhg
dkHxRHG/hlxw+H8x9yG5hJRH0GH6I7xaqQcXJvWrTIkJpFUwAlEwIndszkBlumQc0k5IbEaGHjbmlZo6rXqnrQ8LHI/uL37asOXePCBOk1BzCQNR94wUlSTf0tb7DNJSKHanSQlidQXGIEMA8SceJ4ygJ+OR1UT5pfnq8aKBHQHRhKRvuQJEVGkty1yN0SUb1TfHnz2nUsAYMSuDxzzymHsIq1uX2PDKnWoC6MBKtL+Ye/qavvCtj1PXFsPQ1pP4QyaDEcAd08L21nq4QeMoP+I5+yLU5gNIInkLIiQRTYRUlWibm3vh/FYVH0fPeyd19e33QQwpCjAuYs4jxszIwCDYfJEgc0edhREdwgAQBTJxMnM603bZnWzel23643QL5kQ0AxVEQBFiCWJ8NP5eDxOBJCskVtCZGEjbE23bXNzYAVaAImBMzIATuXowCJyOh+mKW/1+uXrn9d6vV63T59fatWUQFiZDLF6tMBwiurOnsndJyLgwgib7XvhO1FvCF+zEzcjhBuA0RAMQwsHR9HxGPcxFaPQbLcFGMdPBFyZKAsjoDkIBrmIQoiAOdGchAnPh3w5ZGE6TvmQU8QECdGdlNHMVSwx2wjnDbcS3KGphXDhutbWNA5BcyeEiI24o0ckY3x8Hqe1IbqDEZBRJI6zOyuJvDrt3Hy7bS+fr+Uox5/n0/kHBCGaETkBTAgMcDpNl6cDCxHBsjZTv37ZbtdqBmulZthMzRQhmm44kgP2+hlzhPB2tXprXYLCnJBSmvJ0VFWo1d2BC0pGyoC0Owz34IIDASVOLmUuh6fTWdo2TVNiFHSChrAx8eUynalsWyslv7wsnz5/ac1EvtRNlyXSDvLhcCYiIAPysEQ5ZzNd17W1VjcjfpXy5g7qoI4GBMQAQBhlTyJ5klxSSrlM0dg2bNO+iSP17k7H9EwOjx7eEDVDnU9B7G0Zu9LAti7r7Vrrtq23bV0IsW4bM5kqEQmL7CmTo9lyVBlHMqCZgpu5ghuYRjMkEUJO7uw6M1itDU0JoLaGZosNyheG0NhrGV2F7+2x72Gl2C9d5PXeyCnIOCBCYGNA6g/qTFZsva6STZKIc8/WNdNmWpvVxoJTJiI0hQgeihAnFuHznJ9OE7qjMphFQ3sDNKiq1dCRLMp0EVGQAZElE5Vc0ocP747HeV2fma/LakywrguTEQGTE/qo0gkHGwezdE/wGesF9n8Me/LNiPWwPAXy9n5oxtPv/mDk7Y8yMRxR0UdeyR9E1gGiRyICEzl3ftzMuTeVwZJ4zsKEc5YpCTNG4xnsqzHyHsHJ2aJoptfB3aMQ4DUcBzUwI3AzqGZgHep2XxzucKlHSboY7JCFxx7wQEcAo2/AUqu6LZWTMuWcD0RJ5EQkCeBAwIiHQ5rmQoSmW2ubNrvetpevqzs2ZwdqPiouwbF3yotoJIIPpjhSxHfmOXq3SSKknlJBDBhCIq97mQ7rhIBEzCRZ8lwmK1NOiREZgdAQGiJOU+IsrZk7zXNFpOPhz8uygtdlae5OxDllEu65HECIIMJRMcvMKS1vAwKd4OtvIVAeIu3ZRtSFbBMRsaTuw3X03XnKO4QxAwg6u6PCB1TfKe7IiWqttbq1umkU4GnruNR9F3fj3h9zHNcjstP1z9x86KkjOHVa2MGxpWSlCNNyy1uuhLgyC1EPN4HvXBUi0Pj3Xylie22VxuS7mnWqYxR2mJvaENc2MxvFbcHvgjmAmqkrEjmyYGSFNLeGaFnAE5QExxmZUBVaAwDMU8nTUYRPxzJljrQCVyNEESEkr8De0CyllEoBRHVWICQuU0n5kJIcT3meE0k+tTllM4OvX25gDhDaKcOtRSIn82hnFr1bH/BpR9VvfLi3Ll0f1t1Hix9Gthh2q+Nvnr9jlfHtWEyg2jMYgx4id0RUYx8aSdFPhRCz8JyZieYplZK4iyIyDpGZsD+xQ5kjIwnub48QHEiDDDJtCu6qoA3vJ1lPSveR1Opk0e26E2C+c20Pj
t43YBLCKyIW6trXrlpVnRgVCRAVQpkryv3ArHewcUd2jhWnjtBLhvteMzd0IOeHdmw2svSiMW+WVBgbKZAZckJOQAJEo9ezOYQcCkZSYt90iMjx1ZXaAKPiDFsN2V5HsEQ4l/T+3YWIrteVqNSm0zRzykRo7tbb//YoPhMDAzN/G8cFpNFIzMeBP74e1R+HgdiPMxzgCPfFNRacd5SLwxePyOtoGtUTJXtafv/QPTbJIpxS7/LUsy27H0GEvQYuDqweOhkdOBGjUNRzErcswtthc/etVm2VANS01jbkgPaN4PcEglfN2L5nlQAgkiRrM7QGWgcxbGa2batqM4NmYAaIFCY6MqrdfWu1akWi0wknRFcz3cCqYD1PPiMcJnp3osTYFFsDQD48XY6XH4koCyQCN11Xa82IJZWJWKhWTGRm8zSdDkciWptuqsx8efd0OF9EeD6WnFOtOM0/bNsxyafr83IlbK1t2wYGiMycEcmdI/eqyxpijyK69yT/PS4O+0b85uqVaD5uEadYPPXh8d5/CH0ColvlUJkN5d09MhwaxIAwovYQqiLMFOLvSbhkIcQpS8lMhJkpcSC+/ga6wo6HMFTQDwgIoQQNAFEM25qiOxPWSrWp2t3cqEFoNpiaEloEAQaIGoPyyIX1bx63HEtK+ZDSFK9qplu9maMn4VIEKblVcwVQdW1ghsCSJnQAcXRHNQN1jQBF14UxtepAEbp1cEBFVEAFBEdCTjIds8FWq/jNzTjNJDOlCSQ5kzM6mmPtZFp0M0bEQAiJOYtkToU5MaGbbg6tNXUwQBIskoUuR/w3f1i39vnL7Y9/+ryuzbrkoatG6EWDzIusyiQpp/xWtzvYIpJAGgBdLyTa0gVckiSSZA9Re8dCnfOCURk+yuIG36aAFE2E0MAVHdyD4G5b56Gty54gM6UkuaRpyvNhOsxTKTk60O1ndUQbmKJxbVSbNbOmrYWubGQ5IaIwTVM2tZzkfDps25YZX8q11vr8/LLVamPx3xNhbGDeb7bZtx5ccOeh6xMMsfU137tQ7lkBfRdGc1Rz32rbWiWipq3nz7u6K4Ildk44JTgUzEKtQRUExNMhn84HImJvDKoKquiAJMRZSJIjaGuolkuepkJEWCtUYJF5zqfTxExlTpKYWVSLCFynkkUqs4e4rQ//M0qMe/Wp3R2vYTjCeN+N0ncsUjcBj67wwAs9MSMYI7/fYAQpQ/susqLNdWQ3eiguUe8rtQskExB2Ofce+s1JQt0pJyYEieMUIM5L8xHVN/M9+SpKkYVF2AGQjN3DxYhKcewmrUcCdktqIwfOhuf07ajsL/1qfAAIe9cxQhztm1TNlTCOM+2nOKiDWgSjiWQsVwcPqXqkQQdDYKWg53u8ECy2qPfITHhAiQyQK4IhCVLkqPCggX1ozTuM8DHAA8c78EoseDBTb+YNkVNKxABJLudTbQ6Qnq8mqdamW+sJhub4cKYFiOjCrd8ZpCBww+OnvZHIyEvb+ZJBRA8GADqmBQMEtPs56N4JziGSHQeI9STIngXZT8G45d6EUrpgyWi2AvtjviE54kDtWKkXZBAFrc/xQpHZe52KtkbgC5MqgoENr2HfE71q7put9tYqhR029D3osfs3SMRR7+LkgGbYFM1gq3pdNjNr2tSU2Nd1YyZXq7ebbpVsTeyEeDmln344lMzrZrdVHflwLodjIebMKESqKrfrVjcWydPMItq0HQ9uPpVynCYElG3lbUGiVBx5A6KmVQHrVm/rWrdtqxrLnNmSKCAgkmokKMFgc8jvKY2dmBjk2Fui5M0VDkEkId2rxvpaHwbO3B10BK2tmkfetpoZmFlTAw8ogESQmcPopCSxjoW4M+tJwp/NIkiYmESIOv3R32ogNzWFkAprzb17CYAYFd8AQG7mTixlUwcEIlmqdki+9xSLpWJmYWg7MbYbpn0R2UM/64cdhynn6XAs86EztebRjaNpW2tr5pxSNiBANdQQUevUiA+xM9DI2
4+CeEQjdiRHRmYWIfecxSujQQIkjc5bPcI4HJTQK+MHyfmBKnZfHXsBYUy7hc4suZn2uN4ovdZWrbk6opMgziV9eH/eqi7rdr2tTfW2bK05mGuLIDpGdqXpd7AAwPCierfQnq6PndjppahdAr3/Pt6IoQ+UbSGVqqZKCEje85Fp/EfYdQUeXsMj55ZJRFJOpURCuKSeV4DjpBuRnJHrSND7y4IbuIKpu6KHvmPolIXr6iKSktStJuZlXd1sXSXGKoooKig49LKD0RrtX7JKg1bs4Gq4H4AhkNZP8YRIy2Zb02Z2W9vnr9emGsQkETKjW3XV9nzVdS1ip8mK8I/vp3/zh3eHQ36+bp+eF3Mq57mcj8QyT4eSi6q+XF/WbRXmac7MHEkB4CDU6wBvt5frwoCQZ2dZHXxtatXWtX19Xre13ZbqyMyhZQEATsitAe7Zk32P9TrV2Gojpn+nDB/9lodNF/oeHeh078Z3hGS+t04zr63jy7aqqTe1rUW2p1c1ACiJc2IBPEW7VOF5KilJyHh2Ea8khCHmJREbCYi0N3npSAzGMg2H2gwIkaF7cMJBeDtAq6oGLMKyXZfN3Ksa1H6Mmjs5RPYpIph7yMDt5Tr9BRFDC2XA8X4R0TQfTk/v83SQnAHRIXRr1cENiZghZW5AhKakFtw+A7ubVa3RhVR9pDtjlPmxoQAxSk6lgBvUJC6giMBQjZjce51mHK1EEe+XKMzpsVI3RzA3BHJ37AIxvSbb3La6sbNpC3eAoatP1W0xBUAmmYjkfCyHw9EAv3x9+fj561Yr2G25upu12rZ1C/adkKNf9LcmaSCmsCOCKBS9hDj1DuMcOvnUDayELImaAoKph/SSaW2mjQlRumRER6qITEO/JqL4FGF0ksSIqeQ0z9PhMM/zNE0heSAc1tDNYVecjGPYEZ0iahQmyRooU0ThonUCEwCUXMy8tZpZltNpud0S0nK73Zb1M760qitUa6qPSXr/Cg/uYfHB/Ru/x+EorDihu3e5jFq1qRIDkTugNm2MoKqtWmtATgTCWBLPcz4ccnMvralhiioCkTyVUmZVraYePXWnLDGufi9YdPemkpQBgRmQepqxdg43WmTEecHkxhzrirrx2XM5ekQDO/LtFueBqv6rSS4j1tHBcjcJD/G0fgcfSZyhfGZqIQ0eWdG1FwOHjAogdUQjSVISZsoRggk9ii4xmHBIk8br4DBH0NlNAnDFFiQnRMEPAgsT8wiIgztKEmnKor2FvO2oP965g/cenDuq+GY9DIj5dkWFBU3Mgj11pDOuaL3vaDNrBoxgjtq5VwdACzrax7VPysNXSAmBIzOBoAMCoys+Ujd7os1DJGmnh+/uw77U9+kfDKzt5FncJI4aU48UDEQXRuEESNu25SwAHnlJgS3NHAEs9Gbsmz03lgfcX7w7aQ/ZKoCdpeyfY2D5MT8+fDM3C98GeL8TDZU2GN/sg+docbJRV03irmE5cgDGGn8YnwcOsS/rIcB/t6+9ODSiwYAIuWRwd7OSk2tTVWF2c26EgL0v4XdP/u9oUTLllHJJTupdQcU02pWO81hbdcDbrb68rFvV6+221Wqm5MgETrDczDZCN2pKAEI8T9Nxovl4LodzOeSkzKu5ASYBIUxSTufj5YNqgzKndWHyIs70cAx3qsvTzAeeHAAFkdHcnZnMgPzgU6oueUXKbWvatpDvMXM1AECLzC4HC+ESGMU4iIwMELmW5n1Bd27k2xX1SP4+oJX+ZUM5O3qCa7O1qjar8Y0FFgBEyAkoAtoplZKFOacUVimlxEQsKeXcjVOewqejHmreyfXdLO168lsXrMRw1CgKR+LhramTpGmT67JWk5zWtcJ1aWojMom7EHI3Y+NYejUI+L1V1X3kEEroh1ZrLZwaTgoOpq3V1ZS0aUSmrY0Yv7Z45xE0Y+acmZilpFwSMR2yzJnRqc3JKLuqorqAWzmfDoTAy1YVqlpmQm9gHAkEFsSUR6JBBKJ6SQ0Jp
5JzKURGZEQMgObGhiTEhEYAZozgiOYhUKcR8SliHy5T00T4JALrurnZtkT32uruIef2avWYWlut5YiYh7wmOiEouaIpKHgTBQckQAVEax3Ca6uvJNzc0RXcETkRivCU5FBytHFMRO7m9QBtXRM9n0/r7WSqdUva2ul0PB0Pp+M8lcJRedQroB483btFBEYwDD8uXHcFU+jsM4AbAgF4JLgIYUkSvU7r+ViS5JQQoNZ2XVZhVLW1VmnVTeV1NOCtVUIAjoZFJRuZk5t5rc0ja94MHMysVjPz23X98uVlrW1Zt21dzV0EgNEAbLXNnQGOTEyYKB0Px/MxH8/n+fwurBItjRQwJRDGlKan9+effmeqfPiyrQt5S34lbwBm0AC8Na3VwD0nyTMDREl9H6PmQAWwkBrWYy3zSavW9bYtL6Z6u63LbQ0MZcCxf21kLoU3R0yEaM3Vepw/er9/Y5V82AF/NE/+YJi6yq16bV6r1ma3tbVqW9PbpjpEAIjwOCOLcJLg8oU5l3DwuaQ0bNFMzFKmPB37CSc8XM1XZiJOMNWmdTMbfWUAHh6IjmCqUua21TJfm+l0zS/XRd1rVXNz0P5I6KZoZ2Bg4JfxmR/w1atlFDs/yuVMVaNFByK6ZkfQVrdtQaSoE3Xzum0aokghf0rEiZkwsxyKiEiaUpkTMR/mNE8JwYyyZXVtjVQ3INTr5ZiEWJat2tY0E6IraANrbjpabvfzvUMmQmBkkVKKzRN4c2/hILu6ozFyEnF3BjB2NV+2ZmpA5LQC4pTK6Tg7wFT4dDjcbsvycvvy6bMrbOu61bYuqz22F3ZwVa2LbWJ7US4zkZIjWkMjNLe6aUTUiAEx9JjcXVuz3nlpba1GFSQTIkOSUpLMJZ3nnEQSd21CtirQ1pKu757atqi2bS3a6ul8erqcTqfjYS5dNngIp4w4gO9NsZl6OHAUdRiY3r8I0C1IrLBhBFRKSkyJEFXbvN2mkphabc/XayZoqteVZEU3k280zL5RfYOOgHFImb39/cDXUekTxT6D5h0Q0zxkNIHDlSKRLCmzZEdxFAdyH7lUkRDBTJIAiVMRd3Jia+TooOjgYARdFRmjRRcAmKs7hc43ABoZRnkJWUUVi8JSba02o7WCu78NGT1QuZ1vwvsPv8nF+evXq90KADtHY4NmevzqAC3UFUKxKxrSd5WFGOkB5nuXCWGR8ORYBB+tUnBk7mGoURkAaWjkPqKccfaRJAPA1DTnoqqpmYiYA1oI8non/l9jo/+C8difco+rRcgmOs05dcPlQOjgRl3OjAARnLt0BAihMApjdEtlpiyUJU52cRRTpJYMvLVWSlLV2qzkhEg5SSjQd7b7dRxxbLg+0pEg5E5Rw7jPJvaIFFqPmEUaVSR6xO9dGBwwi5ScIjSeJYEj4jZY2Tej0hVUIoUSRoTlId44GHkcnIvvfbg61YuDSYiMNmFOzEk4CyeRJP17j1M8JTeNJrqqjOCNKUfjuodWwN29DQf+YTkPDmyQ37hn04ww/QjJAcBgQZwAQ4tDmMA4CeckCJCHukBqWplknPyPw/Q2i1K11XXZEkBboW3uju7UM1EdAXxvjhipEFtF9yICCFkoCQGAb9VbE6Z5LnOWw+V4/OG3p8sRD+nLOr8offzCv34yM39ino+TQLFG66JAmOZLmi8EjXwhb+bVbHXQpF5M3Vxr062CQ8QhAWkSAWZ1WpXV0RpaRTdo63W7PWurf/nTnwz+1Joua7PoOhk8YJj1+OAOhmAO2newYwgEfgcO+OuvsYpgt9duDl2HW62q12ZVbVPf1NRcmINYLNN0upxLkjIfUp4QopZCmYGgOTtyImISkTzl+UTMnLKk1CkTGHVG2Be7g1trUjc3M6vaqj9aTCQkNHPOTVXTvDqndVmmr8/IaV23bVtvy83cRhudsQShlxfddzbeS6Xejo0ZmIEpupIroyVyEJgSnDKkhMcDXy6FOZSrEDzabZm7eSTCQF9yKdNUjMSOR
zpfiiQ5no6n0xERwGe35qrb7abbdr0uc5mv1+X5ZXl6et6qlkkOh5yy/PjDu3meIsxE+3m/kyIEGIgoiRm4Wo9g3Xdj9CU2B0OCXGQ46ebgYLVuDoBCeJxzYvy73/1cSr7dln/8T3/69PnrbV3f5Cu5Nt3WxuJIEFmbDkJCyNGBnj1UNyKjkhHRiBKDu0Nij17TMAM4Ex6nlBOXnN6d5pLTlOV8KMFaCxGAHzKdD3nbNkE/HWdt7XZ92bZ1nqYP79/N03ScpkhG6orq+5kEFroV1E8IB4KQSGA3bBUqemXbBJkiJ6ATekjg7qrgRq6JMMrKfZ40ayIQgKZaEudEhNALWv+aVYJoKbOt2wqkG+nWHV/Yk8MjRhkhYdNWW11ZJKdEiCVJSezetSgT8zSVec6Hy/n04Tend08O/nk1X/zTV/742dxsPrFgESymtG7GkubzKU0FwRA2BDNdVa/uLY4pN6+3Zbsu7r3DJBKneeacmtNi3JwQE8GEQG29tvW5bZs63F6et23bqqlu/YjZc3VG50NwMAgHJjwQ0++leD2aJITBN4/z7cEwRWm4N7VNe5uATd3MiaPYQaZ5Op1POUmZD5KLm7V1tabMzkiuLtmQhMPHm48kSXLmVPAOqCEEIoZ1BNOq2+am2rZWF9jrVxGQOPovJnN3KHXjXGrdyuGzu6/L8vLyYhCNNzRSqu5O7jBPO7rEKGp66+JGuFfRNTryMFhmIIdZ4JQxZ3g6yA+XHNI8iQVCGAzAzbZ10VbdtNXFTFkoZWe2pwN9eFdSSufL4Xw5jZweNNPttrRab7dlnqbbdX1+WZ4uL7VqnrhMIol/+PBunkoSFhEaxa6wfzYEIIrsZlSPhuGE3QuNxATo9edOhJIECZvqVoOsqm2rAMg8HacyZyH86d3T5evzy21Zt1pfrjd6pW3uZtrqysKAgiTAjg6MwhELdCTA/j2y9FL73VR46FxxosiwfTqUuUhJ8u48lyQ58aF0HcB41W1O2zq3VnPiy+XUan3++nVdlpzlfDrmJIdpYoCobgur1Mn3IXfD6IKQyIE8ISCCgKE2qOgb2cYYmUqu3ST1aIyBA5klAhFiEJqLmWXCRKiqSUiYwP2NNP53rNKO4h6Y9r4y36h17x4KRr0J4kiJQuxdFzjnXKaSp0nKLGVutdZ1UdVWo8V3L/rAztG2wLRE0juQgQGhk7pLCEk5GbKhaJS4ABgyAbJDbPTMEGnPcxjPqGbiJL1DSFerhVEhcgfYtpsYGATR+Me/cD3kv/RcAdhDU+4+/toZDQiTh8ThiqWUck5JRISYg2iIhLxQBbynvO0VCcRdkooIQ1wYRpZbeEnOsY7DH/QeSLPujiABADG6A5lxyg4gKYkkHSG5/tqI+8QDDDz2Kizz8BfcP5sIl5xSTlNJpeTK6NYa41TSVFJOMpc0l5ySZJEsCUc6kZll9lbJTJu4mQazRkylSHRLzcIp+D4mJDRFT4LgtUYYAJLwVJII5yLTIUniktNI6uy4+JW/MCJ2PVZ3/0gP0+X3Bz+Eo8ZjdpoNIkOVck45p1JyZAMRPmIlRMRIXCROKIk5TdM0z4WJR3a1TFNmFmIS5ohUxIt2SQNETkxCiek4lylLTjzllBMn4SRdXSYixS4MJogwlbxNU2PWVkOnLbIBov/4K/8W9/Dqo15KaBpgd4jdu66iWXTL8iD1seuKDQ7PcFAnXUgtGojvkmHhQL524b6TGTDCm+pti/TJHjeOFmvWfTl1Xc1vBlyBDAjdmnlDQshIuaTDYfrxt795/8O70+Xp/c9/fzw/ffzll4//9Ovt+gJ1Sc4UTJI2aHV9eV4Vy3w4nN+RTETEWZDJvbrdwNVa1bq6GvsiMLubtRbt9zZH3wAoUT4xZ0lzmc5E0upzW0vdbuVPByyIDp7MuAFEKlwYC4N70WNPbAfwyCJWC7r4YcDiOV3h0kaAzz1cNrW9TrBXHAX+2gtlkZAgl3w+H0tO7z+8//E3v0kihSkRt
lrX27JVMwLGZsxZHZCRElJCzsQJOREnQKQdKz1EjMPqIgmAQmQr9eYBYWN6BQNEqz0WA5DWWrPD6ZlFmultubYWyGWPM8a+HVkVODbXSNJ7vJj5h/dP//D735V5fvrhN9PpUuv2/Pxca52n/HQ55sxPl8sPH96nlKZS5jJhT2BAM13XRWs119Y2M0WKHh44H+bj8cjM81ymIpEhicRqSq6NoG6L29rqNQn/+OGEgIfTfHo6snCZUpkyITKH5hdYj/9bp2doN/o9a3TA3TD54DyMWRfKQ0fohQ73I0HdFnDMgsSCOP/mtz+kKQNRKf/Lw+6CqUzv370/HM/z8TQdTiLpw7sfLucLE89TTsLMnEsORUmJpiNRndaH33twhpEI5yRJiImm3O2yjMLImLxE2ERMlQAO06zaltu51o0IszARzVOnmKg3RQj1ZA/5Q0JkxpJlnkslsFUaWBYicDRza1brgMYKI78BYBzK5qAN3cid0YnABSEnNTMr4La1luQ/h5VwcFpuBqFw2g2gY8/sBHcyQAXbDDYDBCADBEB2UmXCUrAkmabp3Q8//Pi7nw/Hy/n9b+bj+fOn65fPy/Pnr7O0o3BCEgc0da31dmu1MxJEmVLi+UCSACr4BqBtXfz24qrsyT27mXK10Wi0qUqSiQ8scy6H+fieRVpNrUDdcjoUygAKwOY0cGYHeTqIOkOAzib2QR25wq+vPZ8mclGG4hiMrH64q5D5iNWNZpMxaznL4TDNU7k8XZ4+fEjMZIpmgORArRkQNDIItX9gIEESYkEWIsFotoO0Z+n4HjNDQONR5j845B5Ii1xiRsRQPgTiDKCqpW7lcEDCZV0kiYObqSrGiTTyNYdLMKICAYlHsKBfRHQ5H3/78w/TfHj/88/H82Xbti9fpm3b5ilfznNK/PTUrdJhPhznOdKW0cHM1nVprbpr02quexKPiJSckSinnFJ0pwx5JgJNG1hidKvallLm02ESyeen09MPT8wcfEmYD99nMA76zjMPeTVEh9HGxDzUFEJLq6c8j48cqZhm1j1JBHA1cwQUyUKCCD98eJfK9PKypJwejBLknC+n8+nydH56f373Pqf80w8f3l+ehGmechZhxpwkcohCKKaL53QXenhYhBQKZf1f9wV6B/HgRmjC5sZE8zS56bYdtbUO7sCTcKShEO3aEQ4AbiEMABRC3TmRa0tCrsIdpkS3InDs9Xhx8g1ipN/KDN3JR3IfE2YxMzNxy7d1k7e6E99XMunpefcMvYHkEfb2rHdPJdLiw6YyY2IsRaZZ5kOZjvN0PKZpAsIQC4xQIiOkxKn3ZAYEIELhQYDu7uPO6jiYghuaozs5kAM0hdasqd6WdatbykBpzUhmKSxQLzgzBTAgQAYS5ExRKw4I0LM9HrxS9aieM0d3tNFJ7m6Sdm77FY/k+2DtztpDnl4v+cVgNRBLzofDYZ7KPB/KNAsxtM1bI2q4p573bLix7N+yN5EPNOwF3Cdkx28h89WlJ6IpnO9op79A35BjU8KopNrjZvvH31/+wYPDB4mx8VOEnNI8l3mejofpdJi3JGBaayoln06zCM/TlFIWYe7tWTBOCUCQ3nuG0dC7KQFAkBAh2Asv9heN08EdAEQ45V3AOtq+7B8GxvAg7NN0d9gfbxjFdQGE6X4mjQHrwQUHU9e2r1FMKaWUwhPt9ET0naY3Mwcl58vldH66XJ7Ol8sppXQ5HU6HwkxTjmQ1Som70xSHCBPznT0MSx3vR3D0ENtt1liofULQkZwcmFnczDBFfBxCetF7Tc7wo1+93R4Gxl5KqSJMTrSnfXcQ021CvOYomxyDj/cg7H2sOysRwinfhEy+sUo+jsbIBXTbp4LAEcE8qirBW2SLgzCVnJjwKH4SSIl++vH87ulwvDz95g9/98Pf/R6BAWitW2sb2SK2zpLfn+aUZC4JyIGglMzzIU0zI1kzdGuLomCcSO5mDbSSG6iJgavr8/Jyfblt2/qXj7+8vHw9H
k+/MT0ejg71cDowuOpt21627aZeSUAylJO4JN9b/7ibUlDEpg5ubWt13dxcm5hK03vf5LELQM1bJOVF1ZbvHlxPiblr3qJbONYAjsjMU0rM9ONP7//hH35/OMy//f3vP/z8d4SwPX+pt6s7kKSw7sSJhClF+zvpmh7d3NlIFdqtUu9w7+7aWt0201aXZbte3SI3EoiIRQAEO9KJdRHtXgkxmNbIro66WfeHEp07tRJ2KHhge0ssMdG7y+nvfvPT4Xj86be/OT+9b62t6621lnOaDhMziaSUExIJc9QyRB8dZkdhuJvER0nMbpcRBzVohg5DX7ESwflyTIlEckmFmEVA22bW5ULi7BuQ0jshsqeYIRjiaGYaHbQbopuK9f4jvfYjdqKpb0urW11u6+16A4APP7z78OGJ0KMTIbgKWRIQfrXPEfGHD+/+h//+33744cenp8vT5cLMx3maSqHeroZisgImDouDnXV/tDu4Q7e7IRonpO+oBxHI0D1wHLu75tQjnqbgRtibHtKuG+PQn0gIwpJknic9HTcmWzKDJaHERIQ8BiRSZrvH29+OBZ0U9PTd/A9p5sRkOWrOX7UR+p5VGh+wcy79sPAeBw5J3OiCFd07ARgpJ2bCkqyIl0ynU3l6fzo+nS4f3p0/vG/Vbi+tbc2soTXymjnPU85ZJPUm4SKSS5GcENHUENyboZuZtaBvFCyKk4wDS63VX5ZtWZaPnz5/+fpprdv5chS2PBX3CiBmtbWt6erQiJ0EUyEjibmKYTJFN3dDU3dzBfVWo45dDdTaN5kB3vd/zyAZWv3dZ+vh4ke00ZcGIjHlLEnkfDp++OHd8XB8ev/+eHlCd2gt2gYGW4QYbZWIonUBj2KAEdGOvTP2LO1sSE9cjHaptbatumtUdQNHEVg8J07F4YZ1cdWu8XJvGgoACAN770tu5ASMWzwaJiKa5+nd5XQ4nj68u5yfLmZW62ymklKeSo8oPS7fsbARKZEMJNc9zwe/ZB/ufcf1Wl4zQ8RpykTAJElCURvMWigyjE8McO8ausPeB6zcgQi4ualGPmOnaqE3wMEeLnSt2jZdruuXT18B4HScoxqaIiPNjdAjrvYGfRyPh9/99ueffv756Xx+upyYKYsI0w6AYlIHrB0DPAIaO3y74+T+i87mBP2M3SRE3XIf5lArNGN3AzPTFvptEYV+ZfnDQ8LI8eSUUskZta0iICzcK8A6wI5Hu4U20HhD3Xrga252b0FCvXqav3HgvmeVhmfSOZbYIw/LyAEd0YV4SmIOJVFmCGd4KlhKOpxOp6enw+WpHE/5cPTr2up1XVZtW0roRfJc8uGQc+LDkQ9nkiRl4pSIIxnEQBvUzTX6oS5mpnVt283dXJtrU23benNr4MrsIkhkrd3WFcs21+1GBNo20+Zqo9ONgSloA9gx5vAMwQjNyYTdEhr17c8Vvxmxe3vb3RgNDul+Itx1m3qyMhpTyel0mnNO5/PpdH46HA5lOohkcGOJhjn9K8oduTsAHZ0My2dmNnYH9ncE6GatmZvVddluNw2stK7uFmI9I7I4Ik2wB1p9aDq3aBBSQ/wh1EZw9/p2dskfGO+3pFv8dF9uvVUdiBn2giui3QTg2G07OfOwye5/43CcYdAV+54ZjjcAIrGwOEUt6XByHh3pxzX+sE/uPJnfX7mHoYcqQmiOdKUSBGRDMiRDbA7V3MHW1tZKzCAkREbICAT+Zv0gQLQhmXLOaQxJR0LQo1Hj3b566mt+c4cevuu+DXz08OfdsXqwZoOewnHG+H0kH8e8jwpgYLe+MkUspAVoZxV8fx189S79/qffJ3wPmtAIM+Db2fmOB9eVmFStNgMARg7xaEMCClklJfSS7N2xzlklcU7ETE/H8nSapqn89Pvf//b3v5tOl/e//fvzj7/xX3+9/Yd//PLrr3V9Ph5klvnpw9P5559TLny48OEJWbgcOc/IYuC1rgao62qO27bcXr621up6Xa/PZura3Gr3U
9Fct5zgeKSU2m35S9NPyHY6X7Qd63a1bbW6Wq1QG9QGdcXtFiS3QXQlDVFfCB15RhchN9hWqituAJzeDA9Y7H+33YPrUm473TYEA8OOAEASYYKny/HvfvfTfJh+/4ff/+4P/808H46nczmc3bTerm1ZJZvkklIWoVSyMHMKkSByBzMFBGiR2oD36TJ3c1Wt66Zq23K7ffmsrbZtq+sK4NPhMCExkDlGCkWgEAvP1bTWuizbcltvt+1622rdQkM10qyjuTtwAKrQPdrBxzcrCpFFUkopp5RSSeLuKVGc2ijUw7lhVmA/nN+4IT2C82oj4ehoNijOOw4FROaUC4ns6fsOZPeUpLhLZ5j6dgr+xwAcDdmInUYiRSdAIQwTgu956eRIjtIwN4SGvDo8N3ffPi8v07NkOVwO5ZgY8EpYESTESh6uktO78/Hd5TRPuSSJutbItMRu9b9j6/tk76vw8V/xx2DPBqoYh6R5h9WjpHYf8mjuGARrsIQP9/Md0SJRFGqCaSklYCCDdZXwKPqCPjF4n659Tg0G6IM9Nw2ciZK47GWdD9d39JWG/za6tgISkAM6sgMO4VVj4pKEIkAgSIQlyzTlaZ4Op9Px8jSdztPxlOcjp+fa6nK7YqtJCDDlqeTDIZXC84nmMzKTFJSExA4Q53RVMPNtud2uL63W9fayvHwxVbfq1gAhZeHEgZVSIiKvbTGHdXup242JtW1mzXuqsUX7ZrAGbg4VXEchuSMTIQMCslMUFBiaAgsgvRmfAY7sDpFsMKeD8Xs1uwgYnGVgpePxcD6fT+fLFFR3yqYtWoGOnvH0+E3n9XashG5o+9Hm7qZqFp1FVm1al2VdbtEJp20bIKScB3M7knMGQxUenw29haZaVWszVdNOEwCY97zZgZL2xbeLL+0XRp4tv2qTyLHeozky7LhrIIIHtvNuih4Pd/e7FX4Y3KBSx/tBYunFIN4/aq8PiUD1jvYAwpQ9eG4R7H8Afu7gFt3xYoHs9cpkiA5kEJlzpADVwVTX1pYK5nByITJyRuBvTBIAMFPJacpdkxaHEO3DGN6PHHj73d0kDfZ+t03e/9x9Un/1k/ujuuUb3mEccntcaYdhD3MaWlU65HTR7W7sh/0aqG2Pqrw6aGDAbBhGa2Clb5DS9+rguotv5rWpOxA0NCREEWAkM1c3QwfGlChOvtaUGTgfDk8/z4fD4fLzfPlNPhxIjgAZXFzdm4I7sxBCKnM+XlKZoJyxHBxwaa2tLwAIfANkNY+Onuvt9vL1c6u1bbd6u3ooToEhIXpBTAg2lzQVQkIWRMKpnJgLYQJUwARo5BhtVXzb9LqE+ElY3b6siYxHuRQhADJxmaS03pD2fjk8MIrDqbpPfD9eqBcoYUoMQBNkQH56Or//8MPpdDhfnnKZUy7MMoxEeD6RXsnMIaQcCiQIAGbWakVq2GrQS8GnuHurVdVabctt0da2Zbk9P2trnWpHKmbY+aMRd9tZzWBQVKORaq3diYtbxz5EBOjpsvc4Xv/zm+gJABCLpMSSQsnfodfGgwK4QsebYwBt3zkAvUfYThmN7+770UOyxr13+zCzZVtqa4PCC8YBAZFR+ox2ZfNxauDdxPU4BAEzipASWncWejZSANFhNilGLCgmYXShnGWes5kJk5qSoXe1+65uLN/ITqjautV1qz6ade3+676V71HDoYTid2M0yPrxi/HjvijNIq8wtOvATIdQWvCl0GW5711lYWhQwB5qjztra67aWucotbZWW6uNwB00bmE7MdjbLQ67hMPFjyN0cGYOkeXmIcvO3wYpv5uvFEorarZs1cy9AbAhUkrGzN3yoaPAPImZ35a63Cqxp/nd+9/+t4fT6d3v/run3/49p5ymM8DslqyqbpuYiyRGKeen44ffpOnQZG48t6bPf/nzl8+f3Fy1Bc2xbquqbrfry5fP2ipoc60IwBTdaxntSDBLlqfzcZqzIzsJIM/zuyRHpkIEzMYGCYhaw23T52v98
qVTM+5DUQ4gCn4QOIsUQaZUihyyAqVE8Oh0j4a3Xdymc3ruDwcSIQADI5bMxM6cp3IWTr/57c9/+Id/OF3OT+9/Pp4uklKXIx2heSSSJJJzEs5TSUkkp+A7WquR0RlZUW6+hQlRXZe11dpqe3m+ttpareuymllOPKXEwvPpCDgSBXfdVUJAsLBndVuXZVluy7ouW6utjWyevkKdhpy4x+EfxA3Bgy851g9KSrkccplIBIjdtWmXEQnXLbRx3L3VForvGrEGh5BahhFPtH1r+TDBrcZTWqsa35iaGzGnkqkH+DIRp0QlhRAYMUVor6fIdtYwmt+AMUHOAirrhjVyQ6y1ugGwWnXPD8d+z7cltJyZEdqh6NPR1Cix1orophoUchKZnEJi9HGIamvXZX2+3qS2lCo8kNy79R3+iveFGmEUgCE8DYM2GOyme1P1zitELNZUW1gW0wYhMQvRp4MiwbqUFPxfis6W2Imtbk/cddtCxW69reuytmWt61bXjdA5jiQmkl7MEYsFu4Ebti6yu0ZeGAC4h2AVAgM68h7J+WtWafiEcTpCL5lEczBEQIqCfeg5RQjMRGg08stZcp5PeT6n6ZSmM7Eg5a5OsXdMCYVdFs6Fc1HKQMkNarNlWaMJp2lrqut6U23b7XZ7+aK1ohu6IvRjzZm1JVMBw8Rcclil4khJCqEgMCAjkiP1YLK5t2a1jvW+61yCI3jQJ4gk0SsORIjl7ZA9OBUPyPUVE9mZVkJnRnNMQiVLSnmey+F4OByOpUwiwiyw+3zjSMBRv76n93fG1k3VASDAjLtta91qVdX1tkTD+OvLNfb5tlU3A0uhLWDhAfU1sjOYu40NL7C3L1R3tZ5fN/w8GJ1u+ggMkvS7F+6IzHu/HFc1jfQzCK2V0FH0utVaq7uPV4bWNbC7h7LjwSj+dPeAc2ZdymNgVWDh4sYiah5azogi5EQ73/zKg3v8ihD4K9ma7qbjQCJxg+E0j6c4oQjnJMoG3LscjaACED2KYd0vc2+ttdZ2n/Ftwk74j4EXo+txN099QOAxwBItJMxC8NB2ulNVW1ilqq1F4ie5IWFU4IgwgEUTuM5n4x3RhFWymKrWFQujrWXEmT2A41At7CfOo+M2TAoiPpxwOHB2h94Dz766vum81OMxBO5CaAjAGJ2fhJxGPigAIBoLgJOU8+WHHyWVv/s3f/+bv/+76XA8vXuXphkBtG5tW7bl6tYQ3F1rq4q2rdfl5UtrdbWXxWXbtl/+6T/++Z//k0dzKzdV3bZFg9vWjdwYIZr9qertpsREGQ29aDus5zQhSyrTE0uRNDMXJLG6afW6WW3eFJpCVVg1iIfOuUZNiQEqgoOTOpsRw1GcCjR7E/qINfOdC6DLOcRFAEAYNeoll8vTuZT5fLmEoHWXjnUAV7eOVtq2taj49BHUCMdtq3uMzMzXdV2XzcyWdVu3ambrumlrTXVdNm26Y3giymZgHmLJyP2cRXAyd4oMbuuNnlurtTXt/XloEFAjXP1NFAsGSfr6UtW//PrpP/zHfyxl+udfPucyq7a1Lr29tW4dYQZWaq3W5u7rttZaPZTOA9pHziQSMXXWIxDBttWtqur1+rwsNzOL9yw5Hc6nlBILS85EnFOZ8oGIp6lMpVDvGk9RVSfC5Epa0Y3AhNCZTFhzcqUuLIkYLi4iARgCOUL0OeBM0yGbOVLIoZsTOAEJ5SJIQIApCTKkJI9Cme6+LsvHj58GxkB3aNpU1c1ba9ZljlvXmewIqJuCmFwE3Fm7mBkzq7WGzeprQDVuotqsNQBgNAJHwsQcCvGnw5wS55wO88TMEu2/huA5gHutptq27eXr1/X6onWttakqE3Jk3zJFmgAjcCgp70TISLIa/mJPEnRz610QQpn9W6P0Ldttrq1pIwQXpmCCo8Ke0XuimUUTwZ6xcHz//vLj78p0+If//b/9w7/936UyH87vp8NRW71+/nW7vWwvX1wrornr1lZwvV2fr59/lVSeq
18rLMvyT//Lv/un//gfwCEKac20tc1cc+LDnEJUP4sAwNf1+vJyAyJFW1udDsfj0w9phonLfPihzGcEIUgAWO22rbqtum1eK9YGa/Olhk2KOh5oDaLYeQt3dzNYGzF5snSAqqBvrFI/oO4ZAXcCJE640byTMfhXOhzmDx/eHQ6n9z+8P52fpuMp5wk7WxP1fVtb12251W01bYM6AAdUtW1bqdKyLMv1qtq+fr2+PL80tduyLVs19zAm7hBnZZR0BtzKak5W1ZopKgf4RTRARCe1vfd827a6dp/QtG+2iNkPovGv2KY3V2vtn//5T//u3/17koRpApLW6rK8tFZb2+p6DY8s2LzWenvp68vLsiw7US0i0+EgkiSnaZ6JQ2SBwL0ua1u22urHj3/5+vWLmq7b1lRLKZf3T7mUiGEjUkqllAMzX86ny+UswqfTYT5MKad3T6f5UARhYhB0BMuMJIRZoGRXBek5GQ7REa8340REYAQAYc45IWCaJM3JPVrKOhLkKYXAfWFJwKWkN2jper396U9/3mrbmtZmanq7Lcu6qurtdq1btZBMUDUzDTyo1kUOHdydiKZpLiUjUhTBqeq2rpHPHx6ua+tYSaPbkgsh407RQM7p6XzMKc1TuZyPUfk85eijk1NOCABqYKqtXb98WZfFteq2WdOcuMNLYcmC2NvBPlilngA6FF3JB0YyM9QRFXLr9TL/slXaoQDAyGzZj018QPTBGhIiYUrpcDyU+Tgf5jJPkgsxh88US15b6yWvbmoBhcJvh1a9bl7XHpdGcEjsjGbWdHNToxT9gwhsDw2rNXDStl/9RAFgQgGn6NcR/EVvOXOXhQ7MjgBdP64LyQEaQMilU0zH3Un7a9cYDbj//YhikfqpFo3BRBJFmUUP7I2sxx4GC3j8/2PvX5pkSZL1QEwfZu4eEZnnUVV9uy8uAMEF+AJluMOG8w8gQxHs8UMx3IJCQsARoXBHES7AGdxHd1dX1TknMyP8YaYPLtTMI/JRVd0XaEwv2uvUOZERGRHu5mZqqp9++qnvA9w9dHNyFam1iEjZtnVZRW0JX8m9BT1t0gIDhCD8TYrwKvDse1K5B0Z+/T+w55g/uF/GDhbE0e1TRzGfH+a+beV8uVDKzuJhlZazSK113ZZLlIkGbL63ur9czsuytPjHPeehqqWch3FQd04cHZTAQUrRrYjUbd3WdVVtVsnMh2kM/mAwF3OqZVPmlgDMmSOMHyQfD0MeGAgcyVtBPrZkA3GsLej6Ct4ZNv2BAwASEBACcuI0JDdHMHOPj4AGIbdV+Qrt1lrLtpWtylZFTefLvG6biMzzXMpmqrWEVVKR2vX7+mYFQERSpdYp2rExk2m0a9TGofWmTOzupqKqCCAEUUsXGKaqDolVFMGGTKrJM5O3Gt3GYlIFc5UqPXaLCbSDFNeWYdiIAv3CeySP2NQa+lTBkKNA711efh9fCbypDHnXl/PWv/kmKg+ODxIxMR9Pp6+/+WY63t3d3SVmdF8u56fHWWu5PPxQ5vP8+KVsm6qqVNk2MJkv5/PD55TzorQJlm3zupEJIiTEjAwMmdiBpjEfxiElNtOyrWYutZgaIIgI1cpbmS8XToNUSPnTulRTV3U3t7pombVuRUFpMrIC02oDAHAU3MccirkD5ABBU0FGJOo84pcrDxsHxq8/Xnk12O46UDTZoJSmaZimcZqmYcjckpZqWgFAyiLbIrWsl/NyOUstpay1FgCrlQGinEIA8Xy5PD481iqPj5fHp4uqFZEq2vxjRARkbpWcOYVUd8xNlLpt66wmUYne5C+RyrZu61K2tWxbIOcOHhSJKGkkBG5FjrAT57D1vcBmrZ5PKVX99Pnhb/7uN5xHnu4pT2a1lsVM5vPjw6fvpG5DHqZhCG+OmVRtntfL5dJ9JR8nSdOIiSPbi+AixUoFwLtx+vDVV+B2f3dat8XMSu212cdjSqmqbFtRUxFb14s7LMvlhx++I6bT6XCYxuPxUOo//
uqrj4chjXfHPCQ0oOBx5SEdT+DuhEZEjCkNiKknlkKAsvFJGlkgIQ/s7gTcyisTUMtGAe3ladf1BaqyruswzPO6Leuqapd5XtZVRS6Xy7ZtZlrL1tvjaCOhaKTPCPeGlokpp2E4HKbRwd2Oe1oY3FXVqnRETqFhLyFgZ+6eEo3jEHneyIqquqizW2vzDp21QQTEwAwIkDIi0Tjk4yElHsc8HQciJDDCUNfVPRMdHxDlw/uuiWog6u4YkAcj/D6+Eri6kzf5S8CQUOr+YzN3AADRgiOd7u6++cVfHE53d/f3iZM5zE/n82WVWpbHH+p62S6PpayRfd621bUu56enL59SzsW5eCqlWF3JhQAz0BBwMyVAmMbhOI6caFnXZdtUtRYxU0DXKsK14DafL+BcNkM8jdMmKqUUNyN0RjPVomB8MIYC0+ojAGRMASdnziFZNBADYgA8gE7Ie3LtzQM758cby+7Ku4nFy0zDkFPOh2k4HMbDYRzGHGGBu5oUAKjbXOazlLLMT8vlKfL6zSoVdldEokoOeD6fPz88liIPj5eHp4v1VAsSBd2SmYIpnBhzDukLMBc1L3Xd1otqCUF+iqJPorJt6zqXbd3KViOYAGNGwBBdRWxWCahrDTTNjwYUdBTzmVWyHz59+c9/++s0TNO7mqeTu7oVd3349OW3f/f327LcnY7v7u8Tp2maDtOoavNlOT/N3uTUXcym+zv2TNDiva2W7XIhwI+nu2+++oqZ9vxTFVFT7Bc1L/OXh8dSy+PTeZ4vIrJt27qtiBj9he7v71NmcLg/Th+GAVJCRwYER0oDHwkAjFCRosfYTgeMiWDNKpmRIRAkJGRoeQR0DPJmI5R5F5a9XV4iuq3rkvPlcjmfL6J6uczruonI+fy0bauZ1VpaD25VdwcziKY4TSmPxzEPQ0qM05jv7o6EGI25oDOkVHSP/jpXQEK7Wmo1U0RIsX9ykARNDVXNnXJzqRGAgByMgRg4ASK6OTGPUz6cck7DcZhOB2Ik0KYpotVN9gHDsKTQ7xYAiDq6WZe6fqM4982Kk6t56u5Ao+J4n4U9VsHwKUADjC1l21Z3KGWrZVNpTYRVZV/c2DsgR4DlHjuQEwLHrEeArjWFLUrwDvO1/MzuUTfx8FprKUTbts7gKCKlbmbGCInATEUkWtMDoYdyY6O4IaQGmUQUzIDsiIScKDFzstfE09sRag/9Gs3g7d+9rrphkm7RbwNQY9qqiEqNJHcMlN0wDVruzXsSwm5CUmvTJuTxdkm4XsDQgg9vtBUVEUCsteRasLEcqZYitUiNBs3XsL3zB65klu6Mw8s/r2cPQuu8FH/yAK5u4C5EKWoGbHdA+4S6sr/6PkBMvakrU2oNoghxh2aDoL5bpUZ9QETCKpJrVrNSiogQNfpeTql1fwyWt/UbEi6pNlUKABcDBQOCNDBFgX0vXO1hbcsFNIJbFxeBpsbuV95nL9m5mTwdjdyD9x7At3/7k94zblF4GUikuVFQYj2ygS1pm1KKWIqJAMCSqnD7lpbGk0jYVWZTxSCqA+RwvaLlcYhfhoo8IkbARA4Ych2oBh7y8w7kYN4F2APYdnfiTnraqU8ICGAAZNFAB5CQPBhLIWPzYia95SvFnyYmAkhNAyrmTnSvAXDGIQ1jynm+zH/zP/8vaRiP958Od98isQM7kKnU5Sx101KwsUNzzoMTJs6xjhIRIIPbYRpOp0OUpJlWQoyCZBPZlhUJSy0xoQkohyCIudbqak+ffliezjmN85fHnMbIablbXLK7z8tl25YqBTLk+wzolAHZkQyTIhkCMRgCJvPJEhJ++Or04eu74alM0/cvERR/loe7Jt4ak+s6wM2ZakV8a93mbXkyLeAUOdX1/LReHqWU+elhmc9XUCAAlm57fZ/H4IjALaQiJGSmw2GMwushZ9qjLAAAqFJR8Xy5qGlKvG3b5fAU8xgJa6mX86WEZGrZRATcUiJ3yIy7r9Qh0hAgQiYk6NPJ8MVWl
1P+1V/+1f/h//jfpeGQ779J051Z1TqbyZCHT999a2rTdDqd3qXEOeWUkqqmNKQ0uhu6mts4je8/vr//8G6YxsPdiVOqp2U7Toz0j//JP/oX//Sf5Zwjm+ZuRUQt9L3QEWqVdVvFbN3WeZlVdV7WZV7MrBSRKuM4fvP1Xxym+8S8rYKyrA+Xp++/yHYmM1Jx97nUuVZK/OFX7+++OqXEh8OYc/a+EFqIi0ghsrX3ywkkP+R0wQGcry2v9lkB1IFnbE2q1U2b1QADsOAOOWBjSGFjQPcoGqBXOIVXnHM+Ho85pZR4GIaW5b/iCh2PNTWzWqpqKPspgEc/gugRnxMR0jDknAcECBZlKUVg27SI+DpXqXUVUEhDTlWDNRtYRVCCGSlHfnafGA7g2KvYWaF1/1Q0RR6Afl4h98ach4hHH/TdPHe0BVPKOQ/Lssx/93dAfDh+nk7vmfPx7n46nNxNy2paVSoAUISmKQNh4tQqEkOs3HkchuNhUhUpq4l6kAuBTKVsBghV1cQcgAAzEwComVk1kEuREOqY82emZK5i1d1DcxgADcEA1QQy5FNyMsgKkZlNCoTkxk6BCSRgJnr/Yfr48R55G8fhlUfgVwfulm3U7VL7sY1b9I6tzTCtF9fqFo1qbHl6XM6PUutyOW/L4jtu3iLl+DILwCVc1MaUAcyJUiJmPk7DMGQiyjkxUc8gu4hWEQCA2aUWIirbNo5jz6mhiMzzVkXWZY2ZCuAp2qsyZm4ZJ2pWqQGZoTAAhITo9JLdzSn94i9++df/4n+XxkM6fU3jnWmp21m1lHU5HE7bso7j4Xg4pZS6AaVoyWFu4BVdh3G4f3f34eP7PI2H+xMllmms45CRf/Wrv/in/+SvhmGI/qbhK0kI7PdcTGQ+1EVUzGxe1nlepcrDw/lynhF5GKaUMoOVVQ3q/Hh5+PJY1ycQJRUze7gsD/OchuQD8pSHIR+mA3N2aGxOJI4RwfBbohlRK7SIzePKz33hCHRgDgg7z6b7bJ1+7YhAgE7RExPBzaN7MbXYuecsmq+UUpqmaRyGYcjH4zGcy5DxbIoRDtr97FqDQWLRuDy6ziAAh6+NkDhxSuBeS5FaFdjwqSiWCk+LlK0URcAtZ3GkPOSU3cYMGBQBD1iN9kYUsWZMzQXAnQhSAG+Kppjysxajb1ulFqz1nBs0RXF3DxUtaiN9DZhNVdwRqfCKlFPKQ86aEriZVDOB1oWJKWUeRjBOKYdkhzu03FOPSJ6fjPeCpWteqOcG8bobuEe876YG4bH25l+OgE0i3FyRjJI7uWcDNkB0Nic0RzNCR8dESMTIiVLicIpfDtE1PsM2N26GrgWXu4fTKCSiwQAoW+RDo1+8SGkRbiNbNJLjLh8QVsoBQvUsOUVgBO7RgSl8beam2wYIeC3Ra+QFUXDwYGbGdhKnLpHAEq2NJuPQatxxr0VAbPs0NrHGPVK5pmhfHE3Aj6LFtlgU2ImY2guQrkXm/fn2LbCn/7wR6aPtrqqi11rWbTXVKkyJzLxIjS7XcaLdEoA1FrBJrVKrqHowoQIxRnLVANSWeVmXta4bqKKImS3LuswrS7qcl+k8D8OQh9wbIUWAqUkzEfa736h84St5JJj2kXoNTe55pBa79hZGsOd9fcdlbpGB3WOIUQ3G7LYVBKilECIRmZlRc67avhYpK1NRMbVSGi1eVcCtOcIAzJRbfUxEoV5FpEqpddm2Zd22sl2Wdds2NUOEnJKDI0HKPI3jNFVETIwBi3OvJeFmSAyiVUGHJyLuc6SXZvvN6ty9ppEJATBR40e5RfKJIpJMxGDuorVuaxEHKMuy5oeUEtWZ6nuI1Lc5og8pY048jen+SOCx5h1BtnrZVhWV6BHUOFcEgGbWFDcbAai1dTJvpd/koce1GwlzK02C3xzBg4Jp4EZmbI4GwzIkcTLJm7E4QA1n21AEyZH5yPk0MEzHfDwdNqGU0lsEQnw214IEfIW7XNHcoRYxc/R1Pj9qLVoLg
KaUAQic3Hxblm2ZTdWsEBkiDUPixHkYDqcp59w/D8SiGEk5YUoI7s0YEYXmMgAielAaAgqvKptUd18reBQJn5mCHeetqiPIe4E8uRuxMyMiJMZohcnUfCXquFLvkIlI6K/ScNiVnt318vSw6ZNq2dYn1frw8CAiYYwiVx14jqmJhAgncvhhhC5V64ZoGwESbed5eTwTwK9//ffZnImk0b1tK5uoEFH0HSBOecgha04JHfx8vlzOszsgJsKoXsNEaZuXH379m3J+Wp9+d/ndb2S7uBmImtmXy/xlninxReXbh4dxHL/65uPp7khEoXIZcmCROgg0Z495kT304VIiomTGL4Gl7hmFZhiYuFaT4iKg0nrhNsaa067FspNJVN19WWYV2dY1MS/zPE2hQTydTkdEGHLOOY+DUdM7cjOb53ndNhW9zJeyFTMTqW7KREHPmobhMI0BBQzD4O7LvGzrNs/L3/76d58+fV639cuXh23bEkclDR0Pw/1p5MSnw3Q6Tkw0jWnMzETjkHJiIhqb2m8IigMnTjkhRqPDwSi/rIB/O4LrUEk4fk2vBnYNaARiB0zR9clMay3rYmbKa6WUcz5mnji2LAJAZkrTwEwD45SREKIOwcxUt52a3Od1QxWjKS4aWC/MaWoP7X4B2LUrCcSW5OI9tHcHNxUtBmYs6gLsmGo6mJNaFqdq0HggqGCG6DilxMORE+SJx2kYVmd+GfR2Pu0V7XX32y0xvGtDD5YtQS3rGsKezJhSin424FDWtW5b7OiIzgx54JxzHtI45jRk6JvLJLnUMUv0MTZ3j8w9IqYUCG6v13QLpTy1KlrNXURlV69rlQQ9yxI3tgUUAIBMgLQzZ4G7C8bdKrVNGHfS7kubjQRMIGDrMp83FWlWaV4uu1qnmxlibPWtiqIlTxCiNtDUVbQ2ds22Lst8QffPnz+NQIi4bttWq7Xq3MrM4zQxcx6GKboNDzwMHFbp6emMSKfj/TQeo7s5IanIw6cv588/lPP3yw+ftSyurULvy+Xy5TIj04b+uK7DNC5F7+7vEtM45RQqaIfaG9UkQhwyjZkQkdPeZBYTdjWV52YpcmEtXjODps+jEPLt0IWKASJY8e5zBdyLanWDaJSec661HqYpMdVaHPxwOITbm5gM0UOtxvQyz/M81ypPT09R3VVLMVNmGhIz4fEwST0y8zgOImpul/Oyruv5Mn//+ct3P3xat+3z5y/btkFfkuOQjlNi5vvT4e54TEx3h/Ew5pTodBijUehhHBJzSjQOzER5HMaAc7r377+HVWqOe3i5N9J90MkqhJSCFRABDKEzQehsMjmFddAKTcAFCdiMEcGZo3O2OYEhoqdhmgxEpGwFcGt+XVO+bFAKmgFgl+/cUxtAGGEbBosk6q2iXlYVHKBaLVYcHAYFUnBP5MRg1KthDc3A3MkQDELajigRMwKF9skLvtLVIO00i74VPgvkGhDXog8VISStVWsBD0Wwpu4U5WYUijDcwkZOTExMkf+OzAYxkztFDyHvlW3YwsTm+4Qboo1O15KWwY9s5+UYqctWih8nHZ1HARG8VWk2dlLYhKuvBNB5b9gS4a/TuqHVJwKXp/PjZa1Sl+VRpDw9PpSyqUop27wsTNQosOa1lhr69mSAtq7b+ens7pQ4jQMgaqmmzkgOzedXb8SXrUiplUiKKCFxSnnYiBjJid3dH5+ezk9PSPju/sPpeD8OE+OQOEst83w5n5/qZV6XGo3qIwO2VCvq4E6r6KUM1TFdls2YaRoSM6acxnGMRGHKCRHHTEMmIsxjTplTGu7vx2miqvSKXLInppqlj7iyFdFH2OPgjo7uRo6Ojjda+ldaCvR6t6gZSlWitJAQsSeyay3RbuPLw8P5cpEqT+enbd2CommmTBROzbyM67ox82Ecp2ly93XdSqnzsmyllNpqkuS2tCrK65gQwMyZqNYy58RMlzkHw3MahsSUE09DYqbDcbq7M2YeDzAii5jZywF6rWRCC
IkgOaWUMrgBIYABYtNG5JTygSgZgbmBGaMfBgaPajljUpJVVwZEB3YkSKmyW0opTTSMnBIE0xH8NJym91BrqdXmeXVHgxotOANfcHctAuAp5Uj+YNw4B6MOn6iZe6n6NG+R5t5KsGGlQgH04R2M7ER4TDQcyBAUyJEtlGnVSJEqkaOPKQ+HIY+AScSlxi5+Mz4I0dzGHIGitTM0b6nj0T3jjS5g5ApQ1tVEwCSRp5SIUgo1OXNCA3DOhJk48XQY8jCklIYxc0oN646+zENmwjpUqWxme5JUJarqPbToRK0UMbeqVoPdG/hSxxfcvUqknJtVSkzUVJuZGZgwJepod8Mir3DSjV1q9vTGF3A3Kds2n+dl+/V//pvffveplPJ0eSx1q+uynh9MxKSWeUbCdv/AVVStV/Ojr9tWahnGHB3Mieh0PL17955zMsjKIwAUl02lVHm8bMt8UbMS9FpAcHKHUpd1m1Xl4fHz4+NnZv6LX/zFx/cf37//8H/672DM6fL05dvf/uaH3/xayyyXJ5dSzaqouW8mm7qjPX5a/LESUf7NhVJihDE5dYwUWxI9IXWrxHy6uzscD8fT3T/76+PX37y7rCz6GgLYd35mDogwI1JOIf4Ft4IuN9tiOFjeb4e7e60lgIP5clERBJjGcRuHRJyY3f3p6enp6VxK/e6H7788PIjIfLmUsrkHIOyBAyLiOIyHaWLmu9Pp7nTCrna7rtunh6eneS6lLFsptXhrPQa0eqRBEqdoEpWpuds5pRAMi2LgIafTNCamrz6+/+UvvhqG/OGrj+8/8mWVUJf8KavUTFOnyzWJndjPo6aFOadMnBSsmpgZIWRGaFoCQGjgYlIA0TEBoKGbJgwdS+KoDlMgBBhSwpRqKWkYgDjKtLqCTyzbRnMn2kvf26oIKCXMhrur6VrqWqRWX1dTcwMRqMhuB0SHBAiUKVFgVeQU4FVgzam1laJQ7wcgU+ilss+OHWGhW2JGzJr4q3dkcDBQMFQVQXcllFLcNLFRmC1o4RA1xnVEBMwphR5p85TciTkxRXYsEPhgsji00k0LzQp3EQsHRC3SCH2Kd3JtK/rUK1GZsNE9IAqxCZmQGRGQCHra57qgwgxdcaXnh6loLXVbnr58+vzdt1vZvjw9lLKBG2qNbJCVsnu9HgIdO8qLoCJBZUCMQlmCb/D+9B4SAbIhA4ABiaEobEWWrdZa53mutbqBiLv5vDw9nR9EysPDp4fHTynxtqzL1/O2rvNfn1VKKdvl/PTw8OCy2bq5SjXbRAxcwEPMRaQKiAMCbIBI4AMboyMCR981IkwJEYdMQyZO6d377XR3d//Ov/6Fnt5RFTR/OUa7Ue8HEZG77wrCEahB4wVc5xZCd3rbc66mJCLEpVRELKWUUgBAEInQzR8enj5//rKV8rvfff/p82fRusxzKSVEccAdsTXdG/IwjSMT39/fL/fbrqu9bWVZt63UWqVqk9/SBgJYNK/FTthCDEpEVBoQI+bERDjlfHeYcmJRH4ZhGsc8HQ8nrfWGv/ajVqkFN2Ax78Ej2YYQrYbJAQ26KkWrKENHCphz5yVRKLBxiijeTL26yqBm7I7EQxqi2NcADHmYTnfvP6hIHQYJQy5b+GKq7mZE+0AAB8rfsqNWay21rpusS5TNgwiYAzAQEzKkREPmlCCY8eAAymBO4lyyV0rAA2YmOqbDlKYhjS6wXMpyKVKf9ROIeRhtcCKHhGDg5LGPXbP6+0z0xtgDdFdwBQdwAuCeCuu7ALYihl4Z0DKJvZ5NQ27PTNUkEnthmNSCOtBYd0F4AeydXBw4zqIZzPC+A4lqmR9mJEaOfrTXPxTZ4i4J1iO4PUfWUrGvEigpjcNYxY7T4Xg4MNFWNkIEN/IE7kyU9gRVtMq2jnMFrsSUm/RPGoaBOb3/8IuPX/9ymqb79x8Px3twMEWEaNRIgZcvy1pKASTCBIC6DwQiMjniWsrT5TyM0/lyOV8uSymeBj7eaclmEGXDC
cABGD0jRFWuYSQT1czQFXVFVwerNXqfIIghQKmUmJjFaRVPQNOyWRGsii/2tWaGkIg5cQKAIWcdBlV1M2phe8MIr+9tpIM2TtjWGo3jmFIa8nA4HoY8DOPIKRFTKBCo2rIu58t5K2Ve5nVbVaXxTvfPAnCN/K8SCZOXKlsVJsqAgOQAKedxnIhY1FLKvbQAoHU22zm/AB7yUsFFN0M0d0KIMC0xT5fly9M8FRlPd4f7smxV9Od8pRBRZERx01Y+k5DZnRyTExtQNUOvkYvrBj9hIDKUCCkNB84jEQ1jTpxEZdlWUc0pVRHkNBwO0+kekJZt27ZiRKeP3wyHk0ot85Nu27Ytjw+fyraaa61qqtD4YoQYgHG7R2a6zvNlWddNHr6syyaA7JgAMRHlnCjhNOXTYeAEGRXF0RDXBBVJeFw4i005301TSvxx+PB+ep84L7N++nL+/GVdl3o7qSK3MmQ2RiVwixYiGvxbtT6jDHa0EgDBpYt7sxsDh9Bb6yyCrRo0SuOjA1CYpCYV6e4qxbQ20ZFaLEqkmthgU7mI3wwbBY1veZ3CANC7mDgnNCO3yFBCYkwZI3BL3HoiBlN4t0o3emA3G5j6i+JTQprG6f7ujih9fP9hXcqyrQ62bCtG+hyd9p6PAW93ghVipLgYqe1n4zid7u5yyv/or/7RX/+zvx6n8TBNh3FytzEfyjifh6fvfvdbqbKu25eHh3meh/FwON4zswCIozg6J0zZAZ7meatFzL/9/ru7dx/O59mnu+EDrNta6aAqKeVxGBqm2rp5JmZW1W1+qmXVum2XL1q3WktU+RuA9hYoDsCc7hY6nnTe0j99qh8WWDd4vuiQkBJHJioPw8DKdjAiNtWcklSJm9m2D9jBvB3apeZcIRHRMAwppZTz3fGYcx6HcRgHZt62bV23Wuvnh4dvv/uulPLly5en81OzsN0e9W3RACBwOiLClJEzMx8cRyBzHMcDcRLRNEzaVOtjqxTT6m4i4TSY1KJardtxcHfX2IrOy8aE1UEBx2m0PNHhdL7MkcH/KavURyAwHWsMpd7cwRsKHS1WQoV5x+gwmn1GnRUSE1NEmxFjmIqaRNM0QOQ0IBFUNa8OmPJIiKZCrkLk4EQpgkLf3YAerMV5eq9TEImiE6ml1qJIjoliBVIj/qTEiTjaOSsoghBWQEGuTkqZ84hDpjTSMPDAnGbTskrZRF/MKWhIMAA5dda1YQRDAUP3+dQpC+CtfKqXFoJz7MSIBND7ZrTGZV0pMVywXTDlKp5iN+PRBMC6PIB1PLT1QIsTaCp2Le6KL0FFcEIQd/SwA8HQa7W4iHt2IexRI0Pt+SQEaNrDL2ZPqzjJWcdhGMfRwIdhULOdrYc9g3NNXnQaVUpDdE8ASoA0TIfpcJdzPp7ene7fT9M0pDTk7KY+VFQr2xZRvIqWUtZtA0qjGwL36AIdoi7Kq4qqrtu6rtu6rkXEOeE4oYFnMRQYRp6mXjXMSJiHxCmZVnBFBEGoazKVEJkJYm+o8xqAORI55QpUD6tsxULV6yUG0CM3ImJicEicLKkSmWqHtVtU0xtetfIfIkJkxNCT47BKzJyjcVlKKbfyHHAQM1EttazbWkrpIlYtmm9h0Q46QDSORnIQsSrqjtpVJpgZABFVzZXZPIJuUK0q6G6ACqhmhqoYQnSusUmbmrspmpoT4ryW87KJw7KVrUipASn+uFVCgMQwjjhN4JsqF/Nop+LurEru3tO3gASkiCHGxq3QIdAeU1Os4KyJCdGin4hiWerDp8+cz8d1E1UkOl/m82UxM9caDA6rm0tVVYDQx2PmFAGDihk5QrXWEUzNTFRCCmoa88d3fCeOnCiPSMQDpomQ4ZA5OaE5lOjdi7ASVIi+FohwyocPd++GIb873h/HAyI92lbWWtZi8qxLJSCEuqihoaO3zoXkQRUCAndzfDUT49a7uZFhVO+REWBTO6Jwo9wlePBsAIAspm3PKdtWthK+UiSKvMswYytMR
2d0R2q6+LsqYitk282kuxMQR7IS3R04BOq6dmqASrRHGjsToG/b+/FGZaWDVilbMbXT6e6bb6BIPd3fV6nYlTRiBvWdvxvxRnFMRNSDT0w5j+PIzIcxy7ZsKkpUkdx0vVzKsjw9PZ4fz+en82W5zMuybCtwGlUzsQIAMbAjM1CK8TDwIvbp4eH47e9EXIBomDLyAZOa5ZSHPISxCAGGIBGIuZrXKqYW6R4zG4ZRVEBNxQAg0RB90pFHNd6qf/5y/u23P3z6/FBrfWWUWrM/ZgbElJO7sRnYXnfZeNsNg4ryPUQmJk4RLoT1ybnBkGOv0g6QyAFUTdRETERlhz/CGOE++O3Lbu4xGriaI3Vtm0h1ESEzEPe6OnBwMzWt7h6qgWa2LXMpbGawIVLQg62zHdwAqsq6FQe4zOt5XuZ5rS+W2GtfKSc8HfB0BF+rpMXMFQLeIBFATAAea7BBD4g5A2JucUioqamKqxsrEwGYmCu60nJZns4XR7h//25dzkR0Pl+ezrO31eUImAgIQWroGSdijfSEu9UqACBVcAMAsCb27OA2pDRkuj+NgEwppWFEImB3ckCHrOjq4lokYhbfGIUYcUjEiO/H+7/48M3hMB6Pd3eHe3dAO6/ndT1vUvUWVyLElDBnMgVCcPNwFN0DEopguzWAaOQphF1dIGQiDVGRjHAX8SFyJItCUFUlIhElIjUTUTdf13VdF1WtpTRZL2itXnF3gjC0ijH1ypXWpWb3cDqqaNwczUD0oxIKEYbUVFAiiOvMAEQI4nTnifbD3F/YJXcvpSyXBYg/fvh4d//RsZWEdVwYcP/MbupadhAwiu28sRwCLFMHZ8QynysAqqG5qy3zvK3b0/nx0w8/fP70aV6Xx6fHeV2deBJxZgXw4JpxBs5gFtjcWutvfvf9Vn3I0+n+63w8okM6BZxEmTimXSYGcLVqKq4u4utW0LXlmgijbRUUqV4NIE93ebxDJHeshvNmv/ndp2r07W+/W7dya5MasISUOGnOZBYNbM2MEFXTTjbBxtHDEC5BxCh7JsIhj6H7nmInwa6fCW39A4DoLv8vUrVlXRG5ob2BTWFzsnsnWoj+yWagGJR/RKSU444Nu7vcql6apx7YrqrO57wsWUUAiWpR1eZJeZPT3Iqc52UTeThf7h7Oy7qWUl/s4q+YAQScgtrrzIYQAtfWdnq3qGhoO27LgjXUt/mcHoQYQERTM7Jgx7i5mm5SzG0Yc1lHYi7bUrfFm6wvEgIwM6Gphq5jc1u7DELgJtjttF+VnoCIc04YUeOYkcjQDQ2iTYybg6siKIAhCqAgMjJwIsycxjyMw5hTZiKzUFqyoD4/H6C2qICw9+ZBJ4zr7QjuNVV+W6PYDFOUGLihEUZ+BhGizVFT6lN3BxR3VrVeHNCryjv6vWesYPeEIvPQkXaHxji9QYJ6/Esdgqc9Jt0TQlczt9uNvmW3ZbVbplf5t4YRRc1DSplSZ7JRZKs6Gepmt97TgwgRKWLz/qNIwkKOQzxUOsVA1NSklFpKLbUJ/3Vt36Z/F0PTrweRgCIfgeZQSlmW1ZwPELh/0B9CWpUIMAQLWlCM1vZ5D1ys+TlRvrNXyBBxSgMghrC1GZQiy7KFivGrcbqyAvsUj82JYlm1ABybEEKoJyBSSimlFC5SzhkJ40fCRjGPBQKwb4PtIp4lk7HRPXBvpU32TFkboE9UcHfYya0xktioIv2G71KB0TU+J2ZwICZUohAGQOsbJbi7mJFalDrJW4SlV75SxrsT3d8RK2dgFbxstlYxoyqkah6ajRCt24K/Y1Uqobibu7TNEECQtFaipGLLWkVNVIpuDsakiYSYpSo3Wyuq2nF8MNWyVTVF95QGTN5I+sHRM0EHYnRwwt6UFSm8KsQAkBwQotWBAqqiO6qgCYEDGxDgQHx/GIeB352Op9NhmgYAWJZVxJZ5WxfZ1gA0r4PW1nDk4Hi3DkDkLQdvEAgKQChdQr9nId1lgOCgBrEgsdsVj
rmZag3VDk4ZiVoK1nwrZStbRKzRwwh6BzPEtss1GOslU6FPoaBWtVyzA4C1+sYGPAVb0m+vNqB6aGDZ1d/y6xX5810OAYOVh0Sm5ua1yrwuopIyj2NmopTTmDMidgpViPwKAIRehruDGrhTojQkJBwR0gDoUKTUurma1U1qNZMol+ecjeBO6ng4HQ8HTjk+FhyHYUJwNy3bWmtxp1J1WQtgllpzkjZXAmEJ6JQYiCHQXFNTQSROmYAYgCACIuigMSFgHqbD6R6QYucYx5H5LdD2ekNumQHXvaBZBGsRHHlsLhGJN4sYEwqpF0s3Il/cqtblRLtU677mG0bYkXLESNxjN13QpxNiCNo6xPRryrdk7RPAdkQQEcNIpZSCsTgM2XQklhD5wIZJtU0wpksMXRFdtrqWn83BIQwD3t/xu3c8YjqmJKL06DBXEaoVRNgB1diBmCHkNAQVcUNC82q+DzeAoym7kapvxVRdrYqt7ua6gi3MlNOQ0uAG27ZsWzHzUkXUoEs4j01Ph8ANXd19K9u2BfLQyH/TOEa7v6gHdIsp7RD9lMCrEii6I1VCIQyg2XHi/O54PByGd/en+9NhnIZ5qefzUopeLus813Wp8oLi1cEP6xMI0RDBDCw6+6CTuYUATuSXMDQMI69mroDmogaIsam2VQGIiAEXIFHKiYis93cqVbZSg2gUXdUQnbDtYw0yv8753apcuQcQRtLAEdDAg/tLQVjprcHaFrvbUrz5GxrECLsxgTe0OhGYKWcGpKLmpmVdfvj+u2VdhiGfTlNKPE2jHY9EaP1Y162UAu4gAmoIjq7oPh2nu/ennNM45Lsxo8N5KVYurmZFalVVHYbheLobTIfTQdyIMw8HRFJzLgUcxvEwDllV3EHVAKhUXZYNMUktmjNA45e1tgsOHlYJQN3MXWtFxGaVEAgYRaw1igcHAqI8Ho5375BCdEBzzhyZ4udmHqBTK9qDyCK0bsYBY3hjexgCWtyViEY6QB7eDLUQAZmw5xDCKKmaRXt2UYnMfZPg6EYpyETEgY10sxSZGQycM+I4FzUyB4hygsZjJmp4S48x3Z0RgJmkjm5GXHPIzyKQJAewEFFwd0R1R/dNdN7KttVrtdmbVgl7aWViVAblILM4MZC3+l5vW8qth2gWr3gj41EbXFSF8MZVTdTNxVQj+FKp6GzEe47JTAPcVVHo3Zf7YPV0UHMIOyjRMYqbHQcd94lwxWd7UjvkFRpIwkQppZybVxzRaCmybVKbFttL7xK7l7tjhe2byfdz6PnzGy243Uq499xKrGnXxt5sd71ZOtoTR80qmXb75MEfbw43tuRV+/h2Qi+N0k3c9eqU+ot9T+5JxNiko/49BrLBFX7rjL+E9fso75cbPTK2ZVnMhMhTInCLkC5uuZmv61q2bpVMESCBIUAaCOEYGZXEwZ8CAkM3i/ous75PoBEwOFD0FAnYPsUMIUyqWta1ICPS1c1rolV9TpuBWs+A3t4vp15iha67M3oDEkfpSSZiQlGlHY2mvVTn1Ti9ugX9JvYg3wNjizFVDDsey60vPoC+1LGvSXO/vbqrv9zDxn409YS2gG9WzTXm715UD2D7wjforNvrBNhn2p5j7St0BzduEQ7snscbiaFXfCXGPNIwkW4uqTroMOEEIOrGKVVQgXVTVWw7vSJQotB5xJCKB201PNFIB0R1kyqqCB4gL7i21oWGtZo7lFJNTS2WXwwvOqCK1SLGxq0mG1NK4GNQeSJi3qL2hyinRNSWVltkFgsRmZK5MTdB4qhaGY/T/fu7u7vDeBjcSao/Pqy//vXnZSm/+fbxd58uT3Ndt+dkCmy7k0ObMwrQAjhzM0J00yYWGA4JdozYzVTRY6m7uoOoi7r3rk2IkJgjQkx7d0MHgOiepM3w9/339WR//uQ+ufAaht1Mfugj5X2BmZlqCEa03bVtAp0u09ZAn7FBkHoxqwiBKRypoiLL8vS73/3685cviaOxD0zDME1j4Ltq5
mallFoF3COCy4kP05gTf4PffPOXX02n8XScPpyOCGDrtj2dzU20zOu21ergnDgRjXlCIlWoAuZwNx2nYQLE43E6ncZa69/+5//lW/stIWXOBIxOpmZVQjUBoLWvQwDg5BQNh5vW5/F0GqfBtMj6aNLhJEQiThmQ093d3ddffSRmqdVUU0of3t8fp3GZj5xeFXj3yoQd7m9sgCjEc5Mq1vUqoZtYwlZjFVQAYiQicNNmLgEi7yatp4CqmKjvBQqIIR8UbbkDCCNi77Y3SCcAQMwxj8JXQnSLmICQ1ZqDpB0YIwRw64WXKjW6bEF0/UZopQjh1DvknFPOLVnYxJ9eTuSXVokZhpGGkWp2YmHQPNKImAw8QRKo1Q281giUEBzIwKxp8gMYQrSSdvfWLUZEiiyiwkwDhuEIINlU3VHAA8HsFVud6AsApi5VTAkHBs6AwJxiYxCpquButVRzY2bzVuLf77ahtfVE0QmJwBgQQwMEx8N4d393/+5ITO5Uqz89rb/97efLpXz7/eX7z8u8ybrJrXOBbdWF/9B3MgBzMIr+226EFlh4hODQiALmgNGtsTv/VaxK8D5cLaxSo8flHMnp7kC1kNz3FP819fa2SXq9EHbUbt/gvMGZEPPOEUnVHMMXcwRwQo4Nru35N2+ERp164S8hOsfysapa1vX8w/e//d3334EZmAD4kNKYEyKqhYiARbQBrfgRp3F4/+H9NI3T/USZpuN4uju8e3eH4Ovj4zmhKIjKvK1VxcAjwzEdDylxKXqZi6qPw8h5ZOavv/n41dcftm1bL/P54QkcmIbgTrmYVTXTJuJs7pF2SA5sUQSESMh0GA5Ih1qWiyymErRXwKDlEad8PB0/fvxAzFKLSs0pvb+/O0zD48OUnjeF7+7kNTXaRrQ3odyFkMxaO88GZTY+BXDiUnLTinAn0y40BmYWPW80eI3aU28ADYNqPeMzM+dh5N0qtbbMrQYFEB0wyJABNSAqIikZdh5nwyIJEVrf8LCGpuqqe/fwmMZE2IY2pXAkG1SxBx0/YZWg2+8IWS1U9xKAAZsbgoFzDiQMXAAcWrOHBn5xDHwsJWx0B+hZHNhhjvDi9t3aO8H3uhfDNZEQjil0W7UjbQht7MwsZnkb/Ks/ic0JwRbrBKZnu68F4IBmbmLuvm0yz2VeyrLWrQbF66WDiR1bvvqj3WUlwKhwIAx7uMNssIOR2HDEmIV++wARDa2ZYwtb0MruvA9HC6f2oQyfsJ0jtk/fbdAeuTl4620BPeq+RuAQvfAcDA2xNcZBtfbF5AChzHEN4Bom+1ad4O739yia8pCHYQRXj+6niThFbGXWChKCE9CUtNIwpJw5ZWJ2R3UQ9SqK4KKm187c4AEGibg7biTCIq2LLKecgsXLoaDXDu9yCz1buE+7NpzdRAC0KAoa8T6RW2Vm5QjXMiCAukiD/kOiv/UmMTATU+5yercT6Das3ucqXpcf4J5P2G+RezQevp5tqzNyjwQXdrS+J2B23COmY6/aC9PUqaJEvN+vfuFXEYy4xY09jVc43BFb9i46vcVQmYVtutYPtQsK4+kxndrt6I5SF0l4drxmBkSlBnHmNDKaj4nAUA2xmqjUCsQuFVSgFHJDRI9CzsRD4rFtvEE20YomCM6JvJHTAmdLiKlB/QDuqCZ69ZIAek4EwpFwc3ITiKCG4xYgI4MalM1qrcIqahj1+Dm30feu847kAAJWgc1Mq5oZDXXebChm3voV//Z3j//z3/xwPm8PszzMslXb6rM+lQ2nIHI3BPLGiHBydwJnMEeP9ijoBGDXvAbEXuYY3e48Kmmbr2TRRxvNEBGYyUEpaj64Q2a7vGDbXLwre0NfTzcYQo/P+kvYXRsAd71aw5jR7ZN3AZP0gq+EOxXzCt7GaUvV54vOVbVKDTACEA/Hw1/943/6/uPXbupawJ0ROOymNdgurAwCRKFHyulwPKSUTu8/bobntarYtm7g/vQ0P1XdxAUQUlKVp/Pl8
fzo7qri5ikN43hkTnkYT4djHnJOKXBNAszMFrL4rmCqopWlR7fh8pIDKACEPXJHt4xpPBynw1CWJNuMiJxSHpKpPpzP25dHk7ou5/PDD0gktahIYoa6lWm4PD2EG/hyoTXsOWwGxVwlYiKzAE+hAXuxI6MZIIUuE1pTgrIIs6jz+Fswjg6AxJxyMs9pyGlAbMaRmIdhzHnglMbpwCl5U8LxWivU2ky1mYOJgGJj6rZ9lzom1bn/AdeHo+Stg0MNLyEldoeo7MO2diDvzNhpmoYMFqTGn7ZKGBWtRIkoExjnhOCgjlC9qrE4oEsFqYgEqo1wgoBEmXkCQKdgFZmCGRgCYSLSVvNJSEiMmLDBHc0fslur5PvacjCFiAojj9bwQ3TCSM6bmYiCmpgjoXlCJkbG3WADApIBGJKAm/tWTUTGTbeqRVxEt1pE9POX+dvfPT2d10uFuYKYl/qS2935Z+SNIxEYmjOBEaC7MbmZ4R5vtWtxaLIk1uADiAbu1swEIIAZEIJ5TFNsZJqYDQ277g6v91x9TxK+2JJ9d829AW2xkzm4acN59dYqxd0nRARjUg5i7NUqda3gIOOBAwbu8Aytaulkbe26EIZx+uabX7z78NFNwiqhWWvy0l0tD+ccMIrgiCgNmZin0yQGS1Epss4LuK/zuooVc0EEZgOc1+3x6Sy1zpdLlXo63n/8+M04jO4eStYpCrvN0IGJEQy0+QEhRRX7OQBAv6cGCF2rnswcIY/j4XgkhOUymWnOaRqzuxVRhAdVq9s6Xx6JqJaiIilxArU6LvMcpIfnk6in4W6wZ0RvhdFG3bVuPhFFELany6zh8oSmPQnRpa7QMRTK6NolJmUHZFYzJw5ZwYF7kYp7q3t3AG0VTe3OGCheJ5ZjVLs0s8QQhpVi3jb8RaRGOIwIRAwQW2xTHEHAYcjjMDLTOAxDziqVftYqRfM4s3ZhsfaD/cOhsQagqWW1TIGbAroHY9lBIEIqb5Va4W4SEGCiVpfek5jtDjVnv23XLfZpWSYiJO7aY9RcqLhfiEjk5NAhs0YhMzNTAwAGcGodiALKq2JbERWd51JLHXKe5zINm0aeULUrXns4KXa1ATdTavcaECH8JcLYE5gBLawSkTt685Xa2ELLWbBD/CYzquG1F0VHi16CR/v3Pn+mWyZvM6fFINdn9kjKn8cDvboSegD3MmepGDcUvHU63TEy6O5S+Dq773+74DD6HcQmlBKP00jCbsmUo7sRtTRSP+fWq7b1dIttFomGPETKDBBCC5U48zAm0mGwUUBUUs6ckrsTJ3aPlkGAGCsECZEcFVQFo3AiWjBbTA2zaJkRrmyrtXRtLkBrUQXoIhIJhxoy5yomm5mWUkzU3KSWsi5Eja8UHQCukeGzEYKerMAe3V8tU/dDyJGcnIjAohfWXpXbMnt7kVeL+rBbJUBHoP1XuTFCmdnconpuL8zAMGH71NiRLbtpUrufMII3BnE4wuAYakd9h/HGMg2duhBliSPK9hBxyDnnxMw36NLP4UqqWArXwmoZcECSxIZk5kAJ1EAVM5MqikCZwAxETIq4m8li4QKIR8vPIHEhQMIBGYkaox8BXK2BTQjkwNFmBpD4CuQiIDPmASkIX83vdwODwFyIgHgYE9CgaqWKiqE7uhNRGoYI5MzMEETt8bw+zFvZ5MsP5/myPj6Wu8O0zmsacJgI0EWrgyFBRsaUqvrj+sxXQkRiSozgsa+iIcRWRuSk5uaJQFPIX1gv2etxigEAVDGKjYuaCI6oa4fgAIAImqhIF4HkrlEL1+D2yi7qoABAUO+7JQpH1Prs6iG/a/OVXK0n4XbDR4gATEYRlncAjXassPlJiAjmoLv2bl9ynCgPDEijA7INkIbjZM2HquBODqFlHe0vARE4WrNiyowhzOzazh4dzJETMQPAcBrSeBK1Osw0b8N5+vTl01q2WisA1lqn6ZDGzIlF5Xx55C1N0zjqILUiw/E4mZmJmCkTmldVV21l9
CYaZ+im7oqAlBIyHw7H090hj3le18fzZb6cy7as50cVWZZ5W2d3uDx8RlMiznlIKZFlkwNohje6L19Hu/WVjBULkFK0JMKUU/NRIyWPLduVUxpyYuYhce6tkmObj8pFh5ClBhnSljMCjOMwTZOqEBPXRETDOKSUo6lpTKnYy1W11mpmUaYCHioUu2LvbdTZjFps3gC440NM2AkZV5OJGNzaREQppSFnYr47HY6HyU05NTLnj1old1BFUTQnCKE0EmQ3CKVbN0YCMkVNQORmIBUKmpkXF1MwB7FmlVTNDQiJOTMF0ZGxwYgC3uR5MPbBHUoKpiogIjIjNy5RY7p7SyH1eBwoZXJgAIfibqbiEXogUcoDkJu7gonausllrttaPz8s58cFEb88XHLC8cDIGQnUJDYbJiRkQHsR9GJTuQ48slX8Y9dsj5MPyWB3V8JY9fvfETBBQ0e7sYhyVL06Lc0K7EJ6O6aOHfiG3dbtABL2/FrvbLnn7axRUgNXCor5XmjWUV4Hhygij7ia3PcdGEN4oO0XDSkjglY7/nyAiJAZASnlELuhzNmDnaTq5gyQ4uYG/QgRcvYo/8yJGMHN6+amIlLKZmYIBJQIkRhgQDY7OCkmcx+nwzhOiFRHQeKUB2JGJnVdtzUpIzkRqAoR5iG7WVS5AyCAqrqGeqcF9bC4mWk1FQCklJHZ3bZtqyKlylLKvG7bspwfn6QWlSK1IsC2LoRAlI7HI8FkiE2L741swD5U2KGZXnESFEd3JgJ3YLYIWzBKgoivRwQdITWDiMSdxxfQWCD8ZhyMPCQMdIRC1il80l5dvftJTeJbJeqcmoZXV+cKFCkIARw1OoweXTyjuQWET9eqZIioWSyExBz9ClNKOWciGoYh55Sj5e/z45lVcgBV2DbYVtAVdSPfm1ZBW3cIkCiwIkBEc6jsiOoW8IebBYzT6mNMnRCIwjPaOawdQIo+Vx2Y3YPt9jciIMZWH4SDDugBgIMAkJupi4SgpAOEklz4KChKtSJSdRCDqrYs2zqv2yZ1q7WqVovOgOiYOTPjNIzHcQRD9WSQEC38y+vMQgjXGNw7FgmI6ACojctmyEbgDsTWMyYRNLQsGJECobkjBQkZWEI2sk0QRCRuoVBT9W/wIvQw63YD9h2Ce/58t3/92X4m12vZ42HcR38PBH2Xyrx+yR51Q1SI2avvdHcrpgsgdRYWIRgimalUMbUialXBgZEZGAgxD5ASEeYxc2ICJ9DwNqNxKSNkxpb5QUCJcEvclRlzZqIMPqkGEQYATaWuy0Ic9WUYDYRbeKIaRgfEHFBVy1aDayO1ujerhIgomTgR4TxfxsshOou4OwLmnAkBcjpMIyEeDsfpcGTm4+E0TlNO+e7ubhoP0/npNW5yHetnd+p5WgX6puA959B3Z8QOACIS9CcBsTUhdAfXkAqIP2raejOrkQNWVSMiVUMiEamlmtm2bbUU02e+kpleQ87uuZORRx2Fk3dnrXV76gy35utHD5hoxpUStQ69PQxtecKXI/HcV3IoGzw9QDbUjXRLiJAOlkZHdGILkYmUoQGkCABYq5cqZrBtUjZUhbxS2cgUVnKpgOFAAGEI9gPu8E1cRluK7XY0m0S91a869UpdAAB0J3cAJ6joYmZai6m4oQEYUdRegXs1EDUA3ES3alX0y6fl8+Naq16etnWp27FKUS1GRz4Ox5zTx9PlFx/ezUOphlVxKTo8p8BhK91MAB5mEvqiDhaSd+4GQPNZrnBOREwOojqqBc5VpT3o9ah2Nf/QdY6uDvE+Dg2yCFfIO/+ho9v9vLxbCm9ZBeuG6WYDuObU9vdai6fRA0u8bhw9vYeA6i0mfWYITeRct++R2Vq5HiMMAOxay7zVavPT/PjlbGoJE1NCJBpHypkTH45THlJmOk45MzlEbwnIDIcxEXGcRiVBEKmLWRkHurubwP3d/REAaq3rtpnpupWnyyMAvnt3L3oP7uu6BTpU6qY1ur+YmYvItm6NA
Vi7v60CiMQZOW3b8XA6VRGpZV1WFUWiw+EAPk1DPkwDMx8Px8PxyJyOx9M0HYh4HA4p5WVbo4PW7SRC7AmGDgB2kO0WymluVKBL4XlEn4noyRH5Uu7JdQRCBLWQvvFa6rpspdR1LdtaVHXbSqkVEXGTxgIFBERVlQjcaimluDcGprtHu13omxNGCxxo3h1G+6KIv7JDc8Ra9jt18xO1U8w05BxVqzn0D4IwTPjaRr/GlaAWKAV0Q90QQzqfo+KmIbwcODgBtpAy3PM2yKxgym6gBFzBDCC6MgLe1H52z3ZHXW62686zAMRoews9sAWIkmp3dDNXCo1HDYVthNYAQwOrQ1FBAoCyyVakim3rtq1FqtUqKrEThA4CJcpDymMepmFwBRZABDXgF10qe1SNza29uhNBP3AHInDbnZfmJ4VpIHP3GD00b6wFc0dEid4EivvQ+B4ttk0TAaEp3Tbj4F06269n8mMhww2T5dkFQWvucw1D+3rBnp9rdvImHxPc9megVLs/4F7VVgJuLHSIui1yE62bVl2Xy/nxQcWYUqKERFwmGgZO7C6DZM1pYCffEz5InV/qDuZgGGkfcVfikCJoRfPrCqVuZqYq67oBwDgO4ziBe6hqhK8UbXVrFVWTKqVsGo+kupmbeIvgFDkj0bouw7Ko1KA1IiCnjODT4XB3OqbEx8PxeDwx8/F4N04HIko8MKdhHH7MV9qdfnh+W25QPtiZcTvHvvlNcPOnR9m7Exsccen+UUvlRMIRGqUuYjKPrny1ml9dxXhPWKVooN1dBYBgvBs6BbuWEYGIdt7XlduELd0R7Xq4de1BJn6Gtr+RT3pplRCQHQfH0enO6COiGlRzATfzCq7kCJwiuZ8GChI6q7kDD5BGV0XOKW+kCpywFnAn0Awe6ksJoYmf7LkjaKzWwGh6i9YoTAtvHXbegCMYhVfvRMBmZk6gqo6O7I6ARpTAnThRSgCYXAZUZDsc8c6yqo+jifg3X9+9//jx/v3d3fu70/37ccj379evvnpa1rJstm7OW8353JNafYyIg3uGDQ3rQRVBawJl5mTXFQwNgHZ3NAcHZEZVc0cyTmYGxJbU2jRwA9iFmtoE3FMAe0hmoXPVQSv3SEKChYBlwEnk4GDoRhCe6S4IE+Pf+pz0/6DlAwNlDxANn8WN4Fe7hNj4dM+mlYfTCM2eIRpGqS1HDgBdtuXhyw9lq023DpHyQDnnIX/4+P54PBymIcN7GAdvXBrY1st8fkTCYFpVkd9+/8OnLw/rtv3ww/fn82V3DEut67qqqqgXcUS8XC4x+tt8KduiqmWdw/qIts4KIhI4HxMgEdPAOCJhyhPnYRinu9PxOE0AA50mcGeEzEAA0zgcppGZx3Ech5GIx2nKeUREphRE6hfLrmW6dkFR7xI1GjWgKhoNEttz4E5E5k6EXEvERA4QrT0jTNo/XES3Imr2+HR5fHyqVS7zZV0XNS2ltC6hPcxpcKeZiLSB0NCNaZKxuyQm3NR592Sw764DtgxIBzMbVGBmCAjmFHVe5gqGURBu4KFbqa9bKr+BdmMyPhgfjd14BDRFQVByRVscChAiIyVIA09HDjmRqLMLEpYZrksqG6vgMmMtaIZa2AzdyY0BcO/d4N4YqyJiaoAhrxSKN4iIYlDUzUFFpSq6kyuBEdgAklDN1HEDFXV0JXUkAI7aTuLECQGAlbIm9Xcw0VAAkTkR8scPp1/91V9+/HB6/+7u49dfD0P6xYLni67rdr7IZa7TvB1+8wVv2dNIxInSgGAQzkBft3S9LS1ggg7deHfSwxiwOpt66IaZuYOINaWERh1p2THsAMPuC3VwqNnxZp9CjbsrxF/BdQ8r0VB21ig+vSbufAec2uN9e27sJNz3yT3K8ObvOTEY4Ksunm7mKu47Rm+kiM7JdUQjsm1+/PbXfzuHduS6OQByQkrTYfzLv/zVhw/v7+9OA1S7O4lIKcXa+nUHr6KiWlW///zl4XzeSvn0+fPlc
mm1DhaUVAMHTAOlCZG2Up6ezu62LXPdVjMt66JSb1zSCFchMw+Zieg4jYfDyMTj4TQMhzyM9+8/TMe7nPh0mFJKQ3Q3I2Tac2FMkV8mvhaQA+Wc8RbNdXC33XcJWShRqSKm1tSiVLdSRSTsA0QXwFZ6alWEkNZtS6kVV7XNKsanyrJuqna+LA9PZxG9XC6XeYnMmqq2qN871OnXQhMzdw8ql5kb7PIuzb/ymyDm5g/tOID11ezRHRgMHJw4kkIu6tFikgkQKWrwq9RGzvgJq2QOoiiKYiyWER2VXIxQHITJDYAVnQCN1JM7ARqgAQJEyhcQOAEzOCI3VXZgasYIuFWsdqyiAR0IhooIjsmDfBRyCQ4hOqchTuQQkmUOZKEr62DOUbChQLoPXhTJhIpY4PXoyImTI+GQB048TiPnTJyRM2ACTMQ55ZzVU0ZOTqz43P12APXoGgDQ5dUiutonebdKcGOV9pcAPPhcIRiKXaY7hs/9mmSLQKF96TVS6lGYeZOabNala790N6gDT95y076LV978vQcLN1FhC9ZugO32Jdj2+Sv2pA72AhQIUmsVYtKumQ1ASJHPUVOVWtZ1WZZ5viyXeXEAJAbiWqd396chcyLYtnUYktS6rmuwZEXE3KtISCyez4+Xy1xKmefLsszWs9oAEBAlD5AgNY0q1JZH26Jn7BaJszioZbjAGQEZQ4wlJWYehjyOOag1hMjMwzAMOQ+JD+NAjIzBoICe0OoEinZrbN+fdqMUBiJ6PgYA33XruiSSSpWqzZGLFBhxr0OMZIiaJqUbF7a546XKsmyquizLuq4iWkqRWsxNJCK4m3li5o3xr92F7hudX2dKT4egX5GXjmD6vg+6mQPFXqloZKox5UmpzXsER0MEjSgoHGeVLhv3I1bJ3f/2tz/8+//X/+c4DqrFpAJ4SkZsCMZcEIUI8hDFcZiGnjdH89DpNzdDqSRCblgLqDS5NXcIIlGzRy1t1BZQJEcQ9jxD26LNoVXVN4FkJ3cKVwiVwc2tqqirOM6GFZDAe2e6RgPRKP11X4sUUQSM3oeHafj7T0+Hw3iYxvv7Y2J+eHj69OlLrbptuhVdtvr9w3k3MQDw6WH5v/+///7/93cPt/poeIu4tDvXr/BqUPb7GKhzd5y8TY8WW3U4es8pP4+O2pq7tX23H7uHxbszDddfhh3qvpq4Hdh4fnR0c3/Yv3z/JkRAMoe/+d3ltsvgVuT/+5/+Vs2wcWcijcyIpGKlmKp9+9vvvvv8uWxlK7VIBQBABUIF/d333z3N58M0fn74PE2jXhNnbeVoFz+5LMuyFVW5zEspxaPipF0dAgBV5a1AR2TAPWpBgl3ZU0sAAI6ho4+RHCdEVVm2lYjy0yWlgTiN06eUB2aemjw25ZRohxvgFsLe4VsEgB9++P7p6el2if3mt7/5n/6n/+c0Ta3M3r3Fa24RMZhZiTZp7t7VVrFt7hyKg5HGup0ZMRlUtVQxs1LquhU1q6WUax1Jd5Kb09Ymi7Uuc/uMemaS9hnewa0dDcLoaRCgHhG3XBsz3hKaErcHTBgVhXwlhG5l++HTpxcx3EugacjpMGbs6RzsoUNbhHgzX29xqttWCd5cv/a4LYxXiFYfzeu/HVt9uQ6vn3w99+akwDUC8Z0zcHNV3V60N16XOiI0MamGusU/gQsC7MWrUERutfIS03FKKb3GL9+4qB979sWjm7F78daf+umNJ37s13d8683z+gccfh3iKlbqlbKEiNOYh6hcvf7i7oW5O0RPmn3H7q8H1y4w69Y3EXZbfjs+7gDQzLjvHS5fzJB9Y7uZTf5i1b08GnTXF97zRzt/cAf5bsz27b/PD1Xdtk1vgpSch3EcA7nfz9rhZj/Z/4brhN6/5Qak6g8Rng9PtzXd6Ph1Avz0JPOfnSI3X7n/iLfPv3rmesb7eO3/IIC511rlrVLBPx9/Pv58/Pn48/Hn48/Hn48/H38+/nz8+fjz8ad/vAyGj8fj/f19F
Bn/r3JC16OH1i2Z1EP6/bUbCOpHQKv/4sPMnp6e5nnenxmG4f7+fhiGP9I3/oHHM7zlBlTbA/s/1sjsx2Wez09PdtNcCK8A8PW53+dUvMP0N6DEztG6OW4xDbhCGZ024y+gqGdf8Rx3fHZKeKVFdPzopfR1/7br+/YU2w0U9ewbzVxkL39s5x148avTeTkaP338/K19TU/8Qz/nGcj76hfxzWdvv/bnZ0DgjC+0FZ/l4IjoX/2rf/Wv//W/fv/+Pfw4KPhHPWIcrFHcXEVKLWaWU8pDxqiJN0ME2pFqJLjy1nexUMDf58795PHw8PDv/t2/+w//4T/sq+6f/JN/8m/+zb/55//iX/wBn/zWDbmxr89bxr06XoDWV7g3RA699WaKtC44IFG0Vw05VLjBZV+Dlb//RbxxVu6q+v/4D//h//o//o+Pj4/7F0wjj0Oj8CBdqfF9KfaFezUgPXnhXmtVNezSlF0nAtVNTB0AiUI8Yb/3kU4loqj5VNFai7m5Ri/p6/hFW4brNVzTSRAlG4koyiDGnIYhu/u6bZHAUnN16N/CLUsKYNp6Ro0jT2PqGT9EgLj281z+/rcPl/naqHLI+TDlhnbvp/eG9YXrLX/TIODLNY/PX7z++OylZ/bxNVaNN++42WD6TaMrm/fWCu8c7V3ydk+k7yk7vJ7TvkhRRH/73eOnL5fbq3tplf7lv/yX//bf/ttf/epXP52t+CMd+1mbmZRqZqVs8zKr6jiOh8NEiGbqKoiYcubGMm99csIQ3Wbi/gut0m9+85v/9J/+03/8j/9xt0q//OUv/4f/4f/yf/7v/3v4Q5b2j9qk3+fwZ//uFABTiYI7ldraCJu6O3FKeWhsT7oWbex+wO0JvEx5/vjJvUjfRPas1mru/7d//+9vrBKOAx2PiZBCRgduvJkmd9H9ipaT7ieiauuGtVZCSsgEyIgDEgJWlaLoAJgYU8tAJyYkGnLwidI0Tcxca12WRVVNVKtes9zBULXbisrG1O2CnzAkHnNiptNhPB0mc3u6XOZlMfeirubMaRwPzMndTcHdRWqtKwDc3Q33d0MQr6OQOkSQvv90+eHz5dYq5cyn48SMnRW0b0u3udk9MfvcU9sfPPNGmxW4vZ/N1AJcDcftvXZ/Nh2w35au4bGbmL3ELmzKtUY8PhF7XUP/zV5GjjvDh3v2suumtPoBB3DEdauXefv8cLm9zuedl6KsLqWoJ/xvapKep3RVFcxUgSnK7xxMTaojmkioUqSUYl5SyiG+E/rhjcIAgAA/mcD/+SO239tnsI/PW17qG8cbL/7I7+PrnTKee9sqmSKYgiGYOHTz5G7oAJyQkRDCWwlySN/Ybq3Sm0Hej17PCwZDTA9+xe3GpjFzuwT2xqwePtL+ws1nYywkZiKgRKH3BwSIXWnbu2glBj+3iZpRoqafykTaAznshXqxoNwBkdhp59gjYufaYMpMiDlxTkyEOaeck7kPObfSD1AH63ppCNAkbAE0WqHlxNGUMBy3fbBfR1G4+yBRBuRX4/DCc4JdEbE/tZuZZyYImx25dYsRcb/l/Xd6WPrcAeuWJcafoPdfCWN0a2J2O96nTjdMzXQAQiiqNGW4uMwuUHf1s8LLCjpbF2B5drzR3vN2ev3Eq/+Vjxdf5aZSVGpZ5/XpS5UC5u7q7rVKrTWl/Itf/erjV1+HWnh4+nj1lf6LQ5R4e9/VX5zqm5/+89/147/RvWC4YWi96XR3/ol7FLhLLZeHL9syi9ZtWURlnA7H+/cp5/FwOpzumdk58T6R9v3z2Sn9XuPUVk5vBPbm6GC3StikQXXn0ITComPvZXZjJNuicR8SJc5MNKZMxCEqCObk7q4ATtg6YwyJQ0VsSJkThxBaIjYEUI3OJe7iAHtXtpQGZjazUkr0Douuy8OQj4cpqn8TISGejtPpOLk7JR6mSVQezwuUwsSJkTnkZxMCiKBUBPTTcTyOY2uMDujuEtIRb3WjIATGnf53cztubvPNP
75boBtG1W18dKVZdnfn6t3svxnj3TliN2QxuLFK1GSR493cH3WJ0Gal+mS45Zq1KHhX3CG8TriXERwiAJijOdAbRuknrdL/iof3TpZat7LOtWxSSy2bmW2lblsdhvHu/v7+3bsUfM+b1fXTMM1/4fFfyR5d3Yj+A968tD8Jtz3cnlknD9XpKrWs83k5P9Va5su51jId7wAx5wGRhvEAAIgETtct+SeupD/3+tmd0de3u96M/K1r7dhCr/7bOcTYGkhHJHVlCkOrDWYmBkjMw5CZyETV1SGaeJq7I3hYpcSUQyiDiYkScQgwEyCYeXSggEaMjoY9w8A5D2bmrgCGhDkxMY1jPh6nlLiVBBCM0ziOY8Q5nFKpdS0iqruvxEx5YERkdiZH9HHIodRxvT9mIeT32ge+ve4Ys7ec1me3qsM3Tb2/j/AVx6GrvH/78Oc87KuT0fin3usH+u0Ozwh2nXjcDTpwk7zcfaX93r8E++MswuG6TiTHDiEA7A6kA3jzfF9c8J+qVTILM7Qt83J+KtsqUmvZ3KyKVTUEUKmmakT+PBDw9vcf0zj14w/8Cnz1A76as/7ywct/oftKorVI2cq2butcSlnmSynVAHkY8jBQyuPhFKaAmBFbJc5Pn/OrGfLMgP4+B75YDLu8V0ctekOTPRS5fnX0OEu9sENK3VQMnJlyYgcYhjwMmYhy1KYRRVEsETJSIkpMidmTxVYMCDlFb2QchpxzVlURdldmzkNmpmFIKVFKBFc4PCwaEhMbJ/ec8yB6qxYUQkLQyp8QoZVDhOEys5CvJny56LCL+QFAq6R8HotdB/zqLndfqTWFe2ZxmjtD1wftF+gGZt4tX/QLcvdbMS9olq4r9jbT1kCi2xIIxuuOCQA9xLy1fa/Qy2eX9OzJH8GI/lSs0o0z6QCgUpfz4zJfHn74/tu//5ttnlWr1uruQBk4yXTYLhfZVnBzPTwv6EL/YxolfPXgD3nT65/f+Jjbi3n+QhMIMpGyLev5aVvnx8/fPz18Llt5eHwoWxkPx8vlknMuW+U0DMN0ODlzatuc30IdzzzMn76sFmJdgQ/057Hg/gIh9I4RGO7PMIzMXSHXPcohb0v54lsZ6ThNw5hzSnfHQ05pmZdHF6kABMQECIfT8XA8RIsJ6ksPiRLRmFNiNsmHcchMDuZogDCGjSYahpxSVhUiywlTSofTIXomjjkToYhIVQcwV4PoHZQ45SQq6jnlEPAhRCQIgDwxCSUAZ0I3D7cip2RmYC6OiRI+hzeJMDHnRH3k97GCZyN6jbwaCIVXW9NNfJekpC4vRaFd21tmwb5J3EytVmFnLvZMIbknI6CHvK2/ElK3SoA7CtSLZLonfDt7rsYUOnHi1lPoL/dvfm2b/iSs0jNnJ5x901q2si7bcpmfHpbLxVSsCoDTMFGemEikqggxNwVsAGhLJSRAdlLTH+X4mY9tt+7treDH3/uT/siVhhMpOJG61bJt27Iu87Zt8+WybUVUATHl4XC6r9uGQMM0uRngtdflj5/AzzlSz0Tf4Q3nu+Mm2OEOJhpySimJSlTMR1Pzvl37jk4QQk485DwMeZrGnJKpJCZTTIkChxqHPI0DIaE1YCa+JlqFMVFiyikhuGOoWcAw5HEcws1JKaniUJK37klDHjJFSxUIVag9qeCIQIwADIDDMMQqI27wMEV+pftKBE3umaBJV1M01sUXsoEQaammaX2Ny3qQ1Z7ZRzL8zY7a7MboGqY1xybtFqT9Cy98JWhmws0oJORp77gUXt7+mXRV3I5PvSHhIO6Sp8FM6Un+Zzna/hD3V/rVP5t+PzLf/ySsUp/szSCBm6qUbV2XRWqN5EjX6AcnNjcw1VrKugKA6Y0+SyR54mP/aP7Sz3/sC3vkz1zXt+zCDbr5xq3y675iHjKD27rO58u2LnWrkSVCZGIGJFUH1LLVZV5MLQ/DOE3kdpOMA3CELmT5+x8/m5VFACZOoQ5JhIg552kaU0pVGBDUrg2cV
EVFASBFP9XE4zgOOeeUQgw/5TROYzQUMwdEHMdxyAmRyFqT3w7Cxvp1JhqHnBIBOpBBtPoZcltaCI6QErslzinEcgDAgwwFwFF3jWCuppG8D73KKiKBKCEiUfRkQQUDJ3dgbx3CPHRlW9sQe+FKQPhKiXPiDl0D3RgleBYN7aLcDWVuUdsLHAebVcIm/3gdlh5b3s49R3SySNZGlNumV/9evOYZu9PUj2vCzlsv3PZ3zKabrrttusLtzMZnE8j7Bvt6Tv1JWCWAblQ9BMO0bOvl/PT08KUscyLCnBkxJsxadK0CUusyL+dHU7l7/x5aDwNsHsF/A0jpDz1eGaY3Hr75023Fv3s0sK6lXh6fvvzwQ9nKPK9lM1FHSpwQkKuomM/z/Pjl8zCOlNIwTSnYhswAiM4N0fp9B+oPAJVSTtM4BnWDmHLOp9Mp57yVQguraaimAnjZSi0FEQ/TYRoGIsoDhxT0kFNK7J793VHVon3YTciJ7BwRXMgEunvI1eRE96eDAwA5kAMCp3jvri6A05hzIqJgPgWTyQOSHYYMAEggKm5Qq0o1M69VVT1lGoYh2nmkjIjAyIIOBmRExgAA6qLV3LWG7MozyhECJKZpSDmnZ3m07lv2WRw+Szg+157G8ApA2O3FNV9GzWo9YwZc7+Tee8WJOhfUvUM+uxGMLgy9g8pVzrbFH0G7AEQKPyBwuM513x3Om/l7wxj1+FLo2iovZ9HbVuktx/y//vHSSjZvr/WZrLXWWlQVu+RIYgIHosZjVhWpNeXaIjjcQbi3DdN/m4v6qeONs/o5k/T6t4N6aCa1lrXUWlSaUGPLNgFGk0QRqaUAYsgJmeG+bf8sofynTrIfP/b+xjkiioR96oeacWJQiI6uAGBqpoqIQ07DMERmjXgHWSHYc0SWOrPfeou9wJUomhERhZxsbN0h0gjkzhFqEXMgO65qiBCtKrspaBExdBw6riJMWLQGCb/HPeTYoyFVaxvrjZwTrWsRei6iHeYv3ctY801jqEeg9CyCu7FKFB4VRbdp6E7m7ed1c9atUvO8+tXdIDm7daDewRApgO/9dnYfrX/o1UN6hnY5dit2jb9DVujqDjXv/gU2A9B53bB7SX+6vlLni1mo9K3rOl/m8/mi21rnxVQykzAD+LYV2Yqrzo+PKeVStvuPXw+HIxHTMF0FW/0l3v8ncPykc/Kz7ogDtF6PIlLXdZ3ni4iE7Ta36NoAAG7gblLLus5qui3Lti6Wc8pDsgERGUPwND71dpj+MD/zLVAJU87jOFLXAyOKoEYJcRwHd2+OTzQUAiDEwzgdpgkREBsTVmoRATcjQuwdPhDQrcVc1DXF+9m7moTWYtt+OM4HzCk0WFVVrTXzhgAvRaHTLGORxUuhXesOUdVzew9CndDF1QzDeIXwtCAK+o3eUy8MshcfEWFg4j25f8st6kh281CA977q4St5u0E74tE9JrgJlZrX8tKv2sGg4CrtU+p2g+qsKEBA8J2G7UDQqGZ9rcbVdYPe4ak+gv1HuHGd2glfldd2ztTLqf8nYpXa+AbDrWzrfLk8PD5++fJgZZN5dtWcaGBGgFJLLRsxP3z+VGs9zu/effWL4XBMeRhTZuZ+kY3I9McwTT+7dl8M803k9spW/ogx8rdf7fqqpczz/Pj0aKq94sTBjFqnbgPEsq3z5ZzKdjwdT/NJh2EYJ7OJkJwompSgx5zrXcWvk/v2JK9gAb44o1cnH0HQ8XjscL8TRdM+R+bD4YCEiVNOCQBy9F1COp2Ox+kA4GbVzdRk3VY1ieT9tS8GgBO4RrdoYNyRdQAwjS5m+/laSziG4+DuYZWwScqRu6qIW1AEIlMWJB7YStm24g5MiZBv93szU3UTNau9ryyAgxXX6mAQjR6Rmsau2ktcCYNEnnlPCfS+aB02whv0qqW+ILw99z3zBbfYDe7n0RDtuJHdT7pewI1hcgjt6GezGb1DUdAcyfbytTvGjgfFmezylvHqXs7c/vdrG
q57ers2K3j/+8XxJ2KV4nAHMNOQLpYqtVatIlXcFJyiNViIxgOA1FpKyaVILVIrIvVk3G38/d8IZLr9mjcjr7ew7p/zjvz6O/sM9CanGwGshBK272qqkRYBghbiCiKGb0VEYbwc9y0M/xijRC2h3DFUaDsn9obGe00GUVNT5Wt5FbaeVW6qGqiPt8R6m+w9irmNRq8x0/VyHMAgpMODj25ubgZITo7oDcf0K+MGOuPZe8hG2AMVROzeZfxe9HFCiNilMTehtXE3ug1enh+7V9Q9pBvo+va1hnNHhu6NZElb6beX3NY8YttpPM4OOzjSLMJuCXZj0U91x+1gv7Dry7hPQrgax6tvdOsQ7e7S9alr6HbzxW8KO/xpWKV9hNxM12W9nM/np/Pj+fz4dC7rujw+msiQ0pQTISZyRieidZ7VzM0/f/89EE/HE+UBWkI27djhH+N4I3L5A37/53VI47eu/8ZN7otVRGqt82V5fHgyU5NqblcdcURHhug5jFhrPj89jdM4jOMwHYZxIo6SXequ+5vnvtup2/P4GUdpfyG6N5ipmyuCuyEggXk0wrNoXQuqErdIRSpu7u4u4KYmpgbuUkWD6MCcc8ZYaQYIICYKuiMxZgrkxAi9aRV4b+PcciCtiQeAuVF4FoQE1LLvnT8VfGwkSgDAnIgYHJgcAIgoMxOjm5lGNG0qCu5ojE6wWzgizinlgVN95a633Btez64j09RgphfAzi3O/Wz2XN2S6x3qp4DXL8Ob5tdwzXv5C6uA13ODG1frGpLFD13s4eavsHVh+mH/qvb3Fc28mVGtG8qNJ3Vz/ClYJehbn5vKssxPT09PT0+Pj08Pj0/LZX749FlqnXI6DgMT3k35NCUiMriUUlT00/ffifnduw/H+w+cBs7QmnD9sZwkfLWSf8rM/EPPwm//bzfYQc2kSi11vsyPD0+qYqGNH/0sEZBapZaaGwCnND6NOfM4Tce7+8PxlHJKKTsnBGjtCn/0FH/cJLWn37CwURYbFtTUAFo1JnkKjRJVkrg95t0q1U21uzeuruH2ikoRcfec8zgMhJSQUnTQfdVHjBA5UXcZIRAegLa4PeT0Y1GRhZcToE3UWYC7OWhTA4dQg4mCljAfQcIK9rmImrqIlVK3bQOHzEOiodsPRCLOQx6H9KLzElzB7B1JpuuPz+K4Zq+a9dqHvLuhPaDyDjI/vxXev+51Fq5HVy/v3a1L1r/vxkECb7DQ7iPd+ErQN84bR8mvn9Dffzuv0Xar9vz4Mav0s7v5q4n84rt/6p0v33szSh6zR6N3YLTKqiK1kgMDMtOYUBQZHFURSUXqVsq61mmTWlUEiRqNsp8XXr/l2an783//axmxW/DlH/aZt/71s9va5kE0gDWJ1qi1mrWGhYCAbOSA5KISIu1Vaq0bEUqtKhXbAuzlZT8KvL0Ynv+So03ntq+aRQdWuhr4dvefhbbN42lQhZsbmiNGddveGCKOPXd0G5zg82hnTzD1LkkB6fh12e78Gb9JRiFiANLtEzo6sv8xAPdwAyMg64gx+G3U8nJYoSF73pqmNx/nrb4br57C1rz47XsT5mO/KPdXhunZebz4Frz5/61PbuN7M0evluv2tetL+516FoX+WIQLP+cr9fDvH348x9J+6qN6NG+t53IRLVWWrZ6XtWwlU7kwMZHUUW1KzIcDjA6A6+MP35d1ret6d//OpE53d5wTDtgbzwHAq9nx9on8xBR663hxXTfD/A8eslsH6dn3tzXge3O0bVuXdZZa12WutXQkAimlPIxIPNYqqikxIpjWcZymwzEnHsYppcwpR3q85Xljj39NGPgx03QzP19fRdCuOXLmt8+6uWPwuREhIzMxglNHfAOYRnDR6M1KzBzSGqqGAB6dtgGA6VpL2l0OQARtEC42+nQbN4JrUUZKiam1ToToqhmIW5OogugrFR5PcJ3QLAbGVF1RxUzAFdGZKQNAHqZxnKC7D0Sk5qXUKuIv1l9rIBpRl
SNiMESviBIgGDWz3beNfmMQERycHC283O6/3DjV8S37JoxdO2a3TXj7Q38cJxAaLH0jf2ZGOprUr/HW4Pgzz2L/fn+Byu9T59mDf1AE91Mu/k++7/kZIf7IR+F+UQ4enY7VTFSr6FbqZdm2dWMI/QdCUGKIenFGcvOnL1/Wy2yiH7/5BhEc/fT+HUAC6AWpfbN++bUvL/PHLv+t443rwNd34KeP10sdrnfsxXMxmB3nFim1rOtaSzmfz9u2QlugkPIwTkLMquJunBjcTMo4Tffv7g/TOB5Pp/v3oylgFJBe99K2bb+6up84zx87EDp9Kt7RMAQDQ3NzNQTg1LnJ0DR9qNNhCMnAqLH5AqUydDc1UENEGhKnhISMDOHMUOPQuro32hQ3ipMbAGROKSVETDkFjTOskohY6Q5ZQE9xNkjExMw9vWQRFpqDqbmBGYITYQaElIY8jgioZpGNUffozP0i0nT3ZpXCFoXdIW/dTrEzFQDdycEbA/8WBHQAdNrZ1GGd/BpGwW7K+l3t72ubT7xl34J2x3CP9/ZP3e/0LajtO5p0zac98/D99rX9SXgxDm/OLYCftErdpjyLSPqF3f7W7aPr1noTf8QA9Vaw/oZX2w4E2Hl3MV8dsHHYAAjQyYpYqeIOVU3NANREFFBLKetalrkeDiKVJSElpLh3LeVyzSLsBuQWR/wDXaUfuYJ/yNt+zBN//RD3LBZStHxVN2k8HQNERyERcmCRJGJupaSUGBC3dVu3FZlFqqkAMXnah+X35S09N7yvT3xfDrdxAyI6oSH2+9h00dpu0e8CE7WydSVycnByAHByIGwOI5i3QUitR+TetjbMEzG7OyFR2/l3oKbxp/pL7qBw/Q0iBGp6cV2m5Xk81RGGiNogfKrYDGh32bzNLjWLltwvfKVbh6IZmFbYe7OWbpbxbcDSjAU2a4TeeGc3vhBeV9yNEwTP7ideP+7mRnWaUhBGrgYM31oaz5/AOJt+7RFJo7+cHb/v6vgH+Eo/PmGvhmg3rxZjG7OmvfNVmIDdnSFOx9MJAOZlnQ6HPI7EXFW3IjFahAjLWsGGxABEjomJ1CHxQvDp13+3Pj3Ush7f3anc5fGQD3fY0su7NQIAaEQzbBvJT5nKN5//ad/xOsH85/3M537HK2d/z2S0j04pT9NBah2mwzge1LyKnZdtf3fOwyZOzGutaxVimtcyzcs4Dnk6uNvp/v707uMwTZwyEiFmCOQkPmLfQt9ykG69724k3rj8tuPGUqHWctIQlNrsabXpBr3iAIGACKdxGnIuUg29CKsbuJoDEyYkBLAqRoKEw3FM0wDuutMUEREwpTQMGQDBohFxhEMOiMwpmEqJEzO7m6q7KwIyJUJHAmRwgKouBu6R7zcEQDNwa60BLKD2gKTC/ULmTJwAXM0cXM22bROpy7betqiMuxTIYLcYbt6rcBGxVeRG4RsZOUVD7O7GNKICgDUDQrd+i/cJfXs3+h19rsx6db+67er3bZ+zDrdYtPsVyeq+1M1Svqb6uolqYNnNrrMbT99/xDdWyO+Zg/v5xfXKJO17anMrsfuQP4quAhLROE0AcDgc8jByykAsarXV3yIg+gbiNqR0GsZTzkY0uLNwITx//qFuS56G9fJEjEicDoZAzae93XhufFvYt5rfbyz+0OPHxs6f//ts2PZHfvMKAAAEsTAPQx6GlAcqpaqvpULPh1R1dSRmMRNzIqxVS6nDVu6+fBkSi9oyX8q2ZncbJuvtav12XH56MPZt5+XZQXdZMEJp8PBdmIgaESlkcCMwqwqq+xRBxCHnaRyJadNqAOimhgSQiDInBFBAdUDCPAzDNPqLzqsIxDTkARG1mlZ1c+pivRxCTNREmdxQQdwBgSjEaoGQ0QEMVBoLHMwcAcgMoTeej769jl2SKPQBEhGFFXQAcyu1lFK2Ul7U5zpAzz3FeASW1h5g434aNECImkm68Xti3VPfy2Ntxwb4bAvrd3Rfcs/X3guz1NzO/
qnPbmzjBYRv9toDeuFm+H6euy93nR77g+slv5psv6dVeu7bPzteOPS+XwR0fDZM8E225ycmPXKo4Q/j8Xi6u78/P12GYSxbVTNVA4+KeSTQUmUtdWAWIkEksbIVINrmZTlfkAhpGI4KCamButBy1N3HfXbOPxLAve1C/ayV3veFH3n3/tU3Eflbn7HPwXgmKjY5pZQOh8Pdu3tHyEMmJjM3FXNH1SpCsZg65BuXva7bvCyc8zJflvmiqsMwEZE79elBfZDedtljtu5z1v3loDmAmFVRROgyPgDU0qJOjcFp1iZ/fGtiHphTShRKrNRWIQIyoTerhAjIOTkiEoawgJlVNzftqBqgu5sCYuCTXQYTENCjPtDBSR0gJJCCtNyckJbrgyhgBYAG/0TgDADM4GgG4FCLKHgrCmnVNQDQbK4TJSaNErzXk+DGJF3XTwx7My577r8bgeZutEVst/apzWkMd8ZxD8nbpLmxSS+ClO6hQbMtSPvb4lva2WI/N38xsZ/bO+xLxm8CIuyr7Q1jdv2AZ8dPWKUfNRwvn7g1Sd0otZypaVglDi3EHnC+lop0RHAigmEYmdO7dx/+0V/942k6IvBvf/MdAC3Lcj5fzMydVExYH2hBsTEnfgeIg66bf/mSzhkxTcf7w93dx7/U4XDK4wTEyClMfYu5bz0DANhvwPPr+pGo7sWw//g4/Vju9pqwCKrfzZveuM3thKOMIKU8TuBuv/jVr7Z1+fz50+++/+7L44NUWbciIkWUqyIhrymEE6dxGMcx55Qzi9R5Xt69/2imx9M9czZ35pQHD6CKiJ9N1ueXfQN3gnsTon1+Zb5u9fGyYq+WYuaszsSUiIcUTlnwhZITISWi4zSepkxM45hSBgEkglAIYmBAGJjHnAiJaUxIgOiJgKlKXS8q60pM4zAQEbhoFQBQMSkGDiGF1sxQRScUFadQR+lOQMDyJlrF3FXcqiOiuqMSE/LAOQzPSAg4z2tZNzfLnMZpIELK3LCyzMaYGN1GJizF+XlDisacamJO4eg0e9rsmqMBOCERmBkShcmha3wH5D04eulcNx03b4btFva+MSLxVw+sepSHHZ/b3XS7YT+Et9T+gTYt8TpZmnFseTftiTrsYSDup3lzFlcxhJvjp32lNxbVy6demaSrz+HPEoi478Bvm7UYE+KUiHiapnfv35v5p09fpumwjOtWaovzxSKHsW5lRjCzUseak4HgsgrX+enp/OWLVjncf9AqzEKZnn1bq/p6ZlfeMB74Y1bpjWF6c0huXnzlYTZX+wXrBt4IcW9HHIGYEqRBh7v7uw9ffVS3YZqYk6qZu6iiuVrAKCqq1HpxoKrO8xJFoU9PD4fjBABl24ZxAgBWBgJCcKeQTHt1o2/utO8318Bf/paobVX2Z8jckZiBASgBUsN6Yy6HRlrOaRwzEaWESKHl3P8QImJONCQmxAhcAUEQDMAbw1oQGCEo240taepmBg6EKbJb7m4AZBi1JIDoQLcL1d0tMnYKvcwZzCHOqLdUyYhYSw3mJRHmRMQMvMeJbZ3lxOBNaer1nLm97/h8EMNqk2Nzf6Ablwb9QPuxZ4/2d0ELmmLPuGEJ3dqiF3aqBYfNtDR3syNDANgbY+1+3bMvvrVKO0TjEadb85v2qpxnYVw/h7cCuB+zSrcj9vxf6Pfv9RscYgP1UotINXfVaqYppWmaUsw4vA7yi7PpZi1aB+W7u3tw/Oqrh2+++QVzAsDz06WF6AYGXsXWIg4wl8qJczJCcoOylvnhbMVO7x+XxyetMp1OzNzCh/YdzUjGYKpbY6zsQYkDAGxllRdQZb9a3EGpN42Xv3zUHQ0HgKCJgruqhmTdrtbFIbpxOzzPrVakfJj5cDy++/BBzX7xzTfz+elymaVWMLMdtjA3MjBSU1FFhFLrVkpet/kyn5/ORGmZL5xSHjKAMzFx4mQtrbWLetxcit+YJDNrNYnPJ4N50+tRUzMjYgdk1uQJoxGUx8RHJk/Ej
h6FG+4IqGgkUncXDN0RHAxNBChUSLK7S62baq0V3JkodOMScxTfuCMmYGRwjC5N4FGDA4SQOIAk1AjuqOlVY+8Z5xapECRsfSubq+UAIITkbiGkwozMRIzWRPqh6b31EIFCguTFMPZZhh2H2vGXm0zJ7nfsTgc0Rln/L0ao7XvYgsI2x/yqN/d8BsGLt+JNJIc3vkM4ReEcIfYHccIdjcHe2gS7nKb5Nfu2pxr9uVd3O13ejDf+QRUnry+2v2Bgano+P10uFzOtUs10mqaPX301IRI5X8uvnp2SOzqQQ3Tu82E8/PJXf/n1VxWBHr+cv3z+nFP+/MPnxdzVTM3RZ6hVZKwp5VTcppTBaEo+f7l80t8Ow8g8HO/fj6fT+7/4RT6MCCTgilGT1XK/DIgAorJJUdfgTDfj6v64PBTZXlx635S6OXrbocIX9gjaRLEAaEstblZLrbUgQBrGlDMRjcMAKXU3+pmfFTMnTBcMw8evv5mmw/27d09fPt0dxk+fPknZwK2KrlXczAxcwNCICJFU9TKv7i5q33//g5mt23a6fydax3E8ne44pZRyGgbC0GXjZ1Fcn147scfMai0i9TbSjbBIwpldtyqViXMVZso5qSoxkYc/BJRzSoDuKkWqAUKpDgjSOB+A7hiaRmaq1RExcUJX9/UyP1zmcJuHlFNKQ84psZmqgINTTkQZAQF6hZqoiyFCImQCNSjqBk5AzAkItm2TWtTMjMEYiBLRkAZEB1MxQ0QyRkQzYQJIOGQeB0aiIlJF3azppQCGrRxyfVFx4ruZeTVNsM0r6OYI3MyAvKHu2PX+sbmT+w3qu9i+bViPVPzqQ7ywAFe3a/8Pm6/UJrYaImH0WAi0EcMudf4DRYPPiMMigxF7Ozj2EE5vrevNhO4n9YYn+bZV+snN//Yjn72w79BV6rqtqipSorqyF/ojhXTdazfgOmTo7szpcDjYMN6/e/f+w3t3Px5PzImIGvvWXVTjTm4iqTICqqgCVazbZbFN1vO8XmZAklpiXK01dsRY49RXvrmKNenAULw3MzePZuJvD9BPg0q3l7ZvFL0US1WlSsi21LLtgYozmztHdIf4dgSJiABENE4jIZjK+/fv1/MHkTqOQ0ps7lj7tOrW0MwQQURqpVLSuq7LsgzjuK3Lto4IMAxD0+Ug9J5LAuh78l4K0uyqW6w/EW8exM3M8Ga8RFVEjRyIzBkQswgbdycfjWMPanx+ADAwCy3vDvtiY24E77BFEqFpt20bAKREIXTSuU7uhO7ARCknBAKPP+FCIgIwQYgtY3R1uibFmwvYYJxQgCJC8OhG5w0ZBXAnQvfm44bISgxNXAwiIqbesOhHZ4jv6kYIcIu4duMEzTj51T3pKNDe7KSZpO7/hLfSISF8bguenUp/K+KNtwRX+CiSRN1i7e+/DZvawCF2QfGGQzk4QWtUTA6G1zWzm46dWfXq+Elf6bWFvaIhANeJ276r9lTo999//93336lqKUVVTqeTmR3vTsfp8O7dh5QTAYVqIlzXbN8c+mkzJya/u7v75a9+eTqdHh8efv33f3F+Op8fn84PZ3ePjl8get6KgqvYiQY0RKcBCiS7PDx++vZ349OZxpxPB8pJExoTuLtaCAsyADlsWi7loqaiUmv13knkhy/fLev8MlyNreBtFvSLoWoGNCRESq3rsqjq+XJ5enoMrchaNiK6u393OJ6GIWNXI+U9Un/zsxGIiJmHcfzw1VduAsy//O1vifA8L/b5sdS6j2RYQ0CoIlQAEB+fzgBgDp8+/aCqx9MRwHMcwxiYN3K6dWmvq6OvPVWppS7LbDeANyLmxOOQzVQqgykxDYmYiWN1uwJyVAM11Upuzn/QfMxNHU3BYn4RIsA4DIcxM1FKOZp1q0aHBCTO0a4SgNyxNVABR2JOCZFcEQzdnIhDGZjCVfawrGZg4goIppo4EZIaqXUlcDeIahZAQIxKkU5h8TwMxAyIZl4DKVc1U2LOyMSJKL11H
/EGWdmtQeOM4c2tD988arHA0bBvqoyR3O7mqG/2nUG5OzzPl6s/P4letNIFuGG3iddJfHMeN2/FHr513fTW8ckip+QY4xaqDX5Dqnx2Gvjsn/34Kau0u5bYVmL82DHO6zUBIrrbuq3n83lelr/5u7/9m7/9GxXZtq1Kfffufl6X+3f3X3/19TBOBzoAA/ZE6G7IHSAiOHMnxJQTIX74+PGf/4t/HqUVn77/4fHh8e//9u/n80XU1d3UxM0uy2XbtmE80QAKXj1XNOKH330vCPkwWQI6DjxmPI4wZjOTragIgrM7uq+ynrdHMSm1bGVzc1FR1U/ffz7Pj68cn2ZGO1P8FVzXB66pqqpVqaZ2mS+fP38uZfvhh0+//d23tZRofpsSf/2LX3748HE6HFLO0UaciBxe+LdXzxcBiDnlfDgdfvlX/+jdh3fH+/vHhy93p+P3nz5vVS/LEqs3DGOs9nVzlVqrJOZ5npd1nQ7TfH66f/fOVMZxTDnnccTWYCjijibgE1TF8JG8C6qUWh6fHm7dSQQch3Q6DKqqdUNTZh6GoC8CgrV5SkjozJjjFcTYYFVMTM1RDM17nT7RYTp+/fE9E63btq1bFRExEedEKY3jOAE6YEye0Ot25JRyJiRDV9nZPggIhFHk66JSqniFhiyDDzk7QBUAgQaRg4EDMCJyC17dOaXT8UCtVS5F0LqWGnxud0+ASJzyyGl9EcFBR673TX3/EXuWDVv9DMZqM3RT8x5ftYvg3f/A/RO9V6IgYmvb2xzP3a5caQO3tqHlRLDLwO0elr80Ug3aCp8dMTpRcS8OIm+rOAYUDBRvC1fg1vXev/3F8aNW6ZZHs3tI8YKbdYehDa23qtG2qpdlPl8uKrKua+iNXeYLJz4dTw1UvpIxrhfeHaUG7cWdyTkfDgdmPp1Op7uTqg7jgIRo6NBUJ0TVwQqnKipsCqqk5FC3sl5mNV2XZVvX5IYJMaGrlRCKA2czBNhkXcsqWuP8e62ZrtsiKi89pVdD1TGBZ7/T8yANFVbVWsq2Luu2zfPl/PRUatFatJaU0uF0N04TEoqIuUUiJRg0Lz+4j1r4EUQ8jCO4HY7H4+l4Oh3P85JySjU5CJpeHdJQ1wVAkq0UIlrXbV2WIac85FK2NiFDSR4Jib2/06MILNwL0xaESq21Sn1efYpAiIkJwRORhPA+E/M1Qt+TyLHf7kFAbOrWZNlhXykQwkYpM1MpJdzYxugO8hJxxKk3oGrzQKKybq/8gkhJ9mgkQlFvmvoQYLwDEu0lMe2irjkm9zif6M7gjfAUJHRr4ikxZPt1PT/CjFzjDLyGUH00uitynVVtle+AlMcTeGWodI/p+re3274/uJ3ALdq6+kcvpvTrOf7sJj8L/W6jv9ivcffcbt/jrz/37eP3rIMDBxepqmpmUoubQR9wUakiovrDpx9++PxpXpZff/ub7z5936xSrcu25iE/PT0B4F/88pfR9wJwiN04hlbVRM3M6lZFJXNiPhAkznQ4TnlIv/zLX/xv//f/m6fHR5Ht6enzum2P86Vsixq6GjkmqE/zatU0D8NExknmuZDznNPfn2zgNA3T1x/G93fmtq1rFQEzNwGzYtsiZ3UJGWzrWiHLdhGtrwbGr+vwOnOu9816jLOVTUW3bX18eCjb9vj48O23367b+uXLw3efPomISTURTuyA27bd3d2/u383DENOCY9HT2lfs/sm0dYR7JwXTyn5MJ7u7v7il78ch0wpPzydp+F8WZan80XVvK8lETVUNSNaq6i6H777/jzP87oh8TSN0+FwPJ6IqeFcDlUkRMFrDe5BK9MIeyui58vTc18JmCATJmQ4HQ5jJo6+IDt2jipqRQEAwcyN3KNlnJqBqLtGuSrc0APMvNaqgtu6rctaREXELExYxG4uGhaz1eImEREhRKkm1cCB///t/WtzJEmOLQgeAKpm7mTko6v73u7pK3Pnw+z+/3+0IyO7VV3V2ZUZESTdzVQVwH6Aq
po5yaxu2RUZ2RUpqyyG0+luD30AB68DYgaD3OAEs2hjiZBtQNRg5kA5JAkESiklEWLKiUR4bqzolUBEpdStFO21mKMrAEAial6btg8UuRTtyJNgjMjoJDK6ew4ehN7vM5bX6JUEt1gQbkZELtZ7mzC6XeqAQ2OiekKoP0iEkVbAY3zZ4AQGbFS9DTU2xPZc8/0CXbVMpTLy5/G7bo2zwPxMt5+P/wqTCQByt1Kjo0bbtru2huEiu+/b2/1Wa/23v/zlz//+5/u2/b/+9Md//+WX1nS/31upT6+v5v789CQp/c//7X+mnC6+SorWe8zE5h50uKq6bVut9bJE4y9JWVK6uPm//o9/Ycbb29vt/vLv//Hnt7e3u+11Uzg0iiSVvuJWpOqqV0qaDNaw3zhJFbzWe7quP9//+Yf9H83tXvbampnWupupem24O1RNVZujk82+3V9qK++GcG7ygUXnSPfZbNFwo7Xb69te9tvr65//7Y+3t9fffvvtj3/60/1+P+SFafBG11pfX19+/PGnP/zhD5frZV3WlDqdJndLaoYxugUdHmcAKWUm+uGHH/71X//15x9/TCl//e3r07r89eu3fd8rmppHswFXczdmbeay8VYqiC6X9e12I8L1ev3y5bn9XEUiMknmvm33vRRV3bZSa5tSKXwJZvby/fu7gIAw5URMfFmeEDBnWWQYOwC22/amb1Hk6tachYXzspAq7dW9OZggY+kTQKZW9sJE232/3e5VtRRVRW/wBja3Wk1VAzSBvDZNtTJTGMpEtKQlS2w6A8yg8WJAIUoiy7IQcXZSi1xuJmJhWtaURjHwsRLct73ct62pVjVE0kNvEklqXmpr7X1DAmHKSXJKAYhokLIMO4i652tsvFhzUTfn0dKX4BrBQHIdhC4nqeTB2GtdKvnJfsOw94jClURM3q9H6CzUIwXEB4XwEEx9Hc4xGCKJpi+Mpvk3x2kYRUOzPpScfoqf/hZWiruYwDW42Jq2WkptdZ7xtt1vt1ut9Xa/3e73bd/3WppG0xpt4YAoJYns0QCsFkncWveeGLG7t9ZqbarRcKkKs2pTE/SsMGehdV2a1mVdljWXllk6ObI7BQhvatW1JW1qQgZyampuZd+32y27lvtW983cW6vhOaq1qqmhKjWHhnEwsMAnDSpwQtF9VOeP/gdXbRFlK2Xft23b7tv9fr/ftvt93+77tpV9r7X2eqpwhJdS9r2Ufd/3fdsA1FpktC0N+deFXnC9wMeutsG+ARHJOeWU4ufoojG+O0Va76yN1tpeKoi2vez7zszrunSLjIiIzKzWWktRtbLvpTZ0vmon7lKpPfIHUfcaxd+JQCySe4uSCHGgiQj3Xrh9/Xcycp85z70nezfyuovAo0+JRue3Y5p8xEqmOh++jU5/Yh4NeztLN83ENRppNlPpD3uSD8/z8EdNaw6z929cwoI5k4j8FJWartIPO4tGq+wudqPZFAEiB1tUt8js2NjT0+NEBiNiIjdiGIjcQtA8eEJsSJaxSB3DZkMXG+T+aT/bdz/dT+84Hsbjv3A8YDUf5tfvQqZ3UilGUgEFbJDwEgCzVtu+79vtdvvll1/u93ttddt3Nb3v29t2b02/vnz7+v17a21rBZmZRFqGA0x7KSB8/fbtT3/+09vt7en5+uMPXyLHjJnN/HbbtnuJYLmqXi+rarmua8Sf3Wzft6J3Q7l8SX/4l5+WV/n19bf0QqYRjaOmdvPSSAFa031Nacm8OrPw/du35i1fFs7srs6smYxJzXbd1cyhoCHgjB09M1grHgsqEEk6e9mHnsPcGbFfLNxY+17L/uuvf317fb3fb7/8+7/fb/e329vtvtVStdloHxY6kfe9AK9m/qc//rHs+9PT036/PV2vo8kHT6nUopPHcMBQKEig7lsru2lj8sua23VdXrMwNUL4pgNcuTlROJLV4fzymrdERNfL5Xq5q2okLXWFYb7dt23bmurb272UYuY6CIOcoGpvt9tD0
QwhMXJvLtTPIyn18r28EFEmEripwQ1urdnL6+u23cx832ttRsTEmYgpC+fMTNr07fUN8Le3t/vt1sxLJW0g4lKqSHHvGU6T/UFV930noDVvzQgE88aNCCJODHNblpQSH66dXqRr7gOjqBrCnDW1Xrwf/rXgjN/2PVQXMSfqorZHyiUxM7E8blxKIr0v+YBISaKMjmSEIyn4NtUi1mgwrYcgJMCYmcBMNnpts3RL38czqIfBj2lChiAe5OAD1jGGXOpCOhSCA9YjWkNq+YA7ZwfGtLRP2nk4NE7/9ezL40a66+m/5u22KZXmPcSE1rrv5f52e/nlP/79+/fvt+3+7eV7bW0r+23f1XQr5V53d1czSkwEaSn8p6UWM/328v0vf/nL29vblx+e79uPKUkcpvbycnt729xdm5rZ0/UC6PVyaa3Wslnwa5EbtfVL/of/9kO60OUvi2QCQQ1wqNm9tQIFaM1pVXmyxCSipN91229pXWTNIFAW+nLFJavbbqX1TN7OaAKwO0xVFaPy4CS23VurpezT4zNaGHqrtdaq2l6/f7/d3vbt/pc///nl+7dt23797eu27bXWbduC/Bcz7AIBUPbaqramf/m3f7u/vX358uzWvnx5zjlfLhdhGV5L3/etlB0zBk7R2ZG11lp3s0aEy5L1sqw5MREDHknYE1oQyAzUu8wHNdplXS6XCzNdn65LziIiScx8u9+3bW+tvb297Vsxtxr7xKHuqnq7bWdWs7BHsnASjgJaIgoXTM55vVyYORNJSI1t2/fNzN5eN7OomCXz6H0CJkncw4Ha6n0vZnq/3bbtroZiqZmAtNY62m3NtFMCrDV1VAAxjwCUNHZizj33Ly+Jhl8cgJrrNIECa8HcnYwAFWMfGWfWcwrCGRqSi4XyMQ6R4RE0WI8bT4TXZVnXZXSFQxKJF5He1PMn4K1pLTCjZt46UWuXvkIa9qQlFmZisDEHPbm7jwz7jnIOQE+gzgo1zDf0IDKfgCMAIncfbdGdMLLShsyZQumwaGdY5R2IPUCRnz86QdN/IpXCZmmt1lZ8NnaCA6i1tlZbP2q02dhLqbUWrRqJ+uhBS+HEgKuhOhk4sjmgpZTb/U5MxC5CUyqp+uvb7X7bzd2aRmvYZZFSdm21lt3doo2yqqo1TiSZ8yLLkhuZV9MQ7XAA6lZUibAIVAFnVqUGZW77Xu8bmiBRLNfNqrp1URQP6+6OsML2rTZ9V31qrWmrdVrS5sG247WW8I2VGmlbJd5p4TDuVPYzAEzdLguFFLkzTfd9v293Fn57ewUs59xq5aBDdHP3fd/LvsMjNRDM1HOatWmrwT9JnbCjl26NfmPTCAytZuYUvvDWWqmNue6llr24e0opuXuw8Wo3xZs2M2/aBZxapNm/o1qMKo1oaRsZhjwqyDjixyKcEjPBkpgmMy3aelfILmwpGOwCLHC4eH1E3bq/aWRPqanqOdhF/TY8WoeQkFGEsXtSZEglJooS4GHrDLtpLntCNOKYwa+52YZ95F0CobtY3m07fGrB0ZF72d1JvZUuJSbmwzwU9vlgh0wwRxSXEQLbeSwiPomLw+aa1z+ibdMZxCPPKKShCPc0jXHnxEYj2QEeHJy/583u4cTpaqXzXz7mSv3N4z1Wum+3v/76i6Thyh4Rpa4ty/769nrb7lvZbtv9+9trKYWEkUQSL5kZmYhyXlLOWnX7fqv3Ukt5e31ttRAh3EPXy/r0fJHRGszdt73VqhH5MlNhvqxZJKCIAlgv+XpdQf52f5ULVk8//+GHf779477V3/799VZ3gitcgZs22m6JWZsky4k5a86a0PTtP36te/HM9cuia2rwO7TB2Yidw/UQTpuQvre32+v3hyzK1trry7evv/3a4y2E0TvMaymlVm3t5fv329tbKfvt9rbtW60V8OiYmlMSZ2Un7hnkZuqOSL0zs19//fX19WVdl5fvv63LklK0uuYekjcv+77vhYBFOInkJD/+8OVyWZkg5EQo+
85MKcmy5MtlIUIzLbVOTOfei9PJIjWMRe756/dlWaL9Y85pXdd1WRy+76XW1lp7u923vZhZ1dbTu7s9W8/jw0yXy/Ljl+fh84WIrMsa1nowpPGSxS9ufl0XVa2t/fLLL7fvm3uHgCJpyRBJDH0jTUxZsCYQPCVZ10XNy25o6ur7dletUdHCwsxIQkScMuVFmEk4MycizjmLJBZaMktiuEMN7vtebm93bUoSueFQ89af0dzUCKQ8+tKF8RDy0ZmQkzjgECcOjNU5uUNV63tvd8xOThI/iWjJKSehXqAXXCzqbo0booSlKjz4xa1pEApQ6CQGSEBMbGHod1vr1NRyiIuuD+MqLMzLkqMsJi8pch1yyhy8LMJwlNaamqre7ttempqWUqPTJ42sq26uUk+6sKlyDw/bkNt4J5l+t73Oe79S2fdv378uawoNFwMUePW+bbXW+3bb615a3cp+u9/2UpbrZV0zCSVKzGDm69PzZb1obcll5+1O9PXrb/f73eEOyzktWdY1Dwcou6Opm/V21aYGGLzBjUeI+On5+sOPTyLCC8tKGfLlx+s//OGn+9t++7pvtDugDgC7qRUVQvL0TLYwESzBTXX79rLvuybebqku3Ag38gZnE9ZETh0le2DDtt3v99tDHZyq3u+319fvRF3RhbvTw2Ndiqq+vr7c3t5qLdu2RW+ocB9HOJmdiRzh49eGFvjLwo+rrUXk+Pv3r0lEhHPOTBShBrfASoVAlyWvKS3L8k//+POX56eU5HpZknCrhRiSJGdZl+RuuUQ1qoF63Wzk9hC5uhMRb5Le7rlUFkkp5Zyv18v1cgkpHFjpvu17KWZWRpfQgFuttfNaI9CS89PlwhxCz1NKl8uSopERGADnFDoeRA7a9/Iff/3rXqqZB9NTEmMSOKrT5k2YsMoiKSLly5KaGheHm5tGlW5KwrwSJVAUoNCSZF0TMy/5ktOFRdZ1zcvCTHnhlNjNrFY3e3u9lW03NSFisAMOZe9pY5HMZGNLBV3VRATh0nGQU2RvQl35BGpG59STVCISZhFJIqkTIaQlp5AXwmTuphRkL8HKwr2wvDcojUBWuEGNycgZhwnb83uHb+xI1+xRtnBjsYhcchLhlNK6Lsyccw4VGBTVDi9Vm2ptzQGiEgEi73RUY8aHDczBV3dqkB7wMVLROmI6Eip/x6X0USo5UFu73W9vt7cuVwdM7gtuWdbaLutV1W/bPgKXneCPCMTgkL45kSNJar17sqtZbW3fd9VmKrDGTIHpEeMbVYiuRAYYkQEu3KkhUiYR5kQphaLD9Xr58uWJiS/X5b4mVa/VAmJG/U0zrdrgLGpqxtE6ozYz0mTqrARnOMHCd+DcK9SC4bC2uld9tODMtOzbdr+FSumZRO7hV4psSVPFoPiYabAzyAOEUQ8/k2HRnAIP8qHofejOsY67VPIe4CMiMzbjQFhm6gZEDSUhiXiyJefLuhBhL3XNSaW3aeheh3499+AwUCWisMrNrIeCECazaosiD7MZpETsOH8HBM7LLR53pOBEKM3iot05GqYEd1P23TnGkkRsy5yTMKWczKyZV1RnBUFEWDgluVzWlEKOMzNJ6gnH67JcL08isl4uy7oSU87EQq6qSUyt1ZZSUjXrez0iiWAQM0mXPDSM7zDZovevm8OMqPN19Fs3t+GZwtGk8bODzjM/Xh7Jo8PncziYu69mxCbRR1iYczDMzW/6ZI86JiNUY0pJhJPIZV2SSEppCam05HVZiTnnnHJ295S1Ns2t1aoA1cq1trPHe7r2+9p2MJH33Cni4ExjDz4bHoWd08TzISvfHY9YyfH69vLHf/vj7f5mqtqC0piZ5HK5/C//y7/+9NPP18umLm+3TZ3/+OdfVHcmWZeLJGluChWRp+v1y/OXlpu9NaooqTS1rdSmtZY7M1bhNbMQyZJSTsQk6SIpE4HFWJzFc4YwUpIliunX9XpdWDjlJEtyc3b++YcfX19u5V5Atm/1t99emxZzM
gcDN8g3tEzkBGFmZXLnWpVRNpQEY2pZTJgpG4NI9vt2u91VLZxCpZRy388br5Ty619/+cuf/yjMKece/WAGoD1GbNqKmcItbHWHC3Nsf/HozEdsAHdKxsjPJe6pcYZuHgUc64R5kUMA16balIlUyBhm0FZaE6bkJiTIQs9Pi6po+2Ja9lKWnFLi2vT7681vMDNvFr6wCCnV1u7bLtIQxI9JLpfL5bLS4F1Ws73U1pq5qx15gVGC+04udcc8QTgSAyQcKGF+hBSXYGxgOEGEQN2dBOKQBl3Bdv8IrUv66cfnnFPOOS2Lmf/2Wl/vFaCUIswnl8uSkhBT5CK2VkrdmOgff/75H//pn3NKT89fLtcLCMQGuGor95u19mtO97c7E9Vme22Rm8zsDqwpUfiwp382EnaShHyqtZWq5i5EHgUiULXms4xZ27uIyZHKcDh/pg/IR1f24Sf2+YfuywsLLmQkkyfmJcmS5cvzJWehwT46sNrY9wThHuqLpFYRuVyWaN6xLCsL52Vd1gsL5+WyrKsD4VWspV4vv73dbtu2AbRtu1qP6gp3j1h4Y+JqzBRuOjMTdwJFzvvsADrWHXzQUf1NqQTf9v3rt68Oa3ttpRIop5wk/fDDj/I/5PnpmTjd9iZp/e3bNyI2A8BJsojAGwARWVK+rGsFL3nR1JhFe2WZt9KI0BiaiInymvOamWW5du8dJyeGCJaVU6KU+LKmyMRZ1sTMackpJ3ewy/PFc84//Pj09voGcvpu5mHGwUDFbKvamNfWrqrsznBraoxWTcVV2NfkIsbgnJ3Q9rq9baq675GVVVt94FdSbbe315dvXyXJsuQgpRZORDRH3LRhEjszcWSW2FBWEXClk172EViljkyN0JqFGlLVQBnuCu8F9qCojGI3M2umzSSwkjFjyckTP13XH75cLzXV2vZSS23bXpKwEtEAgCGY1Ky0xma8dWzf1GrTmR1n7rW2qBbSAx+5uZsdPtZDKIUW7Mr58J+6KTrf9YD+wWkCeK+emCndA0e4k3sSvlzXdcnX6/VyvZqDl7LcIswv4alZL0vskDjh/f4Gr0T0/HT9w88/5bx8+eGH69MT4IZmrtrqniVCy8u6tNbMG2pHv3F3KQkLD1EyLDKAiERSvN/UhtLvTSo6Uu5FOp9xTgzxBJ+E9t7D8T2SdQ5dncVZH3ALQiAHEyWmnOSy5HVJ4TAi6nmPQyoxEST1RJxlWSSFVFpFRA6pdFkuFxZZLtdlvQII6F9KabUFInt9u6kaq0aeCffcgo4mAYQHvgfwCGT9VulIqnCjzk7m7h9F0nup5IBq2/d92+51q3UvRHRdr7RQBLMjitxqK6Xue9m2fd/2iAqJSvPWTEVkX293Fi2tbbvWaq3FoIvQmi/CuCR+ziLcpRIRc1pIEjNycklImZ7W6MEhSZgJQr3VKjs40tolSfbLZf3xxx/2raaUv3+/taZuHh0qzFHNHVZViyq7JyAJmwULqQsTcXIRSVmWhUhK2seqUu9G06MFpxZhsiRipsycJOXkHBKI2E82zaHzwsts49Ce7eLdaxxmMEVtZdg8IwWSpOMGC2su5B0T5WXJOUlOUSMavsNA7MzsTnlZrk9PqbYv1ar5XtretEbBvbt565bc0Npxg9G/TGrPe4xl573Iq4vdT/Nx5xIKjhFhjubXZgaQiMAMIZWAXq/q7M7hPY12SRhk4ylJTimxZzFhLEu6XJZ1yeualyWZ+brkpgQaWEl4XVJIJepst6lKAsAga2aspuZqxODoKwDXJHDLOV2WxZqCRI3MrFlrpgRI6jR8Qw53LNtpFQim1pjNHcRgMfMmLMqAh7jNOX3YeH2s3SgcdKZkTEQwYswM0IPnc4w24fh12EKRgbHk/HS9XC6ZObINaMgvBAt6jHCg1pRzvM5LFu7h0h4kjf+LSEqIRcnm7jnnvOTcWtjI7sbEztbjdxHtDb5Cd+4hzWjc5+4wdrOesOQ++Okc5lNpPcTo3ltw275//
fq1adnve7nvQvLTjz/5k1/WKxGntID2233//v31+7fXb799+/r9G+BLSilJs6bWmJlKrd/fTH1/rXVvdSvmDsKyrj//+LRk+bLmny5LEl4uS16zO/aitSozLldKGcsiX35MeRGz4Mh3IYiDHeLBeMrLkmiVLPl//Z//46effv7rX3+73TcilL1sb5s2q043eDJKtTLtwnxdFiA5gcjZwUIprbzmtFzy0xewtLJ/hcGatap1t9re8Wq3Vr9///7rX/+ac/gIZV3Wy+XKzCnnlJYui7pXIKrYo0G5qVqpLXLko5p/ZAyACGEGMguhkxzSoJ0coeHuqArPxppTFg4YGSRg5q7mxCQ5A/TMslwuanZ9/vLDTz/tpUjOklKp1ekVtJt7bZ010dzJrDbFVpg5ariIOUnQv2Gouu4vD3+HDUvkkNpmt/v927fv4adPIsyyLJWZE9HSO7QNecjszK02Ysrr4tp5wJPI9Xq5LJlJMzcmfPly/cPPP6zrknNKKZmDJK9r8D12aqVlSTycWAAS1GsBIA4thd11LZqyJF6XnBbRxrCqws9P159+/GFZlvtWU9rVrNRSWwGhE7B0Jwl8YMWw2wFwp690kkyS3J1cGUagcN/cd5UkD5vMIuFWGU7OHESZ0S3XTuZXz42yE3ajKR99GP7rkp+v6/Pz5Z/+8afn56sIR1zvMOGGV4yFI9WyJ1yigxwQB1l7SB4WWZZ1XVYQhepMKT0/PwUAvCxLa1V6vxfKWdZFYpWycA9JD2MzHBo1cWTtt1E2MapY3B2tiXwgPX2fGaCqe9nTJvt92++bsDxdnnRV65xtjEhvKbXXR2z7vpeyF1NRq2qNiXdmVndD3U3rCI4SifC6LuuSny7Ll+c1CS/rulwWMydssMqMJVFOWLJc1yUv3JoWq2bgaEvv4E62HPSjCSu+/PDMnGptl8u6rNl6Aw0ovLm7U1Urqsl9iXgZhz/cGZQ54vV5WTJYoti9wxtT+5BGaWZRR6Ka4B6GekojZCndm3u4RMYEhHgaUMlGMt5EVn07dWXPPaGOh92OUUFKo+woi0QwhTtTFcWFJD7ClHmRlHucmnnZy9PT6+XtRkw5JZFGZhpNCoYPZyYHUu+VzQ6kI4SD6RM4k54/2G9RyLIXEYbDxEQMADNDOEmczADzGUpRA0hYesc1GEXsPAuDhFwYS07rZbms4RBhdzSLbrPd281MKfGJXhg1SU7iBgZc1Yhjo8ApAjLklkRgmnNalsXMzag2V4106DAORuY0mIndTKkXlwTrmogkpngAEnH3cTu05CQiywesdMp36hWEZmRK4NGke4QFJo7uBz2eBAGlOSdZcr5e16frRRIvOQ2pFMYmUzT+jLwJCj8+Ha3IIkrVicmlJ5ZJIiKKTqHmKaXQB5JYmE1YKJLh41tdNwDkZJ1ojozIKciFyZTcgYBRw+3k5v4pK957qeRmLRImI9YDAoGFiSkYb0sp23a/3W+1FhHJOQsR1JwANag5Wbvt266mtt9qLXbbb1YKTK/r+i///b8/P1+viZ8zM1C03rdNVd9e7rfXTYR0p5wpL+w15YUBitwLoxp+jpa0pMrMOTdJixsu+ZK+rK3YP//zvyz58vXr97K13TYErSFQ1LbahFkkEYsb1F0ZrTYvVQhZhLRFSXjwnaUsi2XirhJPu85VtbYK8iosLhE6d7iasCqA2lrk+Ny3LVK6b7d75FLW1mw4xQHYyMQb5hpCCjFzGCZECErUU6jZFU5ANTOl2CpJOCVprUaweVnyTC0GQIyUkpktS17XxYGUUy/iZwvyupCjFk0ZibgZkXKnNz8FWUZOXMhQf4gfzhUUdRrBMIOAgszMkPBsd6nmbgYlN7ec0/Xp2pqabq252+gAKbzkJTHWy7quS3QcECZzrBYIgsLCZ+ac5YyVrC51u5i5MFtTBdVSSkpmIhlANmtwi3r9YbhYSonIms64YLdW42Ng5qg9Hc8sRInFyIkpwheJSSMpkUkIH3Yce
kqFmRM5wQ3hKoSTjUTwXv/WveK9wcks8Y/QXExMSrLktCx5WdZ1XUU4JTm7u8eI9NxNjBhjh30IdBM0pEJS2ERS5pTD+nKH1mLaXNXNOrIKx4rRTG7gLpXgzuwBQsi5W5FmzNYhefgi5xgMpfu3pJJra7XsdeNaauQpgElyYuGmbd/323b79vL967fftm3r4VgWb+pm3hppc/ftbd/UtOnr633favFWdSPXn758+b//3/73P/zDz6SVtZi2P//7X/769ddS6vdfXl5/uwvj6SI5U8r0+kSSaF0uz89fRJKZmVeEUmIi5sv1eV0ukpcffvh5WZ+e1mdr8v317Y//zz99+/rWmnm1pkru92rWijCDxIic0BTGLkC530XbCqLLKtnMlYUly4pFhGut3/PDEJl7KSUKAIFwtfKSs1j4tNnct72UUkup319eb7dbqe3t7a3W9kkt60gcSDklETiJ8JIjyyZJMNU6AD/a4Vnnt2rolmLEMER4XXISzjlfL4uILEu+Xta4q3VdiOnp6frl+VkkrS/3LTcirTqj2KF+zWI9Reo3swPJwURRyzbyHEY6CttwChxHpICYsQMiFvYgM7Nnz4lIHE6965o1wAzruv7441JK2bequpsbEYSRl/TlKeXMX748PT9f1yUzORPMIYKlAUBKTMw9i3IgTTjEnRpUzcGt7NbangTuktmptZaIIGzCSIlzTmqmhqZQtao7lV70DYDAIX2A3oDWR5ZaZrGUzd058nBhickFnQAAH9vBeS9INAMZzImUwGCPfK7YpN31otSNO2eGOM0t3IefeVny5bI+XS/Pz0/PX74wRRIpRc7CWSrF/7o4CP+ktahMiHqk6I/HIkDvDxigv9XaStFa3RozkjBB3JO7LYssMewctuew9Id94OasYcGZqHkUrQ4yg3AU8GNnqo9SKcDA9Mp2GzGWqZo1bS3wUimqLQAkUTwi9euYW60eRfP3bd9KI3NSkCeRp6enL1++eN29kDYGIc63b6VsOxPExRtrBZwkAcprUiQ2gwahskRNOgtnhgDM4JzyuqxPz8/mfLleJSViieYYDqh7czismVVzEFp4fNSoqTElUzMjU4eHDc7iAjG3967KDrzVlMwUFIrOiCjedYeq9sKcWkvwv5RaanUbXeeHCp3xCzH2UUbfy0WYWXgiJBy+865YZ3peZIFE8oEIqxlH+R/Topm5Q/1o9hYuTeYJzjr4Gc7crsLNWMm4Z/abIVIbPHgIR9YOIqXhYXjOJ+lSDmwW0cOh+b2XSw04wsw5k6lh1BLE2Zh6GnROkXPIBDA5jwAXEfUaWI4yl/lUGGwhpoqmbrCgcgBxq5XYmYkyZKT9cAcTbO7D/TrTayJaONQIhpc6cqyj7iNEUqCqSN3rvLqfJQv6QEE+1xSCbhwezPbTexRTPFASQrJMDIve3yUKF7s7ewQ/ZkbTkUo5DELHaLA0wr7uFKT1iHKrNrGwqnpv/TKI+hjM5N7zFM8xOB+pLnCQk8Glt3EB+3zuYD+2I1L76Af4YMFFQVYvfmogv2237y/fm+qf/vTHbdv+49ff/vSnP/71r7++3W5120L735sR0Lat7hvMoQo1Vdu2vdZmAizETGXb/vrLf2gtVjYrd23tl1/+47ffvtbS3l7v93thgjVKQpJwqSKJyk6tioho89oMDkksmYnoNd8lZUn5t99uy3rda3t53fba9q2klJf10lCrAeZmaO4G2sy9Kggq4WlUrU0A7CXtm2hSs7ykEAdmXlJJOfVAwhTaM9u1cLRHTSmxSFVNtZr5y+vtft9LKb/+9tvr2601vd+3QEkjWNvTz6ZZfhr83NfoCIqpqpuXFvmNQUzX4G6m3nkbuy2TkzBTTulyWYT5clmfr5cuiVia6reX29tt2/ayl26iN42eLujxfaJRtmkYtRdi6Flx0V6DZl4ogf0d/I4dEHXoZt4xGLtzQHczOvJ/ySd/kLnCtGkIcuFWS8vMJE/X9XLJ1+uSEiUhY
QoWFEm82PAiEYggEnfVLThJsq4pqZfSvXe1Nd12wF9ub86ekzw/rynJ29v9dttLqfetvt324Ju3KKEMHm8iibxJgJkJ5ASNdtvBQ2AIc4wRXkZCD5bG25/KpJDMRMPN5IOsYGgsD9nGBmZKzHCIEDPBSZiFKYvkJS9rzjmlUePbuZmCBRiHPBt+wW4+Uw/PWcRJzNybNi+R7tNaOLbc3Vurr6+v+7btpbTeawsRBIjpiCjfgZVCCFnv4dvXCIVQoqgM9+Fl+i/5lcwtmJGa1qrFXF7fXtz97fZm5v/+yy+/ff36f/4f/49fv37zyLF1L4D6Heb3l9ft5dXdONK0Hc3U3JGFZBWW/Xb7y7/928u3r1a3tt9V6y+//vofv/21FSvfW301AjZ2Jk+ZL5ukzCm11xdl4lrbvle4r2ta1wTAEMzWQnklycRCaSWW+31Lebk8Pe+0twZXM3g1Y+DWvHgDwYXAYGjem5irMN9uKSU1XdbFEYWdtG17XvLj+HhtrbMjuTH3PjjMQlyYRdW+fvv++nrb9/LXX7++vd1UrdQaydMYyiF8RqHlop4AQHJTXSx6+7iTe4TtzGzby+0e6Z2l7MW8s+7CPZIMIgkozrksmZmv6/L0dBHmZVlyXtTs28vb623bS73vpdQW/J9DKp1zjKgT+buLuQY7P6h3jOTDzxSVwO/XVHevRgTHRGDiTD32RHARBEUZWZSvw01NTTstxVYYZd/XREyXH75cn58uz9d1yZSEcko5JRAZkkPcwzdnM25F1BOgcmZcF1UHgk7TS62ttqbt7fa6l+1yWf/whx/Xdd22/fVtq7Xdbvvr201V1Yt6YwrvRTjdwfBODsnsTkEh4GatsXXnPcCUJYGymZVaW9P3xsmwcXqGhbujF/rDooH4MLsAANHQPNgFACTmJARHFk7MS07rki+XdV2XlLOkRBTtMh1Og9h7oKweqHAmH94+pdlBxsy0KpqDSily3wBYMBO29vp22/e9qbZao2F6EgYhpYlPB0bt1SUgdMqn2DWd08qh1OmpgvlS3hsjn0klevgHHty1rTHxtt2J6Ha7bdt93zbq0BKRrQxzrbXV6ubSKV0iSohAyUQERwvSyVK1lDB0eh2DBapzVTNyEFQF7IARGjHX0speQxDHAtC4CrFXAxeWlBaQpNYaOlkpgxgEJwMoKFrIHExDU/VuAt7b8RpGxDdEhyShj70aDzPHgOCvtFhcQT9Uo9lLJIfXGjUNajbnrns+jrmkXuIbC/10WC998oCvMRe1NTMPe6Svp7G9Cd7EzJ17ngGFWyf+K3VUxRzW+RyJabD0ZxwG44CJx83S8IcB55KJsYK61KWuNmkEDR8x1dmyiWZKw2xB+GM7kAgy2R6RpJ4zEc5fhzicdDIlGo38y6EpHDSiPA4zb+6t6b6X+74D2LYKUNlbqa1VjTCFmTkZ5nlontW7lwaH3KDDosX8w6B+xqNdcl5Dv5/x9X6QehSNwvNEw4actBCdkCHsqKj3GLfhw/oM2ypCrSAiIx6A9chxhYWGc/JOid97djZttdRWWxt86TRqiB5WRBd9I/Womxj9DoBBM059ZZwE2X/i7QaLLOuyXpbo8QKQw0otqkqO28vr9+8vr799vX1/mTcjgIDgrlWDF7k3rOj+ExdOl8tVruvz09N1vVyWSzMrtZLz0+W5/YhW7eZ1o+ZRrqFKwiYri1SgKUG9VivN4d5Ut63QIIV3sHJxYic2enXQXtt92zX0I7Ez4N3I1oGnQ1KLU2aBJE45L2ueju0xSmYm8phsEmLCDQZqYPYqnZzfnRzUWnt5ffv+8lpKvd3u9/vm7kF5PdJgA0jyXLbiXLWxMhGqalIzgBqpcW1t23dVu2/77b6rWtnLXoq7jzLm7oghIPQSNytVibDt9XbfmUlSSimZ+X0r+15a09tt2/dibhESxMiGmiCfh3gcCzxyFFI4FGIXMpNZR4unjUTLsjxfn5l7HyFhXnMW4SVxXoMqw0d/G
GcCyJP4ktyz/HBdUZ+erst1WdacrpGM87Re17QkTomXxEtKIFJKhuRwE/PeSMbcjAajNrGxkJrvVf3uBtua3aqVUn97ud9utyXXvWLJuZR2v23arJR92zfAL1e5XjMzLVly2CrqcCX3wRyAGR2TKKgNyU5hFtHEBhHmei9raLqKumSIEE43iAaBd2xqd5iyJVGylrlVBrAkySLrki7rcrksPZMrp/C79Qt5d/xRl0oIjKZmbE5izhAzB6RUd9fWbvcSiUWRwV9rV2G1RmNHkCCcWSKJmYSHXH7YIuihvWEDus+3uw05BfNHtfaJVJIulVYDJiwutZBTvW3s9PLy+vL16+3lFd1ioMScImppHllycIUdmjexPF2flufr8/X5sl4ueS1NTQqBr5cvJEtrBt3Md22qGzUvxMlkdUlq2pq6W63eqrsbaTjDQ22xA41YQWq+tZ7QBhaAmrqDnci5t//rsabBaJcBJyFOnJa0rHnJ0ysRg6ex6x6PoVIAgM24p/l2SNKahlSqtb293bdtAwamJQq8y+Ys3f4O6yk1FW4gNNVqKohoupVS73tR1VuXShrRvXD/DbnRfw6s0d+dipBH0nnv+mC279FMYJLrDn1F3X99uDq6uqUocqdZQdINxu7ZPUulNa9P1ydhTtKJ2ZeUmEgSRb5nYEp3J4bACZ6FXAiZf3haxfyy5uuS15SuS366rl+e1uuaF+EkFDVfIG6UlBJCKMOjH6YOqcTMnkwWNvO3W42mTFttL1vb9/Lb9+315ZaSvN00p1Rr27c9dp9qIUJenpZ8kbhcYvcgJw1dOxI1AhdEiSV1Z+BpWToGBP+Ii87yiIaXvScoRPRDwITu/3F3YU+iRDVxTQzQmmVJ6bKkde0WXF66BceHp7xP3Qnvu7uTBiw34u5R4rSzu6ret3ttdt/2+1ZMba+11hZLDPCU+fq05MTiSQSRlclHwKMLn26eDaA98PgIhfTPHoPxQSi9l0oUGToceWYq7g4FLHI53dVNNZosU69aOrn1+xruW2Tm/XXk6HAzrdqkaQSkR4OJKTc96ALC2nKwe6RARVqbAe7EPnpyhukDNJg61Kw1VfNIGRtRLvSoxaEuzhGOjhF67dbo9wSCux03/8kxFARNlDFtLhts2rP8FcNnM5ZGX9BThfTEmAfDzR3e295Og2v+19VPP9tJLJxMMXePTprDvejhRbLjOu/3i+N8pmNR9Aeem2nox2HcvFtDxCNbimPT8mF/0WNzsInGwvGfU14WWyJhr1dAHOxo02rwbkTC4Z1UqGcpE41+aiDiYP/umNRVtdQWDP/NDEqtKRy1ahgnEe5nRmczIB4Gig9533feTLp52GUd2+A0k/4h+32sn7mODmvoMGuGfdxjWZEt5dyp2tDTl2awNm41evhOmoG+NIMKd6x6ApzY2dkcvSR6qBl3b81aa6W0fa9Rkl1bi9sNiBfBOkycMxcd9T1/9gm4+yGbbA7H8WJsvPej84kFly/r8nRBTrIubu5FvZo1rdu9bZVKe+LEyxoMCuiJD+6ATWTe/ZmRhA2Q7HutfRZ4yYnh4p1w6172qrZtZWtV1Yp5daiabYUrD33ubkDw87iLACPxwdy3WquaOaq7OThRmlZFXJ87hhsyxCO524DWFIRc8l6qAymlvPR8fLiNeq2HLRdBWCYeDH7C3NtNdJ7A6Y2Jmxho4nFv9aXsR+Y3zKHmqm5uDmWmUnWv2lorTZtG3gWO9Xt6xJD6ANzMwoQe2XFuBoW7a0QfzKKRdd9pHcbN2500+H1V98cedlzX5gQKWoMPQ+Shj4hZIsORetGsEAuI4Orm6qFvzN2RJDGlnJZEi/5oSfjpkrLw9XqRlCNrLwApomM14NBjSwMEWGYRZ2ZJNEpEmeFpMM68vr39x68vterrfdurqoK8BotnMA4S0HkMSEAStlgYxj3jETBtrqTmVXVQlQDAYMqFmzpBTVtrIe3eySXCCR/xFC5BUBep/BAe0j6ybYVTY
jJEyjtAOaf4L+UkOaclc06cwoJDhwid3I8PPxfB3UnV3cgdrOYmTVkSq1e119t9L/Xr99u37zc1i0AtEeXEwrSuKS1E5Mxk5syRPd6lVE8jeKw4cSCSYXxYGEOtoivaD2Smn0olTkvO60IpiZmbK1ejqk4hPNH00h3LIZWoqpbaAqqGKwoSUZwBPIhLqdELxtSSyDXn5yUDVLYaJHeltNLUzKp5A1S9ejvQBYgQGWYgEmYgisjcmtpWWqnNQd3bSebi3auB6Y475MDYPeaEsJZrbbUowMSSexVwj4d/RJjMocLnZpNwtRzMYN4j+/Py0x9Iw1WMvuH9pFXcBu0sgR1GRrVpaa1FVW2PCYzO76NIe3gNvV+W2TW4mbpRYaMhSPdydwlI6IHp7pEK6eQdW/bBGoPfJ7NLpiER2abIPW+77jWJdGke5VYsvQBrrs4AlQCikheg6/IEZ2HPAias65pkiKSorZlZGtQrgXpYA0iJzZwlSggBkDsRLFw25H6/b1+/fWvNSlFVNwJ7U3aznkbIBIkkCHCPZR1tgijM/yBuaU332swDvnTd3Dsd9QTR6FhnYWA+js+DBTfEU5SpjYT+7q9xEMPdmEUYREkkiYAQVJYpSUopYtUsiSUd66s7dqdUGnvAnZhDczkTuUtpLEJsTe12L/dt//py++vX1+C9VDNhuiwpJzH4c12SUEoSpSN9rXflCqDzi7sjlqsPGRRyCidC8Qn/P4KlD1mUNOAa02jdCwYFuTTcGYiGFQCDBCAdLEHUaZ0Gvu9mCeAwdZC1pnWvJsrqSZ2AfS+1VDWHI4koMYtNCm3vvnoep4sKmx5m8Ij+DbjxsIuImNjIoqptGk9TypFPzryRlKFGqtJMmxJzuJ5OdWqPp+bz/pwGhhM793RFGnowpNLoxDpg0zD6yN19JIxEHmZTI3MWJ1DrrGshTUY0eUzUMWWnY9xvoHh6uP8JiIiIwoicCGkYrPN/84TokPzsTfHJwPF+AU0/gru5cZ8Xwqhij7zTYT/SxH3M05a2kTpqXeXGw2OEBcfa6JYcIoYxF9zRpMN6rmkMvKnW2lRN1Zs6GG0Kksgt4pHi2aPKMHOjQ8MM5YE2yBVmzKuHpyIccg5dfhifx9mguS6Ooe+vHz9L1PsAMFGYDd2CxtS144qPX3443QgZxswTAzZUJhwInuYZ8FUzNYeTmk+CwVByNsRSDLYNPayjg/DQgJhSyYZld5JKCKH9bhV9lEoEIRfq0JQQtVgOYoeoi9OSVnBgWg6Lcq8N5Ai6XxCxgBjmulVv5mpWmjeqe9tvhQkL8RsLAfda7rWQyPLDDz98+aJmfLuXWlUtcoKYOchVgzUeDiMySu6u5A2mTtW86SAQBJAgLCIJZA9l7QOyOIzM3Q/i0Vr1fu+8ZmYe1U7E2Mt7LkoiSimlfFBGpJRzXkDkaAGv8pLzshC3XBc7yQic9vBYR6FqrDUFoGYse1OLdUdAqW3bdlVtTbvJMPDug6dqQGjv7vOBg0LbkztZR1hsiO3cczcfWgYedtzYKOHa71SYasxkxmG6geijSIpnUjM0FGpmNmAlq1o1RbSP0eYOZuFg8iYhYjcvtWlTJqiACVupe6lR5a9GYIK6z76SMBq956IBM1xjSInIzCyi/LAsLEy17q+vL2relNVJiFtv9XjoUSZyp6ao1UzJxRp738ggc9/V1KyU+rbtqhoeHgSO6qrR0IfYe+LzJ6KpD/IAkj2qPzH9cIUNvT7glQjnSBQSTomCzWG00Yv8cMYk94yEyTOYDVsrdKnDid2JB4+3mm2l3Pdy28rbVnQoD2EiIYdI5b0qC7NobRapBrEGdbLXt87rHkVoY1me3J04fnWgNtVHWg58ipWcyU/UZN1xSGB3dicgpxzJrEbswN4aBVYSppRARJLAAjUt6m5maNWc0dyLGQHFUZzIsWvbtEpO65cfL5dLU61NzUHQWloXiywU9QumQFw3KpTIQOqkjmh9NUyZAYlHGLELJ
kJ3FICNgtwlZolinfHooBNfJkawLz6ODwUjDY8ItKQkSWIDBzqVlFISB1KSppFY0OuabCh6THDnbkYatehAqdWGBxiDykoPmoGubd65mKfT8Jj78BzRqAufq526G6lfY6xYP+2cvuVD7gzoYqMsIm4iysM/EUnoHnqiaDDjDo+YmJmZ1QEKg0hgJuEJITomWFMNhMeMKBOPhW4epFhwNWKKpTis8+7z6SHW+IuZaTNzchcmJmhr+7Y1gyIZRGDEEIpK2kQEi055TmYIngsP7iMmERGCAs28qRXVrVTVqQwnq+3wQRGy8JQ0nwglGr6FjpWGeX98fMxMvwAROROxEKEneXdy6cD13SyBd3/CcFY8BCRGtk4HX4Cjg3oih1fV0tre2l6b9n6hMKGswkxNralFSUBTG8YGAA9gZea1taYhlbpQO1mw3eN1iCfQwbd8Oj7kdgf5S/jpmsGc1cgciC6DmRSo7nBVK9bUfS+ltqbuSNINYmYSMYeDosND1B7AnXpvHbAR3FtHe9H6qqqZtvF87m5OQkQkzE5MPRbCodGcOOZ/zs9w4kzxfCBbg1H38xD88DeKCHX+eRkR9MDf4d48MvtOy2lGPrrlNpfQ8dm+yohHn1Yaf/VDTHq8T+RBqsfsoeSHIY3WaQbCuOvyZipBn5KgT/Y491RNPv9O4fwc7U1ONz0MifGAgRtG5uOIKVkv4gOzYRrRw1o7Do/UIXV3IeLe1shUESo9DEBmCa+Jmg3DxU2tWWdYN3IYquq2F2Ksi9z3NbUAH2CmjJwoOQcjNLsFqZxjFHn0/rqdWgAEhMhr6lvTZpSYXZbMwsw5ZCM4sfSCzpBKpkRKRMlcmZtZ1dbUqmoz1VCgB0oPwW/d1IKxU/vQ4wQYgj6QL7sZx3rnORaheLqTyodZ5NOjMHJrrdZa9kIs+30jEAsnkfD2wwfKm7JvSLqzGguioelDONW/Dm3n1C/nNgSTqVoXZUAs1CiVCx9o4GU9eH2OxTVt22Af/czZ/Rm/0rYVyUmbaVU4coUo4LRcrguy1lZeNm3tXur3t1tt7dbqay1GtOScJREzpUSSAGpEtduQFFQn1hrMxVDVAVd3hbHbdt/xejPzLdqnmnnrUD1zFhE3b40BJxGKslVRM3UBpyxj9wBwoqbhqprZSeHcjBIqCrkShDNLWphZcs7LMhr5drgR7s33Ju9oUBG5E+FcAg3jvsszYhE2jxwf9whDuANuPVSqQew49EbTTkfLUsJvELdgPgm2h2NgaNXH2cb0gvnIKjjD5uE24kgR6At/vH9yKfV3ZIhdDNqm1pSoMbP3okwykXiQR6HkpdbbtkVRHgvDvNTGRAY1a4DnnJd1IUJrXqpiVOGZWW1NVcM/yYTbffvr12/rTVorcE9JhBEG4Zcfnq9OLEyOJNAGLdaaEcMURGTaAivBPBEJkda23be96Ndbve1tTfmn63NUalwWE2ZfkhA7qFar1YjcvZpXIkSGgprttar5Xuq9tEFEzWOII+5sTAaAqzL5tu/vLJQwigMSErzHhyOh1NmYADB1T3JIVVXTph5a3B1A7TnC9PLySvD1vhGwXi4iEq2PpzOJqfcIm2qmBys67qJo76it1dZK1VJ7daTOsnBYUyMmqbaXCjgRX0o1s15e4h6QNrDSkEoRyjglm2Ouu7HDiCL6+W6bfYKVelfCqtqMHKy9TjClTKuQU6FijqZ63/ZS62ZarRlRcu+5JSxgDq1qAQJDxYc2C1Hc/Nj1ZLWqlGruWnXm54QRMpDJsM+pd+cDc+QmQZhdOlgEgFFDgkDWB4jgkfMe8xTRtJEX00vODwvIzxv/2P+j+n5WUhANSDZMxQ6TumY3D+/wNKwnxAgZAsCNNIyRptO8wkDnw4kU3F2R1kkDcPU59oeji7sptcKzPJ/hvfN/YqfDoOCe/DOswoigugePlzsirnVQGowVjGZWa6OIF7h7OB1C7LgBnoAYarQa5+xu0aNduKsBTK21bdtUZV3S7
brmlIQ6kcByWRc1OJm4EcwQZhd3b3dHdx7U+xhYqbVS2+2+vW21pbZyhsGTJxIXEWFzJ/M4FZGrqXkDwM5EpObRIq2qVosC+w5cgXC3gWHRN8eggH3ASsd6dPMA8GrGSs5gRdDp+eBwD9aaaFccUcs4m5nDramWUrdtB3y7391UUsotE83MraGCT6uVR7KTJCfmGUzpgKgTf0wHJqiHDXo3OgmS5abdMQl3IOpmbYin0MR2dol1FzXG2uzWa4ezj8dHJhNAGcojbREODnnY4AAq8Q6qRBtodxTH7qgGJ6/NuDQSZgPErLbeLaijtZmq4NSZ8T0UjBEVVZTi3mcdA01Eh0WJkEfsTu/Vfd12I0qWqRNme9jJYUgSdfoJDsslAC4PkREwp3+y2yMDLPjw937iFfDebgtRfdahiaO2WkuNzrotukNYNL8+llT/t9tjc5F5zD2IomfsEIA41nMUV3m4rglnmXOausMZQbMO7XgXkXDo5IOY61EqnTwdPHOrwoPUpy+WUVwiWBnf4W93r7Vu+2aWliUFyCd0rm5JCH5LVQOFnyJSzGOb9aQtxLXMS2tvd0uVc5LruqYkpuqqzLLt9fX1Hi0wU0q11peXl1pLVzlElzU9XTIzaRM4w12YckrNokeAEXNTLahwFKqixkw1J3dvTVtTIm+magoEMyXMEWXZVa0n5hzmG+IT5gpXAhI7E/zDlrPogtK70DoZhQBiIjcTJhz52R7+opmUqwMrxeKrTe/3HfBSm4OXJbNwSvnARUDXoKf2aCkJC0UVBwtvWyl7hHrqyVLs10f3u4Rxx6oeFlxVQ/eGBFay2kIqWUQ2B8SfAehOgzMHJAJ4/yW/EozQGI3RgBYJdWJgJ4uGaYXklbiAXx0v7sW8qBd1J/heLW2BlZhZ1Upr9YTY1Cx8JCMy5sHkQYCWsgUXUk+6GuijVmwbi4yRouE2AZglZ45eq4GlQ5nTWChRnxsec49/+nyNPBomSeBRZu7hC/Qh3vljiuDYe5GF2Q3zCPDft33bS2tt2/d931Wt1dq0ucViglknC45gP3q/EjscgMAJ0QTi7RKTWVy6Oz9kZwjm+Y0Bic922XBsUv9kH7jz5SZq6lKJBlSi4MCkUeBvDjI4O5mZdyoKfEiecPf7tn17oeiX1TlZtLnbelm+fLmSiDvVpnCUUve9dqnUZ3e6q4zc2162vTJ5iyZgIve32/22MeHp6el6WUVkXS85523bfv31123b58z/y7/8w//2v/73dclkmW0BPOd0vazOvGyajchRam2lttSsWWJxNxHWJHtJW0lEXrU2LQ7rhanUU4lUrWokOgzvm3dzQGs1rUy4LpKFDyN67jCzqiYtCl+JAI2EodGlEhhSCT7P2x2lk8WUAEBdf/vurzcR4a/fXoSj8VQnWIqZnZnxSVKU8l7WFER3z89POadS222rrdl922f7+RPqRrgRlFDVSlMQiei+N9OepePue2mRtNh6DK6H/wmniNlk7JmrBdT+K1mUEeKCdZ9dPJijW3IGakQNqEADVUd1b/Dg5VZzbUrsxG7MgQYt0GhU6Y97nX7oaZO5Gzd1+HmR04hMDyjZH2lGqcKrF2ln7h527vn7OJKu+jeGjd3ZsQIyxWnPoGiItkdNeMYnXXJOxgHXwYEwaBB0Qu7p8DGfpfoDNM2c/L6r5+WHnOCwlSx6nMQSHW2bZhhsgmk6bpNmWlTf7A/hHR/O2SGSxv94iiWApnD08cRxHyGIx92cxsc7awIRghDH3aInWlKJyzkws36HBRe6f/geuk/UzLRpJdi+l71UYb3d9teXNyJqzfa9Csvl0nLO9/v919++b/eoOnRmen5eS23MnCDkFutkGuvBs6vV3NFUlRUe9A9KFLk2BsIILVnV1qJ5pyQQjZwd0CigGVIake8jTGbi/AlW8pFyGRNIfXTJArAbMPOz+4KYKvrkKu4D76U2VRVmbdprT47KzRNWot7dQJi15Zx4WXISdkulWeu+p
BlmwvRe+PBmxDq1kZGvZhw50xRT2YuZdPAjz9DbKPw5LbzTAvUPSab4hMkktizYOixBdH4ytVKb1lZq21WLWXUzos7SGyEHd1Uj6wX8cwv226Eg282nge6d80Cd5diB0bqoY4RYQyPEFg85+KWsc9lhWIXD7TucKt2yHttvIg+iqCmkk0oZ3+MhP4yZ/RN3d0Ce0U+t/+rmtu0lcotKqbVWi2k+mefdHiR0ZjWEsR85qDRdUvHZfqPcvQLBIUmR+cNChEhg6HcRtLbel+swSI99MJZyXw/DVYVHaNalYI8HTJ8E00NKTcefc9+8Pxw9/7C0JrVGIJPC/GnqALNFzmQngBlrenhkARhBQcaIxApq5ltRJnt5275+fQNwu9V12YlIJAtzqfX19bWWCuoNnF9e79+/v5VLXahl0n0r7poSL86Xdalgb6ZW0GxqHzXd972pPNUlgFEn6em0Oe4Kt+agnskdSIKURmA2Qs3qDid1bwb9sOmGNrKBI7rFRhQLMFzUXQU/xoDH/AEIP6WRwsygZE2DN/VIBDjpbiKi2GvCdN9STrwu2dyXJZlTVJuG/ZgGLQpGPGZIXvfON0BNrdboU9+jy7VZnQkBwxXawZKNdIThnDir9s+SKD9iJTBDmIQHE5g2i84X2yANurVWte3uymTC7hYWUngTafj7LTKpwmkChFdHkswwEqEbuxjzMLYVundubsshTIbvLGasJy6Hq8OjcjdmPTTOyPEaVvZc9P2fznqAQUgF2AiXzBDpO6PXR7lsIB+4z+D97Xa/3TdV3e7bvhc3D9CEcQc+wF13j4WgYuogZi4ihDjqrZciXWtKpShNwKhUwBixOdvuQbJ6zPWBZ6aaer8Q6AwmuzTsDko+6kyicoTmoB3+r8chgsGbR7wGwrxkkXAVB89Uv3My9WCjVPXaFEMpwg1eHZYYSwIz1+a3rZLj16+3X3755uZLXlJKAXDc4d6tYxJEYeLzl8vPv367rvmartd03Up1a2tmp/T0xJ6t7fVemjYFei+Aqs3uTYSfn1ftTkOYUzRua4aocOqJaaPSIqYtLznnBHd1jyYKEWVuHxIDvEfNI4YGApw9+sE5c/Qx4OHRHNMyRM0prywQjTUbWKpfaCaQRAnIAKChWoiJ1ixJ6LLmUstlySxJcnaQmYpwShy9cygaNvcp9iilCMd8bbqXphrprOFo0dLUHaPgZKw0wqg+G66VmZ4AgKDvdxjwmVTq3xjIbRgekd1r3cnXfdg0EQANMOfnk4wlP/4+ZFAgzbHoeeoFGtNGnxzzIicvbXye3r0x3BPTKCGaCU3zs4eNdp7/cXXgMYp1vlwMS4QlBnTS3vFtoOAu0CYm6beBeRP9db/V8P+MCQtEMkRB7wc7asN7mlTUfz0+N02HE4Jie2DoTkTrAzieDC8a34vf+CS+h29tGL0DrA5nFtGn4zP+RGGPj0YoBMDcyEDhdYfbsBNin5+0Uk8JnBNg7qoOR2taSiiFZt1nZdMBH4/tMHaqVUutzJTQFkRrTg9+KBEWIxdlIg3F0Gdn1GoFlmGaQH+CzVFsEQn0GLM8q/MIY1N4BKA/Xz8YVlK8Q+bOTkZORjgA0hBCc+bGevLT2abLyQfgP3tLJj7nOZ8IS4BqaUIkDohEpt6Bh4l84CA63fpc/DYSUEIqDR9FXLSPRSjfmJJR5u3h9Z7P9+kK+pAZEFSKtdSitTaPVs7NVG3f99ozN40IzLQsi4pKEmni7swsLN1TQeQAR4XkSOqZgZ3BvUBDbeKwnjtKPcTQAZL6APcH9HHw4Cibb9Kw54a07lKJ+WEnM1OnOh6N2KZq6g6I3s/vYUnZNKEDslYNEtvaWnBOBmcWDqDWfVjOzkzuMDYRmfc/zn3AugBH418e9oHM0RufHFMbjvox09OIPdDTXMEdWp+Q1Lw2OnjDYDfAfBUZ9vzu6uSDFWIeRJRzvlwuIrKua85JOPrlkRNKbdST4xMhwvnu5pE8SVMqgkJXOUUwD
qXZfa8w36u1CPZL4rwy04VTmE5+NLNSkKvT622vVWklWXmvOkl4kiA7s4lelyScJa/LKhEjbw2EUsrLy4sI54vkZTGz5nBtIFcjt8gtColgao0AFl4vCwHC0JTgCFYRJz7v6z5B1ksC0YWYk8FoxCrGjBDAQ1P5WPjUDf5OHHKce8iqIaGnY6jvliD3c4aaE0UcTaWxE4s52IVpzQL3NcuSRZWaWqPotnQoNBs8Yt1SYbhjEMUdcqb/pN6pfbAHhYjqsCGk1ke59DFfyWqpNdd9r6VUt2A7VjPvKdzDqGGRvGQxMTVJMiEGhkQBoiAu6C/S2FFdOkRDQR5p2Xban59AurldxwRhcDCGSTVFUpyKhukVzzxz6ucN9EeI3rDMzNT7rrq7R0dWSSk1kfdhuFHW34tm3WprQYNba+3t3tRiDdAEzsLUu4SIw703qjtJjs7Xf7KYJNHIP5+3TlOpv1vmGEtgQLk+jsMFO6VSXzfj/fe23ODumIN9SMkYQ+BATjPh4rTriCjlZb1cU5JlXZYkzBSdtlVbacXdo180EY3ECQTFChF4BLVmb06DuqM2hRU37FWbEYEgOS2rJHl6elqWxQcnRmu1lM3cmvPL27YLs3J2KU21NXJjUBJeiBUJ10WTZMlrXpi4lVosCHb27y8tJfl5+THni7k1h4OJrEWxEvraUqtqTuQifFkXIhLhyHjUZq7m9MBlGt/rsdfpkTAHE3cm527X07Tmw2mIAy4B1OEkTVh1kmeBwo4Y/AB8cdNGagBRpO5Eckx2Y4cwrUsiwmVJa5YW5mUDBmUVdcPQ1ayOKQvgG1bUGX8/rM7ulcGwiMKZROOv70boQz+47jcZZNp+TkIfUmAuVh7GV7TYpHkr8QgDFA2QNNO4TkRDw6abEZ3jQY7xjCftWGkqhTNEslP67JzOcS/H1jok27jN6XOa5snvf3xOPs67vv883+yD5DhKMGngV+eHdXLcJY4Bk47hKLDSlKenO3oAWfCBzXwKpS6nMDhTIpty/qCP2TTTHqcJ/IcjacLIod9PttyHY9yjTx0yDMBj0Caq66jScZqF8TLCjL3AcNgGHf325vY8WlQhSjWZRNgAIjMoYy5dIkQ5Gzsz2NmZ2TnKIQGAmEQibBbddsMuo7GmqMPvw78xn/9Y1cxsbDAich9S/t0aOo/6SRfTO6Axlby/3+lz3v14ST1Ztt/O9FI/fvXYYcfqnbt6kskRM/Hkg6O5Cuak43COTgD+cGMPy+CDHn28mQ/Hg1RyR3R8BVEkkpl1WtVeH6fRYzNsHuLE7q6q3PjASud9fvgp+JDk8GHgkoT/+3iSiR6Gnj8elKayCEyDYa/1Sv8xtuxug7t4ruGzqMEAC1POxUfjjywJoOiuJfLegsOAHiPJ9LhDZoq0k4S50PvGHoxlXUfMBX0cRMGfeTJyp7ebh2nDD3P8AVHGM829ezJqDwzl88XDZ47b6EbDGKgxdBhKZU4D0SiCOo+QO1S11KrGgDeVLCKXtfvGJBE7iFo0iCeWlBwgcuWg6eg+GUlOBHKjoAFwbs3N4NRr3NOal8vCwkhkZA43NndHIoE4mDNDxMPLXpq6X9b1H36mXd3vxtUbNy8VbnCrbQdoSfnHH38gota21jb0UjfrOcpgN4umAx7VUIAD0eV6ySn42FprHZxKIiaS/G5THrh1skMGtjmpy5N/qk/CowpwdJgULkPq8ii+xEPC+5QKx4WDmTJcaebDWazmAMFTYocsOa1LEj26rQR2G9R7AWPJ3A/f9eFuwYNFQ2OBTA1/Uti/J5Y+qYPb952YtOdle0+rGqBpKgWgY9PWWmgVms6I7ogdahaYWXwd5fHo4iOckszV36drivIzVjpG+GGOrTcaUZwaHHLvFdT9avPkZxHjw6d+PhtR1OuSjONjIqUPwTSFSy+C5Kh+o9SviCH36J1/6kAx45GGx3VIJXRPHB0w67hVei+PYshovpoe0Ik+TzcczhCfmOUBlXZX0ZDXJ
/EUsnG8+/CEj4PjbfTOJTdV9pwv6wKAmJlSgPFgbsk5cUoARRPZvqDJmcHiPRs4OnIqmUVBAIXVndaULzliZ4agenWHQyCcAOfMYHGmZqitOWhdl5/WdVcrKMatEEpiM4pyYhiul/XLD1+Y+fWl7bsCPkmChsRHqxpU1uHkkcSRB5RFchIAJSpyiIgFEJL0UbGd1xJwhkjk55WOKYwm4Jq20Ejfp4GYKMyjISkm7+F5mR1xJGBU5KlZ9FsFEP2dco6OuGYOR5uzfKqzGvJ0ArYDM5yWxGnLHubIfKjfQYD4rEvlEAePBt+DRXL4jAkhQY0fpRINqE/jqn1MQzP0JT0/Beo5e33swm5+HNLTA5wFEw8b8NG11F2HRJjsbp+IpP55etjLJxT2ab7SgPNnEcxgi7K66dKaVzzJ8YH5P5hOA4TQ+Xi4ymkQDxDdH6Z/ovsZArl3+2fabsOaxylQemB+mmj/UMn02Xo5buLzoyt46u7Nw+rCw+I9r+Exmqf1MH+OTw5N4BjWHRFF7kQvH+47GuiMK25O6uFFdgu1HptqFGsKU/RZaw4mCx7AKEni0WAYXdXBfdiQB/7uUYgBqSPTFRGJRRB0EX3ILZlDP/45Fv556Ds+ovfTcJZBcyXNL3oXTH7esfPwk8jrv8ej2fF0sQjATNFAXHrZZR/ymZM5Z7nvo7mkx9KhY4GOhzhL29OjfFxRH6VSZP9pH3/vUsjdRfoGS0GMPJdVI+LY53xYLnG2WCkjdQJOZN0eGc0cjnSY0R+lS4XRym6cad77tOfHsl2WJb4X0V/vDMG9TPO9/D4kzpRCBqLmIJBIp5IPlR6E4A8DRH3NgiLw4wIkgpsHU7W7pVOa0vganyVRh3Tz98PIPQkieoy0nbASADoPyGn+0RcqAeFg6qIwHpURJE5EwU3j6AGReRoapzh2x7Fdzgv6mIx3B5GI5CUTUXD82CiRH2cjYg7H2tQo6NmuIHEEPa04zXvzsRq6IUXElBbOqwDemqopRbSSqDWrbXczokScE/PiqFHUK5JTMtiS2qLELnpdWpZa2gY3syVzzizM18sCv8Y+L/vuQCdNV43BZeGUV2JOWZYlBa4t+25m2+1+u+8AOzVQ2rbdHpfQg76ZPw6n68OfMNzeND17feC5x69mBtwA4CdnGHVRhekVAVHH5R4taSMlsjXmcFc7gCS8ZtHIah41uAQQs6SeVptk3DzPNTZU7lgZ/k7qDAWDkVRx+vjD8UEqoacnTfUcgtOMYin1DjznLmCEKAubin3sOOqdxkBk5p1DBMDwTMVkjHgzD/zVR/VUH3PWNlM1HGqXQlO5iHQzM4L2wzX5TiQR0bD1yF0fB+gw68LQ8A9LioiJhWAsEuUXAjh3Z5m7i3WpdIKbh3SAg9lM3/lz+AABOCvJKRIepFAXGvMUD1LqOOuj1Oi7PGzb/sIfPhOCqcukD5fDw4sPpx8Hs4ikDh3c3aFmElw/I0e/e+4HhGQeCbFRm8oI7qzuwIsMge4a7446Fk4Lm1kkjDFGKzX14HdlhggbewU3MgaDKPpBJaHETMkva27CDGitqpBIIBTOSzZb4/HCT9QiA8hs3n/KWURylmVNxERUWw1q+7LvIZUcFJSq74eJToDoUQz1F1MOnVb56fufTHZovd5aiPyYwYm1fLYLJ4Aosi7Ujc2aWvQTCucCM+XEbDRy7wcCYBKRUdk+bnZUxwwj9LjHiSoGugP6XRIQGvIdeuvHh24CwQGfJCjtPHJYHe7OQULOLClRJ8T2SJJi4eEtPuPt4MQHHD0rq/eGxgkFzhGbnQv77+dJ6HboeO5pY4Uwmhbc9HlPn8knvbhOZtoxmzim+WwJPrq25jfOGg00Y4FB4TU9NRhlaHOuaKisqcaOk8YPehQBp3seZ8Nck/6pTPidN30Mayi104uHb8Wnzolu3TCc+2Be/PE7p+egUQXdI9TDDiIOqsduoY8R6Cccu6+PQrT6gJkz4L2dcq/P6KRPo6Rwj
px3Wme36B5utamxNWIVMXeoopKawYxhIO+9uhPrmkwtCcwrlAmWAikIRYoZmxsgwsuaRFlSzpnDZO/W6qD7ICIRQa8eHWRGH8aoL54TEO6el3dY6RimuQloWJEzjDrdFY++mmHpz+u/WxthwY104KE1B5wFuRincctdIQtPqQRgROmO7x4/Zzby7+ivWCJj1h+O91IppXS9Xq9PV0KQ4qILpt6nr5Mngsi6odfpirpl0L0nfc2b9QmjUdATQK9DdyKimE0CDAHQjtt/P4ZjKKPUY279LuM+WnDmbjgKPuZYnKXSWAI+wcEUa0SknxAJHqUegbViAcXnmdjhqmxB5ttDbngnE8gwOfnGtprXHz8PJNxh0RnWPCjL4w5pDPFxt+eAWy+TcQyCuA4/HsDSOHu/hMUcjTfoWGX92+/iiUQinILbMUAkUXRaYqfoHyzdNRncZgYaMJkIDBBEZFmyCFtrCnIzExCrO0icxVncoFWDXIeYBaDw2GqDNm8Npq2UKkzLEy6Sep039ijDzTAnSIYntpyfr+LuZqj1BUAijrBhoHqDk5m6ZZKnlJkI1NtIuY3CrJE9mzg9rezorKv3D1FcwkiYp/7kQ0kflbSHzTbly6HezmlK6BRj8HMG5nh1SKVpBM85NFBzmLqTo2kwzET/ZxFelmzuLJwPswlH+Rd1f0OguVh0hx153kenBTnen70//JDLj8ejVCIwc855yQuBg51ousQmxUjQLpGRw82M6ei+hnFD/bbC/PVYkSHgH6BGHy8Kl9txiyO+0x/jLJJOx0kyE/Ahr9J6V2EQPXQ0eXzik4XUL+dTcj2gquMJx7z0Fto8wKr3h0Z3u56k0vk01HX+ye/8Pv33fLXTjI6PToH8qIT89MnT6wN9jgfy04v4xONDRhpxLGEHMMFTz8t9hwHf3XRnxZsmKHzwJRHARB4Fx2NCxsgfm5CZJCURIVBUoPcKvOiVzQ4Oc8oOnDWCcGYwHTlK0VNv0WrOhCiXCvgsgBOEByUciQPbXm633d3Tsua0oAMz5mjm7STC62WJJu9xE61ZrSHnLZyxTMyJHYhGcMIftt3EShMgHcD7bL69w80HEgrBNBfBw1ohfPJW6M6HLr4OUFiWas7qFileg+ZLhBlORGx2nDZM7yE2+1KJrTeU4yGeotwIc/EdeIqHkqXjBA/Hg1Si0exMknSp5FMqATTDEWcqETIHIyyzcf5eMEg9deI8RqdN07HnTEkfd0+P22QAjfFsJ7Q4HFAde9iESN2t84CJzoLBhyMpyvHm6IzV0V/wJ/j73UETIZ+dAEydeIb84871926CY3TG/jx98sMFQ+GdhnH+5ZAWEzRPaT5k44Bux2CcVNnUKqChkb0r4tHG9d0NfSKWwtXAM1Y75o97Gcn0JmHK8R4R7WoL0X8KgLbWWnONNhgOTJZ2wuC1ClI2N7gpDNoUICahKHgjkhTBGfIRTwtjMOow+8ARgRC1qSFKeGTYMyd1Vy1uYInEdjeHqfqomIvlxCzDwhqAxmeS+rvxGcmKUyxxHzQ6Tfnp1elFX7mxeeakHRc5ltAA/2HbuTEOEoKz7KOh4fq6ZGaRuI6RnU41tsS8yplJZ2ClscaM7cD3B2qzsdaY4DOP4fF439E7ypcu62WUVfa14p2jwNTMWoWP1lRREiQDHLlj+JLgEA95HA4A6sZ3X4/+sBFO/7yDJ10IPQCXzgbpOLiL/ORXmkphjpr3hg3zOo4I5qSOpmUGOwD0OhFWSfyY9XFCH4RDovbvcueS6dNkQxiYeSis2IHOHXBMuHIIkHdL6pjTk3w7ZYv0ATqtjfmHeasD7PaKymOIhnCaJzir3xEB83EvdixfArw/wju5RABTkE5wSlmE5+zwoFicTsV+I8fNUuTlmTtVYhWtte27qcKiBaqJIKUeuVONrlXm5qbe9mCYIQILS1ooryJMeV0hCYC1qJJwcBiPI4+MaZBeiFk298wiQsyyrmteLs0MhajVXh8VdOqRY
9y8NoNHs410zN1QpUt+v4Qo8g9EmCEhDYfdNuXUKTts6svjvIcdMfA94f3/Tn+MJQBnO0I3g5s1fgYfQE9GAiUiFvbR57bfNLoaHyu0L445f7EYZjazkfEE5t3JHd5t72yJjGiw8lEsfeRX6qQZwyKJ0D7cIWOtd0Oyexg7Aj5v+DkzfsxSH7tzwfDp83S4N86rfBhvQ/yesNTpo1MkTcqqh53SsW6XbDgBMR9zF6M9KxAnSnpXzfv+OCkC74vowFnzsTFVm8/Rw4yfjcyiiX8OJ/Bxlf9Pj5Mr6hgrjPHESRoev/fJoKGJ4316KKj8m/d0qH+O9g0RugrEbgOQHvf4oCqcAHIPrs7huzQLJtQ4OTMdOSTe63tVrbVm6pGZS0TCkpIIk4gEKeC4WF9DIUCZycPFFe2MhCnaJYSuEkkpkZmoiNvgCg5tOMqwzN0RCbcTLM+B7t7whwEaSPzAK8RzXA4d1z98+t4Y35iSA6ecBnWc4xFeBZPCILzvtzhW7HmpTv0aOU8Tm0x77TjzUFkdM3RTf+hAYDCHzXU1f3aYRQ/q93x8wmRCU4rEZcxDag5avqB1msH0sbWJogEA9T5LwfLx4Lh4dIseGuCDnDrbMGedD3R2tp4O2wFXPBx3lyDNHT+fZAzlMOy6xAxkiwNFDokZzjM2mw1P3h/zvn7noHkyP785LjwhzQexgdNUA/NhRkHbp/KAfldajFNNT+RJ3Y5/+kI5YPwxcmd/63HGA8V9MjYEJk69CXes+i76ONy6AOAzhcd7Su3YDCJg4ujwzUKeKC9u6qpoDXCRZVkyEcmSRRIAIcDgCYtY9KdkEgCSSXJPOwmgHuFjEJBGp0ZhInIiZ3JQSrRC3JEoevWIxL9wZmFWkAexOjNEpLMgBT+YJE6CoSMdPaRgUwPMEaLDEppVuBMX0Wn4xwh9nGucVvZxUpxPNeWau9PUKjYnZIik479ZkjFm3A3EE/uf8ddJJM3tRgGg+/10s3Gu32Mpxql9MO58to8+SiV6NyiTAl97R5Z4YdMopen37WZarLrwb1pwGx/jdwh0HIOI4YkbenOu/UMqUZ+igUeHBUJz/4QqGPd9zNjDk3t3rlNomwkHJvfa+BQ68eDnUml8CGfBMnc5zXf9eJeG680fv/MOuR0vveu4mMX+kOeRGS8OBDbrcB9v9HyZQ1uNk/aXU2UeDodj6R93fpJ/jvNj9E+SMGdJ0qmz5geImZIwEVprTZuPVBIHhDpzS1oyD2cQMzuThZu6lgaH+7LkZclE0OicC5JFGAwnhhzCG3AyZwOcfQRepPeS4MwkPFAJnKCxfCTLAjhJ1KoQScrMQUAkCcndAQWMWXISd6TESwQOIxAMBPM1EFvG7AMDLBFFwgEPfN4hOQ2bDSFlHr93RrMDDkydfhIxh6t0WnA94EvU6b775hgSjAZvPR+NbWKxCvxh7XRHUl9jfew+rN9DoY6tSp1nE92nCThgs70I3h+/w/o2RyIeK2LKbgOvDlPqhHKGAj15K6ahMFojzlmZL97BJH98HUgYfRLmGz7maOzBsDa6qXzcz7G3h4E5zxdfOfDHeWDdxy6nYUF+Oiyf/vpeRH3+lw9vfSL54trvJNB/6fgIPd/vi9+9yQO4HmjppFIeTkqf3HR8dCQqP+KsAQpA0ZJ3+ggxtBNNN/CIkDNF8q53GhcSkRx4Bx6ynkk4KqPRqcviiRVm3mL9u4/YUncYRuv5sdOn0UMU9GDsFK2WpuUSdze8KBELICI4GC4+hcKJz2cu1M8A5ZQH3SrCe6Pr/WSNJfBu7k5zNlHMwFunOwngcgqe+AmXnS3G8dZU0cdP7zc5FHrItiFzP9G2757gOOZvv6fyP5NKI1oTXprBauKjurjznJxAzbB/LN4e7ZXCrzmbH727o89us+uuQ2fPmTiegQbHc4hKovdTOg/rXl0aVmc/Bw0iR+pIGgSP0s/TrhwJrB82uePwhRxPM4ee+qzOXMRQFjGrJ735+ZI9/
ZnO43L8PF3w+GOfBgxYc5ZEXSn6SQ0MNshxifOIz2UKPO6daW1PafP5kiI4wxnnptuE3nEGU9idIcSUFjG2ZobWiCncSRRJlTkTPEkPm/EB53qunIgwSffqR+gjJsocbgTINFOEmSNBSd0dTJyi00G0hoc7NFgNYEGFgl6Z0DP5fYggMzLAzTvdFrz1fmPTR/Bu/cSi6xVW4coMGXz+9PjtPf54nPn5euCe4xiDToB3QdL7cwOHE3PO7/xvXhsT5j/MdK9pGX7g47/usTsayfloSTadwvH+dIdPugL7IJs+9jjpR/C9AlDtjE6RyB/VQN23ZDPKdNJ7mAMzmhH2RdeLyx4cz8f2GYMyzcKTnXzWP6oKqMONghSTJvqNY7qytPcR7LLVDz1GIifOJwBw02jq0umFg+DoQ1S3z9BYuvOd0ww6EfX6yGlxj2j+REaPIMwxhcrpdPBDEJwkysdjiiSi8zUOKHgazN6W9gCSx31jrNIhnUICPZTjdUdT17wDjj8eDERGEcfFQacA+KGd45ZjssKvHBq5Z3W4QiFEIS1EmCgD6DNCCKZQeLBkgwBJKUmKle7BR9mGjLJevAaiaE7KUZykaubMlDgRc7MuT8J9SiCGcCfyPW94+Ag0O9wbzLzUVmp0kepNeQYNzvtpI6Je9trbSHZWozkTOL5zrnk91hsd03u6LRpkD4Md8DRRHSj10Guftu5i78sCXTD5WEnx1fP0Og5HCrpZONpTo8Nfi9DzFE/dYpo/MBQGVK01i4Yb75bQxzq406aYJ/ThWPfDLMMMOA+pRDPvfQ7/eL4puOORTwJiCLQJjE6q4FH4n846Jfln5gV1wPW+/G3+fDgbuln4iDjOPz+KpWMQD0PEP/37f3b8jU8+KtnPsODpb+c7J+BE2j34Azoq9yEjxzvAdPf3N+lYln2hjg1z2GTjluh9+ue8h9MA+qFwxi90mv7TdAxyKMJswsCHLHu81AB5U7lhOBaOO/GHN99NlI+v+HD4na2ESDIAGUbPoR7j5hErifVvvebBVLVFZ8ZgmDsW+ac2zZD/Q9B/HMTfP/z4yPAqH2t1oqcDSnahGmi99wo/BCaNzz+e+f1tHxoVY7AfB37Kiu70nUJoIhd3Hxztfj4+jNBHzoAeYg8G2CH7D041RBkz90cbu3Ku6Ec50hvmDZ1KB0FtHHNFhsSOjwCnrRF/PXYSiChIr2lkYA+mwU+wVdSonTHU/Er8NfYHE8uZqO1wQL6XBoewP4+snSDr8XYX44fkPvTFu83xeJydY2NhHUvH59/GggppM3TAHCgfP5kAJjgZRwoboXM3HvVLB159hGZTKEwzEP2cAczowwhBiDMznfvGHpqHiEgkxX6YayBgRfDbzoRJwBOzh/MbSDEbxiFzNQSHd6Fh5nASrkzEg2DvHZKL7okMF2MyMrVogsYgZyHmUttem5m3UnVvIFryJeXF3DYtzRoRRIKpmqL4u1Qtu5r5XmupdYwMEVFKiUXaxyYnNDbKu1kOkT0t8D7SdEzO++VCAXvNB4Q7UTVhLp1jNfR3PHIp+8yNYjDvL3oeuAOjp9uAJ/DR5mHYR0MGR7zR3COt1N1H4hI8yKB7tZ27q3tQfAdIspnXeTo+seAGQ26nfTuXvI4hZYKzDNf++OrM7plj7p3l4IgEv8ez3nfVwR4wFPI7pENDAjL1kAGN0v93QpN6eSTmSY77OQmmECcR12WObMp3OA/nd+YNj6l4pwMwxNOMKxxiqOuDYfXNn/545pPYOfAJ5o0cv/qx4MZHJwDx4bJx4AgJh+Xms73IUHqnVexTNwz8D9BZKuG8RSLTx+eNHUfkVPNBzNBPTyManZIIjiD6MdfutdVaaywZuGcRyjlmPLoZgNyiJ7h7C6YKdziYDGohC9a8EI21fkCqPm8CT9p7O7emqspORo2Y91JvezG1uu1lKwS+XGxZTN3u5V60MiMlYonae3ZH2dt9a6ZWWiu1gpBTFpGo6RVz/SiVxmwBE
5mMgh7gcPkc937SRcdY923iwy89hVEvSSJ0LTJrhfpXprf6WEQDcPUs1nm/dlhg/cXg4Dl07CysPF6EVBrU9NE+2QdTlVrHlHGrn7aBeceQ66XWt9c30/6/857XwE7uagPU4jgljSU8dwjGw4ehfhjIxwYe25XAFKyPdHx5rFRMlH4aERxSuTPkHrtiZD9O6dFqba0dsvXU0duSMHFjaiOXZtwjgbBvW2vtPESqer/d315eBwbqM4MHYefzT8P4ttNcYiSx+CEa5hTMVyec2P/5wIp5lgbTUB7jhEOnjaLwiFpMRTftn3ndXvMwr3qajKHPOwDp+YfurZbzrnOg1Ha7FxpUJuPkRMJcFQczl89bDbWhptteWm3hNgW8smkNvw8tA73GDTUnHYsJju7CJhJJe1YmLhqOnvB4GIDgtRTm0jyn1lT3UlSVRbkaiPdat1JVre2lbpWI1KU0mNu97lUbhVRiQmxgUNnbtjczr63V1gCoQsSYOGUw617aOyaT1mzbqo86d/TubxP7+sPETjPjcYHMmaGxYw4/6cm/1L8yvAx+WFwHBD85oehU0wrM/rdnl9Cx7A1H8veUSrOox4/wkg0Lo7PidSMMRA4q0Vfu9xc2APzDH37+p//2TyklP/nS34uDvuHeC7lDxeJBf46PPxzHOxPdH6PU3xmz8v4rPn85ZPB5Ow/1Pt4Nm3R+5WzmjYz3yaP5MC6q+vW3r68vL/P969P1n/77f7s+XcetHbLlEDL+8OvDR87yYj78J1LpgN7zqU73dQj4d4JpDNT7MZuP/vD74yXn6J3H4Ox5OD4e8J8Ax+vL9+/fvppq/FWE//Gn55+eL0OB+8Opmd+tOD+QIdxnX8+O5ZhJeloPJg6PL9opOz7uLrbn6AoDm27nY2N3CRhtbXo+USe9EBDULNS4NQ2/UrAku3szjUrvMPoxQI2pt2bdQW6OE0tP/LuX9u37vdRDt/3w5frTj88SwcQxtA+jckzsR5fLhKon5UkYWAA0J/BhOZ/32lkJjesdTsmHGxnC7Jirk1E+oPZhFxxL/bQNHrbD0OI+Jg1q9vqy3e77+wF4d3y0Wv5//PiIAOn3/xRS6dMPf37yT+H3//8fn4wMgP9sND45z4fxwQcz/f/y42/N/+kzf+Ov7zfu3/7kpyc6K5D3f/q/YnzO1/ibT/q733p3/NdP8p8dvzNifz/+fvz9+Pvx9+Pvx9+Pvx9/P/5+/P34+/H34+/H34+/H38//n78f3X8vwFGZnGmCmVuZHN0cmVhbQplbmRvYmoKMzYgMCBvYmoKODU3NTYKZW5kb2JqCjIgMCBvYmoKPDwgL0NvdW50IDEgL0tpZHMgWyAxMSAwIFIgXSAvVHlwZSAvUGFnZXMgPj4KZW5kb2JqCjM3IDAgb2JqCjw8IC9DcmVhdGlvbkRhdGUgKEQ6MjAyMTA5MTYxNDQxMTMrMDInMDAnKQovQ3JlYXRvciAoTWF0cGxvdGxpYiB2My40LjMsIGh0dHBzOi8vbWF0cGxvdGxpYi5vcmcpCi9Qcm9kdWNlciAoTWF0cGxvdGxpYiBwZGYgYmFja2VuZCB2My40LjMpID4+CmVuZG9iagp4cmVmCjAgMzgKMDAwMDAwMDAwMCA2NTUzNSBmIAowMDAwMDAwMDE2IDAwMDAwIG4gCjAwMDAwOTM3NTcgMDAwMDAgbiAKMDAwMDAwNzU0NSAwMDAwMCBuIAowMDAwMDA3NTc3IDAwMDAwIG4gCjAwMDAwMDc2NzYgMDAwMDAgbiAKMDAwMDAwNzY5NyAwMDAwMCBuIAowMDAwMDA3NzE4IDAwMDAwIG4gCjAwMDAwMDAwNjUgMDAwMDAgbiAKMDAwMDAwMDM5OSAwMDAwMCBuIAowMDAwMDAwNzQxIDAwMDAwIG4gCjAwMDAwMDAyMDggMDAwMDAgbiAKMDAwMDAwMDcyMSAwMDAwMCBuIAowMDAwMDA3NzUwIDAwMDAwIG4gCjAwMDAwM
DYyNzggMDAwMDAgbiAKMDAwMDAwNjA3OCAwMDAwMCBuIAowMDAwMDA1NjkzIDAwMDAwIG4gCjAwMDAwMDczMzEgMDAwMDAgbiAKMDAwMDAwMDc2MSAwMDAwMCBuIAowMDAwMDAxMDY2IDAwMDAwIG4gCjAwMDAwMDE0NDYgMDAwMDAgbiAKMDAwMDAwMTc1MSAwMDAwMCBuIAowMDAwMDAyMDU1IDAwMDAwIG4gCjAwMDAwMDIzNzcgMDAwMDAgbiAKMDAwMDAwMjg0NSAwMDAwMCBuIAowMDAwMDAzMDU0IDAwMDAwIG4gCjAwMDAwMDMxNzMgMDAwMDAgbiAKMDAwMDAwMzUwNCAwMDAwMCBuIAowMDAwMDAzNzQwIDAwMDAwIG4gCjAwMDAwMDQwMzEgMDAwMDAgbiAKMDAwMDAwNDE4NiAwMDAwMCBuIAowMDAwMDA0NDE5IDAwMDAwIG4gCjAwMDAwMDQ4MjYgMDAwMDAgbiAKMDAwMDAwNDkxNiAwMDAwMCBuIAowMDAwMDA1MTIyIDAwMDAwIG4gCjAwMDAwMDU0NDYgMDAwMDAgbiAKMDAwMDA5MzczNSAwMDAwMCBuIAowMDAwMDkzODE3IDAwMDAwIG4gCnRyYWlsZXIKPDwgL0luZm8gMzcgMCBSIC9Sb290IDEgMCBSIC9TaXplIDM4ID4+CnN0YXJ0eHJlZgo5Mzk3NAolJUVPRgo=\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:41:13.520083\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}, {"name": "stderr", "output_type": "stream", "text": ["/usr/local/lib/python3.9/dist-packages/torchvision/utils.py:50: UserWarning: range will be deprecated, please use value_range instead.\n", " warnings.warn(warning)\n"]}, {"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:41:13.776275\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}, {"name": "stderr", "output_type": "stream", "text": ["/usr/local/lib/python3.9/dist-packages/torchvision/utils.py:50: UserWarning: range will be deprecated, please use value_range instead.\n", " warnings.warn(warning)\n"]}, {"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:41:14.034943\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}], "source": ["input_imgs = get_train_images(4)\n", "for latent_dim in model_dict:\n", " visualize_reconstructions(model_dict[latent_dim][\"model\"], input_imgs)"]}, {"cell_type": "markdown", "id": "ef21b4fe", "metadata": {"papermill": {"duration": 0.057981, "end_time": "2021-09-16T12:41:14.313924", "exception": false, "start_time": "2021-09-16T12:41:14.255943", "status": "completed"}, "tags": []}, "source": ["Clearly, the smallest latent dimensionality can only save information about the rough shape and color of the object,\n", "but the reconstructed image is extremely blurry and it is hard to recognize the original object in the reconstruction.\n", "With 128 features, we can recognize some shapes again although the picture remains blurry.\n", "The models with the highest two dimensionalities reconstruct the images quite well.\n", "The difference between 256 and 384 is marginal at first sight but can be noticed when comparing, for instance,\n", "the backgrounds of the first image (with 384 features, the model captures more of the pattern than with 256)."]}, {"cell_type": "markdown", "id": "f812acd6", "metadata": {"papermill": {"duration": 0.057213, "end_time": "2021-09-16T12:41:14.428039", "exception": false, "start_time": "2021-09-16T12:41:14.370826", "status": "completed"}, "tags": []}, "source": ["### Out-of-distribution images\n", "\n", "Before continuing with the applications of autoencoders, we can actually explore some limitations of our autoencoder.\n", "For example, what happens if we try to reconstruct an image that is clearly out of the distribution of our dataset?\n", "We expect the decoder to have learned some common patterns in the dataset,\n", "and thus it might in particular fail to reconstruct images that do not follow these patterns.\n", "\n", "The first experiment we can try is to reconstruct noise.\n", "We, therefore, create two images whose pixels are randomly sampled from a uniform distribution over pixel 
values,\n", "and visualize the reconstruction of the model (feel free to test different latent dimensionalities):"]}, {"cell_type": "code", "execution_count": 15, "id": "7df92e6f", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:41:14.545606Z", "iopub.status.busy": "2021-09-16T12:41:14.545125Z", "iopub.status.idle": "2021-09-16T12:41:14.748703Z", "shell.execute_reply": "2021-09-16T12:41:14.749086Z"}, "papermill": {"duration": 0.264385, "end_time": "2021-09-16T12:41:14.749227", "exception": false, "start_time": "2021-09-16T12:41:14.484842", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["/usr/local/lib/python3.9/dist-packages/torchvision/utils.py:50: UserWarning: range will be deprecated, please use value_range instead.\n", " warnings.warn(warning)\n"]}, {"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:41:14.633242\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}], "source": ["rand_imgs = torch.rand(2, 3, 32, 32) * 2 - 1\n", "visualize_reconstructions(model_dict[256][\"model\"], rand_imgs)"]}, {"cell_type": "markdown", "id": "267b07f5", "metadata": {"papermill": {"duration": 0.06058, "end_time": "2021-09-16T12:41:14.872630", "exception": false, "start_time": "2021-09-16T12:41:14.812050", "status": "completed"}, "tags": []}, "source": ["The reconstruction of the noise is quite poor, and seems to introduce some rough patterns.\n", "As the input does not follow the patterns of the CIFAR dataset, the model has issues reconstructing it accurately.\n", "\n", "We can also check how well the model can reconstruct other manually-coded patterns:"]}, {"cell_type": "code", "execution_count": 16, "id": "21864c63", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:41:14.998551Z", "iopub.status.busy": "2021-09-16T12:41:14.998040Z", "iopub.status.idle": "2021-09-16T12:41:15.222492Z", "shell.execute_reply": "2021-09-16T12:41:15.222012Z"}, "papermill": {"duration": 0.289797, "end_time": "2021-09-16T12:41:15.222633", "exception": false, "start_time": "2021-09-16T12:41:14.932836", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["/usr/local/lib/python3.9/dist-packages/torchvision/utils.py:50: UserWarning: range will be deprecated, please use value_range instead.\n", " warnings.warn(warning)\n"]}, {"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:41:15.098251\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}], "source": ["plain_imgs = torch.zeros(4, 3, 32, 32)\n", "\n", "# Single color channel\n", "plain_imgs[1, 0] = 1\n", "# Checkboard pattern\n", "plain_imgs[2, :, :16, :16] = 1\n", "plain_imgs[2, :, 16:, 16:] = -1\n", "# Color progression\n", "xx, yy = torch.meshgrid(torch.linspace(-1, 1, 32), torch.linspace(-1, 1, 32))\n", "plain_imgs[3, 0, :, :] = xx\n", "plain_imgs[3, 1, :, :] = yy\n", "\n", "visualize_reconstructions(model_dict[256][\"model\"], plain_imgs)"]}, {"cell_type": "markdown", "id": "76301ef8", "metadata": {"papermill": {"duration": 0.06382, "end_time": "2021-09-16T12:41:15.352722", "exception": false, "start_time": "2021-09-16T12:41:15.288902", "status": "completed"}, "tags": []}, "source": ["The plain, constant images are reconstructed relatively well, although the single color channel contains some noticeable noise.\n", "The hard borders of the checkerboard pattern are not as sharp as intended, and neither is the color progression,\n", "both because such patterns never occur in the real-world pictures of CIFAR.\n", "\n", "In general, autoencoders tend to fail at reconstructing high-frequency noise (i.e. 
sudden, big changes across a few pixels)\n", "due to the choice of MSE as the loss function (see our previous discussion about loss functions in autoencoders).\n", "Small misalignments in the decoder can lead to huge losses so that the model settles for the expected value/mean in these regions.\n", "For low-frequency noise, a misalignment of a few pixels does not result in a big difference to the original image.\n", "However, the larger the latent dimensionality becomes, the more of this high-frequency noise can be accurately reconstructed."]}, {"cell_type": "markdown", "id": "7be3c419", "metadata": {"papermill": {"duration": 0.064246, "end_time": "2021-09-16T12:41:15.481865", "exception": false, "start_time": "2021-09-16T12:41:15.417619", "status": "completed"}, "tags": []}, "source": ["### Generating new images\n", "\n", "Variational autoencoders are a generative version of autoencoders because we regularize the latent space to follow a Gaussian distribution.\n", "However, in vanilla autoencoders, we do not have any restrictions on the latent vector.\n", "So what happens if we actually input a randomly sampled latent vector into the decoder?\n", "Let's find out below:"]}, {"cell_type": "code", "execution_count": 17, "id": "d7f283ff", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:41:15.629358Z", "iopub.status.busy": "2021-09-16T12:41:15.628883Z", "iopub.status.idle": "2021-09-16T12:41:15.799212Z", "shell.execute_reply": "2021-09-16T12:41:15.798800Z"}, "papermill": {"duration": 0.241041, "end_time": "2021-09-16T12:41:15.799325", "exception": false, "start_time": "2021-09-16T12:41:15.558284", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["/usr/local/lib/python3.9/dist-packages/torchvision/utils.py:50: UserWarning: range will be deprecated, please use value_range instead.\n", " warnings.warn(warning)\n"]}, {"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " 
\n", " \n", " \n", " 2021-09-16T14:41:15.713164\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}], "source": ["model = model_dict[256][\"model\"]\n", "latent_vectors = torch.randn(8, model.hparams.latent_dim, device=model.device)\n", "with torch.no_grad():\n", " imgs = model.decoder(latent_vectors)\n", " imgs = imgs.cpu()\n", "\n", "grid = torchvision.utils.make_grid(imgs, nrow=4, normalize=True, range=(-1, 1), pad_value=0.5)\n", "grid = grid.permute(1, 2, 0)\n", "plt.figure(figsize=(8, 5))\n", "plt.imshow(grid)\n", "plt.axis(\"off\")\n", "plt.show()"]}, {"cell_type": "markdown", "id": "dc366247", "metadata": {"papermill": {"duration": 0.065573, "end_time": "2021-09-16T12:41:15.933017", "exception": false, "start_time": "2021-09-16T12:41:15.867444", "status": "completed"}, "tags": []}, "source": ["As we can see, the generated images look more like art than realistic images.\n", "As the autoencoder was allowed to structure the latent space in whichever way suits the reconstruction best,\n", "there is no incentive to map every possible latent vector to realistic images.\n", "Furthermore, the distribution in latent space is unknown to us and doesn't necessarily follow a multivariate normal distribution.\n", "Thus, we can conclude that vanilla autoencoders are indeed not generative."]}, {"cell_type": "markdown", "id": "beb39fdc", "metadata": {"papermill": {"duration": 0.064649, "end_time": "2021-09-16T12:41:16.062528", "exception": false, "start_time": "2021-09-16T12:41:15.997879", "status": "completed"}, "tags": []}, "source": ["## Finding visually similar images\n", "\n", "One application of autoencoders is to build an image-based search engine to retrieve visually similar images.\n", "This can be done by representing all images by their latent vectors and finding the closest $K$ images in this domain.\n", "The first step to such a search engine is to encode all images into $z$.\n", "In the following, we will use the training set as a search corpus, and the test set as queries to the system.\n", "\n", 
"(Warning: the following cells can be computationally heavy for a weak CPU-only system.\n", "If you do not have a strong computer and are not on Google Colab,\n", "you might want to skip the execution of the following cells and rely on the results shown in the filled notebook)"]}, {"cell_type": "code", "execution_count": 18, "id": "87bcc28e", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:41:16.196119Z", "iopub.status.busy": "2021-09-16T12:41:16.195656Z", "iopub.status.idle": "2021-09-16T12:41:16.197888Z", "shell.execute_reply": "2021-09-16T12:41:16.197398Z"}, "papermill": {"duration": 0.07074, "end_time": "2021-09-16T12:41:16.197996", "exception": false, "start_time": "2021-09-16T12:41:16.127256", "status": "completed"}, "tags": []}, "outputs": [], "source": ["# We use the following model throughout this section.\n", "# If you want to try a different latent dimensionality, change it here!\n", "model = model_dict[128][\"model\"]"]}, {"cell_type": "code", "execution_count": 19, "id": "3abba35a", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:41:16.349216Z", "iopub.status.busy": "2021-09-16T12:41:16.336154Z", "iopub.status.idle": "2021-09-16T12:41:29.806879Z", "shell.execute_reply": "2021-09-16T12:41:29.806369Z"}, "papermill": {"duration": 13.543186, "end_time": "2021-09-16T12:41:29.807006", "exception": false, "start_time": "2021-09-16T12:41:16.263820", "status": "completed"}, "tags": []}, "outputs": [{"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "fc07ca3d23014b6f9d5fb7b961f16005", "version_major": 2, "version_minor": 0}, "text/plain": ["Encoding images: 0%| | 0/175 [00:00\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:41:30.318327\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:41:30.522324\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/pdf": "JVBERi0xLjQKJazcIKu6CjEgMCBvYmoKPDwgL1BhZ2VzIDIgMCBSIC9UeXBlIC9DYXRhbG9nID4+CmVuZG9iago4IDAgb2JqCjw8IC9FeHRHU3RhdGUgNCAwIFIgL0ZvbnQgMyAwIFIgL1BhdHRlcm4gNSAwIFIKL1Byb2NTZXQgWyAvUERGIC9UZXh0IC9JbWFnZUIgL0ltYWdlQyAvSW1hZ2VJIF0gL1NoYWRpbmcgNiAwIFIKL1hPYmplY3QgNyAwIFIgPj4KZW5kb2JqCjExIDAgb2JqCjw8IC9Bbm5vdHMgMTAgMCBSIC9Db250ZW50cyA5IDAgUgovR3JvdXAgPDwgL0NTIC9EZXZpY2VSR0IgL1MgL1RyYW5zcGFyZW5jeSAvVHlwZSAvR3JvdXAgPj4KL01lZGlhQm94IFsgMCAwIDY4NCA5Mi42NjQ5MzUwNjQ5IF0gL1BhcmVudCAyIDAgUiAvUmVzb3VyY2VzIDggMCBSCi9UeXBlIC9QYWdlID4+CmVuZG9iago5IDAgb2JqCjw8IC9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9MZW5ndGggMTIgMCBSID4+CnN0cmVhbQp4nFWNzQrCMBCE7/sU8wT5a900x0oheKwXHyDEn2AVW7Cv7zaC4GFm9oNlxqKQ7i0uC8RgUESr3HFjMkITcddK3msGp5jb0OyEzR9dic70gleuijkohu+Uqw9GHHPGCQ/o3n0Hi2iV6gg95Pct5WPcIy3Swn6bNvDhV5gm6IPF8MRII30AE9onwAplbmRzdHJlYW0KZW5kb2JqCjEyIDAgb2JqCjEzNwplbmRvYmoKMTAgMCBvYmoKWyBdCmVuZG9iagozIDAgb2JqCjw8ID4+CmVuZG9iago0IDAgb2JqCjw8IC9BMSA8PCAvQ0EgMCAvVHlwZSAvRXh0R1N0YXRlIC9jYSAxID4+Ci9BMiA8PCAvQ0EgMSAvVHlwZSAvRXh0R1N0YXRlIC9jYSAxID4+ID4+CmVuZG9iago1IDAgb2JqCjw8ID4+CmVuZG9iago2IDAgb2JqCjw8ID4+CmVuZG9iago3IDAgb2JqCjw8IC9JMSAxMyAwIFIgPj4KZW5kb2JqCjEzIDAgb2JqCjw8IC9CaXRzUGVyQ29tcG9uZW50IDggL0NvbG9yU3BhY2UgL0RldmljZVJHQgovRGVjb2RlUGFybXMgPDwgL0NvbG9ycyAzIC9Db2x1bW5zIDY3MCAvUHJlZGljdG9yIDEwID4+Ci9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9IZWlnaHQgNzkgL0xlbmd0aCAxNCAwIFIgL1N1YnR5cGUgL0ltYWdlCi9UeXBlIC9YT2JqZWN0IC9XaWR0aCA2NzAgPj4Kc3RyZWFtCnic7P3rsyxbtheG/cYYc2ZW1Vr7dfp0972ExENg2YD8kJARIrAs4AYhhGyHP/gPdNhfJQs5wkgICQsCHMY4LCAURmAJuLfv7dfZj/Woqsycc4zhD2POzKy19+luXiHZcWbvrlOrKitzPsfjN17Ad+279l37rn3Xvmvfte/ad+279l37rn3Xvmvfte/ad+279l37rn3XvmvftX/ujfZ/MAsx978cvr+QXl79hb9/4d1vm//yX//TNnevta5/igjRbnQ37Z93X/7ZN3dT1fVPZt6t3f/PN3e3m9EJ838v1sjN1vfE/OJYOPY76wvv4lJ3v1k7kbjR/380Mze7GR39sx4d/YK/WvPPPiHQFy51367//DdfuO/t6OSfw+j+O2h95OZmux1+O7r/7gfq/oVl/VV6Fb97QTN/6dp99t2XNtB/b5rZzei2nrKkP/on/70/8If/VbjDvZYyz5O7aVURfvX6dUp5GLKwMIGImIiYmMBEhPZKcALc1d1SYpH+FYEIB
CIid1+W2cxSSsFumdfvQYADDg3ev595AplZrbURVaJYG1Vzdzd1d2YWlnjSj370o//j/+F///6bbwDknP/Mn/1zf+gP/493U7E70yBvs0G/4ID7P/W6+rf/+aVd+4vaj3/7R//xn/8PHh8eAKSc/43f+NO/+3/w+3ff04t37ZVWZhT/3zYr0S/pQL/PL5kF/6UU0vs1vrv+9qOf/vbv/NX/+C9ez2cA4zj+yT/1Z37P7/2XblgkeQygsdd168QYiQAiYoebKXybXkfMdfxJ3PYfMTMAc1upPFG/E4jgBC+X8+M/+kc2z0mrMP/wf/Q/vP/+910G52zuqqbuS1UzL9XMvaibuzu5AzDAmSBCv/WP/sF/9hf+o+vlAuBwPP6p3/hzv/v3/D7vXfyl83vz8o/V3OmLv9vviS88rf32y33x3b5xAP6bv/kP/q9/+S/M8wTgeLr7t/7M/+bX/oXfE4Nz9x0vJQTNII4ZRicggJPHteZERtyPPITA5EJggjAlpr6pyZ0At/Yzc3MH3EEEZsrCp+OQhE+HkZlMzc0uU5mXOhedihlg0UtCu4e/FNXc/Tf/wd/76//5XyjLDOD+/vW/8xv/61//tX/BEeOibTq/dR39i9+tx3P33a9GEdwbZdpfHovpu0vWty9vGoehffr3/pu/+5f/6n9aagHw5s3b/9W/97/99V//9TgGOWVJElygnRdaicg6sP4ZdZbbp9AdZubuqmbt/DWWABAxrZ1biRKBHB7yhlqptZ7Pz7VqKdXNU0rMPB4O4zCCghsxs6ARGNd4kntjSOZ/5+/8v/6Tv/B/Dn3v3Zs3f/ZP/8bXX30vBHTmRgmCGog0mnD7ykzcOJ8wEcVviRmgtkGZCQTurIs2qtlnhraPf2Wd8jPyFR9SH6vD/a//9b/27/8H//7K3dP6Y2b+g/+zP/a/+LP/O7jDbZ6uz08PZlaWJeX8wx/+2uEwno7HnDMTCRMzCRMTpXglIoLEE62465A5Z5bO/plDIGB3P5+fa62HwyHnzNHa921R1Stg1LfOyodUdZkXACLCzDlnIqq1mpmpuqmI5JSJCMR/+2/9l//Rn/8/BWsXSX/0j/3xf+ff/XO3ez32HXlj6ivbutn+3l/9V1+KLy7P/ta0dWN/8H71G/1Xf/tv/Rd/6T/prD39oX/9X/sj/8t/CzfC0EZo1uFtR67Tkb7VOqX99rZSnV/A3X+pgLKR+C+9rm/+67/9d/7Gf/FXgrXnnP/I//zf+KN/9N982Rs4M+IQ7r+Iw0fMROzuqtU9CHUjM+7tPRGYJYkwsyQBoFZbT6jLj01ydYJPH97/5P/xN/R8HpZ5yOlf/o0//fUf+AOeTp4O1axWK1UvS6nm17lW82lRNVcnNwAKmDByov/yb/7f/+p//heDtY/D+Ef/2J/4V//IH1t79YV536bv5s0vl6JeTljnrLe/63vgy8v6Ymle3NUd8Bu28v/8m3/9r/21/yxY+3g4/mt//N/+g/+Tf917ixuhsXZxIiB1YugE57idu5u5u4GUBUQizISBIYzEyIzENEhoGQyQg9xhpt7IeuMgRBCmw5jfvT6OQ3r3+i4J61JN7ePj5fkyP0/6NFV1L53JObyqriS0T56742/+9b/8N/7Kfxqs/XQ8/Yl/80/94T/4P/VNWIyBfTt374LQrSTd5p92a+Av/nuzJLd/tGVtIuT+GLs3Bu/7DbMTWdqi9PX7y3/tL/2V/9tfDtZ+d3f3p/7kb/yhP/SvBIUeezsej8wsqStk9HKs8WGTuX074EGna9VaOzBA7YixCJpg3TTAmBB3A4KvX+d5/uab96WU62VStXEcU8r396/u7u6IhVhYJKW8DqosRVXdzcyquZofj8e/9Bf/L8Ha7+/u/+0//id+/+/9vcF8RCR4igiLSMrxXogop8TMIolZmIXjoiTMzEmIiFMiIpJEzPEPTE0xpSa/rsS2a7H/2JxkncYQWL0JdXB3N4M7i/yHf/4//AJrD1El5
wQ3cjKVIadaqzGEXBjClBKnRELBrcHkzAjmnUJBhxOg7uYmzIk5LiBqujszuUGYvBFkDzmdCNKVd3d3NXdrahm4TQvYzfq+4VXfop2sK8QpYJa45EZ53WvdG2+n3UHxL2nt6841/FM16kTCbz+JJ//jqGB7/abfapOLNrm3IR8OAAwCwDsi3nfbSlh+URf2fP3bNqW32/0ijuNEoUkF1XV4zHkjqPEkf4GPxOlnAHCP9w6HKwBd8cNOiZMkEWEiSeLmgJt5tepdQQnNbj1sLAxqWmLI+bEwtE4U4GaotTodf+3X6vl8/c3fnC/z4zefhrufH773/eHNQYIpJRpdknl0jAnVvFSv6g29oi9BP//46jd+8SzfXtiJOKgTeHp5hQec9jl3fyF4fakXdPvlyytDvQ5RqjOS1p1O+JraRkQMJzjc4A5md3NQJQI1NUnEhZAYIiRMASH2RwXd5NDUzdg81P6gtA5YYCdtCphSlmHMI7gSmaM2imnmtixmXRwMZc7Mq3ngBOtgCcZkHexpu+XbCfeqHXxOZAgA+Q5F+5YZ/wz6c8TTvd+8q77YNvL6M18xs36lr2qLA/CdvYlIEktiEWHilIL3hcx8o5TeYKudIocFjdzjxQFxImIzE6GQ3Aje0N8wt1kXcdBJCbV9ayGrAQ4iSUzOaaCUnVMFw+BmbFAnoMEDtdaG4TiqeVXTb0Wets/b6sSseqM5TfpxC2YVX3n7k2HmTOTm5iDAvOMQ1Og0cT9iBN7r8b9SW2XieLVVMl577g6zFzwk3fyReMiBeBkslSwM08WFPAlyoiFRTiy0bt92zJiRE/G6Hc3JXQhx9hqr7dKDs4uwO/N2tL0JBwQmuLtWg1s8RdrCk68yHpF0UYuItBRzZ8BBwpxTipsm4f3k7c9bCBD4Erv9BY3/CYnwTR9uH3erhf2qLXpu+x9xo1/AZ+oXEch3QiNeHEvasetv7UZf8V9i2GoK7y8eDpH7xtdXYuMrMaIvCi6dBzAzc5xYc1uVcuw4EAkLIaXU+LSqVzd3M4M35YC5i5xdYzC3YhqHkIhgGgwPDitVrwuB7/7Ff7Gcnz/8ox/N5+vHn37DnL83HI9v3xEDIU4yqbkImbkIqdpl1j750Uf9bA43xatP9i9pvyJf7yL+9hD6EnXDt3P3b2PtfTBYWVp7xmdNiITabuv6IXmwXwB9apoCEGwmuDAczk7EYHS7XSIS9iScGIkDx20qQt/+4u4BD5qZqVFsLnLA4AayECIISDmNIBdFEgdpAwvMVM9WtLbhDUlSkqK+VM3pxi+CyRgaQkubmV+Jtd9O5s0l9O3ffbF1vr5KbHRzn05zGo/dlrJzc2qHJy62/QMlSc7B0iXlJMIi3Pm6vyAm/c/Q0Fb1lDr3JDiIGqkOsYmoCV7SFnJTP1Yo24wUrqpaG47CKZOD8yiSjVJxNnNzJbImVdfqcLMVIEExL2rVfokG1bYKOl93izkj7yc02LnDTQnsRmC4Exk5KTHDACYYrZIrrcqMx/tNS3L8Inq6R8v23H1bv01/1y7hbe2GtVMAj23GfVPN4x+MCUKQIPBuMIUzgRgkzVpiAaEAtpsIDuG+iwTr5m1TRtT76B7Y+rLMbpazCDOY4qd7KCNuSp0yMJHFDVei07f7i9FhE9PWoxhT7H57jv4pufi3NdqjBLTpVL+y3t4Z52eXbwSlE+i9dNf/BlGcsbhsk+rpc23uCzdfNYL2pP01wa6/rXu7H3jw8+01tsGqUviLtXMzU7OmQrvThixj4xCdxzigZmTKtbq7Bg5oZu6h+gsYXVxw96qKsM66qzbWvmkfDgBqXs2FwWlI4/H41TtJSc0vz+fT9XpYJoCcGgUgOBPASAQwJSaT9Xi2B93sTAJT42VtkjuE4vuZDvm2aS6/3PaBvtkacY//xGm7tQJtlr9t1+xW6xc/aDW1+vbJ7fe+ekD6esu2Fx0AkWET8i3cGkTQB0x934KaIkFJOAsxwOTuUDP4Ct7FF
m1MlNoRC0JkjXGDSimqNpe6lFq1Wcq7V6SDXBDEmUDIiXMWQFVD+NiNzo1gDNtGv8KtXc7dz8WXPv3iB71929z3Q0a+Jx3rMafdDnNagRIAsBWe29lH1gWxjTASpZRyzqGtpySSJOThdbX23B3tTG07zoPC9CeHKk9MIowmTYYLaYNwmcjhK1LmgAWEX+t1mpZlWZaiapDMLCBxYnV4DXTGmMgciFOMhg+FpFHNavO++CWT3qll4/HUzlD7Rw2k8p0Q0JFH+DaTK13dWLc3KedWevft9L3sTdMrXvxJN8RvpRD+mSfYC9ZuDCMycheyxO5sQi5kmTSxZbbMLgwm0qpqC4HZnIkTMwFaC8zIlWDwCnMHe/NLd2NOCJnOw3jZQW4K6u2utSy11uenJzd9dXeSITfS3fD3hvk3WY+cmZS6IGUGuDDcXTWEjK1xiBgbcVmb99N2s/J72reytX8m/H5/H4f17fArUOpdP+nWPkBmFNA0dS1mx+z7m9BV9luJaSUH5L8Akn9xn91QXl7TFb3P7/GCJroDZE3d3varO8xdNxLjQFFdammADQTcVYFGvEFM3lw43eCu1czDpGeq1j3Sm2+HMDObNn5f58lWHx83D0Cp6R+tqdqilinx4U7y+NW/9Pvr5Tw/XKafvJevv0dfvUkpp2EIywG8eXt5ghjMQIRSrGg1g5nbbnRokPVmnECnHH0ZV77e3v8SjPxbFm4jMyFHrdKkrxv8W+5wS2Juv9o9o6/eDTyL8Hpr9LoZ0IPsdiipTXb0QxWuKaUxSTgrmUFCW2MH0SAkTGNOQxY3c6umZlrhROzBXEABigbfDb6ucMANbrVWY3u+XstSrsuylOpgUBhwEgAjZ1giI7KUkjCPY8pDZnitLjcz5YTKKP1ItimhPm94MbFdYPtVQJdfsCLrEQvJmJpYvqo0eEHf0ITnrkX0/7vbBtC3u+1crIkO43g6HYP7dmP0hl1+prW/6GLM+DqQps8nwJpJmohYJKFj8CEcx3szdzOttdbler18+vRpKeX5fAX49OogeYAkI1F117C1NXYbAsE62uh8VQvufjPDRJs/zX4sjalbiNwEYzQ8Izg99wtCtiGELkzU1EQO8eaWaRBgdHtifuk6r0DaHhPCTnla6cTa+bV9QWuHx6j6KzlR15LdCEYgJjg1lZzIGGAYERkMMIKRG9zcCBQsw92ddw9aN0D/j5tbrfVyudZarpeLu58Oo3vy1cltpy120Wm7YYcsNon0Mz3YGztZJ2c3hZ0o3Z6I3fuYyM98Xz5r+w+/dH59W3XcqDFbz79027Wb61g+eyz56irwEhqITbnBE7vLNlbfFZ1vfXp7pZdT83KA3hnv5/fYWNXGyAF484imDj69IE3ubh54EoGIVAFvCsvu4k7VHIDBQsIOLdnMtruvZI7aneOCkP2BYMZtuvqdA8+Fg4glnU7MhMWNFiepamAjM2qMqs1Wl0FJmLQbFN1367/OLW1LtvoHo2kwNwuw6kS/cqQj7d51Ka4ZBJu0v/qld1rh209jnr5Fsbgdwku+vg6tm6cdDgpyQO0L6iGE7fCSuXti5CThimzsGktGoGbjaz42aPpUmGPcrQPARH2VbQMIqM1YrHMpdam1lFpKDb2BuFkr3WBm5M6ANPku/O+b6XUbmyMIoTd+EIvundl98UDFUL5IGr595V7eokmxjdl4P9f9Lr7CP+21wWCrSNHNYF2tANAcXDYzHxECge+Ndm3l64GVUJexX2wAwmdUuCFizOxY9XXa7bsNeXY3U1WttZZSa6lmTuTNE54ZxO60kk7rk9Mt7HAA5kRmYQH4bMIbRLfB3evzw5ru/ctAoOHOgMXHTZDwMDFg3XPkhg3ciY27qfIvlzUsJTuiSp8doc86fkM5OxN5ye/2rN2FLJG5q0PZK0OFVMiETKCCyl7IXDglYmIjNuGwqYuwEuBUjYy9uqtXU2fyBCY3q6oiAg/Nhpg6fOkOQFWL6vn5+bd+6zfLs
pR5FqbDOOSUA5ojIg43Pe+2EKNVvArB3F29LaJFvMPuuMTa1L00sL5tE9+8Bdry9j3ethz1Zeo/X0XyX0TvsB0dbPfZAUNxAulLP9n/cPWyoY4BEXajc3SzR/t7vz+4vzYqsDGR7sPY+PWOoH/WaBvynrTdKuj76dhphDspswmwhH6WzLqo3aUxd6jCdL9P1bVqjcdRJSaOwcSM0K3r/0rvTHXF2Fu0LhVmFrcIdaPQIz0Af/Vw3wRYGIH3xdQQg8yIjFDVhfn49ffJzF5fsdT0+vVcraIGiwgvTm74iDOQM4mIMOXEtfpS7IVXfxuC07pwtwj5zYr0gJfb5ttl3+6f0wGaiAqzxi/39HRF0fb65kunxm9vRJ8TciSmJI1ya2gO1FQ4TsxEKQkBtaiZgg3kp0N6/eoYW7KqwZegy0QYszTbL6Gir5zWoCKNyxB5j68CwEyJObEIJwaXuZr782W6zvOyLKVWahG8xCSrBsEOZspMLBxBtzBj2owLaPK0MgJV8O4VjSbE3AhVXf8Abk7uP1Hb5GCgI1fdbLGZurCxvJ2f3cZy1tO3P56+JQIhUM5pGDL3CMOu5WI9dN1Pnj7bdV2G30EC3haRWJjYOYKisMq7sFX2dg9MbSnler2eL9fn57OaGUiYUkopD+AE4uqkBkJgtBQGduvKgDt0/dp3LrfRuZXgxMYNNz2Cg8yIya1LLO5McDMWgTuLOIWdiZycOGRwAoV7nREJEyLkywFCozbcZsbRyVaL7GhTFtBFt5NiPZXuXdTxXbcNAVS7twH/Ils7dTjJg400d8Dtn9umuMOa8O3W9L+mEjia1h5Pb9NnZkHRCbsT0L91d3Uv3aZiZUksqg1ZudXiVvlnlUZvbA837Pymfa7Hx7CdwLtd315XKbg9L+jmjo2FDvxSAH/514Zyb3Lbjlj6C2Z5c5ebz7vy3Tr1+XM3DymiF/S4Hc1QGPec2Ds/WE84fTZtt/e5fehubLsLHK0zvm7bvj3pxW8b1LK+99CqAim8eXKzMYVEbaH/gcDsn/VrG4PvGgKpw+5whZL44iJg50y2WQ63uxNJygyYAkkp5ThoZgZmix2+s3UyETi8xNnZuKN/L2Z1x05p9Xv4XAluUuhnH683+hwGfnkDIofbCpHvl2SVYbugtE7u/rrPHrHONm4PYH9gk0Y2StpigwkUETSA87YzE1NO3LlBGFsa1tQ94r0BfSHKm3W21TjQtpir8tz3mKqpW6laq1U1VeMmDFKHBrhpH9imIQAAejmzm/F1h8a0I3/jsdjV0m64/SePtmkExFdFI9CE/tdL/u1wc1g/aTuEC/3ExZ/tf7uOEW4R61Vwitf13wZovzgou65QmxcHOvyOvQtG74tHdgFrnFnNaq09lNHRXPhaX5yIvFO7Dl5vvd+Eim+jaTve0QReNCHNKLz93MiJYWbEzNEtmBO7kVE76mREBFNnbpvNujTX9l5sDdtOV+uA7dE3X3/kuxX0XT/3mnrM1oYo/CKtHUyUunOaMQnBYLBKBoayK3mFgZ0E5K6w4g4zYiSixASCkiu8wtWNHexKMLFa5+tVRMYhiwjcyN1NHU4EFq6ml6Wc5+X5utRSEoGY1KgaqoLYE7k02uPukRPMVROzVa21FsATM8epDivqrWUFbrCKzxvBETtm51G/Q7S6qLOhlkD3buyWIbTNue3U9d5f4KQ7hCXEuRuKQQjIwG8+A7pw7oA3i8mL0dnu6s+Ie6P7O+q0sZTuBrL//Ettz6qB/V7aDvANBLDtxc7c+w+akT1ObJPezJp7smkt+/7knMZxUNWQyr3DUCvBWGe0nbUWTNPsgtQJd63V4c3K15Ajb0E11hXWXWaKPrUO7/GfOaXQwQm4T+6g8ADBig5v4EVXpkgIJM0d1IyS/AI0va0Kw0Hgz9fiS6uzcjGEJEG7Nd6R3EYT+twFEugrsrgqe7sNFNaw+LbdYd0qu7VdO/KSiLpbLVrmZvBwd/eUwoRNSSK4BgSIk
3G4o/mYfCB3clNzqKAC7s4AQStgRS3ssMtSIlQaTavvqW32M8NEytWtTFKJikPNL5cyl9rctPuIaP0JAKFtexhiq/Jn00+mbKWJrXt5sE/9dtb7bupT9EVu89mHTVr6gvzfPnJq/Njp9if9xAWfxI1W1zGaTcFC56U3j2AQg1ueiB6DvvOkay7uuyn3voOCrBhkjXOlLTJic01r5jB1c6+lRFBDoweOeV7O12kpRVJmB4kwi5nVUjhz+D0yQgzjNlozMLlDXFZaESO89ZMw18V0JmOA3BjM4RRvDDUmJrdMRG5KzO6VmM0D9hN4IuIQ1KFCTLBI4cIgJhGYgBjKYAKLb1MWIiPH+3Wi0HC7nUyybQcPjtktkBbEEu5uCov35lr2w3uptXM4/HOjSiHfh/YdDikEJQhTs6Y3DmTUBZVN8kF/fKjsWgvcTJWCjPZzzh501apqqXUpVauScGowQ/TcV/K9vsaWcKNg5AHRon/XxZz9IXnpWNc/D+Vtx70/a4TPLCYEdDvN/rJbqfnmUG6/vSUQdPvJ+tMXdv29OPolrX07uhtvXSWPm37uhY39R367nz6bgdtdd8vdu//njrrt16tTmd2tm7i5svbQwboSZrrvBjevWjfqmnfvxgb/7AZCZk5ELcJ0BV7QvdOdIlylK4B7yQBNXen7qQ+YWoRhC+wlAmUBmjcYQD3r3Iv5Iya4N4u7sXGjSLuZ+MJ8x5Ru8uUvaTtpohGQ/Xh2D1onpCFysUGdOmK7igSNu+9Yezc9tk3dXNdvlaP1IbuHunlzWTQ0KtukoXhtTnZM7E3UjcAcd/fmuBOOPQDITZ1gtQS5KKW4u6k11k7EbYxt6dydQAY3I1UDqJhHfqFarUmC7rGe68ZeMYB+qNY9skkAfYI7eezfxINXl5TVA6qJXzd83b9w7venC7tffpk0eQMOXlywPtMbawfcdy5y/SdhxFvPYKhDO4JGjSWtmdaoJZh4obhj9fTqE99MWat3K6hPz27zW+9f5JOokaPYdNXKVK3WqubEQgCxMEvwbzYndgohuB3ZAHeIqYVerFPgfX/sZ8hN3ao3VLwHsQDu5GRwDlTQiFrUGCzMwgS3ZoaQNvKIdgt/DOJQvZwYkAZaNUbe7hVL0PF+oCH3u+O+p5WbXm6Aw4xW3hqJlUzdDPv1fcHaBZ7gTuZuQibs6mZalbA6vXuIwSAmZVIiSEgvUALBK0zD38jcCDCoQdXqvMzBHLlloohD7ie+H8asWs/n88PDpx//+Mdm9v2vviJmgztD3cmVjRJkNaJHkoAk7sSqs5mChEisGWm01qVq2fN2N3X9ktaOsCWsOemw7tzt2BH2pAufsbL1xO+13767+vsb7k7bpX7zm1U+uBECQtptrhxNt72RXNyxos07WMo9kCq0OMs9zNDJejPt/MKUNU3ywe6ZjWWvhIuaAESEcCfwncjcWftGPINyW0igjQaFw5uavfAhbyEVQs4cLIXQgEFhBlaVQzuu9mL++/ln9hDidipVpyONGhBArjAOwtFVOXVTN3ZTaHONdWKElxx1q2HAn9Qcl/dzRQADiYGELDfsIdazE5am7juFzLztgi9Lndsc9ZuxrwIKyG+Wu73u/E87d2+uATtxqY+cHDAic5DDvENXjbnHlvDGRtsD9kTJy7LM0zW09g50B65OWsFMsMhWtRqN4VqX+Wruplar1rKoNVJWRYio1ohzjrTTMefd/8LX6KnOkENlMbuCQLQY1FHUzbm7Ca9SFK3DqGoEr7TGebuZq1ut5eYMaEFdNrm5U23fTvheAt6vFL7E2m33h28/9nV7roSo37EJ+ZtJDf1Uuu/U8c+1dqfNjtEPaSRXetFWy/qKwLeu0Nq5uGpPtwDA3KuTtXglDz+41hVzVQtxHmGFs0gceUMzi5mD8zC+O46mdp3nTnUs8g2Tm/o2I25GwMBCFHBaIzrm5rBBZDcDdp2u5/NZiJkosTCzMERCkYj4jERMUVolCUd62biuS
iIiYenxe2tOJSZiltRuETFhW1ZaYpYGCxKDBCxt22xWjY2HtGXvDmSIbMjBzrW4m2sN0dlNdbrs99kuG10Q0FCVI4o9sB5VD6bSY0gISmAi425rYDIKe4Ort/D5kH7anJprLYs7zLSd7t7/UUciN63zdL2cLx8+foT761evBh0NcCKDqbm5uFvERUVUhBGpCpjdqpsaE4Eb2zNTrWa6H2pAB5/t27ZJm3bSN6lv1iN0AoZt227Kyw3/+cKdva8VujbdWOD+BL2U02JH0v4+WCmnb3rt/hYNXMF6zlchxXfce6dFdKVsjei/PZYvh4IdidrNxU64DBWZtk3Z1fHO2rEh5+3zHU9rwt4K3O4ChUOWpJVkEwBuOawoRcIZNXcvFYoO5+1Fo+BycA5Cvg3Utzft6tW/JNg392VucAIsspo3CLCdSF5dp6mxdvbtlv32gbGTRA61/dr556ydmsrT5v6X8PV1oAS3VUSNXdzvGVft8Il1gqgzCFp1K6L1pusPzNrORL+5b0y9vdkdo9a0lrIscWXkkDRCLYUJzmAmQYDzDdYluLuWsniwdjWtxcxVYQBqQShzamau4QjWVESmyFW743BNkjODy0IFoMVZw1PT18oXO3Wpn0zVlwhfsxbt8SR3qEJLm4PGeZuIsuP/26lZGfSXmuOFh92Ke8XU+i5txHbugsGuGsF+5F0LXQVr72segOiazL37gZu9HPXKzlf1ch1BR3+oP2I7/mhnntTdDFXV3JcSVvPG12uNM9WPa396uOS3zWPuRDmn02mstS6qZhYSdDgOuxuvu9DczYgo0suHBaHPA5tbks3A5ebLPM/zJMRMrMxMLEISezIRE4lU6pVKXIiZg9WxiDIzs7KsFzR+HV60kiL3LXHciIgo6iRFjlYnIWKwgGTj69ThtsaS4E1HMjODGUxXdo66wNS1Bl83q7os+4W7BeTN2NWsuhWySqauVZeFTL0WaEJ1h6IyCbMpu0a3BUZWAbgWV2s+UE30N5Ca11IWVb1enYhSTiThuQbOGSKXy1WXalWF2cznZZHp+v7jx6JlSCxM93enV/d31raGBmnQwmC2unhVZyd2ZbiSW0VdoGV/TnY7u8+e9+OzU9fjyuCHLw6n767Bxrh3H9Lu691/N1lsf4c9BXzxdt9R9Ki2nqczQAnTG8FlFadun+3UXeC9e9HddLJxjRe0hm7erqK475FwpjUFl7tHhqI45xTCcvwz+A1p2SiTN3n0hrF1dM52fhLeMld0c0MnM3F4pUdQeA9d47U3tx5i7gDUt2DeFVII6k7UEpVzStJJA69ywkKLwTWi1IksUiKukCWCYEJDl1XDCloCzcrY6ecLESpcDPb7c4WMGsr4clW+pXXFfZNRNz5CCNli77m9k0xv9ltHd6jfy1YnXN94E1EHhDqoFZdsAYAAuqjdZTmsGXOIItEkIutfEiaiFOn8HFVjn6uaz0tkJugMxKHWQxZbii9CI4Jubps1oUEK5AxXD4iqejKn7pbVtNmGVXbf3133295Bi6TQWm70WteKWrARvFWH7ouxHZ++DN+6kF08an/0CXUHiJq5h9Yvth76jcree4yOw/dtvkr+cReiYRBhVnM3L8VqqV7ri/us7s9xIMwCdu0I/KbN30gz2gys9jxXNStVW7Ud99Vk3FIPxIZjIkC6jLYSZ2I292UptS6x5kwU7i45cRISYlNzkAHOMCMiyjnxCjIE5XJ3kPDmLKFmz+fLw+NTBFkmFmEWbqy97UbhThMoiTCTrMVigk1HFZkUaa0zEVU1dSMSYkl5OBxP1GTOJgEwJ2IWThysnSMJq3Q4pFG3MBM0U0oopR76upkWN0Nd3NVrbTnyrU7Xab+Zblm7K1klLWSFtJAptNZ5horXgpqcDc6UhYzZVNyYKIEEICvu7rVYtabwtzmMoINSyrQsdZ5nd4zHg6TmWeBM6j5Ppc6LV00klWxaFgV+9uGb5+vzmDgJvXv71uFhnHOtpcxM0IUgb
LW4qpuDXchN4rzNN0BZI6t7SGrF0v3zIOH98fG9PrsTXW/I845gbh/txHOiW11mU4peigL7h25X+8rZWyIH1T2JCUZqa2wndvpZnL82273fqxpPhI0B7bu1TdQqAd0aucHWvrEG1SBiJSR0wJUT7KjLxtrb57bnaw64WivTtJ+AAGLWmWwSNlOUdSHAwi/TNLgGr1L8fkrd0cJFeuSGrySyid1RCmIImsdCLSRW3Sxmr6pFyF3TLIjALfND72ooRN4RuEhfswoSPYf5tnKtGuOuM60/jffS7tJf1npKzK3tbDPgbYFXCnoj02LV2Sl8jyno7+bXtOte/3lkEGPELjRfVa7d6KzvBCWi+ISZIlpAw5pLIKKcc0qJqzFT2FnNvFQ3bzBkT3G0E4K421Z7rbYYxXriDCBH3A/gCgQniP4S3I0UMHM1eCTtXPlmyIOqXZDwUutOIHLU6qV4H2xIRTsf+ZWvrwz7y+u2LSCtv9jNeevpirx0r4WVtd/qBv2rHWs3NL+muAUbMx3uZBh4WawWV1crxepLLDB0aWo6ZItZ3qpJeVPreyRba6o6zcu01I9Pl6pWSnVHTpmjSFpESKx8HU2jbfrxuo6OCDmpdZnnCxMNwyiSxiGnlILXOsGJHWQNt2BiTqlVa11dGx3uTnnnvmpmj8/PHx8eg7VLq/3Sq50JMyH8slNiIsoiTBwqfkOImFgYka+NOaeRiC/XaSkFxA4+nU6v37wlImanht6TSI5EPcICFoiAOKrjdIoSJ4tBpA5zmKlpdTPX4m61FphZXeBqwdq1mtbLedqd0Bce8oAE3Yn0IG5kxu7inhwJyKAEEjUqlVWhxk5CLOqkCndSJVNygXOLDQu3dFMRHrIQHdyhgBadS62qnx4voPfzVC7P0+Pz84dPj2r2PC8pyeX8PA5ZyAT+1bu3X3/ve6fj4as3r5lIyMCk5kRuVVWrubrPYiPEoBV1gi77M1NN51L9RQvSxdJndLWIRHWZ/cnrFJm2oI4dfvLyjG4/cG+G2ObcAWrp+YzWe4I6yE+dCwZ39+aqveohDjXXcNu95e0dXfPttt477LTmncPW702q8I21E27vuyMhtuHc3eTalYPgWNatlmtA0Kqt3bL2rjSv2pc1Smbmgfvc8HYWFml+LtyB23b7SGMRKgSHLb3NofEL58G2tgBa4PPKy9ArDnVZv1NY6oaAndizEouWrmL3DHfdPO29uasTOsDR+cMN80U3X918/uUt9YtaW6VQsLePaeu+NQtp8wfdDWs/S8AmF8YsUBdvu4y08deopdzmkYiIqday77I1L+gYKPWsXc3FgaIaFaI4L3mcaQK3YHJz99JdhfoGv9FtqUlwO307HKk2btqi9xUAYmtFxQmYKSGSIbEZIse4tZy/XQANKKCx2RdLh0CZbjizY+PB201eiHNfXr4+uP5mnfb9uWlnssP8vvvN7pf90K5vuyeiOzFSggiGgYdRwpRHYH9ZYaS5MIebdNACImKKWLPuWOOkiDATR88Os5Q6LXVe6jxXNQvrhkg4uTS001aIL9KYArU4AZKEu4WgLpfp8jhP16enTzmlt+++4jzAD5F1PmJOnAktzyb6xvaugnXTvW82hTZJ7kutcylCTAhezpFaSpjMhIhUnIjEwUzFeE243iw/TCJOTGxO5NWU2C9LXZaiBjVXSD5WbmXPKJAEFmOCiElzJXUwM4fm1ZxIqcvhEdvQWLub1+JuWou5d6aubqpaTetcb4wpt2505BlgoALiTqbsmtyS8+g4GB2dMigVpWrkzm4ilB1kzuLmTmUhVaEMYkSBvgJVoNYxi+d0lwYzfPPp8TrN7z89PV+uHz8+fPz0OM/L5flSq17mom5F1eFCynAtk9fl66+++uHXX/+uX//hv/KH/+DpcHj7+i4nqdXcUMqipWhZtBQ5HZzuYZWWiZbzetrdMS31eZqrtlZLjfTEBKSUuGcVzSmnlIZhGIaxSaPrGYq8ldR2BnxT3kKCb
TSGCGgmX3VXMyImkoAoiBByH7vCw33BwAJiczJnB3qIlwJIIt0luwF+qlq0Fr2h4OZQ8zUFNwfy1fJtRsZm3owQq57OBAe3w8Y77t5nbWM5IZKhk3XAuWkSZCAFnMnQzBjUjH89Vm3P4jskG3nfHECki7GmIHvteWGjESGnNAxDQLsdqoaZOzu1Ii5AsPZ+fM0dakA4y3sMKtxrmcntluz2umzCIO7IYtNUPBgIEVrWJG4ijLoBZM5r0l9zK63nTCBPkYgtdMPO2s1Xx5+VynzG8h0ImeEGQSHaeMtnFtu2/cy7f2Wbp2a8ANB0Y3hHZPs9127EoW0azybB0gbPw8xqLWY2L3OU22zmZ0fO+TCO0zzvWURVFF2nOW7nBiOQsgPh8dvELlEIG3EQTDdV617A687FFqPe70mKhoggND90OysauTf3Vk6OPAFgMiLAi5tC2ZXNoRa5OzadeJ2K9WTbfu0crubVm5y9AiCrI+PLJdp3e3fO0KXw/a5Y5YFg5nGSgButvV3Ufda3I7vecf1PHFh3VCEMowwD393JeEgwcjOmapV9Vx3G3U29qrE7EcQ5rB+BFcfOZmZQeLqgmpthqbpUrdWWUpdSnp7nOHFR+5S5O4g6CEhEWUS1TtNkqssyOfzVq9M4ZFN1s+n54+P7Hz89Pvz0xz86nk7H9C/L3T3bXULiiG1ldm+VVNdu12pwZxYQh0UmnFv22Ky5naf56XLtbnQsxCKUmJg5pURhMieWhEhWGBIpOa/1ToWdmCQxM6XMxPz8PE/zPM1lXsrbAj6+ZuYODIBaYTNPEkXeFUzhiLeKHvH/YDPN69BqsHBrrF3NvaiZu9ViblaLaj1PdS+Y3bD2WuuyzKpFa238stbAZGoppSyJzJULQPCwspsQ3LmRdNdSrBkjObLRhs9+FD+OBxu8lDovZZrLdSrXuV7nWhat6rXl9tmc7Bym6rXo9To/Pz8/Pt49PDzWZclCQ04CJOFlutZS6jJpWRh2GJJr1eU6L/Nexr5M08PTs2pVtR1rLwRKW1IlyiknkWEcx3ERkcB2gmGQK6GT4NAghYVTP5uuDY3tDMFRVEut4QxJRJQSMUXNe/YKuNXiVg3kYDWUiG4IEzWUgJRaSXvqSaHUtJTlxei8ydc9W1/THfpBbxa6jSuE9EwG6tGtrddrbOVKaBpP9q4EoOWe8PWWzaBpPf8l3AOTXG3t1hlbuwkC62up/mtVa5ine2QqvgnkoBUB7vJNaHgIfkY7MtZnJLoErP7S1DZfW8mug6/a6ap0UvN2jG7a6urTqFFXX9YZc1gMvj/fsdofO0fcTeDnzb0lJXihzd8GKze+vmPtO2ayDn63xn1YMd6Nzq+mslWbBbCunG0/bl9tliQ3U6tmtiyzms7LHG7qAbK4I6dUlvl6PW8acysI0J6y+SQYqHOoWAOOhDBmDrCTcRd37CZnWlfN+s7z8B24OQjoW61NfE8BqhSwmAMGMiJ3UodGTpeVtTt1rX1FsVYme7t+jli5tuV/JdPJyrFfoGOb5HNzj/V4dda/4ijeBUZqO85XaZW6QOC3FwdhZhJIBievVlC0KKlCrQUb75t1PxhafXaInQwUynKT1c3JHVVdo3aqWnO42gCvrpr4uimJQLWWcrnM8/Tp/Te1lmWZHfbm9f04Dm7qZp8+vn98+Hg5Py/zVZim65kIl8OplppyZUmSskhGx6Kiu6oGBzJ1kWclyfu29mIT3mNnoJse1UGOqgAD5qDIKu/ilAAmTw5yT3BiUjJizOqLYq42LXUqOhVldmYQSCJwVowIyayBj0zMLt6TLW1WjRDUui+S9kSr5hpxRC0xtvu2/27axtrd/fz09P7nPzdVtVqWcr1Oy7JoLWT68PCwzNOYRITKstRajuN4Oh6S8DhmYoiYw8NdgtPQ/AOJq9WlVoUv7iAukFLt4+P58fny8w9Pj8/TZapzTWBJx5HdSc2BgzsIoxCTP3365vr8WKt//Pjohix8dzr++
g+/fxjyq7tjYl7mi9ZSpktZpq/eva1lsVrn6fzzbz7Ubjoys9/5nZ/8v//u32tVB1RLLWZuqiAkSUSNOkcay/EwjofjYRzv7+9F5DAORCQwuC3LsmZHGoY8DGNjTqbBboMPsAgxP18ul+vkDnOSlA+nU8r51ZvXSSSRkvt0fl7maak6Fy2q10Uj5idEcSIahkFEckrSfLvEYWb285+/X1VbB9S8aLekdEw+1IcgVTe298YfN0mRgFb0abtotzPQGQeopUtc/WLb3gpAXveOKxtx8U17B7XcEnH8r9drrXWa5lIWQlSFSjnnUqa9Y0TXLym0z3YfwIH6mU/vXp0JRTWkbgCBiUQc8ioib6o7oSPW4bwCDzTMTLU4FKAWCQJdyb6ZhXeee5RXECIIc1TUIGK30kUDADtwpC9eNSthjm6Z7LqnAm7J0W7Od2aCl6rhqk+tYlBQAjg8UjZRn0PfOTHsEYOdwspETDCtVuu8zM/np1rL9fKsWqdlVjPj8F8111aF+bd/+7f2oEs1X1a3kJWcmkc8DhEERj0xt9qNDBezZt0r8qaHXaiMYuodiKImW0fJgIitaq5+ZESOqFfphEIwwgIqsATLHh4bQdi7fMtrRer23Jdp5KqiVHyJtK5M7Vvkr9t1i5H6Tkppkmnj6Ggw2PpVl2/6T1ovt8vibmjBoOG8ljKdjikPGF+5iH26fKil6HJn9XCZba5cdKts5+6l1GUpFKBIzkhCZB6W8uiamgPqZI5pqbVatbAQU+ydJAlw2dV3437OiPDx4eFH//AffHj/zX/1t//WNF2rFoK/ffvqMA6xw02r1QVwdtVl/vFv/9YwjB8/PqQ8DONdysPbd1+9fvNWmJKQqc7zFBYXIj6eTpIShZ9a20A7hYEo5ZyG3BLFREZ6JggZUSE2ULV4hQHh3EQkRD4kPmQRopGdQTkAWVUiuy6+VHqe9Xxd6nlO55lZmDOBmJ3ALCDiJGCOEFAXoZx6vowWPUbcjB3aqKcpWrYP92aaqnAjr3BjaBgL9jvqRmuf5+VyvgQtK6XM81yWUmtx5st0NdMliTCVZa6lVK0OT0mq1ci3A7iqOZyrMwuJEEnRutRiQBV2cngt1eZSl6UuRUs1s0ZrOAHua3lEAkTABJEsklha0pJpmoV5nmaYRQ68abrUspT5WpZpGIa701W1zNfr+Trbjj3M83K+XEPGiZID8YYiyKGfOhFhpqJaVGutYE5J1FSYhJzcl3mpWrt4qGoRfVvUdJ7nNWpLcibm6+X6fL7EyZSU1ZGGzCmlJJmM4NP1Gqx9KTpXvcxd4GgJUqiUIrJVTe6lyn2a5326vbBohlKysvYbM/BLJQ9NIYlsjWjFsrZf0Pa7lc10K2d8x52iNVt799Iz8pbBbUXlu61yZcke+l8pSyllnqdlmcMjPSUFXPeeuh6hMnWTMaKDvAfYtuadmDUFOhhyi08L/c02bf7Fbykw9gbDtvR4pqVU1QJ4LUs3wcAtqzQ7TpgTmFh4IGYIc9MZPMI1vRN1j/j7Va9FBHT2KKDOjH1dNHRZLAwqbk0C2Kl+7YehoTeLiO0cWd1MEePu3KbFJqh2Nrweu9bThpATiMi0alnmebpeL7WWy/UcrN3MnBOYraqpkYPc5/m6H506dF2ypl+2aHInJ0dohNwlGeoaTOtPz9ewhzQ6voMA51coosWTe4+4b9e1fdoxAocbuzmUSFtKLjcH2W7SqS8edlaA9bG9H13X39CUveYeuPO2z/oG7idj76OzOgzsYPrGyFfuvq6T33y+yqXbV1hl8VXsiEmiNHAakbKSkFpdatGqVrSqN8V9N75uAjMgJHiGw8h4H+MKmLN5hGiZr7ghQikFWg6iQLPDKbVRkvPz08cP7z+8f//hw/tpuqoWImidDkMOjzW4kZsIDUkIdH5+WobFKaU8DsVSHo6nk2olkBOHN5lZbCA3V27FPrmLTje6eyTgxXbUnB0tbTrcgAjZLO4GKwrtG9NAIE8MO
KTtV4S9vBiqo5gvVYvqUitzHCVmIxDEldjVmZmYnBniBHJykig5KURANy06ISxE1mnvGuLSQdlQ4PglLbvR2n/y05/913//74cYaKHb1jrNE4APj48sgSlTnITjYTweDkl4HBITUhgziEDUZCVJRFJVl1ohQuMIZues5h8eLpfrPBVTJ0rDwCNgIFfV6gUddlMt6iosx8Px+1+9+eH3vyI4uwpzrRVudb666ccPHy7XS6laVX/66frjjxdVXebpR7/9s2XRdXTTPD0/PyNOrPX4KncANahbiOpWQXQtha9nkTR8+sTC4zCI8GkchMlWQKQVE/Luyqu1LACGnFlkOBwkpU8PDw+PT5GwkVjk+UzE9NOfMVFmCDm5wo04QdJc6vN1UdWyTHAPJX3IWUR6PFGzlpv7z795X1fdyBHp/Hoo0qq1G62I6m7lQzT0JiM2FYJMsfOOa9Sjq+XtJJgvS1FriSGD0uUkw5BFOOcEeMshYd3LjwJa66nhyUEwWNFFVT99+jRN0+VymedZohEnkQ8ffq7dJd7cP3788JOf/GRjGGH0+4y1b5pMHGO3RlfW8TdSr3Bb/RNbiAAaIg+K3ISY56XW0hEvczci+vhe0HLRe86DCFdt/hu11nEYX796l9NwPL5iFkmZiJ3WaDTUWud5fv/+/T6AeKl1WopqXUE2NNV8DZjh8PMjdDmsMZl2tZqtFMpKCdE1elVqhbsHxaKGeTtcq5ppqbWWijBRUIskDLwkpSzCwsLMWkutZVmWYOrzfFbVeZnNjCUxs5aqquwgx/T0vCIu7r5UvS61b7w+4w2MNCYM0tLS0eoLcruo/bOONa3cMXLPNaxl5XyduVFX+L0pckoEB7nCyVEJCipBut3cIUAi30IHm/GpPW9NbbAJ1OZ+me3pukU3xAj6eVuDvPdiamfL1K0TTdsO/rv9BNjwJO9+H7j5Nj7jVnmsiQ8RJBIxIKHuwwySkJMfDsNXP7zPA8bj5F4eH7kana91us5l4bLIsjPXunspZZ6XlJw5wInwnyKiYECNdauFlaPlTY05MAeRGingAiaQuMPpw/v3T09P58v5+Xz+2U9+8vf/7t+dp+v5+cEi15n7xw8XuB0OwzBkLaWWJed8dzqA+GfffJCU3nz1/WE8HE53OQ+ScLobhyQ0ZDcnmDRro1st1S3iXIJURYKjaGr+dC3DuVUeaiQ6XGRASmSgAnGQInUjDTGTEOUkh5wS05g4SgwLkTiIoNVMfS51WpbzND1dz8QJciBi5hRmdSZKUpkkMTW8ASSMITmYxoFF+P40DIOQEtzrjDLBHaq0QTsabu7kHgW9KaUbBO+GtV8ul4+fHmKE4dZqqkuZ3f2yzNQhrwj2uS7LcVmSyJCFQTkKqEf27ZSYmTgTS1VbqlJKogCzs6n5dS5zqRGwFl4EAIXTQLMoti4Z3ISZczoeT2/evKllma9nREQNeYhpz5fz+fm8mFdDda5gVStl/vR83Zf6CQYccleX5tvx6RpAM4yCSF0BENW5FGGelyUJux1TV/6Cs2tLitVYu5aFiMw9iZCIA8tS5rkQEVjASho3dwADOxMSkzAkDylTrUEh67IscO+ZysFm/Zg3q7W5T9NntvYeMUqdqTf1joLD7bQKR8/PZluEquvK5vvDNrbmLQzD52muqrVGakgHoMNA5D0hhKtWNJtCIzfWmqspCM5ubkXnWus0X+dpmqbLPM2SUgw5Md1ofu7TPJ/P503kaFz4M9a+04zh3da3185bvkZFMIaWTq5LvETghJ7/cp7nZVliq4SERMDCgIcs6DlnESllKbVqraWWw+EkJDmPcBZJLJmIIV3vIyzLcr1er9dpPzo1LVpjC3WREdHDlFLE7hORu2zaLLyd0I5CrdxFp8lqLWWppdRa56WgD4FZAETGvlqrqZZSSynBY1r+n3YEkNPAIimJsFRtZTXnaYr9qaZlWcxNVJlYa9VSCcSg8Hbe0VBrRpMbe6ITQcicoC1P0A1hW
mGL9bVhEj07kLest52jrbOCjtV417Ph7i0fLJpSCfRykYC6s/b60+iHxBuCsFfyApq54bBFPcJuOmvfK9/dprDXsFem/ZK1b5e1AW6zsBNv1gcH146D6312ApmBe0DoYA91zwBBEqeE8ZiGETmzGgMw86XYtGgtpOo3AbUOU1PVIBBdUwzH24ZshNysCgM5hEhouxJwhUVQEodvhQPXy/PT48eHx8eHh8dvfvbTn//sp+H+3YUqW+arao2CdWVZlnkahiEJu/tcKrNwHsayVNNhGOb5UuvMlLPStgphFnRzgwFMkbTAb4OffVGbSovL7PK3w8MrmAxUCC1ivsuPwszUKncmZocLM9iEOYWHr7tHEJNq1VpqIQGRgjy8z9yciUAceBg5mZPtEmkxSxIfBx9HhG2jmKO4Wbg4UXd1AgBFHzHwghzuWTs+PD3/6OffCIdjQsyGlroQYTgcWURYmCL1rp6LDnPhnmVilMzdq4Mi4pgTsZizQyhZWhKI1BdVe3h8XkqtVdVaYJiF463aPC9mFuGV92POwsPdIdM4DjLP17LM18uTDvn+bhAZvv76XRI+X57nZV4qqdJzwfnTJcjx03xTGTQNeTgc47h0kthIXjN+9apS6FwenforHO6lqvHqThIJ9x0mkiTlwc1qSsx0f3eXUuKUifl0d2/gql5VnchJwmIM91omaC0wgufBs5E6UkoAsSR4g2xaIYHm5uQRDqHudU9jEGkwtQ8ltObwzTJ4BZy5S01r7HNEOEZWCoCj5ExTbs19SxQTJruiXkr95v37eV6WZa6qEV06jofT6ZhSGocB8CgWoKruiFIqQdCbf4NbtWquS13MdJ5nVbW6wCvUHFLNSq3z5bxpfmaPnx6/+dk3X2Tte+LbSGXjBI6WQXhv7nQ0sLonPQ0Lf2ftTgIK+g/tJaciXD5wlHFIjeI71M0IGlH9RuSixZ6fzsLzdImgF2n7pFlCqSzLdZo+fXpYtXZ3f356/Pjh/TRdyrJorbVHTgvzMI7CMgyZJYrSNP2sBQmqlVpMbSklzAZuulzOWuZ5nsNyVEoJQQFASBkbeNzfcE+/s5XsBIkIMQ/DKDlLSpISA6fD4J7rmNxtWWZT81K8avXmfcCEYb8tgaK6lNJIzGZIp0gezFExqwUFdexkW6u2pAQwtbLv1HFyC9zdwt++sci9hNBxpUhh1LZCZF1IZAw1r+ZL2xQAkELb94b/NKt7f5y7ed1lgXTHZfbHqVngqeWF8r5LORTxjX9vs7KTs1dpe/+CFVBfX7Y/OmNtWomt2wvGqIAbzIPuEzvUYYdj/vqHh9ev86vXSOJW4NWvD8vTh+nxzJdJHObOi23Hyd2meTqfn6fpudZlHHIgiEky3BA5JMjdfJoXM9y/eTceTg4Ox0Uzf3p8+K1/+N9qrQE7CZM7fvazn3769FBKWcry/PBAUUtMq8NDlyvzVGvJDIHN8zRdp1oLADO/TldJ6f7Na0m8zKRWHh8/fPhwGvMwH46ECHbjPAwcACBSKKQeyc5u1+5a6rDU8C9cGbs5WY9LNjYQSVCJjpQ4kbqXhtm6sIEgQkeWJDQklizTGewqrmxlyOnV3cgsARNmaTK0iCRGYiTxIbswjiOJ4Di6iB4PU0rkrK5GyZFcFcVg7sXULDzWI7lXi4UuN5lObuu1n6fp/eNzTkNOA+CRxaHowkwnyeJIiZlIq5kqVxUqgYkJy3EwAmkQQaGW4YcTKBEPnCl5daJaq5k9X+a6y/xABDVVr1W11MXU6lIJwMhJ5DgMhywpsWrgQzPBVAuQXr2+G3MeDyNLgpMaVdVlmgEQ8bVsKSxAJJLyMJgZWhaGFVHexJ5Vkl61iHg1gHrIcigdIbzAGOwRLAE3ZjDR4XhMOYcr7jAcjk5LKT4XD/8cIqQE9zq71cjLa0binMDCnFg8YrR6YnIiYm9BZk0HMXfb3HjbOTRT7qw9In3catiJAHMGwYOvR77UMDJG0kfAhTbnLO8Wh/BFC
LF3KTYvy4cP76/XaZoutdZxHIdhOBwOy3JKKY3DAe6mi7tpre4ePoApJUlSa9P2ljqZ2VLnqDLggGshr+7i5lZrmaa6TDvwBtfL5enhCS/aF8qi7VdtRWpfvPrKIRpC3XXhiG8LHuDNXQCR6jTgfeHIG9nEY6tO1AJ6YURgU5+uM3NZFiXq/nLE6BGSy1KmabqcbzGJ6Xo+P12en6bpWmupPWFkEjkcjyJyOBwaKWi5FkLqVlUNp855nk11mSfTOp+fyjzN0zRNUwDyqwbc+FofMjd8kEU4iVDPG9NTbRERlcMx5WE8HsfTXbe5YEBys8xiqqVVmWjuUYxmm9v2pVptmeS87+dmCuLghQwmSHPPon7++oKiY/XRt8as19u34tY9iUqPg0TXeru+udq8icDkAuOutRsUUIA3HG/Tibvqv6FmN5nY5+rXpZlBI4EKaPU0j2fzSmDWIe1Y+Kbixp5aLezYcff97zrq0F69dTueYQkGmMINUJDCiQ2sPORX7/L9XToewYSleFVfrvX6tFyn8bI4iYOt7jEJR1mWeZ4eHh7m+XIYx3EYch6GYYCZaYnMrmp2Pl+1m2YiUtvdTfXy9PDj3/6tsizEXY52//k33zw+PsYmnK4XioCY8Bdzc9daAyJKWrmWsiyzu4tkVb1cLymlUpfRhlJng16vz09Pn+p4gCpH7tZg6UjwIeqPA2Hir3vWbvBFbdamMMeaB4ZjoO6B7EQgibhh73oDeQRDhUneiZUSaHS4c0oyiGQmhpEruWb2V4ckkiL0KzMxU2qp9JDFhJGzp4TTgURoHJzZczIWN6iRxWYlp4bEmpp51aIR/+am1v5h13ZaO1ANS6vtS8zMIoSUEkuSu1dvch4CjZknWhS11qWWlOQwjpSyHF4RUVkmM42iTikfOI0smeUAEuXB3Yu7GXEahNithrJDADMxRIRAMDVlYqYffO/dq7vTu/vj3XFgcmKfrudPA8P06elBy+z265LGu7vj69f30+Os0xJxFwBAVncSKABJKeWhS/JbOJY3VXfVWRod2EywcDdjQFodAFB3QA7PvmEYXr16BbjVAiDnxMxqMHdOwjVlMCjZmmY9CeDJ1TS7VrhKHtMwgASSufAyT+Q4HEcRGfLAwqZmbrWUZVkiyEOaFaOtXi1LmS5wJw+m3RJ1uqnVCfAhBR5EcJRqtagZtK4gFoT3yTFXs3UwSFaz67wspZRlMl2Ox8w03L+6Px6PqlZrmadlulzQEzsv82xmd3enYRjT/d04HJKQMNW6uFF1hxaY8ZZ/KkRkZ3IZZMg3BRip6yXbJ3T7PTbtfGXu1H+J4OjUPuVutV053Ar3omG83LaAk3mtVkPYSSmdjnc98RZFmsmmF7qZezcir6hkg4NWpW1MxAc+DId1OG52ffj49POfXM/PyzzXutRSmpJNPA+ZmCMntvSKc43uNglP3bzUambLPJvW+XqtpZRlKaVoz3MXnEmwJeWJFFnmFcxk5C4gIiGE0wVawndjN6+LV6szUxtyK7wR2QjK4loJFtgE002eWQBqxbR4w6sDgwSFfYhA5NVB1GKLmqiFTepqC+yOoG5bbAOhF0cIzfozhAYbbybA1cjCoCrAISMxVSNzmqpbUQNHuJM1q84W3d7jO9DcGlbFGijV5+JrZHnPoGDYdgBWrT12qcN9LfKwVy2AANK7gr4nXy+19nX7O4qjMgXP4JwyHMtUqlqFGdndke/u5d27w7t3d4cBcC/L8uGbj+fn6dP7p8dP04KTAwpzoO6yIKvW9x/e//SnP314+DDPl8M4DDmHXqO1LNcLyEXIHdNc3DHNy/39a0kDSyIiZn5+fmRYEuQk1HOAvXv76njIsUylvPneu3dm1nL8ucOtLLNpFWFhnubper0Gyzazu+WemY+Hg4iYVV3q4+MnSXQ6nOrdDIeqEjgNmVnG8SCS1Cwc5onk08eP+0ndHDzpZpqpZfchAhiU2YQxiAixSDOWC4OJkhAT5eTCGNkyI
4tncUI1Xep8nZ4fB/KRvkoMMgOQiZloYEnMOfmYPWU6HEgSHQ7MgjwQM0l2ZlglNySCOGpxB6LMucOK1qqmXWtX86LfwtoBVMfSc4ELyZCEyBOnnPOr12+HPGrVwM0xa611ui7jOI6HRDLK8RWI3KlqCVcpGY40nljGlE7mKApTK6buSjIkFleYFe7WGyFxZxZ2sypIwj/4/rvvvX3z/Xev3766q1qqLufnJ2G7ns8/+/Fvl/lqrinx6e74urz6eKm11trTmPmWF6ytXUopD8N2ZHw7eU0Z34DT7u+zCs9aySPH3k7ha4ZcPhzGt2/fMFNkJA1kIjKmsiRJxgmc4REqQpCUgEh3X6HFTTllkgxOkNzYDdPxeMo5h+IbmWVnniM1jbtzShty6ajLvEwXrNERFm59xU3rfCbYYZAk5EYAzXOZ56rVSwnvqsibQESw20zT8QgmLrWer9eitcxXdzsd7w6H8d27N69ev3p4eHr/zcdlKZfzlYCcBO6Xy9lU4eonvbs7jkM2k5xkWVDLBeaoi6sKj0xsMA+Q3EwIMsiYZc+8m4Nt79SOTm7IysYGaP9hlwu2wtKBNK0sbl3KDR9lJEKQIjav1Qoc5pYln06vRST8V0O7bXfvFvqAO1oih+aOsObmAzINeTyMh23tTC+fPjz+9DBPl7rMtRQtzcCPFuzXxsu7LqMDDyy8qpVh3ViWqlWrrmZ7X20ucYtwiImUnA6YgpjMY7wCoPnMM4NZ2dirlalce9AjUU6ZwsUPsIhyIQRkRQS6sfm5adW6rEvT9W9eAZNwSTbb6fQ9+VBfmK4uUcQebuvLaP7wUUrnRt7bznh3JkZL58CMUXxIpE7qZG6lVncyWPd473PaWLtttMJXf3+4o1QspTPcEG28hVh29To6ZQ3zp7B7rex7PWxBBjWwufVxfRwrht93fhsROQywxJQkkaThcHAnm2xRKKrBhsP47nvjV987fvXuTkhRL2Uu73/28fHh/PH98+OnYoeKAequCD2wPUJV379/fzodn54+zvM05JRzqlVrqcs8PT89EHA4ZBCpOsCXy+Xu7tUwHobhEFm/lunCUGaMQ4vcBWHMb8xercJuZO+P+Jc45BHiVcqitc7LPE1TVZ2WamZFFxDGcWTm67yUWh4eP5Y6vzrdo1RVm8MDKQCpPDDzsiy16jAex/H44cOHDS0DFKhdDN+n6+rXGAMSbFj8NHAWyZFrnkAAM3IoeOxMPgoltoE9izPUdakLpiecEo1UMgNWAUTdmJFrYj4Mfhh9GPl0lzjJcAQLSWYSMBsoYAQURgKW2dXcyTBVcyuRp0bN3CNDf90JnXiZQ56ZOOU8jodj5IV1aK2Tm2vVSrU7h7u5E0seD+PxeLx7NYzjeDwSsTNVrUWrmRFnhzjYvaG+4XRmVl2ru8YSRgBAOCjAnFlBnkYakhzG4TDkIYkwCadxEHKr85tM9ClnIZ6v0yVnAR+HkcyX69VZnCUUAKOb09DE41VEjq3leyn/xfHZPuwkJuaO4J5yTimFX3TOchgHEEWWLjMHSCDEjrmomq+xCw4mHofMTPmYyb1r7UPKoxEreJrmWou5RxqkMHqHysMiKecAvHIe9tJmmafpcjZteYsCindVuHmdCF7Bzi0upS61LhoVfqmncGu67E70oVVJdCNAmB08jtncxiENA49jOhzSMufjcRAmrZWALAJ308HN7k7H093p7nQ8HQ9mVrXmxEyllExemgzkxvDIcExGDXa0m5K1wTCbsNUrsgauELllqRe4o5fUndZ1Xa0vqw7l1PXrVmUkPkMLirFYamtgciP3m7dicCWsAL43Q8ZKPnYsuLN2dHVg6yBJysMwEKyKWC5as0f5VCJ06YF6rDx1Dt/wZ6Y+NB+XopGZauXrK/MIpzxu6bKpJ/2OSWQiaSbAcK1qOemIKKXMKW04BIGIJNSyGF6qFg5EgQUQp+GwjtDd5+vl/Py0TkiTrYSZOaVMzBL+//3mTbQ1atgYX
M3DBLaXw9bXlrlrdSH/whHudYIIiQiDM3jIchxglB0oWp6uxQzFFnPUlgJkBeI3PB648bIGoIaqfWexwYyhCRpJvcKfizY+3beAW/OHcuoRe9S88HsGqU2yaKPqCwlEHMf+UyQyI4UvZYG72uSuw4Fl4Ddvhq++Ot3fDUJw1ek8XZ4vjw/n58cLkPMwLJSqQtmUbiq/mfn1ejmfz9frdSmzWaoqWsM9bInMAVWVELlIvASmSEzEbuquWmvOGUBujtUEIu4HJHCcMMxH0s92MN3gLiKqVVIKzTvXamZq1YFII5aHrK7Hw2E8jMMwdEnJzb0FtkyTO+ZlqbXe3SvAL9YutiMD1CqdEhGxs1P8ARYweWLLRJl1YGT2xMatlDPlxEwUvqeJnRkiECERTkmY2M0oMpsJOwTuLW5dSDLSQMOR88ByEEksQ/jfU3jrdyDRjRtbY3ZhE/HknhJ5RN8oyM3rzvoM4Ja1E3OWNB4Od/ev3ohQFqp1eS6TVV2W2T3SMHqtWtQk5ePheHd///brH+Q8HE93xHywV2Z+Pl+WsjjEnc1YGdWslEW1LssUJkILYxBMhIVIIIlHImOokJ/y8ZDT67vT/elwGFIWGvJhGNL9ON4Pw8Ph8P7HP3azp0+PupTE6fXpnlSvTw88HuR4Z8SVSG8h3BV5vl3dJut3IrgD23bAXoNyfZMWhuF4Oh5LKctCp+N4f38EcLlSuI+pGoEdhPO0lOpoCBoRMfP96TAO+c3dcczJtLjp4Xgaj3dFbap2vlxZZKllWRYP7+KWbZsk5YOkuNvheFiT3Lv79fL8+Ol9Wea6LG5qqkSIXMzihcmpNDcWdyrFyqJwgQuxyCANRyVqmcM6ICzc6uQyec4sniSNIL+7G4Yx3d/nV/cjvJreTVMJW1pmdvchkbt/9dXb+/v7t2/fvH79Kiz3ZrUuY63L3ZCWZf706dM8L9Kz5ThCDDS7qUDV5EK81Mi/oKZ/W3P3UA2DDayKL3q8UcR9CCK0hBC5zSkQ79YZZ3WrRu7e0m/0DIG81kZrtve2mToTXh8G74lv+wYkGg/j8e5uPIzhoOpaHdCmYDZsk8JbPopFh3a4D+qDO2BhewsI0s3h1BF4akUvopr0GvUXLhehktpqk9i7bzVMwrb8wqFyA1EpFWoR6NLGwsT548O6Fmb2+Pjx8P6n22gBZhYRSfl4d88iKQ/hWIrm29h7jGY7ZzdyxG7v3gYvgJmmZu2Y4aoKr/nEnQlZ+F7uWNLdId+fEiUiHq7Lo328Fi3XYmoo2g1Sa2vyrsN9nudV6PReHSZcy53VSTMpuKZelKBlQTB1J2viooWHXhcHGS3HC1rqJwKhJWNvPv7NQS9qZIM4gWRLDmBkSqOQk8Ge3W3Ri0Lfvn5993r4Xb/r7vf87neDIJHPS/n04eH54flnP37//DyDftfx7r4sQ62uohWqe2u06cPjw+F4mOezasmJUxKtZmo9AxpQtB0r0DzP3RfCFyJmFsbheFjztmK3Mm2dYnc18yi6eyDIEaGbZlqrWngNtyBFN1d3j6otkkRE4GEDicm163SttT49X0op0zyXUr/+/g9BcpvBM6RTZjIGEpThLYE7A+G/LmDCyJ5YD0wD+8gYouorcQv85lb3Rd2dkBOlxMOQD4eRgahXmJKknKKkRaMzA9KI8S6dXosMPB6FhNIgYKJExODGdJzgns2yurkkTe45O9hHE1YGA5FhBmttsNZuy8OIpJTDG6KpMN5IX60KUJSLLbWaO0eWAEep6lSl1Jbkvhs2unLT3JGoMzaHO6QnLjSJJKqSRIScCSSMwyDjkFLzyHdTVaaQKplIWA7jQbXOSwHocDiyJHdHbIRlcRGTZDtwqVHVL/B2NEV8v+86Y6e+BVashtCKG45DPh7GnGXI6XgYUxJ3F2EAIk7kUbQnnMjMNxSPiFLinGQc0phSJXN1JlDzalOCp5zcvVD1rXbUHnve/t7Oobd/2r09W9ZEAhM7IUqMW2g3T
EgMZ7iAhbjVKAYRObhnkosiOY2yOA1CDs/OIM+JheGmWmezChiz58zkGIThLsjuGHMakkgwyqjjsC6GezjxNa7Rta8OX39hpT5n4V2J+1xZ3y9ueFLA+39WbaddEVw/7EnNzQxrTJw334V+KdzRzmfoTrE7mFbisk89j1Vbb7zUwbzbWwCIhsPxcP/KtCJYu6k7FDvWToxwe+FexGYXzbGOIrR00+4f6ntOSUTUfeVakS4iWMuiG7U7e7I/64CwNytVC/zuvL1l03B3h9ygFEREe60dHbK7ASyYKUAPrSBXF4rYJzi3BMgcezcgsjBSujfzunezmXcBhVpyNu99bzNP6MptnBpufvbMSIlyJjCcHWRmakqmLSVD19pXpGf9n28JGxBTZWpdFiBlspxwGiWL3B0GJgIJnCJHUUvZ2IshmXqrw+U9KtN6TD2gxj3PQWRYMjgaReCGw7RUJtbM98zUypnmwcnfvD3evz7enfKQWOBWtSzL+fF8OV8BFhkKsiEbNsH0FirzeZ6v12tZJrViKrUyfKubSC3UC5FGNnZRAJlEJMLuJK0SgnUtdCVct8d4f8CBZtUhImNicXdpiFnAxurwFtMhRMyuEeYWwHPPaMhEzCJiXS68pSltsEk4MVLgY02nhkvTrZkot+KNq3QFRFkyajp50B8DwaGqIDZTM2fmJIk5CvB4OPnE9hOKMDKJohRmxBROpdT8fVY7X9v64bZvG2lpRqhWiMT927V2AsbhcHf3ahwPzAK3UmqoSu64XiYimqZZqzoxiMEg5+us7z8+SkqnwyJJDocji7gzc9YaxRwtpOkkAboM7maeAPRs8Q54kjQMA8PFNTF9dT8eBrk7DENi0zJfl7pwvbK7wzyxfO97X8/z/OnTo5l9//s/OB5PpgrTebperxOlnE6nOZAGtKPeCqhsK4v92GOv7a246GV4qAeGCTnDj2PKOX/97vXbt2+DYEuSYUhB4lQ9ZVfDvFRVPZ5OClqWcp3noPI5yd1hOB2G+2MeU5qnWhxe5qkuRX2qpuqHYWCWeanhzt/FdmoAkjejyH4hjaRSquwqACWnFMSdCc1fM5NyeI6Q58hqE5ZLJklEnIYBRKiBrxohhNNGwZgpD4m4GYGqXs3qMj8/2HVZqmoRpvs7EeKTZAKsjgDu7w7jYUiwOl0CRfRa67QsZZmuZVmWealL0cix32BLr9B6u0tDxthHdTdCQD2Ry6o14rZ1qW3V5pwiYVFXELFJEU7uBiUAQTAkkQhMXWtsD3Myr+ROnJkppTDeMwX5jlxbtoabRzFQhPQS/gwh/QaCF41Z3nz/177/u39fqNstMUpEdhG1moRd1mhd3g8zGK7vNnQQkhCdbqzVQMspsm1st5ZIt1QVkfFwcKAsxTswG4hoeOGuT+pSD7CmL1474Dj97D3v7e2q0LKWVQnph0TgWsZEEEpGxMmM3BNIHA4GNQmVAfEgmyBAm46wQgxN7O592IgfCAxbBS1ihiQw5YRx4OMdH++lmqur+TLN16pJdZ28Pp3eWMBq1wiLaXugo9SylJlQCZZJE9ubu+MPf3B/f3f84Q++IuZazMzLUqOsuDv6lFut6h7uMaitshdM23hq1VrVzSJRBLm6+1KrhSjtULi2xGdO5GTImd+9GcYD3b19Nxzk7fdene4Pd6OcBqnLMp2nx/ePv/Xf/qgs5TDcDTn//Ho/1cMCK+6R1GetpwVAVT++/wA31dldI/5RJGXJ1KMlo0BW+AM5UGp1TKVUlvD9pFITE/VKHMGMIzVwFNbqwEv8t9VwAwBhiSQwq2rlQPcdadLoKnipV9MS1VEFlEejlI6OXOvhdDL3w+kEphf0wc3gdhqHw8CHJAM3ACgELRAjCRB+3hAA8EjlHgqAMC2q0l1PQgiuANVymedpKfeH093p9ZiPZTYyH/LIxEMSERozxgQBwWCVygxJnCSTNDIZbLFzc0OECHrdnEAs/pWANF3VfY907rX28F1hATW1qaNbQ
QE8cNGqRhLaV5TeIfNIcNOr74J6yR0DWZTBBdydw1VqC9WQrkvBk8iQMsPZa5R+GZI07MDMoISWYyF+ndJQ1ZZSy1Iul8lBpZSQ56o5g0ir78Al9AHd0sSbRp1ctb9W+dlbXE1iFqYeApIi+Voc/rLMqj7P1QzqbB4J7xwU2KNJlbhpkkAjun4UWhrIQBbZPTr8TkzMvA+A/nbdFE7sJGCDZJCtEkAkEgKTc5Rmg7tHhWNqdew4OBlxAhGx90PYCo2Hys5COSdmSskBn0upajCrRSPjfQPHqG1OE3RcuwXCRaqDgNkiB78aHD0n9UqiW1qolyNd1fObT27lsZsJ2aPKG7Unf7Hw3hY5Dr7EiEVALDmxJAiRxnog4vgiwnxt0TE3cPhKtcUDuhtzjYxv7Xg4EZZ5S1lD1GI3zJRbyOLKWVrsfoy6+5Xt+Xq7SYOjmvXSVpe+9bfodgh0RhigvEED5K1VEUIe4KjWz0IS4ZRC4IgNS1sfQmqim/l2j+LTa2OCEBnHSW8DabQDXWM1j/rR7OHzYdRpC8EjHKnrMH2TrOjHup7eJr0Trcjt0bl75GD2MNtDmJLAANUuTrlHor7uVEHAWvzPO/rzwqrXMtRJ6OvihwGHEccDHY98ukvMXJaq5iJktfkrmLEbVEkr3GFObogilrVgNXZrpapkwcndokzBUFmNKsTA1VGNEkMcQ+bDIOPAh0MaRz4dh+EgxzGNWVoiqaLTdZqu8zwtWu1wyEyDXblYiPvrqG+0drWW1bCXY6Qk6qnlSYyYWGZhifomNYwIIiYWJRZ5fSViFmciAZzR8F10IK2jKysJ3ulYWxFt3zXVLcVlqaWUxcyqqapFzpSWlcLbATGzfeAisO4HjxpuIsSAOIIag4myrFaCKFJIHXigJm56RFFTO3fkpogCGSHdO5lhWRReCUk4jKRcCzhs+TNJQiJmsJtEbUG0BP3u6ohiZhp4dFkqSqWqrZZPoJ7YxTWs7YUbnbBkM1pKBYxDkuMcBxYA0SDi3gJNh5QP43C4f/UqJTkcRmYex5GFD9zUmYAsqQMZ7q5WAYxjFhYK/N7NTZk8kcMUOjPhfuAslMihxbySt2py4Z9fzfI4FvOH8/z8/Pyzj4+Av//4qZRSG9swZyrTTWl6M9O6JZTdRh0QBDpVbkRVYeSAEjFBxFPi73/17jim169fjcOQh5wEl8t0Pl+maXp4eFiKPl2Lg4/3byS34MbqziIDsaQh4LIxy/3xkIWX6TKbztdLWZaUB8lZiy7XUhxFWR05D5Ic06S9doh5y8ksPZJk26Uy+HDi7ENHjwO/IoATE8E5UhNGmr0AMZ003JOZiDmPBHYRNhsyJ4nSpw0IEubjmEXoMCZiTDNXnZ/OT5fzJfaNCB+GA5nTrG7h1oHz0zP4QixEkoY8jIda9XpdSq1TRTFWHpElMqq3gDMSJmGZ9qdbhEVko+Krlf12Ldfl3otB1vi6UZc9RVJiQsfeHUgp3Z2OwiyRUmgYSVI+HNMwJFiCMVGWyJBD3iXdlZ96VB3RnuoOHo6HSdjNf+fnP/vw4dP58ny5PBOBxX/6k5+UUnpXA7FWv8lh2hXRZgjvuPM69lsSHK+1FHfnXZR0gyWJmNipSwyNdhKD5uk6Xa5Pz8/fvP9wd3//e3/f7yOih08fI8kMEb19+/b+VfItnnsV97uwhB13j4ne2fyI6HQYX9+dghyvokUgGELE7rwUgiczdkvhoYMklMy8VDfXorPDIOGXnIhYhswp9XC55n7VowkiTVAI6h7lEwP3zIpBkNWy6UHomEVVixbSymrSbRNkJfDmNvM9mQkAh8vmbg+HV52LXg8jDhk//Hr8+t14OPH9q3I8zafjlYgSq6mRLZU1hBEJW2pYdIklZTjaEQdHlvuOw0Skt5rWej67G9HBQUpJIcVQDLX6XDwLn0bJiV6/SpIojURCXrScJyS2xB9//vF3/uGPrs+XMimRDMPJeHyu9v4yaWVTsCmbum5MI
oT1lJPqVFUvl2lZ5qZwE4skYk45s8g4RJhuFkk5pZRySpLzICLDMDJzxAOnnIU5VJuURCKkM3HbED0HUUhQZoaOWUZCMzMrpVgPQVrmJbh35H1byqxmpRY1X5ZibqVGaBg58PbtUt9gmuZtZ8IFmlBQ3MAOAUREchKOTiYZDofmVgJYbWVnVuK6wkVR4zIqNVtRAKXM1cq0LJ+er4uR5I85p8M4CMtxTGECYMbxOJyOw+nu8O6rOxuS8EESERYS1Tq5LvU66bws8zxdp6fn5Sc/fSrKcz06JA8HYq6KUhvE9kLBuXGjawAgIhAlsEtmFrgT2IHIfBq5eyTllIaUh2E4pCR5GCRWmplTJhEJI+7qMmRwd9VKhOPhkJKEBhO+lOTKXmGqRQUe4fxB7KKuuRMZBWygZk4sxFzUpqVM81Rrna5TQ+NW896aWLvT0L3AvfPqcA9faW9q3XaQO/wZSfeO43g6DnfH4zgOQdpNdZnn6+Xy+PCwFH28Vic2znnQPHiS1PLOcJQBppwlvD8ALMtitczzVJdijgyqpZayVCe1ZCBmCdO+7QcSnezmxt142DltylSUzLTmZxz6Udgtw5YVScmIjBwE5sCfQezicaSTwBRWw2YSAZ2JOafETKopmGatyhL1CkmY4W5WV3OiqhsiF5Bkc5A0rEVVI9UXSwDhIUYSQFEZgW8TIoOYuw3+BpTvc7KqjW2td+9bDfLGWtyb0kbrrgCS0GEcWtAqE40HSmk8ntIwZsJALkzhHhgZYGrtBea9Fb9Bq00a7x1Qb/k4fZ6n5+enh4ePDw+for7Up0+f9q7IXQ+56fbWfTQpZBVbvjRGePNSNMaaMDFQGCaiyJtivP0wXINrqVH15enpiYhUlYnmZVnm2QEiqrX28j6+e3q8D+a5x7q2KW3rQ0giOckOpaD+X0rB39QInkzZTczZXYiEWNVtUbhanQ3uAhBRMiIhYRbZJoxWfYo89KuwfbsiyigwBfGO6BJ2CJNw2Ie1GfDdGW5uYfiPELY1hGId203YjXfNhEkEh4FfnVIebUiapTIWAjEUZISZXAPuEIpyHCmMrSkzADXrSfF7wtSGBrkbW8UChkFSArFyNsjSWftSIUyHxEnoeJAw4AKAmsLJDcbXy/zw8Fyuk1awRNZFKVrn6q4eqbfoMzOfsATS7u5LKdM0UZTrJo6jkoaBWVRNRGqpIpLzkHNNKakaNzs3qxkzDw5mTuYiZu7JwcIGobZVQSEUhoteKKTh52labQl2bubB4Odp6YUSLCLy1HQu1dxKqe5eG2JPDiyR/dRuhhcGVnjUwyAYIMQkwhRBbkOOclwAoERmHV3ooE5sibDvtW7v7KcRVDkv5XydU6mqJsJmOQvHliuLaSHC8PpVEk5WBwJMjQAtrqpl0TLXMutSbJrr82UulWcTUDpRZkZIL+Eb8kJvv9Hax8Px/tXrwPNEwm3KXGcAjMTE4+GUJEf9u5SHPA4p5fFwFOZhTEwkEcPPjZ8RbS5DBHKzUhZ3S8KRcD7spO6wWrXMZZnODx9gekgkjLvMWegw5jGJSBJJqlaqOsiInRPnkfJhfj5fr9OY5c3x1VH9WE1BBVxW+g0ALVwhVmNljF0FooaygJoV2hWmQ07HMQ9DfvfmfhzS997eDTkxkdZ6nZZ5qZfr9Hwpl1mvlRR5uL8DiclQwFqNraxSfzzm2aoQzg8g2OXxoZS5LsVqFRGWVNVLNRfBeJKU716/ZgkPzMB7vMG80fObdVzrugQfCM8uDg+2IKahS3lDO1utrQRLTEdhYR4yE5FKMtMhSRKOkxMiQjW9qgpzeOtcplLKMl+tzpRyEj7Uhc/Frdp8jiBJOHypVcMoEInP5MnMw/lRhkyc0jELsJRSaw24WUADUTos+/jobm3rysxGabuv+26lV8hudZxGwwNIhIT5q7dv7u9OtbTE7/M8Hw/D11+9zUPO40DCljNYkBKxnHI6DRmmXqoDR0JTKbbM7Y3hubtWnaZpW
ZZvvvl5KdWdVG2ZJ631erk+PDyollKn8/P5JspoKza0pSLpO7PhgA0o/lKLWTGzpSy11jLPWgoc7h42nTY/hA5iA0BiEeLr+XI9nx8eHx8+fXL389MTi8zX6zLP8zybWRahqG2aJO7T2elK3V72q+pNiFHU3NhQVgIRs3AGv4KI4bAUNq9kTl493CDMybToMpei9Xm6VNcaCZ9SIpY33/tePg5ada6FBTJAEqVTAtF8XkrRp4fneZoGIIPuj4ev7l8JUxYb1JNBnMRZIG6kxU2dIqlblFEwdbcWTEQMYl/LrYS5d515RMpnLFbFvdRzWWbUQvNUH6V8+imcVN3N57llmgZcOLEI0yh8xyJpHJ29+OzwnEfm1J1qVmdmM1XViQDOiRNxImKMRtlhxqrsZlYVRGow9Cznak64Xq/X6/Wbn73/zd9+D3MxIeKHnz5WT5+eZJqJXOBEqIQ67/J8icjbt2+/+uqr6Xo+z+fLZT4/X9cIi1YYUBIz52EQlmEYUpKUchKJGAgmlpwpgjuIcih+EsZ2aQVHwnzTxE3EMY9TEUilNckyql2HSN3OWpgDhNkJADuRJBYg5ZBLuaFDxHd394fDIee8kgkmOo5yd5AxUWKSODCqlWCuBmXmahVRTqkDVEPOKadQE5koMm5xJ7DeHeFSevf69el6Kc8P81z90yNzc6fn4CBPT5fpMr+5f/3Vq7e/9ms/ePP611zHJCcT10Wd7OPDZZoeyjzXZRmGNI4ndcxFzpfyk5//rJQ4Jnj37u3pdIy9qLfn8MaNLqc8Ho7hbZeExiyAuWUAiTKzvH79bhwPYCYWDs1ORFIOfZS55bxvlIm2VKAxzW5G5G7BWjxUPXDkUfGqpS7z5fnJTWtCIvKBszD5kcchJlejED0AYScmSSypqM9LOR7y8XhI6qJezKloTy2ArQ/Ma9E+QneQALR/EAe2BZS4JvAx03GU7706DUO6Px5EuKip2rKUy2Wa5jIXnYstRiDO4xEsIFGwWvPZXG2+ZlqXidyuqG769OnjMs9eNZyTqaWfJk45v/I8jKf7e05gglF77Zkmm7j0grv3vwNIbKlw12sCVKRmKXV2by7yRDmRMA2JiLg6OUsSTkwOqLectG5eqhpxkcxMZda51FrclFwYlsypqtfqlylK+7oDcymlVvREPyCYeSkqIvcpCwvnTMx1K/1FTCycJB1ewhIxh6u03EVG9x4Ou+rhvjFbrFb2MKUzifDpdHj96r4syzLPywKry5jT/d1pGIfhdCCRmpIRRTTB4TDeHQ9Wa7lOADZK1AnNhssRaqkp0eUCs1rrrIparWox01KWaZqWZbpen6P47zYub3Ss74Rmf8Rnqjm+jbsD7lZrJJK6lmUJP/kVkG/XBWLkoMhiTTxdrtO1tWEY5mkSkVpKKWW6Xmsp0/39dDikYUgYaJWIvevwwAvW7r0s3m5X+i57WpjpSJgH8Mklm58K2Hxmr2wzvMCjZEY4mpVS53mppkukl0yJRE5vDCQOq+pMAIMEdBAQ6kVnW57Oj88Pz0eSkTgrMN5xYmGIOzuxgxHh1wjZNfoeWju7WeRId4DF3do22uLTthbFlBVWW5aohTDzfFFgAeAUXnJlaV50IGcW5iR8FFZOko6jky90dfJxPIrksFS0HC8xqWZqhZldHALKIIkM9eTGblyrz9p9t41CsI5Q3aeny8dPD+8/PL7/dBaS03gH0HSdqtJ1GmtN1FxEFN1Zsi0V8/F4uru7J+JatSx1ngszSQiLzAAxV2auVZlZVVNKIiXJGtYRfletvlHA8tSFg8isQKsMu1l6toMRrD3g2H5J7KmmpuZhGPJATCICchZGq4hKknKEWUZmupSy7LxAiDAkHrMkbqYeAjziS8CuRkbhRR4CfBwkidwPQamj/jdRSgLAoE4mQkRISU6nwyd+fnq8VPXLdGbmUqPUUwLom28+PT2ez69qmfhweF2WlDjrkl0cKmb09Kk8X65R5OnVvQzjYFiq8
jzbhw9P12mZywRAUs7DQM2c8S2sHQSRnPNoZKaWEueo1pqOFMg8NcsKpywpUTD4KKtLFLUQ3HllmyvzCb1GoyKiFzOt8+ymLdM8jGB1mebrebqen5+fYIZDNuFDPoQcWjTAMjKHomNW4NPdvROPY9Zavv/Vm3dv7s/X+fF8vUzzNx8fbZn72QDCeYeo58ZApMrsgT7hKMWNEpGPOR/yeH86fP3Vm3HIr1/fh4GIona1oygtimux56nMxasLSAhCkADtVoTVI2qHwl7U0Gc3N0oubl6tlV5tLNmJzaDmpVRrRjjsEZdwFv7McaJrRC/01xuNtrk/wJyskitpScNwd0hCbFpd3bW6GfMgLBCmnLXWea5urtWYiLkwcyluysKHcUwio/ABYCMx1Mq1Wl10Mbe51KolvPQkSR4ygyIEQw4nkUSDRHCecAoveWYRyXwTQAVt+d3MzLnzqvUlZq/9RRTR2tIUVnevREgCYqRMIqSE2b3UUpZJVZnh5JdaCmNZwMLsA0vUbyRyddOllKfrxQGWxERDSgEah48YM0VEslavtdRaIrNHqabqp7s7cKaUDvevlmW6XM6fPn18fDqblc4ePHJBNeq2QyZ2Zpi2ou3PbU29+z8ZJ06UhjFzFDyIkJpeRGclnBZwZzUHzArIhyyvX5+OhzRfnoRJlmmsVWuRWurz0xk+3N+Pr173HrSyfi1AtKf2a/uMoLdlKqg7Y/Y/KSc5Ho+ZSDhB9UwzakQYethDNA01jzD3V4eB6dfyDwGfl0WrPp/P81J4yNEDdspEd8I58R3D3J6Xma7T9PD4/PFRZdCUj2koUcrokNI4pNNBTkPNuXCyYYQeLF+KBLzmSfgwHNzs6XKtpo6w5veRtJO3NXOqTpfFF9VvHp3M74b6eoQQkiB8JcyhrEbewvGcXUXVzC4gup4vRj77bHDmx+ZN0w6ChEGtqp0vxQBL2Zk9sbfsBJHIJMGIlJl5PByYqaqr2XW+zmV5eHp4eHqYp3KZlOCXZXbQXEiNZmdrK8holu1taO6+LGWZSx7Gu/tXKQ9v3ryNKr+d4jQuHWGZ4ziuXqZxFB1rti0CYS1lic6oI3LPvZWxWDdM3/OBV9TY4xRdbYJCI+fjeBjGMVh4J49ddGjWNSLinLOw0B4IBBIjR+LJVj0hzp7HRBAoPLNMYYbn8+OylNjMd3d3r1+/ZpaUKqilXVZbHHY4DCml0A2Z+HgcvFfdcqvqqKoOFKtKPtv8tDx/uHz6ycefHI+nd6jCMH9UnX7+/vnpfLlcLtM03d9d3nw612opjTmbmWottRSHR7BFHGy95e03tnaRlNJgZEY1JUk5pyR3x0wUzldIKTNLzllyjkIaMcUBZWNTYLDj63EAWupTs6Km03TWWmJDMbkQyjLN1+fr5fz89AR3wdFzstMIYnVUgysimVozOxuc6HS6S3kYv/5eTvy7fvDV97/35tPj88/ff/r08GTqy+W8aq0h2XMDTzyURDhbFJ9bk24AgW2PQ351N759ff/DH3ydkxzHgQg1LF/F1L0aimEqdp5rUSueCMIQaiIOthiohjVRqHnN4cJcOblEqV3temdIFhJxestSpOes2CPRHQ/dUxjQZ3wdXefzjQs6N9ZuUCUr0CVlvh8TEV3Ok6pCq5uTM0NImCktZm6mastcASIUZtaWMCqxgDkTD4AwJ0WpfFnIL2pV61KLamWQEA/MaWDmlPnAnNLhRCzI7ASBuFR2sEMkcRp4GPc29fCUacOxDgnSCrZQryBCIDgDBhbKWQAzI4KnBCZPmVhYCbN5qbUuM+DM5OTXWhbyLCbCB/LkkjiJJDI106Uuj9PVHSxJmO+PxxxGFOIoumxQc6XFVYtGQriomW5+vLsb716Nd/evv/p6nufL5TL8+Lf/wX/z/6mlAAjipmt0+Ao33LYVBt/zyHVvBFDBLMzsQ5bA+NVaCrA1aigkna10rJtVIs+DvH51zCLL5VFAsiirjqVIKfX56VwWhdPhg
GZY9JaJNnrRhHtekX/dRX73BdpTbR+y3J0OwpQGsVov6lp0KCbmSUQ4lXGw8GBizuP4g+9/LUTzZapL+fGPfgdPTzzkmAgGZaL7JFnonqHmaZlxvc6PT+ePn2w4+HC8G4+1qo2eDjkdh3Q6yHHQlBdOmge3g+ZcmdiRzEX47jCY2XWezBHh9kQhyPRaNLsWnPu6OMgSqi769s4zUxI/cKg07nDjcLEUGFngZdVQJjWblqrus1V1qz6bR2IDZ5GUUli1F/Vvnuus9qxWmy8fCbEwZ0+jD8LpIEdJ6Xh3T8xzUVX98PDhfD0/nh+ezo85j4fxjuDAbEZLgTvxOITHQa+EcKv5eSSYK0Me7+5evX79hojCHwUObwhTwPKyZ+1dmoRZM3vHzVcpM8LfIzdp0ah24WvkVAdbHfCqqrV2uJ6iiEf45ItkERmPx3EchUUkrak/9thADCVUUP6ctUvwoAAWe97AJnW07AFuomofPz49PT0ty1LK8sMf/CClQ8jNq7duqVd3vX/16nA4hC8wER0Oo5tbdTOvVU29GtS9WjX2yRaan46Xw08+/fRuuYOwMGl5qnX+5v3z4/P54fHp+Xy5O6ZXd8PxcHjz+m1K6pE6oBSHt/RUzST3bVp7VFbWSPyUWSLtDOa5OLwuxR3MiUju7u8POHFKknLAa42qrjIPRaHcSMbcM9jr4qZRd7LW2bQSkRM1p0Rk8gPcX716Dfj96ZBzOhxOw5BZ2Igp0it7z35BbuaBhAwDJ2HVermcyzITfMjpzetXz8+PstPasbn9eCczEeiFBIoELcR0fzgchvz29f27N/eHcRgPR8CvS1Wz6zKr2vk6L1Wfr/N1Lpe5zNXUIhKCSlWQtbxd5g6Ev37H20Pd8VYpndgFBGKxllgwsr0yUx5YRB2rFN2KLne7MhH7i1TdkTOu7+YbHh92ZxgASZRFhDMbkRJVS8y1FgbgSlh9iMxM4SCwO0qNyOzMxCyZmZ1grp26hcejFtO5lKkuRZdK1VhlFAFJYhHKQ85jYkpCiUiiWot5OM+QszTLReghNzJKQ6sBOJw5dW1mBeWbJtqi5piYZTweXt3fuWkpE2AMJUI+jCyi8HOZ2ZWEg40u8PfXCy1ysiGnNI7HnAcyQG06X6fn87SU+Xwl5nFkCOlSwOqgpdEFN1cznedlWUo1zePgREaF1BRCzjnn8UAsiVgOh9NnzgHYudH59n7HSjrVbQnL4itzw3qxG9yul/MyXUzVVJs7c0RS0lbsnAmUmIhyYndXzYdjFuJDGhjgpG7uBK61iihTcZtbZntbZUwiBpydyEAcSTmImF6EGPVUGzEGAGRarRYaRHPSzLPlWlFLZbMsKbH4kGhMmeTEKQ+ZRyLmhEQZr766zyMfeBgkm7CJjMnvCQk4Fq2mB/cZOOZ0GIdhHGUYMEghq+TMlITHYRiHEc5awZAswyDDIQ0eHpHs6DLitj7tDb2QuUJUMneHwGkq/IhqZqaW2ccchpUm6qML1q+P4+vTkd0zvBbl56mq2ULUrI0VnOAOYgMT2F0WtfOiU6VPsy5mIXBEHcID1TupicVSIZZLnRw0LVrVni7naZnm4kaDIldPQe2cog5QBCE2q1Yf4Y1uQMQiMgwDdfN6/Av/QcLG2sOgHlnnbrBS5j1rJ6KWlrg/waypPe4xS+j5BkNa5RbZ0o3x60N72GnfVo0r9/Pz4jVwib3vKqIafVBuUGSMCdtLDyoPOBXO5ogSLAGC/n/b+7cmSZIcXQwEoGpm7hGZWdXdNRdySOEDhf//56zsPixld8+Zme66ZGREuLuZKoBvH6CqZu6R1WeEwiM8PFLW1ZER7nZTVSju+ADmyLx3c+6VrkSJiF++vru/5TzlNMV8unndipldrzczV4c51lKLmtZ1vV054fy8fH7+7JiWeT4viXihdJZp28pvr99ebu/0+oIff/jh6elZhH/8059OT8+lbiCcTydhrmY1+isejmO/dqhZqXXO8zTNUbnrr
u/r1Uxvt6ubAUwkf/F/+IFpOZ3zNIVXnokDaidK+Qzm8GqlWjVTtequrjeCUzTRqq3rlyTJ6fx0mmySeZJlnrMQEz2d5pzS03mZspiamymLgd2h6mF2A1jmeZ6wTJyEa9levl7VIKDzPP3TP/xU1lu6K7FFt5HQms1RQ6kO0RvOpH/+p5/+9MOP//DTn//hH35SrdEc87dff9m27bdv37ZS36+3UlTBRrRVuxUjYnCCU1kL9fyPuGe0deGeahGaaSQzuSSwSJbUFfCI5bS27kTVQG5xqXd0U2kNtqJP6MF11YO1R12186XGgogwyXzK6ZTSkgh1s42SUF2vzS5hMBlHSw9m5iSSzWnblDgt0ymlJNNJROCJYB0citRQVa+lbrq9l/fq6qSccDrN85RT5pwkT2meJqJEPhEl5xTl9XAyTt7miCFiIn4YHRFFc6O2rYWmHGAPPe6OaI/bkMokZUnp+cuX/+Gf/wfTer2+uavVlQnz01ly+npbL9e3Z6bnKTkxMd0c//7ylUR+XM/nef7pTz+dT896W62Ut9fX128vBlJwnublh4USb7oxE0x3ZAI3dzP3UqsZlufnfDJc16rGxgaaJctEbn5+8tdvr0cDwgM584AJE0t55LmDFba4477mu+R3V5i9fPvt+vZiqqY1spZSStFRY55nEZnylJLM85KnLCwiiULtdWJDRLoJSM9LNX0rdavVofV2iQSDYOJhPA0dk62ncYCPDJSICEawxn/DNDTRumKa+emkKV0+LwWJa2X3WfLEsuTpNC0L5yc5SUr5SYh5Ps3keVr+gu0HXo2LiSFVTKTPWBN82mo1+2zkLJ+XpXx6ktM5LWc+Tze2hS1lmqf0fH4+n07sZIWE5iXR03T+vJyL14uviMQWFrQWrTj68z7mt3gkmGMC8+uml9W+kv77rzUJL5mFSUKJFWemOfkkmM7P//zjj6fsnxYra5n+5qW4v3JVqiQEG/7OUOLgsqq9rHop/rdXXVXV1eGZU2L5MvOfF54SnSdx0M1IHZfN1VAMCsppzulZKbPPzJJk4pYVJSxTT6b/7sEBpvn09OTwPeTSOBkowItoF+1DqA8Do/cnugNGjD9FRMSJ2MypVfwFQkandGocLYpNw6QJvJsU7c+HDhF5Kgc1ZTylP11Y3I7CL9rH1ooWJkBgGkR9Quv8FkOk0V3NQMQpEbNRpL8aE/VA7wT3f/3PP3/97eV0Oi3L8vz89Oc//2ha1+trLeXXX7/W6MborQFwVSpKv7399vXy+uXzj5eNPz1//p//5X9elpnnL9n8cv1//+2v/17LrayX/+lf/uWf/vGfUp7/5V/+R3dyCrgDBkit3rZS9XdEewtYMru7ajVFLQCslqu7a1UAkiaRRMS+Jy62AI27EeDkAMyrw9WruXYIbmvx98CYnCYGUmsBSRTAZzkDPs8LE/I0Z2mFryyBMyIt2NxCX+P/qGpGKKgMdSd3RhTN3qfRjdA3Ra159GhJAf7H1Dtr5WiLBbfIZt7KVqs6FFQURX0tthU1kBFXQ3Q4DiDyVjoMB1GSNALB1O0cCuYngYEjTEjRkyd8qU3hDdx/bjp000gDg5qIiEHywWeLey31SMHBIhJBGImRmLLwLIwpEy8iFPpUQzBDNXUiMndmtsgriVBGyiQpiKm6uWsNWElDVaj5WrW6tgwlTsTIOTW/dmYmNjN3WF2JMufEknlKDb19OH46FNP9IBBor2ByEzMLiA1mTpICeYAISALh6TRP8zKfzzJNEJ78BDefEhPyaeEks0OZZ2AiVEcxq8DmTkTKYil5Si5ZQWq+lXK5XJzFOU2gagoOiAlSHc14jAhMMEd0WlRTNdeorApe1zLIJKXez62vHHrkZk8V+r5o566iDel+N0WmZlrLVtZ1M62myk22S5QnmbmI2GQiyRxZ8+CPzoExzAyCqrtvtaiZNsh77h4S6TkrvXfb3RYb4nu82x5Eat5OIsDNlFRE1QhGZtEpmx2JTJJl1
bSJeIqSSgk7DyyERUlcxGWCGCUjB2dIInLKpqSnZJ7kPGWd59NpOp2WKUu0IBJOSaZ5yvPsXrw6BIH/OXEyiTkgRQPoQce1bVxnYBA/HOEJRHjam9RLTb6QILKmhRjmVNmv1a9qJFgCA0HEGdWxKt6r38w5wih9Gp3oVrl6dmJOS6IMVwYSSw7bRKi5vgKPlBApdmGhpzSlNIsklok56v6bE3q3DT42zTvuvO98vP/Lfd2PKt0Q4XeTdPgE/aCD6jQmeRQVjW96oAqHf0e9KTpd7Te/HwCi1vdhBOYRCIsoEkQQ4OntVVrrsMCvpDyleZlj5NM8YfT8bTCR1NQwNzMFXCTA5BMyJX7SeVI1rXUrxcwh0VyHqtF8kiSVfL1evsLLb1+XZZ7r9qp6ezqln/7yyepUy/zjj88BpKnm7iSRzuse8XtV+91+7cScRKaUaqnrdqm1rLdLVG6LyOl8yjl/eT4vy5JyUrNsalpdRODuvpZi7gEJ5F67/gVpRdPISYQlIOamJEJktbhZSgICiyyBdMBChElSeM+EmciZ3UZvm+aGcSJyMzMt28201rqqFuHEkub59PnLDyzpwD/DZ2yR0jBP049fPi/z/PnzkzALA+7bejPTKcF0u17fWXjdyuv7uznUqLhclW4FL9dy2zbz2EXiCIrYWVjYv8uSU6SxetebhCUJMXFuf3Eg3LHklKaUw0wmZuZErYkEtKqb2baZOzdUB7C73m+5qJ/quupwyDMRGMaEnCgzLYyF6Zzkec4pzfP0SYQCgizk7uX9VovetlpKNZi71erOc0qTLE8sUt3d7Vq2quu63baylqrrVhDiQSSf8iRTAIcsU46Ay5RSKeX2divV396UJJ8//TlN8/nzc5bc/BA9YaBnDR5G1+LRoU8Gfh9AyDnNz5+SCC8TMXkWJP70w5+ev3w5L0/y9MzufDozIYeyJARCOl8/a5mqTWpv6/b1/XIxf6lV8vR5OS2npzqdSl5uftlK/fr69te//Y0k8bwsp3M+n+d5/nReiPi2rXXb4A63aL9rbrdaVe2y3tS9amRyJEarjuUemz4KCO/71bt6NSTk4GztAyC6c4RxM5yfoZHfbmst28u317eXb6oa1VChL+acRNK8zCISNUg5Tyk15u5ExhStGcixXW5uLSN9eXqazqccnTKYJUtPUyLm6Ep3519pGv8dVw7Uo/gDALnVbYVQxYU1o/J7Za1SncEp85KQiqcrS+I0kzAC+j6LEE9zSuDJJTknp+Q8gZ6QEtITLVbtDdvlnQSfzuf8w+nzl9NnNuVaZ/g8ybJMz5+/LKfT6/uvpW4pW0qUPT/nBYneUzahi6m7VyLlJja573AQ8Sj7iW0Hd3IggcgwGbFFPxujzTw01d7VAYlXYT+/1dO3y+cze2KYb1k2xdeyvV/t//Oyva46LUuepnD0IzzHoA0nYz5/+rRQCCRP4OT0lGnOJEyUQtCQgOcsmQiUaPdbBw0NtrBnQRzJ7ZGpWEPFdbeIc2O8VtSGCDE1P42ZHa12kej5eWwl551CEKF2+N1W3x++a4cHId3NMzjADY45DmIKjP2uaxA1fIzvKywx0qK2bgbqfaeYmRBtTfKUmag1HGYl4vPzaTkvOYmklFMyr9TTSFNmYYapkREpSKdZnp6Xz1/OP/7pOSeZ0p8JKKua2tvrSykrUIBKIpTE3KtV+MvPf/1/COdf/vq/5zz96Qc5n/hf/vn0v/0v/2sSTiKOVB1bWV9eizmez0tKUszNcVu3y20rpR6ZRr4bKxAmeylbraXWSoTwgOQ8T9M0Lcu0LCllYo7lYffAly5a3F2t9roRF2mZa4HWkg+967MIM7kJuYHICanpeSwpMdCZHw86CU9BLLkD5OaBPaS6bkW1lG2rdRPJKWXi1JzFd4sZmiMivziikFFbzzBw26daCxFYGMTrVt4vFxA5pKoVtWoefV+cyNHMTQ6hERulG9uR6RGGCjNHDF1yYo6gTANhThIta1PHS
B/ijWIE4dJXM7MQnURM0rbTA91/R70malUwLf+cIOQMhllUmrO0DE/3gPNsIG1ObL3LXxhu6mB4tepuWy1Vy6alRGE+aWSzcU9WlNBcwvHkDCZXaLVavJTKgqwKkY6RsQOooYUQcBzd+Jh3C19YqAFfpRRGiGdBkjRlyQnMtXsDB7wsuxNBJM3TPJFlMhEbnXWCPpy5AsWtwpVICQonMMEZtnmF8WIZwrEucIM7iyT3AEMMY9fMPSa1QZ32NJ2dsPvYmhPMvbVsuzNlxvq2hIJWDtTdHARiYpA71KyqBqR082kEqx+yBYzWbKU1wQunjDkqLOdpyjOBqpmpVjcQZmLhtBvqAXfbkz4/ssvvWXl3S9nbiDi7kxsbEnlmh5ixsxIlN7jDKAnYgSjHb6owKCcSa7VhlJwrweEJDRpmXaTU5OfMPstpTsuECqCYoLBv4is7sd9gm9vkltg3WIEXeHEDiCscUMCJQtE+kOd39heaY6wtbrf1MfpFD3BjgIToVvztpgDPmclcN98KborVsClvJm5ivIeoQQRip0RMoRYKO4CEAQVN6A2i+iSHN1KIdmwPYLwK0+gg1ccwttnD2IZHHbsS0H9ycNM7E7m/wB4E//DhbrL3ew5rm2ivkzx6DNq7037RMYU0vCboDxzOoQPV4ZFeQaSG2sp00YtEow0Py+42bR6X2AbRaK7p0+G0H/djIqZoVD/P0zwHZ+KUWnVcomRurqcpM1MimgJ4s5quZTOjbTUCYDenKrzklJ7O04+fckqSU7pteHkzDRhdp9kMRGpmjgbcc7/z8nGoZVuvl7fL++Xy/s7MKaXltPz001/maX7+/GWaptPplHPq3Q38cnlH2MLkmysRck4svMwtf3ESSUmmlJhpNBoJ32FrmWSRYmMuTWkM2QanaCYOZm4pk5XQmvyp6vVyUdXL5b3Wuq43Vb3dblvZcsrzNH/+/DmfPt82PdoPgJMbGEzkVrUWhl2ZiFzL1Uy39WZaq8HgnCZJszqKOZEgTQ66FVOHk6RpaTC5DTFdDpkdFOl40zSlJCGXOXRCkTQlMCERcaRDDkcOoiNeaMhVN3O/3W5qdr1eo5NSrEiAP0jiUuud38ndzEbmeMQ5AGdytsKMPKVZJKGKealuwHKaiZ5SliwT4NfrTVXXtap6JBiVrbxdVneqyqD6bX0BfK03cy36br45VZDlKZ2fJpaU0gSwmRBxpszEbAKjsmKzWja9XbyobtdKyWW+GWzRU0xDow4woj703rkURBJYGPM8L8syzfPT83NKaVlOLKxuTqApIwlNadOyVn25XQDADHCrBcAknIX/6U8//PD0lGdOTjcX/+0VSpMSM7lBzX67vBdTtkIT62niz8/KtOW0Zirb+6R5szKz+O2G2vLNS7W1aFW9bjd3VzOHa1V3J8/kDE/wMHDlwWFoWrWUQPCL7iQ8opWDQdKImHjjqkE61ibKzN4vt7KtCuFpWVLDuk/NG5RYZJrmQAvhntW8bVvdttu2vr6/Pp3PP/7wF2G+pQJwkkxEp+Xp6fwppSxpGsZfCByLf+6LweINHz4hGO4yOx1Qdp6rk2FyOGClwAsvTJnWiW8z18y3OUEoOlwG3k6RBAnEqgRmbypHYpIsCzJvP5I9TX76hM1rOpd88o3qpejZPb89Ea7bzzOdbv5uVLPXBP2tvP66vVyv68vra4DkC/MpLyIyiyQSgMh6+elxcFHv4pUocsoSUyJ2zsG6QgOLpq4EgoEV6a8v+nrVJeHTDCZigzteb1RNVnnGzCo5BDk34P0QbNGxSagVsFJ2SkYAFQ1PXQolYEc6b/qGd4C39soHUcoUpaJDhN4xTKipqqKNGdRD4rTX7fTAA9HorBB0Ep4kIqMuZRvJHo4O7d5LiTAcs0Pk32kfDrC7qokAzNLN9hEYilxO5+G/HKyFmeiY4OmOy2Z8UyZnYMqtNK+F1sMFyeGlia6QMbsMopl5as4QJmKv7pFOLumnf/zphz/9eF6W0
2mZ5+xuCodXZp4kTYn//OdPTM/LLHOvulMrRa9mqFuzi5n5H/4yPT9Nf/ry9Pl5iXz7X7/d/vWXl/dVv61VnYwppajwwq2UUqv9XhodUWtJFKn1IUNyzqfTeV6W8/kpTTnS61RLLIKqRtjM4cZGzJkiYZJzkikH8ok0QCsiIkSVtls0DTFVa/496sItAi6NARABke7WVH2zaoG4tVWt19tata63VVVv67Zt25TdnPJctlJqrbtG2TW+6E/T7mVUtRK8bltEKVXrWrWqgRNxdpASEyekCSQ1UFmj/400iU6cuMMSNeKIWs8pS+ryPihdRLKA2QXDaidvHVRbrVzg4dSiauu6NgQS1ZxzZPsLM4QRVvtBSet6LLcWWTw0V0QBTqD6NmD8SO4TnlVBiS05vNToY2JmMLCDAxTWwWoCkHp1+FpXc1XfHIXESDynlOckKeWU3RkrWniRJMoRrLpV1821IHoUMcHcpIEBOzVFJF6XP3ogYsvlJM29P+Vlnk+nU0ppmiciJiMHaMqcpDCbmbrWwBNxh1spG8FnkSzi9jm1VF9mif5SEUBoe6DUuibJcIkIbU5gssTGgFWFb9H8UI2sdYJwkIHUNNpLo9c+ujuZRUOMDrfzaNj6sNqHaOfAnxsaT/dW7RwaI9Eo/mreAjNi5pTTNE1TYDFMjQhFpjyzjAZcSZilGnF1UK2qs7OkUE6jYoNbdXUObeAYmu2b6vFoltaj7dcgfpsdyy24wOYCiIEArwZ1dlAGKbkTZ1YkdHTk6KQb6RSeWq6lJQYLUiZOrZw1sstPiUU8iQsrkSrR5G9UKrazXifxYptDs9VE+qLri65rXd/LCoeAEqd0nqbeE4T6oPhx6agbjb1fW3iGORCPDtDeTNQap8parFafBFtyJspMDlqVDWyUSFKA4dLe56Z1s2sOvdbahwJGwxCNY8Qj+ro35aNuvra2OnsC+R3juCPI71JmDOQokuNPPqzzUNyGK/57hIGjdN+J5cOdD1ccd8s4wTHaXR+v7eZ8kNkoTQoxT3gcdzVUA0fhuQRnJWciQUCtkxCBIO362ILc3IfERNJr98HRNYXnZZmmeZ7yNOWUAsfQySASbVx5TjkJnZdpnltPaPM0G9xcc6QiGTM9n9LTKZ2WtMyZGjS2VPMaKWxGm1ruCNDWGuHcTfp9U9fT+fnTl+V0/vzjjwEVOE1TXk6cUqmVzWopI+EpnMSAuZkk+fL0LEmmeZKOlx4+C4N7dbh5qWa2rrfItw+3v1n94Ycfvnz5vExT4mVEIINOzN2IXCvcL+vlcn0rpVxuV1Mr22Zmt1uz17XWYHxV1d2r6vvl8vLbr6XUA2kZXJ1IGGXb3r55nrLriZk43G8MFkrCnqQlsoHYI0UuqjISiBJL9MgLv7M0n/aAXqJmhoZSlziLBKt317KaExQOclMHXEvtPlxrSWnupWjgDw9yl+WU5zmEg0SN/uPe2XeqMHL08nUjN6srwW5uKlRYEnHkts+3+bJdU8rz6eTA7bapeSmq5tVgjsttfb/enMghRNFS28GVEpazSDpNWXKWeZ5PpyU0OlW81U3VXQFXU3eDFrVqqlaLGSilzDn1DjceyZccFkoAy9NdAg4zf/n86ae//ClHU8mUpjxJThQZGLcaQhSEiSFTNi1rrU6kDRuciDBFWYuqM1/eLmIEEYi8u+bPz2fVn9bkAL2+1ssFp4lTyzRyJiWq5ltVIq60Kqfy5JIyq5JHsig46mPczOBmtRR301rcQTwx51bdQ0wkDaF2Z6Bmpg7y1rb74MNsJ+wpdYOH+gg3EAByi5Bhmk9PKU/zNM3TJCmlnLmnNUXRYE81TsI8EbmwM1fX0/nMKZFIXhaOdpZEMmUEIH6zCbrV3l29g1mPn0frodmcoMZwuedTMLv57XpjBqMQGRQE4mJcPW306cZg+kGMGSmkSGJiKsLOVIVVyEUsiScuWSCskkECFYBRCUZi1xuLuZWpEKe3ouLXn//VJeUIqYlXg
b78+29f//1Xv1Z/2RLJk8xTzk95SgQDMzt5j7QT88Fsb7ZrGHlExE4SxDyAn5tQCOpzMIGckpJUohr6LwFE1nIje0pciJLuuuEekeaj2zkq6hiQwO+zwTn7EkUofcAFgo7SfaiIBxZ5zHEBUErZtjVOHR0WevEbgq0R0TRNR58MM6MBubvqoNJGHi1jtItZP3r8m6IxBHYrfyfs+RvMLJ6IImLRTDQ3N7YhPsJhfoy1pwRJ6T7wj8takNcp0OhAlJNIJFND1cNUI24rLsIilAQkFDyNmJkSiKszMUtoAwATqUMMLAwXahFYIk7M5HByrJvWSg5xEkmc5zML8lQZlE8iTPOcmPn9Uq7XEgnQv3y7vXx9v2x+XT2abqam/qGqee/NOI77NLo8zcsyL0ubwahqzBMzqRu7KYGJcpaUxN0Cf5TgTLJMc8ppmnMkvUe/u6FTuFpd13Cha63vl9daa62bquacz+dTYsY8j/Xm3cyOYLPe1vXtct229e39zXvzn23bTPW2rVo16sdCfdlK+fbt2+u3l3suA7jFXjGtq+tk05REhLM4943LwuzcM5rb3AEg8sgbauDJ0psOd9O8OeQ6VEJQqkQyRoRPYarV3YurwwMNtKyb1mpVI11OVc28VB17LEpKMM2R9NKKMD9EOseOj3C5NGYAh8GqQ6tXsGuomwY4qqkBKeW5GkC3zcxQ4gVUq9ltW6/bGjoqiEicBJJdhPI8T1Ne5mme8jxNy7yEXV3ZrlydSE3dUIuauhatRd1hCjC4cYioi27cBa1DG7gFho+inaKSpHVT5SQiJByB58DEiF6YeZ4oiZeq262lCvfmg619gBlAZd2uJJaTJqnucpqmKs/uprquN2emUkgXmoRI0ByabmoAWJ0kWV48RY0M1L2a9/ZgPWZeq5tZVXfnLMQBXkxhCDxsQvR26CHX/X4XHLhhZ/U9Xn20dSxAqZjzNEUbrih1C39S29F7g2xO4ZZ3z8DkvpzP07y0qHZuvW3Dgm9qxT0gxgj139th+y+HfdcJtHtGuyuCainMYFLqwkwAhufA+CNKICFM4e4QIubCpExVoEye2JNo4m1mY96SgBnIRGwQB7mTMilBxY2lVMAKvjmxcGZmSlbY7dvrby9vv8oN+WYzpyk7++yRrckG2aEfP6bHj2gxABGi1pyRqedL9NKH/T+i8GmRNT9ytJsN3y9zjxT3SdtlZkx0pG2jifbWTxTU+2C0y7wzA4msvrsX34U6Wmxn5K7fSXqKKqGmHUMAybljugEBXsT3ZDDu5t6STQY9DA01LMyDLMeBbMYn3VvvTeUIvYBHFkJ8ADeL9pwYkDVjj+AwSOI7gwFAqSpFKTOEVVyYCK0JKDUn536/3FBQicBwGFkkkIJYISAkBKYGMSE5mSM5HTpQ9tQYAGSqbuTmop6mJefpRAQREqbTlJNwEhAhutoQhDy9v2+3W9kKqlJUC4og+q9FF/mHPIk7h3xwsR4uaf/E9A/PRMsbI0oikpMbqRPBtRRXsVqjmkb6BBEAt+22vvzya9m2by9fa61buTUsIrfz6fTp03MKagC12ISpO8pWzGzb1lLLut2u2021bqpuFvWB67pGKpMTErOI1FK2Umop1+v1enl/KGRseyUc4O6mtK03EaZZ2kKyWGiKMAWZo6qD2CKmQhk0xDh342fsPbZg8MxEZG6DGwYxq9lWNm9wdpHABG/hWIchXE1ElOJFA3g5R+JCxPEoekrKdxJ7mkOKKDoUsnnV9eameluFfP50nnMyAwCK8vk8ES9V/XJZzext3azl5sHYnbyiIpAUE7NQnllE5iUnkdOyTCnPeZpkYghvrGrr9VbV3t+uqlaquaNWNWvjAwiR1jMx57AAEsFhFhIlSLDFB+8kCU85zVMORugNPUHGfqfIAQR5qQaI6oyoNzci2gOFIAIxy1ar5emi24VaEkoCPYEy0TlSBb++XG43ZzjhdrliLXNKfzl9IgBqiXiWJCxFq7lVjVibC
Imb6ba6able3KyU6u75LDKNZu6Olhu2sxjz5gFrDJqO2Tn7Ia3vdWMQQdtHbhWp7/AJhJwC2KcjKnR50Bkigt85gZNMy/REn3IOqE6knHm0Bu79wzp7Glvp0P39YLgHtR/pkrujoN2h52p2fEzq5Q8AEKV4KUQ7kEDhso7LiNnQ0ZsIwuGbxyQehEFEsTmM2EBVUJgKYWUoJ+TJWDZ5daaK6nCqlczWr1f/epmQP9FynvI//vDDMs1fPj1NOUtz3aDlCDn1TmB9fZwa6i7II+Tt6LKv26BER3ndfxtFNbtM9YMoiK/47oPmGo+P+vxR8/tjPIEJ0vRkdK/3eEZfQNx98N0jxLMNNyRRNAX1drOehW6ta4uLiKpSwEeqEhFzOhJwf3pY3Ie2SN1M73ZUs6Z2qd8YggQMGEDJncyZo7zDA1glnMXhih9We7uXRwT5YDM0WmQidpA60BK6wyPFDSKcZeDkEISc1N3IQQxO5rgWA3rrSCFhUrMkkqVcb2tOMs9TTsK05CRLjip4Y6JS9Xq75ZqrlSQ8pyTMpsZExIXISqlaFc7k6bp5x71UmFd37vjZHuAav2u1B2hi7MKWEJE65QHNoqWR8iTCxKnhdgBWqresApLMrfo1cQRTr7frr7/9ut5uv/z8cy3FXSO4TIQvXz5v649znmIZS63uHv726+Vaa73cLtu2VatqOjwwkTVw3TazHaWVmdXserlEA/Vtvd1nFqAtZ1CXuwIbPCXp+QAMFgfUvJpVi3REA1oOjVPuEbVWgBmR9eDJDlQnB2JsptozmZv+qKrrtgXsYH8TJg8f+6FWWERSJpYkzCJRPxa98gJFQ/p/90PbfVxMSORuqtvVVXXdknCW0zIthU3dWBJxEsngXLV8e3kvtb5cL+ous3BizuBEYEVyTiQTpSync0qJn85TSumUlszTJHOiyYvb5nqr779diuplvZp7UXP3auaOaJ9FzHs3yyzRsil0eAJYpGlexNyE32685pSmnD16clEDYOv+xdj4Tg4rlcwZNoHcPSHURAcAC3MpM8umutX6m2+/2RYXnjk9pyUTJjib15dvVbi41mhzCVpO+fPyxERWKhPNnJjYzDetaq4eQGNitZb15rWW69U0RDuWdMoyNzjPxmnuNmFkvbZMp1b/3v2qdwYNDeuqZw/dHQHzGdRwV/nTLueeQw1gQIqChad5ztMUmx0gyYnRcv1AGMCx3C2Pg9e2ye3+a7/7WLvuL6AeFGhvAiIKHz/U3HunNQlgVaLEFD4TbgnyHGKejAK/iYlSOKjIElWGZ68MsDOBlciYbuw3QXSurCRVFmJyUoVf9Vat+qauRlejm6X5/Py0fMr5H3/4sszz+XQWkch96KyT3CH3IFjendIx8hAlLTZ92JKdkB8aBNx533owfLjU+6l70gU3M3A0PLzzI3SDv80wDn6C/gU/3Pq/cASZNcyNtvKwgCdqfiDZT+ti3vvBLNM0U4/ReMehY2b3kZECjATRZuL74GZ9p4wtEEK6A28IzJ2aWeZMDNlVoXCqtoEAzPeQNX0Bmo8fXUUjiPCQ9xFS7/Is3KbRSlWdyMjU/PW6AeR4nqYcsNPcqz2FKaf0dDrPU57nGURTlnCkM0NNL9drylJ0mnJ+Pp8Tc/EojLqal22rtSic4WJIzCdhJttgbmZBDiI9C+f3RDuA9Xb99u3l6enp+fmJqNVE9V1NXTNHqRY2r5uaai2FiCLJCwRmeno+RawvSw4Si+lJIlOrF5x6zA5Tzua2buu311d3C0u91rDXN1XbwiuhWrQG9rCbbdtm7qWqmwXVrWoV2+12W9e1lOoHhjgWMrIjIETUYFGCnmpVNTI3h18v13XbStWiama1mkeTB2KL1HbaJ4QbWgEIcGIjQdQ6oVntg50BRPAkJGBB53ThL8ZoXcPCEoW8xCxTEpZI3ZySpBT8DtEE7qEiR81qVSc40SRTSlMlqtumtdbrmiXBEmOp9bYWSAYnKPuUUI2M2ZOkk
xCBJmIBJ7AQJ5EkKfM0JxFelizCiRI7l6rFDbrByIvr5mWr75erql3L2orQg/Eh4F8RQ2v5CYEz01RjIo6Wbh2ihwlHrsgUBZMKihTM6uHgMQKRgaLmQFhyTjlHuAHRF4za3h2bmJjV1MtmUCJndzIwE9zgEAcBVkr40oQp55zzlOcpJTb3zSoBoMzM1TSCTa01tMNUrdy0luv1TdXKpg7m0yeenKU1GkFDh92J01vnpGZJcwckGkL9gZKP8v7OphuEPnjibhC27dZdufcmXM/A7OpCUwD6pjEa4Ol3ov3ew7AnATxsvDtxHkvMkVXH3UFNIiQYt2+FNNEpggIHv4sFIo6uFc6RqAkxJCY2BwNiTCCLmgoJ5BgSR6b0xNmJckoGn1gLk/bcfZb0JNPCaSKGGSwUyFbNus/gvdcTTartAmNsdyICPepeh/UAqHNX7k8hIqbejXIX00zci7eO+ZXtk11PGCcP2Y1QPqKhNx1OOHqNGsZ1J6m7d04ppZTlnsa4nU4USPa/r4YOTTQ+P+h2TRsw68F4780i+8t1d3uT925O3DBo0Sw8V9JEhBak2G8+jPWDMhGdR48me7A3oQC7DX3XycVYPEEGw0gpi7AGSm5O7tLZGxtBncAJvYH1Mk3IEo4pEAiR+EY5ibpPkzyfZMo8Z88J11WrBfRAJkpqbIRtLXATsfboJZmxGVuldatbbfPraDD+3cfx+w55AK+vrz//7d9/+umn83lOKVJOudsS1CUY1vVWtrWWUrfVzLQUAN70MmPmn/7hL8+fnp75eZoyupcxieSUT8vJJ8sR4mYSoXmZVfWier1czGzdVncvtXjHSghiiRacFq54s21bI+IOINrJbutqpZRSrtdrv+5+VzX90CkwtEP7hbvTVgzAVjc1e3t7W2+3rWxbCSWjDuXXIN1BEA4a6q6btkWQZ2JhmUZcZ6B7hKdoChuEiHqaa3iihVtVu7CA2XKI9iwikWmZWztEMLkQS7cA+9Coqq5byYTEWKY0TdN2o/V6rWtZ39Ysk/3jRKfzum7vV5OJeZKcMGc3hUpyRj6JMCg7BDG0aUrTnHNOp9MsLJNkIkJxN7++38pWb5d1vRZXaHE3L0VD+HkXotTwWUSIwBQNPyQliXrP3UEXMxiBdsgHiyKLTJJA5AQzWslVrVQlIDkL82masiSZcp5mUkBhxmZRf9EbjROxCLHUqIUQcAKFug44ioOSg9zLelPTvCxpns7T/Pz5EyVBEqt209XcC03CbLW4GkoljU4X1ayWequlfPv2Wy26FQCSzz/mBSzWapkAMx0DjPh8a3EfdHSf/Tu4ZHg4P3LJ/U5tLkHhRLpj4e2cwZUftka/skmpIaBw8DANtr3z0Caw797EQuXaj902HQvdmpW2+nwhCvg174oDevNpD6TKJs7jdHYhFwrb3YkCFcbFhQExYlDkPmgSsBCQCInlTJmEfGJnfzUrLoWooiZhyTyn5Sx5IYGZaYVFxi0D929/7y2LWtyxRi1oIjTszn0W+tT32fbDVPPdaYdFoRBLfc57PJR5TzV9nGvqvAFdPIZ094MuyI39ERGxH7xB2NEymDnnaZqmkCPj9eLCYPUpDzQO0u6nPD5lOJnonvACriNEOx0Npq6UBJ1bz13xFtQPi9iYRVUFcGA0mmNmF2c6ZjsN95Uzy70SRjnlnDIRHASLBTIiF6GUJPYQD1hlFmbWOc9TDqQQB1urtksgum01tNaF54iFuFtElqvehOnr6yUn/vSU50nOJ1kmNiVXkpRYZrBUZTN/+XYzq5+eZJ75NM/LlEultdDm9X291hZS4KhjB1nY1MyPgbD7WLubWTWrbhpNAqlDAXQe7ARs63q7Xeu2lW31CFljp1eR5myhSBsGARCSaZrgHohd4WGLUEqtuq5rLKu7lVrgiAL8KA4OD0/dSlk3dzfTAZEUEObqYDKrNbbZUXO8Gx11dheOP6bRhznKjmopampazbR5iVtuChDKdN+EXbRzZ
FTuxBKspLWNHVto90PurksONIzGNKOEjpilYchTB3wh6doD766TB15KFDjk7pGSQw3VWTwSB7RKppwxzzxNniajTJwcSVzMkyJvBOOsws4TkVAWkUD/kczEVsxgRSvcdVUzX69brbqtpW7aMNQdihFV3/1/iNSBqP4PSd8bAfPB8xynI6TFB5zJ0MrMVL06ECn7OSV3mKmBUJBEJGdjQijhjdPKlGbqJhRIQJxJnPgU/jUmYl5YZsoZSACxnBYyuCyTzBNPuQa0i2vVNkQPvIiqXpVUydxVzbTWcrtet227vL9XNWBizsGbmDgyn2MsD5TZDOc+2IeffQa+b8E/ThV1rbYL7PaQvhzfNffHzYfFs1P18YTGeTvjJhD4wysdcshBaBCK92/Z7901f+wvOLxRTBRpSRGJatpGwOLG1978PEKEJOQEiDdQURCbiDXgUBeWOTB+J3EBoCWlzUUpExE7UsrhSjJVZim1Zoudxt7EI/mdATxecp9MtDK/R6HLI6vrTrq3edwn5XFfoyul1LXlmJQQsGM5unrV/09tqSIDYA9njyXdXYnD0xCJvvdrZ3tdOyIHCxAihsPMufsRpEsK9Fy2Tsl+GPT+E0DUjPa3Gjrjrp6iV3Y1+z7sb/YGIMMucDgHxlRT75q2sqPH9xVp/tAjoWK8XrflmSiwehsWzx1najln6k6qwpQ4ejGPoqVupDs0wFrCM8cChsEMhKpizAnVxCG1Rk5aUkMpFkkDHqAjRmrITkQQDpUL0dhaDebs+2ZpJPegINJjrN2qlVXLra5X5Ezemk5G2jdRAx78+vW3l5evddu2dRWmqI9NvedPpKnDnNyjz4Q4ZUnPT0/zNDGTmZZa3K1WDdK5XC7dY9pWN0Djiqq6betaSqm3rVxXZk4SvaoULffGt6gfqxEbHQb7o9bsaFEzAhwMTgSwOeBmxd3W20W1llK8KrtPTC4sKSDbmYhJcmuIMKrfGpQbSSvkTtEHCyCR1jmWeulKY4fU+5PRqAZqYj6+btYtN7Tuholzt+H50flCZGalqjOEAOZ5OeU8aTUttZSL0PT8bD/+ma6wmoolmICZTOBu4BuRiygL5XmWlE7TaU4zObNL2er17Va2+vbyVote3m+mHfmIeylkvGBU3HVXFEXCMxFH85uUUy/HkpRIEkkaYfjGcugARnXYhVEWuF4v1+2GnCXPKeflvFTVb6Wo6rYVwD+7LsuyTGlJGSIpz1PKT6dnIvJqcGh1AInlzI0pxLtnlqc0MchLJdCn08w5+ZwwpauWF928qq0rWjNcqK5wlPerlZpAQqRaay3X6/vPv/x1XW8//+0Xd3z6/Od5eVLV6LDA3vi7mR2J01vhU+OCwY/8YJoPo+doxO/SorPGjgBh/dxHFWEomHQfjP+u3nB0bw55dn9CcDQ++u8BqN6PrqdE7lu8pzbyjjPKjiZsuCl4Da+KSQQTMUucEMh75MaBlgOEpAeBmB0sAS7IRISUkHNwgyz8aZKc0/nTzImv5yc13Za1lqrXWqU6s3Nm0HrbpJgpRJJw6ho5EzGil8khVnTU3e+1pXvmExirI6jcJ30/dRdwQ05/vGd3LjPHonS5efCcHCImdwTQzK+Dm3+/6/5H1XKIPvjtdrtc3sOUn+cp8jRVmQB3AwDfiGie55FqFzGGEUU323F7jvCaDzQTswr4gbHF5xpJS6bKzACzeMDVMAsSoSfYATsPPfZoaOAVOSXKdyo1yNS0RqZHg89NwimFROv3iUxpkchyvamSYkrplJMbSjFi4XxiokAp3dScCO4Eyzkv82zmlcnM67YRcN1STrxMMiV5Xs6fzos5tF4BUnUHVEFEy4wkoNmECEBVrLVcSlGjapFLHfEokENya/F4JLk70U4RXHJ3NzjDeg+icDSM7jy9qi3cZaESBQJLkpRSa8obYXg3c7daSq11OGEi8fKoS3Jn7LHiRuRAy0Cuurt6uqOmZ2G0YMwx0/JIsg8Hukjs+6jdruuF1
jIfW4SPSAjNdxiivYEMBMW0dr3N+Gzq9FDXe74hN0nsw4pv1jp3ud6riGj83M+k8cDOhXdP6YPiQkCEB0NzjQa77u4EI0ppQp6QJpfJnAys4IhYGknhrh6SOxEbtAqhsiuVtVxfb6XU29umqtsasEdR7CcNQVyi8qpFSYkQNUAYu21PExTqaDGdXd6vFgDiY348CNHm/Ha9rtuNp1kWYoBShrWiqWEKqGkDaDdjdxbyUB+EwUjuITIbuplw6FFJZEoZoJZzJ0Ii0VvWG4RnEL6zWYv/ucO8Qbo7Sq3btt7W9bbeQhn1nqoWbxfWQLNgHiw/7AlFOBh26EnFg0fj3hyhZnl0Guh5QCMvaZ/RD8fxw++K9u+ef3+CUwvYja0L7C6bcWFcxeNzdPdXX7lm3IfZCvSt0bcPEY9U8QZVwFFxEGKcIoEX4IhUBSwoIXosRiyom27ds5olMZHniY0oAckt0CIaQTeIcuybO2hVHsz2sfWP5NrX926Gxzx7Y0R9zscJD4J3rPV+fxARx1S0kqJHRzdRd4bsX+yi/f7k3b6P38B3gwMCccFC4kZSE3eAsSA8uBOzmgokRYhtqBvu3rRY7qZn1LPtoA594zahPuZmDLZviMOAPCagw9Y0wdAVmhEJ3dVWIXI4O9/FaMPCbnIjDL6eGc0cw6Jgt2rOu9LhIE9EFm8AJ0Qf7z1hor8qB7Scd/01epxHO7HoWjIlr62s3AFE90pzYiY1VuNSfUq0FazFuxLSSGW00Arh4gPorR93oj0zT4kJZmUVZJfuA+oOjShIXpb5fD5NOS1zTikt88QiMk0iMrfw8GSq316+fbNfaynbequq1zUAODV2XJNhjJYp3SYUVdXc3q9XNS1aW3YuMHF6Pj8hbuFmtTXZ86aIHIuBqYvLuy3ngPWkgfBvxPpSAz2IfChj8sj0I0lwMW5iDMSQliHf4HB57GrukjmYXLT5ZenWOIibl1668+hRH4/bNHsl1K/gQ93SamvRX+bBKQEH1BFVcQqomVata7VSE+mU5OlJP33RZb1NdinlutZbBHWJSDIRWGwhE72upvT1/aWsul3K7a1ote2mBGZJxMxTYsmSpUU/Jdpxxzb3oTy1DANJlJKkLDnLNMk0pyQpTyJCnMBsNPwZrbKdAAep2Ridm/2n//T/S2zbttZalqfn86cvMs15OXNK0zRNnNI8G4EctdbIw2B3NluWE/IypXyaTokln5mJ3RSwzJKZJaWcMyXhnKv7layaqRcU8hr490TMmZLIZFa32+ZqpgoHqYr5uq7bVt7e376+/HZbb9++/aaq67qJpNboDYApeoIUg+CHaHS3HnaWiOGSbqnFR1Lp7GnwRBzIfpfrj5R1uEP8NjKMjseRLR4z8A+kToeH0jAXm75JNOJe4zCzqiaH4Mv4h/v51INl8R9LdC0WkR3Fr38dkPgOErCDhDrKXwh+yk7ewloc7ZOZCSTMBmKHqkcjAmHJaeJJMAs0goTCkmSao3coRzchGjiAzX903HjBG3EUsYhEmKbl4rBg3iW4Dyt6zLz77wjeu2W8+2KoAkNFOC7o0LGGlxvHax5u2r33bgfCRK2llDVctterDjUjJZmmqbtaWU2JaFmWnHPYb2Fno2WM9v8BIJqmnFKKDyLeilH7GOg/rWSGmbj3mGDmRMRmIPYcPkLb85RFJKUU4V8mgvcEp4CIYQac3cz0MD0oVXmrnWMF54YpSYIbMEoeCUzIOUsSYQiDE1NOTCzIRO5bIWptchNRIiIWEjHF+7o5NbkLYpCoJxBTjebZpZQwEhRErX8okwilfKqeLrcts102e7upOntIERih55Y2pcFRvJTfibU3ccbM4WxxaeWjzavsPfeFRDilRAADOaWcM4tITiwBTM1R+aVls0Azul3V7LatAJycmAZmSahInTKjUim66BZVraqGhs5LkmLxnIyoKX/Nxto3XuxuJmqdW76zOxrVHqz2wQ2HAdLNZAhR9EeMzuIc5sKdY
3P3W7Y9hBbwoYGruZvdTdD3i74j3eNbOprvdBDiPVP2wTAKFTuweoncPUB8Azc4KjZEwOLMRqyOqroSgyLrhJghXBNMyhVWcX1d12tZ37fr6+aKujmL5HkJNFlmbvl/7f3xgLUyFLew11t3+UgfaOi8EloMWhZ0iyfGQoYqPUbnwPVy+fbyopEGQZzyzFVr9ZTz8vwUWL4BjRBY+mpKDnJj1WIK5omoqRrMzGCnxJI7LD+ELQkxlKkStHGXvkjCgUfWql/NoBZaJtxrqeu6Xq/X9/fLVtZ12wL1sblmeJjdu8foQcHeE+R72GgIUrS3eMQexE73uzAGvi/aH+Q6Djd5tDg/mPLfI9EHC77r0LscOdpGUR7meHAXHiQOjXBD11clOqyg7YajItH/a/lt4f69e2InpoOra3/BgFOXtgW74SLCKTVdfG9ay914Dj7RxvJBbdo1nj7bu9uFaPfcNC1h91DgKGbxOKuPAnj/7KjR35mhj3R10P+PGsCjbMfd7weToUcwI88uitqosafUUBO4nUcj6T0aKLiPYne6H1r0Shn2eg9S7F6rMOulyaJuo3akGqbDlexD6Wz+rWZuNwyJYc23/k7uxxn35joeLL+bGQTt8ijEfRBiBkWBkzO7k1Bq/hH3wDsJCmvkRQx3rQYmylGq3KQBOr5V9N9yN6vaRC0TMUS4qlcVgxfobbPbpqB0J306AcQGuivCJKJHh3xooB1BqXGlSFtqWcQAnNVmERPRlIiolkLkdq1d3npzO7pHu+pQyJ2YmFLgtSUa/oxqFj3tzcL9XkbquxAkOoUASGzEZla1atVSShMAAHUm4C1zXKJ/tyW7Y2oRH49GDfBqRgDDAIc5ItWxCe9hNqHZzSwduGafqjZh7R8+8pE7tjLYSPfsxYzwwwl3O63Zb+E2ImE00GQHWurXMZeVQOau5gAZ07e3d1Z9/+2399c3aD2lBM3fXixP9eVXvL7x65XebqhaS1ndrK4FTtgERlbI46cSu5Al4fR0mlhE5kzCPAlHfT0GQTQMnWbHB08MmP2UKWWOsHpKlISipxKPSCmYmEe5ddew7MBC3f2vf/tb2a7PT+fTaeF0g6Rtq6/fLsxyOj9N8/TDP/y0nJbl01OepyzZUi5ab5taLfrtRSQt0zVJeno655xPc57mJGmaclZQBYrV99u2qf5yeVOz03LKKZ1SniXX21qua63b9XphILMn5kpk7m+v327r7bev3769vV1vt/fLxRGoPzzNc05TSrlV1rrf65lHjoyGW4fmdwxdRzrXpO+4ecJZFQnzRLQXBbWfXVnuWmfLlWk3ehAhH0z8h+Ojz2D8HCKQg2N1+j5eUGq9beVg9u8j7+DmrT0otQbQDXQRHrwZPEBZ+oy1fhNtWkDsEQtiatnc3PJfW1fyoE0kceHaEAFBTEYUFfAmrT9e0wtCcTho1qE93xctEo38czhGBllsDALcqJvpYyrBH0TpHlB6XIjvLE3n6PSgQH1PFeA70X7UGbrieDi5YWoKHzlX8yP1egVmCvRxZk4p7WJYhHqGfIuNdokera1CD4g36HjnIcV9hFbHkMcnjWJ2VegO/O5Qts4B59DnmD+GsUJBV9WjLqXmonvNKfeaW2YR6Y1ig5hC14xMYJGcOE9JSLJMbtDNHW7FiKlqldR6hblCK1gokQjTEq1DEonQ8zKdpiQEAdy4MjG1RiSSwEzkZbttWZCEiHnKsxrWTZl5mWZm1iiur9E2opXwHY870c5ducVgM6EHtalH6xbpFlljwhwp64DVenW3UlYbPT8a3ISItJr21iCtx7OgcCDK481UNWrbtngH7pnhANwc7L15jUXe90N9m9PYNoFb1RLeDktOzNwSB2JEGP/FvuIHQ3pX57oRSh+k+4PpjQ+2+HDaDwXzYcMOYr3fyRiqLfcd1jdjsK17yw/kjvBXrNv2Wsv1/VLWwm60JHJZr35519vF1wutV9xuKJvdrkWr3i5XV/cVcHIlcmZko
TSleUqJU5rywsKUU+DXoyeERs4FSa+AaiqOhB7FrberjByFSP4Pe/bOdtwl+12+2DjhcnlnqDBNOdVauWyX98svf/uFiU/L03JaTqdTAi3LkvIUyZxqagRz021llk1NJFniGTNPwpItC6YcsP2b29t221Tfy2ruLd1PZE7JHVg337btck3M03lioqi62bb18v7++vrt68u3rdZ125gpAo4pwNtFuGHj71CfncvuPCb8km3btXIubkWSjT0dnefNshn0z8ze+6Gj+4Tb7wcvemdd+2kf5TR9OB7IcizNePQga3RgryNyCjogz8ebh8zsSaqtbALdXo/bo+u57V4U8grdgG/Si1suX0u84HatcPRWjW3avG7s3OQ6tX4t5MSQpmDgoKQPO5y6kNtfYx9fF+QHY3dYNhiGMg3DkA7EP2TW3xfthxc5bJu7d/meDtBfdye2vmrthR4ukIFHdvcOd2sdru/Byrz1QoaI7In49z3audePdSv8kCl1f4yXvC+i61Kpf34vvBuTNtvtrAYj1m/l7ixMzsfiNwK5w/aE4OOigx3ccqs6tmB81VtWiyRhkYa1Z+4IMARxIkV0XXSDOQlRApg4JyamJMRMc5bTnBkuMGUmk64AUc7MAvZirpJbYCilZGamJiJpEWY2UgKCfbEQcxoiO467pq61btt6hdW63XLOl2UhIKCz3eNGCnjt0RS3gQvoRBVwRJOxWBVpld/d+DcyMoAIDgW8FlN1GNw8fLR3DMiju0krk6itvshKKQFOvG8bDN06/A5BDo/EHkkT0UseXQsNZuREvUQiofVB72SDoRQw79bIbg4NegpqOZzwaKT8nkT/jjkTJzQTLuzAVtxK++PubueAOUAQxqYOt7KW6Guz3aop/l//z//v8rT88vrt/Xa9lW0tqwdKqrnVDDS/KItwkkC2TSlLyhCuqRIziQZXYOfe/WIEMIKnB5dOxHzMfm8stedFOyL9CeTDfOgsbGzIe+GnZlVrqWWtWyGsbpfr7bquZv76+p5yruSnp/OnL1+W82l+Os9PCyc5TSnn6XQ+E0t0nam1VK2bbimnZZqXeYYDZoiSFacv0+LwyVx8u71fV4PetnpdCTZnAXy93Uz19eVb2da//vzz2+X92/vl/XqLJMyUhHNiEU6ZUwKNbppDJ6Mjqx2UEUMesVjsmN77mYM59hnC8fIjhR21gOMJXbN8fDr9XdH+8eSPf3oEwBlEfBdNCVfeAJUdt42fzf8pHI4HNLQvOFmDDwvC6oXdLc+EumgfRaneBSiHwG7GOnave5SuERHUqffVYAQQpAjDA6G86Q7sTty7fPfWa51AjzPQVZHG+buq1rykdDcT1JMCxqqMf2ONjpPdZSpCEWl91h72S9hjQ3v5znFUOeJvIiAKewIzu61BmGB8iJtwgAPeGUgASilh4VO/X4hP6orgmKTwyaPb7vH7sTfSEOpHq70zZ+KgpUbvRD0hIaQPH46hXgSMiOrB49Ls1KZ9HuelUyYRcCwY6UTTSC4S9mo1M1Q1EcrCOQsTRcPfWp1ANGxugWThRCngSghMKszLvEhKU84ismROZETOsETRa4QYLg1ZnJe85JS/fD59Oi+v1/rbW32HvejGJDcWZq61dVGpqiyZJanpkbHcWe1Wa91uWtb1lpJIzglALRWAW43C4mM2+pgIEUrJw2QJIRjOkoPYaszIXAGvdXO3da1aLLZNzmk+5d1qdgDk1bxZ517ZVCQwZAYlHQmu8c6Q7Q8KTDvH3ayZ6d0rFXZ857VCBGYZQOZ9LzEPB8BH7PYP7I9oH/bRuUXNsmmT1t/2zg3Qx9FyjpkI7iwNR68VxgkRP75HS/N0kFCtVUvxUsKrWaptm17+93+F8OvteqtVzcycEYKXhBITKAsL5SVLkjxNKWVJiZKASMl2EPEWRJbuw4gUkRhJM8BCcx5R9pDrEnHHFrNsbP3ICPoUBbM4Ll8op9FlpsKdtF5v67WsWvT2fmWW4rqcTp++f
F5Op88/fvn85fP5+enLn74sOX9+fgbLpmrul3WrZrYROrpqBL4y80lyYnrOExPZVtxsfb/U2wY1UktJ5iWb+W1dS9m+/vrL9Xr75def3y7v16Jr1abOJxZJkoRTYknUMLzvaOD47yDNyNH1LiE+CulOIePi7ygHTX4P8ro/gX7/eNAMDo97rFmn7wr7vn/QcqPuBmwOtV2bGa/HGATUgus00taaRGshJ4mQastzo7DF++37nXulxeGPtrXbU/qbubmAqIv2oFfhYec1Ox9jnjGcB9+bOvaDQg8QowWa4I894mifpvs5H5tg+Fn6ydhXVgZPuiMAYCjW/MBu+O60w09qjs0wP2OqDmLyuNR3oh3d1CZqeY7hCf9OdRIRHUT+AJoNMT/0gKFrPvRC5M5Ount/L1tjpmhcTE0GS9joIdqH5/9w8/7qjytH5i7ufE/SXagP9w1HYLSqEXdAp4a3EH6emD6Z50WSJO44diH+gj2qCssySc5pnqckksgEIYldiFJzfDpT9EOX56d5mfBPf/n8px/OP3+9bfpeSvFaHBy9XEK/KaVUVRaXlEx/r187UNbr9e1lX2Vh6hWH8V/LvQ+5zszUQUN53GO3EiLHubUoIAZiRxoBaiWwu0U4T1POE7d8OreqgLt6cxL0zj/g7ls5kNFQOXtCV8+dg5tVd71T01qkGvFOwzlEvQDigJQtff+0WhxmRiuj4SOZHBS9ltHTY9DdLKC+w9q9CWPVf8ceGnMZn43kAI8qkqGN3vdrP5jNaI0JmQMAW7UCDnYSVlfAOJKQiTOlsLJJiDJIiCchYU9MiYyNWyPKMH+Emy+GGAFDIvvG6P5Y3zl2dM0bbGXX0BvRH8jm3r+Io+UHIjXfql3XApHoI1vVmplLBMJtWwNrKU/5tt7eXl8/ff5U1/X89EROKWeZpsT8aZ6dSJmMkHKWnFuHXNAEIodvG7lrKTBj08xAYpC42+W6lVK+vXzd1u3Xry/rbb3cblvVUPxFOKWcUgOajhyfIaICS4tHG0Hcay6NMkLn6cLqKCDb5AQ7u9OEDhN4EO1jUe7NwAf+dqRA3Lsljx/i2L7qe8Ke+mLHqrv73bs5Dor48ErvJGKtbgjuzMIyWp+3XktMAiaWyO9o8gvc7eijshwXdDV9qJtEwX9i/xtH+spArQvVvmtNYYRwJ1FuIMg0wmJ3ww9f4DCNObL3D974JoTAHT7uoEXhkQqIiI7hqbGsAwaHx7o0BiWN++1xBBrnPS4jjfcZHcC6jGzLcv9GUdK5jYS4+6IJDME/JPTOxO4/Ofrwjy80dIXjnYe2QdZiVTH53Nhr8La4G7caQESNmQfB3GsObYAsAn/AkEdPu4t/R5WTpFD10JEbqNfvMEB7tdNowCQcgKEyzZITp8TRWyZ8oNP0FI1CKbYDuRCIqRTdtmLOaq0lCDNdqqbEavx04k/X6Tzztm1aKwPn88mdWRJhb4GTUmKJ/+4279Ehj9v1Lf32y4GovK0Sk0xtEH2iSCTllJiTyNz2QdR8dJoefQICSjAgKYSjoF8JSHlOkp+ezs/Pn7WWUlatdQujvJX4GXURbqPS7RBiH6kr1HZwC+IbTHVTLffsLzwzzesZFfzkhuiouRsb3FWG444KqdZY83c1+FAv0MEax4vd0VIoeh8U5J0vB3k10g/UcQGD3CJFmzkRWJqov9dze614mMtgUri6bXVzGEhIWM1AoEAiYMmchSVLIiHMgLS+HAHj6ewtHMlg5sxZiFNY991gjx89hYqH1T5y5TDgEDwwmTzyWgm7nOiCfF8At11xAahUcwByW6tOy7KcUYpG8pIxAX65XImJ3l6JaJ6maZp+/OHL7aefPn35TGrL6fTlzz9O8/z06VOapgJXgjMjKtolwRxbgdv2/u6qWgvMUkqTCISR5HYr315fr9frv/3bv23r+vLb17KVTau6xXiTpAD0CPXKzbmjwgXZhsbcPrEHtQwBs7LHkLt5h91K29nukNpHFkkfL
JPBxAeN+aFZHH/wtX68w/GTOxlw+KVLqS5hiY6IZrG4bt7f+5hh141pciay8LB2rTeEjki0DaKmCXLrONBiO43pDvgEQaiiTAhEqFYAzk0f6PU0fZv0oXjUPnexa+GLb1ord+iGR6neRIOZ31mc6PhDd6d2lnJwUX2Hh1DX4D4+aHx2H98B9bAnP/Ca/uBBGui2LPcctO8I5sNbObBtW0pp2zZVjaq2g+N6X+Wg/ODMR7Y2zOj42ToT9heKLPpaKx1okohSSuNuPSOvRVkH1+z3FKAhyAa3dPfdYXpQYlhYIHYn2ruNGl6MYLatnWFT7iK1uumFYw0CZ5coZ5aUk/CURZhTSsJyXqZpTu5qbkJIRHPOn5/OzFRVATJzOCcBhK5rffl2UUj13NaeYFARqM0/PKenhZfk10spWyGiT5+e3UlrVOc4gChPI5ZAWjku/H2GPJygzc5y9OxcBkcdHDcK3cs2QYRIkekrurOYbl53v3bPneLm4YIwJeGURJKwcYhts+jS0jJiwnaNgPPActrJdmhloW1w1BGZu5pWN73fYIP59Kw07NGzvmy7IckD4HFcSt+V6fe3HzyZ23bhD2ACd1N+4MtDd+5ldGh3xKjlkCgWi3KFu/v0SGUML9bAhF3YEwMiUybhJEwtjs2JWmuHgMbvjr0mse9HRRwAkxEMaEiMNDTNMTGdXTP3QGr7/CCnB3kwD77TJ6HztYcZMwepl6ItHSAlUxtWlO+oFUxMtaqbX/Pt2/zqwKfPn2utJDzPExNNy4IgOWYSZneQuWq5rK7a7HV0sDag1rqVcr1ev337drutl8t1K2Xb800giSJM2QJ9xEPR6SbWMA5ak8AHvo/mfmictckr6hGLB6urT85H0b6vWWfWuzJxMBjHaQ9RrXEh3Vvnd3LrAxItuqsAbZff6wcxKseQV+M77i+DpkSHFGLmyH9rxbEj5h0uEOehQ+/RZ0YPUB3UIgI3RyGjvxeImg1OIO50HjKkeQF2wTp+ifFEcshjYSH6cZiNzrboTs49TmznC8drmfluhY4qVNtwxy9jWnD/4ePx8IZHu2JQyNhHD3kStdZSSljtA59LJLJI2+sf1YUH0f5gwByz57oH1j/MHtEhSN83C3cokX0EYXcd1FPEK4zHxXZ0BxGzk0XuxmHuOvdnosfXbrftYchYq4FLTS2UQ9EeI+foZA4mF4aExeMAuzkpuGRl5iiCYTYmcqEspNpgrHrIn4i6zxVsxutml1u9rboVrUpmDO9K6cEt1H3pv1/XLjBBafmejpZNH/ko0ckvag2JmMmcnYWVTXtv4Ps2AD03XpIkis6+xALvb4ZIRsg5T/OkWky11rqtG9wTc1h/RBw1kt7T9j/STUx/NAutpqWsWkvZbqb1Xg84knsoDOCdsHZHJx/O7ks+vn1ko8ejqebeyKbbq7uGcPzlqADd3WRX2p2I4cYszRBByyZnsPtBcQl1SZpoAMHJlVES2yS2TERYnk8ppUAEArpHppk4AEX3tF31bzK/i2gmZkqMFqCnDqvTVVqiAAZrKoJECx6003aFKfpKNCFwEELHeQ3t+6hGbcWYqajLWk8nt6ipjNpyNYeng0WylU3V1tv2+vr25ctnIprm6Xw+TfP0z//8T0/PT8+fPi3nsySRyN4otWzby8s3uIm7MH96epryFNCJb6+vv/z66/v75W+//LJu5du3t4BHHpXokiVLzilNvQKHiZOk1CrSIl3Hgl0MFno0whSmruj6WdOLQqR3OFEMsdF1qAfBQAeuPT4CIEP232sAuL/8aJQf5fo4+ffI/qNWYfcftdKwOPf+2pCt4QpsSf7BcqSlIPcI1IArv9v13H2IvbCva4a7lkg9QMRgsuZgZeZDeJxGCVbT7omo6cgcdaocbvsgU3/wSRzCz33c/Ua9VIDvmckuTWlfxHEHfuQ8oUaj2zpj2g+vH6d9SAN6UMLiGK74fh8M92qUFu/cx/1yuahqNAuepimM7zCpay1EP
ebRrf8HKjo+F0D00fHDgUPSO3XxUUp5UERoN3YicT0xs5gQU065l+F5BMXGaTnnY96+A9vhzkTdndb0klZxGshs05SJoBq6njQBCpcmd4kciVkYWfi85CRsxQiUGRMRAe4BRVVrUqsgavvCVB2+JJ6EDCDOIDdVEMFJhJd5ylkcUpRf3mrZ7LLW10tt7emZpzQxUdTIhB7iZlVN7fdi7Y1QuliintHczE8manU5TZ1tmgxbMzO/Q0adxHZxtqvxByslJj6IK+A7aG8VT52Hdur/ri7cdyTcor+Luz64rPdXO67ufoOdH6D70g+2+l1C1INy2pVf6rmy+5373B1euJkg+60euHMoqdT91dwUmsbLD+7Zw1Q3JoEWdGiOx4E0LMRo+P4QRKJpqLcd5+vIKe8mdswIh0+Ax2R3dIdQaQ/yZIDqNZI4oGEB6J06dwudH0U7fU+BOtroPfhHnTQeLctxWhSHpJSCwkrZwr52s5SSpORmtWoppW6ru2dm6T3WIkXler1dL5fr9Xq7rSWwku+jQnw00fuf3AOZw9k5cjvQZchh9fpOGGJhF+CE4X3us9JTGB7JYIjkYcF2F8jYO0TD7Kbv3OHvHP9B0f6dTx5Uivvv+Phhn8I+U81kZ4YQHBzeFIxcM2LZ7XcM3wE14jw4Lfo8+BASh/fZK9PbV2gv01dqLErTke5G0K/adzRRk+t9Ib63Rh8nKsb1wFvo3iYZMzV8Np1hPcpR+nDg3otz/B2HEvP7R+/x+ON9DqcBIOupJA9CnQ8bYPyMpxyr28clIdqHY/9OxbxTgUJ/BTM7W0wFAHdm9vFWoUBH6u7QI+4G0n7cS5NBK41lDaVpz1cMF3+ShtsV+zwQ1pt3KIRnT9Ew8ybaW8Kge2CgtYKQxtdlb0vC0ZBSndRD62UiuBlxJF/RmDwnWMdvP47jrvgN7mipZ3FZaAFMYBhR947tTorOw2Kk3GMqcvg8TiWihtZoCriXCrhJIlAtWynrVtZ1XbXWsMiiqFdrt43QsFuHkOjsibiHwtid3Ot6u7x9c1et5YFSW4b80clCfR8zE0kk0TYVmHrsIcCofUiW7/Eyah6VLsUOUr/X0cfaBLsI//qR0B/2AHedhjtbp4B4iez9CPnfL6SbR+qpOEi1ubQCNHCemIjzxCmqd5nJIoI1UM5Aww4P8d6EfNPauCXN7JZ6W9Qm4/kglnpXIqLmum/VIw5XKLN4wENS1/n7mh5X1u+TBHnfQ+Ru27ahW+0hLN2FqCGeMVHOIbglon3TNH3+9DnndH2/XN7e//bvfwM855xzDt7l7hHzm3IW5vV2Y+L3y2W93b5+/frLr79upb5frh1MvhlqYRb0+7C7jxBmgG5OU4B2AWTuTr3G/SGdx4mMKOgCzddJQ74QwY9qQbjw0HD2dw2jJwbfpTQf2GWb77iEqQcaO8kdmPK4w7Avjw96JP4Pguq4dqFHRo8Qapxg3x3cqtFp7OZBdd6GC2aEnyfAEaSjxbUWKcJM8Ea7+0CaKGijCrTgKKije9Ilis6hZi3ZoSGCces118DPhwmCkbf/9w/0B+zikx7tgYNkHfpBcNljVfeYqvHW7fK2WJwSJ6LA52v3tPukivHQoPMjqcTvxw4G4xCRT58+PT09BYCYuw+ze8xwvH5DGGshKR5kE7tjDPbIkEMaPTzyu0SI/XGtKJasEqLNOVtOqUFMRi7UTqvm2j/mFrW/aw8TrpCW0ht1wh4Ocm/Imm4gYpFITgILCUsSzjkt08IEZk/S4tynT+ckUouWaGumxJKXJRMhkNyqFgeEnYmyTDknNlXT5C5uLGlaFhFJWYRJzVfy0zJBpjynZ5J1q9frqmbrpgCnPDFLUTPztdRSNeLx47hv6jos44O62gXg71MzEHuzS3ORQ0jkSAKRLBsOykD54+TeS+S9Yd0MvtaoYSxV18d3RxN3zwEzh9XvZqY1btfudnhP3FuX9zcmCsUs5qBvBz5o+d+X64O1NQMC3S8/1
MKDXKfmXvuuydUHNQR8f58oAG+v0Obg4U0a5/cBxUNh+LdwUFfFWi5gtzL5bjrunOSDz47f+y/cZTlzj4HhsNB0f8lRMACNkw8LhQ6OwbvJfLgXMx8gNdCS8nbW0OetnSsdoI268pSS9ISgWraiqlPOeZqC+wSlhY7NzKUQES6Xy/V6fb9cb7dbqdEvmOggOLuhInywbLpaK10I9dExDXCk71DRkOsthYW6V6Std0wcWp0JmuH+IHG7/fJAGLRLmkFYzVWwU2c344apNBj03xft31u7+xeg4ysx7RIOw/5unp59v7QPAx+Uw2D3QbPeqIGilIWl2+z3R6eIIWQp5PRhYvubN++PHyphu5joZ9I+G3+PFw4u1f/pg/o7rOPA23YfwFgO6ltx10gOjkDe85zaKcdF7Oc8ugpCDf07axrHSLVrWVB3dva4XzPBh2gf1Wjj/eP3UeHGzA+i/btCvd8efQfQYREgBGYOJ3R7KDcgxHFXomjzFO/zAUpw2O271EETVOEsbRqdcHeMhFUlQ8i1niHw0ASFG0yGwRyBvAq0HmYxXpbAwAlJhAGb1vuLtJcyAzd1hIg4STTlsfC9AyQph9W056j9nX7t5l5Vg0+1uWTm3thu/M7t/9I5W09mHb/HhnFHL00IXkxwqYXcbVvh5sTJPS/L1Fukh50KglYluksk7htuLDeo9yCJo5atrtd1vapu1ETIA4s5uMgIiI5GkWrXgsWDBYwHtRozHHY2HSyku72BYbV/PIY0JxD4Tnf8IKGbXU+ShBDu9AZTPGpAiLlD67ShubmpwV0AashmxCKCzClqDxt2IolwBJAOZgATefdmDKaxv5b0h1L3PPOQ601TiOoEdP68M++DyRiqBPNoecLdrt/5TucF92SaU0ocMb9+pt0n/ewsIuc8TY2wt23729/+9unT85cvn+YFpWy11uvbZVvXeZ7naWrtYRp/5HUlgG63W6319e3ter1u23Zbb0TR/4F6qZsw8ZSnlFLOaXC0cBLEEVk8YYSZ6WDK7q52lwUSYKWGjlrDndU0UOmj0RPWRLQ/GwK1GeOxPCBI51cYBHZkx0eHSFdBeczgh2DTeNUHF8vDcS88cPj847n04VsMfbg/lLinK0c9sbQ/D1glkcnTcCebJdHAWIIk0XTzNqNRTTeMhSb3OxePZBG0liOgITNbm+YDA/gwiiF46IEgmyowdCg+TM29Fx2PZgZ6Sl8oz227Pqo/BELrW8/dmjrqZ+1RTbYdnjzuEcTrHp1AdsRWd397fY02htbbNXX5HQK4GeK11rFzhxMrBGp8dfS078Hvrg3QwbCho4ep1UMb9Y5ZMeD75DsAiN3mTuFp7lMfoxDqGQYfdavmj2UOE7wJLo6aDo5cJGllfiHOneBaAdMWiSO63VyYruc1J3FnOKuZqadU87QRADcAqpXI0yQMdiUlrWpVraoXdTJfDcyckwjTlCyzz0kzn4RJiN1NzRzI80wk07yIiIGJeSZmlinfN3u7HykckLG3m523y28evROGRO3ynvrHj3SN1gCgZcKpkrvWCneeFCLWco3vjGyMHmJD7d4X635tuOk6pla2TWsZ3s67fRMXN0ZI1GshD8LhzrDY62dB1A3uI/Mamwc7K8S4/oFlPjzhUXX8wExpvzN1lSE4RBeu0YMGdzfx1nzQ94g/Cwk4UqkGumSUtPe/+iv1ex0W8XA0uc4tiXLY7u3Pg9FxmPFusI5tfJwxjBTlg+wZN3hY6ehI1Fq5AACY/Yib9PHkYApmdrlcmbmqppzCVqi1lG0jgNxTSlF0nlICkQHu/vZ+2bbt7e3ter1GsxkRSTntJNJN86h4OaqYR7dkXxofLlZ8qA+OIXvzuWCkn1Cru95JDruvviGkH76kplI3MDei4Qru9uJOiejy4mAyD/ul+VQOD8X9Vtof+buffCTwgy5xSAhAM4Po6FPofw5SiUqkURECopZdJykFX8aBHwWRCQ/PUB8ed4jDjo36sO/up
7NrVzI+G1rO4+g64Y97tnu1pepCCOFx6dd0HvtwK9p3zthPTXdu6k8LIX6YXqZePNB54tHr0/SCO3k/DI4wzaiDVuz3LVtx9xDtwd5jDw4oumNOHPdnjy2Abqn7wePv997/sXB0r0cOMW9Rz8Y0ttS4nFu+LYncVYJ0yjnOatNFPq5dY6+9ciI2E4Zns4mXbtiGLHBVN6YGNKtamcnhKQlzZmp8xsG9N6wD7qZMoExM0i2T7rB2j657HC5+JkoGca25VsmSOIX176DoH9+MBxFjkSRA7u0q+nGPId88/U1KB3FIAwAfMCt3m4EIrfXFgerD0h06WiDFRlIxlQI32zZyn9zzsqRpycu5bjXaqpraLrQGyTY63GUH0DUpJqtF3bbttm03s9q0Yw5f3c4bO/9s3NVMByUczNQGn3EUev2L2BuP9ULtUmYmtq6bU6OBwz7ttxvs60Cme2UBupzb3fIeYVUetlNbDrp7E+/eeAbIna11IyImiHeFnwfuTnMd7O+2+7MfOXk3nYaBPvSeVpOH4KTU5Q6IaLRlintEqmqbKJZuq38nI5J2zb0PmHlZTssyhdWuqrXWSKFGoBH3WrUodeXu7jNVZi6lAP7rr7+ez+cpp5RSnvI0T8RUzdSMa0Xfapuqml9vN611K6WqElFUjsa4dgOdRZJQhDgO9nqrbg8D013VmKs7DnHNx2SlO4bDQ6r5nQepy/uhCT1cNPi9917TD5rf/SPvlFEcSBzH0nPeG6Lw4zP/o8eRX394hT0yddCEDoIvGL6A70FY2cDMBgvnfLQUTCP3m5mp5Qn1+4AocuSxgyKCoo4hpEaYcJ3fhFeMo5eoUzP1qYex+7zBYY46DPNB/yPecXST3suasTtCXt8PkLsuf/xwiOJdC4vn+VifoITgxXsp7L1LAEQt/4VGpic35P5jNizz6Xw6nU6RaJSntgH3nm9AoI1spUQU3w/4r0nEhggIX3R4yFk6Ks+u/Y8ofqMWUBSwRBhAulM4UtUaBwMBEcVtT+G7zH8KXm1m7sg5T9MUzuAHCowpAPb9xUy9mTMJcxKRxFOSlLhValvvsK7VHaoKgqoxs0hmTiIUjVNSEkL0LZK2LpxIJE/TNCWj6lZaDyOwMJLQ85Jykk/n0zzJlMnNN/UNVNXyNAvYKYNoXVe4F7XevE4e+PadaBeRlPNBker61IHd8z4njbrQAti+u6y82SboWcpmVmqBu5cN7l4K3I1lcsznrWwlwMxD5NJAi+j752hO4KBeJ2JhLlat1lLWUkpL/et5WndHvFkL9rt14dEFVxdtvc5tqNh9xExkx5sd90DfH0PT5t3+RX9GvzQ+GSy6O452R2Gj+/iXG50eBhJweUfRjtaCHmCArceVgjZbyU+bmPbG34m0PaTZPk5guEibE74l8Dc2E89y7Lbhbql0eSbMDoyU2+BD35fuh2khImaa5+l8Pg9noHvLye2mSsuuCk0WiN7AVusAVcbrt9da659+/GGep5RyyjkSM4JgzWzbNnW/rFv7vccFm8+wvXx7+0igO+6REO3BQcaI3J25dYmONKM2OHq02vtmGl5X0OA1+4TsHl/0mWm0NDTFRkG79BiPuFtafvzkqILefdWFw3cI4n69fueLXbRzG+n9ijMwCvg/bCsaUpkb/R2u62/KzR0P6SDej28aT3cixS58iYgS0DN/Zcxds9valgexOBH6jn3wuDjMocc3HwK+/ez7lHnPJ6AInTRLCW08bTS7xO/cZCwvjcX9YC/EXjyU6NBgnQeWMtQ32rfnmC7wHWVGNuj5fI581GVZpi7d+/0b9Pi6bWa2rmtI97HcTJGa7fGhjATrDq4yRMbRVx9pmGKSknS4+Oi6JERHVDsM0kL3C8Zqjk/CpDQz9zm2+SNhhNHaCHBn0a0KtRvr0Roip5ST5CTKVhyq3tqvqTpQWt2miaRpStMk0R+KQE6CqK6MBZYkecpTFnOqTN6LbAhJ+DTLPKUvn8+nOdeymRYNv
HVQylnATskMtVxrVQMcJJKP6T5x3AHNrpd3DMC9vrHiZ0zDuJT7Sx7mqO/MY2Q6woPugKsZecuQhxoItF5VK9y228Wqasj7sJPuFoAjxNGU4SHymDUnIVYtMCvrLQxxgvf42c6l4Pi3f/23bSvUcW9Cmz5YO9RX+GHxe0sHIvhDye64ilmkj/7wRf+y/9n5MqM/rRFUrGzX+2PMw0vS9IKDqGNivrxfIqk7Rnf7+WfbNm7cHy2/QjUUGo4GBNzrzL7nyu4P/jC8wzD3le/fDFcoMbeOkCKRUrJfsyuJ8Yc83uPDsb2/uzUVG6DbdVW16F5hHRjL7Ahi5JH1Ja2BQGActTHVar99/Ta9X9/fLzmlshWtNbhIUJU71NQdpVbvMNdB0Cxg9rELwsZLooMHd89YO3LOY9fklELhGKVwcc/L+2VwGTP77T//p9vb69BZu0jYBflYon0PfG/WPipJbQF27fg7J+NQATk8SeOMoOm/I9R3kdMVgNv725B/ZvbzX//98v529z778z9IqXji3XkYG+heIRkn0DAHuecBEe17f48XRapiHzYRBXIRR3J1D2EMbb8b1iOzjgj09evXw+j0t6//+XJ92e94sD2G6k73dD6YKd+5Jo77j4fVTgc+QpEmgTbfO/ONBbof9VEdOKz+PtkxZe1hnUgul2/jTczs28u36/U61NmUcnirhsbsB1j4WtXcel1D+zrEXuzFAwegnXAapR+p3qkjFoUQoZ7lJR2ZvU91m/NQruPHfmcHCGYGR0maUt62va4d8HJ717IKN9j5ZlWF1d5kIJh5u2URzimJcBKRZrWbA6pAM6na24T6EuU5Kcs8JWpuIoRoe3vNKck85ZylVN1qNYeqD0PsfZ5ykp9P05TFNKq40WEXwvQXANu2hcEOEEtilvf3tzvNmH73+Dtf/f7pR43xP37l3bX/8QvHg/9Dl3zXOvy/9XEnnvfd8p0T/2u+xX+1Wf0/5P79+8edMnowf/9PfcT+69857X7t/qOk+R3J9t/e0UVPP/6723j3avF/YXgjnPGd4/+seTk6VT6SyN8h8Q8vcPTbP5z5wRfy8dr/qnzm//LjXn36vYn63vlxdIX5O6fuM/dfnOX7y47m3n/v8//H8cfxx/HH8cfxx/HH8cfxx/HH8cfxx/HH8cfxx/HH8cfxx/HH8cfxx/HH8d/i8f8HtxaUxQplbmRzdHJlYW0KZW5kb2JqCjE0IDAgb2JqCjU1Mjg0CmVuZG9iagoyIDAgb2JqCjw8IC9Db3VudCAxIC9LaWRzIFsgMTEgMCBSIF0gL1R5cGUgL1BhZ2VzID4+CmVuZG9iagoxNSAwIG9iago8PCAvQ3JlYXRpb25EYXRlIChEOjIwMjEwOTE2MTQ0MTMwKzAyJzAwJykKL0NyZWF0b3IgKE1hdHBsb3RsaWIgdjMuNC4zLCBodHRwczovL21hdHBsb3RsaWIub3JnKQovUHJvZHVjZXIgKE1hdHBsb3RsaWIgcGRmIGJhY2tlbmQgdjMuNC4zKSA+PgplbmRvYmoKeHJlZgowIDE2CjAwMDAwMDAwMDAgNjU1MzUgZiAKMDAwMDAwMDAxNiAwMDAwMCBuIAowMDAwMDU2Mzc4IDAwMDAwIG4gCjAwMDAwMDA2NTAgMDAwMDAgbiAKMDAwMDAwMDY3MSAwMDAwMCBuIAowMDAwMDAwNzcwIDAwMDAwIG4gCjAwMDAwMDA3OTEgMDAwMDAgbiAKMDAwMDAwMDgxMiAwMDAwMCBuIAowMDAwMDAwMDY1IDAwMDAwIG4gCjAwMDAwMDAzOTggMDAwMDAgbiAKMDAwMDAwMDYzMCAwMDAwMCBuIAowMDAwMDAwMjA4IDAwMDAwIG4gCjAwMDAwMDA2MTAgMDAwMDAgbiAKMDAwMDAwMDg0NCAwMDAwMCBuIAowMDAwMDU2MzU2IDAwMDAwIG4gCjAwMDAwNTY0MzggMDAwMDAgbiAKdHJhaWxlcgo8PCAvS
W5mbyAxNSAwIFIgL1Jvb3QgMSAwIFIgL1NpemUgMTYgPj4Kc3RhcnR4cmVmCjU2NTk1CiUlRU9GCg==\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:41:30.820816\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:41:31.016958\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:41:31.210678\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:41:31.412500\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:41:31.614177\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:41:31.816167\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}], "source": ["# Plot the closest images for the first N test images as example\n", "for i in range(8):\n", " find_similar_images(test_img_embeds[0][i], test_img_embeds[1][i], key_embeds=train_img_embeds)"]}, {"cell_type": "markdown", "id": "219968d0", "metadata": {"papermill": {"duration": 0.089878, "end_time": "2021-09-16T12:41:32.117877", "exception": false, "start_time": "2021-09-16T12:41:32.027999", "status": "completed"}, "tags": []}, "source": ["Based on our autoencoder, we see that we are able to retrieve many similar images to the test input.\n", "In particular, in row 4, we can spot that some test images might not be that different\n", "from the training set as we thought (same poster, just different scaling/color scaling).\n", "We also see that although we haven't given the model any labels,\n", "it can cluster different classes in different parts of the latent space (airplane + ship, animals, etc.).\n", "This is why autoencoders can also be used as a pre-training strategy for deep networks,\n", "especially when we have a large set of unlabeled images (often the case).\n", "However, it should be noted that the background still plays a big role in autoencoders while it doesn't for classification.\n", "Hence, we don't get \"perfect\" clusters and need to finetune such models for classification."]}, {"cell_type": "markdown", "id": "29ef8f54", "metadata": {"papermill": {"duration": 0.10508, "end_time": "2021-09-16T12:41:32.310940", "exception": false, "start_time": "2021-09-16T12:41:32.205860", "status": "completed"}, "tags": []}, "source": ["### Tensorboard clustering\n", "\n", "Another way of exploring the similarity of images in the latent space is by dimensionality-reduction methods like PCA or T-SNE.\n", "Luckily, Tensorboard provides a nice interface for this and we can make use of it in the following:"]}, {"cell_type": "code", "execution_count": 22, "id": "24541e26", "metadata": {"execution": 
{"iopub.execute_input": "2021-09-16T12:41:32.501797Z", "iopub.status.busy": "2021-09-16T12:41:32.501308Z", "iopub.status.idle": "2021-09-16T12:41:32.503351Z", "shell.execute_reply": "2021-09-16T12:41:32.502954Z"}, "papermill": {"duration": 0.094572, "end_time": "2021-09-16T12:41:32.503454", "exception": false, "start_time": "2021-09-16T12:41:32.408882", "status": "completed"}, "tags": []}, "outputs": [], "source": ["# We use the following model throughout this section.\n", "# If you want to try a different latent dimensionality, change it here!\n", "model = model_dict[128][\"model\"]"]}, {"cell_type": "code", "execution_count": 23, "id": "e6814b9e", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:41:32.685746Z", "iopub.status.busy": "2021-09-16T12:41:32.685203Z", "iopub.status.idle": "2021-09-16T12:41:32.687965Z", "shell.execute_reply": "2021-09-16T12:41:32.687568Z"}, "papermill": {"duration": 0.09501, "end_time": "2021-09-16T12:41:32.688067", "exception": false, "start_time": "2021-09-16T12:41:32.593057", "status": "completed"}, "tags": []}, "outputs": [], "source": ["# Create a summary writer\n", "writer = SummaryWriter(\"tensorboard/\")"]}, {"cell_type": "markdown", "id": "2e102b0e", "metadata": {"papermill": {"duration": 0.08963, "end_time": "2021-09-16T12:41:32.865990", "exception": false, "start_time": "2021-09-16T12:41:32.776360", "status": "completed"}, "tags": []}, "source": ["The function `add_embedding` allows us to add high-dimensional feature vectors to TensorBoard on which we can perform clustering.\n", "What we have to provide in the function are the feature vectors, additional metadata such as the labels,\n", "and the original images so that we can identify a specific image in the clustering."]}, {"cell_type": "code", "execution_count": 24, "id": "ad24adb2", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:41:33.048000Z", "iopub.status.busy": "2021-09-16T12:41:33.046657Z", "iopub.status.idle": 
"2021-09-16T12:41:33.048961Z", "shell.execute_reply": "2021-09-16T12:41:33.048577Z"}, "papermill": {"duration": 0.093963, "end_time": "2021-09-16T12:41:33.049070", "exception": false, "start_time": "2021-09-16T12:41:32.955107", "status": "completed"}, "tags": []}, "outputs": [], "source": ["# In case you obtain the following error in the next cell, execute the import statements and last line in this cell\n", "# AttributeError: module 'tensorflow._api.v2.io.gfile' has no attribute 'get_filesystem'\n", "\n", "# import tensorflow as tf\n", "# import tensorboard as tb\n", "# tf.io.gfile = tb.compat.tensorflow_stub.io.gfile"]}, {"cell_type": "code", "execution_count": 25, "id": "5c4b01da", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:41:33.232442Z", "iopub.status.busy": "2021-09-16T12:41:33.231963Z", "iopub.status.idle": "2021-09-16T12:41:40.340354Z", "shell.execute_reply": "2021-09-16T12:41:40.339846Z"}, "papermill": {"duration": 7.201161, "end_time": "2021-09-16T12:41:40.340471", "exception": false, "start_time": "2021-09-16T12:41:33.139310", "status": "completed"}, "tags": []}, "outputs": [], "source": ["# Note: the embedding projector in tensorboard is computationally heavy.\n", "# Reduce the image amount below if your computer struggles with visualizing all 10k points\n", "NUM_IMGS = len(test_set)\n", "\n", "writer.add_embedding(\n", " test_img_embeds[1][:NUM_IMGS], # Encodings per image\n", " metadata=[test_set[i][1] for i in range(NUM_IMGS)], # Adding the labels per image to the plot\n", " label_img=(test_img_embeds[0][:NUM_IMGS] + 1) / 2.0,\n", ") # Adding the original images to the plot"]}, {"cell_type": "markdown", "id": "ac506cfa", "metadata": {"papermill": {"duration": 0.089483, "end_time": "2021-09-16T12:41:40.519563", "exception": false, "start_time": "2021-09-16T12:41:40.430080", "status": "completed"}, "tags": []}, "source": ["Finally, we can run tensorboard to explore similarities among images:"]}, {"cell_type": "code", 
"execution_count": 26, "id": "76094ffa", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:41:40.700535Z", "iopub.status.busy": "2021-09-16T12:41:40.700065Z", "iopub.status.idle": "2021-09-16T12:41:40.702162Z", "shell.execute_reply": "2021-09-16T12:41:40.701752Z"}, "papermill": {"duration": 0.094032, "end_time": "2021-09-16T12:41:40.702268", "exception": false, "start_time": "2021-09-16T12:41:40.608236", "status": "completed"}, "tags": []}, "outputs": [], "source": ["# Uncomment the next line to start the tensorboard\n", "# %tensorboard --logdir tensorboard/"]}, {"cell_type": "markdown", "id": "954ad9a4", "metadata": {"papermill": {"duration": 0.089519, "end_time": "2021-09-16T12:41:40.880536", "exception": false, "start_time": "2021-09-16T12:41:40.791017", "status": "completed"}, "tags": []}, "source": ["You should be able to see something similar as in the following image.\n", "In case the projector stays empty, try to start the TensorBoard outside of the Jupyter notebook.\n", "\n", "
\n", "\n", "Overall, we can see that the model indeed clustered images together that are visually similar.\n", "Especially the background color seems to be a crucial factor in the encoding.\n", "This correlates to the chosen loss function, here Mean Squared Error on pixel-level\n", "because the background is responsible for more than half of the pixels in an average image.\n", "Hence, the model learns to focus on it.\n", "Nevertheless, we can see that the encodings also separate a couple of classes in the latent space although it hasn't seen any labels.\n", "This shows again that autoencoding can also be used as a \"pre-training\"/transfer learning task before classification."]}, {"cell_type": "code", "execution_count": 27, "id": "ecbf40ea", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:41:41.069819Z", "iopub.status.busy": "2021-09-16T12:41:41.069325Z", "iopub.status.idle": "2021-09-16T12:41:41.071450Z", "shell.execute_reply": "2021-09-16T12:41:41.070984Z"}, "papermill": {"duration": 0.101313, "end_time": "2021-09-16T12:41:41.071558", "exception": false, "start_time": "2021-09-16T12:41:40.970245", "status": "completed"}, "tags": []}, "outputs": [], "source": ["# Closing the summary writer\n", "writer.close()"]}, {"cell_type": "markdown", "id": "d031e7eb", "metadata": {"papermill": {"duration": 0.088397, "end_time": "2021-09-16T12:41:41.248822", "exception": false, "start_time": "2021-09-16T12:41:41.160425", "status": "completed"}, "tags": []}, "source": ["## Conclusion\n", "\n", "In this tutorial, we have implemented our own autoencoder on small RGB images and explored various properties of the model.\n", "In contrast to variational autoencoders, vanilla AEs are not generative and can work on MSE loss functions.\n", "This makes them often easier to train.\n", "Both versions of AE can be used for dimensionality reduction, as we have seen for finding visually similar images beyond pixel distances.\n", "Despite autoencoders gaining less interest in 
the research community due to their more \"theoretically\"\n", "challenging counterpart of VAEs, autoencoders still find usage in a lot of applications like denoising and compression.\n", "Hence, AEs are an essential tool that every Deep Learning engineer/researcher should be familiar with."]}, {"cell_type": "markdown", "id": "a94ed780", "metadata": {"papermill": {"duration": 0.088321, "end_time": "2021-09-16T12:41:41.426630", "exception": false, "start_time": "2021-09-16T12:41:41.338309", "status": "completed"}, "tags": []}, "source": ["## Congratulations - Time to Join the Community!\n", "\n", "Congratulations on completing this notebook tutorial! If you enjoyed this and would like to join the Lightning\n", "movement, you can do so in the following ways!\n", "\n", "### Star [Lightning](https://github.com/PyTorchLightning/pytorch-lightning) on GitHub\n", "The easiest way to help our community is just by starring the GitHub repos! This helps raise awareness of the cool\n", "tools we're building.\n", "\n", "### Join our [Slack](https://join.slack.com/t/pytorch-lightning/shared_invite/zt-pw5v393p-qRaDgEk24~EjiZNBpSQFgQ)!\n", "The best way to keep up to date on the latest advancements is to join our community! Make sure to introduce yourself\n", "and share your interests in the `#general` channel.\n", "\n", "\n", "### Contributions!\n", "The best way to contribute to our community is to become a code contributor! 
At any time you can go to\n", "[Lightning](https://github.com/PyTorchLightning/pytorch-lightning) or [Bolt](https://github.com/PyTorchLightning/lightning-bolts)\n", "GitHub Issues page and filter for \"good first issue\".\n", "\n", "* [Lightning good first issue](https://github.com/PyTorchLightning/pytorch-lightning/issues?q=is%3Aopen+is%3Aissue+label%3A%22good+first+issue%22)\n", "* [Bolt good first issue](https://github.com/PyTorchLightning/lightning-bolts/issues?q=is%3Aopen+is%3Aissue+label%3A%22good+first+issue%22)\n", "* You can also contribute your own notebooks with useful examples!\n", "\n", "### Great thanks from the entire PyTorch Lightning Team for your interest!\n", "\n", "![Pytorch Lightning](){height=\"60px\" width=\"240px\"}"]}, {"cell_type": "raw", "metadata": {"raw_mimetype": "text/restructuredtext"}, "source": [".. customcarditem::\n", " :header: Tutorial 8: Deep Autoencoders\n", " :card_description: In this tutorial, we will take a closer look at autoencoders (AE). Autoencoders are trained on encoding input data such as images into a smaller feature vector, and afterward,...\n", " :tags: Image,GPU/TPU,UvA-DL-Course\n", " :image: _static/images/course_UvA-DL/08-deep-autoencoders.jpg"]}], "metadata": {"jupytext": {"cell_metadata_filter": "colab_type,colab,id,-all", "formats": "ipynb,py:percent", "main_language": "python"}, "language_info": {"codemirror_mode": {"name": "ipython", "version": 3}, "file_extension": ".py", "mimetype": "text/x-python", "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.9.7"}, "papermill": {"default_parameters": {}, "duration": 45.56469, "end_time": "2021-09-16T12:41:42.325691", "environment_variables": {}, "exception": null, "input_path": "course_UvA-DL/08-deep-autoencoders/Deep_Autoencoders.ipynb", "output_path": ".notebooks/course_UvA-DL/08-deep-autoencoders.ipynb", "parameters": {}, "start_time": "2021-09-16T12:40:56.761001", "version": "2.3.3"}, "widgets": 
{"application/vnd.jupyter.widget-state+json": {"state": {"02ff956b061147d68a9e47093990d34a": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "032dc48ab9b841529716759ce8fda730": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_857875e983ac42ea9452284506e04bc6", "max": 1.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_3f9a3874e40547b38769ed9fa108dae9", "value": 1.0}}, "052e7097bcfc4f65a96e2a7a9268431e": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": 
"LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "07a7fcadf97f442ca3088a5bbbcba662": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_674fe5a450c3481c9a34d5e9192e82c0", "IPY_MODEL_bf0e3475b48945bc9619bf292f63051c", "IPY_MODEL_88da781ac6a04e4c9e80f207b9785e92"], "layout": "IPY_MODEL_44aeb54ba2f14b3bb7e032fabd114c92"}}, "07b7c4404f814aa5a589ef143940b644": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", 
"_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "0cbcb50fc4904a38bf209a5b60ba6de2": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "0cdd717c36684008add2d6d3f93caa65": {"model_module": 
"@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_83d382db2c604f96864c7ab7bb703e70", "IPY_MODEL_e8bc86b2c81446f9bfcdb05b0c482531", "IPY_MODEL_5eeb17acc1fb4264ba59ec99aef37eb0"], "layout": "IPY_MODEL_214f0cd9ddc44f778d07cd0c33ebbc9d"}}, "0d066a20bb76435498f29b34812ebe38": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_11b51cc5b5204ca68070a5453a53a936", "max": 1.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_11acd217386e4efcacffe4cf2d9ff5d5", "value": 1.0}}, "0e75a210006e4d18be55bf96806992bb": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "0f11cd1f8ebc4c9cbc69478f55dac457": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, 
"_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_2f4fba8d2685419fa7765bef262e0040", "IPY_MODEL_ba6b2c1b4af4442ca18b2a842fd567dc", "IPY_MODEL_74cec57148994f20859b662fef841d95"], "layout": "IPY_MODEL_b6fc2a070765455d9e39949c9f1ebcbb"}}, "11acd217386e4efcacffe4cf2d9ff5d5": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "11b51cc5b5204ca68070a5453a53a936": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "11fb9b7b81cb40eab94743b2e2d33846": {"model_module": "@jupyter-widgets/controls", 
"model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "12134f3f7f2c45bb80b55727e4077eec": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_5b35c5a56116497d9a3cb0665e9f8834", "placeholder": "\u200b", "style": "IPY_MODEL_62f2a45626e640b68afcc925672c9c9b", "value": "Testing: 100%"}}, "1242f7a22a564aaeb2af5c69667e5b5f": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_585e2c48fa264803aa392ef3e9b5293e", "max": 175.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_47ee5b345c494618bf130b0afe0f0ee3", "value": 175.0}}, "12661357d2f64a5e81125f174cdb1093": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", 
"_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "143085e1474446dc918656c1e9794bce": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "18580ac83490417aa9cc17a95c1b9ff4": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "1912fb8fcada468ebf4a0aa5485ace52": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": 
"@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "1b5ee62eae394996877439600f6099ee": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "1c6d3153688c46c98c7c47bf74d52109": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "1eeadd6528c746868701b83f54b200dc": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": 
"@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_f95afa94d4fc4c24982982b1189a2676", "IPY_MODEL_0d066a20bb76435498f29b34812ebe38", "IPY_MODEL_fe252e86330c4fb7a39557edc2947f62"], "layout": "IPY_MODEL_3bfb9f151a9b4190915c20d6daee85e6"}}, "213f1af06c854f0fa5ac9c7f42e86b8b": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_587fdc2ccf4c434a98f70a1326e2090e", "IPY_MODEL_f6fd3371cdab45bdb95c5bbefc92bcbc", "IPY_MODEL_e4225879509b44d78af0a9382ffafb9e"], "layout": "IPY_MODEL_d88f9144beae4195b8b4061fd162f798"}}, "214f0cd9ddc44f778d07cd0c33ebbc9d": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, 
"overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "23042c045dfa410788b0f5920d93ec12": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_31e9b650f9854da0889238dfe45f463e", "max": 1.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_be4e06b3dab944b4b164305c4639fa3f", "value": 1.0}}, "27a44cca69884cefac383be100126891": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "2d005f68d81b4b48b123df6224ce852e": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "2d578b2eca444fd68545eb1bf1e2e4e3": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", 
"_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "2de27b190618498d9d521357b81fa7fe": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "2f4fba8d2685419fa7765bef262e0040": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_2d578b2eca444fd68545eb1bf1e2e4e3", "placeholder": "\u200b", "style": "IPY_MODEL_6db10f3f605d44cfa3ae7abd547994c6", "value": "Testing: 100%"}}, "2fb2f64a98454ffa9d94d792eedf790f": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": 
{"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "31e9b650f9854da0889238dfe45f463e": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, 
"overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "3bfb9f151a9b4190915c20d6daee85e6": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "3f9a3874e40547b38769ed9fa108dae9": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "4019b8c2ccf54144af57dfeb0cc89fa1": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": 
"HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_f41f045f24ce4c3496a79fcd2cb4de07", "placeholder": "\u200b", "style": "IPY_MODEL_52802f27f74f437a86f46ec7faf29012", "value": " 173/175 [00:10<00:00, 22.02it/s]"}}, "4046be872d3b49a99d2e9e038031024f": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "4082d73bb40f41e38f650c4eb97de99a": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "413b085486e84775a6d12632a2c21ae1": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_7800181f82774088bec790534ea16b09", "placeholder": "\u200b", "style": "IPY_MODEL_58efd7c3b680415992c128d95298a9e7", "value": " 36/40 [00:02<00:00, 23.55it/s]"}}, "41de7a8567ee401d91f43538a6074c58": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": 
"HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_bbf19a83e8f84c9f9aff45a99ca95f62", "placeholder": "\u200b", "style": "IPY_MODEL_4082d73bb40f41e38f650c4eb97de99a", "value": "Encoding images: 99%"}}, "43ed398167354898a99662e48cd235fc": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "44aeb54ba2f14b3bb7e032fabd114c92": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": 
"LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "47c8df90b5414d1e8ee6e8afc2057c52": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_96b3327de0924445bda563cf42aa0924", "IPY_MODEL_4d5fc2a2e0f74d0cb56cdc13d48d251d", "IPY_MODEL_f5624c88273640a6af037ce8918fa0dc"], "layout": "IPY_MODEL_e3387fbc3e8e4cc4bdff0f609206a150"}}, "47ee5b345c494618bf130b0afe0f0ee3": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "4c1be50487394dac88a9368c031dc7ac": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": 
"LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "4d5fc2a2e0f74d0cb56cdc13d48d251d": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_f9a48cf7360a4948abc62fafc7e2ae37", "max": 1.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_4f32d4b2dd764f2a8af01d4382ea8605", "value": 1.0}}, "4da71fe1cdb746d781dbfcfb0078ea11": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, 
"_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_d217a0bdcc694c7faa75b69d0b1d454a", "placeholder": "\u200b", "style": "IPY_MODEL_b22da0fb272442a6a9009a443d8af0aa", "value": "Testing: 100%"}}, "4f32d4b2dd764f2a8af01d4382ea8605": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "52802f27f74f437a86f46ec7faf29012": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "57b7fd1cc58c48e38d1ff2a4d1b52646": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, 
"justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "585e2c48fa264803aa392ef3e9b5293e": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "587fdc2ccf4c434a98f70a1326e2090e": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_0cbcb50fc4904a38bf209a5b60ba6de2", "placeholder": 
"\u200b", "style": "IPY_MODEL_143085e1474446dc918656c1e9794bce", "value": "Testing: 100%"}}, "58efd7c3b680415992c128d95298a9e7": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "5adc386ad05f4b3cb2ee9972198d120a": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "5b35c5a56116497d9a3cb0665e9f8834": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", 
"_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "5b9b18fb8e734702ad6e5fc7c5b33876": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "5cf0706e7c07460880d2fe93a1e1d4c4": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_12134f3f7f2c45bb80b55727e4077eec", "IPY_MODEL_23042c045dfa410788b0f5920d93ec12", "IPY_MODEL_ad8c8c3a834347e4ad64626d981788b4"], "layout": "IPY_MODEL_9f61b932d4844223ba828954c8bed3fd"}}, "5da12d195bd64785adab94f45d45a515": {"model_module": "@jupyter-widgets/controls", 
"model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "5eeb17acc1fb4264ba59ec99aef37eb0": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_abea5e10b6774b328a1a788602d20f15", "placeholder": "\u200b", "style": "IPY_MODEL_4046be872d3b49a99d2e9e038031024f", "value": " 40/40 [00:00<00:00, 64.57it/s]"}}, "62f2a45626e640b68afcc925672c9c9b": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "674fe5a450c3481c9a34d5e9192e82c0": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_07b7c4404f814aa5a589ef143940b644", "placeholder": "\u200b", "style": 
"IPY_MODEL_2d005f68d81b4b48b123df6224ce852e", "value": "Testing: 100%"}}, "6864ca7ec5744fae8c73bff0ac83cf8b": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_a8007361e51a49a5bc066a39d3678f91", "IPY_MODEL_6ca429fcea5f49caa41079c5e0628bb2", "IPY_MODEL_413b085486e84775a6d12632a2c21ae1"], "layout": "IPY_MODEL_1b5ee62eae394996877439600f6099ee"}}, "6b9d419c65ee495298ceab7998051791": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "6ca429fcea5f49caa41079c5e0628bb2": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": 
"FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_8a4bb250050840ba8a1005f97cf7be6c", "max": 40.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_8bf4d98e6a9e4136b0902e882efc0796", "value": 40.0}}, "6db10f3f605d44cfa3ae7abd547994c6": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "74cec57148994f20859b662fef841d95": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_4c1be50487394dac88a9368c031dc7ac", "placeholder": "\u200b", "style": "IPY_MODEL_1c6d3153688c46c98c7c47bf74d52109", "value": " 20/20 [00:00<00:00, 49.16it/s]"}}, "75d4f899cdbb4ddb9f24362935235e37": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", 
"align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "7648e1309ffe4d7b9df012f6c619e838": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "7800181f82774088bec790534ea16b09": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, 
"justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "7f45f3088a694253bc20a6d06382a53a": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "83d382db2c604f96864c7ab7bb703e70": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_12661357d2f64a5e81125f174cdb1093", "placeholder": "\u200b", "style": "IPY_MODEL_2de27b190618498d9d521357b81fa7fe", "value": "Testing: 100%"}}, "857875e983ac42ea9452284506e04bc6": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, 
"grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "8839373ba012435c92a3f7c82bec4d8e": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "88da781ac6a04e4c9e80f207b9785e92": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": 
"@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_052e7097bcfc4f65a96e2a7a9268431e", "placeholder": "\u200b", "style": "IPY_MODEL_e3da440d50ac44b49c12bed6e738ead0", "value": " 20/20 [00:00<00:00, 47.70it/s]"}}, "8a4bb250050840ba8a1005f97cf7be6c": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "8bedc95274e84f799bbef9fc04ca9934": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_4da71fe1cdb746d781dbfcfb0078ea11", "IPY_MODEL_032dc48ab9b841529716759ce8fda730", 
"IPY_MODEL_d44f42635e084ca8afad50efccc551c5"], "layout": "IPY_MODEL_6b9d419c65ee495298ceab7998051791"}}, "8bf4d98e6a9e4136b0902e882efc0796": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "92a150b2ba204b55884a4344b05daa57": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "96b3327de0924445bda563cf42aa0924": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, 
"_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_02ff956b061147d68a9e47093990d34a", "placeholder": "\u200b", "style": "IPY_MODEL_7f45f3088a694253bc20a6d06382a53a", "value": "Testing: 100%"}}, "9f61b932d4844223ba828954c8bed3fd": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "a8007361e51a49a5bc066a39d3678f91": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_92a150b2ba204b55884a4344b05daa57", "placeholder": 
"\u200b", "style": "IPY_MODEL_11fb9b7b81cb40eab94743b2e2d33846", "value": "Encoding images: 90%"}}, "abea5e10b6774b328a1a788602d20f15": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "ad8c8c3a834347e4ad64626d981788b4": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_f92786d9462849c3b05616928d6445f3", "placeholder": "\u200b", "style": "IPY_MODEL_1912fb8fcada468ebf4a0aa5485ace52", "value": " 40/40 [00:00<00:00, 66.65it/s]"}}, "b03085321f064773bcbd73645caea3e5": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": 
"DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "b22da0fb272442a6a9009a443d8af0aa": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "b6b8ff22558b4341af2937a7ea644f98": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "b6fc2a070765455d9e39949c9f1ebcbb": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, 
"justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "ba6b2c1b4af4442ca18b2a842fd567dc": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_43ed398167354898a99662e48cd235fc", "max": 1.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_5b9b18fb8e734702ad6e5fc7c5b33876", "value": 1.0}}, "bbf19a83e8f84c9f9aff45a99ca95f62": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, 
"order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "be4e06b3dab944b4b164305c4639fa3f": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "bec0502d94244f92bde1e6e0245723a2": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "bf0e3475b48945bc9619bf292f63051c": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_8839373ba012435c92a3f7c82bec4d8e", "max": 1.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_7648e1309ffe4d7b9df012f6c619e838", "value": 1.0}}, "cdd59b859bba4f88984895bf930fcc0f": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, 
"_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "d217a0bdcc694c7faa75b69d0b1d454a": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, 
"d44f42635e084ca8afad50efccc551c5": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_f1e290d5524546e0b62af75e706b6738", "placeholder": "\u200b", "style": "IPY_MODEL_b03085321f064773bcbd73645caea3e5", "value": " 20/20 [00:00<00:00, 47.57it/s]"}}, "d88f9144beae4195b8b4061fd162f798": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "da089a2c86cf484ab1e2470e7b666dc1": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", 
"_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "e22e704f14db414bb6c784ee29e158d6": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, 
"padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "e3387fbc3e8e4cc4bdff0f609206a150": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "e3da440d50ac44b49c12bed6e738ead0": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "e4225879509b44d78af0a9382ffafb9e": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": 
"@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_5adc386ad05f4b3cb2ee9972198d120a", "placeholder": "\u200b", "style": "IPY_MODEL_bec0502d94244f92bde1e6e0245723a2", "value": " 40/40 [00:00<00:00, 59.08it/s]"}}, "e8bc86b2c81446f9bfcdb05b0c482531": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_cdd59b859bba4f88984895bf930fcc0f", "max": 1.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_5da12d195bd64785adab94f45d45a515", "value": 1.0}}, "f1e290d5524546e0b62af75e706b6738": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, 
"overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "f41f045f24ce4c3496a79fcd2cb4de07": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "f5624c88273640a6af037ce8918fa0dc": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_da089a2c86cf484ab1e2470e7b666dc1", "placeholder": "\u200b", "style": "IPY_MODEL_b6b8ff22558b4341af2937a7ea644f98", "value": " 20/20 [00:00<00:00, 58.91it/s]"}}, "f6fd3371cdab45bdb95c5bbefc92bcbc": {"model_module": "@jupyter-widgets/controls", 
"model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_75d4f899cdbb4ddb9f24362935235e37", "max": 1.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_18580ac83490417aa9cc17a95c1b9ff4", "value": 1.0}}, "f92786d9462849c3b05616928d6445f3": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "f95afa94d4fc4c24982982b1189a2676": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": 
"HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_e22e704f14db414bb6c784ee29e158d6", "placeholder": "\u200b", "style": "IPY_MODEL_27a44cca69884cefac383be100126891", "value": "Testing: 100%"}}, "f9a48cf7360a4948abc62fafc7e2ae37": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "fc07ca3d23014b6f9d5fb7b961f16005": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_41de7a8567ee401d91f43538a6074c58", 
"IPY_MODEL_1242f7a22a564aaeb2af5c69667e5b5f", "IPY_MODEL_4019b8c2ccf54144af57dfeb0cc89fa1"], "layout": "IPY_MODEL_57b7fd1cc58c48e38d1ff2a4d1b52646"}}, "fe252e86330c4fb7a39557edc2947f62": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_2fb2f64a98454ffa9d94d792eedf790f", "placeholder": "\u200b", "style": "IPY_MODEL_0e75a210006e4d18be55bf96806992bb", "value": " 40/40 [00:00<00:00, 68.86it/s]"}}}, "version_major": 2, "version_minor": 0}}}, "nbformat": 4, "nbformat_minor": 5} \ No newline at end of file diff --git a/source/notebooks/course_UvA-DL/09-normalizing-flows.ipynb b/source/notebooks/course_UvA-DL/09-normalizing-flows.ipynb deleted file mode 100644 index 704aefd..0000000 --- a/source/notebooks/course_UvA-DL/09-normalizing-flows.ipynb +++ /dev/null @@ -1 +0,0 @@ -{"cells": [{"cell_type": "markdown", "id": "c331ad54", "metadata": {"papermill": {"duration": 0.030587, "end_time": "2021-09-16T12:41:51.358101", "exception": false, "start_time": "2021-09-16T12:41:51.327514", "status": "completed"}, "tags": []}, "source": ["\n", "# Tutorial 9: Normalizing Flows for Image Modeling\n", "\n", "* **Author:** Phillip Lippe\n", "* **License:** CC BY-SA\n", "* **Generated:** 2021-09-16T14:32:34.242172\n", "\n", "In this tutorial, we will take a closer look at complex, deep normalizing flows.\n", "The most popular, current application of deep normalizing flows is to model datasets of images.\n", "As for other generative models, images are a good domain to start working on because\n", "(1) CNNs are widely studied and strong models exist,\n", "(2) images are high-dimensional and complex,\n", "and 
(3) images are discrete integers.\n", "In this tutorial, we will review current advances in normalizing flows for image modeling,\n", "and get hands-on experience on coding normalizing flows.\n", "Note that normalizing flows are commonly parameter heavy and therefore computationally expensive.\n", "We will use relatively simple and shallow flows to save computational cost and allow you to run the notebook on CPU,\n", "but keep in mind that a simple way to improve the scores of the flows we study here is to make them deeper.\n", "This notebook is part of a lecture series on Deep Learning at the University of Amsterdam.\n", "The full list of tutorials can be found at https://uvadlc-notebooks.rtfd.io.\n", "\n", "\n", "---\n", "Open in [![Open In Colab](){height=\"20px\" width=\"117px\"}](https://colab.research.google.com/github/PytorchLightning/lightning-tutorials/blob/publication/.notebooks/course_UvA-DL/09-normalizing-flows.ipynb)\n", "\n", "Give us a \u2b50 [on Github](https://www.github.com/PytorchLightning/pytorch-lightning/)\n", "| Check out [the documentation](https://pytorch-lightning.readthedocs.io/en/latest/)\n", "| Join us [on Slack](https://join.slack.com/t/pytorch-lightning/shared_invite/zt-pw5v393p-qRaDgEk24~EjiZNBpSQFgQ)"]}, {"cell_type": "markdown", "id": "cb8074e8", "metadata": {"papermill": {"duration": 0.029722, "end_time": "2021-09-16T12:41:51.416816", "exception": false, "start_time": "2021-09-16T12:41:51.387094", "status": "completed"}, "tags": []}, "source": ["## Setup\n", "This notebook requires some packages besides pytorch-lightning."]}, {"cell_type": "code", "execution_count": 1, "id": "4c53849b", "metadata": {"colab": {}, "colab_type": "code", "execution": {"iopub.execute_input": "2021-09-16T12:41:51.477802Z", "iopub.status.busy": "2021-09-16T12:41:51.477304Z", "iopub.status.idle": "2021-09-16T12:41:51.479831Z", "shell.execute_reply": "2021-09-16T12:41:51.479366Z"}, "id": "LfrJLKPFyhsK", "lines_to_next_cell": 0, "papermill": {"duration": 
0.03456, "end_time": "2021-09-16T12:41:51.479947", "exception": false, "start_time": "2021-09-16T12:41:51.445387", "status": "completed"}, "tags": []}, "outputs": [], "source": ["# ! pip install --quiet \"seaborn\" \"tabulate\" \"matplotlib\" \"pytorch-lightning>=1.3\" \"torch>=1.6, <1.9\" \"torchmetrics>=0.3\" \"torchvision\""]}, {"cell_type": "markdown", "id": "03ad92b7", "metadata": {"papermill": {"duration": 0.02881, "end_time": "2021-09-16T12:41:51.538089", "exception": false, "start_time": "2021-09-16T12:41:51.509279", "status": "completed"}, "tags": []}, "source": ["
\n", "Throughout this notebook, we make use of [PyTorch Lightning](https://pytorch-lightning.readthedocs.io/en/latest/).\n", "The first cell imports our usual libraries."]}, {"cell_type": "code", "execution_count": 2, "id": "6dcb9f29", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:41:51.604711Z", "iopub.status.busy": "2021-09-16T12:41:51.604228Z", "iopub.status.idle": "2021-09-16T12:41:53.319528Z", "shell.execute_reply": "2021-09-16T12:41:53.320210Z"}, "papermill": {"duration": 1.753622, "end_time": "2021-09-16T12:41:53.320362", "exception": false, "start_time": "2021-09-16T12:41:51.566740", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["/tmp/ipykernel_3359/964175757.py:27: DeprecationWarning: `set_matplotlib_formats` is deprecated since IPython 7.23, directly use `matplotlib_inline.backend_inline.set_matplotlib_formats()`\n", " set_matplotlib_formats(\"svg\", \"pdf\") # For export\n", "Global seed set to 42\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Using device cuda:0\n"]}], "source": ["import math\n", "import os\n", "import time\n", "import urllib.request\n", "from urllib.error import HTTPError\n", "\n", "import matplotlib\n", "import matplotlib.pyplot as plt\n", "import numpy as np\n", "import pytorch_lightning as pl\n", "import seaborn as sns\n", "import tabulate\n", "import torch\n", "import torch.nn as nn\n", "import torch.nn.functional as F\n", "import torch.optim as optim\n", "import torch.utils.data as data\n", "import torchvision\n", "from IPython.display import HTML, display, set_matplotlib_formats\n", "from matplotlib.colors import to_rgb\n", "from pytorch_lightning.callbacks import LearningRateMonitor, ModelCheckpoint\n", "from torchvision import transforms\n", "from torchvision.datasets import MNIST\n", "from tqdm.notebook import tqdm\n", "\n", "# %matplotlib inline\n", "set_matplotlib_formats(\"svg\", \"pdf\") # For export\n", 
"matplotlib.rcParams[\"lines.linewidth\"] = 2.0\n", "sns.reset_orig()\n", "\n", "# Path to the folder where the datasets are/should be downloaded (e.g. MNIST)\n", "DATASET_PATH = os.environ.get(\"PATH_DATASETS\", \"data\")\n", "# Path to the folder where the pretrained models are saved\n", "CHECKPOINT_PATH = os.environ.get(\"PATH_CHECKPOINT\", \"saved_models/tutorial11\")\n", "\n", "# Setting the seed\n", "pl.seed_everything(42)\n", "\n", "# Ensure that all operations are deterministic on GPU (if used) for reproducibility\n", "torch.backends.cudnn.determinstic = True\n", "torch.backends.cudnn.benchmark = False\n", "\n", "# Fetching the device that will be used throughout this notebook\n", "device = torch.device(\"cpu\") if not torch.cuda.is_available() else torch.device(\"cuda:0\")\n", "print(\"Using device\", device)"]}, {"cell_type": "markdown", "id": "3cd3ed62", "metadata": {"papermill": {"duration": 0.029414, "end_time": "2021-09-16T12:41:53.382047", "exception": false, "start_time": "2021-09-16T12:41:53.352633", "status": "completed"}, "tags": []}, "source": ["Again, we have a few pretrained models. 
We download them below to the specified path above."]}, {"cell_type": "code", "execution_count": 3, "id": "78d63583", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:41:53.446715Z", "iopub.status.busy": "2021-09-16T12:41:53.445099Z", "iopub.status.idle": "2021-09-16T12:41:54.071021Z", "shell.execute_reply": "2021-09-16T12:41:54.070611Z"}, "papermill": {"duration": 0.659621, "end_time": "2021-09-16T12:41:54.071141", "exception": false, "start_time": "2021-09-16T12:41:53.411520", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Downloading https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial11/MNISTFlow_simple.ckpt...\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Downloading https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial11/MNISTFlow_vardeq.ckpt...\n", "Downloading https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial11/MNISTFlow_multiscale.ckpt...\n"]}], "source": ["# Github URL where saved models are stored for this tutorial\n", "base_url = \"https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial11/\"\n", "# Files to download\n", "pretrained_files = [\"MNISTFlow_simple.ckpt\", \"MNISTFlow_vardeq.ckpt\", \"MNISTFlow_multiscale.ckpt\"]\n", "# Create checkpoint path if it doesn't exist yet\n", "os.makedirs(CHECKPOINT_PATH, exist_ok=True)\n", "\n", "# For each file, check whether it already exists. If not, try downloading it.\n", "for file_name in pretrained_files:\n", " file_path = os.path.join(CHECKPOINT_PATH, file_name)\n", " if not os.path.isfile(file_path):\n", " file_url = base_url + file_name\n", " print(\"Downloading %s...\" % file_url)\n", " try:\n", " urllib.request.urlretrieve(file_url, file_path)\n", " except HTTPError as e:\n", " print(\n", " \"Something went wrong. 
Please try to download the file from the GDrive folder, or contact the author with the full output including the following error:\\n\",\n", " e,\n", " )"]}, {"cell_type": "markdown", "id": "98588147", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.02986, "end_time": "2021-09-16T12:41:54.131396", "exception": false, "start_time": "2021-09-16T12:41:54.101536", "status": "completed"}, "tags": []}, "source": ["We will use the MNIST dataset in this notebook.\n", "MNIST constitutes, despite its simplicity, a challenge for small generative models as it requires the global understanding of an image.\n", "At the same time, we can easily judge whether generated images come from the same distribution as the dataset\n", "(i.e. represent real digits), or not.\n", "\n", "To deal better with the discrete nature of the images, we transform them\n", "from a range of 0-1 to a range of 0-255 as integers."]}, {"cell_type": "code", "execution_count": 4, "id": "47598513", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:41:54.196645Z", "iopub.status.busy": "2021-09-16T12:41:54.192801Z", "iopub.status.idle": "2021-09-16T12:41:54.232017Z", "shell.execute_reply": "2021-09-16T12:41:54.231591Z"}, "papermill": {"duration": 0.071068, "end_time": "2021-09-16T12:41:54.232133", "exception": false, "start_time": "2021-09-16T12:41:54.161065", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["Global seed set to 42\n"]}], "source": ["# Convert images from 0-1 to 0-255 (integers)\n", "def discretize(sample):\n", " return (sample * 255).to(torch.int32)\n", "\n", "\n", "# Transformations applied on each image => make them a tensor and discretize\n", "transform = transforms.Compose([transforms.ToTensor(), discretize])\n", "\n", "# Loading the training dataset. 
We need to split it into a training and validation part\n", "train_dataset = MNIST(root=DATASET_PATH, train=True, transform=transform, download=True)\n", "pl.seed_everything(42)\n", "train_set, val_set = torch.utils.data.random_split(train_dataset, [50000, 10000])\n", "\n", "# Loading the test set\n", "test_set = MNIST(root=DATASET_PATH, train=False, transform=transform, download=True)\n", "\n", "# We define a set of data loaders that we can use for various purposes later.\n", "# Note that for actually training a model, we will use different data loaders\n", "# with a lower batch size.\n", "train_loader = data.DataLoader(train_set, batch_size=256, shuffle=False, drop_last=False)\n", "val_loader = data.DataLoader(val_set, batch_size=64, shuffle=False, drop_last=False, num_workers=4)\n", "test_loader = data.DataLoader(test_set, batch_size=64, shuffle=False, drop_last=False, num_workers=4)"]}, {"cell_type": "markdown", "id": "a20ba18c", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.030353, "end_time": "2021-09-16T12:41:54.293285", "exception": false, "start_time": "2021-09-16T12:41:54.262932", "status": "completed"}, "tags": []}, "source": ["In addition, we will define below a function to simplify the visualization of images/samples.\n", "Some training examples of the MNIST dataset are shown below."]}, {"cell_type": "code", "execution_count": 5, "id": "9f49ed4e", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:41:54.360403Z", "iopub.status.busy": "2021-09-16T12:41:54.359918Z", "iopub.status.idle": "2021-09-16T12:41:54.446277Z", "shell.execute_reply": "2021-09-16T12:41:54.445797Z"}, "papermill": {"duration": 0.12252, "end_time": "2021-09-16T12:41:54.446381", "exception": false, "start_time": "2021-09-16T12:41:54.323861", "status": "completed"}, "tags": []}, "outputs": [{"data": {"application/pdf": 
"JVBERi0xLjQKJazcIKu6CjEgMCBvYmoKPDwgL1BhZ2VzIDIgMCBSIC9UeXBlIC9DYXRhbG9nID4+CmVuZG9iago4IDAgb2JqCjw8IC9FeHRHU3RhdGUgNCAwIFIgL0ZvbnQgMyAwIFIgL1BhdHRlcm4gNSAwIFIKL1Byb2NTZXQgWyAvUERGIC9UZXh0IC9JbWFnZUIgL0ltYWdlQyAvSW1hZ2VJIF0gL1NoYWRpbmcgNiAwIFIKL1hPYmplY3QgNyAwIFIgPj4KZW5kb2JqCjExIDAgb2JqCjw8IC9Bbm5vdHMgMTAgMCBSIC9Db250ZW50cyA5IDAgUgovR3JvdXAgPDwgL0NTIC9EZXZpY2VSR0IgL1MgL1RyYW5zcGFyZW5jeSAvVHlwZSAvR3JvdXAgPj4KL01lZGlhQm94IFsgMCAwIDMzNS4yOTkzNTQ4Mzg3IDE3Ny40OCBdIC9QYXJlbnQgMiAwIFIgL1Jlc291cmNlcyA4IDAgUgovVHlwZSAvUGFnZSA+PgplbmRvYmoKOSAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDEyIDAgUiA+PgpzdHJlYW0KeJxNjrEOwjAMRHd/xX1BYsdpk45FlSLGsvABVQVUtAgqwe/jMgDDSb6T7XuCiXwrOK1gTKYXBAW+G5+XYTyUHYaV2PKZVCsXmkaryuz130pKLmbL+DeeiRa6I7nwkQZ2eduOWXOC1Oo44zHiiAW+DRuAGIAYAKPYpQbBVix1/H4ZZvi9oLuhp57eJg8oJwplbmRzdHJlYW0KZW5kb2JqCjEyIDAgb2JqCjE0MgplbmRvYmoKMTAgMCBvYmoKWyBdCmVuZG9iagozIDAgb2JqCjw8ID4+CmVuZG9iago0IDAgb2JqCjw8IC9BMSA8PCAvQ0EgMCAvVHlwZSAvRXh0R1N0YXRlIC9jYSAxID4+Ci9BMiA8PCAvQ0EgMSAvVHlwZSAvRXh0R1N0YXRlIC9jYSAxID4+ID4+CmVuZG9iago1IDAgb2JqCjw8ID4+CmVuZG9iago2IDAgb2JqCjw8ID4+CmVuZG9iago3IDAgb2JqCjw8IC9JMSAxMyAwIFIgPj4KZW5kb2JqCjEzIDAgb2JqCjw8IC9CaXRzUGVyQ29tcG9uZW50IDgKL0NvbG9yU3BhY2UgWy9JbmRleGVkIC9EZXZpY2VSR0IgMjIyICj////+/v79/f38/Pz7+/v6+vr5+fn4+Pj39/f19fX09PTz8/Py8vLx8fHw8PDv7+/u7u7t7e3s7Ozr6+vq6urp6eno6Ojn5+fm5ubl5eXk5OTj4+Pi4uLh4eHg4ODf39/e3t7d3d3c3Nzb29va2trZ2dnY2NjX19fW1tbV1dXU1NTT09PR0dHQ0NDPz8/Ozs7Nzc3MzMzLy8vJycnHx8fGxsbFxcXExMTDw8PCwsLBwcHAwMC/v7++vr69vb28vLy7u7u6urq5ubm4uLi3t7e2tra1tbW0tLSzs7OysrKwsLCvr6+urq6tra2srKyqqqqpqamoqKinp6elpaWkpKSioqKhoaGgoKCenp6cnJyampqZmZmYmJiXl5eWlpaVlZWUlJSTk5ORkZGPj4+NjY2Li4uKioqJiYmIiIiHh4eGhoaFhYWEhISDg4OCgoKAgIB+fn59fX18fHx7e3t5eXl4eHh3d3d2dnZ1dXV0dHRzc3NycnJxcXFwcHBvb29ubm5qampnZ2dmZmZkZGRjY2NiYmJgYGBfX19eXl5dXV1cXFxcXFxbW1taWlpZWVlYWFhXV1dWVlZVVVVUVFRTU1NRUVFQUFBPT09MTExLS0tKSkpJSUlISEhHR0dGRkZFRUVERERDQ0NCQkJBQUFAQEA/Pz8+Pj48PDw7Ozs6Ojo5OTk4ODg3Nzc1NTU0NDQzMzMyMjIxMTEwMDAvLy8uLi4sLCwrKysqKipcKFwoXCgnJycmJiYlJSUkJCQjIyMiIiI
gICAfHx8eHh4dHR0cHBwbGxsaGhoZGRkYGBgXFxcWFhYVFRUUFBQTExMSEhIREREQEBAPDw8ODg5cclxyXHIMDAwLCwtcblxuXG4JCQkICAgHBwcGBgYFBQUEBAQDAwMCAgIBAQEAAAApXQovRGVjb2RlUGFybXMgPDwgL0NvbG9ycyAxIC9Db2x1bW5zIDMyMSAvUHJlZGljdG9yIDEwID4+Ci9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9IZWlnaHQgMTY0IC9MZW5ndGggMTQgMCBSIC9TdWJ0eXBlIC9JbWFnZQovVHlwZSAvWE9iamVjdCAvV2lkdGggMzIxID4+CnN0cmVhbQp4nO2d+19M+R/HZ6ZRKWFGJRoUWdEWspVLqnHLJSqXZV1qI7llv+7azTJZwmZlKXeKWLnLZWklconUisxmhPlbvu85M6dpTufymflMzNr384c8zmVe8/48M5/z+ZxzOiP7H0KH7HMX8K8HDdKCBmlBg7SYDRqdxn8vDg3SxqFB2jg0SBuHBmnj0CBt3JdhsLa2dvTo0adPOymOFDRIi6MGHz16VFrapUsXuVwuk0VHR3d4jVI76fVarRaqmTHDKXHkoEFa0CAtDhnctGnTpEmTFK3ExMR0eI2ie9TV1cXHyxny8ujj7AIN0oIGabHDoMGg1+uLi4ujojw9PRVt6d69+86dHVyj6B5Tpkxh9Pn6+hoM9HF2gQZpITX45MmTtp9bW8g/xfn5+TKZLCODZ5PB0NLSIlyjaHWDBg1iDO60+UUKIB23Z8+ekBBoFyQmJUHJr15JxaFBW9CgOJ/FYE7O5MmThfwpFAUFBUQ1vnoVHh4O++/fb7P62rVry5cvV6kiIiKKi4VqFKnOYhDG94cOHRLdTzqusXH27NnQz7uZgFKZf8PCSktLRePQYCvONvjxY319/dq1a728eLx17Xr+/PmbJj58+EBU49On5lfu2mU06YTsy5cvL1ni7+/PZmZl2dtkBsZgfHy86E5Ecfn5YMzPz++XXzZv3swadHPz8vI6d+6ccBwabAUNEvBJDer1vP3e1KlTU1NTL160t8b9+82v79EjPT29Xz9u7MiRI/V6e5tsNG7ZskWpVMrlixcvFt6JKO7x48chIeDroqlpVVVVB0xotVpGYlBQ0MuXQnFo0Awa/FcYhMFzXt6bN28cqlGvT0pKgkGHNa5z585abUZGBrOQxdsLShisqxs+fDgznK6trRWtSjpOp9MpFMuWLbMZ2sPCli09evSAAtPShOLQoBmnGmxuboZVzNyGRa2OjIx89uyZdSf4X/+S73+2aJPhAJ6b+5UJOMiXlJQYjXPnzlWYDu0wc7SzyUBhodyC2WBR0UETR44cEXqFQFxlZaVarQ4IgEZxN715M2DAAHiH1FShODRoRIOuZxAmgjb9X3BwcFkZ9H+72gJd2sSJE3ftOnr0KHmTuZw4oVKp4B2Ep7SicVFRrMFJkyZNnz7dzY1ZgKktLPAenQXilixZwkyBeV5RVmaeJP/2m1AcGjSiQVc36OMDs8L8/OTkZO7ohgEmtgcPkjaZyzffMH2suqZGaA9Cgzz06lVRUUEYl5KSAp50Ou56mPTPnAlbhg4d+u6dUHVo0Oh8g+YhJItSqdFo2o6E29G1a3l5OVGTuTAGly5dKrwHoUH4PQa0xcfHRyaD3oc70uaNa2zs06cPeGr/Bps2bWJmdcW8Z3/RIAsadD2DUJGILz7OnDlD1GQbioqKunUbNWpUU1OT8E5EBmNjX79+bbOlrKzMzw+2VFdXS8c9f24+lWpzuG1oaMjMdHd3Z7aIVocG0eB/1CCMNLp166ZQzJC4a5LI4E8/cbfU19eHhvr5+XEnusKjGWgFO/WtqSksLJTJZJbGZfDeJGCNQ4PGT2QQpkrDhg0rLHz69Cn4io1tsykg4PLly0RNtrJjxw7mtYcPHxbdj8hgQoLNpxgW4uPj/fzOnz9PGLdq1Sr4rHp7j2Xw94cF+P2mpo4
YMcLNDQ0SxKFBVzPIOwVWqVS5JlauXMnd9MMPpE1maWiIiIiAV44eree9QkcY9+237IgafhHM+V+YyJaXjx8/HlYNHkweZzAYFi5cqFabj8mengkJCcxFdn+TzN27d4tWhwaNaND1DHLPsIoyZMiQykrSJrNYOkGFRCcoFffqFXsTNRAXF5eeDh7Y5Zwc++OYy+wHzp41Lz9/Dv9t1OoHDx6IVocG28Q5y+CVK1c0Go20vMDAwLNnDZwb6IkMJibCy3v37l1VJbWnRFxzc/PAgQM551Zh2KDT6d6/tz/Olt9/h4+06O0kaFAcNGh/nC2OGwROnTol4TArK+v48eOO1PjixYuvv4aEcePGSbdCOg4Ow4mJrDx3d/e9e4uKihyPawMzbThwQKo6NCgIlUGgvJzXXN++fc+YeMd78YqkxmvXrjE9AM+lNEfi7II8rrq6WqWCTzEadDQODdLGOcGgg0jHzZo1S6GIjY11UpxdkMfdvn2bmeKhQUfj0CBtnOsa/PPPTp06ma7jK9PT09vf8GhvnJOrs4IGaeNc1+CtW8whvV+/fvfv36ePsxPyuLdv3373nZeX1/XrUnFokB80SBvnuga/vDg0SBuHBmnj0CBtHBqkjcOnytOCBmlBg7SgQVrQIC1okBYczdDGoUHaODRIG4cGaePQIG0cGqSNQ4O0cWiQNg4N0sahQdq4T2rw3r17+SZ8fRUKBfvXk9ynCZPH2fDs2bPw8K1bt5JXd/PmzWHD5HJ5cPC0adM2btz4449Qmk6ny8iYMmVKoum2Tihx+vRFixY1NjYKx6FBNGjhizdYUjJ27NjQ0FBlKwrm7hmlUq1Wjx27evXq5mY74tqzfft2uVylUhFWd+zYsbCwsJ9/3rt3L+8bf/z48fXrkpKSDRtGjBjh7e2dklJfX88bhwbRoAVXNnjhwgXrwn7Og/WFa2xDWVmZWt1Gmo1BdiEzkzSOl4SEBLncw8ODsLrm5mapR8paePfuXW5uLvP3o7xxaFAKaoNRUXBEsi5qNBrII6mxDS9fvuzTBzzFxcXFt8Is9O/fnzXo4cFzJO0wg+QYDIYFCxagQXvjrKBBx+KsUBusqbExCPpslklrPHiQ96/tKyoqVq1aZekU16xZQxrHQa/Xx8TEmB7b2Et0P/sN3rkTHR0Nw+7Zs3kefYwGCXC+QTgWO2RQGDhQW6Z4jhs8efIk87ed27ZtE92PvLq3b99WVq5fv97Dw93dHUarf/8tFIcG+UGDtNU50WBuLhx+bdY43yB1P+hUgydOzJ8/v2fPnnI5/EhLu3v3rmgcGmwHGhThsxiMirKZFxsZgw4+gpsXZxhkv+mFyuCJE2lpacxf/UVFRSUmJp458573gSGcODTYSkcZTE7mroFBtfAJms9jMCIigt5gZKT5gSEpKW2ery0dhwZbQYMuaTAzM7P9iRhY2V4rUY28zJkzxzUM/vPP1atXV6xYERCgVCqDgoJ0uoaGBuk4NNgKGnRJg+0HzzAv1phITk6GjRqNzEKyRapdBpuakpKSmMvukODjw/MlzkRxpaVdunQBf76+Dx8+FN2TKK6uDkyuXLnS2zswMHDbNqFnExnRoBDOMwiyYGhpXYBPr6wVWIBVNTX7rZDXyHLlCnutzsfHZ8wYoRqlYgoKoCAwuHy51J52VXf3bqTp8CxyJwkaFAcNOhrHQm8QeruampoLF1hz0NXl5jJrLgifnSGvsaKiIjiYNThv3jwH41paWlJSQB/0WcInUeyvjqG+vj4yEvpY5gsyheLQoAhokKI6BjqDmZlgMMp0vR1+cOfBjhi8c+fOunXr8vJgHjxnDvzw9fVl/YWF8dwYJRHHAt0UM5geOnSo6H6EcVwaGgICAqKjo4Xj0KA4jhqsYa7QmUbMGs7pVTOc8/5SNRYXF8+bN3DgQN57t8LCwoSfSy3d5NOnT3t5gUEo9a+/RPfkiSP58vLs7Gwo9Y8/hOLQoBRoUCyu4wwy8kRutkxO5l48Eaq
RXcnOfq1PFWYXBg8enJ8v9EZEHVfv3mBw5syZYl98xxO3dOlSsbvQWGDMAPGmryvhj0ODUqBBwbgONSh1tzQzspaukaG2tjbYMnQWvo9648aNhHFc9u3b5+4OTRQa9QrHTZgwQau9LvqIRhOXLl2C+LVrheLQYMcYdJz2cdXV1bzSbBYcn9WFh4czw+kXL17YWd3Vq1djYz09PaOjMzIycnJyfv21rq6O+4qqqpCQECjw4kWhODSIBr98gy0tLZmZmVZpAwYM+P77Bw8eFBQUxMQoLYNqx+fF7qZekOjbYnjimprOnTuXnR0UFARdXWgoTNXHmNBqtXkm4uLiAgOhvg0bNgjHoUHXN2hkhlT+/gsXLgSD2dk3btywNmA3A82sLikpyXGDFh4+fHj48OFHj27dupWVlWXztVkzZoh8OSsaZEGDX77BLzoODdLGoUHaODRIG4cGaePQIG0cGqSNQ4O0cWiQNg4N0sahQdo4fKo8LWiQFjRICxqkBQ3S8n+rQtglCmVuZHN0cmVhbQplbmRvYmoKMTQgMCBvYmoKMzEyNAplbmRvYmoKMiAwIG9iago8PCAvQ291bnQgMSAvS2lkcyBbIDExIDAgUiBdIC9UeXBlIC9QYWdlcyA+PgplbmRvYmoKMTUgMCBvYmoKPDwgL0NyZWF0aW9uRGF0ZSAoRDoyMDIxMDkxNjE0NDE1NCswMicwMCcpCi9DcmVhdG9yIChNYXRwbG90bGliIHYzLjQuMywgaHR0cHM6Ly9tYXRwbG90bGliLm9yZykKL1Byb2R1Y2VyIChNYXRwbG90bGliIHBkZiBiYWNrZW5kIHYzLjQuMykgPj4KZW5kb2JqCnhyZWYKMCAxNgowMDAwMDAwMDAwIDY1NTM1IGYgCjAwMDAwMDAwMTYgMDAwMDAgbiAKMDAwMDAwNDkyNiAwMDAwMCBuIAowMDAwMDAwNjU5IDAwMDAwIG4gCjAwMDAwMDA2ODAgMDAwMDAgbiAKMDAwMDAwMDc3OSAwMDAwMCBuIAowMDAwMDAwODAwIDAwMDAwIG4gCjAwMDAwMDA4MjEgMDAwMDAgbiAKMDAwMDAwMDA2NSAwMDAwMCBuIAowMDAwMDAwNDAyIDAwMDAwIG4gCjAwMDAwMDA2MzkgMDAwMDAgbiAKMDAwMDAwMDIwOCAwMDAwMCBuIAowMDAwMDAwNjE5IDAwMDAwIG4gCjAwMDAwMDA4NTMgMDAwMDAgbiAKMDAwMDAwNDkwNSAwMDAwMCBuIAowMDAwMDA0OTg2IDAwMDAwIG4gCnRyYWlsZXIKPDwgL0luZm8gMTUgMCBSIC9Sb290IDEgMCBSIC9TaXplIDE2ID4+CnN0YXJ0eHJlZgo1MTQzCiUlRU9GCg==\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:41:54.410044\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}], "source": ["def show_imgs(imgs, title=None, row_size=4):\n", " # Form a grid of pictures (we use max. 8 columns)\n", " num_imgs = imgs.shape[0] if isinstance(imgs, torch.Tensor) else len(imgs)\n", " is_int = imgs.dtype == torch.int32 if isinstance(imgs, torch.Tensor) else imgs[0].dtype == torch.int32\n", " nrow = min(num_imgs, row_size)\n", " ncol = int(math.ceil(num_imgs / nrow))\n", " imgs = torchvision.utils.make_grid(imgs, nrow=nrow, pad_value=128 if is_int else 0.5)\n", " np_imgs = imgs.cpu().numpy()\n", " # Plot the grid\n", " plt.figure(figsize=(1.5 * nrow, 1.5 * ncol))\n", " plt.imshow(np.transpose(np_imgs, (1, 2, 0)), interpolation=\"nearest\")\n", " plt.axis(\"off\")\n", " if title is not None:\n", " plt.title(title)\n", " plt.show()\n", " plt.close()\n", "\n", "\n", "show_imgs([train_set[i][0] for i in range(8)])"]}, {"cell_type": "markdown", "id": "122fbad4", "metadata": {"papermill": {"duration": 0.031364, "end_time": "2021-09-16T12:41:54.509186", "exception": false, "start_time": "2021-09-16T12:41:54.477822", "status": "completed"}, "tags": []}, "source": ["## Normalizing Flows as generative model\n", "\n", "In the previous lectures, we have seen Energy-based models, Variational Autoencoders (VAEs)\n", "and Generative Adversarial Networks (GANs) as example of generative models.\n", "However, none of them explicitly learn the probability density function $p(x)$ of the real input data.\n", "While VAEs model a lower bound, energy-based models only implicitly learn the probability density.\n", "GANs on the other hand provide us a sampling mechanism for generating new data, without offering a likelihood estimate.\n", "The generative model we will look at here, called Normalizing Flows, actually models the true data distribution\n", "$p(x)$ and provides us with an exact likelihood estimate.\n", "Below, we can visually compare VAEs, GANs and Flows\n", "(figure credit - [Lilian 
Weng](https://lilianweng.github.io/lil-log/2018/10/13/flow-based-deep-generative-models.html)):\n", "\n", "
\n", "\n", "The major difference compared to VAEs is that flows use *invertible* functions $f$\n", "to map the input data $x$ to a latent representation $z$.\n", "To realize this, $z$ must be of the same shape as $x$.\n", "This is in contrast to VAEs where $z$ is usually much lower dimensional than the original input data.\n", "However, an invertible mapping also means that for every data point $x$, we have a corresponding latent representation\n", "$z$ which allows us to perform lossless reconstruction ($z$ to $x$).\n", "In the visualization above, this means that $x=x'$ for flows, no matter what invertible function $f$ and input $x$ we choose.\n", "\n", "Nonetheless, how are normalizing flows modeling a probability density with an invertible function?\n", "The answer to this question is the rule for change of variables.\n", "Specifically, given a prior density $p_z(z)$ (e.g. Gaussian) and an invertible function $f$,\n", "we can determine $p_x(x)$ as follows:\n", "\n", "$$\n", "\\begin{split}\n", " \\int p_x(x) dx & = \\int p_z(z) dz = 1 \\hspace{1cm}\\text{(by definition of a probability distribution)}\\\\\n", " \\Leftrightarrow p_x(x) & = p_z(z) \\left|\\frac{dz}{dx}\\right| = p_z(f(x)) \\left|\\frac{df(x)}{dx}\\right|\n", "\\end{split}\n", "$$\n", "\n", "Hence, in order to determine the probability of $x$, we only need to determine its probability in latent space,\n", "and get the derivative of $f$.\n", "Note that this is for a univariate distribution, and $f$ is required to be invertible and smooth.\n", "For a multivariate case, the derivative becomes a Jacobian of which we need to take the determinant.\n", "As we usually use the log-likelihood as objective, we write the multivariate term with logarithms below:\n", "\n", "$$\n", "\\log p_x(\\mathbf{x}) = \\log p_z(f(\\mathbf{x})) + \\log{} \\left|\\det \\frac{df(\\mathbf{x})}{d\\mathbf{x}}\\right|\n", "$$\n", "\n", "Although we now know how a normalizing flow obtains its likelihood, it might not be clear what a 
normalizing flow does intuitively.\n", "For this, we should look from the inverse perspective of the flow starting with the prior probability density $p_z(z)$.\n", "If we apply an invertible function on it, we effectively \"transform\" its probability density.\n", "For instance, if $f^{-1}(z)=z+1$, we shift the density by one while still remaining a valid probability distribution,\n", "and being invertible.\n", "We can also apply more complex transformations, like scaling: $f^{-1}(z)=2z+1$, but there you might see a difference.\n", "When you scale, you also change the volume of the probability density, as for example on uniform distributions\n", "(figure credit - [Eric Jang](https://blog.evjang.com/2018/01/nf1.html)):\n", "\n", "
\n", "\n", "You can see that the height of $p(y)$ should be lower than $p(x)$ after scaling.\n", "This change in volume represents $\\left|\\frac{df(x)}{dx}\\right|$ in our equation above,\n", "and ensures that even after scaling, we still have a valid probability distribution.\n", "We can go on with making our function $f$ more complex.\n", "However, the more complex $f$ becomes, the harder it will be to find the inverse $f^{-1}$ of it,\n", "and to calculate the log-determinant of the Jacobian $\\log{} \\left|\\det \\frac{df(\\mathbf{x})}{d\\mathbf{x}}\\right|$.\n", "An easier trick is to stack multiple invertible functions $f_{1,...,K}$ after each other, as all together,\n", "they still represent a single, invertible function.\n", "Using multiple, learnable invertible functions, a normalizing flow attempts to transform\n", "$p_z(z)$ slowly into a more complex distribution which should finally be $p_x(x)$.\n", "We visualize the idea below\n", "(figure credit - [Lilian Weng](https://lilianweng.github.io/lil-log/2018/10/13/flow-based-deep-generative-models.html)):\n", "\n", "
\n", "\n", "Starting from $z_0$, which follows the prior Gaussian distribution, we sequentially apply the invertible\n", "functions $f_1,f_2,...,f_K$, until $z_K$ represents $x$.\n", "Note that in the figure above, the functions $f$ represent the inverse of the function $f$ we had above\n", "(here: $f:Z\\to X$, above: $f:X\\to Z$).\n", "This is just a different notation and has no impact on the actual flow design because all $f$ need to be invertible anyway.\n", "When we estimate the log likelihood of a data point $x$ as in the equations above,\n", "we run the flows in the opposite direction to the one visualized above.\n", "Multiple flow layers have been proposed that use a neural network as learnable parameters,\n", "such as the planar and radial flow.\n", "However, we will focus here on flows that are commonly used in image\n", "modeling, and will discuss them in the rest of the notebook along with\n", "the details of how to train a normalizing flow."]}, {"cell_type": "markdown", "id": "3f9b2256", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.030707, "end_time": "2021-09-16T12:41:54.571000", "exception": false, "start_time": "2021-09-16T12:41:54.540293", "status": "completed"}, "tags": []}, "source": ["## Normalizing Flows on images\n", "\n", "
\n", "\n", "To become familiar with normalizing flows, especially for the application of image modeling,\n", "it is best to discuss the different elements in a flow along with the implementation.\n", "As a general concept, we want to build a normalizing flow that maps an input image (here MNIST) to an equally sized latent space:\n", "\n", "
\n", "\n", "As a first step, we will implement a template of a normalizing flow in PyTorch Lightning.\n", "During training and validation, a normalizing flow performs density estimation in the forward direction.\n", "For this, we apply a series of flow transformations on the input $x$ and estimate the probability\n", "of the input by determining the probability of the transformed point $z$ given a prior,\n", "and the change of volume caused by the transformations.\n", "During inference, we can do both density estimation and sampling new points by inverting the flow transformations.\n", "Therefore, we define a function `_get_likelihood` which performs density estimation,\n", "and `sample` to generate new examples.\n", "The functions `training_step`, `validation_step` and `test_step` all make use of `_get_likelihood`.\n", "\n", "The standard metric used in generative models, and in particular normalizing flows, is bits per dimension (bpd).\n", "Bpd is motivated from an information theory perspective and describes how many bits we would need to encode a particular example in our modeled distribution.\n", "The fewer bits we need, the more likely the example is under our distribution.\n", "When we test for the bits per dimension of our test dataset, we can judge whether our model generalizes to new samples of the dataset and didn't memorize the training dataset.\n", "In order to calculate the bits per dimension score, we can rely on the negative log-likelihood and change the log base (as bits use base 2 while the NLL is usually computed with the natural logarithm):\n", "\n", "$$\\text{bpd} = \\text{nll} \\cdot \\log_2\\left(\\exp(1)\\right) \\cdot \\left(\\prod d_i\\right)^{-1}$$\n", "\n", "where $d_1,...,d_K$ are the dimensions of the input.\n", "For images, this would be the height, width and channel number.\n", "We divide the log likelihood by these extra dimensions to have a metric which we can compare for different image resolutions.\n", "In the original image space, MNIST examples have a bits per 
dimension\n", "score of 8 (we need 8 bits to encode each pixel as there are 256\n", "possible values)."]}, {"cell_type": "code", "execution_count": 6, "id": "f731caad", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:41:54.645154Z", "iopub.status.busy": "2021-09-16T12:41:54.634808Z", "iopub.status.idle": "2021-09-16T12:41:54.647412Z", "shell.execute_reply": "2021-09-16T12:41:54.647011Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 0.045385, "end_time": "2021-09-16T12:41:54.647510", "exception": false, "start_time": "2021-09-16T12:41:54.602125", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class ImageFlow(pl.LightningModule):\n", " def __init__(self, flows, import_samples=8):\n", " \"\"\"\n", " Args:\n", " flows: A list of flows (each a nn.Module) that should be applied on the images.\n", " import_samples: Number of importance samples to use during testing (see explanation below). Can be changed at any time\n", " \"\"\"\n", " super().__init__()\n", " self.flows = nn.ModuleList(flows)\n", " self.import_samples = import_samples\n", " # Create prior distribution for final latent space\n", " self.prior = torch.distributions.normal.Normal(loc=0.0, scale=1.0)\n", " # Example input for visualizing the graph\n", " self.example_input_array = train_set[0][0].unsqueeze(dim=0)\n", "\n", " def forward(self, imgs):\n", " # The forward function is only used for visualizing the graph\n", " return self._get_likelihood(imgs)\n", "\n", " def encode(self, imgs):\n", " # Given a batch of images, return the latent representation z and ldj of the transformations\n", " z, ldj = imgs, torch.zeros(imgs.shape[0], device=self.device)\n", " for flow in self.flows:\n", " z, ldj = flow(z, ldj, reverse=False)\n", " return z, ldj\n", "\n", " def _get_likelihood(self, imgs, return_ll=False):\n", " \"\"\"Given a batch of images, return the likelihood of those.\n", "\n", " If return_ll is True, this function returns the log likelihood of the input. 
Otherwise, the ouptut metric is\n", " bits per dimension (scaled negative log likelihood)\n", " \"\"\"\n", " z, ldj = self.encode(imgs)\n", " log_pz = self.prior.log_prob(z).sum(dim=[1, 2, 3])\n", " log_px = ldj + log_pz\n", " nll = -log_px\n", " # Calculating bits per dimension\n", " bpd = nll * np.log2(np.exp(1)) / np.prod(imgs.shape[1:])\n", " return bpd.mean() if not return_ll else log_px\n", "\n", " @torch.no_grad()\n", " def sample(self, img_shape, z_init=None):\n", " \"\"\"Sample a batch of images from the flow.\"\"\"\n", " # Sample latent representation from prior\n", " if z_init is None:\n", " z = self.prior.sample(sample_shape=img_shape).to(device)\n", " else:\n", " z = z_init.to(device)\n", "\n", " # Transform z to x by inverting the flows\n", " ldj = torch.zeros(img_shape[0], device=device)\n", " for flow in reversed(self.flows):\n", " z, ldj = flow(z, ldj, reverse=True)\n", " return z\n", "\n", " def configure_optimizers(self):\n", " optimizer = optim.Adam(self.parameters(), lr=1e-3)\n", " # An scheduler is optional, but can help in flows to get the last bpd improvement\n", " scheduler = optim.lr_scheduler.StepLR(optimizer, 1, gamma=0.99)\n", " return [optimizer], [scheduler]\n", "\n", " def training_step(self, batch, batch_idx):\n", " # Normalizing flows are trained by maximum likelihood => return bpd\n", " loss = self._get_likelihood(batch[0])\n", " self.log(\"train_bpd\", loss)\n", " return loss\n", "\n", " def validation_step(self, batch, batch_idx):\n", " loss = self._get_likelihood(batch[0])\n", " self.log(\"val_bpd\", loss)\n", "\n", " def test_step(self, batch, batch_idx):\n", " # Perform importance sampling during testing => estimate likelihood M times for each image\n", " samples = []\n", " for _ in range(self.import_samples):\n", " img_ll = self._get_likelihood(batch[0], return_ll=True)\n", " samples.append(img_ll)\n", " img_ll = torch.stack(samples, dim=-1)\n", "\n", " # To average the probabilities, we need to go from log-space to exp, and 
back to log.\n", " # Logsumexp provides us a stable implementation for this\n", " img_ll = torch.logsumexp(img_ll, dim=-1) - np.log(self.import_samples)\n", "\n", " # Calculate final bpd\n", " bpd = -img_ll * np.log2(np.exp(1)) / np.prod(batch[0].shape[1:])\n", " bpd = bpd.mean()\n", "\n", " self.log(\"test_bpd\", bpd)"]}, {"cell_type": "markdown", "id": "bde3e5a1", "metadata": {"papermill": {"duration": 0.030814, "end_time": "2021-09-16T12:41:54.709142", "exception": false, "start_time": "2021-09-16T12:41:54.678328", "status": "completed"}, "tags": []}, "source": ["The `test_step` function differs from the training and validation step in that it makes use of importance sampling.\n", "We will discuss the motiviation and details behind this after\n", "understanding how flows model discrete images in continuous space."]}, {"cell_type": "markdown", "id": "2fbe3846", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.030971, "end_time": "2021-09-16T12:41:54.770996", "exception": false, "start_time": "2021-09-16T12:41:54.740025", "status": "completed"}, "tags": []}, "source": ["### Dequantization\n", "\n", "Normalizing flows rely on the rule of change of variables, which is naturally defined in continuous space.\n", "Applying flows directly on discrete data leads to undesired density models where arbitrarly high likelihood are placed on a few, particular values.\n", "See the illustration below:\n", "\n", "
\n", "\n", "The black points represent the discrete points, and the green volume the density modeled by a normalizing flow in continuous space.\n", "The flow would continue to increase the likelihood for $x=0,1,2,3$ while having no volume on any other point.\n", "Remember that in continuous space, we have the constraint that the overall volume of the probability density must be 1 ($\\int p(x)dx=1$).\n", "Otherwise, we don't model a probability distribution anymore.\n", "However, the discrete points $x=0,1,2,3$ represent delta peaks with no width in continuous space.\n", "This is why the flow can place an infinitely high likelihood on these few points while still representing a distribution in continuous space.\n", "Nonetheless, the learned density does not tell us anything about the distribution among the discrete points,\n", "as in discrete space, the likelihoods of those four points would have to sum to 1, not to infinity.\n", "\n", "To prevent such degenerate solutions, a common solution is to add a small amount of noise to each discrete value, which is also referred to as dequantization.\n", "Considering $x$ as an integer (as is the case for images), the dequantized representation $v$ can be formulated as $v=x+u$ where $u\\in[0,1)^D$.\n", "Thus, the discrete value $1$ is modeled by a distribution over the interval $[1.0, 2.0)$, the value $2$ by a volume over $[2.0, 3.0)$, etc.\n", "Our objective of modeling $p(x)$ becomes:\n", "\n", "$$ p(x) = \\int p(x+u)du = \\int \\frac{q(u|x)}{q(u|x)}p(x+u)du = \\mathbb{E}_{u\\sim q(u|x)}\\left[\\frac{p(x+u)}{q(u|x)} \\right]$$\n", "\n", "with $q(u|x)$ being the noise distribution.\n", "For now, we assume it to be uniform, which can also be written as $p(x)=\\mathbb{E}_{u\\sim U(0,1)^D}\\left[p(x+u) \\right]$.\n", "\n", "In the following, we will implement Dequantization as a flow transformation itself.\n", "After adding noise to the discrete values, we additionally transform the volume into a Gaussian-like shape.\n", 
"This is done by scaling $x+u$ between $0$ and $1$, and applying the invert of the sigmoid function $\\sigma(z)^{-1} = \\log z - \\log 1-z$.\n", "If we would not do this, we would face two problems:\n", "\n", "1.\n", "The input is scaled between 0 and 256 while the prior distribution is a Gaussian with mean $0$ and standard deviation $1$.\n", "In the first iterations after initializing the parameters of the flow, we would have extremely low likelihoods for large values like $256$.\n", "This would cause the training to diverge instantaneously.\n", "2.\n", "As the output distribution is a Gaussian, it is beneficial for the flow to have a similarly shaped input distribution.\n", "This will reduce the modeling complexity that is required by the flow.\n", "\n", "Overall, we can implement dequantization as follows:"]}, {"cell_type": "code", "execution_count": 7, "id": "14292232", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:41:54.841782Z", "iopub.status.busy": "2021-09-16T12:41:54.841282Z", "iopub.status.idle": "2021-09-16T12:41:54.843421Z", "shell.execute_reply": "2021-09-16T12:41:54.842957Z"}, "papermill": {"duration": 0.040991, "end_time": "2021-09-16T12:41:54.843517", "exception": false, "start_time": "2021-09-16T12:41:54.802526", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class Dequantization(nn.Module):\n", " def __init__(self, alpha=1e-5, quants=256):\n", " \"\"\"\n", " Args:\n", " alpha: small constant that is used to scale the original input.\n", " Prevents dealing with values very close to 0 and 1 when inverting the sigmoid\n", " quants: Number of possible discrete values (usually 256 for 8-bit image)\n", " \"\"\"\n", " super().__init__()\n", " self.alpha = alpha\n", " self.quants = quants\n", "\n", " def forward(self, z, ldj, reverse=False):\n", " if not reverse:\n", " z, ldj = self.dequant(z, ldj)\n", " z, ldj = self.sigmoid(z, ldj, reverse=True)\n", " else:\n", " z, ldj = self.sigmoid(z, ldj, reverse=False)\n", " z = 
z * self.quants\n", " ldj += np.log(self.quants) * np.prod(z.shape[1:])\n", " z = torch.floor(z).clamp(min=0, max=self.quants - 1).to(torch.int32)\n", " return z, ldj\n", "\n", " def sigmoid(self, z, ldj, reverse=False):\n", " # Applies an invertible sigmoid transformation\n", " if not reverse:\n", " ldj += (-z - 2 * F.softplus(-z)).sum(dim=[1, 2, 3])\n", " z = torch.sigmoid(z)\n", " else:\n", " z = z * (1 - self.alpha) + 0.5 * self.alpha # Scale to prevent boundaries 0 and 1\n", " ldj += np.log(1 - self.alpha) * np.prod(z.shape[1:])\n", " ldj += (-torch.log(z) - torch.log(1 - z)).sum(dim=[1, 2, 3])\n", " z = torch.log(z) - torch.log(1 - z)\n", " return z, ldj\n", "\n", " def dequant(self, z, ldj):\n", " # Transform discrete values to continuous volumes\n", " z = z.to(torch.float32)\n", " z = z + torch.rand_like(z).detach()\n", " z = z / self.quants\n", " ldj -= np.log(self.quants) * np.prod(z.shape[1:])\n", " return z, ldj"]}, {"cell_type": "markdown", "id": "d1d08852", "metadata": {"papermill": {"duration": 0.030723, "end_time": "2021-09-16T12:41:54.905082", "exception": false, "start_time": "2021-09-16T12:41:54.874359", "status": "completed"}, "tags": []}, "source": ["A good check whether a flow is correctly implemented or not, is to verify that it is invertible.\n", "Hence, we will dequantize a randomly chosen training image, and then quantize it again.\n", "We would expect that we would get the exact same image out:"]}, {"cell_type": "code", "execution_count": 8, "id": "728daf90", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:41:54.972326Z", "iopub.status.busy": "2021-09-16T12:41:54.971852Z", "iopub.status.idle": "2021-09-16T12:41:54.978174Z", "shell.execute_reply": "2021-09-16T12:41:54.977694Z"}, "papermill": {"duration": 0.042049, "end_time": "2021-09-16T12:41:54.978271", "exception": false, "start_time": "2021-09-16T12:41:54.936222", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": 
["Global seed set to 42\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Dequantization was not invertible.\n", "Original value: 0\n", "Reconstructed value: 1\n"]}], "source": ["# Testing invertibility of dequantization layer\n", "pl.seed_everything(42)\n", "orig_img = train_set[0][0].unsqueeze(dim=0)\n", "ldj = torch.zeros(\n", " 1,\n", ")\n", "dequant_module = Dequantization()\n", "deq_img, ldj = dequant_module(orig_img, ldj, reverse=False)\n", "reconst_img, ldj = dequant_module(deq_img, ldj, reverse=True)\n", "\n", "d1, d2 = torch.where(orig_img.squeeze() != reconst_img.squeeze())\n", "if len(d1) != 0:\n", " print(\"Dequantization was not invertible.\")\n", " for i in range(d1.shape[0]):\n", " print(\"Original value:\", orig_img[0, 0, d1[i], d2[i]].item())\n", " print(\"Reconstructed value:\", reconst_img[0, 0, d1[i], d2[i]].item())\n", "else:\n", " print(\"Successfully inverted dequantization\")\n", "\n", "# Layer is not strictly invertible due to float precision constraints\n", "# assert (orig_img == reconst_img).all().item()"]}, {"cell_type": "markdown", "id": "063694b6", "metadata": {"papermill": {"duration": 0.031526, "end_time": "2021-09-16T12:41:55.042165", "exception": false, "start_time": "2021-09-16T12:41:55.010639", "status": "completed"}, "tags": []}, "source": ["In contrast to our expectation, the test fails.\n", "However, this is no reason to doubt our implementation here as only one single value is not equal to the original.\n", "This is caused due to numerical inaccuracies in the sigmoid invert.\n", "While the input space to the inverted sigmoid is scaled between 0 and 1, the output space is between $-\\infty$ and $\\infty$.\n", "And as we use 32 bits to represent the numbers (in addition to applying logs over and over again),\n", "such inaccuries can occur and should not be worrisome.\n", "Nevertheless, it is good to be aware of them, and can be improved by using a double tensor (float64).\n", "\n", "Finally, we can take our 
dequantization and actually visualize the\n", "distribution it transforms the discrete values into:"]}, {"cell_type": "code", "execution_count": 9, "id": "9e42101f", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:41:55.118016Z", "iopub.status.busy": "2021-09-16T12:41:55.117517Z", "iopub.status.idle": "2021-09-16T12:41:55.544694Z", "shell.execute_reply": "2021-09-16T12:41:55.545080Z"}, "papermill": {"duration": 0.469437, "end_time": "2021-09-16T12:41:55.545218", "exception": false, "start_time": "2021-09-16T12:41:55.075781", "status": "completed"}, "tags": []}, "outputs": [{"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:41:55.273989\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}], "source": ["\n", "\n", "def visualize_dequantization(quants, prior=None):\n", " \"\"\"Function for visualizing the dequantization values of discrete values in continuous space.\"\"\"\n", " # Prior over discrete values. If not given, a uniform is assumed\n", " if prior is None:\n", " prior = np.ones(quants, dtype=np.float32) / quants\n", " prior = prior / prior.sum() * quants # In the following, we assume 1 for each value means uniform distribution\n", "\n", " inp = torch.arange(-4, 4, 0.01).view(-1, 1, 1, 1) # Possible continuous values we want to consider\n", " ldj = torch.zeros(inp.shape[0])\n", " dequant_module = Dequantization(quants=quants)\n", " # Invert dequantization on continuous values to find corresponding discrete value\n", " out, ldj = dequant_module.forward(inp, ldj, reverse=True)\n", " inp, out, prob = inp.squeeze().numpy(), out.squeeze().numpy(), ldj.exp().numpy()\n", " prob = prob * prior[out] # Probability scaled by categorical prior\n", "\n", " # Plot volumes and continuous distribution\n", " sns.set_style(\"white\")\n", " _ = plt.figure(figsize=(6, 3))\n", " x_ticks = []\n", " for v in np.unique(out):\n", " indices = np.where(out == v)\n", " color = to_rgb(\"C%i\" % v)\n", " plt.fill_between(inp[indices], prob[indices], np.zeros(indices[0].shape[0]), color=color + (0.5,), label=str(v))\n", " plt.plot([inp[indices[0][0]]] * 2, [0, prob[indices[0][0]]], color=color)\n", " plt.plot([inp[indices[0][-1]]] * 2, [0, prob[indices[0][-1]]], color=color)\n", " x_ticks.append(inp[indices[0][0]])\n", " x_ticks.append(inp.max())\n", " plt.xticks(x_ticks, [\"%.1f\" % x for x in x_ticks])\n", " plt.plot(inp, prob, color=(0.0, 0.0, 0.0))\n", " # Set final plot properties\n", " plt.ylim(0, prob.max() * 1.1)\n", " plt.xlim(inp.min(), inp.max())\n", " plt.xlabel(\"z\")\n", " plt.ylabel(\"Probability\")\n", " plt.title(\"Dequantization distribution for %i discrete values\" % quants)\n", " plt.legend()\n", " 
plt.show()\n", " plt.close()\n", "\n", "\n", "visualize_dequantization(quants=8)"]}, {"cell_type": "markdown", "id": "b4e465fe", "metadata": {"papermill": {"duration": 0.034926, "end_time": "2021-09-16T12:41:55.616011", "exception": false, "start_time": "2021-09-16T12:41:55.581085", "status": "completed"}, "tags": []}, "source": ["The visualized distribution show the sub-volumes that are assigned to the different discrete values.\n", "The value $0$ has its volume between $[-\\infty, -1.9)$, the value $1$ is represented by the interval $[-1.9, -1.1)$, etc.\n", "The volume for each discrete value has the same probability mass.\n", "That's why the volumes close to the center (e.g. 3 and 4) have a smaller area on the z-axis as others\n", "($z$ is being used to denote the output of the whole dequantization flow).\n", "\n", "Effectively, the consecutive normalizing flow models discrete images by the following objective:\n", "\n", "$$\\log p(x) = \\log \\mathbb{E}_{u\\sim q(u|x)}\\left[\\frac{p(x+u)}{q(u|x)} \\right] \\geq \\mathbb{E}_{u}\\left[\\log \\frac{p(x+u)}{q(u|x)} \\right]$$\n", "\n", "Although normalizing flows are exact in likelihood, we have a lower bound.\n", "Specifically, this is an example of the Jensen inequality because we need to move the log into the expectation so we can use Monte-carlo estimates.\n", "In general, this bound is considerably smaller than the ELBO in variational autoencoders.\n", "Actually, we can reduce the bound ourselves by estimating the expectation not by one, but by $M$ samples.\n", "In other words, we can apply importance sampling which leads to the following inequality:\n", "\n", "$$\\log p(x) = \\log \\mathbb{E}_{u\\sim q(u|x)}\\left[\\frac{p(x+u)}{q(u|x)} \\right] \\geq \\mathbb{E}_{u}\\left[\\log \\frac{1}{M} \\sum_{m=1}^{M} \\frac{p(x+u_m)}{q(u_m|x)} \\right] \\geq \\mathbb{E}_{u}\\left[\\log \\frac{p(x+u)}{q(u|x)} \\right]$$\n", "\n", "The importance sampling $\\frac{1}{M} \\sum_{m=1}^{M} \\frac{p(x+u_m)}{q(u_m|x)}$ 
becomes\n", "$\\mathbb{E}_{u\\sim q(u|x)}\\left[\\frac{p(x+u)}{q(u|x)} \\right]$ if $M\\to \\infty$,\n", "so that the more samples we use, the tighter the bound is.\n", "During testing, we can make use of this property and have it implemented in `test_step` in `ImageFlow`.\n", "In theory, we could also use this tighter bound during training.\n", "However, related work has shown that this does not necessarily lead to\n", "an improvement given the additional computational cost, and it is more\n", "efficient to stick with a single estimate [5]."]}, {"cell_type": "markdown", "id": "decab6f5", "metadata": {"papermill": {"duration": 0.03541, "end_time": "2021-09-16T12:41:55.686454", "exception": false, "start_time": "2021-09-16T12:41:55.651044", "status": "completed"}, "tags": []}, "source": ["### Variational Dequantization\n", "\n", "Dequantization uses a uniform distribution for the noise $u$ which effectively leads to images being represented as hypercubes\n", "(cube in high dimensions) with sharp borders.\n", "However, modeling such sharp borders is not easy for a flow as it uses smooth transformations to convert it into a Gaussian distribution.\n", "\n", "Another way of looking at it is if we change the prior distribution in the previous visualization.\n", "Imagine we have independent Gaussian noise on pixels which is commonly the case for any real-world taken picture.\n", "Therefore, the flow would have to model a distribution as above, but with the individual volumes scaled as follows:"]}, {"cell_type": "code", "execution_count": 10, "id": "a67d1060", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:41:55.760055Z", "iopub.status.busy": "2021-09-16T12:41:55.759590Z", "iopub.status.idle": "2021-09-16T12:41:56.167204Z", "shell.execute_reply": "2021-09-16T12:41:56.167593Z"}, "papermill": {"duration": 0.446187, "end_time": "2021-09-16T12:41:56.167737", "exception": false, "start_time": "2021-09-16T12:41:55.721550", "status": "completed"}, "tags": []}, 
"outputs": [{"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:41:55.917189\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}], "source": ["visualize_dequantization(quants=8, prior=np.array([0.075, 0.2, 0.4, 0.2, 0.075, 0.025, 0.0125, 0.0125]))"]}, {"cell_type": "markdown", "id": "cbe2bafd", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.039099, "end_time": "2021-09-16T12:41:56.246361", "exception": false, "start_time": "2021-09-16T12:41:56.207262", "status": "completed"}, "tags": []}, "source": ["Transforming such a probability into a Gaussian is a difficult task, especially with such hard borders.\n", "Dequantization has therefore been extended to more sophisticated, learnable distributions beyond uniform in a variational framework.\n", "In particular, if we remember the learning objective\n", "$\\log p(x) = \\log \\mathbb{E}_{u}\\left[\\frac{p(x+u)}{q(u|x)} \\right]$,\n", "the uniform distribution can be replaced by a learned distribution $q_{\\theta}(u|x)$ with support over $u\\in[0,1)^D$.\n", "This approach is called Variational Dequantization and has been proposed by Ho et al.\n", "[3].\n", "How can we learn such a distribution?\n", "We can use a second normalizing flow that takes $x$ as external input and learns a flexible distribution over $u$.\n", "To ensure a support over $[0,1)^D$, we can apply a sigmoid activation function as final flow transformation.\n", "\n", "Inheriting the original dequantization class, we can implement variational dequantization as follows:"]}, {"cell_type": "code", "execution_count": 11, "id": "5b61f162", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:41:56.333681Z", "iopub.status.busy": "2021-09-16T12:41:56.333192Z", "iopub.status.idle": "2021-09-16T12:41:56.335214Z", "shell.execute_reply": "2021-09-16T12:41:56.334809Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 0.049683, "end_time": "2021-09-16T12:41:56.335320", "exception": false, "start_time": "2021-09-16T12:41:56.285637", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class 
VariationalDequantization(Dequantization):\n", " def __init__(self, var_flows, alpha=1e-5):\n", " \"\"\"\n", " Args:\n", " var_flows: A list of flow transformations to use for modeling q(u|x)\n", " alpha: Small constant, see Dequantization for details\n", " \"\"\"\n", " super().__init__(alpha=alpha)\n", " self.flows = nn.ModuleList(var_flows)\n", "\n", " def dequant(self, z, ldj):\n", " z = z.to(torch.float32)\n", " img = (z / 255.0) * 2 - 1 # We condition the flows on x, i.e. the original image\n", "\n", " # Prior of u is a uniform distribution as before\n", " # As most flow transformations are defined on [-infinity,+infinity], we apply an inverse sigmoid first.\n", " deq_noise = torch.rand_like(z).detach()\n", " deq_noise, ldj = self.sigmoid(deq_noise, ldj, reverse=True)\n", " for flow in self.flows:\n", " deq_noise, ldj = flow(deq_noise, ldj, reverse=False, orig_img=img)\n", " deq_noise, ldj = self.sigmoid(deq_noise, ldj, reverse=False)\n", "\n", " # After the flows, apply u as in standard dequantization\n", " z = (z + deq_noise) / 256.0\n", " ldj -= np.log(256.0) * np.prod(z.shape[1:])\n", " return z, ldj"]}, {"cell_type": "markdown", "id": "80820d23", "metadata": {"papermill": {"duration": 0.03912, "end_time": "2021-09-16T12:41:56.414896", "exception": false, "start_time": "2021-09-16T12:41:56.375776", "status": "completed"}, "tags": []}, "source": ["Variational dequantization can be used as a substitute for dequantization.\n", "We will compare dequantization and variational dequantization in later experiments."]}, {"cell_type": "markdown", "id": "a46fc99c", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.038999, "end_time": "2021-09-16T12:41:56.493208", "exception": false, "start_time": "2021-09-16T12:41:56.454209", "status": "completed"}, "tags": []}, "source": ["### Coupling layers\n", "\n", "
\n", "\n", "Next, we look at possible transformations to apply inside the flow.\n", "A recent popular flow layer, which works well in combination with deep neural networks,\n", "is the coupling layer introduced by Dinh et al.\n", "[1].\n", "The input $z$ is arbitrarily split into two parts, $z_{1:j}$ and $z_{j+1:d}$, of which the first remains unchanged by the flow.\n", "Yet, $z_{1:j}$ is used to parameterize the transformation for the second part, $z_{j+1:d}$.\n", "Various transformations have been proposed in recent times [3,4], but here we will settle for the simplest and most efficient one: affine coupling.\n", "In this coupling layer, we apply an affine transformation by shifting the input by a bias $\\mu$ and scaling it by $\\sigma$.\n", "In other words, our transformation looks as follows:\n", "\n", "$$z'_{j+1:d} = \\mu_{\\theta}(z_{1:j}) + \\sigma_{\\theta}(z_{1:j}) \\odot z_{j+1:d}$$\n", "\n", "The functions $\\mu$ and $\\sigma$ are implemented as a shared neural network,\n", "and the sum and multiplication are performed element-wise.\n", "The LDJ is thereby the sum of the logs of the scaling factors: $\\sum_i \\left[\\log \\sigma_{\\theta}(z_{1:j})\\right]_i$.\n", "Inverting the layer can be done as simply as subtracting the bias and dividing by the scale:\n", "\n", "$$z_{j+1:d} = \\left(z'_{j+1:d} - \\mu_{\\theta}(z_{1:j})\\right) / \\sigma_{\\theta}(z_{1:j})$$\n", "\n", "We can also visualize the coupling layer in form of a computation graph,\n", "where $z_1$ represents $z_{1:j}$, and $z_2$ represents $z_{j+1:d}$:\n", "\n", "
\n", "\n", "In our implementation, we will realize the splitting of variables as masking.\n", "The variables to be transformed, $z_{j+1:d}$, are masked when passing $z$ to the shared network to predict the transformation parameters.\n", "When applying the transformation, we mask the parameters for $z_{1:j}$\n", "so that we have an identity operation for those variables:"]}, {"cell_type": "code", "execution_count": 12, "id": "89c6ff25", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:41:56.579882Z", "iopub.status.busy": "2021-09-16T12:41:56.574501Z", "iopub.status.idle": "2021-09-16T12:41:56.581937Z", "shell.execute_reply": "2021-09-16T12:41:56.581514Z"}, "papermill": {"duration": 0.048905, "end_time": "2021-09-16T12:41:56.582037", "exception": false, "start_time": "2021-09-16T12:41:56.533132", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class CouplingLayer(nn.Module):\n", " def __init__(self, network, mask, c_in):\n", " \"\"\"Coupling layer inside a normalizing flow.\n", "\n", " Args:\n", " network: A PyTorch nn.Module constituting the deep neural network for mu and sigma.\n", " Output shape should be twice the channel size as the input.\n", " mask: Binary mask (0 or 1) where 0 denotes that the element should be transformed,\n", " while 1 means the latent will be used as input to the NN.\n", " c_in: Number of input channels\n", " \"\"\"\n", " super().__init__()\n", " self.network = network\n", " self.scaling_factor = nn.Parameter(torch.zeros(c_in))\n", " # Register mask as buffer as it is a tensor which is not a parameter,\n", " # but should be part of the modules state.\n", " self.register_buffer(\"mask\", mask)\n", "\n", " def forward(self, z, ldj, reverse=False, orig_img=None):\n", " \"\"\"\n", " Args:\n", " z: Latent input to the flow\n", " ldj: The current ldj of the previous flows.\n", " The ldj of this layer will be added to this tensor.\n", " reverse: If True, we apply the inverse of the layer.\n", " orig_img (optional): 
Only needed in VarDeq. Allows external\n", " input to condition the flow on (e.g. original image)\n", " \"\"\"\n", " # Apply network to masked input\n", " z_in = z * self.mask\n", " if orig_img is None:\n", " nn_out = self.network(z_in)\n", " else:\n", " nn_out = self.network(torch.cat([z_in, orig_img], dim=1))\n", " s, t = nn_out.chunk(2, dim=1)\n", "\n", " # Stabilize scaling output\n", " s_fac = self.scaling_factor.exp().view(1, -1, 1, 1)\n", " s = torch.tanh(s / s_fac) * s_fac\n", "\n", " # Mask outputs (only transform the second part)\n", " s = s * (1 - self.mask)\n", " t = t * (1 - self.mask)\n", "\n", " # Affine transformation\n", " if not reverse:\n", " # Whether we first shift and then scale, or the other way round,\n", " # is a design choice, and usually does not have a big impact\n", " z = (z + t) * torch.exp(s)\n", " ldj += s.sum(dim=[1, 2, 3])\n", " else:\n", " z = (z * torch.exp(-s)) - t\n", " ldj -= s.sum(dim=[1, 2, 3])\n", "\n", " return z, ldj"]}, {"cell_type": "markdown", "id": "42bd2031", "metadata": {"papermill": {"duration": 0.039104, "end_time": "2021-09-16T12:41:56.660313", "exception": false, "start_time": "2021-09-16T12:41:56.621209", "status": "completed"}, "tags": []}, "source": ["For stabilization purposes, we apply a $\\tanh$ activation function on the scaling output.\n", "This prevents sudden large output values for the scaling that can destabilize training.\n", "To still allow scaling factors smaller or larger than -1 and 1 respectively,\n", "we have a learnable parameter per dimension, called `scaling_factor`.\n", "This scales the tanh to different limits.\n", "Below, we visualize the effect of the scaling factor on the output activation of the scaling terms:"]}, {"cell_type": "code", "execution_count": 13, "id": "c1bed75e", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:41:56.769037Z", "iopub.status.busy": "2021-09-16T12:41:56.743280Z", "iopub.status.idle": "2021-09-16T12:41:57.496549Z", "shell.execute_reply": 
"2021-09-16T12:41:57.496937Z"}, "papermill": {"duration": 0.797388, "end_time": "2021-09-16T12:41:57.497082", "exception": false, "start_time": "2021-09-16T12:41:56.699694", "status": "completed"}, "tags": []}, "outputs": [{"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:41:57.058315\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}], "source": ["with torch.no_grad():\n", " x = torch.arange(-5, 5, 0.01)\n", " scaling_factors = [0.5, 1, 2]\n", " sns.set()\n", " fig, ax = plt.subplots(1, 3, figsize=(12, 3))\n", " for i, scale in enumerate(scaling_factors):\n", " y = torch.tanh(x / scale) * scale\n", " ax[i].plot(x.numpy(), y.numpy())\n", " ax[i].set_title(\"Scaling factor: \" + str(scale))\n", " ax[i].set_ylim(-3, 3)\n", " plt.subplots_adjust(wspace=0.4)\n", " sns.reset_orig()\n", " plt.show()"]}, {"cell_type": "markdown", "id": "12dba007", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.041344, "end_time": "2021-09-16T12:41:57.581362", "exception": false, "start_time": "2021-09-16T12:41:57.540018", "status": "completed"}, "tags": []}, "source": ["Coupling layers generalize to any masking technique we could think of.\n", "However, the most common approach for images is to split the input $z$ in half, using a checkerboard mask or channel mask.\n", "A checkerboard mask splits the variables across the height and width dimensions and assigns every other pixel to $z_{j+1:d}$.\n", "Thereby, the mask is shared across channels.\n", "In contrast, the channel mask assigns half of the channels to $z_{j+1:d}$, and the other half to $z_{1:j}$.\n", "Note that when we apply multiple coupling layers, we invert the masking for every other layer so that each variable is transformed a similar number of times.\n", "\n", "Let's implement a function that creates a checkerboard mask and a channel mask for us:"]}, {"cell_type": "code", "execution_count": 14, "id": "deef0879", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:41:57.685569Z", "iopub.status.busy": "2021-09-16T12:41:57.685029Z", "iopub.status.idle": "2021-09-16T12:41:57.686454Z", "shell.execute_reply": "2021-09-16T12:41:57.686034Z"}, "papermill": {"duration": 0.063936, "end_time": "2021-09-16T12:41:57.686559", "exception": false, "start_time": "2021-09-16T12:41:57.622623", 
"status": "completed"}, "tags": []}, "outputs": [], "source": ["def create_checkerboard_mask(h, w, invert=False):\n", " x, y = torch.arange(h, dtype=torch.int32), torch.arange(w, dtype=torch.int32)\n", " xx, yy = torch.meshgrid(x, y)\n", " mask = torch.fmod(xx + yy, 2)\n", " mask = mask.to(torch.float32).view(1, 1, h, w)\n", " if invert:\n", " mask = 1 - mask\n", " return mask\n", "\n", "\n", "def create_channel_mask(c_in, invert=False):\n", " mask = torch.cat([torch.ones(c_in // 2, dtype=torch.float32), torch.zeros(c_in - c_in // 2, dtype=torch.float32)])\n", " mask = mask.view(1, c_in, 1, 1)\n", " if invert:\n", " mask = 1 - mask\n", " return mask"]}, {"cell_type": "markdown", "id": "613e51d7", "metadata": {"papermill": {"duration": 0.041153, "end_time": "2021-09-16T12:41:57.769008", "exception": false, "start_time": "2021-09-16T12:41:57.727855", "status": "completed"}, "tags": []}, "source": ["We can also visualize the corresponding masks for an image of size $8\\times 8\\times 2$ (2 channels):"]}, {"cell_type": "code", "execution_count": 15, "id": "6b1bfc65", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:41:57.857339Z", "iopub.status.busy": "2021-09-16T12:41:57.856865Z", "iopub.status.idle": "2021-09-16T12:41:57.988833Z", "shell.execute_reply": "2021-09-16T12:41:57.988350Z"}, "papermill": {"duration": 0.177754, "end_time": "2021-09-16T12:41:57.988944", "exception": false, "start_time": "2021-09-16T12:41:57.811190", "status": "completed"}, "tags": []}, "outputs": [{"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:41:57.893557\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}, {"data": {"application/pdf": "JVBERi0xLjQKJazcIKu6CjEgMCBvYmoKPDwgL1BhZ2VzIDIgMCBSIC9UeXBlIC9DYXRhbG9nID4+CmVuZG9iago4IDAgb2JqCjw8IC9FeHRHU3RhdGUgNCAwIFIgL0ZvbnQgMyAwIFIgL1BhdHRlcm4gNSAwIFIKL1Byb2NTZXQgWyAvUERGIC9UZXh0IC9JbWFnZUIgL0ltYWdlQyAvSW1hZ2VJIF0gL1NoYWRpbmcgNiAwIFIKL1hPYmplY3QgNyAwIFIgPj4KZW5kb2JqCjExIDAgb2JqCjw8IC9Bbm5vdHMgMTAgMCBSIC9Db250ZW50cyA5IDAgUgovR3JvdXAgPDwgL0NTIC9EZXZpY2VSR0IgL1MgL1RyYW5zcGFyZW5jeSAvVHlwZSAvR3JvdXAgPj4KL01lZGlhQm94IFsgMCAwIDE2My44OSAxMTEuMDY1IF0gL1BhcmVudCAyIDAgUiAvUmVzb3VyY2VzIDggMCBSIC9UeXBlIC9QYWdlCj4+CmVuZG9iago5IDAgb2JqCjw8IC9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9MZW5ndGggMTIgMCBSID4+CnN0cmVhbQp4nE2OMU/DQAyFd/+KN8LQu3uXS5MbW0oj2IpOYkAdqjRtKU1QiAR/Hx9SgcGyn+3nz8RZ7II4TnA4a3yBaGBX3edr2z01S7STzJwOeuG8MHXU8nItSRo3L7WhK3/iJDLIiMr4n2CIJkTUNGXAR4dnDLALn5lUJpXp0KiBZQY51P7X2/awD8TqHRvZYLz6HI7/vVnLKNScH0ERja8K+hIxmCroFVkm2DVBj3SQDEl7ecHN3Wk3DN0F/W56u8UW6VHukyhLvgGjfD17CmVuZHN0cmVhbQplbmRvYmoKMTIgMCBvYmoKMjAyCmVuZG9iagoxMCAwIG9iagpbIF0KZW5kb2JqCjE4IDAgb2JqCjw8IC9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9MZW5ndGggMjM1ID4+CnN0cmVhbQp4nDVRSW4AMQi75xX+QKWwJ++Zquqh/f+1hlEvAwPY2CTvwUYkPsSQ7ihXfMrqNMvwO1nkxc9K4eS9iAqkKsIKaQfPclYzDJ4bmQKXM/FZZj6ZFjsWUE3EcXbkNINBiGlcR8vpMNM86Am5PhhxY6dZrmJI691Svb7X8p8qykfW3Sy3TtnUSt2iZ+xJXHZeT21pXxh1FDcFkQ4fO7wH+SLmLC46kW72mymHlaQhOC2AH4mhVM8OrxEmfmYkeMqeTu+jNLz2QdP1vXtBR24mZCq3UEYqnqw0xoyh+o1oJqnv/4Ge9b2+/gBDTVS5CmVuZHN0cmVhbQplbmRvYmoKMTkgMCBvYmoKPDwgL0ZpbHRlciAvRmxhdGVEZWNvZGUgL0xlbmd0aCAzMDcgPj4Kc3RyZWFtCnicPZJLbgMxDEP3PoUuEMD62Z7zpCi6mN5/2ycl6Yoc2RZFapa6TFlTHpA0k4R/6fBwsZ3yO2zPZmbgWqKXieWU59AVYu6ifNnMRl1ZJ8XqhGY6t+hRORcHNk2qn6sspd0ueA7XJp5b9hE/vNCgHtQ1Lgk3dFejZSk0Y6r7f9J7/Iwy4GpMXWxSq3sfPF5EVejoB0eJImOXF+fjQQnpSsJoWoiVd0UDQe7ytMp7Ce7b3mrIsgepmM47KWaw63RSLm4XhyEeyPKo8OWj2GtCz/iwKyX0SNiGM3In7mjG5tTI4pD+3o0ES4+uaCHz4K9u1i5gvFM6RWJkTnKsaYtVTvdQFNO5w70MEPVsRUMpc5HV6l/DzgtrlmwWeEr6BR6j3SZLDlbZ26hO76082dD3H1rXdB8KZW5kc3RyZWFtCmVuZG9iagoyMCAwIG9iago8PCAvRmlsdG
VyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDI0OSA+PgpzdHJlYW0KeJw9UDuORCEM6zmFL/Ak8iNwHkarLWbv364DmilQTH62MyTQEYFHDDGUr+MlraCugb+LQvFu4uuDwiCrQ1IgznoPiHTspjaREzodnDM/YTdjjsBFMQac6XSmPQcmOfvCCoRzG2XsVkgniaoijuozjimeKnufeBYs7cg2WyeSPeQg4VJSicmln5TKP23KlAo6ZtEELBK54GQTTTjLu0lSjBmUMuoepnYifaw8yKM66GRNzqwjmdnTT9uZ+Bxwt1/aZE6Vx3QezPictM6DORW69+OJNgdNjdro7PcTaSovUrsdWp1+dRKV3RjnGBKXZ38Z32T/+Qf+h1oiCmVuZHN0cmVhbQplbmRvYmoKMjEgMCBvYmoKPDwgL0ZpbHRlciAvRmxhdGVEZWNvZGUgL0xlbmd0aCAxNjQgPj4Kc3RyZWFtCnicRZDHcQUxDEPvqgIlMIAK9azH8w/r/q+G9NNBehhCDGJPwrBcV3FhdMOPty0zDX9HGe7G+jJjvNVYICfoAwyRiavRpPp2xRmq9OTVYq6jolwvOiISzJLjq0AjfDqyx5O2tjP9dF4f7CHvE/8qKuduYQEuqu5A+VIf8dSP2VHqmqGPKitrHmraV4RdEUrbPi6nMk7dvQNa4b2Vqz3a7z8edjryCmVuZHN0cmVhbQplbmRvYmoKMjIgMCBvYmoKPDwgL0ZpbHRlciAvRmxhdGVEZWNvZGUgL0xlbmd0aCA4MyA+PgpzdHJlYW0KeJw9zDkSgDAIBdCeU/wjhMgi93Eci3j/VjDRBh6reqAhOIO6wa3hYMq6dBPvU+PVxpwSCah4Sk2Wugt61LS+1L5o4Lvr5kvViT/NzxedD7sdGd0KZW5kc3RyZWFtCmVuZG9iagoyMyAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDQ3ID4+CnN0cmVhbQp4nDMyt1AwULA0ARKGFiYK5mYGCimGXJYQVi4XTCwHzALRlnAKIp7BlQYAuWcNJwplbmRzdHJlYW0KZW5kb2JqCjI0IDAgb2JqCjw8IC9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9MZW5ndGggMjU4ID4+CnN0cmVhbQp4nEWRS3IEIAhE956CI4D85DyTSmUxuf82Dc5kNnaXqP2ESiOmEiznFHkwfcnyzWS26Xc5VjsbBRRFKJjJVeixAqs7U8SZa4lq62Nl5LjTOwbFG85dOalkcaOMdVR1KnBMz5X1Ud35dlmUfUcOZQrYrHMcbODKbcMYJ0abre4O94kgTydTR8XtINnwByeNfZWrK3CdbPbRSzAOBP1CE5jki0DrDIHGzVP05BLs4+N254Fgb3kRSNkQyJEhGB2Cdp1c/+LW+b3/cYY7z7UZrhzv4neY1nbHX2KSFXMBi9wpqOdrLlrXGTrekzPH5Kb7hs65YJe7g0zv+T/Wz/r+Ax4pZvoKZW5kc3RyZWFtCmVuZG9iagoyNSAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDE2MyA+PgpzdHJlYW0KeJxFkDsSAyEMQ3tOoSP4IwM+z2YyKTb3b2PYbFLA01ggg7sTgtTagonogoe2Jd0F760EZ2P86TZuNRLkBHWAVqTjaJRSfbnFaZV08Wg2cysLrRMdZg56lKMZoBA6Fd7touRypu7O+UNw9V/1v2LdOZuJgcnKHQjN6lPc+TY7orq6yf6kx9ys134r7FVhaVlLywm3nbtmQAncUznaqz0/Hwo69gplbmRzdHJlYW0KZW5kb2JqCjI2IDAgb2JqCjw8IC9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9MZW5ndGggMzM0ID4+CnN0cmVhbQp4nC1SS3LFIAzbcwpdoDP4B+Q86XS6eL3/tpKTRUYOYPQx5YaJSnxZILej1sS3jcxAheGvq8yFz0jbyDqIy5
CLuJIthXtELOQxxDzEgu+r8R4e+azMybMHxi/Zdw8r9tSEZSHjxRnaYRXHYRXkWLB1Iap7eFOkw6kk2OOL/z7Fcy0ELXxG0IBf5J+vjuD5khZp95ht0656sEw7qqSwHGxPc14mX1pnuToezwfJ9q7YEVK7AhSFuTPOc+Eo01ZGtBZ2NkhqXGxvjv1YStCFblxGiiOQn6kiPKCkycwmCuKPnB5yKgNh6pqudHIbVXGnnsw1m4u3M0lm675IsZnCeV04s/4MU2a1eSfPcqLUqQjvsWdL0NA5rp69lllodJsTvKSEz8ZOT06+VzPrITkVCaliWlfBaRSZYgnbEl9TUVOaehn++/Lu8Tt+/gEsc3xzCmVuZHN0cmVhbQplbmRvYmoKMjcgMCBvYmoKPDwgL0ZpbHRlciAvRmxhdGVEZWNvZGUgL0xlbmd0aCAxOCA+PgpzdHJlYW0KeJwzNrRQMIDDFEOuNAAd5gNSCmVuZHN0cmVhbQplbmRvYmoKMTYgMCBvYmoKPDwgL0Jhc2VGb250IC9EZWphVnVTYW5zIC9DaGFyUHJvY3MgMTcgMCBSCi9FbmNvZGluZyA8PAovRGlmZmVyZW5jZXMgWyAzMiAvc3BhY2UgNjcgL0MgOTcgL2EgMTAxIC9lIDEwNCAvaCAxMDcgL2sgL2wgL20gL24gMTE1IC9zIF0KL1R5cGUgL0VuY29kaW5nID4+Ci9GaXJzdENoYXIgMCAvRm9udEJCb3ggWyAtMTAyMSAtNDYzIDE3OTQgMTIzMyBdIC9Gb250RGVzY3JpcHRvciAxNSAwIFIKL0ZvbnRNYXRyaXggWyAwLjAwMSAwIDAgMC4wMDEgMCAwIF0gL0xhc3RDaGFyIDI1NSAvTmFtZSAvRGVqYVZ1U2FucwovU3VidHlwZSAvVHlwZTMgL1R5cGUgL0ZvbnQgL1dpZHRocyAxNCAwIFIgPj4KZW5kb2JqCjE1IDAgb2JqCjw8IC9Bc2NlbnQgOTI5IC9DYXBIZWlnaHQgMCAvRGVzY2VudCAtMjM2IC9GbGFncyAzMgovRm9udEJCb3ggWyAtMTAyMSAtNDYzIDE3OTQgMTIzMyBdIC9Gb250TmFtZSAvRGVqYVZ1U2FucyAvSXRhbGljQW5nbGUgMAovTWF4V2lkdGggMTM0MiAvU3RlbVYgMCAvVHlwZSAvRm9udERlc2NyaXB0b3IgL1hIZWlnaHQgMCA+PgplbmRvYmoKMTQgMCBvYmoKWyA2MDAgNjAwIDYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwIDYwMAo2MDAgNjAwIDYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwIDMxOCA0MDEgNDYwIDgzOCA2MzYKOTUwIDc4MCAyNzUgMzkwIDM5MCA1MDAgODM4IDMxOCAzNjEgMzE4IDMzNyA2MzYgNjM2IDYzNiA2MzYgNjM2IDYzNiA2MzYgNjM2CjYzNiA2MzYgMzM3IDMzNyA4MzggODM4IDgzOCA1MzEgMTAwMCA2ODQgNjg2IDY5OCA3NzAgNjMyIDU3NSA3NzUgNzUyIDI5NQoyOTUgNjU2IDU1NyA4NjMgNzQ4IDc4NyA2MDMgNzg3IDY5NSA2MzUgNjExIDczMiA2ODQgOTg5IDY4NSA2MTEgNjg1IDM5MCAzMzcKMzkwIDgzOCA1MDAgNTAwIDYxMyA2MzUgNTUwIDYzNSA2MTUgMzUyIDYzNSA2MzQgMjc4IDI3OCA1NzkgMjc4IDk3NCA2MzQgNjEyCjYzNSA2MzUgNDExIDUyMSAzOTIgNjM0IDU5MiA4MTggNTkyIDU5MiA1MjUgNjM2IDMzNyA2MzYgODM4IDYwMCA2MzYgNjAwIDMxOAozNTIgNTE4IDEwMDAgNTAwIDUwMCA1MDAgMTM0MiA2Mz
UgNDAwIDEwNzAgNjAwIDY4NSA2MDAgNjAwIDMxOCAzMTggNTE4IDUxOAo1OTAgNTAwIDEwMDAgNTAwIDEwMDAgNTIxIDQwMCAxMDIzIDYwMCA1MjUgNjExIDMxOCA0MDEgNjM2IDYzNiA2MzYgNjM2IDMzNwo1MDAgNTAwIDEwMDAgNDcxIDYxMiA4MzggMzYxIDEwMDAgNTAwIDUwMCA4MzggNDAxIDQwMSA1MDAgNjM2IDYzNiAzMTggNTAwCjQwMSA0NzEgNjEyIDk2OSA5NjkgOTY5IDUzMSA2ODQgNjg0IDY4NCA2ODQgNjg0IDY4NCA5NzQgNjk4IDYzMiA2MzIgNjMyIDYzMgoyOTUgMjk1IDI5NSAyOTUgNzc1IDc0OCA3ODcgNzg3IDc4NyA3ODcgNzg3IDgzOCA3ODcgNzMyIDczMiA3MzIgNzMyIDYxMSA2MDUKNjMwIDYxMyA2MTMgNjEzIDYxMyA2MTMgNjEzIDk4MiA1NTAgNjE1IDYxNSA2MTUgNjE1IDI3OCAyNzggMjc4IDI3OCA2MTIgNjM0CjYxMiA2MTIgNjEyIDYxMiA2MTIgODM4IDYxMiA2MzQgNjM0IDYzNCA2MzQgNTkyIDYzNSA1OTIgXQplbmRvYmoKMTcgMCBvYmoKPDwgL0MgMTggMCBSIC9hIDE5IDAgUiAvZSAyMCAwIFIgL2ggMjEgMCBSIC9rIDIyIDAgUiAvbCAyMyAwIFIgL20gMjQgMCBSCi9uIDI1IDAgUiAvcyAyNiAwIFIgL3NwYWNlIDI3IDAgUiA+PgplbmRvYmoKMyAwIG9iago8PCAvRjEgMTYgMCBSID4+CmVuZG9iago0IDAgb2JqCjw8IC9BMSA8PCAvQ0EgMCAvVHlwZSAvRXh0R1N0YXRlIC9jYSAxID4+Ci9BMiA8PCAvQ0EgMSAvVHlwZSAvRXh0R1N0YXRlIC9jYSAxID4+ID4+CmVuZG9iago1IDAgb2JqCjw8ID4+CmVuZG9iago2IDAgb2JqCjw8ID4+CmVuZG9iago3IDAgb2JqCjw8IC9JMSAxMyAwIFIgPj4KZW5kb2JqCjEzIDAgb2JqCjw8IC9CaXRzUGVyQ29tcG9uZW50IDggL0NvbG9yU3BhY2UgWy9JbmRleGVkIC9EZXZpY2VSR0IgMiAo////f39/AAAAKV0KL0RlY29kZVBhcm1zIDw8IC9Db2xvcnMgMSAvQ29sdW1ucyAxNTAgL1ByZWRpY3RvciAxMCA+PgovRmlsdGVyIC9GbGF0ZURlY29kZSAvSGVpZ2h0IDgyIC9MZW5ndGggMjggMCBSIC9TdWJ0eXBlIC9JbWFnZQovVHlwZSAvWE9iamVjdCAvV2lkdGggMTUwID4+CnN0cmVhbQp4nO3OsQ2AQBDAsIf9h6YGIaF8wxXOAJHXMbL1N+A9rBJWCauEVcIqYZUerLXV/XFuhYWFhYWFhYWFhYWFhYWFhYWFhYWFhYWFhYWFhYWFhfXNmhJWCauEVcIqYZWwSkNZF1/rMA0KZW5kc3RyZWFtCmVuZG9iagoyOCAwIG9iagoxMDIKZW5kb2JqCjIgMCBvYmoKPDwgL0NvdW50IDEgL0tpZHMgWyAxMSAwIFIgXSAvVHlwZSAvUGFnZXMgPj4KZW5kb2JqCjI5IDAgb2JqCjw8IC9DcmVhdGlvbkRhdGUgKEQ6MjAyMTA5MTYxNDQxNTcrMDInMDAnKQovQ3JlYXRvciAoTWF0cGxvdGxpYiB2My40LjMsIGh0dHBzOi8vbWF0cGxvdGxpYi5vcmcpCi9Qcm9kdWNlciAoTWF0cGxvdGxpYiBwZGYgYmFja2VuZCB2My40LjMpID4+CmVuZG9iagp4cmVmCjAgMzAKMDAwMDAwMDAwMCA2NTUzNSBmIAowMDAwMDAwMDE2IDAwMDAwIG4gCjAwMDAwMDU2MDggMDAwMDAgbiAKMDAwMDAwNTAyOCAwMDAwMCBuIAowMD
AwMDA1MDYwIDAwMDAwIG4gCjAwMDAwMDUxNTkgMDAwMDAgbiAKMDAwMDAwNTE4MCAwMDAwMCBuIAowMDAwMDA1MjAxIDAwMDAwIG4gCjAwMDAwMDAwNjUgMDAwMDAgbiAKMDAwMDAwMDM5NSAwMDAwMCBuIAowMDAwMDAwNjkyIDAwMDAwIG4gCjAwMDAwMDAyMDggMDAwMDAgbiAKMDAwMDAwMDY3MiAwMDAwMCBuIAowMDAwMDA1MjMzIDAwMDAwIG4gCjAwMDAwMDM4NDkgMDAwMDAgbiAKMDAwMDAwMzY0OSAwMDAwMCBuIAowMDAwMDAzMjk3IDAwMDAwIG4gCjAwMDAwMDQ5MDIgMDAwMDAgbiAKMDAwMDAwMDcxMiAwMDAwMCBuIAowMDAwMDAxMDIwIDAwMDAwIG4gCjAwMDAwMDE0MDAgMDAwMDAgbiAKMDAwMDAwMTcyMiAwMDAwMCBuIAowMDAwMDAxOTU5IDAwMDAwIG4gCjAwMDAwMDIxMTQgMDAwMDAgbiAKMDAwMDAwMjIzMyAwMDAwMCBuIAowMDAwMDAyNTY0IDAwMDAwIG4gCjAwMDAwMDI4MDAgMDAwMDAgbiAKMDAwMDAwMzIwNyAwMDAwMCBuIAowMDAwMDA1NTg4IDAwMDAwIG4gCjAwMDAwMDU2NjggMDAwMDAgbiAKdHJhaWxlcgo8PCAvSW5mbyAyOSAwIFIgL1Jvb3QgMSAwIFIgL1NpemUgMzAgPj4Kc3RhcnR4cmVmCjU4MjUKJSVFT0YK\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:41:57.958494\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}], "source": ["checkerboard_mask = create_checkerboard_mask(h=8, w=8).expand(-1, 2, -1, -1)\n", "channel_mask = create_channel_mask(c_in=2).expand(-1, -1, 8, 8)\n", "\n", "show_imgs(checkerboard_mask.transpose(0, 1), \"Checkerboard mask\")\n", "show_imgs(channel_mask.transpose(0, 1), \"Channel mask\")"]}, {"cell_type": "markdown", "id": "b52dfa44", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.042944, "end_time": "2021-09-16T12:41:58.075778", "exception": false, "start_time": "2021-09-16T12:41:58.032834", "status": "completed"}, "tags": []}, "source": ["As a last aspect of coupling layers, we need to decide on the deep neural network we want to apply in the coupling layers.\n", "The input to the layers is an image, and hence we stick with a CNN.\n", "Because the input to a transformation depends on all transformations before,\n", "it is crucial to ensure a good gradient flow through the CNN back to the input,\n", "which can be optimally achieved by a ResNet-like architecture.\n", "Specifically, we use a Gated ResNet that adds a $\\sigma$-gate to the skip connection,\n", "similar to the input gate in LSTMs.\n", "The details are not necessarily important here, and the network is\n", "strongly inspired by Flow++ [3] in case you are interested in building\n", "even stronger models."]}, {"cell_type": "code", "execution_count": 16, "id": "310d88c0", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:41:58.171587Z", "iopub.status.busy": "2021-09-16T12:41:58.169353Z", "iopub.status.idle": "2021-09-16T12:41:58.173708Z", "shell.execute_reply": "2021-09-16T12:41:58.173294Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 0.055251, "end_time": "2021-09-16T12:41:58.173850", "exception": false, "start_time": "2021-09-16T12:41:58.118599", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class ConcatELU(nn.Module):\n", " \"\"\"Activation function 
that applies ELU in both direction (inverted and plain).\n", "\n", " Allows non-linearity while providing strong gradients for any input (important for final convolution)\n", " \"\"\"\n", "\n", " def forward(self, x):\n", " return torch.cat([F.elu(x), F.elu(-x)], dim=1)\n", "\n", "\n", "class LayerNormChannels(nn.Module):\n", " def __init__(self, c_in):\n", " \"\"\"This module applies layer norm across channels in an image.\n", "\n", " Has been shown to work well with ResNet connections.\n", " Args:\n", " c_in: Number of channels of the input\n", " \"\"\"\n", " super().__init__()\n", " self.layer_norm = nn.LayerNorm(c_in)\n", "\n", " def forward(self, x):\n", " x = x.permute(0, 2, 3, 1)\n", " x = self.layer_norm(x)\n", " x = x.permute(0, 3, 1, 2)\n", " return x\n", "\n", "\n", "class GatedConv(nn.Module):\n", " def __init__(self, c_in, c_hidden):\n", " \"\"\"\n", " This module applies a two-layer convolutional ResNet block with input gate\n", " Args:\n", " c_in: Number of channels of the input\n", " c_hidden: Number of hidden dimensions we want to model (usually similar to c_in)\n", " \"\"\"\n", " super().__init__()\n", " self.net = nn.Sequential(\n", " nn.Conv2d(c_in, c_hidden, kernel_size=3, padding=1),\n", " ConcatELU(),\n", " nn.Conv2d(2 * c_hidden, 2 * c_in, kernel_size=1),\n", " )\n", "\n", " def forward(self, x):\n", " out = self.net(x)\n", " val, gate = out.chunk(2, dim=1)\n", " return x + val * torch.sigmoid(gate)\n", "\n", "\n", "class GatedConvNet(nn.Module):\n", " def __init__(self, c_in, c_hidden=32, c_out=-1, num_layers=3):\n", " \"\"\"Module that summarizes the previous blocks to a full convolutional neural network.\n", "\n", " Args:\n", " c_in: Number of input channels\n", " c_hidden: Number of hidden dimensions to use within the network\n", " c_out: Number of output channels. 
If -1, 2 times the input channels are used (affine coupling)\n", " num_layers: Number of gated ResNet blocks to apply\n", " \"\"\"\n", " super().__init__()\n", " c_out = c_out if c_out > 0 else 2 * c_in\n", " layers = []\n", " layers += [nn.Conv2d(c_in, c_hidden, kernel_size=3, padding=1)]\n", " for layer_index in range(num_layers):\n", " layers += [GatedConv(c_hidden, c_hidden), LayerNormChannels(c_hidden)]\n", " layers += [ConcatELU(), nn.Conv2d(2 * c_hidden, c_out, kernel_size=3, padding=1)]\n", " self.nn = nn.Sequential(*layers)\n", "\n", " self.nn[-1].weight.data.zero_()\n", " self.nn[-1].bias.data.zero_()\n", "\n", " def forward(self, x):\n", " return self.nn(x)"]}, {"cell_type": "markdown", "id": "8dd3b2c4", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.042657, "end_time": "2021-09-16T12:41:58.260796", "exception": false, "start_time": "2021-09-16T12:41:58.218139", "status": "completed"}, "tags": []}, "source": ["### Training loop\n", "\n", "Finally, we can add Dequantization, Variational Dequantization and Coupling Layers together to build our full normalizing flow on MNIST images.\n", "We apply 8 coupling layers in the main flow, and 4 for variational dequantization if applied.\n", "We apply a checkerboard mask throughout the network as with a single channel (black-white images),\n", "we cannot apply channel mask.\n", "The overall architecture is visualized below.\n", "\n", "\n", "
"]}, {"cell_type": "code", "execution_count": 17, "id": "27d5089b", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:41:58.351932Z", "iopub.status.busy": "2021-09-16T12:41:58.351458Z", "iopub.status.idle": "2021-09-16T12:41:58.353625Z", "shell.execute_reply": "2021-09-16T12:41:58.353155Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 0.050041, "end_time": "2021-09-16T12:41:58.353742", "exception": false, "start_time": "2021-09-16T12:41:58.303701", "status": "completed"}, "tags": []}, "outputs": [], "source": ["def create_simple_flow(use_vardeq=True):\n", " flow_layers = []\n", " if use_vardeq:\n", " vardeq_layers = [\n", " CouplingLayer(\n", " network=GatedConvNet(c_in=2, c_out=2, c_hidden=16),\n", " mask=create_checkerboard_mask(h=28, w=28, invert=(i % 2 == 1)),\n", " c_in=1,\n", " )\n", " for i in range(4)\n", " ]\n", " flow_layers += [VariationalDequantization(var_flows=vardeq_layers)]\n", " else:\n", " flow_layers += [Dequantization()]\n", "\n", " for i in range(8):\n", " flow_layers += [\n", " CouplingLayer(\n", " network=GatedConvNet(c_in=1, c_hidden=32),\n", " mask=create_checkerboard_mask(h=28, w=28, invert=(i % 2 == 1)),\n", " c_in=1,\n", " )\n", " ]\n", "\n", " flow_model = ImageFlow(flow_layers).to(device)\n", " return flow_model"]}, {"cell_type": "markdown", "id": "5b491b9b", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.042728, "end_time": "2021-09-16T12:41:58.439262", "exception": false, "start_time": "2021-09-16T12:41:58.396534", "status": "completed"}, "tags": []}, "source": ["For implementing the training loop, we use the framework of PyTorch Lightning and reduce the code overhead.\n", "If interested, you can take a look at the generated tensorboard file,\n", "in particularly the graph to see an overview of flow transformations that are applied.\n", "Note that we again provide pre-trained models (see later on in the notebook)\n", "as normalizing flows are particularly expensive to train.\n", "We have also 
run validation and testing as this can take some time as well with the added importance sampling."]}, {"cell_type": "code", "execution_count": 18, "id": "0447d535", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:41:58.532547Z", "iopub.status.busy": "2021-09-16T12:41:58.532063Z", "iopub.status.idle": "2021-09-16T12:41:58.534199Z", "shell.execute_reply": "2021-09-16T12:41:58.533718Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 0.052256, "end_time": "2021-09-16T12:41:58.534297", "exception": false, "start_time": "2021-09-16T12:41:58.482041", "status": "completed"}, "tags": []}, "outputs": [], "source": ["def train_flow(flow, model_name=\"MNISTFlow\"):\n", " # Create a PyTorch Lightning trainer\n", " trainer = pl.Trainer(\n", " default_root_dir=os.path.join(CHECKPOINT_PATH, model_name),\n", " gpus=1 if torch.cuda.is_available() else 0,\n", " max_epochs=200,\n", " gradient_clip_val=1.0,\n", " callbacks=[\n", " ModelCheckpoint(save_weights_only=True, mode=\"min\", monitor=\"val_bpd\"),\n", " LearningRateMonitor(\"epoch\"),\n", " ],\n", " )\n", " trainer.logger._log_graph = True\n", " trainer.logger._default_hp_metric = None # Optional logging argument that we don't need\n", "\n", " train_data_loader = data.DataLoader(\n", " train_set, batch_size=128, shuffle=True, drop_last=True, pin_memory=True, num_workers=8\n", " )\n", " result = None\n", "\n", " # Check whether pretrained model exists. 
If yes, load it and skip training\n", " pretrained_filename = os.path.join(CHECKPOINT_PATH, model_name + \".ckpt\")\n", " if os.path.isfile(pretrained_filename):\n", " print(\"Found pretrained model, loading...\")\n", " ckpt = torch.load(pretrained_filename, map_location=device)\n", " flow.load_state_dict(ckpt[\"state_dict\"])\n", " result = ckpt.get(\"result\", None)\n", " else:\n", " print(\"Start training\", model_name)\n", " trainer.fit(flow, train_data_loader, val_loader)\n", "\n", " # Test best model on validation and test set if no result has been found\n", " # Testing can be expensive due to the importance sampling.\n", " if result is None:\n", " val_result = trainer.test(flow, test_dataloaders=val_loader, verbose=False)\n", " start_time = time.time()\n", " test_result = trainer.test(flow, test_dataloaders=test_loader, verbose=False)\n", " duration = time.time() - start_time\n", " result = {\"test\": test_result, \"val\": val_result, \"time\": duration / len(test_loader) / flow.import_samples}\n", "\n", " return flow, result"]}, {"cell_type": "markdown", "id": "27f6d057", "metadata": {"papermill": {"duration": 0.050519, "end_time": "2021-09-16T12:41:58.627997", "exception": false, "start_time": "2021-09-16T12:41:58.577478", "status": "completed"}, "tags": []}, "source": ["## Multi-scale architecture\n", "\n", "
\n", "\n", "One disadvantage of normalizing flows is that they operate on the exact same dimensions as the input.\n", "If the input is high-dimensional, so is the latent space, which requires larger computational cost to learn suitable transformations.\n", "However, particularly in the image domain, many pixels contain less information in the sense\n", "that we could remove them without losing the semantic information of the image.\n", "\n", "Based on this intuition, deep normalizing flows on images commonly apply a multi-scale architecture [1].\n", "After the first $N$ flow transformations, we split off half of the latent dimensions and directly evaluate them on the prior.\n", "The other half is run through $N$ more flow transformations, and depending on the size of the input,\n", "we split it again in half or stop overall at this position.\n", "The two operations involved in this setup are `Squeeze` and `Split` which\n", "we will review more closely and implement below."]}, {"cell_type": "markdown", "id": "207a4bd1", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.043555, "end_time": "2021-09-16T12:41:58.714567", "exception": false, "start_time": "2021-09-16T12:41:58.671012", "status": "completed"}, "tags": []}, "source": ["### Squeeze and Split\n", "\n", "When we want to remove half of the pixels in an image, we have the problem of deciding which variables to cut,\n", "and how to rearrange the image.\n", "Thus, the squeezing operation is commonly used before split, which divides the image into subsquares\n", "of shape $2\\times 2\\times C$, and reshapes them into $1\\times 1\\times 4C$ blocks.\n", "Effectively, we reduce the height and width of the image by a factor of 2 while scaling the number of channels by 4.\n", "Afterwards, we can perform the split operation over channels without the need of rearranging the pixels.\n", "The smaller scale also makes the overall architecture more efficient.\n", "Visually, the squeeze operation should 
transform the input as follows:\n", "\n", "
\n", "\n", "The input of $4\\times 4\\times 1$ is scaled to $2\\times 2\\times 4$ following\n", "the idea of grouping the pixels in $2\\times 2\\times 1$ subsquares.\n", "Next, let's try to implement this layer:"]}, {"cell_type": "code", "execution_count": 19, "id": "3435b3ac", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:41:58.805945Z", "iopub.status.busy": "2021-09-16T12:41:58.805454Z", "iopub.status.idle": "2021-09-16T12:41:58.807515Z", "shell.execute_reply": "2021-09-16T12:41:58.807040Z"}, "papermill": {"duration": 0.050124, "end_time": "2021-09-16T12:41:58.807614", "exception": false, "start_time": "2021-09-16T12:41:58.757490", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class SqueezeFlow(nn.Module):\n", " def forward(self, z, ldj, reverse=False):\n", " B, C, H, W = z.shape\n", " if not reverse:\n", " # Forward direction: H x W x C => H/2 x W/2 x 4C\n", " z = z.reshape(B, C, H // 2, 2, W // 2, 2)\n", " z = z.permute(0, 1, 3, 5, 2, 4)\n", " z = z.reshape(B, 4 * C, H // 2, W // 2)\n", " else:\n", " # Reverse direction: H/2 x W/2 x 4C => H x W x C\n", " z = z.reshape(B, C // 4, 2, 2, H, W)\n", " z = z.permute(0, 1, 4, 2, 5, 3)\n", " z = z.reshape(B, C // 4, H * 2, W * 2)\n", " return z, ldj"]}, {"cell_type": "markdown", "id": "99659504", "metadata": {"papermill": {"duration": 0.04349, "end_time": "2021-09-16T12:41:58.894090", "exception": false, "start_time": "2021-09-16T12:41:58.850600", "status": "completed"}, "tags": []}, "source": ["Before moving on, we can verify our implementation by comparing our output with the example figure above:"]}, {"cell_type": "code", "execution_count": 20, "id": "f0ffca0f", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:41:58.984627Z", "iopub.status.busy": "2021-09-16T12:41:58.984154Z", "iopub.status.idle": "2021-09-16T12:41:58.988910Z", "shell.execute_reply": "2021-09-16T12:41:58.988509Z"}, "papermill": {"duration": 0.051435, "end_time": "2021-09-16T12:41:58.989009", 
"exception": false, "start_time": "2021-09-16T12:41:58.937574", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Image (before)\n", " tensor([[[[ 1, 2, 3, 4],\n", " [ 5, 6, 7, 8],\n", " [ 9, 10, 11, 12],\n", " [13, 14, 15, 16]]]])\n", "\n", "Image (forward)\n", " tensor([[[[ 1, 2, 5, 6],\n", " [ 3, 4, 7, 8]],\n", "\n", " [[ 9, 10, 13, 14],\n", " [11, 12, 15, 16]]]])\n", "\n", "Image (reverse)\n", " tensor([[[[ 1, 2, 3, 4],\n", " [ 5, 6, 7, 8],\n", " [ 9, 10, 11, 12],\n", " [13, 14, 15, 16]]]])\n"]}], "source": ["sq_flow = SqueezeFlow()\n", "rand_img = torch.arange(1, 17).view(1, 1, 4, 4)\n", "print(\"Image (before)\\n\", rand_img)\n", "forward_img, _ = sq_flow(rand_img, ldj=None, reverse=False)\n", "print(\"\\nImage (forward)\\n\", forward_img.permute(0, 2, 3, 1)) # Permute for readability\n", "reconst_img, _ = sq_flow(forward_img, ldj=None, reverse=True)\n", "print(\"\\nImage (reverse)\\n\", reconst_img)"]}, {"cell_type": "markdown", "id": "912fb9c0", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.04387, "end_time": "2021-09-16T12:41:59.077196", "exception": false, "start_time": "2021-09-16T12:41:59.033326", "status": "completed"}, "tags": []}, "source": ["The split operation divides the input into two parts, and evaluates one part directly on the prior.\n", "So that our flow operation fits to the implementation of the previous layers,\n", "we will return the prior probability of the first part as the log determinant jacobian of the layer.\n", "It has the same effect as if we would combine all variable splits at the\n", "end of the flow, and evaluate them together on the prior."]}, {"cell_type": "code", "execution_count": 21, "id": "420c7e21", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:41:59.170054Z", "iopub.status.busy": "2021-09-16T12:41:59.169563Z", "iopub.status.idle": "2021-09-16T12:41:59.171697Z", "shell.execute_reply": "2021-09-16T12:41:59.171229Z"}, 
"lines_to_next_cell": 2, "papermill": {"duration": 0.05122, "end_time": "2021-09-16T12:41:59.171798", "exception": false, "start_time": "2021-09-16T12:41:59.120578", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class SplitFlow(nn.Module):\n", " def __init__(self):\n", " super().__init__()\n", " self.prior = torch.distributions.normal.Normal(loc=0.0, scale=1.0)\n", "\n", " def forward(self, z, ldj, reverse=False):\n", " if not reverse:\n", " z, z_split = z.chunk(2, dim=1)\n", " ldj += self.prior.log_prob(z_split).sum(dim=[1, 2, 3])\n", " else:\n", " z_split = self.prior.sample(sample_shape=z.shape).to(device)\n", " z = torch.cat([z, z_split], dim=1)\n", " ldj -= self.prior.log_prob(z_split).sum(dim=[1, 2, 3])\n", " return z, ldj"]}, {"cell_type": "markdown", "id": "5d191c06", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.043739, "end_time": "2021-09-16T12:41:59.259120", "exception": false, "start_time": "2021-09-16T12:41:59.215381", "status": "completed"}, "tags": []}, "source": ["### Building a multi-scale flow\n", "\n", "After defining the squeeze and split operation, we are finally able to build our own multi-scale flow.\n", "Deep normalizing flows such as Glow and Flow++ [2,3] often apply a split operation directly after squeezing.\n", "However, with shallow flows, we need to be more thoughtful about where to place the split operation as we need at least a minimum amount of transformations on each variable.\n", "Our setup is inspired by the original RealNVP architecture [1] which is shallower than other,\n", "more recent state-of-the-art architectures.\n", "\n", "Hence, for the MNIST dataset, we will apply the first squeeze operation after two coupling layers, but don't apply a split operation yet.\n", "Because we have only used two coupling layers and each the variable has been only transformed once, a split operation would be too early.\n", "We apply two more coupling layers before finally applying a split flow and 
squeeze again.\n", "The last four coupling layers operate on a scale of $7\\times 7\\times 8$.\n", "The full flow architecture is shown below.\n", "\n", "
\n", "\n", "Note that while the feature maps inside the coupling layers reduce with the height and width of the input,\n", "the increased number of channels is not directly considered.\n", "To counteract this, we increase the hidden dimensions for the coupling layers on the squeezed input.\n", "The dimensions are often scaled by 2 as this approximately increases the computation cost by 4 canceling with the squeezing operation.\n", "However, we will choose the hidden dimensionalities $32, 48, 64$ for the\n", "three scales respectively to keep the number of parameters reasonable\n", "and show the efficiency of multi-scale architectures."]}, {"cell_type": "code", "execution_count": 22, "id": "f1aa3acb", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:41:59.353192Z", "iopub.status.busy": "2021-09-16T12:41:59.352715Z", "iopub.status.idle": "2021-09-16T12:41:59.354799Z", "shell.execute_reply": "2021-09-16T12:41:59.354387Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 0.052212, "end_time": "2021-09-16T12:41:59.354899", "exception": false, "start_time": "2021-09-16T12:41:59.302687", "status": "completed"}, "tags": []}, "outputs": [], "source": ["def create_multiscale_flow():\n", " flow_layers = []\n", "\n", " vardeq_layers = [\n", " CouplingLayer(\n", " network=GatedConvNet(c_in=2, c_out=2, c_hidden=16),\n", " mask=create_checkerboard_mask(h=28, w=28, invert=(i % 2 == 1)),\n", " c_in=1,\n", " )\n", " for i in range(4)\n", " ]\n", " flow_layers += [VariationalDequantization(vardeq_layers)]\n", "\n", " flow_layers += [\n", " CouplingLayer(\n", " network=GatedConvNet(c_in=1, c_hidden=32),\n", " mask=create_checkerboard_mask(h=28, w=28, invert=(i % 2 == 1)),\n", " c_in=1,\n", " )\n", " for i in range(2)\n", " ]\n", " flow_layers += [SqueezeFlow()]\n", " for i in range(2):\n", " flow_layers += [\n", " CouplingLayer(\n", " network=GatedConvNet(c_in=4, c_hidden=48), mask=create_channel_mask(c_in=4, invert=(i % 2 == 1)), c_in=4\n", " )\n", " ]\n", " 
flow_layers += [SplitFlow(), SqueezeFlow()]\n", " for i in range(4):\n", " flow_layers += [\n", " CouplingLayer(\n", " network=GatedConvNet(c_in=8, c_hidden=64), mask=create_channel_mask(c_in=8, invert=(i % 2 == 1)), c_in=8\n", " )\n", " ]\n", "\n", " flow_model = ImageFlow(flow_layers).to(device)\n", " return flow_model"]}, {"cell_type": "markdown", "id": "ca021fca", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.043766, "end_time": "2021-09-16T12:41:59.442691", "exception": false, "start_time": "2021-09-16T12:41:59.398925", "status": "completed"}, "tags": []}, "source": ["We can show the difference in number of parameters below:"]}, {"cell_type": "code", "execution_count": 23, "id": "c13d7d7c", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:41:59.534720Z", "iopub.status.busy": "2021-09-16T12:41:59.534247Z", "iopub.status.idle": "2021-09-16T12:42:02.273185Z", "shell.execute_reply": "2021-09-16T12:42:02.272760Z"}, "papermill": {"duration": 2.786959, "end_time": "2021-09-16T12:42:02.273302", "exception": false, "start_time": "2021-09-16T12:41:59.486343", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Number of parameters: 335,128\n", "Number of parameters: 379,556\n", "Number of parameters: 1,062,090\n"]}], "source": ["def print_num_params(model):\n", " num_params = sum(np.prod(p.shape) for p in model.parameters())\n", " print(f\"Number of parameters: {num_params:,}\")\n", "\n", "\n", "print_num_params(create_simple_flow(use_vardeq=False))\n", "print_num_params(create_simple_flow(use_vardeq=True))\n", "print_num_params(create_multiscale_flow())"]}, {"cell_type": "markdown", "id": "949772c8", "metadata": {"papermill": {"duration": 0.04404, "end_time": "2021-09-16T12:42:02.361991", "exception": false, "start_time": "2021-09-16T12:42:02.317951", "status": "completed"}, "tags": []}, "source": ["Although the multi-scale flow has almost 3 times the parameters of the single scale 
flow,\n", "it is not necessarily more computationally expensive than its counterpart.\n", "We will compare the runtime in the following experiments as well."]}, {"cell_type": "markdown", "id": "a40ce763", "metadata": {"papermill": {"duration": 0.043937, "end_time": "2021-09-16T12:42:02.450029", "exception": false, "start_time": "2021-09-16T12:42:02.406092", "status": "completed"}, "tags": []}, "source": ["## Analysing the flows\n", "\n", "In the last part of the notebook, we will train all the models we have implemented above,\n", "and try to analyze the effect of the multi-scale architecture and variational dequantization.\n", "\n", "### Training flow variants\n", "\n", "Before we can analyse the flow models, we need to train them first.\n", "We provide pre-trained models that contain the validation and test performance, and run-time information.\n", "As flow models are computationally expensive, we advise you to rely on\n", "those pretrained models for a first run through the notebook."]}, {"cell_type": "code", "execution_count": 24, "id": "8b210a38", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:42:02.543059Z", "iopub.status.busy": "2021-09-16T12:42:02.542580Z", "iopub.status.idle": "2021-09-16T12:42:02.794090Z", "shell.execute_reply": "2021-09-16T12:42:02.793670Z"}, "papermill": {"duration": 0.300432, "end_time": "2021-09-16T12:42:02.794206", "exception": false, "start_time": "2021-09-16T12:42:02.493774", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["GPU available: True, used: True\n"]}, {"name": "stderr", "output_type": "stream", "text": ["TPU available: False, using: 0 TPU cores\n"]}, {"name": "stderr", "output_type": "stream", "text": ["IPU available: False, using: 0 IPUs\n"]}, {"name": "stderr", "output_type": "stream", "text": ["GPU available: True, used: True\n"]}, {"name": "stderr", "output_type": "stream", "text": ["TPU available: False, using: 0 TPU cores\n"]}, {"name": 
"stderr", "output_type": "stream", "text": ["IPU available: False, using: 0 IPUs\n"]}, {"name": "stderr", "output_type": "stream", "text": ["GPU available: True, used: True\n"]}, {"name": "stderr", "output_type": "stream", "text": ["TPU available: False, using: 0 TPU cores\n"]}, {"name": "stderr", "output_type": "stream", "text": ["IPU available: False, using: 0 IPUs\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Found pretrained model, loading...\n", "Found pretrained model, loading...\n", "Found pretrained model, loading...\n"]}], "source": ["flow_dict = {\"simple\": {}, \"vardeq\": {}, \"multiscale\": {}}\n", "flow_dict[\"simple\"][\"model\"], flow_dict[\"simple\"][\"result\"] = train_flow(\n", " create_simple_flow(use_vardeq=False), model_name=\"MNISTFlow_simple\"\n", ")\n", "flow_dict[\"vardeq\"][\"model\"], flow_dict[\"vardeq\"][\"result\"] = train_flow(\n", " create_simple_flow(use_vardeq=True), model_name=\"MNISTFlow_vardeq\"\n", ")\n", "flow_dict[\"multiscale\"][\"model\"], flow_dict[\"multiscale\"][\"result\"] = train_flow(\n", " create_multiscale_flow(), model_name=\"MNISTFlow_multiscale\"\n", ")"]}, {"cell_type": "markdown", "id": "0f554c5e", "metadata": {"papermill": {"duration": 0.046682, "end_time": "2021-09-16T12:42:02.888035", "exception": false, "start_time": "2021-09-16T12:42:02.841353", "status": "completed"}, "tags": []}, "source": ["### Density modeling and sampling\n", "\n", "Firstly, we can compare the models on their quantitative results.\n", "The following table shows all important statistics.\n", "The inference time specifies the time needed to determine the\n", "probability for a batch of 64 images for each model, and the sampling\n", "time the duration it took to sample a batch of 64 images."]}, {"cell_type": "code", "execution_count": 25, "id": "1a7fa75f", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:42:02.984361Z", "iopub.status.busy": "2021-09-16T12:42:02.983766Z", "iopub.status.idle": 
"2021-09-16T12:42:02.986662Z", "shell.execute_reply": "2021-09-16T12:42:02.987047Z"}, "papermill": {"duration": 0.052662, "end_time": "2021-09-16T12:42:02.987161", "exception": false, "start_time": "2021-09-16T12:42:02.934499", "status": "completed"}, "tags": []}, "outputs": [{"data": {"text/html": ["\n", "\n"], "text/plain": [""]}, "metadata": {}, "output_type": "display_data"}], "source": ["%%html\n", "\n", ""]}, {"cell_type": "code", "execution_count": 26, "id": "30428798", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:42:03.098132Z", "iopub.status.busy": "2021-09-16T12:42:03.092877Z", "iopub.status.idle": "2021-09-16T12:42:03.101398Z", "shell.execute_reply": "2021-09-16T12:42:03.100990Z"}, "papermill": {"duration": 0.067197, "end_time": "2021-09-16T12:42:03.101499", "exception": false, "start_time": "2021-09-16T12:42:03.034302", "status": "completed"}, "tags": []}, "outputs": [{"data": {"text/html": ["\n", "\n", "\n", "\n", "\n", "\n", "\n", "\n", "\n", "
Model Validation Bpd Test Bpd Inference time Sampling time Num Parameters
simple 1.109 bpd 1.107 bpd 51 ms 50 ms 335,128
vardeq 1.068 bpd 1.066 bpd 69 ms 50 ms 379,556
multiscale1.029 bpd 1.026 bpd 40 ms 22 ms 1,062,090
"], "text/plain": [""]}, "metadata": {}, "output_type": "display_data"}], "source": ["\n", "table = [\n", " [\n", " key,\n", " \"%4.3f bpd\" % flow_dict[key][\"result\"][\"val\"][0][\"test_bpd\"],\n", " \"%4.3f bpd\" % flow_dict[key][\"result\"][\"test\"][0][\"test_bpd\"],\n", " \"%2.0f ms\" % (1000 * flow_dict[key][\"result\"][\"time\"]),\n", " \"%2.0f ms\" % (1000 * flow_dict[key][\"result\"].get(\"samp_time\", 0)),\n", " \"{:,}\".format(sum(np.prod(p.shape) for p in flow_dict[key][\"model\"].parameters())),\n", " ]\n", " for key in flow_dict\n", "]\n", "display(\n", " HTML(\n", " tabulate.tabulate(\n", " table,\n", " tablefmt=\"html\",\n", " headers=[\"Model\", \"Validation Bpd\", \"Test Bpd\", \"Inference time\", \"Sampling time\", \"Num Parameters\"],\n", " )\n", " )\n", ")"]}, {"cell_type": "markdown", "id": "0c8899de", "metadata": {"papermill": {"duration": 0.047332, "end_time": "2021-09-16T12:42:03.196088", "exception": false, "start_time": "2021-09-16T12:42:03.148756", "status": "completed"}, "tags": []}, "source": ["As we have initially expected, using variational dequantization improves upon standard dequantization in terms of bits per dimension.\n", "Although the difference with 0.04bpd doesn't seem impressive at first, it is a considerable step for generative models\n", "(most state-of-the-art models improve upon previous models in a range of 0.02-0.1bpd on CIFAR with three times as high bpd).\n", "While it takes longer to evaluate the probability of an image due to the variational dequantization,\n", "which also leads to a longer training time, it does not have an effect on the sampling time.\n", "This is because inverting variational dequantization is the same as dequantization: finding the next lower integer.\n", "\n", "When we compare the two models to the multi-scale architecture, we can see that the bits per dimension score again dropped by about 0.04bpd.\n", "Additionally, the inference time and sampling time improved notably despite having more 
parameters.\n", "Thus, we see that the multi-scale flow is not only stronger for density modeling, but also more efficient.\n", "\n", "Next, we can test the sampling quality of the models.\n", "We should note that the samples for variational dequantization and standard dequantization are very similar,\n", "and hence we visualize here only the ones for variational dequantization and the multi-scale model.\n", "However, feel free to also test out the `\"simple\"` model.\n", "The seeds are set to obtain reproducible generations and are not cherry picked."]}, {"cell_type": "code", "execution_count": 27, "id": "ab20301b", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:42:03.294176Z", "iopub.status.busy": "2021-09-16T12:42:03.293684Z", "iopub.status.idle": "2021-09-16T12:42:03.408730Z", "shell.execute_reply": "2021-09-16T12:42:03.408245Z"}, "papermill": {"duration": 0.165353, "end_time": "2021-09-16T12:42:03.408844", "exception": false, "start_time": "2021-09-16T12:42:03.243491", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["Global seed set to 44\n"]}, {"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:42:03.360522\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}], "source": ["pl.seed_everything(44)\n", "samples = flow_dict[\"vardeq\"][\"model\"].sample(img_shape=[16, 1, 28, 28])\n", "show_imgs(samples.cpu())"]}, {"cell_type": "code", "execution_count": 28, "id": "4ff785f9", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:42:03.509095Z", "iopub.status.busy": "2021-09-16T12:42:03.508627Z", "iopub.status.idle": "2021-09-16T12:42:03.616157Z", "shell.execute_reply": "2021-09-16T12:42:03.615677Z"}, "papermill": {"duration": 0.158469, "end_time": "2021-09-16T12:42:03.616267", "exception": false, "start_time": "2021-09-16T12:42:03.457798", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["Global seed set to 44\n"]}, {"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:42:03.572464\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}], "source": ["pl.seed_everything(44)\n", "samples = flow_dict[\"multiscale\"][\"model\"].sample(img_shape=[16, 8, 7, 7])\n", "show_imgs(samples.cpu())"]}, {"cell_type": "markdown", "id": "d070c015", "metadata": {"papermill": {"duration": 0.049106, "end_time": "2021-09-16T12:42:03.715575", "exception": false, "start_time": "2021-09-16T12:42:03.666469", "status": "completed"}, "tags": []}, "source": ["From the few samples, we can see a clear difference between the simple and the multi-scale model.\n", "The single-scale model has only learned local, small correlations while the multi-scale model was able to learn full,\n", "global relations that form digits.\n", "This show-cases another benefit of the multi-scale model.\n", "In contrast to VAEs, the outputs are sharp as normalizing flows can naturally model complex,\n", "multi-modal distributions while VAEs have the independent decoder output noise.\n", "Nevertheless, the samples from this flow are far from perfect as not all samples show true digits."]}, {"cell_type": "markdown", "id": "e16d33ec", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.049321, "end_time": "2021-09-16T12:42:03.814088", "exception": false, "start_time": "2021-09-16T12:42:03.764767", "status": "completed"}, "tags": []}, "source": ["### Interpolation in latent space\n", "\n", "Another popular test for the smoothness of the latent space of generative models is to interpolate between two training examples.\n", "As normalizing flows are strictly invertible, we can guarantee that any image is represented in the latent space.\n", "We again compare the variational dequantization model with the multi-scale model below."]}, {"cell_type": "code", "execution_count": 29, "id": "c066c621", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:42:03.919045Z", "iopub.status.busy": "2021-09-16T12:42:03.918562Z", "iopub.status.idle": 
"2021-09-16T12:42:03.949438Z", "shell.execute_reply": "2021-09-16T12:42:03.948964Z"}, "papermill": {"duration": 0.085776, "end_time": "2021-09-16T12:42:03.949542", "exception": false, "start_time": "2021-09-16T12:42:03.863766", "status": "completed"}, "tags": []}, "outputs": [], "source": ["@torch.no_grad()\n", "def interpolate(model, img1, img2, num_steps=8):\n", " \"\"\"\n", " Args:\n", " model: object of ImageFlow class that represents the (trained) flow model\n", " img1, img2: Image tensors of shape [1, 28, 28]. Images between which should be interpolated.\n", " num_steps: Number of interpolation steps. 8 interpolation steps mean 6 intermediate pictures besides img1 and img2\n", " \"\"\"\n", " imgs = torch.stack([img1, img2], dim=0).to(model.device)\n", " z, _ = model.encode(imgs)\n", " alpha = torch.linspace(0, 1, steps=num_steps, device=z.device).view(-1, 1, 1, 1)\n", " interpolations = z[0:1] * alpha + z[1:2] * (1 - alpha)\n", " interp_imgs = model.sample(interpolations.shape[:1] + imgs.shape[1:], z_init=interpolations)\n", " show_imgs(interp_imgs, row_size=8)\n", "\n", "\n", "exmp_imgs, _ = next(iter(train_loader))"]}, {"cell_type": "code", "execution_count": 30, "id": "dc209bbb", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:42:04.053707Z", "iopub.status.busy": "2021-09-16T12:42:04.053237Z", "iopub.status.idle": "2021-09-16T12:42:04.365802Z", "shell.execute_reply": "2021-09-16T12:42:04.366194Z"}, "papermill": {"duration": 0.36694, "end_time": "2021-09-16T12:42:04.366333", "exception": false, "start_time": "2021-09-16T12:42:03.999393", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["Global seed set to 42\n"]}, {"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:42:04.133364\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}, {"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:42:04.336241\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}], "source": ["pl.seed_everything(42)\n", "for i in range(2):\n", " interpolate(flow_dict[\"vardeq\"][\"model\"], exmp_imgs[2 * i], exmp_imgs[2 * i + 1])"]}, {"cell_type": "code", "execution_count": 31, "id": "6a103456", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:42:04.481539Z", "iopub.status.busy": "2021-09-16T12:42:04.481065Z", "iopub.status.idle": "2021-09-16T12:42:04.697014Z", "shell.execute_reply": "2021-09-16T12:42:04.696379Z"}, "papermill": {"duration": 0.278454, "end_time": "2021-09-16T12:42:04.697129", "exception": false, "start_time": "2021-09-16T12:42:04.418675", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["Global seed set to 42\n"]}, {"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:42:04.561824\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}, {"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:42:04.667333\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}], "source": ["pl.seed_everything(42)\n", "for i in range(2):\n", " interpolate(flow_dict[\"multiscale\"][\"model\"], exmp_imgs[2 * i], exmp_imgs[2 * i + 1])"]}, {"cell_type": "markdown", "id": "ac2dff10", "metadata": {"papermill": {"duration": 0.053429, "end_time": "2021-09-16T12:42:04.804401", "exception": false, "start_time": "2021-09-16T12:42:04.750972", "status": "completed"}, "tags": []}, "source": ["The interpolations of the multi-scale model result in more realistic digits\n", "(first row $7\\leftrightarrow 8\\leftrightarrow 6$, second row $9\\leftrightarrow 4\\leftrightarrow 6$),\n", "while the variational dequantization model focuses on local patterns that globally do not form a digit.\n", "For the multi-scale model, we actually did not do the \"true\" interpolation between the two images\n", "as we did not consider the variables that were split along the flow (they have been sampled randomly for all samples).\n", "However, as we will see in the next experiment, the early variables do not effect the overall image much."]}, {"cell_type": "markdown", "id": "e3c5cbb6", "metadata": {"papermill": {"duration": 0.052651, "end_time": "2021-09-16T12:42:04.909712", "exception": false, "start_time": "2021-09-16T12:42:04.857061", "status": "completed"}, "tags": []}, "source": ["### Visualization of latents in different levels of multi-scale\n", "\n", "In the following we will focus more on the multi-scale flow.\n", "We want to analyse what information is being stored in the variables split at early layers,\n", "and what information for the final variables.\n", "For this, we sample 8 images where each of them share the same final latent variables,\n", "but differ in the other part of the latent variables.\n", "Below we visualize three examples of this:"]}, {"cell_type": "code", "execution_count": 32, "id": "4c3c81a9", "metadata": {"execution": {"iopub.execute_input": 
"2021-09-16T12:42:05.022247Z", "iopub.status.busy": "2021-09-16T12:42:05.021766Z", "iopub.status.idle": "2021-09-16T12:42:05.288274Z", "shell.execute_reply": "2021-09-16T12:42:05.287851Z"}, "papermill": {"duration": 0.323428, "end_time": "2021-09-16T12:42:05.288390", "exception": false, "start_time": "2021-09-16T12:42:04.964962", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["Global seed set to 44\n"]}, {"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:42:05.083293\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}, {"data": {"application/pdf": "JVBERi0xLjQKJazcIKu6CjEgMCBvYmoKPDwgL1BhZ2VzIDIgMCBSIC9UeXBlIC9DYXRhbG9nID4+CmVuZG9iago4IDAgb2JqCjw8IC9FeHRHU3RhdGUgNCAwIFIgL0ZvbnQgMyAwIFIgL1BhdHRlcm4gNSAwIFIKL1Byb2NTZXQgWyAvUERGIC9UZXh0IC9JbWFnZUIgL0ltYWdlQyAvSW1hZ2VJIF0gL1NoYWRpbmcgNiAwIFIKL1hPYmplY3QgNyAwIFIgPj4KZW5kb2JqCjExIDAgb2JqCjw8IC9Bbm5vdHMgMTAgMCBSIC9Db250ZW50cyA5IDAgUgovR3JvdXAgPDwgL0NTIC9EZXZpY2VSR0IgL1MgL1RyYW5zcGFyZW5jeSAvVHlwZSAvR3JvdXAgPj4KL01lZGlhQm94IFsgMCAwIDMzNS4yOTkzNTQ4Mzg3IDE3Ny40OCBdIC9QYXJlbnQgMiAwIFIgL1Jlc291cmNlcyA4IDAgUgovVHlwZSAvUGFnZSA+PgplbmRvYmoKOSAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDEyIDAgUiA+PgpzdHJlYW0KeJxNjrEOwjAMRHd/xX1BYsdpk45FlSLGsvABVQVUtAgqwe/jMgDDSb6T7XuCiXwrOK1gTKYXBAW+G5+XYTyUHYaV2PKZVCsXmkaryuz130pKLmbL+DeeiRa6I7nwkQZ2eduOWXOC1Oo44zHiiAW+DRuAGIAYAKPYpQbBVix1/H4ZZvi9oLuhp57eJg8oJwplbmRzdHJlYW0KZW5kb2JqCjEyIDAgb2JqCjE0MgplbmRvYmoKMTAgMCBvYmoKWyBdCmVuZG9iagozIDAgb2JqCjw8ID4+CmVuZG9iago0IDAgb2JqCjw8IC9BMSA8PCAvQ0EgMCAvVHlwZSAvRXh0R1N0YXRlIC9jYSAxID4+Ci9BMiA8PCAvQ0EgMSAvVHlwZSAvRXh0R1N0YXRlIC9jYSAxID4+ID4+CmVuZG9iago1IDAgb2JqCjw8ID4+CmVuZG9iago2IDAgb2JqCjw8ID4+CmVuZG9iago3IDAgb2JqCjw8IC9JMSAxMyAwIFIgPj4KZW5kb2JqCjEzIDAgb2JqCjw8IC9CaXRzUGVyQ29tcG9uZW50IDgKL0NvbG9yU3BhY2UgWy9JbmRleGVkIC9EZXZpY2VSR0IgMjE4ICj////+/v79/f38/Pz7+/v6+vr5+fn4+Pj39/f29vb19fX09PTz8/Py8vLx8fHw8PDv7+/u7u7t7e3s7Ozr6+vq6urp6eno6Ojn5+fl5eXk5OTi4uLh4eHg4ODf39/e3t7c3Nzb29vZ2dnX19fV1dXU1NTT09PS0tLR0dHQ0NDPz8/Ozs7Nzc3MzMzLy8vKysrJycnFxcXExMTDw8PCwsLBwcG/v7+9vb28vLy7u7u6urq5ubm4uLi3t7e2tra1tbW0tLSzs7OysrKwsLCurq6tra2rq6uqqqqpqamoqKilpaWkpKSioqKhoaGgoKCenp6dnZ2cnJybm5uampqZmZmYmJiXl5eWlpaVlZWUlJSTk5OSkpKRkZGQkJCPj4+Ojo6NjY2MjIyLi4uIiIiHh4eGhoaFhYWEhISDg4OCgoKBgYGAgIB/f39+fn59fX18fHx7e3t6enp5eXl4eHh3d3d2dnZ1dXV0dHRycnJxcXFvb29ubm5tbW1sbGxra2tpaWloaGhnZ2dmZmZkZGRjY2NiYmJhYWFgYGBfX19dXV1cXFxcXFxbW1tXV1dWVlZVVVVUVFRSUlJRUVFQUFBPT09NTU1MTExLS0tKSkpJSUlISEhGRkZFRUVCQkJBQUFAQEA/Pz8+Pj49PT08PDw7Oz
s6Ojo5OTk4ODg3Nzc1NTU0NDQzMzMyMjIxMTEwMDAvLy8uLi4sLCwrKysqKipcKVwpXClcKFwoXCgnJycmJiYlJSUkJCQjIyMiIiIhISEgICAfHx8eHh4dHR0cHBwbGxsaGhoZGRkYGBgXFxcWFhYVFRUUFBQTExMREREQEBAPDw9cclxyXHIMDAwLCwtcblxuXG4JCQkICAgHBwcGBgYFBQUEBAQDAwMCAgIBAQEAAAApXQovRGVjb2RlUGFybXMgPDwgL0NvbG9ycyAxIC9Db2x1bW5zIDMyMSAvUHJlZGljdG9yIDEwID4+Ci9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9IZWlnaHQgMTY0IC9MZW5ndGggMTQgMCBSIC9TdWJ0eXBlIC9JbWFnZQovVHlwZSAvWE9iamVjdCAvV2lkdGggMzIxID4+CnN0cmVhbQp4nO2d61cT1xqHsydAuIgEayMWIyqitUUrWm1VLoIRrEQFL1XQtloNXg6C9QZa79dqqoWi1SrWKqJoixIUJKCiQhFFqUAjSf6a8yY5rnVcjNnjeves41m+v0982OtZv3lmZWZPyOyt+RcFF83/usD/fcggNmQQGzKIjc+gW1jePRwZxOLIIBZHBrE4MojFkUEsjgxicWQQiyODWBwZxOLIIBb3BganT58eH19eXu5yuThQRbjU1NSIiJs3b/I7KsIlJSWNGSMON378+OzskydP8nFkUD5kEIsTb3DXrl2SJI0ZU19f73A4Xu9QIS4nJ0en03355fPnz/kd+bjLly9Du08+efjwoQhcc3NzfHx8v37FxcV8HBmUiSoGY2NjoePp07xxCnFGoxFwV64IwsEVQavVnj8vCDdp0iTArVihCEcGZUIGsTgVDD59OnLkSDjk8eMfP36M79jVNXr0aMAtWtTe3o7HtbWFhYXBIRsMdrsdjyspCQkJCQwMtFq7u7v5ODLYJ6oYtFoZY8HBwYxdv34d3/Gvv0AfHLJGc4XzQVaEu3wZWAEBAYzZbDY8rrbW146xxsZGPo4M9gkZxOLEG2xtbZ00CZ5yFi5cKMigywXXv3nz5jGm6LmJh6uqmjBhgveQa2tr8Tin8/jx4xEREYzduXOHjyODfUIGsTjxBl9m7NixjF28eBHf0Zv09HTGTnPm6Apxvb29ZrOZscrKSkHt0tLSGLtw4QIfRwblo4rBmJgYSVq2bJmgjgUFBZ7HRCEGIdu3b2esvLxcEG7x4sWMJSUl8XFkUD5kEItTxeCcOXMkyWKxCOq4Z88eSSosLBSEO3bsmCSVlJQIwpWWlkpSfn4+H0cG5UMGsTjxBl0uV2RkpLALl91uHzFihCTB1UsEDpKbmytJFRUVInBwsPCYrdXW1NTwcWRQJqoYbG5uZox98MGjR49EdLTZbBqNZtAgQf9cgxMC7d5//8GDByJwbW1tgBswAJ5n+TgyKBMyiMWpYnD9+vWSJM2axRunELdo0SLo+N13gnCbNm0C3Lp1gnBLliwBHGfW4SaDrw8ZxOJUMNjQ4Pt/4k8/Cen4xx8GgwHmC5y5h1JcXV1UVBTgfvlFCK66euDAgUFBQWfPKsKRwT5RxeD338NHeNy4cU1NQjpaLPAhiYuL++cfIbi6Orivr1y5kjdOIa60FHA5OTn+fib5Xzgy2CdkEItTxeDUqcHBwU18fwo7pqSEh4ffuHFDEC4hwWg03rp1SxAuMVGv19+9e1chjgz2CRnE4sQbvHr1amjohg0bXC5XaWl0dHRqaiqmI2BiY7Ozs+HPb74Bk3B5xeC8s9+ioiLv4LKysq4uP4P5uKqqqoCA/fv3O53O9HSY1TgcPBwZfDWqGARjsbFtbW1w6GYzTKtnzJiB6Qj1PDf1pt7eXoMBbvEr/P3alo8zm82Rkb5vVocPB1xZmZ/BfJzJZEpM9B3shx/269fP73SBDMqEDL6VBg8cOLB9+9atWyVP4HnR72A+btasWRoNHDJ01Wrhsur3Fs/HdXZ2Rkc7HA
673T50KBRcuhTV7tChQ3/++eTJk4kTJwYEgEG/g8mgTFQx6E1ra+uaNWu0WtDJh/JxPT09eXl5Wu2pU6dE4NyeOWbKwIHFxcX8jx2fBSdk48aNjFmtVn47MigTMojFqWJQad49HBnE4sggFkcGsTgyiMWRQSyODGJxZBCLI4NYHBnE4sggFkcGsTgyiMXRqvLYkEFsyCA2ZBAbMogNGcSGZjNYHBnE4sggFkcGsTgyiMWRQSyODGJxZBCLI4NYHBnE4t7AYFpamslU5vdXtoo7ulyuuXPnxsby3lFRiHM6nfPnz//444aGBhE4t/enz++9d+LECT6ODMqHDKJwbjUMrlq1SvKs/OZ3cxLlHa1WK+C+/vrFixcicAUFBVqtds6cnp4eEbi8vLzAwMDPP8/NzeXjyKBMyCAWp4rB5ORk3usub9Jx9uzZcMi//y4I59s1QNAqEN4XNrSeVbcU4cigTFQw2NCg0+kYY198cenSJXzHrq6QkBDoaLE4/L47qRDX02M0GqHdt9+e52xRogj399/h4eFwQhITeS8Zk0H5kEEsThWDVVVBQUFhYWEazZkzZ/AdS0q03jCmqCMPl5Xlw2k0paWleNzZsy93rlB0sGSwT1Qx2NJSWVk5bdo0SRKys0FDw6hRoyIjIzUa3voSfBw80BmN/fv31+v1knTkyBF8u127srKyhnpeFO3o6ODjyGCfkEFsO1UMepOZmcmYkLudNxkZGYwpWm1XEc5kMjF27tw5QbjJkycr3AiDDMqHDGJxqhiEep6FP/2v/Kkct2/fPsb8LvTxRjibzSby/MbHxzO2e/duPo4MykcVgwcPHpQkcQYPHz4s8oTs3LlTkmbOnCkIZzabJUno/sVuMvgaHBmUj3iDLpdruGdVpm3btgnqGB4eHhioaDcuPqu7u9s7BRbXDnCMHT16lI8jg/Ihg9h24g02NTUxxiIihHwd9XIzh+jo+/fvi8C1tLQATq+/d++eCFx9fT3ghg9XtNUEGZSJKganTJkC0B9+4I1TiMvOzgZcSoqQb/nd7nXr1gGOs2uWclx+fr4kSQUFinBkUCZkEItTwWBzc6g31dVCOlZUGAwGnU73889CcDdvwn0dcL/9JgRnt+v1ejghP/6oCEcG+4QMYnGqGKyuhuuC1WoVtJnDsmVQcPPmzbxxCnH790O7pKQkhZs58AZdugS4lJQUzu/A3GTwdVHFYEJCVFQUb36pvOPkyYMHD759+7Yg3NSpcFFobGwUhPvsM/gUV/MvWGTwdSGDWJx4g11dXTrd0v+slP3s2TO/PwTm43p7ewMCMjIy3J7VuOPi4trb2zG42tra0NCioiLvzhUmk6muzs9gPu7atWuMZWZmuj0bLC9fvryqiocjg6+GDL6VBhcsWPDRR75XZw4cgGm131W4+bjCwsKEBN+rM199pdVq/b7jw8clJydPnOj7L+enn8I05PBhP4P5OIvFEhMDGp1OZ1AQ4Py+k0MGZaKKwbq6ugEDQOOwYcO8e0N0dnZiOsJkWqPxPTdJEjyL2e12DM7hcFy9+vTp07179wYGwgn59Vc/g/m4HTt2DBoUExOTnp4eFAQ4m42HI4Ovhgy+lQa9aWlpSUtLCwvbsmWL33EKcR0dHXA77t/fwtkkWCEO7u+rV68ODeUNVoirqakZMmSIwbB27Vo+jgzKRBWDSvPu4cggFkcGsTgyiMWRQSyODGJxZBCLI4NYHBnE4sggFkcGsTgyiMWRQSyODGJxtKo8NmQQGzKIDRnEhgxi829rp63ZCmVuZHN0cmVhbQplbmRvYmoKMTQgMCBvYmoKMjQ5NwplbmRvYmoKMiAwIG9iago8PCAvQ291bnQgMSAvS2lkcyBbIDExIDAgUiBdIC9UeXBlIC9QYWdlcyA+PgplbmRvYmoKMTUgMCBvYmoKPDwgL0NyZWF0aW9uRGF0ZSAoRDoyMDIxMDkxNjE0NDIwNSswMicwMCcpCi9DcmVhdG9yIChNYXRwbG
90bGliIHYzLjQuMywgaHR0cHM6Ly9tYXRwbG90bGliLm9yZykKL1Byb2R1Y2VyIChNYXRwbG90bGliIHBkZiBiYWNrZW5kIHYzLjQuMykgPj4KZW5kb2JqCnhyZWYKMCAxNgowMDAwMDAwMDAwIDY1NTM1IGYgCjAwMDAwMDAwMTYgMDAwMDAgbiAKMDAwMDAwNDI5MCAwMDAwMCBuIAowMDAwMDAwNjU5IDAwMDAwIG4gCjAwMDAwMDA2ODAgMDAwMDAgbiAKMDAwMDAwMDc3OSAwMDAwMCBuIAowMDAwMDAwODAwIDAwMDAwIG4gCjAwMDAwMDA4MjEgMDAwMDAgbiAKMDAwMDAwMDA2NSAwMDAwMCBuIAowMDAwMDAwNDAyIDAwMDAwIG4gCjAwMDAwMDA2MzkgMDAwMDAgbiAKMDAwMDAwMDIwOCAwMDAwMCBuIAowMDAwMDAwNjE5IDAwMDAwIG4gCjAwMDAwMDA4NTMgMDAwMDAgbiAKMDAwMDAwNDI2OSAwMDAwMCBuIAowMDAwMDA0MzUwIDAwMDAwIG4gCnRyYWlsZXIKPDwgL0luZm8gMTUgMCBSIC9Sb290IDEgMCBSIC9TaXplIDE2ID4+CnN0YXJ0eHJlZgo0NTA3CiUlRU9GCg==\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:42:05.171845\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}, {"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:42:05.257858\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}], "source": ["pl.seed_everything(44)\n", "for _ in range(3):\n", " z_init = flow_dict[\"multiscale\"][\"model\"].prior.sample(sample_shape=[1, 8, 7, 7])\n", " z_init = z_init.expand(8, -1, -1, -1)\n", " samples = flow_dict[\"multiscale\"][\"model\"].sample(img_shape=z_init.shape, z_init=z_init)\n", " show_imgs(samples.cpu())"]}, {"cell_type": "markdown", "id": "8cb113a3", "metadata": {"papermill": {"duration": 0.054683, "end_time": "2021-09-16T12:42:05.399905", "exception": false, "start_time": "2021-09-16T12:42:05.345222", "status": "completed"}, "tags": []}, "source": ["We see that the early split variables indeed have a smaller effect on the image.\n", "Still, small differences can be spot when we look carefully at the borders of the digits.\n", "For instance, the hole at the top of the 8 changes for different samples although all of them represent the same coarse structure.\n", "This shows that the flow indeed learns to separate the higher-level\n", "information in the final variables, while the early split ones contain\n", "local noise patterns."]}, {"cell_type": "markdown", "id": "256310bb", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.054446, "end_time": "2021-09-16T12:42:05.508976", "exception": false, "start_time": "2021-09-16T12:42:05.454530", "status": "completed"}, "tags": []}, "source": ["### Visualizing Dequantization\n", "\n", "As a final part of this notebook, we will look at the effect of variational dequantization.\n", "We have motivated variational dequantization by the issue of sharp edges/boarders being difficult to model,\n", "and a flow would rather prefer smooth, prior-like distributions.\n", "To check how what noise distribution $q(u|x)$ the flows in the\n", "variational dequantization module have learned, we can plot a histogram\n", "of output values from the dequantization and variational dequantization\n", "module."]}, {"cell_type": 
"code", "execution_count": 33, "id": "665bc626", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:42:05.628077Z", "iopub.status.busy": "2021-09-16T12:42:05.623860Z", "iopub.status.idle": "2021-09-16T12:42:05.658084Z", "shell.execute_reply": "2021-09-16T12:42:05.657594Z"}, "papermill": {"duration": 0.093163, "end_time": "2021-09-16T12:42:05.658187", "exception": false, "start_time": "2021-09-16T12:42:05.565024", "status": "completed"}, "tags": []}, "outputs": [], "source": ["def visualize_dequant_distribution(model: ImageFlow, imgs: torch.Tensor, title: str = None):\n", " \"\"\"\n", " Args:\n", " model: The flow of which we want to visualize the dequantization distribution\n", " imgs: Example training images of which we want to visualize the dequantization distribution\n", " \"\"\"\n", " imgs = imgs.to(device)\n", " ldj = torch.zeros(imgs.shape[0], dtype=torch.float32).to(device)\n", " with torch.no_grad():\n", " dequant_vals = []\n", " for _ in tqdm(range(8), leave=False):\n", " d, _ = model.flows[0](imgs, ldj, reverse=False)\n", " dequant_vals.append(d)\n", " dequant_vals = torch.cat(dequant_vals, dim=0)\n", " dequant_vals = dequant_vals.view(-1).cpu().numpy()\n", " sns.set()\n", " plt.figure(figsize=(10, 3))\n", " plt.hist(dequant_vals, bins=256, color=to_rgb(\"C0\") + (0.5,), edgecolor=\"C0\", density=True)\n", " if title is not None:\n", " plt.title(title)\n", " plt.show()\n", " plt.close()\n", "\n", "\n", "sample_imgs, _ = next(iter(train_loader))"]}, {"cell_type": "code", "execution_count": 34, "id": "0e0a4cb8", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:42:05.770898Z", "iopub.status.busy": "2021-09-16T12:42:05.770412Z", "iopub.status.idle": "2021-09-16T12:42:06.769321Z", "shell.execute_reply": "2021-09-16T12:42:06.769715Z"}, "papermill": {"duration": 1.056909, "end_time": "2021-09-16T12:42:06.769866", "exception": false, "start_time": "2021-09-16T12:42:05.712957", "status": "completed"}, "tags": []}, "outputs": [{"data": 
{"application/vnd.jupyter.widget-view+json": {"model_id": "b632bd849f444d76b9cdb1ce9b458ecc", "version_major": 2, "version_minor": 0}, "text/plain": [" 0%| | 0/8 [00:00\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:42:06.250107\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}], "source": ["visualize_dequant_distribution(flow_dict[\"simple\"][\"model\"], sample_imgs, title=\"Dequantization\")"]}, {"cell_type": "code", "execution_count": 35, "id": "c3deeaa6", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:42:06.894994Z", "iopub.status.busy": "2021-09-16T12:42:06.894523Z", "iopub.status.idle": "2021-09-16T12:42:08.443397Z", "shell.execute_reply": "2021-09-16T12:42:08.443791Z"}, "papermill": {"duration": 1.612603, "end_time": "2021-09-16T12:42:08.443933", "exception": false, "start_time": "2021-09-16T12:42:06.831330", "status": "completed"}, "tags": []}, "outputs": [{"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "e14299cd737b4a32ae911b93b2592618", "version_major": 2, "version_minor": 0}, "text/plain": [" 0%| | 0/8 [00:00\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:42:07.870733\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}], "source": ["visualize_dequant_distribution(flow_dict[\"vardeq\"][\"model\"], sample_imgs, title=\"Variational dequantization\")"]}, {"cell_type": "markdown", "id": "37caab54", "metadata": {"papermill": {"duration": 0.062935, "end_time": "2021-09-16T12:42:08.571623", "exception": false, "start_time": "2021-09-16T12:42:08.508688", "status": "completed"}, "tags": []}, "source": ["The dequantization distribution in the first plot shows that the MNIST images have a strong bias towards 0 (black),\n", "and the distribution of them have a sharp border as mentioned before.\n", "The variational dequantization module has indeed learned a much smoother distribution with a Gaussian-like curve which can be modeled much better.\n", "For the other values, we would need to visualize the distribution $q(u|x)$ on a deeper level, depending on $x$.\n", "However, as all $u$'s interact and depend on each other, we would need\n", "to visualize a distribution in 784 dimensions, which is not that\n", "intuitive anymore."]}, {"cell_type": "markdown", "id": "2cc36677", "metadata": {"papermill": {"duration": 0.062538, "end_time": "2021-09-16T12:42:08.696736", "exception": false, "start_time": "2021-09-16T12:42:08.634198", "status": "completed"}, "tags": []}, "source": ["## Conclusion\n", "\n", "In conclusion, we have seen how to implement our own normalizing flow, and what difficulties arise if we want to apply them on images.\n", "Dequantization is a crucial step in mapping the discrete images into continuous space to prevent underisable delta-peak solutions.\n", "While dequantization creates hypercubes with hard border, variational dequantization allows us to fit a flow much better on the data.\n", "This allows us to obtain a lower bits per dimension score, while not affecting the sampling speed.\n", "The most common flow element, the coupling layer, is simple to implement, and yet effective.\n", "Furthermore, multi-scale architectures 
help to capture the global image context while allowing us to efficiently scale up the flow.\n", "Normalizing flows are an interesting alternative to VAEs as they allow an exact likelihood estimate in continuous space,\n", "and we have the guarantee that every possible input $x$ has a corresponding latent vector $z$.\n", "However, even beyond continuous inputs and images, flows can be applied and allow us to exploit\n", "the data structure in latent space, e.g., on graphs for the task of molecule generation [6].\n", "Recent advances in [Neural ODEs](https://arxiv.org/pdf/1806.07366.pdf) allow a flow with an infinite number of layers,\n", "called Continuous Normalizing Flows, whose potential has yet to be fully explored.\n", "Overall, normalizing flows are an exciting research area which will continue to develop over the next couple of years."]}, {"cell_type": "markdown", "id": "d5a736a3", "metadata": {"papermill": {"duration": 0.06309, "end_time": "2021-09-16T12:42:08.823219", "exception": false, "start_time": "2021-09-16T12:42:08.760129", "status": "completed"}, "tags": []}, "source": ["## References\n", "\n", "[1] Dinh, L., Sohl-Dickstein, J., and Bengio, S. (2017).\n", "\u201cDensity estimation using Real NVP,\u201d In: 5th International Conference on Learning Representations, ICLR 2017.\n", "[Link](https://arxiv.org/abs/1605.08803)\n", "\n", "[2] Kingma, D. P., and Dhariwal, P. (2018).\n", "\u201cGlow: Generative Flow with Invertible 1x1 Convolutions,\u201d In: Advances in Neural Information Processing Systems, vol.\n", "31, pp.\n", "10215--10224.\n", "[Link](http://papers.nips.cc/paper/8224-glow-generative-flow-with-invertible-1x1-convolutions.pdf)\n", "\n", "[3] Ho, J., Chen, X., Srinivas, A., Duan, Y., and Abbeel, P. 
(2019).\n", "\u201cFlow++: Improving Flow-Based Generative Models with Variational Dequantization and Architecture Design,\u201d\n", "in Proceedings of the 36th International Conference on Machine Learning, vol.\n", "97, pp.\n", "2722\u20132730.\n", "[Link](https://arxiv.org/abs/1902.00275)\n", "\n", "[4] Durkan, C., Bekasov, A., Murray, I., and Papamakarios, G. (2019).\n", "\u201cNeural Spline Flows,\u201d In: Advances in Neural Information Processing Systems, pp.\n", "7509\u20137520.\n", "[Link](http://papers.neurips.cc/paper/8969-neural-spline-flows.pdf)\n", "\n", "[5] Hoogeboom, E., Cohen, T. S., and Tomczak, J. M. (2020).\n", "\u201cLearning Discrete Distributions by Dequantization,\u201d arXiv preprint arXiv:2001.11235v1.\n", "[Link](https://arxiv.org/abs/2001.11235)\n", "\n", "[6] Lippe, P., and Gavves, E. (2021).\n", "\u201cCategorical Normalizing Flows via Continuous Transformations,\u201d\n", "In: International Conference on Learning Representations, ICLR 2021.\n", "[Link](https://openreview.net/pdf?id=-GLNZeVDuik)"]}, {"cell_type": "markdown", "id": "d586cc6a", "metadata": {"papermill": {"duration": 0.065018, "end_time": "2021-09-16T12:42:08.951852", "exception": false, "start_time": "2021-09-16T12:42:08.886834", "status": "completed"}, "tags": []}, "source": ["## Congratulations - Time to Join the Community!\n", "\n", "Congratulations on completing this notebook tutorial! If you enjoyed this and would like to join the Lightning\n", "movement, you can do so in the following ways!\n", "\n", "### Star [Lightning](https://github.com/PyTorchLightning/pytorch-lightning) on GitHub\n", "The easiest way to help our community is just by starring the GitHub repos! This helps raise awareness of the cool\n", "tools we're building.\n", "\n", "### Join our [Slack](https://join.slack.com/t/pytorch-lightning/shared_invite/zt-pw5v393p-qRaDgEk24~EjiZNBpSQFgQ)!\n", "The best way to keep up to date on the latest advancements is to join our community! 
Make sure to introduce yourself\n", "and share your interests in `#general` channel\n", "\n", "\n", "### Contributions !\n", "The best way to contribute to our community is to become a code contributor! At any time you can go to\n", "[Lightning](https://github.com/PyTorchLightning/pytorch-lightning) or [Bolt](https://github.com/PyTorchLightning/lightning-bolts)\n", "GitHub Issues page and filter for \"good first issue\".\n", "\n", "* [Lightning good first issue](https://github.com/PyTorchLightning/pytorch-lightning/issues?q=is%3Aopen+is%3Aissue+label%3A%22good+first+issue%22)\n", "* [Bolt good first issue](https://github.com/PyTorchLightning/lightning-bolts/issues?q=is%3Aopen+is%3Aissue+label%3A%22good+first+issue%22)\n", "* You can also contribute your own notebooks with useful examples !\n", "\n", "### Great thanks from the entire Pytorch Lightning Team for your interest !\n", "\n", "![Pytorch Lightning](){height=\"60px\" width=\"240px\"}"]}, {"cell_type": "raw", "metadata": {"raw_mimetype": "text/restructuredtext"}, "source": [".. customcarditem::\n", " :header: Tutorial 9: Normalizing Flows for Image Modeling\n", " :card_description: In this tutorial, we will take a closer look at complex, deep normalizing flows. 
The most popular, current application of deep normalizing flows is to model datasets of...\n", " :tags: Image,GPU/TPU,UvA-DL-Course\n", " :image: _static/images/course_UvA-DL/09-normalizing-flows.jpg"]}], "metadata": {"jupytext": {"cell_metadata_filter": "colab,id,colab_type,-all", "formats": "ipynb,py:percent", "main_language": "python"}, "language_info": {"codemirror_mode": {"name": "ipython", "version": 3}, "file_extension": ".py", "mimetype": "text/x-python", "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.9.7"}, "papermill": {"default_parameters": {}, "duration": 19.664801, "end_time": "2021-09-16T12:42:09.722798", "environment_variables": {}, "exception": null, "input_path": "course_UvA-DL/09-normalizing-flows/NF_image_modeling.ipynb", "output_path": ".notebooks/course_UvA-DL/09-normalizing-flows.ipynb", "parameters": {}, "start_time": "2021-09-16T12:41:50.057997", "version": "2.3.3"}, "widgets": {"application/vnd.jupyter.widget-state+json": {"state": {"0989ef9cef0e410d8ba8708d70a44485": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_bd437d01e4504868a0eab569e54fc653", "placeholder": "\u200b", "style": "IPY_MODEL_ddf110132d7a4b79a55b81c2445d20f3", "value": " 5/8 [00:00<00:00, 34.55it/s]"}}, "121d677b3fe64b379404376f171236bb": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", 
"_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "20eced8f26104528a837da146da0288f": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "212476674e8742c5a36d5a6a59b8d2cf": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "21d9114cc8a54f54998866b9b4c3f542": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": 
"@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "301d6460224d44a69468ee761437b216": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_20eced8f26104528a837da146da0288f", "placeholder": "\u200b", "style": "IPY_MODEL_52759cf555ba4bb79cbb72b597401e1c", "value": " 0/8 [00:00<?, ?it/s]"}}, "3420b49f1b7245029561a3537f3672e5": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, 
"grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "360f088f7aa34336bba895d5688f18f3": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "52759cf555ba4bb79cbb72b597401e1c": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", 
"_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "5cac1945d4b94e45a8cb5128a7462916": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "63e7d0109110426fad97b7d711fa9919": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_e7fb1721fcec4c4eab30b9ff09edbb4a", "max": 8.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_212476674e8742c5a36d5a6a59b8d2cf", "value": 8.0}}, 
"9caa927d490648dca2d1d7c54e448858": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_ee2e2fb65a534444bfa51ad704a04f35", "max": 8.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_121d677b3fe64b379404376f171236bb", "value": 8.0}}, "a26ef8f75ac44f1c9a6872f079431d43": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_21d9114cc8a54f54998866b9b4c3f542", "placeholder": "\u200b", "style": "IPY_MODEL_edb3a164cc18459694b2c1dbb050b44a", "value": " 0%"}}, "b632bd849f444d76b9cdb1ce9b458ecc": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_a26ef8f75ac44f1c9a6872f079431d43", "IPY_MODEL_63e7d0109110426fad97b7d711fa9919", "IPY_MODEL_301d6460224d44a69468ee761437b216"], "layout": "IPY_MODEL_3420b49f1b7245029561a3537f3672e5"}}, "bd437d01e4504868a0eab569e54fc653": {"model_module": "@jupyter-widgets/base", 
"model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "ca544fad59514bc6b35ed43510f6bb85": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "ddf110132d7a4b79a55b81c2445d20f3": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "e14299cd737b4a32ae911b93b2592618": {"model_module": 
"@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_f797208673e64a9aac664d03c1b76f3a", "IPY_MODEL_9caa927d490648dca2d1d7c54e448858", "IPY_MODEL_0989ef9cef0e410d8ba8708d70a44485"], "layout": "IPY_MODEL_360f088f7aa34336bba895d5688f18f3"}}, "e7fb1721fcec4c4eab30b9ff09edbb4a": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "edb3a164cc18459694b2c1dbb050b44a": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", 
"_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "ee2e2fb65a534444bfa51ad704a04f35": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "f797208673e64a9aac664d03c1b76f3a": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_5cac1945d4b94e45a8cb5128a7462916", "placeholder": "\u200b", "style": "IPY_MODEL_ca544fad59514bc6b35ed43510f6bb85", "value": " 62%"}}}, "version_major": 2, "version_minor": 0}}}, "nbformat": 4, "nbformat_minor": 5} \ No newline at end of 
file diff --git a/source/notebooks/course_UvA-DL/10-autoregressive-image-modeling.ipynb b/source/notebooks/course_UvA-DL/10-autoregressive-image-modeling.ipynb deleted file mode 100644 index f7164e0..0000000 --- a/source/notebooks/course_UvA-DL/10-autoregressive-image-modeling.ipynb +++ /dev/null @@ -1 +0,0 @@ -{"cells": [{"cell_type": "markdown", "id": "10249518", "metadata": {"papermill": {"duration": 0.025611, "end_time": "2021-09-16T12:42:18.560094", "exception": false, "start_time": "2021-09-16T12:42:18.534483", "status": "completed"}, "tags": []}, "source": ["\n", "# Tutorial 10: Autoregressive Image Modeling\n", "\n", "* **Author:** Phillip Lippe\n", "* **License:** CC BY-SA\n", "* **Generated:** 2021-09-16T14:32:36.593971\n", "\n", "In this tutorial, we implement an autoregressive likelihood model for the task of image modeling.\n", "Autoregressive models are naturally strong generative models that constitute one of the current\n", "state-of-the-art architectures on likelihood-based image modeling,\n", "and are also the basis for large language generation models such as GPT3.\n", "We will focus on the PixelCNN architecture in this tutorial, and apply it to MNIST modeling.\n", "This notebook is part of a lecture series on Deep Learning at the University of Amsterdam.\n", "The full list of tutorials can be found at https://uvadlc-notebooks.rtfd.io.\n", "\n", "\n", "---\n", "Open in [![Open In Colab](){height=\"20px\" width=\"117px\"}](https://colab.research.google.com/github/PytorchLightning/lightning-tutorials/blob/publication/.notebooks/course_UvA-DL/10-autoregressive-image-modeling.ipynb)\n", "\n", "Give us a \u2b50 [on Github](https://www.github.com/PytorchLightning/pytorch-lightning/)\n", "| Check out [the documentation](https://pytorch-lightning.readthedocs.io/en/latest/)\n", "| Join us [on Slack](https://join.slack.com/t/pytorch-lightning/shared_invite/zt-pw5v393p-qRaDgEk24~EjiZNBpSQFgQ)"]}, {"cell_type": "markdown", "id": "3109481c", "metadata": 
{"papermill": {"duration": 0.024038, "end_time": "2021-09-16T12:42:18.608085", "exception": false, "start_time": "2021-09-16T12:42:18.584047", "status": "completed"}, "tags": []}, "source": ["## Setup\n", "This notebook requires some packages besides pytorch-lightning."]}, {"cell_type": "code", "execution_count": 1, "id": "86088e31", "metadata": {"colab": {}, "colab_type": "code", "execution": {"iopub.execute_input": "2021-09-16T12:42:18.659637Z", "iopub.status.busy": "2021-09-16T12:42:18.659166Z", "iopub.status.idle": "2021-09-16T12:42:18.661686Z", "shell.execute_reply": "2021-09-16T12:42:18.661233Z"}, "id": "LfrJLKPFyhsK", "lines_to_next_cell": 0, "papermill": {"duration": 0.029126, "end_time": "2021-09-16T12:42:18.661813", "exception": false, "start_time": "2021-09-16T12:42:18.632687", "status": "completed"}, "tags": []}, "outputs": [], "source": ["# ! pip install --quiet \"torch>=1.6, <1.9\" \"seaborn\" \"torchvision\" \"matplotlib\" \"torchmetrics>=0.3\" \"pytorch-lightning>=1.3\""]}, {"cell_type": "markdown", "id": "e1dc997d", "metadata": {"papermill": {"duration": 0.024049, "end_time": "2021-09-16T12:42:18.710135", "exception": false, "start_time": "2021-09-16T12:42:18.686086", "status": "completed"}, "tags": []}, "source": ["
\n", "\n", "Similar to the language generation you have seen in assignment 2, autoregressive models work on images by modeling the likelihood of a pixel given all previous ones.\n", "For instance, in the picture below, we model the pixel $x_i$ as a conditional probability distribution\n", "based on all previous (here blue) pixels (figure credit - [Aaron van den Oord et al. ](https://arxiv.org/abs/1601.06759)):\n", "\n", "
\n", "\n", "Generally, autoregressive model over high-dimensional data $\\mathbf{x}$ factor the joint distribution as the following product of conditionals:\n", "\n", "$$p(\\mathbf{x})=p(x_1, ..., x_n)=\\prod_{i=1}^{n} p(x_i|x_1,...,x_{i-1})$$\n", "\n", "Learning these conditionals is often much simpler than learning the joint distribution $p(\\mathbf{x})$ all together.\n", "However, disadvantages of autoregressive models include slow sampling, especially for large images,\n", "as we need height-times-width forward passes through the model.\n", "In addition, for some applications, we require a latent space as modeled in VAEs and Normalizing Flows.\n", "For instance, in autoregressive models, we cannot interpolate between two images because of the lack of a latent representation.\n", "We will explore and discuss these benefits and drawbacks alongside with our implementation.\n", "\n", "Our implementation will focus on the [PixelCNN](https://arxiv.org/pdf/1606.05328.pdf) [2] model which has been discussed in detail in the lecture.\n", "Most current SOTA models use PixelCNN as their fundamental architecture,\n", "and various additions have been proposed to improve the performance\n", "(e.g. [PixelCNN++](https://arxiv.org/pdf/1701.05517.pdf) and [PixelSNAIL](http://proceedings.mlr.press/v80/chen18h/chen18h.pdf)).\n", "Hence, implementing PixelCNN is a good starting point for our short tutorial.\n", "\n", "First of all, we need to import our standard libraries. 
Similarly as in\n", "the last couple of tutorials, we will use [PyTorch\n", "Lightning](https://pytorch-lightning.readthedocs.io/en/latest/) here as\n", "well."]}, {"cell_type": "code", "execution_count": 2, "id": "6c3a3524", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:42:18.766239Z", "iopub.status.busy": "2021-09-16T12:42:18.759431Z", "iopub.status.idle": "2021-09-16T12:42:20.494992Z", "shell.execute_reply": "2021-09-16T12:42:20.494567Z"}, "papermill": {"duration": 1.761266, "end_time": "2021-09-16T12:42:20.495107", "exception": false, "start_time": "2021-09-16T12:42:18.733841", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["/tmp/ipykernel_3486/3450944711.py:26: DeprecationWarning: `set_matplotlib_formats` is deprecated since IPython 7.23, directly use `matplotlib_inline.backend_inline.set_matplotlib_formats()`\n", " set_matplotlib_formats(\"svg\", \"pdf\") # For export\n", "Global seed set to 42\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Using device cuda:0\n"]}, {"data": {"text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}], "source": ["\n", "import math\n", "import os\n", "import urllib.request\n", "from urllib.error import HTTPError\n", "\n", "# Imports for plotting\n", "import matplotlib.pyplot as plt\n", "import numpy as np\n", "import pytorch_lightning as pl\n", "import seaborn as sns\n", "import torch\n", "import torch.nn as nn\n", "import torch.nn.functional as F\n", "import torch.optim as optim\n", "import torch.utils.data as data\n", "import torchvision\n", "from IPython.display import set_matplotlib_formats\n", "from matplotlib.colors import to_rgb\n", "from pytorch_lightning.callbacks import LearningRateMonitor, ModelCheckpoint\n", "from torchvision import transforms\n", "from torchvision.datasets import MNIST\n", "from tqdm.notebook import tqdm\n", "\n", "plt.set_cmap(\"cividis\")\n", "# %matplotlib inline\n", "set_matplotlib_formats(\"svg\", \"pdf\") # For export\n", "\n", "# Path to the folder where the datasets are/should be downloaded (e.g. 
MNIST)\n", "DATASET_PATH = os.environ.get(\"PATH_DATASETS\", \"data\")\n", "# Path to the folder where the pretrained models are saved\n", "CHECKPOINT_PATH = os.environ.get(\"PATH_CHECKPOINT\", \"saved_models/tutorial12\")\n", "\n", "# Setting the seed\n", "pl.seed_everything(42)\n", "\n", "# Ensure that all operations are deterministic on GPU (if used) for reproducibility\n", "torch.backends.cudnn.determinstic = True\n", "torch.backends.cudnn.benchmark = False\n", "\n", "# Fetching the device that will be used throughout this notebook\n", "device = torch.device(\"cpu\") if not torch.cuda.is_available() else torch.device(\"cuda:0\")\n", "print(\"Using device\", device)"]}, {"cell_type": "markdown", "id": "9527732b", "metadata": {"papermill": {"duration": 0.024895, "end_time": "2021-09-16T12:42:20.545620", "exception": false, "start_time": "2021-09-16T12:42:20.520725", "status": "completed"}, "tags": []}, "source": ["We again provide a pretrained model, which is downloaded below:"]}, {"cell_type": "code", "execution_count": 3, "id": "9b4b631a", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:42:20.600149Z", "iopub.status.busy": "2021-09-16T12:42:20.597718Z", "iopub.status.idle": "2021-09-16T12:42:20.772102Z", "shell.execute_reply": "2021-09-16T12:42:20.771611Z"}, "papermill": {"duration": 0.201736, "end_time": "2021-09-16T12:42:20.772216", "exception": false, "start_time": "2021-09-16T12:42:20.570480", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Downloading https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial12/PixelCNN.ckpt...\n"]}], "source": ["# Github URL where saved models are stored for this tutorial\n", "base_url = \"https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial12/\"\n", "# Files to download\n", "pretrained_files = [\"PixelCNN.ckpt\"]\n", "# Create checkpoint path if it doesn't exist yet\n", "os.makedirs(CHECKPOINT_PATH, exist_ok=True)\n", "\n", 
"# For each file, check whether it already exists. If not, try downloading it.\n", "for file_name in pretrained_files:\n", " file_path = os.path.join(CHECKPOINT_PATH, file_name)\n", " if not os.path.isfile(file_path):\n", " file_url = base_url + file_name\n", " print(\"Downloading %s...\" % file_url)\n", " try:\n", " urllib.request.urlretrieve(file_url, file_path)\n", " except HTTPError as e:\n", " print(\n", " \"Something went wrong. Please try to download the file from the GDrive folder, or contact the author with the full output including the following error:\\n\",\n", " e,\n", " )"]}, {"cell_type": "markdown", "id": "a675f0ec", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.024998, "end_time": "2021-09-16T12:42:20.823035", "exception": false, "start_time": "2021-09-16T12:42:20.798037", "status": "completed"}, "tags": []}, "source": ["Similar to the Normalizing Flows in Tutorial 11, we will work on the\n", "MNIST dataset and use 8-bits per pixel (values between 0 and 255). The\n", "dataset is loaded below:"]}, {"cell_type": "code", "execution_count": 4, "id": "26f824ca", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:42:20.878881Z", "iopub.status.busy": "2021-09-16T12:42:20.878404Z", "iopub.status.idle": "2021-09-16T12:42:20.910958Z", "shell.execute_reply": "2021-09-16T12:42:20.910469Z"}, "papermill": {"duration": 0.062918, "end_time": "2021-09-16T12:42:20.911075", "exception": false, "start_time": "2021-09-16T12:42:20.848157", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["Global seed set to 42\n"]}], "source": ["# Convert images from 0-1 to 0-255 (integers). 
We use the long datatype as we will use the images as labels as well\n", "def discretize(sample):\n", " return (sample * 255).to(torch.long)\n", "\n", "\n", "# Transformations applied on each image => only make them a tensor\n", "transform = transforms.Compose([transforms.ToTensor(), discretize])\n", "\n", "# Loading the training dataset. We need to split it into a training and validation part\n", "train_dataset = MNIST(root=DATASET_PATH, train=True, transform=transform, download=True)\n", "pl.seed_everything(42)\n", "train_set, val_set = torch.utils.data.random_split(train_dataset, [50000, 10000])\n", "\n", "# Loading the test set\n", "test_set = MNIST(root=DATASET_PATH, train=False, transform=transform, download=True)\n", "\n", "# We define a set of data loaders that we can use for various purposes later.\n", "train_loader = data.DataLoader(train_set, batch_size=128, shuffle=True, drop_last=True, pin_memory=True, num_workers=4)\n", "val_loader = data.DataLoader(val_set, batch_size=128, shuffle=False, drop_last=False, num_workers=4)\n", "test_loader = data.DataLoader(test_set, batch_size=128, shuffle=False, drop_last=False, num_workers=4)"]}, {"cell_type": "markdown", "id": "8392a407", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.025246, "end_time": "2021-09-16T12:42:20.962362", "exception": false, "start_time": "2021-09-16T12:42:20.937116", "status": "completed"}, "tags": []}, "source": ["A good practice is to always visualize some data examples to get an intuition of the data:"]}, {"cell_type": "code", "execution_count": 5, "id": "4c29da69", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:42:21.018762Z", "iopub.status.busy": "2021-09-16T12:42:21.018292Z", "iopub.status.idle": "2021-09-16T12:42:21.101884Z", "shell.execute_reply": "2021-09-16T12:42:21.102269Z"}, "papermill": {"duration": 0.114672, "end_time": "2021-09-16T12:42:21.102399", "exception": false, "start_time": "2021-09-16T12:42:20.987727", "status": "completed"}, 
"tags": []}, "outputs": [{"data": {"application/pdf": "JVBERi0xLjQKJazcIKu6CjEgMCBvYmoKPDwgL1BhZ2VzIDIgMCBSIC9UeXBlIC9DYXRhbG9nID4+CmVuZG9iago4IDAgb2JqCjw8IC9FeHRHU3RhdGUgNCAwIFIgL0ZvbnQgMyAwIFIgL1BhdHRlcm4gNSAwIFIKL1Byb2NTZXQgWyAvUERGIC9UZXh0IC9JbWFnZUIgL0ltYWdlQyAvSW1hZ2VJIF0gL1NoYWRpbmcgNiAwIFIKL1hPYmplY3QgNyAwIFIgPj4KZW5kb2JqCjExIDAgb2JqCjw8IC9Bbm5vdHMgMTAgMCBSIC9Db250ZW50cyA5IDAgUgovR3JvdXAgPDwgL0NTIC9EZXZpY2VSR0IgL1MgL1RyYW5zcGFyZW5jeSAvVHlwZSAvR3JvdXAgPj4KL01lZGlhQm94IFsgMCAwIDMzNS4yOTkzNTQ4Mzg3IDE3Ny40OCBdIC9QYXJlbnQgMiAwIFIgL1Jlc291cmNlcyA4IDAgUgovVHlwZSAvUGFnZSA+PgplbmRvYmoKOSAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDEyIDAgUiA+PgpzdHJlYW0KeJxNjrEOwjAMRHd/xX1BYsdpk45FlSLGsvABVQVUtAgqwe/jMgDDSb6T7XuCiXwrOK1gTKYXBAW+G5+XYTyUHYaV2PKZVCsXmkaryuz130pKLmbL+DeeiRa6I7nwkQZ2eduOWXOC1Oo44zHiiAW+DRuAGIAYAKPYpQbBVix1/H4ZZvi9oLuhp57eJg8oJwplbmRzdHJlYW0KZW5kb2JqCjEyIDAgb2JqCjE0MgplbmRvYmoKMTAgMCBvYmoKWyBdCmVuZG9iagozIDAgb2JqCjw8ID4+CmVuZG9iago0IDAgb2JqCjw8IC9BMSA8PCAvQ0EgMCAvVHlwZSAvRXh0R1N0YXRlIC9jYSAxID4+Ci9BMiA8PCAvQ0EgMSAvVHlwZSAvRXh0R1N0YXRlIC9jYSAxID4+ID4+CmVuZG9iago1IDAgb2JqCjw8ID4+CmVuZG9iago2IDAgb2JqCjw8ID4+CmVuZG9iago3IDAgb2JqCjw8IC9JMSAxMyAwIFIgPj4KZW5kb2JqCjEzIDAgb2JqCjw8IC9CaXRzUGVyQ29tcG9uZW50IDgKL0NvbG9yU3BhY2UgWy9JbmRleGVkIC9EZXZpY2VSR0IgMjIyICj////+/v79/f38/Pz7+/v6+vr5+fn4+Pj39/f19fX09PTz8/Py8vLx8fHw8PDv7+/u7u7t7e3s7Ozr6+vq6urp6eno6Ojn5+fm5ubl5eXk5OTj4+Pi4uLh4eHg4ODf39/e3t7d3d3c3Nzb29va2trZ2dnY2NjX19fW1tbV1dXU1NTT09PR0dHQ0NDPz8/Ozs7Nzc3MzMzLy8vJycnHx8fGxsbFxcXExMTDw8PCwsLBwcHAwMC/v7++vr69vb28vLy7u7u6urq5ubm4uLi3t7e2tra1tbW0tLSzs7OysrKwsLCvr6+urq6tra2srKyqqqqpqamoqKinp6elpaWkpKSioqKhoaGgoKCenp6cnJyampqZmZmYmJiXl5eWlpaVlZWUlJSTk5ORkZGPj4+NjY2Li4uKioqJiYmIiIiHh4eGhoaFhYWEhISDg4OCgoKAgIB+fn59fX18fHx7e3t5eXl4eHh3d3d2dnZ1dXV0dHRzc3NycnJxcXFwcHBvb29ubm5qampnZ2dmZmZkZGRjY2NiYmJgYGBfX19eXl5dXV1cXFxcXFxbW1taWlpZWVlYWFhXV1dWVlZVVVVUVFRTU1NRUVFQUFBPT09MTExLS0tKSkpJSUlISEhHR0dGRkZFRUVERERDQ0NCQkJBQUFAQEA/Pz8+Pj48PDw7Ozs6Ojo5OTk4ODg3Nzc1NTU0NDQzMzMyMjIxMTEwM
DAvLy8uLi4sLCwrKysqKipcKFwoXCgnJycmJiYlJSUkJCQjIyMiIiIgICAfHx8eHh4dHR0cHBwbGxsaGhoZGRkYGBgXFxcWFhYVFRUUFBQTExMSEhIREREQEBAPDw8ODg5cclxyXHIMDAwLCwtcblxuXG4JCQkICAgHBwcGBgYFBQUEBAQDAwMCAgIBAQEAAAApXQovRGVjb2RlUGFybXMgPDwgL0NvbG9ycyAxIC9Db2x1bW5zIDMyMSAvUHJlZGljdG9yIDEwID4+Ci9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9IZWlnaHQgMTY0IC9MZW5ndGggMTQgMCBSIC9TdWJ0eXBlIC9JbWFnZQovVHlwZSAvWE9iamVjdCAvV2lkdGggMzIxID4+CnN0cmVhbQp4nO2d+19M+R/HZ6ZRKWFGJRoUWdEWspVLqnHLJSqXZV1qI7llv+7azTJZwmZlKXeKWLnLZWklconUisxmhPlbvu85M6dpTufymflMzNr384c8zmVe8/48M5/z+ZxzOiP7H0KH7HMX8K8HDdKCBmlBg7SYDRqdxn8vDg3SxqFB2jg0SBuHBmnj0CBt3JdhsLa2dvTo0adPOymOFDRIi6MGHz16VFrapUsXuVwuk0VHR3d4jVI76fVarRaqmTHDKXHkoEFa0CAtDhnctGnTpEmTFK3ExMR0eI2ie9TV1cXHyxny8ujj7AIN0oIGabHDoMGg1+uLi4ujojw9PRVt6d69+86dHVyj6B5Tpkxh9Pn6+hoM9HF2gQZpITX45MmTtp9bW8g/xfn5+TKZLCODZ5PB0NLSIlyjaHWDBg1iDO60+UUKIB23Z8+ekBBoFyQmJUHJr15JxaFBW9CgOJ/FYE7O5MmThfwpFAUFBUQ1vnoVHh4O++/fb7P62rVry5cvV6kiIiKKi4VqFKnOYhDG94cOHRLdTzqusXH27NnQz7uZgFKZf8PCSktLRePQYCvONvjxY319/dq1a728eLx17Xr+/PmbJj58+EBU49On5lfu2mU06YTsy5cvL1ni7+/PZmZl2dtkBsZgfHy86E5Ecfn5YMzPz++XXzZv3swadHPz8vI6d+6ccBwabAUNEvBJDer1vP3e1KlTU1NTL160t8b9+82v79EjPT29Xz9u7MiRI/V6e5tsNG7ZskWpVMrlixcvFt6JKO7x48chIeDroqlpVVVVB0xotVpGYlBQ0MuXQnFo0Awa/FcYhMFzXt6bN28cqlGvT0pKgkGHNa5z585abUZGBrOQxdsLShisqxs+fDgznK6trRWtSjpOp9MpFMuWLbMZ2sPCli09evSAAtPShOLQoBmnGmxuboZVzNyGRa2OjIx89uyZdSf4X/+S73+2aJPhAJ6b+5UJOMiXlJQYjXPnzlWYDu0wc7SzyUBhodyC2WBR0UETR44cEXqFQFxlZaVarQ4IgEZxN715M2DAAHiH1FShODRoRIOuZxAmgjb9X3BwcFkZ9H+72gJd2sSJE3ftOnr0KHmTuZw4oVKp4B2Ep7SicVFRrMFJkyZNnz7dzY1ZgKktLPAenQXilixZwkyBeV5RVmaeJP/2m1AcGjSiQVc36OMDs8L8/OTkZO7ohgEmtgcPkjaZyzffMH2suqZGaA9Cgzz06lVRUUEYl5KSAp50Ou56mPTPnAlbhg4d+u6dUHVo0Oh8g+YhJItSqdFo2o6E29G1a3l5OVGTuTAGly5dKrwHoUH4PQa0xcfHRyaD3oc70uaNa2zs06cPeGr/Bps2bWJmdcW8Z3/RIAsadD2DUJGILz7OnDlD1GQbioqKunUbNWpUU1OT8E5EBmNjX79+bbOlrKzMzw+2VFdXS8c9f24+lWpzuG1oaMjMdHd3Z7aIVocG0eB/1CCMNLp166ZQzJC4a5LI4E8/cbfU19eHhvr5+XEnusKjGWgFO/WtqSksLJTJZJbGZfDeJGCNQ4PGT2QQpkrDhg0rLHz69Cn4io1tsykg4PLly0RNtrJjxw7mtYcPH
xbdj8hgQoLNpxgW4uPj/fzOnz9PGLdq1Sr4rHp7j2Xw94cF+P2mpo4YMcLNDQ0SxKFBVzPIOwVWqVS5JlauXMnd9MMPpE1maWiIiIiAV44eree9QkcY9+237IgafhHM+V+YyJaXjx8/HlYNHkweZzAYFi5cqFabj8mengkJCcxFdn+TzN27d4tWhwaNaND1DHLPsIoyZMiQykrSJrNYOkGFRCcoFffqFXsTNRAXF5eeDh7Y5Zwc++OYy+wHzp41Lz9/Dv9t1OoHDx6IVocG28Q5y+CVK1c0Go20vMDAwLNnDZwb6IkMJibCy3v37l1VJbWnRFxzc/PAgQM551Zh2KDT6d6/tz/Olt9/h4+06O0kaFAcNGh/nC2OGwROnTol4TArK+v48eOO1PjixYuvv4aEcePGSbdCOg4Ow4mJrDx3d/e9e4uKihyPawMzbThwQKo6NCgIlUGgvJzXXN++fc+YeMd78YqkxmvXrjE9AM+lNEfi7II8rrq6WqWCTzEadDQODdLGOcGgg0jHzZo1S6GIjY11UpxdkMfdvn2bmeKhQUfj0CBtnOsa/PPPTp06ma7jK9PT09vf8GhvnJOrs4IGaeNc1+CtW8whvV+/fvfv36ePsxPyuLdv3373nZeX1/XrUnFokB80SBvnuga/vDg0SBuHBmnj0CBtHBqkjcOnytOCBmlBg7SgQVrQIC1okBYczdDGoUHaODRIG4cGaePQIG0cGqSNQ4O0cWiQNg4N0sahQdq4T2rw3r17+SZ8fRUKBfvXk9ynCZPH2fDs2bPw8K1bt5JXd/PmzWHD5HJ5cPC0adM2btz4449Qmk6ny8iYMmVKoum2Tihx+vRFixY1NjYKx6FBNGjhizdYUjJ27NjQ0FBlKwrm7hmlUq1Wjx27evXq5mY74tqzfft2uVylUhFWd+zYsbCwsJ9/3rt3L+8bf/z48fXrkpKSDRtGjBjh7e2dklJfX88bhwbRoAVXNnjhwgXrwn7Og/WFa2xDWVmZWt1Gmo1BdiEzkzSOl4SEBLncw8ODsLrm5mapR8paePfuXW5uLvP3o7xxaFAKaoNRUXBEsi5qNBrII6mxDS9fvuzTBzzFxcXFt8Is9O/fnzXo4cFzJO0wg+QYDIYFCxagQXvjrKBBx+KsUBusqbExCPpslklrPHiQ96/tKyoqVq1aZekU16xZQxrHQa/Xx8TEmB7b2Et0P/sN3rkTHR0Nw+7Zs3kefYwGCXC+QTgWO2RQGDhQW6Z4jhs8efIk87ed27ZtE92PvLq3b99WVq5fv97Dw93dHUarf/8tFIcG+UGDtNU50WBuLhx+bdY43yB1P+hUgydOzJ8/v2fPnnI5/EhLu3v3rmgcGmwHGhThsxiMirKZFxsZgw4+gpsXZxhkv+mFyuCJE2lpacxf/UVFRSUmJp458573gSGcODTYSkcZTE7mroFBtfAJms9jMCIigt5gZKT5gSEpKW2ery0dhwZbQYMuaTAzM7P9iRhY2V4rUY28zJkzxzUM/vPP1atXV6xYERCgVCqDgoJ0uoaGBuk4NNgKGnRJg+0HzzAv1phITk6GjRqNzEKyRapdBpuakpKSmMvukODjw/MlzkRxpaVdunQBf76+Dx8+FN2TKK6uDkyuXLnS2zswMHDbNqFnExnRoBDOMwiyYGhpXYBPr6wVWIBVNTX7rZDXyHLlCnutzsfHZ8wYoRqlYgoKoCAwuHy51J52VXf3bqTp8CxyJwkaFAcNOhrHQm8QeruampoLF1hz0NXl5jJrLgifnSGvsaKiIjiYNThv3jwH41paWlJSQB/0WcInUeyvjqG+vj4yEvpY5gsyheLQoAhokKI6BjqDmZlgMMp0vR1+cOfBjhi8c+fOunXr8vJgHjxnDvzw9fVl/YWF8dwYJRHHAt0UM5geOnSo6H6EcVwaGgICAqKjo4Xj0KA4jhqsYa7QmUbMGs7pVTOc8/5SNRYXF8+bN3DgQN57t8LCwoSfSy3d5NOnT3t5gUEo9
a+/RPfkiSP58vLs7Gwo9Y8/hOLQoBRoUCyu4wwy8kRutkxO5l48EaqRXcnOfq1PFWYXBg8enJ8v9EZEHVfv3mBw5syZYl98xxO3dOlSsbvQWGDMAPGmryvhj0ODUqBBwbgONSh1tzQzspaukaG2tjbYMnQWvo9648aNhHFc9u3b5+4OTRQa9QrHTZgwQau9LvqIRhOXLl2C+LVrheLQYMcYdJz2cdXV1bzSbBYcn9WFh4czw+kXL17YWd3Vq1djYz09PaOjMzIycnJyfv21rq6O+4qqqpCQECjw4kWhODSIBr98gy0tLZmZmVZpAwYM+P77Bw8eFBQUxMQoLYNqx+fF7qZekOjbYnjimprOnTuXnR0UFARdXWgoTNXHmNBqtXkm4uLiAgOhvg0bNgjHoUHXN2hkhlT+/gsXLgSD2dk3btywNmA3A82sLikpyXGDFh4+fHj48OFHj27dupWVlWXztVkzZoh8OSsaZEGDX77BLzoODdLGoUHaODRIG4cGaePQIG0cGqSNQ4O0cWiQNg4N0sahQdo4fKo8LWiQFjRICxqkBQ3S8n+rQtglCmVuZHN0cmVhbQplbmRvYmoKMTQgMCBvYmoKMzEyNAplbmRvYmoKMiAwIG9iago8PCAvQ291bnQgMSAvS2lkcyBbIDExIDAgUiBdIC9UeXBlIC9QYWdlcyA+PgplbmRvYmoKMTUgMCBvYmoKPDwgL0NyZWF0aW9uRGF0ZSAoRDoyMDIxMDkxNjE0NDIyMSswMicwMCcpCi9DcmVhdG9yIChNYXRwbG90bGliIHYzLjQuMywgaHR0cHM6Ly9tYXRwbG90bGliLm9yZykKL1Byb2R1Y2VyIChNYXRwbG90bGliIHBkZiBiYWNrZW5kIHYzLjQuMykgPj4KZW5kb2JqCnhyZWYKMCAxNgowMDAwMDAwMDAwIDY1NTM1IGYgCjAwMDAwMDAwMTYgMDAwMDAgbiAKMDAwMDAwNDkyNiAwMDAwMCBuIAowMDAwMDAwNjU5IDAwMDAwIG4gCjAwMDAwMDA2ODAgMDAwMDAgbiAKMDAwMDAwMDc3OSAwMDAwMCBuIAowMDAwMDAwODAwIDAwMDAwIG4gCjAwMDAwMDA4MjEgMDAwMDAgbiAKMDAwMDAwMDA2NSAwMDAwMCBuIAowMDAwMDAwNDAyIDAwMDAwIG4gCjAwMDAwMDA2MzkgMDAwMDAgbiAKMDAwMDAwMDIwOCAwMDAwMCBuIAowMDAwMDAwNjE5IDAwMDAwIG4gCjAwMDAwMDA4NTMgMDAwMDAgbiAKMDAwMDAwNDkwNSAwMDAwMCBuIAowMDAwMDA0OTg2IDAwMDAwIG4gCnRyYWlsZXIKPDwgL0luZm8gMTUgMCBSIC9Sb290IDEgMCBSIC9TaXplIDE2ID4+CnN0YXJ0eHJlZgo1MTQzCiUlRU9GCg==\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:42:21.065617\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}], "source": ["def show_imgs(imgs):\n", " num_imgs = imgs.shape[0] if isinstance(imgs, torch.Tensor) else len(imgs)\n", " nrow = min(num_imgs, 4)\n", " ncol = int(math.ceil(num_imgs / nrow))\n", " imgs = torchvision.utils.make_grid(imgs, nrow=nrow, pad_value=128)\n", " imgs = imgs.clamp(min=0, max=255)\n", " np_imgs = imgs.cpu().numpy()\n", " plt.figure(figsize=(1.5 * nrow, 1.5 * ncol))\n", " plt.imshow(np.transpose(np_imgs, (1, 2, 0)), interpolation=\"nearest\")\n", " plt.axis(\"off\")\n", " plt.show()\n", " plt.close()\n", "\n", "\n", "show_imgs([train_set[i][0] for i in range(8)])"]}, {"cell_type": "markdown", "id": "353ee95b", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.026067, "end_time": "2021-09-16T12:42:21.155368", "exception": false, "start_time": "2021-09-16T12:42:21.129301", "status": "completed"}, "tags": []}, "source": ["## Masked autoregressive convolutions\n", "\n", "The core module of PixelCNN is its masked convolutions.\n", "In contrast to language models, we don't apply an LSTM on each pixel one-by-one.\n", "This would be inefficient because images are grids instead of sequences.\n", "Thus, it is better to rely on convolutions that have shown great success in deep CNN classification models.\n", "\n", "Nevertheless, we cannot just apply standard convolutions without any changes.\n", "Remember that during training of autoregressive models, we want to use teacher forcing which both helps the model training, and significantly reduces the time needed for training.\n", "For image modeling, teacher forcing is implemented by using a training image as input to the model, and we want to obtain as output the prediction for each pixel based on *only* its predecessors.\n", "Thus, we need to ensure that the prediction for a specific pixel can only be influenced by its predecessors and not by its own value or any \"future\" pixels.\n", "For this, we apply 
convolutions with a mask.\n", "\n", "Which mask we use depends on the ordering of pixels we decide on, i.e. which is the first pixel we predict,\n", "which is the second one, etc.\n", "The most commonly used ordering is to denote the upper left pixel as the start pixel,\n", "and sort the pixels row by row, as shown in the visualization at the top of the tutorial.\n", "Thus, the second pixel is on the right of the first one (first row, second column),\n", "and once we reach the end of the row, we start in the second row, first column.\n", "If we now want to apply this to our convolutions, we need to ensure that the prediction of pixel 1\n", "is influenced neither by its own \"true\" input, nor by any pixel on its right or in any lower row.\n", "In convolutions, this means that we want to set those entries of the weight matrix to zero that take pixels on the right and below into account.\n", "As an example for a 5x5 kernel, see the mask below (figure credit - [Aaron van den Oord](https://arxiv.org/pdf/1606.05328.pdf)):\n", "\n", "
\n", "\n", "Before looking into the application of masked convolutions in PixelCNN\n", "in detail, let's first implement a module that allows us to apply an\n", "arbitrary mask to a convolution:"]}, {"cell_type": "code", "execution_count": 6, "id": "7f373c01", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:42:21.215016Z", "iopub.status.busy": "2021-09-16T12:42:21.214539Z", "iopub.status.idle": "2021-09-16T12:42:21.216213Z", "shell.execute_reply": "2021-09-16T12:42:21.216588Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 0.033688, "end_time": "2021-09-16T12:42:21.216710", "exception": false, "start_time": "2021-09-16T12:42:21.183022", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class MaskedConvolution(nn.Module):\n", " def __init__(self, c_in, c_out, mask, **kwargs):\n", " \"\"\"Implements a convolution with mask applied on its weights.\n", "\n", " Args:\n", " c_in: Number of input channels\n", " c_out: Number of output channels\n", " mask: Tensor of shape [kernel_size_H, kernel_size_W] with 0s where\n", " the convolution should be masked, and 1s otherwise.\n", " kwargs: Additional arguments for the convolution\n", " \"\"\"\n", " super().__init__()\n", " # For simplicity: calculate padding automatically\n", " kernel_size = (mask.shape[0], mask.shape[1])\n", " dilation = 1 if \"dilation\" not in kwargs else kwargs[\"dilation\"]\n", " padding = tuple(dilation * (kernel_size[i] - 1) // 2 for i in range(2))\n", " # Actual convolution\n", " self.conv = nn.Conv2d(c_in, c_out, kernel_size, padding=padding, **kwargs)\n", "\n", " # Mask as buffer => it is no parameter but still a tensor of the module\n", " # (must be moved with the devices)\n", " self.register_buffer(\"mask\", mask[None, None])\n", "\n", " def forward(self, x):\n", " self.conv.weight.data *= self.mask # Ensures zero's at masked positions\n", " return self.conv(x)"]}, {"cell_type": "markdown", "id": "ab31353f", "metadata": {"lines_to_next_cell": 2, "papermill": 
{"duration": 0.026241, "end_time": "2021-09-16T12:42:21.269129", "exception": false, "start_time": "2021-09-16T12:42:21.242888", "status": "completed"}, "tags": []}, "source": ["### Vertical and horizontal convolution stacks\n", "\n", "To build our own autoregressive image model, we could simply stack a few masked convolutions on top of each other.\n", "This was actually the case for the original PixelCNN model, discussed in the paper\n", "[Pixel Recurrent Neural Networks](https://arxiv.org/pdf/1601.06759.pdf), but this leads to a considerable issue.\n", "When sequentially applying a couple of masked convolutions, the receptive field of a pixel\n", "turns out to have a \"blind spot\" on the upper right side, as shown in the figure below\n", "(figure credit - [Aaron van den Oord et al.](https://arxiv.org/pdf/1606.05328.pdf)):\n", "\n", "
\n", "\n", "Although a pixel should be able to take into account all other pixels above and left of it,\n", "a stack of masked convolutions does not allow us to look to the upper pixels on the right.\n", "This is because the features of the pixels above, which we use for convolution,\n", "do not contain any information of the pixels on the right of the same row.\n", "If they did, we would be \"cheating\" and actually looking into the future.\n", "To overcome this issue, van den Oord et al. [2]\n", "proposed to split the convolutions into a vertical and a horizontal stack.\n", "The vertical stack looks at all pixels above the current one, while the horizontal stack takes into account all pixels on the left.\n", "While keeping both of them separate, we can actually look at the pixels on the right with the vertical stack without breaking any of our assumptions.\n", "The two convolutions are also shown in the figure above.\n", "\n", "Let us implement them here as follows:"]}, {"cell_type": "code", "execution_count": 7, "id": "08032e0c", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:42:21.326679Z", "iopub.status.busy": "2021-09-16T12:42:21.323108Z", "iopub.status.idle": "2021-09-16T12:42:21.329089Z", "shell.execute_reply": "2021-09-16T12:42:21.328692Z"}, "papermill": {"duration": 0.033791, "end_time": "2021-09-16T12:42:21.329186", "exception": false, "start_time": "2021-09-16T12:42:21.295395", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class VerticalStackConvolution(MaskedConvolution):\n", " def __init__(self, c_in, c_out, kernel_size=3, mask_center=False, **kwargs):\n", " # Mask out all pixels below. 
For efficiency, we could also reduce the kernel\n", " # size in height, but for simplicity, we stick with masking here.\n", " mask = torch.ones(kernel_size, kernel_size)\n", " mask[kernel_size // 2 + 1 :, :] = 0\n", "\n", " # For the very first convolution, we will also mask the center row\n", " if mask_center:\n", " mask[kernel_size // 2, :] = 0\n", "\n", " super().__init__(c_in, c_out, mask, **kwargs)\n", "\n", "\n", "class HorizontalStackConvolution(MaskedConvolution):\n", " def __init__(self, c_in, c_out, kernel_size=3, mask_center=False, **kwargs):\n", " # Mask out all pixels on the right. Note that our kernel has a size of 1\n", " # in height because we only look at the pixels in the same row.\n", " mask = torch.ones(1, kernel_size)\n", " mask[0, kernel_size // 2 + 1 :] = 0\n", "\n", " # For the very first convolution, we will also mask the center pixel\n", " if mask_center:\n", " mask[0, kernel_size // 2] = 0\n", "\n", " super().__init__(c_in, c_out, mask, **kwargs)"]}, {"cell_type": "markdown", "id": "4d152ec5", "metadata": {"papermill": {"duration": 0.026372, "end_time": "2021-09-16T12:42:21.381597", "exception": false, "start_time": "2021-09-16T12:42:21.355225", "status": "completed"}, "tags": []}, "source": ["Note that we have an input argument called `mask_center`. Remember that\n", "the input to the model is the actual input image. Hence, the very first\n", "convolution we apply cannot use the center pixel as input, but must be\n", "masked. All subsequent convolutions, however, should use the center\n", "pixel as we otherwise lose the features of the previous layer. 
Hence,\n", "the input argument `mask_center` is True for the very first\n", "convolutions, and False for all others."]}, {"cell_type": "markdown", "id": "cd8536aa", "metadata": {"papermill": {"duration": 0.026279, "end_time": "2021-09-16T12:42:21.434188", "exception": false, "start_time": "2021-09-16T12:42:21.407909", "status": "completed"}, "tags": []}, "source": ["### Visualizing the receptive field\n", "\n", "To validate our implementation of masked convolutions, we can visualize the receptive field we obtain with such convolutions.\n", "We should see that with increasing number of convolutional layers, the receptive field grows in both vertical and horizontal direction, without the issue of a blind spot.\n", "The receptive field can be empirically measured by backpropagating an arbitrary loss for the output features of a speicifc pixel with respect to the input.\n", "We implement this idea below, and visualize the receptive field below."]}, {"cell_type": "code", "execution_count": 8, "id": "52423559", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:42:21.493549Z", "iopub.status.busy": "2021-09-16T12:42:21.493069Z", "iopub.status.idle": "2021-09-16T12:42:21.641737Z", "shell.execute_reply": "2021-09-16T12:42:21.641316Z"}, "papermill": {"duration": 0.181442, "end_time": "2021-09-16T12:42:21.641845", "exception": false, "start_time": "2021-09-16T12:42:21.460403", "status": "completed"}, "tags": []}, "outputs": [{"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:42:21.570580\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}], "source": ["inp_img = torch.zeros(1, 1, 11, 11)\n", "inp_img.requires_grad_()\n", "\n", "\n", "def show_center_recep_field(img, out):\n", " \"\"\"Calculates the gradients of the input with respect to the output center pixel, and visualizes the overall\n", " receptive field.\n", "\n", " Args:\n", " img: Input image for which we want to calculate the receptive field on.\n", " out: Output features/loss which is used for backpropagation, and should be\n", " the output of the network/computation graph.\n", " \"\"\"\n", " # Determine gradients\n", " loss = out[0, :, img.shape[2] // 2, img.shape[3] // 2].sum() # L1 loss for simplicity\n", " # Retain graph as we want to stack multiple layers and show the receptive field of all of them\n", " loss.backward(retain_graph=True)\n", " img_grads = img.grad.abs()\n", " img.grad.fill_(0) # Reset grads\n", "\n", " # Plot receptive field\n", " img = img_grads.squeeze().cpu().numpy()\n", " fig, ax = plt.subplots(1, 2)\n", " _ = ax[0].imshow(img)\n", " ax[1].imshow(img > 0)\n", " # Mark the center pixel in red if it doesn't have any gradients (should be\n", " # the case for standard autoregressive models)\n", " show_center = img[img.shape[0] // 2, img.shape[1] // 2] == 0\n", " if show_center:\n", " center_pixel = np.zeros(img.shape + (4,))\n", " center_pixel[center_pixel.shape[0] // 2, center_pixel.shape[1] // 2, :] = np.array([1.0, 0.0, 0.0, 1.0])\n", " for i in range(2):\n", " ax[i].axis(\"off\")\n", " if show_center:\n", " ax[i].imshow(center_pixel)\n", " ax[0].set_title(\"Weighted receptive field\")\n", " ax[1].set_title(\"Binary receptive field\")\n", " plt.show()\n", " plt.close()\n", "\n", "\n", "show_center_recep_field(inp_img, inp_img)"]}, {"cell_type": "markdown", "id": "e9b19d4a", "metadata": {"papermill": {"duration": 0.027207, "end_time": "2021-09-16T12:42:21.696690", "exception": false, "start_time": "2021-09-16T12:42:21.669483", "status": 
"completed"}, "tags": []}, "source": ["Let's first visualize the receptive field of a horizontal convolution\n", "without the center pixel. We use a small, arbitrary input image\n", "($11\\times 11$ pixels), and calculate the loss for the center pixel. For\n", "simplicity, we initialize all weights with 1 and the bias with 0, and\n", "use a single channel. This is sufficient for our visualization purposes."]}, {"cell_type": "code", "execution_count": 9, "id": "ad09d7c8", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:42:21.755609Z", "iopub.status.busy": "2021-09-16T12:42:21.755136Z", "iopub.status.idle": "2021-09-16T12:42:21.910953Z", "shell.execute_reply": "2021-09-16T12:42:21.910478Z"}, "papermill": {"duration": 0.18684, "end_time": "2021-09-16T12:42:21.911059", "exception": false, "start_time": "2021-09-16T12:42:21.724219", "status": "completed"}, "tags": []}, "outputs": [{"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:42:21.840084\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}], "source": ["horiz_conv = HorizontalStackConvolution(c_in=1, c_out=1, kernel_size=3, mask_center=True)\n", "horiz_conv.conv.weight.data.fill_(1)\n", "horiz_conv.conv.bias.data.fill_(0)\n", "horiz_img = horiz_conv(inp_img)\n", "show_center_recep_field(inp_img, horiz_img)"]}, {"cell_type": "markdown", "id": "a4151321", "metadata": {"papermill": {"duration": 0.02825, "end_time": "2021-09-16T12:42:21.967945", "exception": false, "start_time": "2021-09-16T12:42:21.939695", "status": "completed"}, "tags": []}, "source": ["The receptive field is shown in yellow, the center pixel in red, and all other pixels outside of the receptive field are dark blue.\n", "As expected, the receptive field of a single horizontal convolution with the center pixel masked and a $3\\times3$ kernel is only the pixel on the left.\n", "If we use a larger kernel size, more pixels would be taken into account on the left.\n", "\n", "Next, let's take a look at the vertical convolution:"]}, {"cell_type": "code", "execution_count": 10, "id": "4d7db603", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:42:22.028223Z", "iopub.status.busy": "2021-09-16T12:42:22.026790Z", "iopub.status.idle": "2021-09-16T12:42:22.183299Z", "shell.execute_reply": "2021-09-16T12:42:22.182815Z"}, "papermill": {"duration": 0.186816, "end_time": "2021-09-16T12:42:22.183411", "exception": false, "start_time": "2021-09-16T12:42:21.996595", "status": "completed"}, "tags": []}, "outputs": [{"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:42:22.111784\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}], "source": ["vert_conv = VerticalStackConvolution(c_in=1, c_out=1, kernel_size=3, mask_center=True)\n", "vert_conv.conv.weight.data.fill_(1)\n", "vert_conv.conv.bias.data.fill_(0)\n", "vert_img = vert_conv(inp_img)\n", "show_center_recep_field(inp_img, vert_img)"]}, {"cell_type": "markdown", "id": "f506aec8", "metadata": {"papermill": {"duration": 0.029554, "end_time": "2021-09-16T12:42:22.243059", "exception": false, "start_time": "2021-09-16T12:42:22.213505", "status": "completed"}, "tags": []}, "source": ["The vertical convolution takes all pixels above into account. Combining\n", "these two, we get the L-shaped receptive field of the original masked\n", "convolution:"]}, {"cell_type": "code", "execution_count": 11, "id": "63b459cc", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:42:22.305232Z", "iopub.status.busy": "2021-09-16T12:42:22.304151Z", "iopub.status.idle": "2021-09-16T12:42:22.458303Z", "shell.execute_reply": "2021-09-16T12:42:22.457833Z"}, "papermill": {"duration": 0.185539, "end_time": "2021-09-16T12:42:22.458405", "exception": false, "start_time": "2021-09-16T12:42:22.272866", "status": "completed"}, "tags": []}, "outputs": [{"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:42:22.388054\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}], "source": ["horiz_img = vert_img + horiz_img\n", "show_center_recep_field(inp_img, horiz_img)"]}, {"cell_type": "markdown", "id": "62da8fad", "metadata": {"papermill": {"duration": 0.030338, "end_time": "2021-09-16T12:42:22.519399", "exception": false, "start_time": "2021-09-16T12:42:22.489061", "status": "completed"}, "tags": []}, "source": ["If we stack multiple horizontal and vertical convolutions, we need to take two aspects into account:\n", "\n", "1. The center should not be masked anymore for the following convolutions as the features at the pixel's position are already independent of its actual value.\n", "If it is hard to imagine why we can do this, just change the value below to `mask_center=True` and see what happens.\n", "2. The vertical convolution is not allowed to work on features from the horizontal convolution.\n", "In the feature map of the horizontal convolutions, a pixel contains information about all of the \"true\" pixels on the left.\n", "If we apply a vertical convolution which also uses features from the right, we effectively expand our receptive field to the true input which we want to prevent.\n", "Thus, the feature maps can only be merged for the horizontal convolution.\n", "\n", "Using this, we can stack the convolutions in the following way. We have\n", "two feature streams: one for the vertical stack, and one for the\n", "horizontal stack. The horizontal convolutions can operate on the joint\n", "features of the previous horizontal and vertical convolutions, while\n", "the vertical stack only takes its own previous features as input. For a\n", "quick implementation, we can therefore sum the horizontal and vertical\n", "output features at each layer, and use those as final output features to\n", "calculate the loss on. An implementation of 4 consecutive layers is\n", "shown below. 
Note that we reuse the features from the other convolutions\n", "with `mask_center=True` from above."]}, {"cell_type": "code", "execution_count": 12, "id": "f6dcdf70", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:42:22.585305Z", "iopub.status.busy": "2021-09-16T12:42:22.584833Z", "iopub.status.idle": "2021-09-16T12:42:23.217060Z", "shell.execute_reply": "2021-09-16T12:42:23.216574Z"}, "papermill": {"duration": 0.666981, "end_time": "2021-09-16T12:42:23.217176", "exception": false, "start_time": "2021-09-16T12:42:22.550195", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Layer 2\n"]}, {"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:42:22.673112\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}, {"name": "stdout", "output_type": "stream", "text": ["Layer 3\n"]}, {"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:42:22.838845\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}, {"name": "stdout", "output_type": "stream", "text": ["Layer 4\n"]}, {"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:42:22.991369\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}, {"name": "stdout", "output_type": "stream", "text": ["Layer 5\n"]}, {"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:42:23.145226\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}], "source": ["# Initialize convolutions with equal weight to all input pixels\n", "horiz_conv = HorizontalStackConvolution(c_in=1, c_out=1, kernel_size=3, mask_center=False)\n", "horiz_conv.conv.weight.data.fill_(1)\n", "horiz_conv.conv.bias.data.fill_(0)\n", "vert_conv = VerticalStackConvolution(c_in=1, c_out=1, kernel_size=3, mask_center=False)\n", "vert_conv.conv.weight.data.fill_(1)\n", "vert_conv.conv.bias.data.fill_(0)\n", "\n", "# We reuse our convolutions for the 4 layers here. Note that in a standard network,\n", "# we don't do that, and instead learn 4 separate convolution. As this cell is only for\n", "# visualization purposes, we reuse the convolutions for all layers.\n", "for l_idx in range(4):\n", " vert_img = vert_conv(vert_img)\n", " horiz_img = horiz_conv(horiz_img) + vert_img\n", " print(\"Layer %i\" % (l_idx + 2))\n", " show_center_recep_field(inp_img, horiz_img)"]}, {"cell_type": "markdown", "id": "0fb070de", "metadata": {"papermill": {"duration": 0.035948, "end_time": "2021-09-16T12:42:23.289214", "exception": false, "start_time": "2021-09-16T12:42:23.253266", "status": "completed"}, "tags": []}, "source": ["The receptive field above it visualized for the horizontal stack, which includes the features of the vertical convolutions.\n", "It grows over layers without any blind spot as we had before.\n", "The difference between \"weighted\" and \"binary\" receptive field is that for the latter, we check whether there are any gradients flowing back to this pixel.\n", "This indicates that the center pixel indeed can use information from this pixel.\n", "Nevertheless, due to the convolution weights, some pixels have a stronger effect on the prediction than others.\n", "This is visualized in the weighted receptive field by plotting the gradient magnitude for each pixel instead of a binary yes/no.\n", "\n", "\n", "Another receptive field we can check is the one for the 
vertical stack\n", "as the one above is for the horizontal stack. Let's visualize it below:"]}, {"cell_type": "code", "execution_count": 13, "id": "cd0487f2", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:42:23.363786Z", "iopub.status.busy": "2021-09-16T12:42:23.363266Z", "iopub.status.idle": "2021-09-16T12:42:23.517870Z", "shell.execute_reply": "2021-09-16T12:42:23.517438Z"}, "papermill": {"duration": 0.193071, "end_time": "2021-09-16T12:42:23.517983", "exception": false, "start_time": "2021-09-16T12:42:23.324912", "status": "completed"}, "tags": []}, "outputs": [{"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:42:23.446589\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}], "source": ["show_center_recep_field(inp_img, vert_img)"]}, {"cell_type": "markdown", "id": "bbe7c460", "metadata": {"papermill": {"duration": 0.036988, "end_time": "2021-09-16T12:42:23.591980", "exception": false, "start_time": "2021-09-16T12:42:23.554992", "status": "completed"}, "tags": []}, "source": ["As we have discussed before, the vertical stack only looks at pixels above the one we want to predict.\n", "Hence, we can validate that our implementation works as we initially expected it to.\n", "As a final step, let's clean up the computation graph we still had kept\n", "in memory for the visualization of the receptive field:"]}, {"cell_type": "code", "execution_count": 14, "id": "e76aa938", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:42:23.668813Z", "iopub.status.busy": "2021-09-16T12:42:23.668347Z", "iopub.status.idle": "2021-09-16T12:42:23.670487Z", "shell.execute_reply": "2021-09-16T12:42:23.670021Z"}, "papermill": {"duration": 0.041448, "end_time": "2021-09-16T12:42:23.670586", "exception": false, "start_time": "2021-09-16T12:42:23.629138", "status": "completed"}, "tags": []}, "outputs": [], "source": ["del inp_img, horiz_conv, vert_conv"]}, {"cell_type": "markdown", "id": "193e3fb4", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.037077, "end_time": "2021-09-16T12:42:23.744338", "exception": false, "start_time": "2021-09-16T12:42:23.707261", "status": "completed"}, "tags": []}, "source": ["## Gated PixelCNN\n", "\n", "
\n", "\n", "In the next step, we will use the masked convolutions to build a full autoregressive model, called Gated PixelCNN.\n", "The difference between the original PixelCNN and Gated PixelCNN is the use of separate horizontal and vertical stacks.\n", "However, in the literature, you often see that people refer to the Gated PixelCNN simply as \"PixelCNN\".\n", "Hence, in the following, if we say \"PixelCNN\", we usually mean the gated version.\n", "What \"Gated\" refers to in the model name is explained next.\n", "\n", "### Gated Convolutions\n", "\n", "For visualizing the receptive field, we assumed a very simplified stack of vertical and horizontal convolutions.\n", "Obviously, there are more sophisticated ways of doing it, and PixelCNN uses gated convolutions for this.\n", "Specifically, the Gated Convolution block in PixelCNN looks as follows\n", "(figure credit - [Aaron van den Oord et al.](https://arxiv.org/pdf/1606.05328.pdf)):\n", "\n", "
\n", "\n", "The left path is the vertical stack (the $N\\times N$ convolution is masked correspondingly),\n", "and the right path is the horizontal stack.\n", "Gated convolutions are implemented by having a twice as large output channel size,\n", "and combine them by an element-wise multiplication of $\\tanh$ and a sigmoid.\n", "For a linear layer, we can express a gated activation unit as follows:\n", "\n", "$$\\mathbf{y} = \\tanh\\left(\\mathbf{W}_{f}\\mathbf{x}\\right)\\odot\\sigma\\left(\\mathbf{W}_{g}\\mathbf{x}\\right)$$\n", "\n", "For simplicity, biases have been neglected and the linear layer split into two parts, $\\mathbf{W}_{f}$ and $\\mathbf{W}_{g}$.\n", "This concept resembles the input and modulation gate in an LSTM, and has been used in many other architectures as well.\n", "The main motivation behind this gated activation is that it might allow modeling more complex interactions and simplify learning.\n", "But as in any other architecture, this is mostly a design choice and can be considered a hyperparameter.\n", "\n", "Besides the gated convolutions, we also see that the horizontal stack uses a residual connection while the vertical stack does not.\n", "This is because we use the output of the horizontal stack for prediction.\n", "Each convolution in the vertical stack also receives a strong gradient signal\n", "as it is only two $1\\times 1$ convolutions away from the residual connection,\n", "and does not require another residual connection to all its earlier layers.\n", "\n", "The implementation in PyTorch is fairly straightforward for this block,\n", "because the visualization above gives us a computation graph to follow:"]}, {"cell_type": "code", "execution_count": 15, "id": "cc9d393c", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:42:23.919095Z", "iopub.status.busy": "2021-09-16T12:42:23.918572Z", "iopub.status.idle": "2021-09-16T12:42:23.920520Z", "shell.execute_reply": "2021-09-16T12:42:23.920095Z"}, 
"lines_to_next_cell": 2, "papermill": {"duration": 0.138888, "end_time": "2021-09-16T12:42:23.920638", "exception": false, "start_time": "2021-09-16T12:42:23.781750", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class GatedMaskedConv(nn.Module):\n", " def __init__(self, c_in, **kwargs):\n", " \"\"\"Gated Convolution block implemented the computation graph shown above.\"\"\"\n", " super().__init__()\n", " self.conv_vert = VerticalStackConvolution(c_in, c_out=2 * c_in, **kwargs)\n", " self.conv_horiz = HorizontalStackConvolution(c_in, c_out=2 * c_in, **kwargs)\n", " self.conv_vert_to_horiz = nn.Conv2d(2 * c_in, 2 * c_in, kernel_size=1, padding=0)\n", " self.conv_horiz_1x1 = nn.Conv2d(c_in, c_in, kernel_size=1, padding=0)\n", "\n", " def forward(self, v_stack, h_stack):\n", " # Vertical stack (left)\n", " v_stack_feat = self.conv_vert(v_stack)\n", " v_val, v_gate = v_stack_feat.chunk(2, dim=1)\n", " v_stack_out = torch.tanh(v_val) * torch.sigmoid(v_gate)\n", "\n", " # Horizontal stack (right)\n", " h_stack_feat = self.conv_horiz(h_stack)\n", " h_stack_feat = h_stack_feat + self.conv_vert_to_horiz(v_stack_feat)\n", " h_val, h_gate = h_stack_feat.chunk(2, dim=1)\n", " h_stack_feat = torch.tanh(h_val) * torch.sigmoid(h_gate)\n", " h_stack_out = self.conv_horiz_1x1(h_stack_feat)\n", " h_stack_out = h_stack_out + h_stack\n", "\n", " return v_stack_out, h_stack_out"]}, {"cell_type": "markdown", "id": "2b8ce7cc", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.037081, "end_time": "2021-09-16T12:42:23.995828", "exception": false, "start_time": "2021-09-16T12:42:23.958747", "status": "completed"}, "tags": []}, "source": ["### Building the model\n", "\n", "Using the gated convolutions, we can now build our PixelCNN model.\n", "The architecture consists of multiple stacked GatedMaskedConv blocks, where we add an additional dilation factor to a few convolutions.\n", "This is used to increase the receptive field of the model and allows to take 
a larger context into account during generation.\n", "As a reminder, dilation on a convolution works as follows\n", "(figure credit - [Vincent Dumoulin and Francesco Visin](https://arxiv.org/pdf/1603.07285.pdf)):\n", "\n", "
\n", "\n", "Note that the smaller output size is only because the animation assumes no padding.\n", "In our implementation, we will pad the input image correspondingly.\n", "As an alternative to dilated convolutions, we could downsample the input and use an encoder-decoder architecture as in PixelCNN++ [3].\n", "This is especially beneficial if we want to build a very deep autoregressive model.\n", "Nonetheless, as we seek to train a reasonably small model, dilated convolutions are the more efficient option to use here.\n", "\n", "Below, we implement the PixelCNN model as a PyTorch Lightning module.\n", "Besides the stack of gated convolutions, we also have the initial\n", "horizontal and vertical convolutions which mask the center pixel, and a\n", "final $1\\times 1$ convolution which maps the output features to class\n", "predictions. To determine the likelihood of a batch of images, we first\n", "create our initial features using the masked horizontal and vertical\n", "input convolutions. Next, we forward the features through the stack of\n", "gated convolutions. Finally, we take the output features of the\n", "horizontal stack, and apply the $1\\times 1$ convolution for\n", "classification. 
We use the bits per dimension metric for the likelihood,\n", "similarly to Tutorial 11 and assignment 3."]}, {"cell_type": "code", "execution_count": 16, "id": "16fca558", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:42:24.082322Z", "iopub.status.busy": "2021-09-16T12:42:24.081826Z", "iopub.status.idle": "2021-09-16T12:42:24.084319Z", "shell.execute_reply": "2021-09-16T12:42:24.083832Z"}, "papermill": {"duration": 0.051889, "end_time": "2021-09-16T12:42:24.084419", "exception": false, "start_time": "2021-09-16T12:42:24.032530", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class PixelCNN(pl.LightningModule):\n", " def __init__(self, c_in, c_hidden):\n", " super().__init__()\n", " self.save_hyperparameters()\n", "\n", " # Initial convolutions skipping the center pixel\n", " self.conv_vstack = VerticalStackConvolution(c_in, c_hidden, mask_center=True)\n", " self.conv_hstack = HorizontalStackConvolution(c_in, c_hidden, mask_center=True)\n", " # Convolution block of PixelCNN. 
We use dilation instead of downscaling\n", " self.conv_layers = nn.ModuleList(\n", " [\n", " GatedMaskedConv(c_hidden),\n", " GatedMaskedConv(c_hidden, dilation=2),\n", " GatedMaskedConv(c_hidden),\n", " GatedMaskedConv(c_hidden, dilation=4),\n", " GatedMaskedConv(c_hidden),\n", " GatedMaskedConv(c_hidden, dilation=2),\n", " GatedMaskedConv(c_hidden),\n", " ]\n", " )\n", " # Output classification convolution (1x1)\n", " self.conv_out = nn.Conv2d(c_hidden, c_in * 256, kernel_size=1, padding=0)\n", "\n", " self.example_input_array = train_set[0][0][None]\n", "\n", " def forward(self, x):\n", " \"\"\"Forward image through model and return logits for each pixel.\n", "\n", " Args:\n", " x: Image tensor with integer values between 0 and 255.\n", " \"\"\"\n", " # Scale input from 0 to 255 back to -1 to 1\n", " x = (x.float() / 255.0) * 2 - 1\n", "\n", " # Initial convolutions\n", " v_stack = self.conv_vstack(x)\n", " h_stack = self.conv_hstack(x)\n", " # Gated Convolutions\n", " for layer in self.conv_layers:\n", " v_stack, h_stack = layer(v_stack, h_stack)\n", " # 1x1 classification convolution\n", " # Apply ELU before 1x1 convolution for non-linearity on residual connection\n", " out = self.conv_out(F.elu(h_stack))\n", "\n", " # Output dimensions: [Batch, Classes, Channels, Height, Width]\n", " out = out.reshape(out.shape[0], 256, out.shape[1] // 256, out.shape[2], out.shape[3])\n", " return out\n", "\n", " def calc_likelihood(self, x):\n", " # Forward pass with bpd likelihood calculation\n", " pred = self.forward(x)\n", " nll = F.cross_entropy(pred, x, reduction=\"none\")\n", " bpd = nll.mean(dim=[1, 2, 3]) * np.log2(np.exp(1))\n", " return bpd.mean()\n", "\n", " @torch.no_grad()\n", " def sample(self, img_shape, img=None):\n", " \"\"\"Sampling function for the autoregressive model.\n", "\n", " Args:\n", " img_shape: Shape of the image to generate (B,C,H,W)\n", " img (optional): If given, this tensor will be used as\n", " a starting image. 
The pixels to fill\n", " should be -1 in the input tensor.\n", " \"\"\"\n", " # Create empty image\n", " if img is None:\n", " img = torch.zeros(img_shape, dtype=torch.long).to(device) - 1\n", " # Generation loop\n", " for h in tqdm(range(img_shape[2]), leave=False):\n", " for w in range(img_shape[3]):\n", " for c in range(img_shape[1]):\n", " # Skip if not to be filled (-1)\n", " if (img[:, c, h, w] != -1).all().item():\n", " continue\n", " # For efficiency, we only have to input the upper part of the image\n", " # as all other parts will be skipped by the masked convolutions anyways\n", " pred = self.forward(img[:, :, : h + 1, :])\n", " probs = F.softmax(pred[:, :, c, h, w], dim=-1)\n", " img[:, c, h, w] = torch.multinomial(probs, num_samples=1).squeeze(dim=-1)\n", " return img\n", "\n", " def configure_optimizers(self):\n", " optimizer = optim.Adam(self.parameters(), lr=1e-3)\n", " scheduler = optim.lr_scheduler.StepLR(optimizer, 1, gamma=0.99)\n", " return [optimizer], [scheduler]\n", "\n", " def training_step(self, batch, batch_idx):\n", " loss = self.calc_likelihood(batch[0])\n", " self.log(\"train_bpd\", loss)\n", " return loss\n", "\n", " def validation_step(self, batch, batch_idx):\n", " loss = self.calc_likelihood(batch[0])\n", " self.log(\"val_bpd\", loss)\n", "\n", " def test_step(self, batch, batch_idx):\n", " loss = self.calc_likelihood(batch[0])\n", " self.log(\"test_bpd\", loss)"]}, {"cell_type": "markdown", "id": "0a771ffa", "metadata": {"papermill": {"duration": 0.037059, "end_time": "2021-09-16T12:42:24.159136", "exception": false, "start_time": "2021-09-16T12:42:24.122077", "status": "completed"}, "tags": []}, "source": ["To sample from the autoregressive model, we need to iterate over all dimensions of the input.\n", "We start with an empty image, and fill the pixels one by one, starting from the upper left corner.\n", "Note that as for predicting $x_i$, all pixels below it have no influence on the prediction.\n", "Hence, we can cut the image 
in height without changing the prediction while increasing efficiency.\n", "Nevertheless, all the loops in the sampling function already show that it will take us quite some time to sample.\n", "A lot of computation could be reused across loop iterations as those the features on the already predicted pixels will not change over iterations.\n", "Nevertheless, this takes quite some effort to implement, and is often not done in implementations because in the end,\n", "autoregressive sampling remains sequential and slow.\n", "Hence, we settle with the default implementation here.\n", "\n", "Before training the model, we can check the full receptive field of the model on an MNIST image of size $28\\times 28$:"]}, {"cell_type": "code", "execution_count": 17, "id": "546c40c3", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:42:24.236461Z", "iopub.status.busy": "2021-09-16T12:42:24.236001Z", "iopub.status.idle": "2021-09-16T12:42:24.487057Z", "shell.execute_reply": "2021-09-16T12:42:24.486641Z"}, "papermill": {"duration": 0.291233, "end_time": "2021-09-16T12:42:24.487172", "exception": false, "start_time": "2021-09-16T12:42:24.195939", "status": "completed"}, "tags": []}, "outputs": [{"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:42:24.416262\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}], "source": ["test_model = PixelCNN(c_in=1, c_hidden=64)\n", "inp = torch.zeros(1, 1, 28, 28)\n", "inp.requires_grad_()\n", "out = test_model(inp)\n", "show_center_recep_field(inp, out.squeeze(dim=2))\n", "del inp, out, test_model"]}, {"cell_type": "markdown", "id": "7b3910fe", "metadata": {"papermill": {"duration": 0.038084, "end_time": "2021-09-16T12:42:24.563987", "exception": false, "start_time": "2021-09-16T12:42:24.525903", "status": "completed"}, "tags": []}, "source": ["The visualization shows that for predicting any pixel, we can take almost half of the image into account.\n", "However, keep in mind that this is the \"theoretical\" receptive field and not necessarily\n", "the [effective receptive field](https://arxiv.org/pdf/1701.04128.pdf), which is usually much smaller.\n", "For a stronger model, we should therefore try to increase the receptive\n", "field even further. Especially, for the pixel on the bottom right, the\n", "very last pixel, we would be allowed to take into account the whole\n", "image. However, our current receptive field only spans across 1/4 of the\n", "image. An encoder-decoder architecture can help with this, but it also\n", "shows that we require a much deeper, more complex network in\n", "autoregressive models than in VAEs or energy-based models."]}, {"cell_type": "markdown", "id": "af3db43c", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.039876, "end_time": "2021-09-16T12:42:24.641944", "exception": false, "start_time": "2021-09-16T12:42:24.602068", "status": "completed"}, "tags": []}, "source": ["### Training loop\n", "\n", "To train the model, we again can rely on PyTorch Lightning and write a\n", "function below for loading the pretrained model if it exists. 
To reduce\n", "the computational cost, we have saved the validation and test score in\n", "the checkpoint already:"]}, {"cell_type": "code", "execution_count": 18, "id": "386d2b64", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:42:24.724459Z", "iopub.status.busy": "2021-09-16T12:42:24.723984Z", "iopub.status.idle": "2021-09-16T12:42:24.726084Z", "shell.execute_reply": "2021-09-16T12:42:24.725601Z"}, "papermill": {"duration": 0.046099, "end_time": "2021-09-16T12:42:24.726183", "exception": false, "start_time": "2021-09-16T12:42:24.680084", "status": "completed"}, "tags": []}, "outputs": [], "source": ["def train_model(**kwargs):\n", " # Create a PyTorch Lightning trainer with the generation callback\n", " trainer = pl.Trainer(\n", " default_root_dir=os.path.join(CHECKPOINT_PATH, \"PixelCNN\"),\n", " gpus=1 if str(device).startswith(\"cuda\") else 0,\n", " max_epochs=150,\n", " callbacks=[\n", " ModelCheckpoint(save_weights_only=True, mode=\"min\", monitor=\"val_bpd\"),\n", " LearningRateMonitor(\"epoch\"),\n", " ],\n", " )\n", " result = None\n", " # Check whether pretrained model exists. 
If yes, load it and skip training\n", " pretrained_filename = os.path.join(CHECKPOINT_PATH, \"PixelCNN.ckpt\")\n", " if os.path.isfile(pretrained_filename):\n", " print(\"Found pretrained model, loading...\")\n", " model = PixelCNN.load_from_checkpoint(pretrained_filename)\n", " ckpt = torch.load(pretrained_filename, map_location=device)\n", " result = ckpt.get(\"result\", None)\n", " else:\n", " model = PixelCNN(**kwargs)\n", " trainer.fit(model, train_loader, val_loader)\n", " model = model.to(device)\n", "\n", " if result is None:\n", " # Test best model on validation and test set\n", " val_result = trainer.test(model, test_dataloaders=val_loader, verbose=False)\n", " test_result = trainer.test(model, test_dataloaders=test_loader, verbose=False)\n", " result = {\"test\": test_result, \"val\": val_result}\n", " return model, result"]}, {"cell_type": "markdown", "id": "245b1ba8", "metadata": {"papermill": {"duration": 0.037966, "end_time": "2021-09-16T12:42:24.802271", "exception": false, "start_time": "2021-09-16T12:42:24.764305", "status": "completed"}, "tags": []}, "source": ["Training the model is time consuming and we recommend using the provided pre-trained model for going through this notebook.\n", "However, feel free to play around with the hyperparameter like number of layers etc.\n", "if you want to get a feeling for those.\n", "\n", "When calling the training function with a pre-trained model, we automatically load it and print its test performance:"]}, {"cell_type": "code", "execution_count": 19, "id": "4328bb62", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:42:24.884095Z", "iopub.status.busy": "2021-09-16T12:42:24.883627Z", "iopub.status.idle": "2021-09-16T12:42:27.511570Z", "shell.execute_reply": "2021-09-16T12:42:27.511143Z"}, "papermill": {"duration": 2.671446, "end_time": "2021-09-16T12:42:27.511686", "exception": false, "start_time": "2021-09-16T12:42:24.840240", "status": "completed"}, "tags": []}, "outputs": [{"name": 
"stderr", "output_type": "stream", "text": ["GPU available: True, used: True\n"]}, {"name": "stderr", "output_type": "stream", "text": ["TPU available: False, using: 0 TPU cores\n"]}, {"name": "stderr", "output_type": "stream", "text": ["IPU available: False, using: 0 IPUs\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Found pretrained model, loading...\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Test bits per dimension: 0.808bpd\n"]}], "source": ["model, result = train_model(c_in=1, c_hidden=64)\n", "test_res = result[\"test\"][0]\n", "print(\n", " \"Test bits per dimension: %4.3fbpd\" % (test_res[\"test_loss\"] if \"test_loss\" in test_res else test_res[\"test_bpd\"])\n", ")"]}, {"cell_type": "markdown", "id": "c4e1ed4e", "metadata": {"papermill": {"duration": 0.038901, "end_time": "2021-09-16T12:42:27.590698", "exception": false, "start_time": "2021-09-16T12:42:27.551797", "status": "completed"}, "tags": []}, "source": ["With a test performance of 0.809bpd, the PixelCNN significantly outperforms the normalizing flows we have seen in Tutorial 11.\n", "Considering image modeling as an autoregressive problem simplifies the learning process as predicting\n", "one pixel given the ground truth of all others is much easier than predicting all pixels at once.\n", "In addition, PixelCNN can explicitly predict the pixel values by a discrete softmax while\n", "Normalizing Flows have to learn transformations in continuous latent space.\n", "These two aspects allow the PixelCNN to achieve a notably better performance.\n", "\n", "To fully compare the models, let's also measure the number of parameters of the PixelCNN:"]}, {"cell_type": "code", "execution_count": 20, "id": "f8c9acf4", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:42:27.674832Z", "iopub.status.busy": "2021-09-16T12:42:27.674359Z", "iopub.status.idle": "2021-09-16T12:42:27.676436Z", "shell.execute_reply": "2021-09-16T12:42:27.676819Z"}, "papermill": {"duration": 
0.046548, "end_time": "2021-09-16T12:42:27.676936", "exception": false, "start_time": "2021-09-16T12:42:27.630388", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Number of parameters: 852,160\n"]}], "source": ["num_params = sum(np.prod(param.shape) for param in model.parameters())\n", "print(f\"Number of parameters: {num_params:,}\")"]}, {"cell_type": "markdown", "id": "d3ee86a3", "metadata": {"papermill": {"duration": 0.039335, "end_time": "2021-09-16T12:42:27.755406", "exception": false, "start_time": "2021-09-16T12:42:27.716071", "status": "completed"}, "tags": []}, "source": ["Compared to the multi-scale normalizing flows, the PixelCNN has considerably fewer parameters.\n", "Of course, the number of parameters depends on our hyperparameter choices.\n", "Nevertheless, in general, it can be said that autoregressive models\n", "require considerably fewer parameters than normalizing flows to reach\n", "good performance, based on the reasons stated above. 
Still,\n", "autoregressive models are much slower in sampling than normalizing\n", "flows, which limits their possible applications."]}, {"cell_type": "markdown", "id": "77208025", "metadata": {"papermill": {"duration": 0.046301, "end_time": "2021-09-16T12:42:27.842873", "exception": false, "start_time": "2021-09-16T12:42:27.796572", "status": "completed"}, "tags": []}, "source": ["## Sampling\n", "\n", "One way of qualitatively analysing generative models is by looking at the actual samples.\n", "Let's therefore use our sampling function to generate a few digits:"]}, {"cell_type": "code", "execution_count": 21, "id": "27bb57d8", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:42:27.932413Z", "iopub.status.busy": "2021-09-16T12:42:27.931873Z", "iopub.status.idle": "2021-09-16T12:42:32.123905Z", "shell.execute_reply": "2021-09-16T12:42:32.123484Z"}, "papermill": {"duration": 4.238655, "end_time": "2021-09-16T12:42:32.124020", "exception": false, "start_time": "2021-09-16T12:42:27.885365", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["Global seed set to 1\n"]}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "8961cfdd02c24f6dbc1c42cf6db817fd", "version_major": 2, "version_minor": 0}, "text/plain": [" 0%| | 0/28 [00:00\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:42:32.079950\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}], "source": ["pl.seed_everything(1)\n", "samples = model.sample(img_shape=(16, 1, 28, 28))\n", "show_imgs(samples.cpu())"]}, {"cell_type": "markdown", "id": "8fb41b9f", "metadata": {"papermill": {"duration": 0.041107, "end_time": "2021-09-16T12:42:32.207277", "exception": false, "start_time": "2021-09-16T12:42:32.166170", "status": "completed"}, "tags": []}, "source": ["Most of the samples can be identified as digits, and overall we achieve a better quality than we had in normalizing flows.\n", "This goes along with the lower likelihood we achieved with autoregressive models.\n", "Nevertheless, we also see that there is still place for improvement\n", "as a considerable amount of samples cannot be identified (for example the first row).\n", "Deeper autoregressive models are expected to achieve better quality,\n", "as they can take more context into account for generating the pixels.\n", "\n", "Note that on Google Colab, you might see different results, specifically with a white line at the top.\n", "After some debugging, it seemed that the difference occurs inside the dilated convolution,\n", "as it gives different results for different batch sizes.\n", "However, it is hard to debug this further as it might be a bug of the installed PyTorch version on Google Colab.\n", "\n", "The trained model itself is not restricted to any specific image size.\n", "However, what happens if we actually sample a larger image than we had\n", "seen in our training dataset? 
Let's try below to sample images of size\n", "$64\\times64$ instead of $28\\times28$:"]}, {"cell_type": "code", "execution_count": 22, "id": "f55e0ed4", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:42:32.292415Z", "iopub.status.busy": "2021-09-16T12:42:32.291942Z", "iopub.status.idle": "2021-09-16T12:43:10.492028Z", "shell.execute_reply": "2021-09-16T12:43:10.492425Z"}, "papermill": {"duration": 38.244567, "end_time": "2021-09-16T12:43:10.492570", "exception": false, "start_time": "2021-09-16T12:42:32.248003", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["Global seed set to 1\n"]}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "a04db2d75a3f476487be88f18d66ddb1", "version_major": 2, "version_minor": 0}, "text/plain": [" 0%| | 0/64 [00:00\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:43:10.455579\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}], "source": ["pl.seed_everything(1)\n", "samples = model.sample(img_shape=(8, 1, 64, 64))\n", "show_imgs(samples.cpu())"]}, {"cell_type": "markdown", "id": "3876e6b8", "metadata": {"papermill": {"duration": 0.043073, "end_time": "2021-09-16T12:43:10.581847", "exception": false, "start_time": "2021-09-16T12:43:10.538774", "status": "completed"}, "tags": []}, "source": ["The larger images show that changing the size of the image during testing confuses the model\n", "and generates abstract figures (you can sometimes spot a digit in the upper left corner).\n", "In addition, sampling for images of 64x64 pixels take more than a minute on a GPU.\n", "Clearly, autoregressive models cannot be scaled to large images without changing the sampling procedure such as with [forecasting](https://arxiv.org/abs/2002.09928).\n", "Our implementation is also not the most efficient as many computations can be stored and reused throughout the sampling process.\n", "Nevertheless, the sampling procedure stays sequential which is\n", "inherently slower than parallel generation like done in normalizing\n", "flows."]}, {"cell_type": "markdown", "id": "5ef1ba66", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.042826, "end_time": "2021-09-16T12:43:10.667581", "exception": false, "start_time": "2021-09-16T12:43:10.624755", "status": "completed"}, "tags": []}, "source": ["### Autocompletion\n", "\n", "One common application done with autoregressive models is\n", "auto-completing an image. As autoregressive models predict pixels one by\n", "one, we can set the first $N$ pixels to predefined values and check how\n", "the model completes the image. For implementing this, we just need to\n", "skip the iterations in the sampling loop that already have a value\n", "unequals -1. See above in our PyTorch Lightning module for the specific\n", "implementation. 
In the cell below, we randomly take three images from\n", "the training set, mask about the lower half of the image, and let the\n", "model autocomplete it. To see the diversity of samples, we do this 12\n", "times for each image:"]}, {"cell_type": "code", "execution_count": 23, "id": "44b3d642", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:43:10.758938Z", "iopub.status.busy": "2021-09-16T12:43:10.758463Z", "iopub.status.idle": "2021-09-16T12:43:18.484127Z", "shell.execute_reply": "2021-09-16T12:43:18.483633Z"}, "papermill": {"duration": 7.773878, "end_time": "2021-09-16T12:43:18.484244", "exception": false, "start_time": "2021-09-16T12:43:10.710366", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Original image and input image to sampling:\n"]}, {"data": {"application/pdf": "JVBERi0xLjQKJazcIKu6CjEgMCBvYmoKPDwgL1BhZ2VzIDIgMCBSIC9UeXBlIC9DYXRhbG9nID4+CmVuZG9iago4IDAgb2JqCjw8IC9FeHRHU3RhdGUgNCAwIFIgL0ZvbnQgMyAwIFIgL1BhdHRlcm4gNSAwIFIKL1Byb2NTZXQgWyAvUERGIC9UZXh0IC9JbWFnZUIgL0ltYWdlQyAvSW1hZ2VJIF0gL1NoYWRpbmcgNiAwIFIKL1hPYmplY3QgNyAwIFIgPj4KZW5kb2JqCjExIDAgb2JqCjw8IC9Bbm5vdHMgMTAgMCBSIC9Db250ZW50cyA5IDAgUgovR3JvdXAgPDwgL0NTIC9EZXZpY2VSR0IgL1MgL1RyYW5zcGFyZW5jeSAvVHlwZSAvR3JvdXAgPj4KL01lZGlhQm94IFsgMCAwIDE3Mi4zODM3NSA5NS45NCBdIC9QYXJlbnQgMiAwIFIgL1Jlc291cmNlcyA4IDAgUgovVHlwZSAvUGFnZSA+PgplbmRvYmoKOSAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDEyIDAgUiA+PgpzdHJlYW0KeJxNjUEKwjAURPf/FHOCJD/tJ8myUggu68YDhKAWW6kFvb6/XRQXAzPDDI8xku0YtxUOo+oLRobt6+dR6iWfUFZy2k/EwZsmNkE0Pf9SEpNabdzh7kQzLQjG72IJJu3TyEZavCuumGE7v2FZsaxYh6wflogNF/1xLxPsmdG/MNBAP35RJfYKZW5kc3RyZWFtCmVuZG9iagoxMiAwIG9iagoxMzQKZW5kb2JqCjEwIDAgb2JqClsgXQplbmRvYmoKMyAwIG9iago8PCA+PgplbmRvYmoKNCAwIG9iago8PCAvQTEgPDwgL0NBIDAgL1R5cGUgL0V4dEdTdGF0ZSAvY2EgMSA+PgovQTIgPDwgL0NBIDEgL1R5cGUgL0V4dEdTdGF0ZSAvY2EgMSA+PiA+PgplbmRvYmoKNSAwIG9iago8PCA+PgplbmRvYmoKNiAwIG9iago8PCA+PgplbmRvYmoKNyAwIG9iago8PCAvSTEgMTMgMCBSID4+CmVuZG9iagoxMyAwIG9iago8PCAvQ
ml0c1BlckNvbXBvbmVudCA4Ci9Db2xvclNwYWNlIFsvSW5kZXhlZCAvRGV2aWNlUkdCIDcwICj////9/f37+/v6+vr19fXy8vLw8PDv7+/t7e3s7Ozr6+vo6Ojk5OTj4+Pf39/Y2NjR0dHQ0NDPz8/Hx8fDw8PCwsLBwcG/v7+6urq5ubm0tLSurq6srKylpaWgoKCVlZWTk5OPj4+Li4uKioqIiIiAgIB9fX1ycnJjY2NgYGBfX19WVlZRUVFQUFBPT09MTExHR0dEREQ7Ozs1NTUyMjIwMDAsLCwqKiojIyMiIiIdHR0bGxsaGhoZGRkUFBQTExMSEhIODg4MDAxcblxuXG4GBgYEBAQAAAApXQovRGVjb2RlUGFybXMgPDwgL0NvbG9ycyAxIC9Db2x1bW5zIDE1OCAvUHJlZGljdG9yIDEwID4+Ci9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9IZWlnaHQgODIgL0xlbmd0aCAxNCAwIFIgL1N1YnR5cGUgL0ltYWdlCi9UeXBlIC9YT2JqZWN0IC9XaWR0aCAxNTggPj4Kc3RyZWFtCnic7dfXcoJAGIZh1gY2Yu8K9oJdsDdEc/+XFCBMYkECs2qE+b9DGN55DnYUiPpbj/hvgPGAhzNb8D4fs/rDY8DDiQEPJwY8nBjwcGLAw4kBDycGPJzYfV673SYIgmVv7xyPx9PJGk9r3cbU1v0Y8J7BE8VoNIoQ4riLyzxfq9UoiorFer2eWZ6oxNTWRYxXYmorptMC3vN4mw1S1+mo/d1uN5mUy+VgEGmrVqtmeRst1lFiohKbKLHgecxZPI77fjAQYBiGptHVEglJkszyOC0WUGL0TSyhxID3Qp4k5fN5r9f7W/F4MpkMy94/LK/8z31znrrxeNxsfihrNBqjkXylVJJtPp9vvQaezXlXGw6HFCXz+v2+QRF4+ovH4wj5/f7lcgk8R/IqlYpxEXg25HW7JEkmk4fDAXgWeYIgkKT8i1wo/FkEnt14rVZLfQ0dDIBnlbffy1/yCKVSKb1vFuDZmvdz8AxPHvD0l8vJuFBoPp8Dz1m87XYbici8bNZcEXjn43keoXA4LAjAcxyvWCwilE6nzRaBZxvebOZ2uxFyuVwMs1qtgGeJN52qLys0TS8W5orAsw3PehF4OEXg4RSfwHvbAQ9nwMPZF28utk0KZW5kc3RyZWFtCmVuZG9iagoxNCAwIG9iago0NjMKZW5kb2JqCjIgMCBvYmoKPDwgL0NvdW50IDEgL0tpZHMgWyAxMSAwIFIgXSAvVHlwZSAvUGFnZXMgPj4KZW5kb2JqCjE1IDAgb2JqCjw8IC9DcmVhdGlvbkRhdGUgKEQ6MjAyMTA5MTYxNDQzMTArMDInMDAnKQovQ3JlYXRvciAoTWF0cGxvdGxpYiB2My40LjMsIGh0dHBzOi8vbWF0cGxvdGxpYi5vcmcpCi9Qcm9kdWNlciAoTWF0cGxvdGxpYiBwZGYgYmFja2VuZCB2My40LjMpID4+CmVuZG9iagp4cmVmCjAgMTYKMDAwMDAwMDAwMCA2NTUzNSBmIAowMDAwMDAwMDE2IDAwMDAwIG4gCjAwMDAwMDE3ODMgMDAwMDAgbiAKMDAwMDAwMDY0NSAwMDAwMCBuIAowMDAwMDAwNjY2IDAwMDAwIG4gCjAwMDAwMDA3NjUgMDAwMDAgbiAKMDAwMDAwMDc4NiAwMDAwMCBuIAowMDAwMDAwODA3IDAwMDAwIG4gCjAwMDAwMDAwNjUgMDAwMDAgbiAKMDAwMDAwMDM5NiAwMDAwMCBuIAowMDAwMDAwNjI1IDAwMDAwIG4gCjAwMDAwMDAyMDggMDAwMDAgbiAKMDAwMDAwMDYwNSAwMDAwMCBuIAowMDAwMDAwODM5IDAwMDAwIG4gCjAwMDAwMDE3NjMgMDAwMDAgbiAKMDAwMDAwMTg0MyAwMDAwMCBuIAp0cmFpbGVyCjw8IC9JbmZvIDE1IDAgU
iAvUm9vdCAxIDAgUiAvU2l6ZSAxNiA+PgpzdGFydHhyZWYKMjAwMAolJUVPRgo=\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:43:10.792399\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}, {"name": "stderr", "output_type": "stream", "text": ["Global seed set to 1\n"]}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "e76d7eb2829b4c6c9b26ff6703e0787d", "version_major": 2, "version_minor": 0}, "text/plain": [" 0%| | 0/28 [00:00\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:43:13.309899\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}, {"name": "stdout", "output_type": "stream", "text": ["Original image and input image to sampling:\n"]}, {"data": {"application/pdf": "JVBERi0xLjQKJazcIKu6CjEgMCBvYmoKPDwgL1BhZ2VzIDIgMCBSIC9UeXBlIC9DYXRhbG9nID4+CmVuZG9iago4IDAgb2JqCjw8IC9FeHRHU3RhdGUgNCAwIFIgL0ZvbnQgMyAwIFIgL1BhdHRlcm4gNSAwIFIKL1Byb2NTZXQgWyAvUERGIC9UZXh0IC9JbWFnZUIgL0ltYWdlQyAvSW1hZ2VJIF0gL1NoYWRpbmcgNiAwIFIKL1hPYmplY3QgNyAwIFIgPj4KZW5kb2JqCjExIDAgb2JqCjw8IC9Bbm5vdHMgMTAgMCBSIC9Db250ZW50cyA5IDAgUgovR3JvdXAgPDwgL0NTIC9EZXZpY2VSR0IgL1MgL1RyYW5zcGFyZW5jeSAvVHlwZSAvR3JvdXAgPj4KL01lZGlhQm94IFsgMCAwIDE3Mi4zODM3NSA5NS45NCBdIC9QYXJlbnQgMiAwIFIgL1Jlc291cmNlcyA4IDAgUgovVHlwZSAvUGFnZSA+PgplbmRvYmoKOSAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDEyIDAgUiA+PgpzdHJlYW0KeJxNjUEKwjAURPf/FHOCJD/tJ8myUggu68YDhKAWW6kFvb6/XRQXAzPDDI8xku0YtxUOo+oLRobt6+dR6iWfUFZy2k/EwZsmNkE0Pf9SEpNabdzh7kQzLQjG72IJJu3TyEZavCuumGE7v2FZsaxYh6wflogNF/1xLxPsmdG/MNBAP35RJfYKZW5kc3RyZWFtCmVuZG9iagoxMiAwIG9iagoxMzQKZW5kb2JqCjEwIDAgb2JqClsgXQplbmRvYmoKMyAwIG9iago8PCA+PgplbmRvYmoKNCAwIG9iago8PCAvQTEgPDwgL0NBIDAgL1R5cGUgL0V4dEdTdGF0ZSAvY2EgMSA+PgovQTIgPDwgL0NBIDEgL1R5cGUgL0V4dEdTdGF0ZSAvY2EgMSA+PiA+PgplbmRvYmoKNSAwIG9iago8PCA+PgplbmRvYmoKNiAwIG9iago8PCA+PgplbmRvYmoKNyAwIG9iago8PCAvSTEgMTMgMCBSID4+CmVuZG9iagoxMyAwIG9iago8PCAvQml0c1BlckNvbXBvbmVudCA4Ci9Db2xvclNwYWNlIFsvSW5kZXhlZCAvRGV2aWNlUkdCIDY4ICj////+/v78/Pz7+/v5+fn39/fy8vLx8fHq6urp6eno6Ojm5ubl5eXd3d3Z2dnX19fW1tbV1dXMzMzGxsbBwcG/v7+9vb28vLy7u7u6urq4uLi1tbW0tLSysrKtra2srKyhoaGYmJiVlZWRkZGAgIB1dXVzc3NxcXFqampnZ2diYmJaWlpXV1dTU1NRUVFPT09MTExLS0tCQkJAQEA7Ozs6OjowMDAgICAbGxsYGBgXFxcVFRUTExMODg5cclxyXHJcblxuXG4ICAgGBgYDAwMCAgIAAAApXQovRGVjb2RlUGFybXMgPDwgL0NvbG9ycyAxIC9Db2x1bW5zIDE1OCAvUHJlZGljdG9yIDEwID4+Ci9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9IZWlnaHQgODIgL0xlbmd0aCAxNCAwIFIgL1N1YnR5cGUgL0ltYWdlCi9UeXBlIC9YT2JqZWN0IC9XaWR0aCAxNTggPj4Kc3RyZWFtCnic7dhXj4JAFIZhxo5rb9h717X33v7/b9oZgu7qEpnNIeq457tDkjfPBRBEKr/0pGcD7g95kAnBO5mzsu
kx5EFiyIPEOHnz+TwSGQwGHEWeWITFkPcSvO02kUgQksvl4LwtixEW+xe85XKpKISt0WhAeax1jiHv+bxMJqP2XK79fg/lXVouo9ab8Px+v5psNg16PLxLizOGvAfwHA5Ht2sWj7U4Y8h7AI8+TA173Dyu1lvwajWr1UpIqVSC82osRlgMec/n0ZeVUEh9jtKXeTjvbxOe1263CfnmdTqdT7Z+v4884XnhcFjjpVKpbNZisagHdrs9m9W7l5Gnz/s9j8czmSDvHXhut/vj55xOSZK83punNfIE5EWjm83m6sxwKMsyIdPpFHlGvGr19sxqFQgEZHk2myFPcF48fnXt0QNFodfeaKRXRJ62fD6vPfd6vd5iQX85HsfjcTKZJCQYDOoXkScGb71ea19b6WKxYrFYKJwPK5UK8oy+Eux2Pp/v5lWPvszX64fDAXmC804netOm02eZzdZqtej/3TtF5EGKpsaQB4khDxJDHiSGPEgMeZAY8iAx5EFiQvBedsiDDHmQfQGIbT5JCmVuZHN0cmVhbQplbmRvYmoKMTQgMCBvYmoKNDU1CmVuZG9iagoyIDAgb2JqCjw8IC9Db3VudCAxIC9LaWRzIFsgMTEgMCBSIF0gL1R5cGUgL1BhZ2VzID4+CmVuZG9iagoxNSAwIG9iago8PCAvQ3JlYXRpb25EYXRlIChEOjIwMjEwOTE2MTQ0MzEzKzAyJzAwJykKL0NyZWF0b3IgKE1hdHBsb3RsaWIgdjMuNC4zLCBodHRwczovL21hdHBsb3RsaWIub3JnKQovUHJvZHVjZXIgKE1hdHBsb3RsaWIgcGRmIGJhY2tlbmQgdjMuNC4zKSA+PgplbmRvYmoKeHJlZgowIDE2CjAwMDAwMDAwMDAgNjU1MzUgZiAKMDAwMDAwMDAxNiAwMDAwMCBuIAowMDAwMDAxNzcyIDAwMDAwIG4gCjAwMDAwMDA2NDUgMDAwMDAgbiAKMDAwMDAwMDY2NiAwMDAwMCBuIAowMDAwMDAwNzY1IDAwMDAwIG4gCjAwMDAwMDA3ODYgMDAwMDAgbiAKMDAwMDAwMDgwNyAwMDAwMCBuIAowMDAwMDAwMDY1IDAwMDAwIG4gCjAwMDAwMDAzOTYgMDAwMDAgbiAKMDAwMDAwMDYyNSAwMDAwMCBuIAowMDAwMDAwMjA4IDAwMDAwIG4gCjAwMDAwMDA2MDUgMDAwMDAgbiAKMDAwMDAwMDgzOSAwMDAwMCBuIAowMDAwMDAxNzUyIDAwMDAwIG4gCjAwMDAwMDE4MzIgMDAwMDAgbiAKdHJhaWxlcgo8PCAvSW5mbyAxNSAwIFIgL1Jvb3QgMSAwIFIgL1NpemUgMTYgPj4Kc3RhcnR4cmVmCjE5ODkKJSVFT0YK\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:43:13.375277\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}, {"name": "stderr", "output_type": "stream", "text": ["Global seed set to 1\n"]}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "5ec4fe6328c247b489d2701b79eb8048", "version_major": 2, "version_minor": 0}, "text/plain": [" 0%| | 0/28 [00:00\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:43:15.879705\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}, {"name": "stdout", "output_type": "stream", "text": ["Original image and input image to sampling:\n"]}, {"data": {"application/pdf": "JVBERi0xLjQKJazcIKu6CjEgMCBvYmoKPDwgL1BhZ2VzIDIgMCBSIC9UeXBlIC9DYXRhbG9nID4+CmVuZG9iago4IDAgb2JqCjw8IC9FeHRHU3RhdGUgNCAwIFIgL0ZvbnQgMyAwIFIgL1BhdHRlcm4gNSAwIFIKL1Byb2NTZXQgWyAvUERGIC9UZXh0IC9JbWFnZUIgL0ltYWdlQyAvSW1hZ2VJIF0gL1NoYWRpbmcgNiAwIFIKL1hPYmplY3QgNyAwIFIgPj4KZW5kb2JqCjExIDAgb2JqCjw8IC9Bbm5vdHMgMTAgMCBSIC9Db250ZW50cyA5IDAgUgovR3JvdXAgPDwgL0NTIC9EZXZpY2VSR0IgL1MgL1RyYW5zcGFyZW5jeSAvVHlwZSAvR3JvdXAgPj4KL01lZGlhQm94IFsgMCAwIDE3Mi4zODM3NSA5NS45NCBdIC9QYXJlbnQgMiAwIFIgL1Jlc291cmNlcyA4IDAgUgovVHlwZSAvUGFnZSA+PgplbmRvYmoKOSAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDEyIDAgUiA+PgpzdHJlYW0KeJxNjUEKwjAURPf/FHOCJD/tJ8myUggu68YDhKAWW6kFvb6/XRQXAzPDDI8xku0YtxUOo+oLRobt6+dR6iWfUFZy2k/EwZsmNkE0Pf9SEpNabdzh7kQzLQjG72IJJu3TyEZavCuumGE7v2FZsaxYh6wflogNF/1xLxPsmdG/MNBAP35RJfYKZW5kc3RyZWFtCmVuZG9iagoxMiAwIG9iagoxMzQKZW5kb2JqCjEwIDAgb2JqClsgXQplbmRvYmoKMyAwIG9iago8PCA+PgplbmRvYmoKNCAwIG9iago8PCAvQTEgPDwgL0NBIDAgL1R5cGUgL0V4dEdTdGF0ZSAvY2EgMSA+PgovQTIgPDwgL0NBIDEgL1R5cGUgL0V4dEdTdGF0ZSAvY2EgMSA+PiA+PgplbmRvYmoKNSAwIG9iago8PCA+PgplbmRvYmoKNiAwIG9iago8PCA+PgplbmRvYmoKNyAwIG9iago8PCAvSTEgMTMgMCBSID4+CmVuZG9iagoxMyAwIG9iago8PCAvQml0c1BlckNvbXBvbmVudCA4Ci9Db2xvclNwYWNlIFsvSW5kZXhlZCAvRGV2aWNlUkdCIDc4ICj////+/v79/f38/Pz5+fn39/f09PTz8/Pv7+/t7e3s7Ozr6+vp6eno6Ojm5ubh4eHe3t7b29va2trT09POzs7Jycm/v7++vr67u7u6urqurq6pqamoqKinp6ekpKScnJyYmJiWlpaTk5ORkZGPj4+NjY2JiYmFhYWAgIB3d3d2dnZxcXFqampkZGRgYGBeXl5dXV1ZWVlXV1dVVVVUVFRQUFBDQ0NAQEA/Pz8+Pj44ODgxMTErKysmJiYjIyMgICAfHx8dHR0bGxsWFhYSEhIQEBAPDw8ODg4LCwsHBwcGBgYFBQUEBAQCAgIAAAApXQovRGVjb2RlUGFybXMgPDwgL0NvbG9ycyAxIC9Db2x1bW5zIDE1OCAvUHJlZGljdG9yIDEwID4+Ci9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9IZWlnaHQgODIgL0xlbmd0aCAxNCAwIFIgL1N1YnR5cGUgL0ltYWdlCi9UeXBlIC9YT2JqZWN0IC9XaWR0aCAxNTggPj4Kc3RyZWFtCnic7ddpV4JAFIBhmQkMNXMpU3M3W9yX0tJSwxRL4v//nO6Mtl
lqNHmSuveLAsf3PB8GBh2nGz2O3wYsH+SJjC145s/M6Y/HkCcSQ55IDHkiMeSJxJAnEkOeSAx5IrHVvGq1GggQQiQpGo2Wy7quC/BYK8BaEmuVl7SQt2beaDRKJGRZpmwI4R/BYLDZbFrn8VbipfUcW9hC3pp5sDoo9Xg8pVI+n58VYRRFubqyyuMtylol1iJvW4tjtuVpmgZ3GaXtdts0u93uOZtIZFr1+YbDoQXerEVZy3xpRWYt3yct5K2TVywWYYkcHxuG8XrSMAqFgtvtJiSdTlvgfWPszLu5cblcXq9X0+YujMdjv98vSbFYDHk25R0dTTewDxdarRbflWq1GvIW8Q4PAQE379zpx8d4PA5X9vYmkwny7MiDd7PdXUB8/M3Z2XRTu7hYWETeZvMGgwFHvHt43N3lcrmtrSlvSfHf80x258LryvPGdXtbr9cdDjKbTCaDPDvzTk5ghTmdzgM2OztwsL0N2v19+Ia8VbyHh1QqBa98/D6V5XA4zP+NcmilUkGenXl8dF3n/0gvL/khPK1VFcj9fh95q3lz02g0KM1ms8uLyLMlLxQKEQJLEXnWeb2eqqqUIu8v8q6v+QaHPOQh7/3c3yeTSUXpdDrI+3O8rxaRJ1JEnkhxDbyNHeSJDPJE5gkEVtsWCmVuZHN0cmVhbQplbmRvYmoKMTQgMCBvYmoKNTMwCmVuZG9iagoyIDAgb2JqCjw8IC9Db3VudCAxIC9LaWRzIFsgMTEgMCBSIF0gL1R5cGUgL1BhZ2VzID4+CmVuZG9iagoxNSAwIG9iago8PCAvQ3JlYXRpb25EYXRlIChEOjIwMjEwOTE2MTQ0MzE1KzAyJzAwJykKL0NyZWF0b3IgKE1hdHBsb3RsaWIgdjMuNC4zLCBodHRwczovL21hdHBsb3RsaWIub3JnKQovUHJvZHVjZXIgKE1hdHBsb3RsaWIgcGRmIGJhY2tlbmQgdjMuNC4zKSA+PgplbmRvYmoKeHJlZgowIDE2CjAwMDAwMDAwMDAgNjU1MzUgZiAKMDAwMDAwMDAxNiAwMDAwMCBuIAowMDAwMDAxODcxIDAwMDAwIG4gCjAwMDAwMDA2NDUgMDAwMDAgbiAKMDAwMDAwMDY2NiAwMDAwMCBuIAowMDAwMDAwNzY1IDAwMDAwIG4gCjAwMDAwMDA3ODYgMDAwMDAgbiAKMDAwMDAwMDgwNyAwMDAwMCBuIAowMDAwMDAwMDY1IDAwMDAwIG4gCjAwMDAwMDAzOTYgMDAwMDAgbiAKMDAwMDAwMDYyNSAwMDAwMCBuIAowMDAwMDAwMjA4IDAwMDAwIG4gCjAwMDAwMDA2MDUgMDAwMDAgbiAKMDAwMDAwMDgzOSAwMDAwMCBuIAowMDAwMDAxODUxIDAwMDAwIG4gCjAwMDAwMDE5MzEgMDAwMDAgbiAKdHJhaWxlcgo8PCAvSW5mbyAxNSAwIFIgL1Jvb3QgMSAwIFIgL1NpemUgMTYgPj4Kc3RhcnR4cmVmCjIwODgKJSVFT0YK\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:43:15.945419\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}, {"name": "stderr", "output_type": "stream", "text": ["Global seed set to 1\n"]}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "ff6c8e20790c444e8f7c56fe0cf6f5bd", "version_major": 2, "version_minor": 0}, "text/plain": [" 0%| | 0/28 [00:00\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:43:18.448685\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}], "source": ["def autocomplete_image(img):\n", " # Remove lower half of the image\n", " img_init = img.clone()\n", " img_init[:, 10:, :] = -1\n", " print(\"Original image and input image to sampling:\")\n", " show_imgs([img, img_init])\n", " # Generate 12 example completions\n", " img_init = img_init.unsqueeze(dim=0).expand(12, -1, -1, -1).to(device)\n", " pl.seed_everything(1)\n", " img_generated = model.sample(img_init.shape, img_init)\n", " print(\"Autocompletion samples:\")\n", " show_imgs(img_generated)\n", "\n", "\n", "for i in range(1, 4):\n", " img = train_set[i][0]\n", " autocomplete_image(img)"]}, {"cell_type": "markdown", "id": "ba91d363", "metadata": {"papermill": {"duration": 0.051443, "end_time": "2021-09-16T12:43:18.586848", "exception": false, "start_time": "2021-09-16T12:43:18.535405", "status": "completed"}, "tags": []}, "source": ["For the first two digits (7 and 6), we see that the 12 samples all\n", "result in a shape which resemble the original digit. Nevertheless, there\n", "are some style difference in writing the 7, and some deformed sixes in\n", "the samples. When autocompleting the 9 below, we see that the model can\n", "fit multiple digits to it. 
We obtain diverse samples from 0, 3, 8 and 9.\n", "This shows that despite having no latent space, we can still obtain\n", "diverse samples from an autoregressive model."]}, {"cell_type": "markdown", "id": "ee095fbc", "metadata": {"papermill": {"duration": 0.04956, "end_time": "2021-09-16T12:43:18.685925", "exception": false, "start_time": "2021-09-16T12:43:18.636365", "status": "completed"}, "tags": []}, "source": ["### Visualization of the predictive distribution (softmax)\n", "\n", "Autoregressive models use a softmax over 256 values to predict the next pixel.\n", "This gives the model a lot of flexibility as the probabilities for each pixel value can be learned independently if necessary.\n", "However, the values are actually not independent because the values 32 and 33 are much closer than 32 and 255.\n", "In the following, we visualize the softmax distribution that the model predicts to gain insight into how it has learned the relationships of close-by pixel values.\n", "\n", "To do this, we first run the model on a batch of images and store the output softmax distributions:"]}, {"cell_type": "code", "execution_count": 24, "id": "fd594831", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:43:18.789379Z", "iopub.status.busy": "2021-09-16T12:43:18.788903Z", "iopub.status.idle": "2021-09-16T12:43:18.897568Z", "shell.execute_reply": "2021-09-16T12:43:18.897984Z"}, "papermill": {"duration": 0.162907, "end_time": "2021-09-16T12:43:18.898132", "exception": false, "start_time": "2021-09-16T12:43:18.735225", "status": "completed"}, "tags": []}, "outputs": [], "source": ["det_loader = data.DataLoader(train_set, batch_size=128, shuffle=False, drop_last=False)\n", "imgs, _ = next(iter(det_loader))\n", "imgs = imgs.to(device)\n", "with torch.no_grad():\n", " out = model(imgs)\n", " out = F.softmax(out, dim=1)\n", " mean_out = out.mean(dim=[0, 2, 3, 4]).cpu().numpy()\n", " out = out.cpu().numpy()"]}, {"cell_type": "markdown", "id": "460b20fc", "metadata": 
{"papermill": {"duration": 0.049128, "end_time": "2021-09-16T12:43:18.998216", "exception": false, "start_time": "2021-09-16T12:43:18.949088", "status": "completed"}, "tags": []}, "source": ["Before diving into the model, let's visualize the distribution of the pixel values in the whole dataset:"]}, {"cell_type": "code", "execution_count": 25, "id": "cf4f889d", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:43:19.102964Z", "iopub.status.busy": "2021-09-16T12:43:19.102489Z", "iopub.status.idle": "2021-09-16T12:43:20.698247Z", "shell.execute_reply": "2021-09-16T12:43:20.698640Z"}, "papermill": {"duration": 1.650907, "end_time": "2021-09-16T12:43:20.698784", "exception": false, "start_time": "2021-09-16T12:43:19.047877", "status": "completed"}, "tags": []}, "outputs": [{"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:43:19.922594\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}], "source": ["sns.set()\n", "plot_args = {\"color\": to_rgb(\"C0\") + (0.5,), \"edgecolor\": \"C0\", \"linewidth\": 0.5, \"width\": 1.0}\n", "plt.hist(imgs.view(-1).cpu().numpy(), bins=256, density=True, **plot_args)\n", "plt.yscale(\"log\")\n", "plt.xticks([0, 64, 128, 192, 256])\n", "plt.show()\n", "plt.close()"]}, {"cell_type": "markdown", "id": "b8f425d1", "metadata": {"papermill": {"duration": 0.054971, "end_time": "2021-09-16T12:43:20.809613", "exception": false, "start_time": "2021-09-16T12:43:20.754642", "status": "completed"}, "tags": []}, "source": ["As we would expect from the seen images, the pixel value 0 (black) is the dominant value, followed by a batch of values between 250 and 255.\n", "Note that we use a log scale on the y-axis due to the big imbalance in the dataset.\n", "Interestingly, the pixel values 64, 128 and 191 also stand out which is likely due to the quantization used during the creation of the dataset.\n", "For RGB images, we would also see two peaks around 0 and 255,\n", "but the values in between would be much more frequent than in MNIST\n", "(see Figure 1 in the [PixelCNN++](https://arxiv.org/pdf/1701.05517.pdf) for a visualization on CIFAR10).\n", "\n", "Next, we can visualize the distribution our model predicts (in average):"]}, {"cell_type": "code", "execution_count": 26, "id": "45d72339", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:43:20.943659Z", "iopub.status.busy": "2021-09-16T12:43:20.935876Z", "iopub.status.idle": "2021-09-16T12:43:22.354374Z", "shell.execute_reply": "2021-09-16T12:43:22.354760Z"}, "papermill": {"duration": 1.486584, "end_time": "2021-09-16T12:43:22.354905", "exception": false, "start_time": "2021-09-16T12:43:20.868321", "status": "completed"}, "tags": []}, "outputs": [{"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:43:21.574138\n", " image/svg+xml\n", " \n", " \n", " 
Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}], "source": ["plt.bar(np.arange(mean_out.shape[0]), mean_out, **plot_args)\n", "plt.yscale(\"log\")\n", "plt.xticks([0, 64, 128, 192, 256])\n", "plt.show()\n", "plt.close()"]}, {"cell_type": "markdown", "id": "329f3ea9", "metadata": {"papermill": {"duration": 0.05645, "end_time": "2021-09-16T12:43:22.469433", "exception": false, "start_time": "2021-09-16T12:43:22.412983", "status": "completed"}, "tags": []}, "source": ["This distribution is very close to the actual dataset distribution.\n", "This is in general a good sign, but we can see a slightly smoother histogram than above.\n", "\n", "Finally, to take a closer look at learned value relations, we can\n", "visualize the distribution for individual pixel predictions to get a\n", "better intuition. For this, we pick 4 random images and pixels, and\n", "visualize their distribution below:"]}, {"cell_type": "code", "execution_count": 27, "id": "17909488", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:43:22.589483Z", "iopub.status.busy": "2021-09-16T12:43:22.588638Z", "iopub.status.idle": "2021-09-16T12:43:27.526284Z", "shell.execute_reply": "2021-09-16T12:43:27.526674Z"}, "papermill": {"duration": 5.001478, "end_time": "2021-09-16T12:43:27.526816", "exception": false, "start_time": "2021-09-16T12:43:22.525338", "status": "completed"}, "tags": []}, "outputs": [{"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:43:24.825070\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}], "source": ["fig, ax = plt.subplots(2, 2, figsize=(10, 6))\n", "for i in range(4):\n", " ax_sub = ax[i // 2][i % 2]\n", " ax_sub.bar(np.arange(out.shape[1], dtype=np.int32), out[i + 4, :, 0, 14, 14], **plot_args)\n", " ax_sub.set_yscale(\"log\")\n", " ax_sub.set_xticks([0, 64, 128, 192, 256])\n", "plt.show()\n", "plt.close()"]}, {"cell_type": "markdown", "id": "d39faab7", "metadata": {"papermill": {"duration": 0.074666, "end_time": "2021-09-16T12:43:27.671433", "exception": false, "start_time": "2021-09-16T12:43:27.596767", "status": "completed"}, "tags": []}, "source": ["Overall we see a very diverse set of distributions, with a usual peak\n", "for 0 and close to 1. However, the distributions in the first row show a\n", "potentially undesirable behavior. For instance, the value 242 has a\n", "1000x lower likelihood than 243 although they are extremely close and\n", "can often not be distinguished. This shows that the model might not have\n", "generalized well over pixel values. The better solution to this problem\n", "is to use discrete logistic mixtures instead of a softmax distribution.\n", "A discrete logistic distribution can be imagined as discretized, binned\n", "Gaussians. Using a mixture of discrete logistics instead of a softmax\n", "introduces an inductive bias to the model to assign close-by values\n", "similar likelihoods. 
We can visualize a discrete logistic below:"]}, {"cell_type": "code", "execution_count": 28, "id": "41272be3", "metadata": {"execution": {"iopub.execute_input": "2021-09-16T12:43:27.818104Z", "iopub.status.busy": "2021-09-16T12:43:27.817603Z", "iopub.status.idle": "2021-09-16T12:43:28.944136Z", "shell.execute_reply": "2021-09-16T12:43:28.944525Z"}, "papermill": {"duration": 1.200149, "end_time": "2021-09-16T12:43:28.944659", "exception": false, "start_time": "2021-09-16T12:43:27.744510", "status": "completed"}, "tags": []}, "outputs": [{"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-09-16T14:43:28.378484\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}], "source": ["mu = torch.Tensor([128])\n", "sigma = torch.Tensor([2.0])\n", "\n", "\n", "def discrete_logistic(x, mu, sigma):\n", " return torch.sigmoid((x + 0.5 - mu) / sigma) - torch.sigmoid((x - 0.5 - mu) / sigma)\n", "\n", "\n", "x = torch.arange(256)\n", "p = discrete_logistic(x, mu, sigma)\n", "\n", "# Visualization\n", "plt.figure(figsize=(6, 3))\n", "plt.bar(x.numpy(), p.numpy(), **plot_args)\n", "plt.xlim(96, 160)\n", "plt.title(\"Discrete logistic distribution\")\n", "plt.xlabel(\"Pixel value\")\n", "plt.ylabel(\"Probability\")\n", "plt.show()\n", "plt.close()"]}, {"cell_type": "markdown", "id": "0ee82ec6", "metadata": {"papermill": {"duration": 0.072594, "end_time": "2021-09-16T12:43:29.091439", "exception": false, "start_time": "2021-09-16T12:43:29.018845", "status": "completed"}, "tags": []}, "source": ["Instead of the softmax, the model would output mean and standard\n", "deviations for the $K$ logistics we use in the mixture. This is one of\n", "the improvements in autoregressive models that PixelCNN++ [3] has\n", "introduced compared to the original PixelCNN."]}, {"cell_type": "markdown", "id": "d30f7d84", "metadata": {"papermill": {"duration": 0.071033, "end_time": "2021-09-16T12:43:29.238966", "exception": false, "start_time": "2021-09-16T12:43:29.167933", "status": "completed"}, "tags": []}, "source": ["## Conclusion\n", "\n", "In this tutorial, we have looked at autoregressive image modeling, and\n", "implemented the PixelCNN architecture. With the usage of masked\n", "convolutions, we are able to apply a convolutional network in which a\n", "pixel is only influenced by all its predecessors. Separating the masked\n", "convolution into a horizontal and vertical stack allowed us to remove\n", "the known blind spot on the right upper row of a pixel. In experiments,\n", "autoregressive models outperformed normalizing flows in terms of bits\n", "per dimension, but are much slower to sample from. 
Improvements, that we\n", "have not implemented ourselves here, are discrete logistic mixtures, a\n", "downsampling architecture, and changing the pixel order in a diagonal\n", "fashion (see PixelSNAIL). Overall, autoregressive models are another,\n", "strong family of generative models, which however are mostly used in\n", "sequence tasks because of their linear scaling in sampling time rather than\n", "quadratic as on images."]}, {"cell_type": "markdown", "id": "38f1dd4f", "metadata": {"papermill": {"duration": 0.071797, "end_time": "2021-09-16T12:43:29.381584", "exception": false, "start_time": "2021-09-16T12:43:29.309787", "status": "completed"}, "tags": []}, "source": ["## References\n", "[1] van den Oord, A., et al.\n", "\"Pixel Recurrent Neural Networks.\"\n", "arXiv preprint arXiv:1601.06759 (2016).\n", "[Link](https://arxiv.org/abs/1601.06759)\n", "\n", "[2] van den Oord, A., et al.\n", "\"Conditional Image Generation with PixelCNN Decoders.\"\n", "In Advances in Neural Information Processing Systems 29, pp.\n", "4790\u20134798 (2016).\n", "[Link](http://papers.nips.cc/paper/6527-conditional-image-generation-with-pixelcnn-decoders.pdf)\n", "\n", "[3] Salimans, Tim, et al.\n", "\"PixelCNN++: Improving the PixelCNN with Discretized Logistic Mixture Likelihood and Other Modifications.\"\n", "arXiv preprint arXiv:1701.05517 (2017).\n", "[Link](https://arxiv.org/abs/1701.05517)"]}, {"cell_type": "markdown", "id": "c99bfefb", "metadata": {"papermill": {"duration": 0.074235, "end_time": "2021-09-16T12:43:29.526938", "exception": false, "start_time": "2021-09-16T12:43:29.452703", "status": "completed"}, "tags": []}, "source": ["## Congratulations - Time to Join the Community!\n", "\n", "Congratulations on completing this notebook tutorial! 
If you enjoyed this and would like to join the Lightning\n", "movement, you can do so in the following ways!\n", "\n", "### Star [Lightning](https://github.com/PyTorchLightning/pytorch-lightning) on GitHub\n", "The easiest way to help our community is just by starring the GitHub repos! This helps raise awareness of the cool\n", "tools we're building.\n", "\n", "### Join our [Slack](https://join.slack.com/t/pytorch-lightning/shared_invite/zt-pw5v393p-qRaDgEk24~EjiZNBpSQFgQ)!\n", "The best way to keep up to date on the latest advancements is to join our community! Make sure to introduce yourself\n", "and share your interests in the `#general` channel\n", "\n", "\n", "### Contributions !\n", "The best way to contribute to our community is to become a code contributor! At any time you can go to\n", "[Lightning](https://github.com/PyTorchLightning/pytorch-lightning) or [Bolt](https://github.com/PyTorchLightning/lightning-bolts)\n", "GitHub Issues page and filter for \"good first issue\".\n", "\n", "* [Lightning good first issue](https://github.com/PyTorchLightning/pytorch-lightning/issues?q=is%3Aopen+is%3Aissue+label%3A%22good+first+issue%22)\n", "* [Bolt good first issue](https://github.com/PyTorchLightning/lightning-bolts/issues?q=is%3Aopen+is%3Aissue+label%3A%22good+first+issue%22)\n", "* You can also contribute your own notebooks with useful examples !\n", "\n", "### Great thanks from the entire Pytorch Lightning Team for your interest !\n", "\n", "![Pytorch Lightning](){height=\"60px\" width=\"240px\"}"]}, {"cell_type": "raw", "metadata": {"raw_mimetype": "text/restructuredtext"}, "source": [".. customcarditem::\n", " :header: Tutorial 10: Autoregressive Image Modeling\n", " :card_description: In this tutorial, we implement an autoregressive likelihood model for the task of image modeling. 
Autoregressive models are naturally strong generative models that constitute...\n", " :tags: Image,GPU/TPU,UvA-DL-Course\n", " :image: _static/images/course_UvA-DL/10-autoregressive-image-modeling.jpg"]}], "metadata": {"jupytext": {"cell_metadata_filter": "id,colab_type,colab,-all", "formats": "ipynb,py:percent", "main_language": "python"}, "language_info": {"codemirror_mode": {"name": "ipython", "version": 3}, "file_extension": ".py", "mimetype": "text/x-python", "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.9.7"}, "papermill": {"default_parameters": {}, "duration": 73.044444, "end_time": "2021-09-16T12:43:30.306539", "environment_variables": {}, "exception": null, "input_path": "course_UvA-DL/10-autoregressive-image-modeling/Autoregressive_Image_Modeling.ipynb", "output_path": ".notebooks/course_UvA-DL/10-autoregressive-image-modeling.ipynb", "parameters": {}, "start_time": "2021-09-16T12:42:17.262095", "version": "2.3.3"}, "widgets": {"application/vnd.jupyter.widget-state+json": {"state": {"01769afc187444bfaf2aec03b4f08496": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, 
"object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "0640c19d24424bdd9409f8216335ba18": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "0bb5668432394fb5befb04fa0f5d4605": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, 
"grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "1006aae5c5444b3583ff98233ccb55d2": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "14f0fe5dfbfb47b5bdb2c070ef6a31ee": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", 
"_view_name": "StyleView", "description_width": ""}}, "1c756dfde210415c809395bc6f9bc1f8": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "1f6f6bfc18304ecab2062b2bf6933f8f": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, 
"justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "1fa667b5112343df9c5e37e6d9ca6b1f": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_0bb5668432394fb5befb04fa0f5d4605", "max": 28.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_5dbc98f3633e4245acdc824506aebf18", "value": 28.0}}, "1ffdceee837a4a4d9b92dc9983c6feb7": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": 
null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "21e083e4f6784332a4e4be80c9719372": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "288775f9620a426f835527c2a20267f5": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "2990971999c9429baf82e5715967d2e7": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": 
"HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_3542c1b421d74a9c9673ec4a04fceba9", "placeholder": "\u200b", "style": "IPY_MODEL_f3ca5bf492e2434080c0eb2ee7d333f0", "value": " 28/28 [00:02<00:00, 8.81it/s]"}}, "353657f372f84344b42e3792af9f53b5": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "3542c1b421d74a9c9673ec4a04fceba9": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, 
"flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "3e194c3fa88d4f7796e12faf5a612eaa": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "443488f69eb4484d8d014daa1df90910": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_01769afc187444bfaf2aec03b4f08496", "placeholder": "\u200b", "style": "IPY_MODEL_3e194c3fa88d4f7796e12faf5a612eaa", "value": " 28/28 [00:04<00:00, 5.26it/s]"}}, "4588a9d7ce4c4420b31d66495762c51d": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", 
"_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "47dbee09f7744686a6f2811eabac4a47": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "4a41e2c8c24f4501ad3f27256fe2dd00": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_afe9d9293fc54046b1a23a652de9156c", "max": 28.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_e5e0bffb840a4e6bb1718c6edc3478c0", "value": 28.0}}, "580c4ca4d0104b1fb3d44477534e266c": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_5df1358fcace453c90d53fc8bf0c6852", "placeholder": "\u200b", "style": "IPY_MODEL_14f0fe5dfbfb47b5bdb2c070ef6a31ee", "value": "100%"}}, "58c7fa2a2b544e4995676502aab755f1": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": 
"LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "5dbc98f3633e4245acdc824506aebf18": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "5df1358fcace453c90d53fc8bf0c6852": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": 
null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "5ec4fe6328c247b489d2701b79eb8048": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_f06e46b2cceb47d6bce7e6fb0deece49", "IPY_MODEL_4a41e2c8c24f4501ad3f27256fe2dd00", "IPY_MODEL_7b6d55f1c3e94df5a3c638a6963f180f"], "layout": "IPY_MODEL_e0e996dd55e54974abbba367a08b200d"}}, "609d34d968c74b98bfde90b5c8853bb2": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_1c756dfde210415c809395bc6f9bc1f8", "placeholder": "\u200b", "style": "IPY_MODEL_47dbee09f7744686a6f2811eabac4a47", "value": "100%"}}, "6678217ddd654f39bdbc8fba2cd3788f": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", 
"state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "6ddeeb369e0b46dd9e9a13c20c943fe4": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "71addce685174d8c9ed888c0e5e10e93": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "7b6d55f1c3e94df5a3c638a6963f180f": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": 
{"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_0640c19d24424bdd9409f8216335ba18", "placeholder": "\u200b", "style": "IPY_MODEL_4588a9d7ce4c4420b31d66495762c51d", "value": " 28/28 [00:02<00:00, 8.84it/s]"}}, "8961cfdd02c24f6dbc1c42cf6db817fd": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_d80e197eb464480d9f8d2b14d7d47169", "IPY_MODEL_1fa667b5112343df9c5e37e6d9ca6b1f", "IPY_MODEL_443488f69eb4484d8d014daa1df90910"], "layout": "IPY_MODEL_aa387ed113584652801c05449d0576f4"}}, "9162e93ab9e348f48b2f46cce2c72155": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "a04db2d75a3f476487be88f18d66ddb1": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": 
["IPY_MODEL_609d34d968c74b98bfde90b5c8853bb2", "IPY_MODEL_a70e1a44ecb440e8a79c4735752761c2", "IPY_MODEL_a8f4af858d4d457b8d2c2c59506c257c"], "layout": "IPY_MODEL_c5d74f5e252d446b838c3a099f2534f4"}}, "a70e1a44ecb440e8a79c4735752761c2": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_b91e999fdf704ceeb051bf05e4d0728f", "max": 64.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_f63d7ff436734e8dbe1e7ea69988a2e1", "value": 64.0}}, "a8f4af858d4d457b8d2c2c59506c257c": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_353657f372f84344b42e3792af9f53b5", "placeholder": "\u200b", "style": "IPY_MODEL_c142ac0ce8e6411ea84868b82e3112d3", "value": " 64/64 [00:38<00:00, 1.02s/it]"}}, "aa387ed113584652801c05449d0576f4": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, 
"flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "aa4ad04083b642e4b289e7350fbef888": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_1006aae5c5444b3583ff98233ccb55d2", "max": 28.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_d320a03105ae4a43a4d3ee1ec4c2cf75", "value": 28.0}}, "ad3bbb05cc344a59a95a7a6ca63461f5": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, 
"grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "afe9d9293fc54046b1a23a652de9156c": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "b91e999fdf704ceeb051bf05e4d0728f": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, 
"align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "ba1f0b2b45fd4c3ca18dfe2954a6747f": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_1f6f6bfc18304ecab2062b2bf6933f8f", "placeholder": "\u200b", "style": "IPY_MODEL_6678217ddd654f39bdbc8fba2cd3788f", "value": "100%"}}, "c142ac0ce8e6411ea84868b82e3112d3": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "c1e3f5021d764025a1e5dfc1a7acb318": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", 
"_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "c5d74f5e252d446b838c3a099f2534f4": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "d320a03105ae4a43a4d3ee1ec4c2cf75": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "d80e197eb464480d9f8d2b14d7d47169": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": 
"@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_6ddeeb369e0b46dd9e9a13c20c943fe4", "placeholder": "\u200b", "style": "IPY_MODEL_71addce685174d8c9ed888c0e5e10e93", "value": "100%"}}, "e0e996dd55e54974abbba367a08b200d": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "e1cd7fe63e8646ccb242422e29b75572": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, 
"border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "e5e0bffb840a4e6bb1718c6edc3478c0": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "e76d7eb2829b4c6c9b26ff6703e0787d": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_ba1f0b2b45fd4c3ca18dfe2954a6747f", "IPY_MODEL_ebd8b932d6ce4c76b14940b50d2d2569", "IPY_MODEL_2990971999c9429baf82e5715967d2e7"], "layout": "IPY_MODEL_1ffdceee837a4a4d9b92dc9983c6feb7"}}, "e973aa8423374ae9895e0f38003d662f": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", 
"_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_ad3bbb05cc344a59a95a7a6ca63461f5", "placeholder": "\u200b", "style": "IPY_MODEL_9162e93ab9e348f48b2f46cce2c72155", "value": " 28/28 [00:02<00:00, 8.85it/s]"}}, "ebd8b932d6ce4c76b14940b50d2d2569": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_e1cd7fe63e8646ccb242422e29b75572", "max": 28.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_288775f9620a426f835527c2a20267f5", "value": 28.0}}, "f06e46b2cceb47d6bce7e6fb0deece49": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_58c7fa2a2b544e4995676502aab755f1", "placeholder": "\u200b", "style": "IPY_MODEL_c1e3f5021d764025a1e5dfc1a7acb318", "value": "100%"}}, "f3ca5bf492e2434080c0eb2ee7d333f0": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": 
null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "f63d7ff436734e8dbe1e7ea69988a2e1": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "ff6c8e20790c444e8f7c56fe0cf6f5bd": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_580c4ca4d0104b1fb3d44477534e266c", "IPY_MODEL_aa4ad04083b642e4b289e7350fbef888", "IPY_MODEL_e973aa8423374ae9895e0f38003d662f"], "layout": "IPY_MODEL_21e083e4f6784332a4e4be80c9719372"}}}, "version_major": 2, "version_minor": 0}}}, "nbformat": 4, "nbformat_minor": 5} \ No newline at end of file diff --git a/source/notebooks/course_UvA-DL/11-vision-transformer.ipynb b/source/notebooks/course_UvA-DL/11-vision-transformer.ipynb deleted file mode 100644 index ee96f08..0000000 --- a/source/notebooks/course_UvA-DL/11-vision-transformer.ipynb +++ /dev/null @@ -1 +0,0 @@ -{"cells": [{"cell_type": "markdown", "id": "aa14bc73", "metadata": {"papermill": {"duration": 0.013536, "end_time": "2021-10-10T16:36:01.853136", "exception": false, "start_time": "2021-10-10T16:36:01.839600", "status": "completed"}, "tags": []}, "source": ["\n", "# Tutorial 11: Vision Transformers\n", "\n", "* **Author:** Phillip Lippe\n", "* **License:** CC BY-SA\n", "* **Generated:** 
2021-10-10T18:35:49.064490\n", "\n", "In this tutorial, we will take a closer look at a recent new trend: Transformers for Computer Vision.\n", "Since [Alexey Dosovitskiy et al.](https://openreview.net/pdf?id=YicbFdNTTy) successfully applied a Transformer on a variety of image recognition benchmarks, there have been an incredible amount of follow-up works showing that CNNs might not be optimal architecture for Computer Vision anymore.\n", "But how do Vision Transformers work exactly, and what benefits and drawbacks do they offer in contrast to CNNs?\n", "We will answer these questions by implementing a Vision Transformer ourselves, and train it on the popular, small dataset CIFAR10.\n", "We will compare these results to popular convolutional architectures such as Inception, ResNet and DenseNet.\n", "This notebook is part of a lecture series on Deep Learning at the University of Amsterdam.\n", "The full list of tutorials can be found at https://uvadlc-notebooks.rtfd.io.\n", "\n", "\n", "---\n", "Open in [![Open In Colab](){height=\"20px\" width=\"117px\"}](https://colab.research.google.com/github/PytorchLightning/lightning-tutorials/blob/publication/.notebooks/course_UvA-DL/11-vision-transformer.ipynb)\n", "\n", "Give us a \u2b50 [on Github](https://www.github.com/PytorchLightning/pytorch-lightning/)\n", "| Check out [the documentation](https://pytorch-lightning.readthedocs.io/en/latest/)\n", "| Join us [on Slack](https://join.slack.com/t/pytorch-lightning/shared_invite/zt-pw5v393p-qRaDgEk24~EjiZNBpSQFgQ)"]}, {"cell_type": "markdown", "id": "9f2931ec", "metadata": {"papermill": {"duration": 0.011652, "end_time": "2021-10-10T16:36:01.876879", "exception": false, "start_time": "2021-10-10T16:36:01.865227", "status": "completed"}, "tags": []}, "source": ["## Setup\n", "This notebook requires some packages besides pytorch-lightning."]}, {"cell_type": "code", "execution_count": 1, "id": "1d59c918", "metadata": {"colab": {}, "colab_type": "code", "execution": 
{"iopub.execute_input": "2021-10-10T16:36:01.905223Z", "iopub.status.busy": "2021-10-10T16:36:01.904752Z", "iopub.status.idle": "2021-10-10T16:36:01.907322Z", "shell.execute_reply": "2021-10-10T16:36:01.906861Z"}, "id": "LfrJLKPFyhsK", "lines_to_next_cell": 0, "papermill": {"duration": 0.018985, "end_time": "2021-10-10T16:36:01.907434", "exception": false, "start_time": "2021-10-10T16:36:01.888449", "status": "completed"}, "tags": []}, "outputs": [], "source": ["# ! pip install --quiet \"torchmetrics>=0.3\" \"matplotlib\" \"torch>=1.6, <1.9\" \"pytorch-lightning>=1.3\" \"torchvision\" \"seaborn\""]}, {"cell_type": "markdown", "id": "cef420ac", "metadata": {"papermill": {"duration": 0.0116, "end_time": "2021-10-10T16:36:01.931606", "exception": false, "start_time": "2021-10-10T16:36:01.920006", "status": "completed"}, "tags": []}, "source": ["
\n", "Let's start with importing our standard set of libraries."]}, {"cell_type": "code", "execution_count": 2, "id": "d1953eb9", "metadata": {"execution": {"iopub.execute_input": "2021-10-10T16:36:01.963459Z", "iopub.status.busy": "2021-10-10T16:36:01.962980Z", "iopub.status.idle": "2021-10-10T16:36:03.909605Z", "shell.execute_reply": "2021-10-10T16:36:03.909182Z"}, "papermill": {"duration": 1.966591, "end_time": "2021-10-10T16:36:03.909720", "exception": false, "start_time": "2021-10-10T16:36:01.943129", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["/tmp/ipykernel_493/3416006740.py:22: DeprecationWarning: `set_matplotlib_formats` is deprecated since IPython 7.23, directly use `matplotlib_inline.backend_inline.set_matplotlib_formats()`\n", " set_matplotlib_formats(\"svg\", \"pdf\") # For export\n", "Global seed set to 42\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Device: cuda:0\n"]}, {"data": {"text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}], "source": ["import os\n", "import urllib.request\n", "from urllib.error import HTTPError\n", "\n", "import matplotlib\n", "import matplotlib.pyplot as plt\n", "import pytorch_lightning as pl\n", "import seaborn as sns\n", "import torch\n", "import torch.nn as nn\n", "import torch.nn.functional as F\n", "import torch.optim as optim\n", "import torch.utils.data as data\n", "import torchvision\n", "from IPython.display import set_matplotlib_formats\n", "from pytorch_lightning.callbacks import LearningRateMonitor, ModelCheckpoint\n", "from torchvision import transforms\n", "from torchvision.datasets import CIFAR10\n", "\n", "plt.set_cmap(\"cividis\")\n", "# %matplotlib inline\n", "set_matplotlib_formats(\"svg\", \"pdf\") # For export\n", "matplotlib.rcParams[\"lines.linewidth\"] = 2.0\n", "sns.reset_orig()\n", "\n", "# %load_ext tensorboard\n", "\n", "# Path to the folder where the datasets are/should be downloaded (e.g. CIFAR10)\n", "DATASET_PATH = os.environ.get(\"PATH_DATASETS\", \"data/\")\n", "# Path to the folder where the pretrained models are saved\n", "CHECKPOINT_PATH = os.environ.get(\"PATH_CHECKPOINT\", \"saved_models/VisionTransformers/\")\n", "\n", "# Setting the seed\n", "pl.seed_everything(42)\n", "\n", "# Ensure that all operations are deterministic on GPU (if used) for reproducibility\n", "torch.backends.cudnn.determinstic = True\n", "torch.backends.cudnn.benchmark = False\n", "\n", "device = torch.device(\"cuda:0\") if torch.cuda.is_available() else torch.device(\"cpu\")\n", "print(\"Device:\", device)"]}, {"cell_type": "markdown", "id": "7b4c9cda", "metadata": {"papermill": {"duration": 0.012503, "end_time": "2021-10-10T16:36:03.935539", "exception": false, "start_time": "2021-10-10T16:36:03.923036", "status": "completed"}, "tags": []}, "source": ["We provide a pre-trained Vision Transformer which we download in the next cell.\n", "However, Vision Transformers can be relatively quickly trained on 
CIFAR10 with an overall training time of less than an hour on an NVIDIA TitanRTX.\n", "Feel free to experiment with training your own Transformer once you have gone through the whole notebook."]}, {"cell_type": "code", "execution_count": 3, "id": "6284d05a", "metadata": {"execution": {"iopub.execute_input": "2021-10-10T16:36:03.966290Z", "iopub.status.busy": "2021-10-10T16:36:03.965811Z", "iopub.status.idle": "2021-10-10T16:36:04.460168Z", "shell.execute_reply": "2021-10-10T16:36:04.460557Z"}, "papermill": {"duration": 0.512509, "end_time": "2021-10-10T16:36:04.460702", "exception": false, "start_time": "2021-10-10T16:36:03.948193", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Downloading https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial15/ViT.ckpt...\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Downloading https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial15/tensorboards/ViT/events.out.tfevents.ViT...\n", "Downloading https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial5/tensorboards/ResNet/events.out.tfevents.resnet...\n"]}], "source": ["# Github URL where saved models are stored for this tutorial\n", "base_url = \"https://raw.githubusercontent.com/phlippe/saved_models/main/\"\n", "# Files to download\n", "pretrained_files = [\n", " \"tutorial15/ViT.ckpt\",\n", " \"tutorial15/tensorboards/ViT/events.out.tfevents.ViT\",\n", " \"tutorial5/tensorboards/ResNet/events.out.tfevents.resnet\",\n", "]\n", "# Create checkpoint path if it doesn't exist yet\n", "os.makedirs(CHECKPOINT_PATH, exist_ok=True)\n", "\n", "# For each file, check whether it already exists. 
If not, try downloading it.\n", "for file_name in pretrained_files:\n", " file_path = os.path.join(CHECKPOINT_PATH, file_name.split(\"/\", 1)[1])\n", " if \"/\" in file_name.split(\"/\", 1)[1]:\n", " os.makedirs(file_path.rsplit(\"/\", 1)[0], exist_ok=True)\n", " if not os.path.isfile(file_path):\n", " file_url = base_url + file_name\n", " print(\"Downloading %s...\" % file_url)\n", " try:\n", " urllib.request.urlretrieve(file_url, file_path)\n", " except HTTPError as e:\n", " print(\n", " \"Something went wrong. Please try to download the file from the GDrive folder, or contact the author with the full output including the following error:\\n\",\n", " e,\n", " )"]}, {"cell_type": "markdown", "id": "c96b3099", "metadata": {"papermill": {"duration": 0.012919, "end_time": "2021-10-10T16:36:04.487227", "exception": false, "start_time": "2021-10-10T16:36:04.474308", "status": "completed"}, "tags": []}, "source": ["We load the CIFAR10 dataset below.\n", "We use the same setup of the datasets and data augmentations as for the CNNs in Tutorial 5 to keep a fair comparison.\n", "The constants in the `transforms.Normalize` correspond to the values\n", "that scale and shift the data to a zero mean and standard deviation of\n", "one."]}, {"cell_type": "code", "execution_count": 4, "id": "bb8b01bd", "metadata": {"execution": {"iopub.execute_input": "2021-10-10T16:36:04.522789Z", "iopub.status.busy": "2021-10-10T16:36:04.522299Z", "iopub.status.idle": "2021-10-10T16:36:06.982772Z", "shell.execute_reply": "2021-10-10T16:36:06.983222Z"}, "papermill": {"duration": 2.483202, "end_time": "2021-10-10T16:36:06.983367", "exception": false, "start_time": "2021-10-10T16:36:04.500165", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Files already downloaded and verified\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Files already downloaded and verified\n"]}, {"name": "stderr", "output_type": "stream", "text": ["Global 
seed set to 42\n"]}, {"name": "stderr", "output_type": "stream", "text": ["Global seed set to 42\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Files already downloaded and verified\n"]}, {"data": {"application/pdf": "JVBERi0xLjQKJazcIKu6CjEgMCBvYmoKPDwgL1BhZ2VzIDIgMCBSIC9UeXBlIC9DYXRhbG9nID4+CmVuZG9iago4IDAgb2JqCjw8IC9FeHRHU3RhdGUgNCAwIFIgL0ZvbnQgMyAwIFIgL1BhdHRlcm4gNSAwIFIKL1Byb2NTZXQgWyAvUERGIC9UZXh0IC9JbWFnZUIgL0ltYWdlQyAvSW1hZ2VJIF0gL1NoYWRpbmcgNiAwIFIKL1hPYmplY3QgNyAwIFIgPj4KZW5kb2JqCjExIDAgb2JqCjw8IC9Bbm5vdHMgMTAgMCBSIC9Db250ZW50cyA5IDAgUgovR3JvdXAgPDwgL0NTIC9EZXZpY2VSR0IgL1MgL1RyYW5zcGFyZW5jeSAvVHlwZSAvR3JvdXAgPj4KL01lZGlhQm94IFsgMCAwIDQ2MC44IDE0NS45NzcxNzM5MTMgXSAvUGFyZW50IDIgMCBSIC9SZXNvdXJjZXMgOCAwIFIKL1R5cGUgL1BhZ2UgPj4KZW5kb2JqCjkgMCBvYmoKPDwgL0ZpbHRlciAvRmxhdGVEZWNvZGUgL0xlbmd0aCAxMiAwIFIgPj4Kc3RyZWFtCnicVY9Nb4MwDIbv/hXvEQ4NcQikHOm6InZrhbTD1AOiKV1V2lHQtp8/023VFsmJP/L6sRlHinJGO0DjKPYBRoFo6d9fG78pFmgG0pLvyKZazcU7/XhsE5U5x85KSv8PD0Rn6uGUuZm1qbJgljsx7OKMY1w9nnFGlJsJzgJngWsUorPWYYIyu3uPpkNUMpYXrGmN/leo0f4VTzH1xPLORC8dtNImAZtMpXd209GiQrSSukG1vy1Y7YheEJRd3Xr4EDJsZpyex9NB8Fl3byc/4LLHePB4KFchMlay9fePmIJ8wxq7eqwHP4bYUvVEjxXJtPQFTx5PIAplbmRzdHJlYW0KZW5kb2JqCjEyIDAgb2JqCjI0NgplbmRvYmoKMTAgMCBvYmoKWyBdCmVuZG9iagoxOCAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDkxID4+CnN0cmVhbQp4nDWMuw3AMAhEe6a4Efg4gPeJohT2/m2ILRfcPemJ82xgZJ2HI7TjFrKmcFNMUk6odwxqpTcdO+glzf00yXouGvQPcfUVtpsDklEkkYdEl8uVZ+VffD4MbxxiCmVuZHN0cmVhbQplbmRvYmoKMTkgMCBvYmoKPDwgL0ZpbHRlciAvRmxhdGVEZWNvZGUgL0xlbmd0aCAyMzUgPj4Kc3RyZWFtCnicNVFJbgAxCLvnFf5ApbAn75mq6qH9/7WGUS8DA9jYJO/BRiQ+xJDuKFd8yuo0y/A7WeTFz0rh5L2ICqQqwgppB89yVjMMnhuZApcz8VlmPpkWOxZQTcRxduQ0g0GIaVxHy+kw0zzoCbk+GHFjp1muYkjr3VK9vtfynyrKR9bdLLdO2dRK3aJn7Elcdl5PbWlfGHUUNwWRDh87vAf5IuYsLjqRbvabKYeVpCE4LYAfiaFUzw6vESZ+ZiR4yp5O76M0vPZB0/W9e0FHbiZkKrdQRiqerDTGjKH6jWgmqe//gZ71vb7+AENNVLkKZW5kc3RyZWFtCmVuZG9iagoyMCAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDc2ID4+CnN0cmVhbQp4nDM1N1UwULC0ABKmhuYK5kaWCimGXEA+iJXLBRPLAbPMTMyALENLZ
JaJsSGQZWJhhsQyNrGAyiJYBkAabE0OzPQcrgyuNAA1FxkFCmVuZHN0cmVhbQplbmRvYmoKMjEgMCBvYmoKPDwgL0ZpbHRlciAvRmxhdGVEZWNvZGUgL0xlbmd0aCA1MSA+PgpzdHJlYW0KeJwzsjRVMFCwtAAShpbmCuZGlgophlxAPoiVywUTywGzDIA0WGkOTEUOVwZXGgC/jA1WCmVuZHN0cmVhbQplbmRvYmoKMjIgMCBvYmoKPDwgL0ZpbHRlciAvRmxhdGVEZWNvZGUgL0xlbmd0aCAyMzIgPj4Kc3RyZWFtCnicPZBLcgQhDEP3nEJHAH/hPJ1KzaLn/tvI7plskKrA8hNxHBNn84gIpBz8rGFmUBO8h4VD1WA7oOvAZ0BO4BoudClwo9qEc3ydw5sKmriHx2y1SKyd5Uwh6jAmSWzoScg2zmhy45zcqlTeTGu9xuKbcne7ymvalsK9h8r6OONUOasqa5E2EZlFaxvBRh7ssM+jq2jLWSrcN4xNXROVw5vF7lndyeKK769c49Uswcz3w7e/HB9X3egqx9jKhNlSk+bSOfWvltH6cLSLhXrhR3smSHB1qyBVpdbO2lN6/VPcJPr9A/TBVx0KZW5kc3RyZWFtCmVuZG9iagoyMyAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDMwNyA+PgpzdHJlYW0KeJw9kktuAzEMQ/c+hS4QwPrZnvOkKLqY3n/bJyXpihzZFkVqlrpMWVMekDSThH/p8HCxnfI7bM9mZuBaopeJ5ZTn0BVi7qJ82cxGXVknxeqEZjq36FE5Fwc2Taqfqyyl3S54Dtcmnlv2ET+80KAe1DUuCTd0V6NlKTRjqvt/0nv8jDLgakxdbFKrex88XkRV6OgHR4kiY5cX5+NBCelKwmhaiJV3RQNB7vK0ynsJ7tveasiyB6mYzjspZrDrdFIubheHIR7I8qjw5aPYa0LP+LArJfRI2IYzcifuaMbm1MjikP7ejQRLj65oIfPgr27WLmC8UzpFYmROcqxpi1VO91AU07nDvQwQ9WxFQylzkdXqX8POC2uWbBZ4SvoFHqPdJksOVtnbqE7vrTzZ0PcfWtd0HwplbmRzdHJlYW0KZW5kb2JqCjI0IDAgb2JqCjw8IC9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9MZW5ndGggMjMxID4+CnN0cmVhbQp4nDVPOZIEIQzLeYU+MFUY20C/p6e2Ntj5f7qSmU6Q8CHJ0xMdmXiZIyOwZsfbWmQgZuBTTMW/9rQPE6r34B4ilIsLYYaRcNas426ejhf/dpXPWAfvNviKWV4Q2MJM1lcWZy7bBWNpnMQ5yW6MXROxjXWtp1NYRzChDIR0tsOUIHNUpPTJjjLm6DiRJ56L7/bbLHY5fg7rCzaNIRXn+Cp6gjaDoux57wIackH/Xd34HkW76CUgGwkW1lFi7pzlhF+9dnQetSgSc0KaQS4TIc3pKqYQmlCss6OgUlFwqT6n6Kyff+VfXC0KZW5kc3RyZWFtCmVuZG9iagoyNSAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDI0OSA+PgpzdHJlYW0KeJw9UDuORCEM6zmFL/Ak8iNwHkarLWbv364DmilQTH62MyTQEYFHDDGUr+MlraCugb+LQvFu4uuDwiCrQ1IgznoPiHTspjaREzodnDM/YTdjjsBFMQac6XSmPQcmOfvCCoRzG2XsVkgniaoijuozjimeKnufeBYs7cg2WyeSPeQg4VJSicmln5TKP23KlAo6ZtEELBK54GQTTTjLu0lSjBmUMuoepnYifaw8yKM66GRNzqwjmdnTT9uZ+Bxwt1/aZE6Vx3QezPictM6DORW69+OJNgdNjdro7PcTaSovUrsdWp1+dRKV3RjnGBKXZ38Z32T/+Qf+h1oiCmVuZHN0cmVhbQplbmRvYmoKMjYgMCBvYmoKPDwgL
0ZpbHRlciAvRmxhdGVEZWNvZGUgL0xlbmd0aCAxMzYgPj4Kc3RyZWFtCnicTY9BDgMxCAPveYWfQCBAeM9WVQ/b/19L2HbTCx7JgGxRBoElh3iHG+HR2w/fRTYVZ+OcX1IpYiGYT3CfMFMcjSl38mOPgHGUaiynaHheS85NwxctdxMtpa2XkxlvuO6X90eVbZENRc8tC0LXbJL5MoEHfBiYR3XjaaXH3fZsr/b8AM5sNEkKZW5kc3RyZWFtCmVuZG9iagoyNyAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDM0MSA+PgpzdHJlYW0KeJxFUktuRDEI279TcIFI4ZeQ87Squpjef1ubTNXN4AlgbHjLU6ZkyrC5JSMk15RPfSJDrKb8NHIkIqb4SQkFdpWPx2tLrI3skagUn9rx47H0RqbZFVr17tGlzaJRzcrIOcgQoZ4VurJ71A7Z8HpcSLrvlM0hHMv/UIEsZd1yCiVBW9B37BHfDx2ugiuCYbBrLoPtZTLU//qHFlzvffdixy6AFqznvsEOAKinE7QFyBna7jYpaABVuotJwqPyem52omyjVen5HAAzDjBywIglWx2+0d4Aln1d6EWNiv0rQFFZQPzI1XbB3jHJSHAW5gaOvXA8xZlwSzjGAkCKveIYevAl2OYvV66ImvAJdbpkL7zCntrm50KTCHetAA5eZMOtq6Oolu3pPIL2Z0VyRozUizg6IZJa0jmC4tKgHlrjXDex4m0jsblX3+4f4ZwvXPbrF0vshMQKZW5kc3RyZWFtCmVuZG9iagoyOCAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDE2NCA+PgpzdHJlYW0KeJxFkMdxBTEMQ++qAiUwgAr1rMfzD+v+r4b000F6GEIMYk/CsFxXcWF0w4+3LTMNf0cZ7sb6MmO81VggJ+gDDJGJq9Gk+nbFGar05NVirqOiXC86IhLMkuOrQCN8OrLHk7a2M/10Xh/sIe8T/yoq525hAS6q7kD5Uh/x1I/ZUeqaoY8qK2seatpXhF0RSts+LqcyTt29A1rhvZWrPdrvPx52OvIKZW5kc3RyZWFtCmVuZG9iagoyOSAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDQ3ID4+CnN0cmVhbQp4nDMyt1AwULA0ARKGFiYK5mYGCimGXJYQVi4XTCwHzALRlnAKIp7BlQYAuWcNJwplbmRzdHJlYW0KZW5kb2JqCjMwIDAgb2JqCjw8IC9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9MZW5ndGggMjU4ID4+CnN0cmVhbQp4nEWRS3IEIAhE956CI4D85DyTSmUxuf82Dc5kNnaXqP2ESiOmEiznFHkwfcnyzWS26Xc5VjsbBRRFKJjJVeixAqs7U8SZa4lq62Nl5LjTOwbFG85dOalkcaOMdVR1KnBMz5X1Ud35dlmUfUcOZQrYrHMcbODKbcMYJ0abre4O94kgTydTR8XtINnwByeNfZWrK3CdbPbRSzAOBP1CE5jki0DrDIHGzVP05BLs4+N254Fgb3kRSNkQyJEhGB2Cdp1c/+LW+b3/cYY7z7UZrhzv4neY1nbHX2KSFXMBi9wpqOdrLlrXGTrekzPH5Kb7hs65YJe7g0zv+T/Wz/r+Ax4pZvoKZW5kc3RyZWFtCmVuZG9iagozMSAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDIxOCA+PgpzdHJlYW0KeJw9ULmNBDEMy12FGljAeu2pZxaLS6b/9Ej59iLRFkVSKjWZkikvdZQlWVPeOnyWxA55huVuZDYlKkUvk7Al99AK8X2J5hT33dWWs0M0l2g5fgszKqobHdNLNppwKhO6oNzDM/oNbXQDVocesVsg0KRg17YgcscPGAzBmROLIgxKTQb/rnKPn16LGz7D8UMUkZIO5
jX/WP3ycw2vU48nkW5vvuJenKkOAxEckpq8I11YsS4SEWk1QU3PwFotgLu3Xv4btCO6DED2icRxmlKOob9rcKXPL+UnU9gKZW5kc3RyZWFtCmVuZG9iagozMiAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDgzID4+CnN0cmVhbQp4nEWMuw3AMAhEe6ZgBH4m9j5RlMLevw0QJW64J909XB0JmSluM8NDBp4MLIZdcYH0ljALXEdQjp3so2HVvuoEjfWmUvPvD5Se7KzihusBAkIaZgplbmRzdHJlYW0KZW5kb2JqCjMzIDAgb2JqCjw8IC9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9MZW5ndGggMjM5ID4+CnN0cmVhbQp4nE1QyW0EMQz7uwo1MMDoHLseB4s8sv1/Q8oJkpdoS+Kh8pRblspl9yM5b8m65UOHTpVp8m7Qza+x/qMMAnb/UFQQrSWxSsxc0m6xNEkv2cM4jZdrtY7nqXuEWaN48OPY0ymB6T0ywWazvTkwqz3ODpBOuMav6tM7lSQDibqQ80KlCuse1CWijyvbmFKdTi3lGJef6Ht8jgA9xd6N3NHHyxeMRrUtqNFqlTgPMBNT0ZVxq5GBlBMGQ2dHVzQLpcjKekI1wo05oZm9w3BgA8uzhKSlrVK8D2UB6AJd2jrjNEqCjgDC3yiM9foGqvxeNwplbmRzdHJlYW0KZW5kb2JqCjM0IDAgb2JqCjw8IC9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9MZW5ndGggMzM0ID4+CnN0cmVhbQp4nC1SS3LFIAzbcwpdoDP4B+Q86XS6eL3/tpKTRUYOYPQx5YaJSnxZILej1sS3jcxAheGvq8yFz0jbyDqIy5CLuJIthXtELOQxxDzEgu+r8R4e+azMybMHxi/Zdw8r9tSEZSHjxRnaYRXHYRXkWLB1Iap7eFOkw6kk2OOL/z7Fcy0ELXxG0IBf5J+vjuD5khZp95ht0656sEw7qqSwHGxPc14mX1pnuToezwfJ9q7YEVK7AhSFuTPOc+Eo01ZGtBZ2NkhqXGxvjv1YStCFblxGiiOQn6kiPKCkycwmCuKPnB5yKgNh6pqudHIbVXGnnsw1m4u3M0lm675IsZnCeV04s/4MU2a1eSfPcqLUqQjvsWdL0NA5rp69lllodJsTvKSEz8ZOT06+VzPrITkVCaliWlfBaRSZYgnbEl9TUVOaehn++/Lu8Tt+/gEsc3xzCmVuZHN0cmVhbQplbmRvYmoKMzUgMCBvYmoKPDwgL0ZpbHRlciAvRmxhdGVEZWNvZGUgL0xlbmd0aCAxOCA+PgpzdHJlYW0KeJwzNrRQMIDDFEOuNAAd5gNSCmVuZHN0cmVhbQplbmRvYmoKMzYgMCBvYmoKPDwgL0ZpbHRlciAvRmxhdGVEZWNvZGUgL0xlbmd0aCAxMzMgPj4Kc3RyZWFtCnicRY9LDgQhCET3nKKOwMcf53Ey6YVz/+2AnW4TYz2FVIG5gqE9LmsDnRUfIRm28beplo5FWT5UelJWD8ngh6zGyyHcoCzwgkkqhiFQi5gakS1lbreA2zYNsrKVU6WOsIujMI/2tGwVHl+iWyJ1kj+DxCov3OO6Hcil1rveoou+f6QBMQkKZW5kc3RyZWFtCmVuZG9iagozNyAwIG9iago8PCAvRmlsdGVyIC9GbGF0ZURlY29kZSAvTGVuZ3RoIDg5ID4+CnN0cmVhbQp4nDVNuRGAMAzrPYVHwI9IvA/HUYT9W+yENJZOnxHKB2vkAYLhjS8h+KIvGYS1Cw8q+0h02EQNZxUkE8OvLPCqnBVtcyUT2VlMo7NBy/St7W+DHro/3Y4cCgplbmRzdHJlYW0KZW5kb2JqCjM4IDAgb2JqCjw8IC9GaWx0ZXIgL0ZsYXRlRGVjb2RlIC9MZW5ndGggMjE1ID4+CnN0cmVhbQp4nDVROQ4DIQzs9xX+QCSML3hPoijN/r/Nj
NFWHsFchrSUIZnyUpOoIeVTPnqZLpy63NfMajTnlrQtc4C4trwvrZLAiWaIg8FpmLgBmjwBQ9fRqFFDFx7Q1KVTKLDcBD6Kt24P3WO1gZe2IeeJIGIoGSxBzalFExZtzyekNb9eixvel+3dyFOlxpYYgQYBVjgc1+jX8JU9TybRdBUy1Ks1yxgJE0UiPPmOptUT61o00jIS1MYRrGoDvDv9ME4AABNxywJkn0qUs+TEb7H0swZX+v4Bn0dUlgplbmRzdHJlYW0KZW5kb2JqCjE2IDAgb2JqCjw8IC9CYXNlRm9udCAvRGVqYVZ1U2FucyAvQ2hhclByb2NzIDE3IDAgUgovRW5jb2RpbmcgPDwKL0RpZmZlcmVuY2VzIFsgMzIgL3NwYWNlIDQ4IC96ZXJvIC9vbmUgNjUgL0EgNjcgL0MgNzAgL0YgNzMgL0kgODIgL1IgOTcgL2EgMTAwIC9kIC9lIC9mCi9nIC9oIDEwOCAvbCAvbSAxMTEgL28gL3AgMTE1IC9zIC90IDEyMCAveCBdCi9UeXBlIC9FbmNvZGluZyA+PgovRmlyc3RDaGFyIDAgL0ZvbnRCQm94IFsgLTEwMjEgLTQ2MyAxNzk0IDEyMzMgXSAvRm9udERlc2NyaXB0b3IgMTUgMCBSCi9Gb250TWF0cml4IFsgMC4wMDEgMCAwIDAuMDAxIDAgMCBdIC9MYXN0Q2hhciAyNTUgL05hbWUgL0RlamFWdVNhbnMKL1N1YnR5cGUgL1R5cGUzIC9UeXBlIC9Gb250IC9XaWR0aHMgMTQgMCBSID4+CmVuZG9iagoxNSAwIG9iago8PCAvQXNjZW50IDkyOSAvQ2FwSGVpZ2h0IDAgL0Rlc2NlbnQgLTIzNiAvRmxhZ3MgMzIKL0ZvbnRCQm94IFsgLTEwMjEgLTQ2MyAxNzk0IDEyMzMgXSAvRm9udE5hbWUgL0RlamFWdVNhbnMgL0l0YWxpY0FuZ2xlIDAKL01heFdpZHRoIDEzNDIgL1N0ZW1WIDAgL1R5cGUgL0ZvbnREZXNjcmlwdG9yIC9YSGVpZ2h0IDAgPj4KZW5kb2JqCjE0IDAgb2JqClsgNjAwIDYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwIDYwMCA2MDAKNjAwIDYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwIDYwMCA2MDAgNjAwIDYwMCAzMTggNDAxIDQ2MCA4MzggNjM2Cjk1MCA3ODAgMjc1IDM5MCAzOTAgNTAwIDgzOCAzMTggMzYxIDMxOCAzMzcgNjM2IDYzNiA2MzYgNjM2IDYzNiA2MzYgNjM2IDYzNgo2MzYgNjM2IDMzNyAzMzcgODM4IDgzOCA4MzggNTMxIDEwMDAgNjg0IDY4NiA2OTggNzcwIDYzMiA1NzUgNzc1IDc1MiAyOTUKMjk1IDY1NiA1NTcgODYzIDc0OCA3ODcgNjAzIDc4NyA2OTUgNjM1IDYxMSA3MzIgNjg0IDk4OSA2ODUgNjExIDY4NSAzOTAgMzM3CjM5MCA4MzggNTAwIDUwMCA2MTMgNjM1IDU1MCA2MzUgNjE1IDM1MiA2MzUgNjM0IDI3OCAyNzggNTc5IDI3OCA5NzQgNjM0IDYxMgo2MzUgNjM1IDQxMSA1MjEgMzkyIDYzNCA1OTIgODE4IDU5MiA1OTIgNTI1IDYzNiAzMzcgNjM2IDgzOCA2MDAgNjM2IDYwMCAzMTgKMzUyIDUxOCAxMDAwIDUwMCA1MDAgNTAwIDEzNDIgNjM1IDQwMCAxMDcwIDYwMCA2ODUgNjAwIDYwMCAzMTggMzE4IDUxOCA1MTgKNTkwIDUwMCAxMDAwIDUwMCAxMDAwIDUyMSA0MDAgMTAyMyA2MDAgNTI1IDYxMSAzMTggNDAxIDYzNiA2MzYgNjM2IDYzNiAzM
zcKNTAwIDUwMCAxMDAwIDQ3MSA2MTIgODM4IDM2MSAxMDAwIDUwMCA1MDAgODM4IDQwMSA0MDEgNTAwIDYzNiA2MzYgMzE4IDUwMAo0MDEgNDcxIDYxMiA5NjkgOTY5IDk2OSA1MzEgNjg0IDY4NCA2ODQgNjg0IDY4NCA2ODQgOTc0IDY5OCA2MzIgNjMyIDYzMiA2MzIKMjk1IDI5NSAyOTUgMjk1IDc3NSA3NDggNzg3IDc4NyA3ODcgNzg3IDc4NyA4MzggNzg3IDczMiA3MzIgNzMyIDczMiA2MTEgNjA1CjYzMCA2MTMgNjEzIDYxMyA2MTMgNjEzIDYxMyA5ODIgNTUwIDYxNSA2MTUgNjE1IDYxNSAyNzggMjc4IDI3OCAyNzggNjEyIDYzNAo2MTIgNjEyIDYxMiA2MTIgNjEyIDgzOCA2MTIgNjM0IDYzNCA2MzQgNjM0IDU5MiA2MzUgNTkyIF0KZW5kb2JqCjE3IDAgb2JqCjw8IC9BIDE4IDAgUiAvQyAxOSAwIFIgL0YgMjAgMCBSIC9JIDIxIDAgUiAvUiAyMiAwIFIgL2EgMjMgMCBSIC9kIDI0IDAgUgovZSAyNSAwIFIgL2YgMjYgMCBSIC9nIDI3IDAgUiAvaCAyOCAwIFIgL2wgMjkgMCBSIC9tIDMwIDAgUiAvbyAzMSAwIFIKL29uZSAzMiAwIFIgL3AgMzMgMCBSIC9zIDM0IDAgUiAvc3BhY2UgMzUgMCBSIC90IDM2IDAgUiAveCAzNyAwIFIKL3plcm8gMzggMCBSID4+CmVuZG9iagozIDAgb2JqCjw8IC9GMSAxNiAwIFIgPj4KZW5kb2JqCjQgMCBvYmoKPDwgL0ExIDw8IC9DQSAwIC9UeXBlIC9FeHRHU3RhdGUgL2NhIDEgPj4KL0EyIDw8IC9DQSAxIC9UeXBlIC9FeHRHU3RhdGUgL2NhIDEgPj4gPj4KZW5kb2JqCjUgMCBvYmoKPDwgPj4KZW5kb2JqCjYgMCBvYmoKPDwgPj4KZW5kb2JqCjcgMCBvYmoKPDwgL0kxIDEzIDAgUiA+PgplbmRvYmoKMTMgMCBvYmoKPDwgL0JpdHNQZXJDb21wb25lbnQgOCAvQ29sb3JTcGFjZSAvRGV2aWNlUkdCCi9EZWNvZGVQYXJtcyA8PCAvQ29sb3JzIDMgL0NvbHVtbnMgNDQ3IC9QcmVkaWN0b3IgMTAgPj4KL0ZpbHRlciAvRmxhdGVEZWNvZGUgL0hlaWdodCAxMTcgL0xlbmd0aCAzOSAwIFIgL1N1YnR5cGUgL0ltYWdlCi9UeXBlIC9YT2JqZWN0IC9XaWR0aCA0NDcgPj4Kc3RyZWFtCnic7X1LjCRXdt2LiPx/qrK+XV3VXV39YXdPk6KG5HCG0syYGluGJRuGIAOSbMuQtfLCgGHYWhleeOWNYRj2xja09EoGDMMeWRqNIJIz1AxnOGTzT3Y3+1dd3fX/ZFb+M75exD33vs7MTowTBgwD92z4mPkq4sWLl9Fxzrv3XGd7e9soFAqF4v8Q7v/rASgUCsX/l9Cnp0KhUEwDfXoqFArFNNCnp0KhUEwDfXoqFArFNMiMfjS3eIbbSZKkDcc4/Bn9x5E/Sdxk6NvJcGL500n98KV9Lgaf08XYeLSuQ/8qHB6fcP92u502qjPVtNFsNtPG2toqd8t4PCd0EGfc2R182mh30kbUb492+2vf+u20UYp6aaPshBikHNfzPByXj09nL8zMcrd/8i//gL6tFNPGX77z07Rx+/O71L9Y5v6XLl1MG29898200Tqop42sx71MsUITMuPRJew1jtLGk04gg3TzaeM0HNAl+N20cWN5ibt1qzTyWfrS3D9ppY1OJLe7NEsnvXL1etqoFemi/vA//2szgn/6b76fNgYhrR4+WCyL0zguvxAMr1gbfJddzHwiMy9Hc11n6MMER8tk5LALmMBCPps2jpt0yV0/4m5eQiN3DX2Yz+UxV
jp+t9fn/gPfTxtBxJfMa9IepIcGfes59Ml//IO/Mnrtf/hH/yFtZHM0jFI5Zx2NZibj0QVmsVZOTupyLZi3bJb6xwEt7KUlmo1Wq8P9j/bpXJt3aVncfP9B2uj3B9ztyvWVtPH8i/QUavd20sbikvwQ3IDaQYNW+62bj+hEBw3u9osv09L6/d/9TRpbrZA2/FjGtt8+ThuHA3ognLao8fDhJnf7R7/3z83T0HdPhUKhmAb69FQoFIppoE9PhUKhmAZjdM+Maz1SJ8iS9oPX/bnkTjma8/P157+DyBNbEiSfUw4WowWl5uGDx9z/+997K20sLsyljQwkm3/w+78jh4V01e2SQBPHpDpVqiIpQmI1nR51K4yVR9EtCEn3ibKQk3JZ7uZBbLLkLChuniiULKHNQbr9tV//63T2HAk6H314i/sfHxymjavPraeN7ZjEqSQWPa7n04cRhLluL0BDZDhj6MNeQEJVHpeXtQaZwcLgm1WCLDg/J/Lo4upZupa5hbRRLcqEjML1SagatGlIA0xpGNlTzyNJhv9rrToXt97LQLYbp3tyK5OlsWWzdHnVaoG7hRFNSL1O6rYf0pRWcnK0HIaWyZDOmGBlD/o0t/avystgQjByBzfN1uI9j/6Hdc/xUj0QxTTarAs5NZaZyRfopDnMTCZD457BqjPGZDEhLSi8vKD6PTra0b4snp3HNDN7u6Std9v0SRjKUrz1yb204fdP08a3vnMjbZw5U+Fum3doP+OzD+kHfrhNR8u48kzDcpZ72mzS2bNFuWQPIviVK1fSRr1Jxz9tHppnQ989FQqFYhro01OhUCimwRjmnlhhJUxahRQwD0os9s2vyGYSZbDin4YOZjFh6zWbQxmaHWJt2byQuyzet0tF4lASCOXT0fYPJGLpB2++Q6fyiSX9zu/+nbQhFMmYQUjf3vryftro9YgUfOUrV+Xs+JNbt79MGy995crwBRtjImIl2RyN9rhJYR/+0TH3yoH5etKg/mWL1/QHNCFhRMTw8tVLaaOQ+9W0waTbGLPzmHhNAeE1RegGnidBKsxGDSY8k6FImn6/yd2wFkwCqpggqCUK5KRRSEfDNJtytZY2rlx7nrvNnaGQlABTVMlP+recyWWM8B3DjVAi4ELQUu4mfxhLNw5s4gkPkwh/KEsxwtiEzuO/OSvmK4MJiSM6bKVaShuvf22du72AcBwXi6HVJG7b7VBwUrPtc/9Gm+7yKcQKkF1jjVECtlyPzh5O/BlmoK1kMtQtCOSkgwGdK5+t4FsaRj4va2YGAWdJzGsA3XJ07af1Pe6/t01MvHlKN4ifM4kscJPENDNPHtHPxItn0sa5M5e42+bnn6SN3W36Efl9CA6W/LN6niIR5+dJrAu7jbSRLcgM+i265AcPKOwvMjTI2ZroM6PQd0+FQqGYBvr0VCgUimkwjrnbT1ROsRi3I8mI8eHYbxkhNiI7HdqnLpXpJd9zrdwXHGP38CBtfPzpF2mjUJQX6cUF2qvdOL9GB8FXOzv8h59z/3NrRBXDDr2WL8zR+3yuIGc/atDY7j54mDYy2HxcXT/H3TJgfLfvUcrEWOYulBbs2MEOZhLKSZlq+QH444DIVM+R+8F3IRxRVJibXL0qBCcKiOntfEmUZHubuHw+a1GSHHG0sks3yMcuvA0P52LmzukodgwFd4uhpLAqUy2VpFsCyozN2rw3ZjUyrB12+iQM6Pi8wW2ssAFGjE+iyPoqBNf26ENeuo4lIrkiF0RDjU7Plp2S4QaklVpR7vIvXiYSOjNTxNF415saoaVCtLq0Bo5PaRX5fnaovzGmO6Ah9bBmTiz6P4pSiYYRJySIWZmEJgzoEnoItygUiLDH1tZ8v4d8M2943vr9PvrIfak3aLO7dYqNeNwXT364In30W3QJH/2MBLRkIIN8dI8IexDwA4omIbCCSVotigf4EipchK1844nWtHWyRa0a/W2xQpc8CCQlaRT67qlQKBTTQJ+eCoVCMQ3Gc
KV2v8ftGG/jHDEbMbU0wh2YozGRZJJuh8U3EVj7xa07aeM6drHnQKKNMbu7+2njFro9uE8kulgQvnkMBxB+oe/BsOPdd2+mjZ/+7Gfc/8IS7XgWIBckMbGD0CJrPZ+YRR2v/efO0c4db5UaY27fJi5898GmeTY4HiAxdK5cHsYQlsqRwQ6+sGN8lbXYbgiyw9826o200QYzsjdGc2iXsUOaKdHZ6w2hJD52ftcXicJnsHtrR1Z4EoxN/5VdbOs2O9AXmL3mMW1nahLw3IOmkSDIIWzKwhsFn8sOzhgaj7G2gKU/Js0mnszvJQ5knOgkBJnnAd1skxc+iDVI+iS05IIEPwo3ZqcYbH+7tAAKOemfBykuQvbJYQUWrB8Cx7rzGNvdYfnCxnOXyTvji9sfpo1OVxZDWcS0ABcFUhwIE+/gt+ZlmLlT/w5+OOyxYizFg29HAgnGsZ5CRezXByF9uL1JP/NuXVS4cqlG1/IcPUC+vEu/R8eVa+8jWuYY8S3FDIbhijVJEND69xy6BE4ZaJx2zbOh754KhUIxDfTpqVAoFNNAn54KhUIxDcbonn/8529wOwcvgCL0O053ia3IAA6qySO4gRWmbkeEgyOoD/cfUojAA9RDXl5a5G6PnzxJG/t7FHgUDUiPmK2IcDaAqJFAWmLd81NEOO0f7HL/yyvLaaMEjwYHthv3793jbnUclu0/6qcNGphVvfmDjynb4f7mlnk22siSKheGzTOOGqfcjaeLA6FYMfK6MoEHJ6QBXbzxXNrI5+m+1APKzWjD2NUYs7ZOsVwrSxTd9eIN8lx49FCu5Xt/+kM6ew4yHGJI8pbUC+VKJpxdsQNf4j8M0kXiiKTe9iEJ2e/8xZ9zrybyZgb4Wxemy//iX/1jMwK2FjZQq9mXwo4x4uAbK5+Nw+msw42InKNRR8aYJB4WEJ9KsRsBf5mMqK7GmAShOY6XHTpaPO5aYijIAYuuCPPKWYbh8YiFOec+jcX1Sy+kjQeIYzvtStpbOyQR0KlSWJWBUt+3LGM4144lex/qYSFPZjrlsuikM2UEaXWyOBHMSrIy2sV5sj0eDGh55JD2dlqXs0ch/axe/frXaGx9+pkcHYivx6uvvJQ2Xvs6XXK/Q1faa0sWYrBDP5m6x/FMWPZ2JOUI9N1ToVAopoE+PRUKhWIajGHut+59we18gV6bOVqFjQ6TgbyWl/BunysjsMnQt4OeEM8TeHY4SIpo7MJHoC8xE2GHgm8yeD+fLdFrf8HKEIjhMnl8TOc6gbvio0d02N6x1BpyfNgTYGwnh8Reb38i89AF1Sp41L97QkrCvZ4QnEGPXvJXlmrm2XDAodj1QzidxR4joXzwXEA3z0qkOUXIl49wnx/+4Edp48lDSiL6kz/5PvfPVSj+o1SghoP8nDAQ4SXBPXWQeFMqkrhRQ6iTMWYwgJsnZqsk0SGWJyYYcgYZSFGXmNEBxm//gQO/kjnc5bEYYM0kIScAcWKPxY4le4dD64aNPo0xVtGq4aJYk7n52MAmyVOSq0Iuk21NwnYeXImLk7Tw+3oqayvDDUQEwuDDtQxVY/wtvwq5/qRLWDlDes6F85SW1uk0rJPS0sqAtLJcYPsH9ZHGli9w9BVPIH3S78mvL8Z687t0/KzHvh6WOhSyyQvrRPjKOvvjLfrlss1oGYF9dYtrH+yTnBVB6IgxyEEoz6UwIk3AR0jWAI1COW+eDX33VCgUimmgT0+FQqGYBmOY+6+89iK3rT1B9oWkB242lidvGftiCfJcAhjkZa09x7hPb+PNFn3YbNL7cy4vhKg2T3V0e3jz57SEYlFepAvYEwwdent/462P0sZJnahi40j2tevH9BqfzFL/UoVe8peWZ7gb+zxeXkVh1QYJDi64hjFmbYV2sZ+/umGeDQfpFuwHwWS3XBCimgjBH/73LFuWciBsDtI4pQu8e5c8SronjbQR+JJEUczQDmaIErWtFuoiWPunNQQ8RE2q/prLU/9r58TSt
FBAwlKNhhR3aBjtWw+4WxeXkEMABtfqqDoygayfRBGdq2K5rI4ixL/0MWxsIhhqxOMcadmak5m7Y70ruM9+bXiamo/Zm8f47c/YS5SHxNaZIrwEYK+BSA2cywT2bZ0wRnhGDPVmwDc3lH4hfpuc/lRv0mHPSiTLmIvKoMS050g+W7nI8QB0kAGSD9nCw1i3z6DBVjucPBZForP1+yS8DBA/U4AqyHfKGNNu0wPBRzVmvqFFyyEowgNh8wEVIi5XykNfGWM+/JBEyJUV+iGsnqegnZ4vUuEAWVKs9nDgih0PMAp991QoFIppoE9PhUKhmAZjmPu5srwhM98MrNILKXhb1hjZ/fTBoep1Dl6tcy/Hp6PdfkQbxPuHFNqaWJ4ja+fIiHN9new5MijIEVhml1kEir93k8wO3v/JB2kjRAB2aNGwAf60uMgMlC7huCOb6Qa8I8DcdFp0CeWqEPxcib7OeZO8LSKQHXaLiBLUYOgId2BTiYzspWKD26pb4Pd5T5wISBc1G5hwZnOy5+jD/WFmlmMnWCKQw+ZRrmOArcniLJm2XLzxAneLPQQ84yDtY0pnODDC3A2CMcCHjAcDykFW7rLn8E4utmhHrDltzBZowtvo1ue1EMjF8EmlDqtVypW7sT2HM1JyJrYkqThifoq/FacUm7vzjjkNku1yvIyMjUticAnSCNw8wtGsu22Y1+8f013+/o8oreOgLr9H8d7FJx1M+L/9Z79uRsBGP46hVXH1itzls7DBzcGa5LhOP9Lt7U3udnxCeSjtNv062KuXl4dt/1HAr5VTVDi0gffNjUXY+YHj+zRXNnPP4YGQy9FPeOUsDfsAKTbGmC4Cfn70zrt0dev0w5mdl8UQuPQTdlBtZeDTIDPZMU9Ihr57KhQKxTTQp6dCoVBMA316KhQKxTQYw+pPmyIcjHrHspAYWuELIeTOfo++/os/oRyY4y05GhcBbfsUN7N0Zn7o+MaYB59QnMGTW+RiUF0iGW7+7DJ3ixwa/Ps3qf/BNp1rgHCcvhUv8sV90oxq51AXtwz9LrAMO5ApwYV0ogzJIn3LCyOISFL0kQMzFi4GmYPm5cPkomQZcHAWijdqS2zlTvS7fRyN5J5KhTTcV19+LW0sn1vi/sdHpEkVCyT3nJwgFKMgZ7/70Wdpo4UYIDfi+y7deC4zWZYsUTvasoyZgajX68MdGdlBYc6K/8CRE0Ozyj67Y9FFtRw+bIQ4njAUCTIMOSqIvo2fzjGiC+T8HIh0CeRDJ7HCqmBjHENPDeCS41shLwZ+KC50TB9a3kcfyfIo5WmZLcxRgawwhsUGZPHQUj75Erb3aQX+9FNKojuuy2GdkUYUy7IfRSZLcufLL5PFRsnK8mKjH7YZZvuPdvsXudvWFoUK7e5SJl6Y0I+ajZPnarJ0l5dJtTzZozQhLm4WibgskZFcTCyPPMbQCkVaWKR4wRwKEL/+K99MG7axS22GTvpwi54kT/ZoAk992bZZXqOnUOuEcuHOrNToRPOSazcKffdUKBSKaaBPT4VCoZgGY5j7445w7QyMClwwylhq4VoOgwjy+ORjep//8cdEBlfLNe62u0c+j6U8HWTtDMUAlUti3DmLJASWCfpgx4OOhAd5qKPrgf54GEa1SMETrZz4FNy5S8WRrn6NeJMDKYFtAowxyHwxUQaMD43EEVLQQ+DRIJzEkhwUSuUUpgJiZc7WJP5JbD2d4X/P4oLkgbgI1gkRVrWKmktr6xtpo7pQ4/5//v230sa5C+fTxtwiTWDGYu4VhGW826bpap4Sx9z88kvu1o9pkHzrfeQaJYEkOLkZuq5AyvMiYqkr3XJIr4oDVHyKJv1bziFfPoejQUrwrSq+XNI5ENJNX9lJRBZzH7YL8VxhiJFPVK7fg2sqvhz0ZWkFbYrpeW6JKHALlYVufvqIu/UbVBf36IRWbD9LOTDFxXX6w2P59YWwzMjXyNeDM4ycvJWXFQ7/NqNokgbC7HhhgUQee9WJW
wqSiPJgx/k5obGzVVp4156jQba7R2mj16NJu7wuHppvDChm6NYnT4bG41qJX9zkkLIiVIWu/duHlcnGBs3by698NW2USjIzW49up42ViJg+a3Rdy+To6ISOXG820kYFmUv7e6Lpma8MDVzfPRUKhWIq6NNToVAopsEY5n4wEBNGZu4MfrG3K98OesRn3nqHKgA/ekJ7W+U1eUAHfTpyFft6kU/7boWakIJ8Djkt2MHMJpy+IhytjT27sAdHzgxtsa1eJqbj+8LCTk+JE1VmUZEYbqFxYLmL4l8U9hN0wAEda/vb54yX6On0kKfBRgkDzFsJFD5nSR9WJYVhx8zIqrCagQ7w+We30sZxnfjjBx8TSVm/uMb9f/vv/3ba6PboAj9DzZKd/X3utn6R6E8m+qW08Uf/5Y/Sxu6+ZGFxkAO7i5agaVTzMjNNMKwBuHCIa2n5QpfcGLce1V+7feH1o+AtVy52zRTeZu5ByDldI/6eFpinu7inGaTW+EzSjQlgWuE6tCYdBAZkinLPCrhrV1boWrZ7FO0Qzojw8vIcneLtW3SzvGW6WfVtYoiPb93i/ghtMEuXaHPcYbXKyvSLxXuFhsRpQmMRcYgCJ+9YkpSUeeZ0LPZnsVa6BxmnkqWjzMzTFEU42rlVmaKdLVoVb/3F+9QNR3OsHDDeMe93qT+bAlu+KKYPtacBO49Hj6lATtcyFf3LH5Fy9cJL19IG61q7hzvcrX1Iz6WlMzS9bHT7+InU+RiFvnsqFArFNNCnp0KhUEyDMczds2wWY/H35K324c1KY2XmP/yS3p+rWdjtWSUhXYTdcqEIF0UZQ2vT9uiA2CJTjBgc5qgt+26tDqKy4efhYDORS28WLEfOfJnIzsLiDE6KqpyBHNZBSUgPlosoNGl8y68wRNT0oD/sn2JD7DrBwjIIDMhYRAjTIMzFqhghrOosTEWrKLkxAJ9hvnz7zib3b7aIsG/v0n15600qn/kIRi3GmJVaLW28eIWcVfMwX0himRk/JLrEzgk5BLpnLU0j4h15XHwR9RSX58Rv8uiQOFcXwog7IhPZyGIN5DhWn8007R1m3rS1K2Kk/7HjGUY24uNBg4bdFuXKy9GeuOvSQoojmhDPuuQsVKxTsP6Fs/SHLcvOI+7QWZ+/TkRyF5Ujtz8nRSXsydljEPCDrQ9wpTSMWaSZGGNmVqhdQE7EV18Q149RsJ2HZVJqiRvC4ocTNzzrJ99BQkoPa6y2BNqbp/vY60lIP1eCubx+Hh/R1O/s7HE3rj3D52JPW9tqNcRv5+HmZtr48TvvpI1vv/4N7rZ2gaJrthEkn4XeMjMntrmNJoq+sHEJ1n/ejm0Ygb57KhQKxTTQp6dCoVBMA316KhQKxTQYozSFvi3kQXmExpRwnE0kisDxNsVndBukhrz0ypW04TYlWH//CWmFuTwCLyB1nZ5IZEwDhsoOJ7cU6CnPZXmMMbsHNE63SB4iMQJHei06aTFvZdSgXcRFhS0SWYK+iLNc7IXL5hjkWhTtwjsQzOxTjAFmK+EQGdgfBAOZ54yY747a68rxFxboSi9fJYHyDKK1/B6phxzIZYwpIE/j7pfkXvz22z/GNUnIy/4WpX+UXAlXoWGHlgcKsn1Yk+JLTyxbCm4FEChLSB6bW1vlbkmRYtROm6QVciXqseBqOTEaCd8gq4YwBypxhJMjxYelm+MiE6nfSBv+6SHGLy68iaHJHAxQTBuWFraVczugkR/N0JWu5+ggrYas//dws/7uP6RIsg/efY8an5GFzdy8ZKAVZ+n2ZefpZpXmSa2rrYjuWV6oYki0Pk8a2+bZyIg386Q0OQbPrmPF2O2hlvg9pPD90ne+TsMuFXB8KzsI8uU1aJEZpJa5ViWuCFsjESR1Bzc0b8nitXmSlWs1epLMzVGjWJaFfeHyStp47yat8G6DVNr1yxLYt7BIcnz9qEFjy53gWia9X+q7p0KhUEwDfXoqFArFNBjDOk8OhESXK8QdcqiWE
6DwSNvytdzfpj8BqTLlGsIdrAI6bWQKnTSpX88nuhRZngu1Ik6KFJwAqQVuKC/5fp9ewtkekAuktFFDuGS9xueRJVIEg5sBEw8sJ44EGTVxbjiew64FVOH/cScxd/brzJfoFD6CVBIrmipEQJO4sXAFY8u80mdHSyRqVHGD6n3iv6WCjPKrL1I94R+99WbaKOdpGJ7lmcFiAtt0HoFNFxIrrMoZDmFxxfXVCicBYefD9hBJ9ujgSI7mQSEpcsWbMUlBDLkskKkY0SceCmIbY0qY5xxsUFzc7sO6kOjtA1p4XdyOQUJLK7LC1wYDGnAAuxCDdKnQso5dXqWT3nj5Rtp4+Blx50d7ktPVXK6ljU4eiWfLxEDPP0+ahlcV3WB+FQFqS0TYy1VquAVZPAO4i7YRebP3aNM8G5Nm+Sk4T/3nqZY5PqKfGMcXdhGflEPaYMGqRHT9+iX6Ft32H9PMbGyInnP9JVqxIfxwe3imnD8nXLtaRQ0lZCHOI4lo4Ity1Q/pqVKo0GKoH5IyUMcjwhiTheGp79Pc7G7T8jh3oWaeDX33VCgUimmgT0+FQqGYBmNYZ9Cwsh04zaCMkrZIRQh88cRswqsii4oRRfSvVGQP8U6RHtZPDokQDbDFVvCEIZ5bpp3l1SWqMlrKEBmoJjLgLDz+mshPKGBv9/SYTnRiFVIuVohHzCPXiHNP2P3fGDNgmwlQMyaqcTKG9CTO6GeC5bNn00YGM5PzOHPDcgmBhpBFHs/D+5tpY3ZOJtAHBeZx5EFwlpA7kbWyI2JcPhsx5HhP38p0isG7M3BvyaEqtX9qOXLmWAbhOrq86y3Xwsft8eLBsIOOdTSOo0DAQ2kipfzbv/YLNHIwcQfFfos5ueQAe/73HlP+24P7RKJ539wYEzu08LLIg/LyZHYZB0L9EpDiJM7hWuiTalUUkr/xay+ljRsbG2nj1s9oJzrOygqcO0fn+vgeOWWUZuiw3/hbVPTCsXxXHdxcPhMb3Z40xb2ijQS8Zpu+LXuTqsWMltt5BpuHPgORqnEs0scHNz9OG9uPqTTx+nMUB/JKjeSIrBUusnqefghZnH1hlXa6cyUh+GsblIk0u0hBBREWqrX8zPERPUB2d8nsowDblCc78vgagLnnIPKsb9AwmlaARxZhNvPz/GSgo/U6E+vuTPhOoVAoFM+CPj0VCoViGoxh7pfOnOG2i13vDDasEzCz0LJ0rJSINrKjfQ18c3lGulXnic7Um8TgVs7R2/svff0Gd3vvJxRC3EOVgtU5KqWZiJWhyYGn57GVzxYbXNWvFcn+6TdeJ2uG2gIF1vawPedZ298+73GzwwcOG1oR0rLv7E76F+jatWs4BthuFqO1yyHIYamxjlIlc7NiZ3AKu8mfvXszbVQwCR3IF7/1936D+9/78k7a6GNCuOhjxuLaPgi4izKfpRk6e70pBCdy2J4DFVMQA8Dc3BgT4hoCEPw+9qkdq4woT2AIAh5YNp2juHKJONcANqAhpu0YIdDGmB+++2Ha+Og2xZ83ThHkYB3NhVTiSRYD+Kw1yBxIaw675DNz9Mn1G7IFfOkF4puHO5Tocf1Vigm/khFjlMsvUApJoQgdDA40PmL7j6ywhE6bNQQaZKfXQ38RBHJZ0rX8Pn1bm5kzz8b+Lv2sVlYhVtgmIWiMBsk/eSyemB98QMz95JAueRF1Pr5y7TkaxplZ7l9CWPv50oW0sbBBoeyJFbCRxWLgX2SGf/LWr28WP4rE0PSeoqjG4+0t7taBoXC5Rnv0DtbwIJYJzCOAIcbScjg5KJwkJ+m7p0KhUEwDfXoqFArFNNCnp0KhUEyDMbrnbEUSbxy27UWgEtvE9gYiQ8wgPmkeNUvnF0l5ybkS2OQhIKaC4IPXvvNK2vi6pXuWl2gAH99EER4kNjiWgUmuBlPkAHE8PkoSQchZWqlx/2/+ChWH8RD5kEAEyVi6J0fhcHwS58xYqUZiF/1UodsRHNUbaNLYBi7cLizdkwfAn
51fJ1ntnlUTeP+Y0jNuvEBy6nafpvcnf/mTtPHat17h/n/6v/4sbbC7CttRZy3PhQwSyWaqsFqAfr0TSmBTkMCWxRlOJMvZ4i8mJmIBFF9mMzJXAfpFbHJsJs3kf/vvP0gbTVxLEyLg40Ox1z2BQQznZXHlIs+z3xUQicL2LLClsP1wa1hji7D+PbtaSxsry1KJq9Om1KzMDJ3ipW9fxGVa/ilI3Oqj9k6nTpfQ6pJ02zwVDZercnENYR8/urUl2ZzY/ZJ+Hc3jRtpYvr5gno0dGGOfXYEma63hmJc5r0U8A9rHEgxUR/ugTtd+7x6CtJAZmLV+MFJCGU7SLixsnrrrXA8ZJ42QVtdG/psx5rSJPENswxy1KOWp5UtYVQ9lhwMs48EAps4D2RHhwL6lWS7RTF9lspPWpL57KhQKxTTQp6dCoVBMgzHMvRdJeD0Td7bCyIL+uFnZy5+p0Dv63ByR7nkY8O09kgiMbpfekFcuU/TJheeIgLRDIQUXrpNrwCLimdqogdM5lW4BmMWHH9xNG/c/IwYXwGLjyvkl7j+/SOSrD2uSBPTNs4rgxAnicvifFglOskqnss2pXad1BC3LswDHBzeJ5aQO/BTYHGTrIfGgXkeo3BdfkJRx9879tHH12uW0MbdEV3oHXxljXn71q2njz773Rtqo1oguhVZ4ECc43f2C/vYQZWCLFQk6KRbp5rbhi9pE6kvGKi00a4ijJQkSyeBTGVnVmyOEjMRc8DkesxoZb7xJzqRcCttFhtjW7iO5lvww3/SQieRadXojqD0sYFSQO3RhQ9bMiy9QreYNpMrMzRRwNOGlLXjcHDRoaTUQItaz3HK7iCjigj/9Abg8ZjK27kuIQfo+ql2h1lbUkplcyhJP34Sw0z6aVEf38gZdFN+zp2oCc2Ok6FEhJyl5XPmHL5CFmkyGb4EM0rIaoRnPcTcrliwZKaTGcK3MJQ5uO4Qv8OYOOXjuHsoDp4eaY+wflGChrp5d5m4ZHLmE2K8BBLFqtWieDX33VCgUimmgT0+FQqGYBmO4Ut+RXUKxXOSqDODLGSOv1vBUNEtLlGLEe7APH+5yt+M60ZlvbBBhL4LyD0Lhp1xgI18lplCq1GgUkbxIx8jk3z2lXbab71P9iaAHK0/L3zOCgSMfnwdpl6rNwSyS6T9bmsbWPzZsbRklkzJkuEoB71MH2OAbWAapPuob877w1ibNW9PaaiyXaSu8DWL48AFlVvzVX/122vj3/+4/cX+upxrhWiJsPnLshLH2dlutRtpgXl9BbWdjzIV1yp9hd4nTUxpb3ao/MeCiykzXpLqycDSeSq4j/VTKywgah0TNqrNEVCMWRdqSENXhCsDYLZ1h50eJ/jAxVn4ebqEvvrSRNn7zt77J3S5fpA/LUAl2UNv20a4k3jw+oPb+Ccp7RHT20PKpYZIbyO1AGhvntFgaiIft74xDNyhA/ZV+JD/Sb7xMNXgfwzujmEx6K8piTVqEWb6V4ticb4P7uAL5whhz5Rr5dT54RCvQlbuMTo4tCCCViz/i1TEu1oLXGB+2UpEgB67oE7s0M3vHKHKeiLzQa5FUkp+nS76wwWtYJrBYoG9DhDQ82iRnmcNJEoi+eyoUCsVU0KenQqFQTINxNTUd2SmTt3c0ODTd8eV1P5JCEXTAEGRwf6/B3WZR/G/tEm2mD2J2cLDJA51rEIHOc0C1tRPHvJv3Ul3UiQRHN7m8MHfHwyXg+pKEd4flX5GY99AxIt6Ss7eM2fTQjSf9C9Tv9XEKDIPDs60d/MGA6TxTZiLpHWvPPYuTVhHWPjNDU5rHHmjWKvzZgfNjEcVOWBlwnTHD5gtkSl5dEqnk7DJtU/pgoItzlBMRWpT8cZ3YTnOX6E8Xsc0Zq7YJMzKOd4hDIVOj+PYr19PGXofO/vkmccangvCxzeqh4Gc+R5ewdmaduyUo13p6RJYZ2YREpxlrm7XZotiD935M5/ru/3w7bXQCEV42bsBuI0cT6LNzj
bXvzIEaScQ5C3TX2IWHyaYxpokIkwFrR/hZLS+e426lAi2Gi9hHnq9Oil7IWHaoKRzr9rHDjhSVAbGdOyPmI6/9MiVlfHDzo7TRRTHXBhbPwqoEbIyxEGWJYNyeu4yNf+eWRMZB7xEChDwUehn0ZGFvPaCbO+jTr2lxka5ld0eElzXU/KjA7HVhkX5Wjx5JOMco9N1ToVAopoE+PRUKhWIa6NNToVAopsEYfSSOJMaC1T0OT4ojjmGSJy9HYJSryDeAyGhbP2xcIz/UuTMk9wQx6ReeK3EGrIg4LrJQoH1EA0siCUgDYi1tHrpqF2onZ9EYYzyUTmLtNAzoT52MpXuixqmBGMq6p/eUVohBToyzYYnQw0xm4P9q2yqzfMnxTA2Uz52bq3G3gd8b+tsGQoXqMGuwY0Ly+eLQt2fP0i14Kl4KstreHkmWDq7UVlEvXCAPYK4ws79HupIdsbRUJbUrxMy0MOx2V0S9FhThAuxvHcuwdhQlj5VEik8qIkGrb0UFZVApyEN6SSw3yErucumSZ5ByUlrEJBw/5m7bD8n693v/leyoe6coqHsshbtPML2XXyYBlKfIdUTqTUK6NTFU0VaL/rDbpdkIrVAk1qYLEPTbnGsXW6F4+EleWKGLqRVtQ5thFBCxFLMFjLWGn2zS5fNP/9wl8jM2lrPMjV+g0sGv/5XX0sanH92mIzwhvfviVSk1LBbIzkjo0kSwEGor9fVGI238FE7qXyDF7ss7cvt6yMjqozyRg12NWSsUr4/J933SfEsVehxdv3F5wtj03VOhUCimgT49FQqFYhqMY+5WZABcPaW2CQfNJJ68es+eJS7ATLlQo+fymQs17jY3t4BuoDBSXcc2RyDyksujCA8cGWyWnIXdQCZHfzu/RHSmVAI7thgMx44EHBkDW4rEOq4n4S+ILwHVz2TGTJdXmBQdwkWSmSmfNoYjQmywESfHDNmBTdncMCPjlIwvPr+VNk5OrLQfBHZwRFQPfNl1ZNj8IQdrrawQA63NS5DKrdvkNLq2SvS/XKVAkJUz4rnAeVDLdQr3OWkT37SjfI4QiVUsU5ZIwZs0k/e36Wg9UPhL54gY9vuSRXRySvk2ffiz9GH4uLUjsV8zC7RUXvwahTFdep4Eh05Pur395idp4+wiZcdd/xYV7Xnv/Y+426f3qYbS4gYpMLNleJsOhIn3kSkUQhzjWKtyicYTWpS836H70TyiELy9Bw06fkZ0g06X5IV8hn8vwzFJNqKRisT9nigqT+D+Wa3SfVk4S4shXxa2y4XLvvM6pWblEDMkOpv1s+Ifuiu63BjJi4dk5SY5Q4c1xhTxs9rfJ2MUzg6qH0viWQ6LfBW12s4sU6zkvhX7CAnQZHO4HWDuuZFfnA1991QoFIppoE9PhUKhmAbjmHscWm1qlGCjz8kAgbU1P3+W+B1vizW6RJdKc5K50faJYX16hzI3TpvUrdsZcDfeXFtank8bC4s1Ohq2WY0xCzXiDqUKskTmiUgWS3RdrsWOmRRIylDEXN7atBVFwh3+Q09mhrOYeHd1LE6OiVVlc7wFTHPKO93GmAFcQvhotdosPhEWxkIEHySECnGME/UHMpOFPKcY0UHKoMm8HW+MKeQL6MYFeGkYeWsCGyh63IBxSaFAB1lfkUIR87gdL16mArxH2JE/AoU3xlRRGoGtLb2J27An7P6A+sZuhzjakpV4U6vRyPshU3jcXCujLI8V0urQkO4+JheS9oHQ2NN9OsV3/uZ30sbiItw/LenjPv62eURXmvSHtSxjzGyNeH0OFi2823sIvtk6FN2g36BvG2j04JD7JHuPu23dJUFs4zzpJ5OZO3vIupDL6ifiiXl4iPycHt3H9TbdoErFelyA5F7BrnRlnvoXWIWIhB17UL1YQONni2dloPHjhQl7gkE6VtbWwhyUpQo1ui2qkOxYjy/2YOVMvJ0n+0OHNdbPPwdbogSBAfHEujv67qlQKBTTQJ+eCoVCMQ3GMPe85
axhuXIMO+Z7Vhx1AZtx9+9tpo2PP6TQWSeRfbrdHdo2bcfEU7oD2hj1fXnf5sj5TIYIfhlv4FWLxm6sk8NgMQdDjTYCAzA2e5e83ydKG4HtMke3LzkHzxEu3sCv/fauH09Iu9k2PwdiVgkQ2m1Tfg787iKenEeey8kldHs0XRwtHyLgmV1FFhelniIPmB0c+A/zVpWFIvxZWaNgQWBgOXeIHSr+0e2HxOnubYqZQgXOF/Uj2t8sw9NkvlbjbjN5Ivst1Pk4qUu0wCi8PO5yg1bRk63NtHEwc8LdVtdITCjO0rVwJVfLeFIsYzqndPt2HtN9Obov8sLZWYou4KAC16XjLy2IWFGrYqt9lm7WlasUYW6bV27vEEHevk8WFd0jouRFxMM/f04Ou/4StWM40bCZrGct7GUIXLPIuUhGylo8Df4t0+LZeiwR5ieY3nKZtKNKGakcPdGaAg5EKdLIz16g0fIFJ+OlmOGqmbYzCLcjHD/BIK3YE+Miw6KQgxFJhAgcK/OFq+awhrCwSPex021wt9kSLa3TLklSAZxoKqY87hIwjAnfKRQKheJZ0KenQqFQTAN9eioUCsU0GKN7ZqzCrR5CK1gv4/CCwLKydZBJ8GSLqvFUIJrMlFa42/YWKUpFKCkbVy+mjdapqIf7exR8E/h0LlZFj9tS4Pdgl6TVvEfahId/DFxDClp5RgbZ79fSRg41arj0sm17HHOwAqwcfGgxtmUGz8NklxAOWGEJ0nHorLbtcYDZ5P4saA4GcjsSkb3YwcQbGs+gL9FX/CF7VXA0mC00O+4AY4NwzCEvnl38htohNCmXM0isjIxGREfrbFP6RxaycqYkYVILS6RAVSEarq9J2ZxRHB+Qg0nQpaXCIXMnx1J9pt2isZ1doyg6zorxCpa2nsN6Rh0hv01/2DyWzKVrV0hSZO2Pbb/7XVmxfNeqReq285Difo4fSVJQBtO0jgyuq79AvrxrK4s4kcTkOQgXY2GQk8FcT5ZigtgpjryZuCSNB71/Z5dqNN18/yZ/2+3SspxBRCDHIX76+W3uVkKa2eo5umt5bE5wcJ4zMdyHYVuec5t/Eax7nrbl9/L555to3EV/th+X7QT+vWahfS+t0K5A4/6eXAt2IKp4krSxT8CbJWOh754KhUIxDfTpqVAoFNNgDHO3w3IisCN+MXbx2m8XIOm1KcphZZliUxYXycHh5FBI8fo5oidXrlHjwkVKFej35A15d4eYe+OEzt7qIYjEchY43KPgnr2tBn0JitFpU+TB4YEkUSTJxaFunEhgWUAav0/MOsElcxWa2GK7HFGUdSf5CPSkrtFwyFfXMrtkDxF2FeHAppLFdkdPVUDNGb6oRkcCbthhhCsSc3+bVfVgEsFuKfxtriA8KItKQez6ytcSOdZq4HvEKgGMOztHQr729ojSco2mM2si8owi7BOZCgNaKrwCfUtF4mCdbhv+oRBqilb5oxiiTYDUrD76tyybicx1pCShNJOPYQQDEZECFCPa+4Imf3WZGOLXLl3ibhcvEMldXCRSzAoJM3HbWYMDbnh98jSHltbEbVljE9+KEkP9P/v087Tx4P4D/rZSofC1/UPitvcfkXXmmz/8AXcrotvVa5dxdRtp49JFitayk4ickarU8biwqgCJYffu0ZA6INE9K17qu//jjbTx+W0aW+zwUrQkRZxrENJdPj6lJ1WhLBF7PiQ8Ni3i+xJY1rGj0HdPhUKhmAb69FQoFIppMIa52xk1GWwmMp/lV+usFdPP3h0XL1K+AZv9Jb7sYL72KtlGzM9ipxiVOeZn5UV6rUqmD8GA3p9PAyJTA1dey+sHNJKf+J/hpDSOxgm9xtvVZfMZkGL4U7DtgJcRisG72JwowXV07bwRrqLqjSvtK73AHazsILoEJtHG2tpjf09mPU/FA4ywHtelaymj0gAXHzaWOMDMnfl6bCkv7KXCskwAB5N2S2hsOWYTFjoFE8mnrBpxCh8jZ9ZWsExepDoFN
q/b9++bZ8MzTM2Gd3JtCugP6KR7uxR30WrSOilXLJeQIi0GTjMrQqOAHagxxhwfN9LGwSFJQB6IYRyL1vTS87R1fvk8KVErZ4i5l8uW8MKT78IyA7vCUpXXctZw8XLDSUF86Z71I+WUHs7PETfNcei0acI//vjTtNFEgRBjTKVC92hrh7hzO6AZ6fQlfuDhNm1239+8kzZ++VUy+jyLvKxKVfIMeQ1M3oh/8oSysP74u3+WNgZ9DgiRxfPZF2Q12+rQyGcW6YZWSvJMa8DrdveQwj/O1OkucxUfY2XisXUIPwTGygsMffdUKBSKaaBPT4VCoZgGY5h704ri9vLELNh70UXDs5+88PVg60AueFmrWGYiedqn8316Gw+Q25+LrejfgAkIdatg49ezdlfzs/Tp+WU6bBLRMJ6/QuUW8kV58S561C0CzwwNdvFsGsslHjE3WTbs8GQDOgqG90PHggk4M0Tezjs4OBztz3YhTHDsrflcno+GgH9MeP2kkTbmalJLQy5qRDcoWYyStRresGaKHVl7jmK5GA3LEU5i7xRzORe2aDT4Q4uWQvnJZ1HicSJLCjlinGs8cMpAZC1j6Byy+Q7r2E5bNJAkQuIGCkyW4HbR7ojWdOfOZtr4+je/mjYW4GLZ2N/kbt/+xgtpY24WPh0ynDEOs/wjitmwA/dFatYak/ClJiO016a/vCPPP9KJ7LiBgpRtUHjbWaPZIrbbg5WPydHPpDQrApfXog/zJVqKXG6H68jaiEZknNFdeGPMndskCLyPwidiSTOQs7MfbmWWfk1XnyfNsLYgGuDeLru30F3mhe1lZP0XixmcglYFSyXNhmgao9B3T4VCoZgG+vRUKBSKaaBPT4VCoZgGY3TPjlWe1EEJWTaLyEJ/ii1zX4+9MFipgcKVz1haIeROlgpduJAMBqJJZRAD5CAiJotatXEk8qiPJ//iPKkbp3U6/sYGZTpl83JYNkW2wj4Q6hGOUdxGrYILGZFUPNjZsp3HWLDcw6FIrGOGlvEwd5uBwS2nGJ2ciPUvG4uwh8LCAipKwQeE05bsw7Lqmkcuk202K8LTiCaVzeZGu02uFsvRS9I/GSMNW0FX7oRujOfXybCjjvJK7S5dcq8nipiPCsB+APkSWSjzMxKkUsaK5Zlk25RqwdLX2pT29u7bb6eNKxcpnO7quhRhnput0SXwrkCWFWFZWhE0TXa+ECGYI9ssRdNalMMluZ6eKcT/sXw5MWLp5JgCdFpIrzqC1mmMqUGGXptFIeICzt6Xpb60SJO5sEB5g7V5LqI15j5ai4EOwmJroy4bLTdvfkFDOqK7HER0X6JYfn0cK8dC89k1Wh7lGZm2Coqq5VDFqwB1u1CRhd3rYbfGp1XRbtOP1Pc1YkmhUCj+b0OfngqFQjENxvl7Wrn9fQ5YAZsuIDvCTrzJIHeCM5EivPG6kZW5hL/NIQaIA3oyVoyFx5R5AL9CxKFkLCLJA7h4aR1np6/OrNTSRrMltNdHlEM2Bw9BkO6sRcnZClOiQ2Km8EJJcp4z1H8suOywZXZAdMkuNcy85vSUIiSYa9t5UEwzRxM2OMWoUZcYC05nsqpRQWOxUqSk/iq6ccM+jfD0Mdk+lkIyEnjkumP+kR7l9WO7MX7vN15PG4eob9zElHa7IlZ0YTfDxa7Z6OHMwix3u3COaCnnXPVhQhFbYVV5TNccTEJXUXeoVhMdIMFCYkrOkxAnk6jf2Kgd69tnNuw74445yCTmfooonKM6fh0WJ55ZpuuqzNKKyuZoBVYQ82eMqVYR/wcBqotKQf0BMfGiL7lGmZGKxHztD+5LUayfvUeFhTtIbmQn1tiVu8xJQb0efTtAbefyjPysMnmIQljhbfz6BpHIBSE8RDLw92SblVJJLmEU+u6pUCgU00CfngqFQjENxjD3wNoLDkaYe4wNvozFKGNYYcbgtpxAknXlRTqfRUoSMxE8vXNW0Yuwz/SfGj7e9t2snJTzbQrYUGPKFcXE6
RzH3hCHmMCmGDGTdDksGyy6I5khvrWdHUJM8Cb6ezI94dFKCQ3raNyNN1WZwvf7EgLhYeS8NZ8I8RwuZWyflNM/soiUsBnlKBMfzYox49il5dWY2J/yUYa6jXWI4KSgieUkzNxcFQ0iU+yU4TwVP8AVTeiSObYh40m3Qn5YOxLLE2scWW84Q4wTnOwrZvrPqV+SRDSu3K5U2oh5AvlQ1mHN8IdJwmeXfnwrrQ8nzeUgoKU1vwgVLl+Trx2aty64M5fzNZaLK5cqGUBNasFU9xEqRUehTPj8PG3NI3xGIhC2tp5wtzb8Smo1uN4gmyibl+cSb51nwesjeMh2hZGbHqxgPQ+ZRZjK3kDCDAowFikVOOmOzhWE8iMdhb57KhQKxTTQp6dCoVBMA2cbhQ8VCoVC8fND3z0VCoViGujTU6FQKKaBPj0VCoViGujTU6FQKKaBPj0VCoViGujTU6FQKKbB/wZ/Q/tTCmVuZHN0cmVhbQplbmRvYmoKMzkgMCBvYmoKMTQzMzMKZW5kb2JqCjIgMCBvYmoKPDwgL0NvdW50IDEgL0tpZHMgWyAxMSAwIFIgXSAvVHlwZSAvUGFnZXMgPj4KZW5kb2JqCjQwIDAgb2JqCjw8IC9DcmVhdGlvbkRhdGUgKEQ6MjAyMTEwMTAxODM2MDYrMDInMDAnKQovQ3JlYXRvciAoTWF0cGxvdGxpYiB2My40LjMsIGh0dHBzOi8vbWF0cGxvdGxpYi5vcmcpCi9Qcm9kdWNlciAoTWF0cGxvdGxpYiBwZGYgYmFja2VuZCB2My40LjMpID4+CmVuZG9iagp4cmVmCjAgNDEKMDAwMDAwMDAwMCA2NTUzNSBmIAowMDAwMDAwMDE2IDAwMDAwIG4gCjAwMDAwMjI3MjYgMDAwMDAgbiAKMDAwMDAwNzkzNyAwMDAwMCBuIAowMDAwMDA3OTY5IDAwMDAwIG4gCjAwMDAwMDgwNjggMDAwMDAgbiAKMDAwMDAwODA4OSAwMDAwMCBuIAowMDAwMDA4MTEwIDAwMDAwIG4gCjAwMDAwMDAwNjUgMDAwMDAgbiAKMDAwMDAwMDQwMCAwMDAwMCBuIAowMDAwMDAwNzQxIDAwMDAwIG4gCjAwMDAwMDAyMDggMDAwMDAgbiAKMDAwMDAwMDcyMSAwMDAwMCBuIAowMDAwMDA4MTQyIDAwMDAwIG4gCjAwMDAwMDY2NDMgMDAwMDAgbiAKMDAwMDAwNjQ0MyAwMDAwMCBuIAowMDAwMDA2MDM0IDAwMDAwIG4gCjAwMDAwMDc2OTYgMDAwMDAgbiAKMDAwMDAwMDc2MSAwMDAwMCBuIAowMDAwMDAwOTI0IDAwMDAwIG4gCjAwMDAwMDEyMzIgMDAwMDAgbiAKMDAwMDAwMTM4MCAwMDAwMCBuIAowMDAwMDAxNTAzIDAwMDAwIG4gCjAwMDAwMDE4MDggMDAwMDAgbiAKMDAwMDAwMjE4OCAwMDAwMCBuIAowMDAwMDAyNDkyIDAwMDAwIG4gCjAwMDAwMDI4MTQgMDAwMDAgbiAKMDAwMDAwMzAyMyAwMDAwMCBuIAowMDAwMDAzNDM3IDAwMDAwIG4gCjAwMDAwMDM2NzQgMDAwMDAgbiAKMDAwMDAwMzc5MyAwMDAwMCBuIAowMDAwMDA0MTI0IDAwMDAwIG4gCjAwMDAwMDQ0MTUgMDAwMDAgbiAKMDAwMDAwNDU3MCAwMDAwMCBuIAowMDAwMDA0ODgyIDAwMDAwIG4gCjAwMDAwMDUyODkgMDAwMDAgbiAKMDAwMDAwNTM3OSAwMDAwMCBuIAowMDAwMDA1NTg1IDAwMDAwIG4gCjAwMDAwMDU3NDYgMDAwMDAgbiAKMDAwMDAyMjcwNCAwMDAwMCBuIAowMDAwMDIyNzg2IDAwMDAwIG4gCnRyYWlsZXIKPDwgL0luZm8gNDAgMCBSIC9Sb290IDEgMCBSIC9TaXplIDQxID4+CnN0YXJ0e
HJlZgoyMjk0MwolJUVPRgo=\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-10-10T18:36:06.917884\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}], "source": ["test_transform = transforms.Compose(\n", " [\n", " transforms.ToTensor(),\n", " transforms.Normalize([0.49139968, 0.48215841, 0.44653091], [0.24703223, 0.24348513, 0.26158784]),\n", " ]\n", ")\n", "# For training, we add some augmentation. Networks are too powerful and would overfit.\n", "train_transform = transforms.Compose(\n", " [\n", " transforms.RandomHorizontalFlip(),\n", " transforms.RandomResizedCrop((32, 32), scale=(0.8, 1.0), ratio=(0.9, 1.1)),\n", " transforms.ToTensor(),\n", " transforms.Normalize([0.49139968, 0.48215841, 0.44653091], [0.24703223, 0.24348513, 0.26158784]),\n", " ]\n", ")\n", "# Loading the training dataset. We need to split it into a training and validation part\n", "# We need to do a little trick because the validation set should not use the augmentation.\n", "train_dataset = CIFAR10(root=DATASET_PATH, train=True, transform=train_transform, download=True)\n", "val_dataset = CIFAR10(root=DATASET_PATH, train=True, transform=test_transform, download=True)\n", "pl.seed_everything(42)\n", "train_set, _ = torch.utils.data.random_split(train_dataset, [45000, 5000])\n", "pl.seed_everything(42)\n", "_, val_set = torch.utils.data.random_split(val_dataset, [45000, 5000])\n", "\n", "# Loading the test set\n", "test_set = CIFAR10(root=DATASET_PATH, train=False, transform=test_transform, download=True)\n", "\n", "# We define a set of data loaders that we can use for various purposes later.\n", "train_loader = data.DataLoader(train_set, batch_size=128, shuffle=True, drop_last=True, pin_memory=True, num_workers=4)\n", "val_loader = data.DataLoader(val_set, batch_size=128, shuffle=False, drop_last=False, num_workers=4)\n", "test_loader = data.DataLoader(test_set, batch_size=128, shuffle=False, drop_last=False, num_workers=4)\n", "\n", "# Visualize some examples\n", "NUM_IMAGES = 4\n", "CIFAR_images = torch.stack([val_set[idx][0] for idx in range(NUM_IMAGES)], 
dim=0)\n", "img_grid = torchvision.utils.make_grid(CIFAR_images, nrow=4, normalize=True, pad_value=0.9)\n", "img_grid = img_grid.permute(1, 2, 0)\n", "\n", "plt.figure(figsize=(8, 8))\n", "plt.title(\"Image examples of the CIFAR10 dataset\")\n", "plt.imshow(img_grid)\n", "plt.axis(\"off\")\n", "plt.show()\n", "plt.close()"]}, {"cell_type": "markdown", "id": "de31824d", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.01573, "end_time": "2021-10-10T16:36:07.015490", "exception": false, "start_time": "2021-10-10T16:36:06.999760", "status": "completed"}, "tags": []}, "source": ["## Transformers for image classification\n", "\n", "Transformers have been originally proposed to process sets since it is a permutation-equivariant architecture, i.e., producing the same output permuted if the input is permuted.\n", "To apply Transformers to sequences, we have simply added a positional encoding to the input feature vectors, and the model learned by itself what to do with it.\n", "So, why not do the same thing on images?\n", "This is exactly what [Alexey Dosovitskiy et al. ](https://openreview.net/pdf?id=YicbFdNTTy) proposed in their paper \"An Image is Worth 16x16 Words: Transformers for Image Recognition at Scale\".\n", "Specifically, the Vision Transformer is a model for image classification that views images as sequences of smaller patches.\n", "As a preprocessing step, we split an image of, for example, $48\\times 48$ pixels into 9 $16\\times 16$ patches.\n", "Each of those patches is considered to be a \"word\"/\"token\", and projected to a feature space.\n", "With adding positional encodings and a token for classification on top, we can apply a Transformer as usual to this sequence and start training it for our task.\n", "A nice GIF visualization of the architecture is shown below (figure credit - [Phil Wang](https://github.com/lucidrains/vit-pytorch/blob/main/images/vit.gif)):\n", "\n", "
\n", "\n", "We will walk step by step through the Vision Transformer, and implement all parts by ourselves.\n", "First, let's implement the image preprocessing: an image of size $N\\times N$ has to be split into $(N/M)^2$ patches of size $M\\times M$.\n", "These represent the input words to the Transformer."]}, {"cell_type": "code", "execution_count": 5, "id": "ae492f17", "metadata": {"execution": {"iopub.execute_input": "2021-10-10T16:36:07.050794Z", "iopub.status.busy": "2021-10-10T16:36:07.048305Z", "iopub.status.idle": "2021-10-10T16:36:07.053076Z", "shell.execute_reply": "2021-10-10T16:36:07.052610Z"}, "papermill": {"duration": 0.022148, "end_time": "2021-10-10T16:36:07.053172", "exception": false, "start_time": "2021-10-10T16:36:07.031024", "status": "completed"}, "tags": []}, "outputs": [], "source": ["def img_to_patch(x, patch_size, flatten_channels=True):\n", " \"\"\"\n", " Inputs:\n", " x - torch.Tensor representing the image of shape [B, C, H, W]\n", " patch_size - Number of pixels per dimension of the patches (integer)\n", " flatten_channels - If True, the patches will be returned in a flattened format\n", " as a feature vector instead of a image grid.\n", " \"\"\"\n", " B, C, H, W = x.shape\n", " x = x.reshape(B, C, H // patch_size, patch_size, W // patch_size, patch_size)\n", " x = x.permute(0, 2, 4, 1, 3, 5) # [B, H', W', C, p_H, p_W]\n", " x = x.flatten(1, 2) # [B, H'*W', C, p_H, p_W]\n", " if flatten_channels:\n", " x = x.flatten(2, 4) # [B, H'*W', C*p_H*p_W]\n", " return x"]}, {"cell_type": "markdown", "id": "1577af41", "metadata": {"papermill": {"duration": 0.016461, "end_time": "2021-10-10T16:36:07.085363", "exception": false, "start_time": "2021-10-10T16:36:07.068902", "status": "completed"}, "tags": []}, "source": ["Let's take a look at how that works for our CIFAR examples above.\n", "For our images of size $32\\times 32$, we choose a patch size of 4.\n", "Hence, we obtain sequences of 64 patches of size $4\\times 4$.\n", "We visualize them 
below:"]}, {"cell_type": "code", "execution_count": 6, "id": "bc8f2072", "metadata": {"execution": {"iopub.execute_input": "2021-10-10T16:36:07.121184Z", "iopub.status.busy": "2021-10-10T16:36:07.120716Z", "iopub.status.idle": "2021-10-10T16:36:07.353313Z", "shell.execute_reply": "2021-10-10T16:36:07.353705Z"}, "papermill": {"duration": 0.252758, "end_time": "2021-10-10T16:36:07.353849", "exception": false, "start_time": "2021-10-10T16:36:07.101091", "status": "completed"}, "tags": []}, "outputs": [{"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-10-10T18:36:07.261617\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}], "source": ["img_patches = img_to_patch(CIFAR_images, patch_size=4, flatten_channels=False)\n", "\n", "fig, ax = plt.subplots(CIFAR_images.shape[0], 1, figsize=(14, 3))\n", "fig.suptitle(\"Images as input sequences of patches\")\n", "for i in range(CIFAR_images.shape[0]):\n", " img_grid = torchvision.utils.make_grid(img_patches[i], nrow=64, normalize=True, pad_value=0.9)\n", " img_grid = img_grid.permute(1, 2, 0)\n", " ax[i].imshow(img_grid)\n", " ax[i].axis(\"off\")\n", "plt.show()\n", "plt.close()"]}, {"cell_type": "markdown", "id": "cce53f7d", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.018572, "end_time": "2021-10-10T16:36:07.393026", "exception": false, "start_time": "2021-10-10T16:36:07.374454", "status": "completed"}, "tags": []}, "source": ["Compared to the original images, it is much harder to recognize the objects from those patch lists now.\n", "Still, this is the input we provide to the Transformer for classifying the images.\n", "The model has to learn itself how it has to combine the patches to recognize the objects.\n", "The inductive bias in CNNs that an image is grid of pixels, is lost in this input format.\n", "\n", "After we have looked at the preprocessing, we can now start building the Transformer model.\n", "Since we have discussed the fundamentals of Multi-Head Attention in [Tutorial 6](https://uvadlc-notebooks.readthedocs.io/en/latest/tutorial_notebooks/tutorial6/Transformers_and_MHAttention.html), we will use the PyTorch module `nn.MultiheadAttention` ([docs](https://pytorch.org/docs/stable/generated/torch.nn.MultiheadAttention.html?highlight=multihead#torch.nn.MultiheadAttention)) here.\n", "Further, we use the Pre-Layer Normalization version of the Transformer blocks proposed by [Ruibin Xiong et al. 
](http://proceedings.mlr.press/v119/xiong20b/xiong20b.pdf) in 2020.\n", "The idea is to apply Layer Normalization not in between residual blocks, but instead as a first layer in the residual blocks.\n", "This reorganization of the layers supports better gradient flow and removes the necessity of a warm-up stage.\n", "A visualization of the difference between the standard Post-LN and the Pre-LN version is shown below.\n", "\n", "
\n", "\n", "The implementation of the Pre-LN attention block looks as follows:"]}, {"cell_type": "code", "execution_count": 7, "id": "0f69e05b", "metadata": {"execution": {"iopub.execute_input": "2021-10-10T16:36:07.437581Z", "iopub.status.busy": "2021-10-10T16:36:07.437105Z", "iopub.status.idle": "2021-10-10T16:36:07.439187Z", "shell.execute_reply": "2021-10-10T16:36:07.438722Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 0.027401, "end_time": "2021-10-10T16:36:07.439284", "exception": false, "start_time": "2021-10-10T16:36:07.411883", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class AttentionBlock(nn.Module):\n", " def __init__(self, embed_dim, hidden_dim, num_heads, dropout=0.0):\n", " \"\"\"\n", " Inputs:\n", " embed_dim - Dimensionality of input and attention feature vectors\n", " hidden_dim - Dimensionality of hidden layer in feed-forward network\n", " (usually 2-4x larger than embed_dim)\n", " num_heads - Number of heads to use in the Multi-Head Attention block\n", " dropout - Amount of dropout to apply in the feed-forward network\n", " \"\"\"\n", " super().__init__()\n", "\n", " self.layer_norm_1 = nn.LayerNorm(embed_dim)\n", " self.attn = nn.MultiheadAttention(embed_dim, num_heads)\n", " self.layer_norm_2 = nn.LayerNorm(embed_dim)\n", " self.linear = nn.Sequential(\n", " nn.Linear(embed_dim, hidden_dim),\n", " nn.GELU(),\n", " nn.Dropout(dropout),\n", " nn.Linear(hidden_dim, embed_dim),\n", " nn.Dropout(dropout),\n", " )\n", "\n", " def forward(self, x):\n", " inp_x = self.layer_norm_1(x)\n", " x = x + self.attn(inp_x, inp_x, inp_x)[0]\n", " x = x + self.linear(self.layer_norm_2(x))\n", " return x"]}, {"cell_type": "markdown", "id": "b5f96bdf", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.0187, "end_time": "2021-10-10T16:36:07.476786", "exception": false, "start_time": "2021-10-10T16:36:07.458086", "status": "completed"}, "tags": []}, "source": ["Now we have all modules ready to build our own Vision 
Transformer.\n", "Besides the Transformer encoder, we need the following modules:\n", "\n", "* A **linear projection** layer that maps the input patches to a feature vector of larger size.\n", "It is implemented by a simple linear layer that takes each $M\\times M$ patch independently as input.\n", "* A **classification token** that is added to the input sequence.\n", "We will use the output feature vector of the classification token (CLS token in short) for determining the classification prediction.\n", "* Learnable **positional encodings** that are added to the tokens before being processed by the Transformer.\n", "Those are needed to learn position-dependent information, and convert the set to a sequence.\n", "Since we usually work with a fixed resolution, we can learn the positional encodings instead of having the pattern of sine and cosine functions.\n", "* A **MLP head** that takes the output feature vector of the CLS token, and maps it to a classification prediction.\n", "This is usually implemented by a small feed-forward network or even a single linear layer.\n", "\n", "With those components in mind, let's implement the full Vision Transformer below:"]}, {"cell_type": "code", "execution_count": 8, "id": "0228d483", "metadata": {"execution": {"iopub.execute_input": "2021-10-10T16:36:07.522084Z", "iopub.status.busy": "2021-10-10T16:36:07.521601Z", "iopub.status.idle": "2021-10-10T16:36:07.523699Z", "shell.execute_reply": "2021-10-10T16:36:07.523301Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 0.02827, "end_time": "2021-10-10T16:36:07.523823", "exception": false, "start_time": "2021-10-10T16:36:07.495553", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class VisionTransformer(nn.Module):\n", " def __init__(\n", " self,\n", " embed_dim,\n", " hidden_dim,\n", " num_channels,\n", " num_heads,\n", " num_layers,\n", " num_classes,\n", " patch_size,\n", " num_patches,\n", " dropout=0.0,\n", " ):\n", " \"\"\"\n", " Inputs:\n", " embed_dim 
- Dimensionality of the input feature vectors to the Transformer\n", " hidden_dim - Dimensionality of the hidden layer in the feed-forward networks\n", " within the Transformer\n", " num_channels - Number of channels of the input (3 for RGB)\n", " num_heads - Number of heads to use in the Multi-Head Attention block\n", " num_layers - Number of layers to use in the Transformer\n", " num_classes - Number of classes to predict\n", " patch_size - Number of pixels that the patches have per dimension\n", " num_patches - Maximum number of patches an image can have\n", " dropout - Amount of dropout to apply in the feed-forward network and\n", " on the input encoding\n", " \"\"\"\n", " super().__init__()\n", "\n", " self.patch_size = patch_size\n", "\n", " # Layers/Networks\n", " self.input_layer = nn.Linear(num_channels * (patch_size ** 2), embed_dim)\n", " self.transformer = nn.Sequential(\n", " *(AttentionBlock(embed_dim, hidden_dim, num_heads, dropout=dropout) for _ in range(num_layers))\n", " )\n", " self.mlp_head = nn.Sequential(nn.LayerNorm(embed_dim), nn.Linear(embed_dim, num_classes))\n", " self.dropout = nn.Dropout(dropout)\n", "\n", " # Parameters/Embeddings\n", " self.cls_token = nn.Parameter(torch.randn(1, 1, embed_dim))\n", " self.pos_embedding = nn.Parameter(torch.randn(1, 1 + num_patches, embed_dim))\n", "\n", " def forward(self, x):\n", " # Preprocess input\n", " x = img_to_patch(x, self.patch_size)\n", " B, T, _ = x.shape\n", " x = self.input_layer(x)\n", "\n", " # Add CLS token and positional encoding\n", " cls_token = self.cls_token.repeat(B, 1, 1)\n", " x = torch.cat([cls_token, x], dim=1)\n", " x = x + self.pos_embedding[:, : T + 1]\n", "\n", " # Apply Transforrmer\n", " x = self.dropout(x)\n", " x = x.transpose(0, 1)\n", " x = self.transformer(x)\n", "\n", " # Perform classification prediction\n", " cls = x[0]\n", " out = self.mlp_head(cls)\n", " return out"]}, {"cell_type": "markdown", "id": "0fde39b8", "metadata": {"lines_to_next_cell": 2, 
"papermill": {"duration": 0.018994, "end_time": "2021-10-10T16:36:07.561842", "exception": false, "start_time": "2021-10-10T16:36:07.542848", "status": "completed"}, "tags": []}, "source": ["Finally, we can put everything into a PyTorch Lightning Module as usual.\n", "We use `torch.optim.AdamW` as the optimizer, which is Adam with a corrected weight decay implementation.\n", "Since we use the Pre-LN Transformer version, we do not need to use a learning rate warmup stage anymore.\n", "Instead, we use the same learning rate scheduler as the CNNs in our previous tutorial on image classification."]}, {"cell_type": "code", "execution_count": 9, "id": "99bcb238", "metadata": {"execution": {"iopub.execute_input": "2021-10-10T16:36:07.606617Z", "iopub.status.busy": "2021-10-10T16:36:07.606128Z", "iopub.status.idle": "2021-10-10T16:36:07.608256Z", "shell.execute_reply": "2021-10-10T16:36:07.607820Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 0.027621, "end_time": "2021-10-10T16:36:07.608351", "exception": false, "start_time": "2021-10-10T16:36:07.580730", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class ViT(pl.LightningModule):\n", " def __init__(self, model_kwargs, lr):\n", " super().__init__()\n", " self.save_hyperparameters()\n", " self.model = VisionTransformer(**model_kwargs)\n", " self.example_input_array = next(iter(train_loader))[0]\n", "\n", " def forward(self, x):\n", " return self.model(x)\n", "\n", " def configure_optimizers(self):\n", " optimizer = optim.AdamW(self.parameters(), lr=self.hparams.lr)\n", " lr_scheduler = optim.lr_scheduler.MultiStepLR(optimizer, milestones=[100, 150], gamma=0.1)\n", " return [optimizer], [lr_scheduler]\n", "\n", " def _calculate_loss(self, batch, mode=\"train\"):\n", " imgs, labels = batch\n", " preds = self.model(imgs)\n", " loss = F.cross_entropy(preds, labels)\n", " acc = (preds.argmax(dim=-1) == labels).float().mean()\n", "\n", " self.log(\"%s_loss\" % mode, loss)\n", " self.log(\"%s_acc\" % 
mode, acc)\n", " return loss\n", "\n", " def training_step(self, batch, batch_idx):\n", " loss = self._calculate_loss(batch, mode=\"train\")\n", " return loss\n", "\n", " def validation_step(self, batch, batch_idx):\n", " self._calculate_loss(batch, mode=\"val\")\n", "\n", " def test_step(self, batch, batch_idx):\n", " self._calculate_loss(batch, mode=\"test\")"]}, {"cell_type": "markdown", "id": "db79a63a", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.018896, "end_time": "2021-10-10T16:36:07.646134", "exception": false, "start_time": "2021-10-10T16:36:07.627238", "status": "completed"}, "tags": []}, "source": ["## Experiments\n", "\n", "Commonly, Vision Transformers are applied to large-scale image classification benchmarks such as ImageNet to leverage their full potential.\n", "However, here we take a step back and ask: can Vision Transformer also succeed on classical, small benchmarks such as CIFAR10?\n", "To find this out, we train a Vision Transformer from scratch on the CIFAR10 dataset.\n", "Let's first create a training function for our PyTorch Lightning module\n", "which also loads the pre-trained model if you have downloaded it above."]}, {"cell_type": "code", "execution_count": 10, "id": "8c1f2286", "metadata": {"execution": {"iopub.execute_input": "2021-10-10T16:36:07.692103Z", "iopub.status.busy": "2021-10-10T16:36:07.691595Z", "iopub.status.idle": "2021-10-10T16:36:07.693685Z", "shell.execute_reply": "2021-10-10T16:36:07.693221Z"}, "papermill": {"duration": 0.028441, "end_time": "2021-10-10T16:36:07.693783", "exception": false, "start_time": "2021-10-10T16:36:07.665342", "status": "completed"}, "tags": []}, "outputs": [], "source": ["def train_model(**kwargs):\n", " trainer = pl.Trainer(\n", " default_root_dir=os.path.join(CHECKPOINT_PATH, \"ViT\"),\n", " gpus=1 if str(device) == \"cuda:0\" else 0,\n", " max_epochs=180,\n", " callbacks=[\n", " ModelCheckpoint(save_weights_only=True, mode=\"max\", monitor=\"val_acc\"),\n", " 
LearningRateMonitor(\"epoch\"),\n", " ],\n", " progress_bar_refresh_rate=1,\n", " )\n", " trainer.logger._log_graph = True # If True, we plot the computation graph in tensorboard\n", " trainer.logger._default_hp_metric = None # Optional logging argument that we don't need\n", "\n", " # Check whether pretrained model exists. If yes, load it and skip training\n", " pretrained_filename = os.path.join(CHECKPOINT_PATH, \"ViT.ckpt\")\n", " if os.path.isfile(pretrained_filename):\n", " print(\"Found pretrained model at %s, loading...\" % pretrained_filename)\n", " # Automatically loads the model with the saved hyperparameters\n", " model = ViT.load_from_checkpoint(pretrained_filename)\n", " else:\n", " pl.seed_everything(42) # To be reproducable\n", " model = ViT(**kwargs)\n", " trainer.fit(model, train_loader, val_loader)\n", " # Load best checkpoint after training\n", " model = ViT.load_from_checkpoint(trainer.checkpoint_callback.best_model_path)\n", "\n", " # Test best model on validation and test set\n", " val_result = trainer.test(model, test_dataloaders=val_loader, verbose=False)\n", " test_result = trainer.test(model, test_dataloaders=test_loader, verbose=False)\n", " result = {\"test\": test_result[0][\"test_acc\"], \"val\": val_result[0][\"test_acc\"]}\n", "\n", " return model, result"]}, {"cell_type": "markdown", "id": "e359c353", "metadata": {"papermill": {"duration": 0.019033, "end_time": "2021-10-10T16:36:07.732020", "exception": false, "start_time": "2021-10-10T16:36:07.712987", "status": "completed"}, "tags": []}, "source": ["Now, we can already start training our model.\n", "As seen in our implementation, we have couple of hyperparameter that we have to choose.\n", "When creating this notebook, we have performed a small grid search over hyperparameters and listed the best hyperparameters in the cell below.\n", "Nevertheless, it is worth to discuss the influence that each hyperparameter has, and what intuition we have for choosing its value.\n", "\n", 
"First, let's consider the patch size.\n", "The smaller we make the patches, the longer the input sequences to the Transformer become.\n", "While in general, this allows the Transformer to model more complex functions, it requires more computation time and memory, since the cost of the attention layer grows quadratically with the sequence length.\n", "Furthermore, small patches can make the task more difficult since the Transformer has to learn which patches are close-by, and which are far away.\n", "We experimented with patch sizes of 2, 4 and 8 which gives us the input sequence lengths of 256, 64, and 16 respectively.\n", "We found 4 to result in the best performance, and hence pick it below.\n", "\n", "Next, the embedding and hidden dimensionality have a similar impact on a Transformer as on an MLP.\n", "The larger the sizes, the more complex the model becomes, and the longer it takes to train.\n", "In a Transformer, however, we have one more aspect to consider: the query-key sizes in the Multi-Head Attention layers.\n", "Each key has the feature dimensionality of `embed_dim/num_heads`.\n", "Considering that we have an input sequence length of 64, a minimum reasonable size for the key vectors is 16 or 32.\n", "Lower dimensionalities can restrain the possible attention maps too much.\n", "We observed that more than 8 heads are not necessary for the Transformer, and therefore pick an embedding dimensionality of `256`.\n", "The hidden dimensionality in the feed-forward networks is usually 2-4x larger than the embedding dimensionality, and thus we pick `512`.\n", "\n", "Finally, the learning rate for Transformers is usually relatively small, and in papers, a common value to use is 3e-5.\n", "However, since we work with a smaller dataset and have a potentially easier task, we found that we are able to increase the learning rate to 3e-4 without any problems.\n", "To reduce overfitting, we use a dropout value of 0.2.\n", "Remember that we also use small image augmentations as regularization during 
training.\n", "\n", "Feel free to explore the hyperparameters yourself by changing the values below.\n", "In general, the Vision Transformer did not show to be too sensitive to\n", "the hyperparameter choices on the CIFAR10 dataset."]}, {"cell_type": "code", "execution_count": 11, "id": "8aacc01b", "metadata": {"execution": {"iopub.execute_input": "2021-10-10T16:36:07.775505Z", "iopub.status.busy": "2021-10-10T16:36:07.775020Z", "iopub.status.idle": "2021-10-10T16:36:15.614815Z", "shell.execute_reply": "2021-10-10T16:36:15.615209Z"}, "papermill": {"duration": 7.864306, "end_time": "2021-10-10T16:36:15.615357", "exception": false, "start_time": "2021-10-10T16:36:07.751051", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["GPU available: True, used: True\n"]}, {"name": "stderr", "output_type": "stream", "text": ["TPU available: False, using: 0 TPU cores\n"]}, {"name": "stderr", "output_type": "stream", "text": ["IPU available: False, using: 0 IPUs\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Found pretrained model at saved_models/VisionTransformers/ViT.ckpt, loading...\n"]}, {"name": "stderr", "output_type": "stream", "text": ["/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/pytorch_lightning/trainer/trainer.py:678: LightningDeprecationWarning: `trainer.test(test_dataloaders)` is deprecated in v1.4 and will be removed in v1.6. Use `trainer.test(dataloaders)` instead.\n", " rank_zero_deprecation(\n", "LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n"]}, {"name": "stderr", "output_type": "stream", "text": ["/usr/local/lib/python3.9/dist-packages/torch/_jit_internal.py:603: LightningDeprecationWarning: The `LightningModule.datamodule` property is deprecated in v1.3 and will be removed in v1.5. 
Access the datamodule through using `self.trainer.datamodule` instead.\n", " if hasattr(mod, name):\n", "/usr/local/lib/python3.9/dist-packages/torch/_jit_internal.py:603: LightningDeprecationWarning: The `LightningModule.loaded_optimizer_states_dict` property is deprecated in v1.4 and will be removed in v1.6.\n", " if hasattr(mod, name):\n"]}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "2824556005cc42f79c31cbebe248b150", "version_major": 2, "version_minor": 0}, "text/plain": ["Testing: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"name": "stderr", "output_type": "stream", "text": ["LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n"]}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "06ecaa193abb4c6599f94a9a7e64de8f", "version_major": 2, "version_minor": 0}, "text/plain": ["Testing: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"name": "stdout", "output_type": "stream", "text": ["ViT results {'test': 0.7559000253677368, 'val': 0.7563999891281128}\n"]}], "source": ["model, results = train_model(\n", " model_kwargs={\n", " \"embed_dim\": 256,\n", " \"hidden_dim\": 512,\n", " \"num_heads\": 8,\n", " \"num_layers\": 6,\n", " \"patch_size\": 4,\n", " \"num_channels\": 3,\n", " \"num_patches\": 64,\n", " \"num_classes\": 10,\n", " \"dropout\": 0.2,\n", " },\n", " lr=3e-4,\n", ")\n", "print(\"ViT results\", results)"]}, {"cell_type": "markdown", "id": "c305d6d0", "metadata": {"papermill": {"duration": 0.327633, "end_time": "2021-10-10T16:36:16.015814", "exception": false, "start_time": "2021-10-10T16:36:15.688181", "status": "completed"}, "tags": []}, "source": ["The Vision Transformer achieves a validation and test performance of about 75%.\n", "In comparison, almost all CNN architectures that we have tested in [Tutorial 5](https://uvadlc-notebooks.readthedocs.io/en/latest/tutorial_notebooks/tutorial5/Inception_ResNet_DenseNet.html) obtained a classification performance of around 
90%.\n", "This is a considerable gap and shows that although Vision Transformers perform strongly on ImageNet with potential pretraining, they cannot come close to simple CNNs on CIFAR10 when being trained from scratch.\n", "The differences between a CNN and Transformer can be well observed in the training curves.\n", "Let's look at them in a tensorboard below:"]}, {"cell_type": "code", "execution_count": 12, "id": "88cc38e7", "metadata": {"execution": {"iopub.execute_input": "2021-10-10T16:36:16.703879Z", "iopub.status.busy": "2021-10-10T16:36:16.703404Z", "iopub.status.idle": "2021-10-10T16:36:16.705449Z", "shell.execute_reply": "2021-10-10T16:36:16.705045Z"}, "papermill": {"duration": 0.027779, "end_time": "2021-10-10T16:36:16.705553", "exception": false, "start_time": "2021-10-10T16:36:16.677774", "status": "completed"}, "tags": []}, "outputs": [], "source": ["# Opens tensorboard in notebook. Adjust the path to your CHECKPOINT_PATH!\n", "# %tensorboard --logdir ../saved_models/tutorial15/tensorboards/"]}, {"cell_type": "markdown", "id": "1b7c6344", "metadata": {"papermill": {"duration": 0.021202, "end_time": "2021-10-10T16:36:16.748363", "exception": false, "start_time": "2021-10-10T16:36:16.727161", "status": "completed"}, "tags": []}, "source": ["
"]}, {"cell_type": "markdown", "id": "26c6ac67", "metadata": {"papermill": {"duration": 0.02121, "end_time": "2021-10-10T16:36:16.790843", "exception": false, "start_time": "2021-10-10T16:36:16.769633", "status": "completed"}, "tags": []}, "source": ["The tensorboard compares the Vision Transformer to a ResNet trained on CIFAR10.\n", "When looking at the training losses, we see that the ResNet learns much more quickly in the first iterations.\n", "While the learning rate might have an influence on the initial learning speed, we see the same trend in the validation accuracy.\n", "The ResNet achieves the best performance of the Vision Transformer after just 5 epochs (2000 iterations).\n", "Further, while the ResNet training loss and validation accuracy have a similar trend, the validation performance of the Vision Transformers only marginally changes after 10k iterations while the training loss has almost just started going down.\n", "Yet, the Vision Transformer is also able to achieve close to 100% accuracy on the training set.\n", "\n", "All of these observed phenomena can be explained with a concept that we have visited before: inductive biases.\n", "Convolutional Neural Networks have been designed with the assumption that images are translation invariant.\n", "Hence, we apply convolutions with shared filters across the image.\n", "Furthermore, a CNN architecture integrates the concept of distance in an image: two pixels that are close to each other are more related than two distant pixels.\n", "Local patterns are combined into larger patterns, until we perform our classification prediction.\n", "All those aspects are inductive biases of a CNN.\n", "In contrast, a Vision Transformer does not know which two pixels are close to each other, and which are far apart.\n", "It has to learn this information solely from the sparse learning signal of the classification task.\n", "This is a huge disadvantage when we have a small dataset since such information is crucial for 
generalizing to an unseen test dataset.\n", "With large enough datasets and/or good pre-training, a Transformer can learn this information without the need of inductive biases, and instead is more flexible than a CNN.\n", "Especially long-distance relations between local patterns can be difficult to process in CNNs, while in Transformers, all patches have the distance of one.\n", "This is why Vision Transformers are so strong on large-scale datasets\n", "such as ImageNet, but underperform a lot when being applied to a small\n", "dataset such as CIFAR10."]}, {"cell_type": "markdown", "id": "5df010c9", "metadata": {"papermill": {"duration": 0.021723, "end_time": "2021-10-10T16:36:16.834866", "exception": false, "start_time": "2021-10-10T16:36:16.813143", "status": "completed"}, "tags": []}, "source": ["## Conclusion\n", "\n", "In this tutorial, we have implemented our own Vision Transformer from scratch and applied it on the task of image classification.\n", "Vision Transformers work by splitting an image into a sequence of smaller patches, use those as input to a standard Transformer encoder.\n", "While Vision Transformers achieved outstanding results on large-scale image recognition benchmarks such as ImageNet, they considerably underperform when being trained from scratch on small-scale datasets like CIFAR10.\n", "The reason is that in contrast to CNNs, Transformers do not have the inductive biases of translation invariance and the feature hierachy (i.e. 
larger patterns consist of many smaller patterns).\n", "However, these aspects can be learned when enough data is provided, or the model has been pre-trained on other large-scale tasks.\n", "Considering that Vision Transformers have just been proposed end of 2020, there is likely a lot more to come on Transformers for Computer Vision.\n", "\n", "\n", "### References\n", "\n", "Dosovitskiy, Alexey, et al.\n", "\"An image is worth 16x16 words: Transformers for image recognition at scale.\"\n", "International Conference on Representation Learning (2021).\n", "[link](https://arxiv.org/pdf/2010.11929.pdf)\n", "\n", "Chen, Xiangning, et al.\n", "\"When Vision Transformers Outperform ResNets without Pretraining or Strong Data Augmentations.\"\n", "arXiv preprint arXiv:2106.01548 (2021).\n", "[link](https://arxiv.org/abs/2106.01548)\n", "\n", "Tolstikhin, Ilya, et al.\n", "\"MLP-mixer: An all-MLP Architecture for Vision.\"\n", "arXiv preprint arXiv:2105.01601 (2021).\n", "[link](https://arxiv.org/abs/2105.01601)\n", "\n", "Xiong, Ruibin, et al.\n", "\"On layer normalization in the transformer architecture.\"\n", "International Conference on Machine Learning.\n", "PMLR, 2020.\n", "[link](http://proceedings.mlr.press/v119/xiong20b/xiong20b.pdf)"]}, {"cell_type": "markdown", "id": "18e70eed", "metadata": {"papermill": {"duration": 0.021621, "end_time": "2021-10-10T16:36:16.878164", "exception": false, "start_time": "2021-10-10T16:36:16.856543", "status": "completed"}, "tags": []}, "source": ["## Congratulations - Time to Join the Community!\n", "\n", "Congratulations on completing this notebook tutorial! If you enjoyed this and would like to join the Lightning\n", "movement, you can do so in the following ways!\n", "\n", "### Star [Lightning](https://github.com/PyTorchLightning/pytorch-lightning) on GitHub\n", "The easiest way to help our community is just by starring the GitHub repos! 
This helps raise awareness of the cool\n", "tools we're building.\n", "\n", "### Join our [Slack](https://join.slack.com/t/pytorch-lightning/shared_invite/zt-pw5v393p-qRaDgEk24~EjiZNBpSQFgQ)!\n", "The best way to keep up to date on the latest advancements is to join our community! Make sure to introduce yourself\n", "and share your interests in `#general` channel\n", "\n", "\n", "### Contributions !\n", "The best way to contribute to our community is to become a code contributor! At any time you can go to\n", "[Lightning](https://github.com/PyTorchLightning/pytorch-lightning) or [Bolt](https://github.com/PyTorchLightning/lightning-bolts)\n", "GitHub Issues page and filter for \"good first issue\".\n", "\n", "* [Lightning good first issue](https://github.com/PyTorchLightning/pytorch-lightning/issues?q=is%3Aopen+is%3Aissue+label%3A%22good+first+issue%22)\n", "* [Bolt good first issue](https://github.com/PyTorchLightning/lightning-bolts/issues?q=is%3Aopen+is%3Aissue+label%3A%22good+first+issue%22)\n", "* You can also contribute your own notebooks with useful examples !\n", "\n", "### Great thanks from the entire Pytorch Lightning Team for your interest !\n", "\n", "![Pytorch Lightning](){height=\"60px\" width=\"240px\"}"]}, {"cell_type": "raw", "metadata": {"raw_mimetype": "text/restructuredtext"}, "source": [".. customcarditem::\n", " :header: Tutorial 11: Vision Transformers\n", " :card_description: In this tutorial, we will take a closer look at a recent new trend: Transformers for Computer Vision. 
Since [Alexey Dosovitskiy et...\n", " :tags: Image,GPU/TPU,UvA-DL-Course\n", " :image: _static/images/course_UvA-DL/11-vision-transformer.jpg"]}], "metadata": {"jupytext": {"cell_metadata_filter": "colab,colab_type,id,-all", "formats": "ipynb,py:percent", "main_language": "python"}, "language_info": {"codemirror_mode": {"name": "ipython", "version": 3}, "file_extension": ".py", "mimetype": "text/x-python", "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.9.7"}, "papermill": {"default_parameters": {}, "duration": 17.019243, "end_time": "2021-10-10T16:36:17.607886", "environment_variables": {}, "exception": null, "input_path": "course_UvA-DL/11-vision-transformer/Vision_Transformer.ipynb", "output_path": ".notebooks/course_UvA-DL/11-vision-transformer.ipynb", "parameters": {}, "start_time": "2021-10-10T16:36:00.588643", "version": "2.3.3"}, "widgets": {"application/vnd.jupyter.widget-state+json": {"state": {"06ecaa193abb4c6599f94a9a7e64de8f": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_262db12adb4a4eb8a01537b1fbbac6a7", "IPY_MODEL_de04ee4e69b34edbb4623993191f18ff", "IPY_MODEL_34d1be73a2424261976f78e8ebd2f3b9"], "layout": "IPY_MODEL_3cf6ceecdcc04e9ea8214064fe78c0cc"}}, "07ce532be9e048b4a36844396612f0d6": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": 
"StyleView", "description_width": ""}}, "112f161d8d5e4d6892247a723f5c42d7": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_88a70622b99e4603992ebe4a8310647a", "placeholder": "\u200b", "style": "IPY_MODEL_07ce532be9e048b4a36844396612f0d6", "value": "Testing: 100%"}}, "21c8daba50c54686b687787528812f0a": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "24c3fc2871254a43a96cb796a4246134": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_be78b541f4774bcba63ff910d8f1ce22", "placeholder": "\u200b", "style": "IPY_MODEL_21c8daba50c54686b687787528812f0a", "value": " 40/40 [00:00<00:00, 47.98it/s]"}}, "262db12adb4a4eb8a01537b1fbbac6a7": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": 
"HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_d1ce9a66c073476d9c101cd69731611d", "placeholder": "\u200b", "style": "IPY_MODEL_654debaf094149e09b6c3423310b596c", "value": "Testing: 100%"}}, "2824556005cc42f79c31cbebe248b150": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_112f161d8d5e4d6892247a723f5c42d7", "IPY_MODEL_b29fce5508ba479589e3f4b0d0c593ae", "IPY_MODEL_24c3fc2871254a43a96cb796a4246134"], "layout": "IPY_MODEL_d1dd5a2d9d904ef3949b431c81e9f5ad"}}, "34d1be73a2424261976f78e8ebd2f3b9": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_8511d9a6c88540a893dd44dd16362e6b", "placeholder": "\u200b", "style": "IPY_MODEL_ce9b4471f190492182eb11d93560a81b", "value": " 79/79 [00:01<00:00, 49.85it/s]"}}, "3cf6ceecdcc04e9ea8214064fe78c0cc": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", 
"align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "654debaf094149e09b6c3423310b596c": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "688aa138fc5148bf85f1c48377198169": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, 
"justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "8511d9a6c88540a893dd44dd16362e6b": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "88a70622b99e4603992ebe4a8310647a": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, 
"flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "a5c301fa41b34ea29fc9e3745f950ce2": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "b29fce5508ba479589e3f4b0d0c593ae": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", 
"_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_a5c301fa41b34ea29fc9e3745f950ce2", "max": 1.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_d1bd9770a9c04cc687a41b9da1507b7c", "value": 1.0}}, "b4d671d57ae7430b9f8b46f5dd95be19": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "be78b541f4774bcba63ff910d8f1ce22": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, 
"visibility": null, "width": null}}, "ce9b4471f190492182eb11d93560a81b": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "d1bd9770a9c04cc687a41b9da1507b7c": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "d1ce9a66c073476d9c101cd69731611d": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": 
null, "top": null, "visibility": null, "width": null}}, "d1dd5a2d9d904ef3949b431c81e9f5ad": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "de04ee4e69b34edbb4623993191f18ff": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_688aa138fc5148bf85f1c48377198169", "max": 1.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_b4d671d57ae7430b9f8b46f5dd95be19", "value": 1.0}}}, "version_major": 2, "version_minor": 0}}}, "nbformat": 4, "nbformat_minor": 5} \ No newline at end of file 
diff --git a/source/notebooks/course_UvA-DL/12-meta-learning.ipynb b/source/notebooks/course_UvA-DL/12-meta-learning.ipynb deleted file mode 100644 index 5e56e5e..0000000 --- a/source/notebooks/course_UvA-DL/12-meta-learning.ipynb +++ /dev/null @@ -1 +0,0 @@ -{"cells": [{"cell_type": "markdown", "id": "e97dbf01", "metadata": {"papermill": {"duration": 0.035787, "end_time": "2021-10-10T16:36:26.406495", "exception": false, "start_time": "2021-10-10T16:36:26.370708", "status": "completed"}, "tags": []}, "source": ["\n", "# Tutorial 12: Meta-Learning - Learning to Learn\n", "\n", "* **Author:** Phillip Lippe\n", "* **License:** CC BY-SA\n", "* **Generated:** 2021-10-10T18:35:50.818431\n", "\n", "In this tutorial, we will discuss algorithms that learn models which can quickly adapt to new classes and/or tasks with few samples.\n", "This area of machine learning is called _Meta-Learning_ aiming at \"learning to learn\".\n", "Learning from very few examples is a natural task for humans. In contrast to current deep learning models, we need to see only a few examples of a police car or firetruck to recognize them in daily traffic.\n", "This is crucial ability since in real-world application, it is rarely the case that the data stays static and does not change over time.\n", "For example, an object detection system for mobile phones trained on data from 2000 will have troubles detecting today's common mobile phones, and thus, needs to adapt to new data without excessive label effort.\n", "The optimization techniques we have discussed so far struggle with this because they only aim at obtaining a good performance on a test set that had similar data.\n", "However, what if the test set has classes that we do not have in the training set?\n", "Or what if we want to test the model on a completely different task?\n", "We will discuss and implement three common Meta-Learning algorithms for such situations.\n", "This notebook is part of a lecture series on Deep Learning at the 
University of Amsterdam.\n", "The full list of tutorials can be found at https://uvadlc-notebooks.rtfd.io.\n", "\n", "\n", "---\n", "Open in [![Open In Colab](){height=\"20px\" width=\"117px\"}](https://colab.research.google.com/github/PytorchLightning/lightning-tutorials/blob/publication/.notebooks/course_UvA-DL/12-meta-learning.ipynb)\n", "\n", "Give us a \u2b50 [on Github](https://www.github.com/PytorchLightning/pytorch-lightning/)\n", "| Check out [the documentation](https://pytorch-lightning.readthedocs.io/en/latest/)\n", "| Join us [on Slack](https://join.slack.com/t/pytorch-lightning/shared_invite/zt-pw5v393p-qRaDgEk24~EjiZNBpSQFgQ)"]}, {"cell_type": "markdown", "id": "89d6c708", "metadata": {"papermill": {"duration": 0.034571, "end_time": "2021-10-10T16:36:26.475148", "exception": false, "start_time": "2021-10-10T16:36:26.440577", "status": "completed"}, "tags": []}, "source": ["## Setup\n", "This notebook requires some packages besides pytorch-lightning."]}, {"cell_type": "code", "execution_count": 1, "id": "2350fea0", "metadata": {"colab": {}, "colab_type": "code", "execution": {"iopub.execute_input": "2021-10-10T16:36:26.546320Z", "iopub.status.busy": "2021-10-10T16:36:26.545801Z", "iopub.status.idle": "2021-10-10T16:36:26.547964Z", "shell.execute_reply": "2021-10-10T16:36:26.548348Z"}, "id": "LfrJLKPFyhsK", "lines_to_next_cell": 0, "papermill": {"duration": 0.039795, "end_time": "2021-10-10T16:36:26.548525", "exception": false, "start_time": "2021-10-10T16:36:26.508730", "status": "completed"}, "tags": []}, "outputs": [], "source": ["# ! pip install --quiet \"torch>=1.6, <1.9\" \"matplotlib\" \"torchmetrics>=0.3\" \"seaborn\" \"torchvision\" \"pytorch-lightning>=1.3\""]}, {"cell_type": "markdown", "id": "5bc75be2", "metadata": {"papermill": {"duration": 0.033967, "end_time": "2021-10-10T16:36:26.617046", "exception": false, "start_time": "2021-10-10T16:36:26.583079", "status": "completed"}, "tags": []}, "source": ["
\n", "Meta-Learning offers solutions to these situations, and we will discuss three popular algorithms: __Prototypical Networks__ ([Snell et al., 2017](https://arxiv.org/pdf/1703.05175.pdf)), __Model-Agnostic Meta-Learning / MAML__ ([Finn et al., 2017](http://proceedings.mlr.press/v70/finn17a.html)), and __Proto-MAML__ ([Triantafillou et al., 2020](https://openreview.net/pdf?id=rkgAGAVKPr)).\n", "We will focus on the task of few-shot classification where the training and test set have distinct sets of classes.\n", "For instance, we would train the model on the binary classifications of cats-birds and flowers-bikes, but during test time, the model would need to learn from 4 examples each the difference between dogs and otters, two classes we have not seen during training (Figure credit - [Lilian Weng](https://lilianweng.github.io/lil-log/2018/11/30/meta-learning.html)).\n", "\n", "
\n", "\n", "A different setup, which is very common in Reinforcement Learning and recently Natural Language Processing, is to aim at few-shot learning of a completely new task.\n", "For example, an robot agent that learned to run, jump and pick up boxes, should quickly adapt to collecting and stacking boxes.\n", "In NLP, we can think of a model which was trained sentiment classification, hatespeech detection and sarcasm classification, to adapt to classifying the emotion of a text.\n", "All methods we will discuss in this notebook can be easily applied to these settings since we only use a different definition of a 'task'.\n", "For few-shot classification, we consider a task to distinguish between $M$ novel classes.\n", "Here, we would not only have novel classes, but also a completely different dataset.\n", "\n", "First of all, let's start with importing our standard libraries. We will again be using PyTorch Lightning."]}, {"cell_type": "code", "execution_count": 2, "id": "a414f0fb", "metadata": {"execution": {"iopub.execute_input": "2021-10-10T16:36:26.695087Z", "iopub.status.busy": "2021-10-10T16:36:26.694610Z", "iopub.status.idle": "2021-10-10T16:36:28.445235Z", "shell.execute_reply": "2021-10-10T16:36:28.444817Z"}, "papermill": {"duration": 1.794133, "end_time": "2021-10-10T16:36:28.445346", "exception": false, "start_time": "2021-10-10T16:36:26.651213", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["/tmp/ipykernel_739/3072189054.py:29: DeprecationWarning: `set_matplotlib_formats` is deprecated since IPython 7.23, directly use `matplotlib_inline.backend_inline.set_matplotlib_formats()`\n", " set_matplotlib_formats(\"svg\", \"pdf\") # For export\n", "Global seed set to 42\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Device: cuda:0\n"]}, {"data": {"text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}], "source": ["import json\n", "import os\n", "import random\n", "import urllib.request\n", "from collections import defaultdict\n", "from copy import deepcopy\n", "from statistics import mean, stdev\n", "from urllib.error import HTTPError\n", "\n", "import matplotlib\n", "import matplotlib.pyplot as plt\n", "import numpy as np\n", "import pytorch_lightning as pl\n", "import seaborn as sns\n", "import torch\n", "import torch.nn.functional as F\n", "import torch.optim as optim\n", "import torch.utils.data as data\n", "import torchvision\n", "from IPython.display import set_matplotlib_formats\n", "from PIL import Image\n", "from pytorch_lightning.callbacks import LearningRateMonitor, ModelCheckpoint\n", "from torchvision import transforms\n", "from torchvision.datasets import CIFAR100, SVHN\n", "from tqdm.auto import tqdm\n", "\n", "plt.set_cmap(\"cividis\")\n", "# %matplotlib inline\n", "set_matplotlib_formats(\"svg\", \"pdf\") # For export\n", "matplotlib.rcParams[\"lines.linewidth\"] = 2.0\n", "sns.reset_orig()\n", "\n", "# Import tensorboard\n", "# %load_ext tensorboard\n", "\n", "# Path to the folder where the datasets are/should be downloaded (e.g. 
CIFAR10)\n", "DATASET_PATH = os.environ.get(\"PATH_DATASETS\", \"data/\")\n", "# Path to the folder where the pretrained models are saved\n", "CHECKPOINT_PATH = os.environ.get(\"PATH_CHECKPOINT\", \"saved_models/MetaLearning/\")\n", "\n", "# Setting the seed\n", "pl.seed_everything(42)\n", "\n", "# Ensure that all operations are deterministic on GPU (if used) for reproducibility\n", "torch.backends.cudnn.determinstic = True\n", "torch.backends.cudnn.benchmark = False\n", "\n", "device = torch.device(\"cuda:0\") if torch.cuda.is_available() else torch.device(\"cpu\")\n", "print(\"Device:\", device)"]}, {"cell_type": "markdown", "id": "ce51286e", "metadata": {"papermill": {"duration": 0.034776, "end_time": "2021-10-10T16:36:28.518803", "exception": false, "start_time": "2021-10-10T16:36:28.484027", "status": "completed"}, "tags": []}, "source": ["Training the models in this notebook can take between 2 and 8 hours, and the evaluation time of some algorithms is in the span of couples of minutes.\n", "Hence, we download pre-trained models and results below."]}, {"cell_type": "code", "execution_count": 3, "id": "fddcdeaa", "metadata": {"execution": {"iopub.execute_input": "2021-10-10T16:36:28.594883Z", "iopub.status.busy": "2021-10-10T16:36:28.594389Z", "iopub.status.idle": "2021-10-10T16:36:29.453405Z", "shell.execute_reply": "2021-10-10T16:36:29.452919Z"}, "papermill": {"duration": 0.899529, "end_time": "2021-10-10T16:36:29.453517", "exception": false, "start_time": "2021-10-10T16:36:28.553988", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Downloading https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial16/ProtoNet.ckpt...\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Downloading https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial16/ProtoMAML.ckpt...\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Downloading 
https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial16/tensorboards/ProtoNet/events.out.tfevents.ProtoNet...\n", "Downloading https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial16/tensorboards/ProtoMAML/events.out.tfevents.ProtoMAML...\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Downloading https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial16/protomaml_fewshot.json...\n", "Downloading https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial16/protomaml_svhn_fewshot.json...\n"]}], "source": ["# Github URL where saved models are stored for this tutorial\n", "base_url = \"https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial16/\"\n", "# Files to download\n", "pretrained_files = [\n", " \"ProtoNet.ckpt\",\n", " \"ProtoMAML.ckpt\",\n", " \"tensorboards/ProtoNet/events.out.tfevents.ProtoNet\",\n", " \"tensorboards/ProtoMAML/events.out.tfevents.ProtoMAML\",\n", " \"protomaml_fewshot.json\",\n", " \"protomaml_svhn_fewshot.json\",\n", "]\n", "# Create checkpoint path if it doesn't exist yet\n", "os.makedirs(CHECKPOINT_PATH, exist_ok=True)\n", "\n", "# For each file, check whether it already exists. If not, try downloading it.\n", "for file_name in pretrained_files:\n", " file_path = os.path.join(CHECKPOINT_PATH, file_name)\n", " if \"/\" in file_name:\n", " os.makedirs(file_path.rsplit(\"/\", 1)[0], exist_ok=True)\n", " if not os.path.isfile(file_path):\n", " file_url = base_url + file_name\n", " print(\"Downloading %s...\" % file_url)\n", " try:\n", " urllib.request.urlretrieve(file_url, file_path)\n", " except HTTPError as e:\n", " print(\n", " \"Something went wrong. 
Please try to download the file from the GDrive folder, or contact the author with the full output including the following error:\\n\",\n", " e,\n", " )"]}, {"cell_type": "markdown", "id": "96d108b7", "metadata": {"papermill": {"duration": 0.038624, "end_time": "2021-10-10T16:36:29.528397", "exception": false, "start_time": "2021-10-10T16:36:29.489773", "status": "completed"}, "tags": []}, "source": ["## Few-shot classification\n", "\n", "We start our implementation by discussing the dataset setup.\n", "In this notebook, we will use CIFAR100 which we have already seen in Tutorial 6.\n", "CIFAR100 has 100 classes each with 600 images of size $32\\times 32$ pixels.\n", "Instead of splitting the training, validation and test set over examples, we will split them over classes: we will use 80 classes for training, and 10 for validation and 10 for testing.\n", "Our overall goal is to obtain a model that can distinguish between the 10 test classes with seeing very little examples.\n", "First, let's load the dataset and visualize some examples."]}, {"cell_type": "code", "execution_count": 4, "id": "2a4a4c43", "metadata": {"execution": {"iopub.execute_input": "2021-10-10T16:36:29.603641Z", "iopub.status.busy": "2021-10-10T16:36:29.603170Z", "iopub.status.idle": "2021-10-10T16:36:34.357455Z", "shell.execute_reply": "2021-10-10T16:36:34.357029Z"}, "papermill": {"duration": 4.793304, "end_time": "2021-10-10T16:36:34.357578", "exception": false, "start_time": "2021-10-10T16:36:29.564274", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Downloading https://www.cs.toronto.edu/~kriz/cifar-100-python.tar.gz to /__w/1/s/.datasets/cifar-100-python.tar.gz\n"]}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "f523d40c013f4da7bc639dc9291509e8", "version_major": 2, "version_minor": 0}, "text/plain": [" 0%| | 0/169001437 [00:00\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-10-10T18:36:34.496593\n", " 
image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}], "source": ["# Visualize some examples\n", "NUM_IMAGES = 12\n", "cifar_images = [cifar_train_set[np.random.randint(len(cifar_train_set))][0] for idx in range(NUM_IMAGES)]\n", "cifar_images = torch.stack(cifar_images, dim=0)\n", "img_grid = torchvision.utils.make_grid(cifar_images, nrow=6, normalize=True, pad_value=0.9)\n", "img_grid = img_grid.permute(1, 2, 0)\n", "\n", "plt.figure(figsize=(8, 8))\n", "plt.title(\"Image examples of the CIFAR100 dataset\")\n", "plt.imshow(img_grid)\n", "plt.axis(\"off\")\n", "plt.show()\n", "plt.close()"]}, {"cell_type": "markdown", "id": "6393f96b", "metadata": {"papermill": {"duration": 0.041466, "end_time": "2021-10-10T16:36:34.711913", "exception": false, "start_time": "2021-10-10T16:36:34.670447", "status": "completed"}, "tags": []}, "source": ["### Data preprocessing\n", "\n", "Next, we need to prepare the dataset in the training, validation and test split as mentioned before.\n", "The torchvision package gives us the training and test set as two separate dataset objects.\n", "The next code cells will merge the original training and test set, and then create the new train-val-test split."]}, {"cell_type": "code", "execution_count": 6, "id": "ce60f407", "metadata": {"execution": {"iopub.execute_input": "2021-10-10T16:36:34.798013Z", "iopub.status.busy": "2021-10-10T16:36:34.797539Z", "iopub.status.idle": "2021-10-10T16:36:34.875295Z", "shell.execute_reply": "2021-10-10T16:36:34.875698Z"}, "papermill": {"duration": 0.122697, "end_time": "2021-10-10T16:36:34.875846", "exception": false, "start_time": "2021-10-10T16:36:34.753149", "status": "completed"}, "tags": []}, "outputs": [], "source": ["# Merging original training and test set\n", "cifar_all_images = np.concatenate([cifar_train_set.data, cifar_test_set.data], axis=0)\n", "cifar_all_targets = torch.LongTensor(cifar_train_set.targets + cifar_test_set.targets)"]}, {"cell_type": "markdown", "id": 
"3f939d72", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.040873, "end_time": "2021-10-10T16:36:34.959229", "exception": false, "start_time": "2021-10-10T16:36:34.918356", "status": "completed"}, "tags": []}, "source": ["To have an easier time handling the dataset, we define our own, simple dataset class below.\n", "It takes a set of images, labels/targets, and image transformations, and\n", "returns the corresponding images and labels element-wise."]}, {"cell_type": "code", "execution_count": 7, "id": "83d1fcac", "metadata": {"execution": {"iopub.execute_input": "2021-10-10T16:36:35.051943Z", "iopub.status.busy": "2021-10-10T16:36:35.051455Z", "iopub.status.idle": "2021-10-10T16:36:35.053594Z", "shell.execute_reply": "2021-10-10T16:36:35.053130Z"}, "papermill": {"duration": 0.053299, "end_time": "2021-10-10T16:36:35.053692", "exception": false, "start_time": "2021-10-10T16:36:35.000393", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class ImageDataset(data.Dataset):\n", " def __init__(self, imgs, targets, img_transform=None):\n", " \"\"\"\n", " Inputs:\n", " imgs - Numpy array of shape [N,32,32,3] containing all images.\n", " targets - PyTorch array of shape [N] containing all labels.\n", " img_transform - A torchvision transformation that should be applied\n", " to the images before returning. 
If none, no transformation\n", " is applied.\n", " \"\"\"\n", " super().__init__()\n", " self.img_transform = img_transform\n", " self.imgs = imgs\n", " self.targets = targets\n", "\n", " def __getitem__(self, idx):\n", " img, target = self.imgs[idx], self.targets[idx]\n", " img = Image.fromarray(img)\n", "\n", " if self.img_transform is not None:\n", " img = self.img_transform(img)\n", "\n", " return img, target\n", "\n", " def __len__(self):\n", " return self.imgs.shape[0]"]}, {"cell_type": "markdown", "id": "8afc6b05", "metadata": {"papermill": {"duration": 0.041697, "end_time": "2021-10-10T16:36:35.136827", "exception": false, "start_time": "2021-10-10T16:36:35.095130", "status": "completed"}, "tags": []}, "source": ["Now, we can create the class splits.\n", "We will assign the classes randomly to training, validation and test, and use a 80%-10%-10% split."]}, {"cell_type": "code", "execution_count": 8, "id": "5ff3abd6", "metadata": {"execution": {"iopub.execute_input": "2021-10-10T16:36:35.223236Z", "iopub.status.busy": "2021-10-10T16:36:35.222768Z", "iopub.status.idle": "2021-10-10T16:36:35.226508Z", "shell.execute_reply": "2021-10-10T16:36:35.226037Z"}, "papermill": {"duration": 0.048464, "end_time": "2021-10-10T16:36:35.226609", "exception": false, "start_time": "2021-10-10T16:36:35.178145", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["Global seed set to 0\n"]}], "source": ["pl.seed_everything(0) # Set seed for reproducibility\n", "classes = torch.randperm(100) # Returns random permutation of numbers 0 to 99\n", "train_classes, val_classes, test_classes = classes[:80], classes[80:90], classes[90:]"]}, {"cell_type": "markdown", "id": "32cdc6d7", "metadata": {"papermill": {"duration": 0.042958, "end_time": "2021-10-10T16:36:35.311335", "exception": false, "start_time": "2021-10-10T16:36:35.268377", "status": "completed"}, "tags": []}, "source": ["To get an intuition of the validation and test classes, 
we print the class names below:"]}, {"cell_type": "code", "execution_count": 9, "id": "3ba456f9", "metadata": {"execution": {"iopub.execute_input": "2021-10-10T16:36:35.405497Z", "iopub.status.busy": "2021-10-10T16:36:35.405025Z", "iopub.status.idle": "2021-10-10T16:36:35.408515Z", "shell.execute_reply": "2021-10-10T16:36:35.408107Z"}, "papermill": {"duration": 0.052713, "end_time": "2021-10-10T16:36:35.408617", "exception": false, "start_time": "2021-10-10T16:36:35.355904", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Validation classes: ['caterpillar', 'castle', 'skunk', 'ray', 'bus', 'motorcycle', 'keyboard', 'chimpanzee', 'possum', 'tiger']\n", "Test classes: ['kangaroo', 'crocodile', 'butterfly', 'shark', 'forest', 'pickup_truck', 'telephone', 'lion', 'worm', 'mushroom']\n"]}], "source": ["# Printing validation and test classes\n", "idx_to_class = {val: key for key, val in cifar_train_set.class_to_idx.items()}\n", "print(\"Validation classes:\", [idx_to_class[c.item()] for c in val_classes])\n", "print(\"Test classes:\", [idx_to_class[c.item()] for c in test_classes])"]}, {"cell_type": "markdown", "id": "ce1f7d09", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.041936, "end_time": "2021-10-10T16:36:35.493337", "exception": false, "start_time": "2021-10-10T16:36:35.451401", "status": "completed"}, "tags": []}, "source": ["As we can see, the classes have quite some variety and some classes might be easier to distinguish than others.\n", "For instance, in the test classes, 'pickup_truck' is the only vehicle while the classes 'mushroom', 'worm' and 'forest' might be harder to keep apart.\n", "Remember that we want to learn the classification of those ten classes from 80 other classes in our training set, and few examples from the actual test classes.\n", "We will experiment with the number of examples per class.\n", "\n", "Finally, we can create the training, validation and test dataset 
according to our split above.\n", "For this, we create dataset objects of our previously defined class `ImageDataset`."]}, {"cell_type": "code", "execution_count": 10, "id": "32f068d1", "metadata": {"execution": {"iopub.execute_input": "2021-10-10T16:36:35.581555Z", "iopub.status.busy": "2021-10-10T16:36:35.581087Z", "iopub.status.idle": "2021-10-10T16:36:35.583171Z", "shell.execute_reply": "2021-10-10T16:36:35.582711Z"}, "papermill": {"duration": 0.04763, "end_time": "2021-10-10T16:36:35.583269", "exception": false, "start_time": "2021-10-10T16:36:35.535639", "status": "completed"}, "tags": []}, "outputs": [], "source": ["def dataset_from_labels(imgs, targets, class_set, **kwargs):\n", " class_mask = (targets[:, None] == class_set[None, :]).any(dim=-1)\n", " return ImageDataset(imgs=imgs[class_mask], targets=targets[class_mask], **kwargs)"]}, {"cell_type": "markdown", "id": "e8d4fb26", "metadata": {"papermill": {"duration": 0.041782, "end_time": "2021-10-10T16:36:35.667114", "exception": false, "start_time": "2021-10-10T16:36:35.625332", "status": "completed"}, "tags": []}, "source": ["As in our experiments before on CIFAR in Tutorial 5, 6 and 9, we normalize the dataset.\n", "Additionally, we use small augmentations during training to prevent overfitting."]}, {"cell_type": "code", "execution_count": 11, "id": "25bb398a", "metadata": {"execution": {"iopub.execute_input": "2021-10-10T16:36:35.757452Z", "iopub.status.busy": "2021-10-10T16:36:35.756975Z", "iopub.status.idle": "2021-10-10T16:36:38.059891Z", "shell.execute_reply": "2021-10-10T16:36:38.059376Z"}, "papermill": {"duration": 2.350192, "end_time": "2021-10-10T16:36:38.060028", "exception": false, "start_time": "2021-10-10T16:36:35.709836", "status": "completed"}, "tags": []}, "outputs": [], "source": ["DATA_MEANS = (cifar_train_set.data / 255.0).mean(axis=(0, 1, 2))\n", "DATA_STD = (cifar_train_set.data / 255.0).std(axis=(0, 1, 2))\n", "\n", "test_transform = transforms.Compose([transforms.ToTensor(), 
transforms.Normalize(DATA_MEANS, DATA_STD)])\n", "# For training, we add some augmentation.\n", "train_transform = transforms.Compose(\n", " [\n", " transforms.RandomHorizontalFlip(),\n", " transforms.RandomResizedCrop((32, 32), scale=(0.8, 1.0), ratio=(0.9, 1.1)),\n", " transforms.ToTensor(),\n", " transforms.Normalize(DATA_MEANS, DATA_STD),\n", " ]\n", ")\n", "\n", "train_set = dataset_from_labels(cifar_all_images, cifar_all_targets, train_classes, img_transform=train_transform)\n", "val_set = dataset_from_labels(cifar_all_images, cifar_all_targets, val_classes, img_transform=test_transform)\n", "test_set = dataset_from_labels(cifar_all_images, cifar_all_targets, test_classes, img_transform=test_transform)"]}, {"cell_type": "markdown", "id": "3456a8f9", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.042069, "end_time": "2021-10-10T16:36:38.145286", "exception": false, "start_time": "2021-10-10T16:36:38.103217", "status": "completed"}, "tags": []}, "source": ["### Data sampling\n", "\n", "The strategy of how to use the available training data for learning few-shot adaptation is crucial in meta-learning.\n", "All three algorithms that we discuss here have a similar idea: simulate few-shot learning during training.\n", "Specifically, at each training step, we randomly select a small number of classes, and sample a small number of examples for each class.\n", "This represents our few-shot training batch, which we also refer to as **support set**.\n", "Additionally, we sample a second set of examples from the same classes, and refer to this batch as **query set**.\n", "Our training objective is to classify the query set correctly from seeing the support set and its corresponding labels.\n", "The main difference between our three methods (ProtoNet, MAML, and Proto-MAML) is in how they use the support set to adapt to the training classes.\n", "\n", "This subsection summarizes the code that is needed to create such training batches.\n", "In PyTorch, we 
can specify the data sampling procedure by so-called `Sampler` ([documentation](https://pytorch.org/docs/stable/data.html#data-loading-order-and-sampler)).\n", "Samplers are iterable objects that return indices in the order in which the data elements should be sampled.\n", "In our previous notebooks, we usually used the option `shuffle=True` in the `data.DataLoader` objects which creates a sampler returning the data indices in a random order.\n", "Here, we focus on samplers that return batches of indices that correspond to support and query set batches.\n", "Below, we implement such a sampler."]}, {"cell_type": "code", "execution_count": 12, "id": "c0bad2d9", "metadata": {"execution": {"iopub.execute_input": "2021-10-10T16:36:38.237449Z", "iopub.status.busy": "2021-10-10T16:36:38.236947Z", "iopub.status.idle": "2021-10-10T16:36:38.243012Z", "shell.execute_reply": "2021-10-10T16:36:38.242609Z"}, "papermill": {"duration": 0.055637, "end_time": "2021-10-10T16:36:38.243112", "exception": false, "start_time": "2021-10-10T16:36:38.187475", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class FewShotBatchSampler:\n", " def __init__(self, dataset_targets, N_way, K_shot, include_query=False, shuffle=True, shuffle_once=False):\n", " \"\"\"\n", " Inputs:\n", " dataset_targets - PyTorch tensor of the labels of the data elements.\n", " N_way - Number of classes to sample per batch.\n", " K_shot - Number of examples to sample per class in the batch.\n", " include_query - If True, returns batch of size N_way*K_shot*2, which\n", " can be split into support and query set. 
Simplifies\n", " the implementation of sampling the same classes but\n", " distinct examples for support and query set.\n", " shuffle - If True, examples and classes are newly shuffled in each\n", " iteration (for training)\n", " shuffle_once - If True, examples and classes are shuffled once in\n", " the beginning, but kept constant across iterations\n", " (for validation)\n", " \"\"\"\n", " super().__init__()\n", " self.dataset_targets = dataset_targets\n", " self.N_way = N_way\n", " self.K_shot = K_shot\n", " self.shuffle = shuffle\n", " self.include_query = include_query\n", " if self.include_query:\n", " self.K_shot *= 2\n", " self.batch_size = self.N_way * self.K_shot # Number of overall images per batch\n", "\n", " # Organize examples by class\n", " self.classes = torch.unique(self.dataset_targets).tolist()\n", " self.num_classes = len(self.classes)\n", " self.indices_per_class = {}\n", " self.batches_per_class = {} # Number of K-shot batches that each class can provide\n", " for c in self.classes:\n", " self.indices_per_class[c] = torch.where(self.dataset_targets == c)[0]\n", " self.batches_per_class[c] = self.indices_per_class[c].shape[0] // self.K_shot\n", "\n", " # Create a list of classes from which we select the N classes per batch\n", " self.iterations = sum(self.batches_per_class.values()) // self.N_way\n", " self.class_list = [c for c in self.classes for _ in range(self.batches_per_class[c])]\n", " if shuffle_once or self.shuffle:\n", " self.shuffle_data()\n", " else:\n", " # For testing, we iterate over classes instead of shuffling them\n", " sort_idxs = [\n", " i + p * self.num_classes for i, c in enumerate(self.classes) for p in range(self.batches_per_class[c])\n", " ]\n", " self.class_list = np.array(self.class_list)[np.argsort(sort_idxs)].tolist()\n", "\n", " def shuffle_data(self):\n", " # Shuffle the examples per class\n", " for c in self.classes:\n", " perm = torch.randperm(self.indices_per_class[c].shape[0])\n", " self.indices_per_class[c] = 
self.indices_per_class[c][perm]\n", " # Shuffle the class list from which we sample. Note that this way of shuffling\n", " # does not prevent to choose the same class twice in a batch. However, for\n", " # training and validation, this is not a problem.\n", " random.shuffle(self.class_list)\n", "\n", " def __iter__(self):\n", " # Shuffle data\n", " if self.shuffle:\n", " self.shuffle_data()\n", "\n", " # Sample few-shot batches\n", " start_index = defaultdict(int)\n", " for it in range(self.iterations):\n", " class_batch = self.class_list[it * self.N_way : (it + 1) * self.N_way] # Select N classes for the batch\n", " index_batch = []\n", " for c in class_batch: # For each class, select the next K examples and add them to the batch\n", " index_batch.extend(self.indices_per_class[c][start_index[c] : start_index[c] + self.K_shot])\n", " start_index[c] += self.K_shot\n", " if self.include_query: # If we return support+query set, sort them so that they are easy to split\n", " index_batch = index_batch[::2] + index_batch[1::2]\n", " yield index_batch\n", "\n", " def __len__(self):\n", " return self.iterations"]}, {"cell_type": "markdown", "id": "966baf43", "metadata": {"papermill": {"duration": 0.041981, "end_time": "2021-10-10T16:36:38.327241", "exception": false, "start_time": "2021-10-10T16:36:38.285260", "status": "completed"}, "tags": []}, "source": ["Now, we can create our intended data loaders by passing an object of `FewShotBatchSampler` as `batch_sampler=...` input to the PyTorch data loader object.\n", "For our experiments, we will use a 5-class 4-shot training setting.\n", "This means that each support set contains 5 classes with 4 examples each, i.e., 20 images overall.\n", "Usually, it is good to keep the number of shots equal to the number that you aim to test on.\n", "However, we will experiment later with different number of shots, and hence, we pick 4 as a compromise for now.\n", "To get the best performing model, it is recommended to consider the\n", 
"number of training shots as hyperparameter in a grid search."]}, {"cell_type": "code", "execution_count": 13, "id": "6e5eee4a", "metadata": {"execution": {"iopub.execute_input": "2021-10-10T16:36:38.415592Z", "iopub.status.busy": "2021-10-10T16:36:38.415120Z", "iopub.status.idle": "2021-10-10T16:36:38.437251Z", "shell.execute_reply": "2021-10-10T16:36:38.436842Z"}, "papermill": {"duration": 0.068099, "end_time": "2021-10-10T16:36:38.437354", "exception": false, "start_time": "2021-10-10T16:36:38.369255", "status": "completed"}, "tags": []}, "outputs": [], "source": ["N_WAY = 5\n", "K_SHOT = 4\n", "train_data_loader = data.DataLoader(\n", " train_set,\n", " batch_sampler=FewShotBatchSampler(train_set.targets, include_query=True, N_way=N_WAY, K_shot=K_SHOT, shuffle=True),\n", " num_workers=4,\n", ")\n", "val_data_loader = data.DataLoader(\n", " val_set,\n", " batch_sampler=FewShotBatchSampler(\n", " val_set.targets, include_query=True, N_way=N_WAY, K_shot=K_SHOT, shuffle=False, shuffle_once=True\n", " ),\n", " num_workers=4,\n", ")"]}, {"cell_type": "markdown", "id": "3105a10e", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.042422, "end_time": "2021-10-10T16:36:38.521966", "exception": false, "start_time": "2021-10-10T16:36:38.479544", "status": "completed"}, "tags": []}, "source": ["For simplicity, we implemented the sampling of a support and query set as sampling a support set with twice the number of examples.\n", "After sampling a batch from the data loader, we need to split it into a support and query set.\n", "We can summarize this step in the following function:"]}, {"cell_type": "code", "execution_count": 14, "id": "928a254e", "metadata": {"execution": {"iopub.execute_input": "2021-10-10T16:36:38.609800Z", "iopub.status.busy": "2021-10-10T16:36:38.608312Z", "iopub.status.idle": "2021-10-10T16:36:38.611864Z", "shell.execute_reply": "2021-10-10T16:36:38.611397Z"}, "papermill": {"duration": 0.048021, "end_time": "2021-10-10T16:36:38.611980", 
"exception": false, "start_time": "2021-10-10T16:36:38.563959", "status": "completed"}, "tags": []}, "outputs": [], "source": ["def split_batch(imgs, targets):\n", " support_imgs, query_imgs = imgs.chunk(2, dim=0)\n", " support_targets, query_targets = targets.chunk(2, dim=0)\n", " return support_imgs, query_imgs, support_targets, query_targets"]}, {"cell_type": "markdown", "id": "ac8356fb", "metadata": {"papermill": {"duration": 0.041927, "end_time": "2021-10-10T16:36:38.696240", "exception": false, "start_time": "2021-10-10T16:36:38.654313", "status": "completed"}, "tags": []}, "source": ["Finally, to ensure that our implementation of the data sampling process is correct, we can sample a batch and visualize its support and query set.\n", "What we would like to see is that the support and query set have the same classes, but distinct examples."]}, {"cell_type": "code", "execution_count": 15, "id": "18340de4", "metadata": {"execution": {"iopub.execute_input": "2021-10-10T16:36:38.786640Z", "iopub.status.busy": "2021-10-10T16:36:38.786168Z", "iopub.status.idle": "2021-10-10T16:36:39.045016Z", "shell.execute_reply": "2021-10-10T16:36:39.044567Z"}, "papermill": {"duration": 0.306369, "end_time": "2021-10-10T16:36:39.045134", "exception": false, "start_time": "2021-10-10T16:36:38.738765", "status": "completed"}, "tags": []}, "outputs": [], "source": ["imgs, targets = next(iter(val_data_loader)) # We use the validation set since it does not apply augmentations\n", "support_imgs, query_imgs, _, _ = split_batch(imgs, targets)\n", "support_grid = torchvision.utils.make_grid(support_imgs, nrow=K_SHOT, normalize=True, pad_value=0.9)\n", "support_grid = support_grid.permute(1, 2, 0)\n", "query_grid = torchvision.utils.make_grid(query_imgs, nrow=K_SHOT, normalize=True, pad_value=0.9)\n", "query_grid = query_grid.permute(1, 2, 0)\n", "\n", "fig, ax = plt.subplots(1, 2, figsize=(8, 5))\n", "ax[0].imshow(support_grid)\n", "ax[0].set_title(\"Support set\")\n", 
"ax[0].axis(\"off\")\n", "ax[1].imshow(query_grid)\n", "ax[1].set_title(\"Query set\")\n", "ax[1].axis(\"off\")\n", "fig.suptitle(\"Few Shot Batch\", weight=\"bold\")\n", "fig.show()\n", "plt.close(fig)"]}, {"cell_type": "markdown", "id": "06b51e8e", "metadata": {"papermill": {"duration": 0.042585, "end_time": "2021-10-10T16:36:39.130534", "exception": false, "start_time": "2021-10-10T16:36:39.087949", "status": "completed"}, "tags": []}, "source": ["As we can see, the support and query set have the same five classes, but different examples.\n", "The models will be tasked to classify the examples in the query set by learning from the support set and its labels.\n", "With the data sampling in place, we can now start to implement our first meta-learning model: Prototypical Networks."]}, {"cell_type": "markdown", "id": "40315428", "metadata": {"papermill": {"duration": 0.042341, "end_time": "2021-10-10T16:36:39.214888", "exception": false, "start_time": "2021-10-10T16:36:39.172547", "status": "completed"}, "tags": []}, "source": ["## Prototypical Networks\n", "\n", "
"]}, {"cell_type": "markdown", "id": "e32fdcd0", "metadata": {"papermill": {"duration": 0.042438, "end_time": "2021-10-10T16:36:39.299755", "exception": false, "start_time": "2021-10-10T16:36:39.257317", "status": "completed"}, "tags": []}, "source": ["The Prototypical Network, or ProtoNet for short, is a metric-based meta-learning algorithm which operates similar to a nearest neighbor classification.\n", "Metric-based meta-learning methods classify a new example $\\mathbf{x}$ based on some distance function $d_{\\varphi}$ between $x$ and all elements in the support set.\n", "ProtoNets implements this idea with the concept of prototypes in a learned feature space.\n", "First, ProtoNet uses an embedding function $f_{\\theta}$ to encode each input in the support set into a $L$-dimensional feature vector.\n", "Next, for each class $c$, we collect the feature vectors of all examples with label $c$, and average their feature vectors.\n", "Formally, we can define this as:\n", "\n", "$$\\mathbf{v}_c=\\frac{1}{|S_c|}\\sum_{(\\mathbf{x}_i,y_i)\\in S_c}f_{\\theta}(\\mathbf{x}_i)$$\n", "\n", "where $S_c$ is the part of the support set $S$ for which $y_i=c$, and $\\mathbf{v}_c$ represents the _prototype_ of class $c$.\n", "The prototype calculation is visualized below for a 2-dimensional feature space and 3 classes (Figure credit - [Snell et al.](https://arxiv.org/pdf/1703.05175.pdf)).\n", "The colored dots represent encoded support elements with color-corresponding class label, and the black dots next to the class label are the averaged prototypes.\n", "\n", "
\n", "\n", "Based on these prototypes, we want to classify a new example.\n", "Remember that since we want to learn the encoding function $f_{\\theta}$, this classification must be differentiable and hence, we need to define a probability distribution across classes.\n", "For this, we will make use of the distance function $d_{\\varphi}$: the closer a new example $\\mathbf{x}$ is to a prototype $\\mathbf{v}_c$, the higher the probability for $\\mathbf{x}$ belonging to class $c$.\n", "Formally, we can simply use a softmax over the distances of $\\mathbf{x}$ to all class prototypes:\n", "\n", "$$p(y=c\\vert\\mathbf{x})=\\text{softmax}(-d_{\\varphi}(f_{\\theta}(\\mathbf{x}), \\mathbf{v}_c))=\\frac{\\exp\\left(-d_{\\varphi}(f_{\\theta}(\\mathbf{x}), \\mathbf{v}_c)\\right)}{\\sum_{c'\\in \\mathcal{C}}\\exp\\left(-d_{\\varphi}(f_{\\theta}(\\mathbf{x}), \\mathbf{v}_{c'})\\right)}$$\n", "\n", "Note that the negative sign is necessary since we want to increase the probability for close-by vectors and have a low probability for distant vectors.\n", "We train the network $f_{\\theta}$ based on the cross entropy error of the training query set examples.\n", "Thereby, the gradient flows through both the prototypes $\\mathbf{v}_c$ and the query set encodings $f_{\\theta}(\\mathbf{x})$.\n", "For the distance function $d_{\\varphi}$, we can choose any function as long as it is differentiable with respect to both of its inputs.\n", "The most common function, which we also use here, is the squared\n", "euclidean distance, but there has been several works on different\n", "distance functions as well."]}, {"cell_type": "markdown", "id": "d400bfc2", "metadata": {"papermill": {"duration": 0.042184, "end_time": "2021-10-10T16:36:39.384014", "exception": false, "start_time": "2021-10-10T16:36:39.341830", "status": "completed"}, "tags": []}, "source": ["### ProtoNet implementation"]}, {"cell_type": "markdown", "id": "a10ef367", "metadata": {"lines_to_next_cell": 2, "papermill": 
{"duration": 0.042386, "end_time": "2021-10-10T16:36:39.468678", "exception": false, "start_time": "2021-10-10T16:36:39.426292", "status": "completed"}, "tags": []}, "source": ["Now that we know how a ProtoNet works in principle, let's look at how we can apply it to our specific problem of few-shot image classification, and implement it below.\n", "First, we need to define the encoder function $f_{\\theta}$.\n", "Since we work with CIFAR images, we can take a look back at Tutorial 5 where we compared common Computer Vision architectures, and choose one of the best performing ones.\n", "Here, we go with a DenseNet since it is in general more parameter efficient than ResNet.\n", "Luckily, we do not need to implement DenseNet ourselves again and can rely on torchvision's model package instead.\n", "We use common hyperparameters of 64 initial feature channels, add 32 per block, and use a bottleneck size of 64 (i.e. 2 times the growth rate).\n", "We use 4 stages of 6 layers each, which results in overall about 1 million parameters.\n", "Note that the torchvision package assumes that the last layer is used for classification and hence calls its output size `num_classes`.\n", "However, we can instead just use it as the feature space of ProtoNet, and choose an arbitrary dimensionality.\n", "We will use the same network for other algorithms in this notebook to ensure a fair comparison."]}, {"cell_type": "code", "execution_count": 16, "id": "2ba373cc", "metadata": {"execution": {"iopub.execute_input": "2021-10-10T16:36:39.567463Z", "iopub.status.busy": "2021-10-10T16:36:39.566989Z", "iopub.status.idle": "2021-10-10T16:36:39.569062Z", "shell.execute_reply": "2021-10-10T16:36:39.568593Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 0.056702, "end_time": "2021-10-10T16:36:39.569165", "exception": false, "start_time": "2021-10-10T16:36:39.512463", "status": "completed"}, "tags": []}, "outputs": [], "source": ["def get_convnet(output_size):\n", " convnet = 
torchvision.models.DenseNet(\n", " growth_rate=32,\n", " block_config=(6, 6, 6, 6),\n", " bn_size=2,\n", " num_init_features=64,\n", " num_classes=output_size, # Output dimensionality\n", " )\n", " return convnet"]}, {"cell_type": "markdown", "id": "50da6f0b", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.042572, "end_time": "2021-10-10T16:36:39.654722", "exception": false, "start_time": "2021-10-10T16:36:39.612150", "status": "completed"}, "tags": []}, "source": ["Next, we can look at implementing ProtoNet.\n", "We will define it as PyTorch Lightning module to use all functionalities of PyTorch Lightning.\n", "The first step during training is to encode all images in a batch with our network.\n", "Next, we calculate the class prototypes from the support set (function `calculate_prototypes`), and classify the query set examples according to the prototypes (function `classify_feats`).\n", "Keep in mind that we use the data sampling described before, such that the support and query set are stacked together in the batch.\n", "Thus, we use our previously defined function `split_batch` to split them apart.\n", "The full code can be found below."]}, {"cell_type": "code", "execution_count": 17, "id": "08c3adca", "metadata": {"execution": {"iopub.execute_input": "2021-10-10T16:36:39.751136Z", "iopub.status.busy": "2021-10-10T16:36:39.750647Z", "iopub.status.idle": "2021-10-10T16:36:39.752752Z", "shell.execute_reply": "2021-10-10T16:36:39.752285Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 0.055843, "end_time": "2021-10-10T16:36:39.752853", "exception": false, "start_time": "2021-10-10T16:36:39.697010", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class ProtoNet(pl.LightningModule):\n", " def __init__(self, proto_dim, lr):\n", " \"\"\"Inputs.\n", "\n", " proto_dim - Dimensionality of prototype feature space\n", " lr - Learning rate of Adam optimizer\n", " \"\"\"\n", " super().__init__()\n", " self.save_hyperparameters()\n", " 
self.model = get_convnet(output_size=self.hparams.proto_dim)\n", "\n", " def configure_optimizers(self):\n", " optimizer = optim.AdamW(self.parameters(), lr=self.hparams.lr)\n", " scheduler = optim.lr_scheduler.MultiStepLR(optimizer, milestones=[140, 180], gamma=0.1)\n", " return [optimizer], [scheduler]\n", "\n", " @staticmethod\n", " def calculate_prototypes(features, targets):\n", " # Given a stack of features vectors and labels, return class prototypes\n", " # features - shape [N, proto_dim], targets - shape [N]\n", " classes, _ = torch.unique(targets).sort() # Determine which classes we have\n", " prototypes = []\n", " for c in classes:\n", " p = features[torch.where(targets == c)[0]].mean(dim=0) # Average class feature vectors\n", " prototypes.append(p)\n", " prototypes = torch.stack(prototypes, dim=0)\n", " # Return the 'classes' tensor to know which prototype belongs to which class\n", " return prototypes, classes\n", "\n", " def classify_feats(self, prototypes, classes, feats, targets):\n", " # Classify new examples with prototypes and return classification error\n", " dist = torch.pow(prototypes[None, :] - feats[:, None], 2).sum(dim=2) # Squared euclidean distance\n", " preds = F.log_softmax(-dist, dim=1)\n", " labels = (classes[None, :] == targets[:, None]).long().argmax(dim=-1)\n", " acc = (preds.argmax(dim=1) == labels).float().mean()\n", " return preds, labels, acc\n", "\n", " def calculate_loss(self, batch, mode):\n", " # Determine training loss for a given support and query set\n", " imgs, targets = batch\n", " features = self.model(imgs) # Encode all images of support and query set\n", " support_feats, query_feats, support_targets, query_targets = split_batch(features, targets)\n", " prototypes, classes = ProtoNet.calculate_prototypes(support_feats, support_targets)\n", " preds, labels, acc = self.classify_feats(prototypes, classes, query_feats, query_targets)\n", " loss = F.cross_entropy(preds, labels)\n", "\n", " self.log(\"%s_loss\" % mode, 
loss)\n", " self.log(\"%s_acc\" % mode, acc)\n", " return loss\n", "\n", " def training_step(self, batch, batch_idx):\n", " return self.calculate_loss(batch, mode=\"train\")\n", "\n", " def validation_step(self, batch, batch_idx):\n", " self.calculate_loss(batch, mode=\"val\")"]}, {"cell_type": "markdown", "id": "1d28cde2", "metadata": {"papermill": {"duration": 0.042403, "end_time": "2021-10-10T16:36:39.837555", "exception": false, "start_time": "2021-10-10T16:36:39.795152", "status": "completed"}, "tags": []}, "source": ["For validation, we use the same principle as training and sample support and query sets from the hold-out 10 classes.\n", "However, this gives us noisy scores depending on which query sets are chosen to which support sets.\n", "This is why we will use a different strategy during testing.\n", "For validation, our training strategy is sufficient since it is much\n", "faster than testing, and gives a good estimate of the training\n", "generalization as long as we keep the support-query sets constant across\n", "validation iterations."]}, {"cell_type": "markdown", "id": "02222c05", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.042841, "end_time": "2021-10-10T16:36:39.923166", "exception": false, "start_time": "2021-10-10T16:36:39.880325", "status": "completed"}, "tags": []}, "source": ["### Training\n", "\n", "After implementing the model, we can already start training it.\n", "We use our common PyTorch Lightning training function, and train the model for 200 epochs.\n", "The training function takes `model_class` as input argument, i.e. 
the\n", "PyTorch Lightning module class that should be trained, since we will\n", "reuse this function for other algorithms as well."]}, {"cell_type": "code", "execution_count": 18, "id": "76c40dce", "metadata": {"execution": {"iopub.execute_input": "2021-10-10T16:36:40.014200Z", "iopub.status.busy": "2021-10-10T16:36:40.013719Z", "iopub.status.idle": "2021-10-10T16:36:40.015817Z", "shell.execute_reply": "2021-10-10T16:36:40.015348Z"}, "papermill": {"duration": 0.050208, "end_time": "2021-10-10T16:36:40.015917", "exception": false, "start_time": "2021-10-10T16:36:39.965709", "status": "completed"}, "tags": []}, "outputs": [], "source": ["def train_model(model_class, train_loader, val_loader, **kwargs):\n", " trainer = pl.Trainer(\n", " default_root_dir=os.path.join(CHECKPOINT_PATH, model_class.__name__),\n", " gpus=1 if str(device) == \"cuda:0\" else 0,\n", " max_epochs=200,\n", " callbacks=[\n", " ModelCheckpoint(save_weights_only=True, mode=\"max\", monitor=\"val_acc\"),\n", " LearningRateMonitor(\"epoch\"),\n", " ],\n", " progress_bar_refresh_rate=0,\n", " )\n", " trainer.logger._default_hp_metric = None\n", "\n", " # Check whether pretrained model exists. 
If yes, load it and skip training\n", " pretrained_filename = os.path.join(CHECKPOINT_PATH, model_class.__name__ + \".ckpt\")\n", " if os.path.isfile(pretrained_filename):\n", " print(\"Found pretrained model at %s, loading...\" % pretrained_filename)\n", " # Automatically loads the model with the saved hyperparameters\n", " model = model_class.load_from_checkpoint(pretrained_filename)\n", " else:\n", " pl.seed_everything(42) # To be reproducable\n", " model = model_class(**kwargs)\n", " trainer.fit(model, train_loader, val_loader)\n", " model = model_class.load_from_checkpoint(\n", " trainer.checkpoint_callback.best_model_path\n", " ) # Load best checkpoint after training\n", "\n", " return model"]}, {"cell_type": "markdown", "id": "6bd74652", "metadata": {"papermill": {"duration": 0.043123, "end_time": "2021-10-10T16:36:40.102077", "exception": false, "start_time": "2021-10-10T16:36:40.058954", "status": "completed"}, "tags": []}, "source": ["Below is the training call for our ProtoNet.\n", "We use a 64-dimensional feature space.\n", "Larger feature spaces showed to give noisier results since the squared euclidean distance becomes proportionally larger in expectation, and smaller feature spaces might not allow for enough flexibility.\n", "We recommend to load the pre-trained model here at first, but feel free\n", "to play around with the hyperparameters yourself."]}, {"cell_type": "code", "execution_count": 19, "id": "91cae9d3", "metadata": {"execution": {"iopub.execute_input": "2021-10-10T16:36:40.192927Z", "iopub.status.busy": "2021-10-10T16:36:40.192456Z", "iopub.status.idle": "2021-10-10T16:36:40.257180Z", "shell.execute_reply": "2021-10-10T16:36:40.256698Z"}, "papermill": {"duration": 0.1128, "end_time": "2021-10-10T16:36:40.257291", "exception": false, "start_time": "2021-10-10T16:36:40.144491", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["GPU available: True, used: True\n"]}, {"name": "stderr", 
"output_type": "stream", "text": ["TPU available: False, using: 0 TPU cores\n"]}, {"name": "stderr", "output_type": "stream", "text": ["IPU available: False, using: 0 IPUs\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Found pretrained model at saved_models/MetaLearning/ProtoNet.ckpt, loading...\n"]}], "source": ["protonet_model = train_model(\n", " ProtoNet, proto_dim=64, lr=2e-4, train_loader=train_data_loader, val_loader=val_data_loader\n", ")"]}, {"cell_type": "markdown", "id": "92207f47", "metadata": {"papermill": {"duration": 0.043516, "end_time": "2021-10-10T16:36:40.344935", "exception": false, "start_time": "2021-10-10T16:36:40.301419", "status": "completed"}, "tags": []}, "source": ["We can also take a closer look at the TensorBoard below."]}, {"cell_type": "code", "execution_count": 20, "id": "7b2883ee", "metadata": {"execution": {"iopub.execute_input": "2021-10-10T16:36:40.435675Z", "iopub.status.busy": "2021-10-10T16:36:40.435210Z", "iopub.status.idle": "2021-10-10T16:36:40.437301Z", "shell.execute_reply": "2021-10-10T16:36:40.436898Z"}, "papermill": {"duration": 0.048812, "end_time": "2021-10-10T16:36:40.437398", "exception": false, "start_time": "2021-10-10T16:36:40.388586", "status": "completed"}, "tags": []}, "outputs": [], "source": ["# Opens tensorboard in notebook. Adjust the path to your CHECKPOINT_PATH if needed\n", "# # %tensorboard --logdir ../saved_models/tutorial16/tensorboards/ProtoNet/"]}, {"cell_type": "markdown", "id": "a96395e2", "metadata": {"papermill": {"duration": 0.043172, "end_time": "2021-10-10T16:36:40.524550", "exception": false, "start_time": "2021-10-10T16:36:40.481378", "status": "completed"}, "tags": []}, "source": ["
\n", "\n", "In contrast to standard supervised learning, we see that ProtoNet does not overfit as much as we would expect.\n", "The validation accuracy is of course lower than the average training, but the training loss does not stick close to zero.\n", "This is because no training batch is as the other, and we also mix new examples in the support set and query set.\n", "This gives us slightly different prototypes in every iteration, and makes it harder for the network to fully overfit."]}, {"cell_type": "markdown", "id": "fe724d6e", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.043726, "end_time": "2021-10-10T16:36:40.611913", "exception": false, "start_time": "2021-10-10T16:36:40.568187", "status": "completed"}, "tags": []}, "source": ["### Testing\n", "\n", "Our goal of meta-learning is to obtain a model that can quickly adapt to a new task, or in this case, new classes to distinguish between.\n", "To test this, we will use our trained ProtoNet and adapt it to the 10 test classes.\n", "Thereby, we pick $k$ examples per class from which we determine the prototypes, and test the classification accuracy on all other examples.\n", "This can be seen as using the $k$ examples per class as support set, and the rest of the dataset as a query set.\n", "We iterate through the dataset such that each example has been once included in a support set.\n", "The average performance over all support sets tells us how well we can expect ProtoNet to perform when seeing only $k$ examples per class.\n", "During training, we used $k=4$.\n", "In testing, we will experiment with $k=\\{2,4,8,16,32\\}$ to get a better sense of how $k$ influences the results.\n", "We would expect that we achieve higher accuracies the more examples we have in the support set, but we don't know how it scales.\n", "Hence, let's first implement a function that executes the testing procedure for a given $k$:"]}, {"cell_type": "code", "execution_count": 21, "id": "9e43469f", "metadata": 
{"execution": {"iopub.execute_input": "2021-10-10T16:36:40.708839Z", "iopub.status.busy": "2021-10-10T16:36:40.706609Z", "iopub.status.idle": "2021-10-10T16:36:40.710916Z", "shell.execute_reply": "2021-10-10T16:36:40.710471Z"}, "papermill": {"duration": 0.055241, "end_time": "2021-10-10T16:36:40.711017", "exception": false, "start_time": "2021-10-10T16:36:40.655776", "status": "completed"}, "tags": []}, "outputs": [], "source": ["@torch.no_grad()\n", "def test_proto_net(model, dataset, data_feats=None, k_shot=4):\n", " \"\"\"Inputs.\n", "\n", " model - Pretrained ProtoNet model\n", " dataset - The dataset on which the test should be performed.\n", " Should be instance of ImageDataset\n", " data_feats - The encoded features of all images in the dataset.\n", " If None, they will be newly calculated, and returned\n", " for later usage.\n", " k_shot - Number of examples per class in the support set.\n", " \"\"\"\n", " model = model.to(device)\n", " model.eval()\n", " num_classes = dataset.targets.unique().shape[0]\n", " exmps_per_class = dataset.targets.shape[0] // num_classes # We assume uniform example distribution here\n", "\n", " # The encoder network remains unchanged across k-shot settings. 
Hence, we only need\n", " # to extract the features for all images once.\n", " if data_feats is None:\n", " # Dataset preparation\n", " dataloader = data.DataLoader(dataset, batch_size=128, num_workers=4, shuffle=False, drop_last=False)\n", "\n", " img_features = []\n", " img_targets = []\n", " for imgs, targets in tqdm(dataloader, \"Extracting image features\", leave=False):\n", " imgs = imgs.to(device)\n", " feats = model.model(imgs)\n", " img_features.append(feats.detach().cpu())\n", " img_targets.append(targets)\n", " img_features = torch.cat(img_features, dim=0)\n", " img_targets = torch.cat(img_targets, dim=0)\n", " # Sort by classes, so that we obtain tensors of shape [num_classes, exmps_per_class, ...]\n", " # Makes it easier to process later\n", " img_targets, sort_idx = img_targets.sort()\n", " img_targets = img_targets.reshape(num_classes, exmps_per_class).transpose(0, 1)\n", " img_features = img_features[sort_idx].reshape(num_classes, exmps_per_class, -1).transpose(0, 1)\n", " else:\n", " img_features, img_targets = data_feats\n", "\n", " # We iterate through the full dataset in two manners. 
First, to select the k-shot batch.\n", " # Second, the evaluate the model on all other examples\n", " accuracies = []\n", " for k_idx in tqdm(range(0, img_features.shape[0], k_shot), \"Evaluating prototype classification\", leave=False):\n", " # Select support set and calculate prototypes\n", " k_img_feats = img_features[k_idx : k_idx + k_shot].flatten(0, 1)\n", " k_targets = img_targets[k_idx : k_idx + k_shot].flatten(0, 1)\n", " prototypes, proto_classes = model.calculate_prototypes(k_img_feats, k_targets)\n", " # Evaluate accuracy on the rest of the dataset\n", " batch_acc = 0\n", " for e_idx in range(0, img_features.shape[0], k_shot):\n", " if k_idx == e_idx: # Do not evaluate on the support set examples\n", " continue\n", " e_img_feats = img_features[e_idx : e_idx + k_shot].flatten(0, 1)\n", " e_targets = img_targets[e_idx : e_idx + k_shot].flatten(0, 1)\n", " _, _, acc = model.classify_feats(prototypes, proto_classes, e_img_feats, e_targets)\n", " batch_acc += acc.item()\n", " batch_acc /= img_features.shape[0] // k_shot - 1\n", " accuracies.append(batch_acc)\n", "\n", " return (mean(accuracies), stdev(accuracies)), (img_features, img_targets)"]}, {"cell_type": "markdown", "id": "e8adff5f", "metadata": {"papermill": {"duration": 0.043398, "end_time": "2021-10-10T16:36:40.798077", "exception": false, "start_time": "2021-10-10T16:36:40.754679", "status": "completed"}, "tags": []}, "source": ["Testing ProtoNet is relatively quick if we have processed all images once. 
Hence, we can do in this notebook:"]}, {"cell_type": "code", "execution_count": 22, "id": "6b522e34", "metadata": {"execution": {"iopub.execute_input": "2021-10-10T16:36:40.891051Z", "iopub.status.busy": "2021-10-10T16:36:40.890582Z", "iopub.status.idle": "2021-10-10T16:37:25.334685Z", "shell.execute_reply": "2021-10-10T16:37:25.334200Z"}, "papermill": {"duration": 44.492916, "end_time": "2021-10-10T16:37:25.334799", "exception": false, "start_time": "2021-10-10T16:36:40.841883", "status": "completed"}, "tags": []}, "outputs": [{"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "59b3b0d90a7548ae8ec79d1fb1aa783e", "version_major": 2, "version_minor": 0}, "text/plain": ["Extracting image features: 0%| | 0/47 [00:00\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-10-10T18:37:25.755286\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}], "source": ["ax = plot_few_shot(protonet_accuracies, name=\"ProtoNet\", color=\"C1\")\n", "plt.show()\n", "plt.close()"]}, {"cell_type": "markdown", "id": "d99265a0", "metadata": {"papermill": {"duration": 0.04916, "end_time": "2021-10-10T16:37:26.050508", "exception": false, "start_time": "2021-10-10T16:37:26.001348", "status": "completed"}, "tags": []}, "source": ["As we initially expected, the performance of ProtoNet indeed increases the more samples we have.\n", "However, even with just two samples per class, we classify almost half of the images correctly, which is well above random accuracy (10%).\n", "The curve shows an exponentially dampend trend, meaning that adding 2 extra examples to $k=2$ has a much higher impact than adding 2 extra samples if we already have $k=16$.\n", "Nonetheless, we can say that ProtoNet adapts fairly well to new classes."]}, {"cell_type": "markdown", "id": "41e5a54a", "metadata": {"papermill": {"duration": 0.05058, "end_time": "2021-10-10T16:37:26.152476", "exception": false, "start_time": "2021-10-10T16:37:26.101896", "status": "completed"}, "tags": []}, "source": ["## MAML and ProtoMAML\n", "\n", "
"]}, {"cell_type": "markdown", "id": "209a64ec", "metadata": {"papermill": {"duration": 0.051648, "end_time": "2021-10-10T16:37:26.254669", "exception": false, "start_time": "2021-10-10T16:37:26.203021", "status": "completed"}, "tags": []}, "source": ["The second meta-learning algorithm we will look at is MAML, short for Model-Agnostic Meta-Learning.\n", "MAML is an optimization-based meta-learning algorithm, which means that it tries to adjust the standard optimization procedure to a few-shot setting.\n", "The idea of MAML is relatively simple: given a model, support and query set during training, we optimize the model for $m$ steps on the support set, and evaluate the gradients of the query loss with respect to the original model's parameters.\n", "For the same model, we do it for a few different support-query sets and accumulate the gradients.\n", "This results in learning a model that provides a good initialization for being quickly adapted to the training tasks.\n", "If we denote the model parameters with $\\theta$, we can visualize the procedure as follows (Figure credit - [Finn et al. ](http://proceedings.mlr.press/v70/finn17a.html)).\n", "\n", "
"]}, {"cell_type": "markdown", "id": "d0f6ca26", "metadata": {"papermill": {"duration": 0.049624, "end_time": "2021-10-10T16:37:26.354505", "exception": false, "start_time": "2021-10-10T16:37:26.304881", "status": "completed"}, "tags": []}, "source": ["The full algorithm of MAML is therefore as follows.\n", "At each training step, we sample a batch of tasks, i.e., a batch of support-query set pairs.\n", "For each task $\\mathcal{T}_i$, we optimize a model $f_{\\theta}$ on the support set via SGD, and denote this model as $f_{\\theta_i'}$.\n", "We refer to this optimization as _inner loop_.\n", "Using this new model, we calculate the gradients of the original parameters, $\\theta$, with respect to the query loss on $f_{\\theta_i'}$.\n", "These gradients are accumulated over all tasks, and used to update $\\theta$.\n", "This is called _outer loop_ since we iterate over tasks.\n", "The full MAML algorithm is summarized below (Figure credit - [Finn et al. ](http://proceedings.mlr.press/v70/finn17a.html)).\n", "\n", "
"]}, {"cell_type": "markdown", "id": "1555184d", "metadata": {"papermill": {"duration": 0.049633, "end_time": "2021-10-10T16:37:26.455355", "exception": false, "start_time": "2021-10-10T16:37:26.405722", "status": "completed"}, "tags": []}, "source": ["To obtain gradients for the initial parameters $\\theta$ from the optimized model $f_{\\theta_i'}$, we actually need second-order gradients, i.e. gradients of gradients, as the support set gradients depend on $\\theta$ as well.\n", "This makes MAML computationally expensive, especially when using mulitple inner loop steps.\n", "A simpler, yet almost equally well performing alternative is First-Order MAML (FOMAML) which only uses first-order gradients.\n", "This means that the second-order gradients are ignored, and we can calculate the outer loop gradients (line 10 in algorithm 2) simply by calculating the gradients with respect to $\\theta_i'$, and use those as update to $\\theta$.\n", "Hence, the new update rule becomes:\n", "$$\\theta\\leftarrow\\theta-\\beta\\sum_{\\mathcal{T}_i\\sim p(\\mathcal{T})}\\nabla_{\\theta_i'}\\mathcal{L}_{\\mathcal{T}_i}(f_{\\theta_i'})$$\n", "Note the change of $\\theta$ to $\\theta_i'$ for $\\nabla$."]}, {"cell_type": "markdown", "id": "fcef41fa", "metadata": {"papermill": {"duration": 0.050818, "end_time": "2021-10-10T16:37:26.556682", "exception": false, "start_time": "2021-10-10T16:37:26.505864", "status": "completed"}, "tags": []}, "source": ["### ProtoMAML\n", "\n", "A problem of MAML is how to design the output classification layer.\n", "In case all tasks have different number of classes, we need to initialize the output layer with zeros or randomly in every iteration.\n", "Even if we always have the same number of classes, we just start from random predictions.\n", "This requires several inner loop steps to reach a reasonable classification result.\n", "To overcome this problem, Triantafillou et al.\n", "(2020) propose to combine the merits of Prototypical Networks and 
MAML.\n", "Specifically, we can use prototypes to initialize our output layer to have a strong initialization.\n", "Thereby, it can be shown that the softmax over euclidean distances can be reformulated as a linear layer with softmax.\n", "To see this, let's first write out the negative euclidean distance between a feature vector $f_{\\theta}(\\mathbf{x}^{*})$ of a new data point $\\mathbf{x}^{*}$ to a prototype $\\mathbf{v}_c$ of class $c$:\n", "$$\n", "-||f_{\\theta}(\\mathbf{x}^{*})-\\mathbf{v}_c||^2=-f_{\\theta}(\\mathbf{x}^{*})^Tf_{\\theta}(\\mathbf{x}^{*})+2\\mathbf{v}_c^{T}f_{\\theta}(\\mathbf{x}^{*})-\\mathbf{v}_c^T\\mathbf{v}_c\n", "$$\n", "\n", "We perform the classification across all classes $c\\in\\mathcal{C}$ and take a softmax on the distance.\n", "Hence, any term that is same for all classes can be removed without changing the output probabilities.\n", "In the equation above, this is true for $-f_{\\theta}(\\mathbf{x}^{*})^Tf_{\\theta}(\\mathbf{x}^{*})$ since it is independent of any class prototype.\n", "Thus, we can write:\n", "\n", "$$\n", "-||f_{\\theta}(\\mathbf{x}^{*})-\\mathbf{v}_c||^2=2\\mathbf{v}_c^{T}f_{\\theta}(\\mathbf{x}^{*})-||\\mathbf{v}_c||^2+\\text{constant}\n", "$$\n", "\n", "Taking a second look at the equation above, it looks a lot like a linear layer.\n", "For this, we use $\\mathbf{W}_{c,\\cdot}=2\\mathbf{v}_c$ and $b_c=-||\\mathbf{v}_c||^2$ which gives us the linear layer $\\mathbf{W}f_{\\theta}(\\mathbf{x}^{*})+\\mathbf{b}$.\n", "Hence, if we initialize the output weight with twice the prototypes, and the biases by the negative squared L2 norm of the prototypes, we start with a Prototypical Network.\n", "MAML allows us to adapt this layer and the rest of the network further.\n", "\n", "In the following, we will implement First-Order ProtoMAML for few-shot classification.\n", "The implementation of MAML would be the same except the output layer initialization."]}, {"cell_type": "markdown", "id": "352f15a0", "metadata": 
{"lines_to_next_cell": 2, "papermill": {"duration": 0.050087, "end_time": "2021-10-10T16:37:26.657875", "exception": false, "start_time": "2021-10-10T16:37:26.607788", "status": "completed"}, "tags": []}, "source": ["### ProtoMAML implementation\n", "\n", "For implementing ProtoMAML, we can follow Algorithm 2 with minor modifications.\n", "At each training step, we first sample a batch of tasks, and a support and query set for each task.\n", "In our case of few-shot classification, this means that we simply sample multiple support-query set pairs from our sampler.\n", "For each task, we finetune our current model on the support set.\n", "However, since we need to remember the original parameters for the other tasks, the outer loop gradient update and future training steps, we need to create a copy of our model, and finetune only the copy.\n", "We can copy a model by using standard Python functions like `deepcopy`.\n", "The inner loop is implemented in the function `adapt_few_shot` in the PyTorch Lightning module below.\n", "\n", "After finetuning the model, we apply it on the query set and calculate the first-order gradients with respect to the original parameters $\\theta$.\n", "In contrast to simple MAML, we also have to consider the gradients with respect to the output layer initialization, i.e. the prototypes, since they directly rely on $\\theta$.\n", "To realize this efficiently, we take two steps.\n", "First, we calculate the prototypes by applying the original model, i.e. 
not the copied model, on the support elements.\n", "When initializing the output layer, we detach the prototypes to stop the gradients.\n", "This is because in the inner loop itself, we do not want to consider gradients through the prototypes back to the original model.\n", "However, after the inner loop is finished, we re-attach the computation graph of the prototypes by writing `output_weight = (output_weight - init_weight).detach() + init_weight`.\n", "While this line does not change the value of the variable `output_weight`, it adds its dependency on the prototype initialization `init_weight`.\n", "Thus, if we call `.backward` on `output_weight`, we will automatically calculate the first-order gradients with respect to the prototype initialization in the original model.\n", "\n", "After calculating all gradients and summing them together in the original model, we can take a standard optimizer step.\n", "PyTorch Lightning's method is however designed to return a loss-tensor on which we call `.backward` first.\n", "Since this is not possible here, we need to perform the optimization step ourselves.\n", "All details can be found in the code below.\n", "\n", "For implementing (Proto-)MAML with second-order gradients, it is recommended to use libraries such as [$\\nabla$higher](https://github.com/facebookresearch/higher) from Facebook AI Research.\n", "For simplicity, we stick with first-order methods here."]}, {"cell_type": "code", "execution_count": 25, "id": "7fb5c1c7", "metadata": {"execution": {"iopub.execute_input": "2021-10-10T16:37:26.777531Z", "iopub.status.busy": "2021-10-10T16:37:26.774558Z", "iopub.status.idle": "2021-10-10T16:37:26.779554Z", "shell.execute_reply": "2021-10-10T16:37:26.779118Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 0.070015, "end_time": "2021-10-10T16:37:26.779661", "exception": false, "start_time": "2021-10-10T16:37:26.709646", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class 
ProtoMAML(pl.LightningModule):\n", " def __init__(self, proto_dim, lr, lr_inner, lr_output, num_inner_steps):\n", " \"\"\"Inputs.\n", "\n", " proto_dim - Dimensionality of prototype feature space\n", " lr - Learning rate of the outer loop Adam optimizer\n", " lr_inner - Learning rate of the inner loop SGD optimizer\n", " lr_output - Learning rate for the output layer in the inner loop\n", " num_inner_steps - Number of inner loop updates to perform\n", " \"\"\"\n", " super().__init__()\n", " self.save_hyperparameters()\n", " self.model = get_convnet(output_size=self.hparams.proto_dim)\n", "\n", " def configure_optimizers(self):\n", " optimizer = optim.AdamW(self.parameters(), lr=self.hparams.lr)\n", " scheduler = optim.lr_scheduler.MultiStepLR(optimizer, milestones=[140, 180], gamma=0.1)\n", " return [optimizer], [scheduler]\n", "\n", " def run_model(self, local_model, output_weight, output_bias, imgs, labels):\n", " # Execute a model with given output layer weights and inputs\n", " feats = local_model(imgs)\n", " preds = F.linear(feats, output_weight, output_bias)\n", " loss = F.cross_entropy(preds, labels)\n", " acc = (preds.argmax(dim=1) == labels).float()\n", " return loss, preds, acc\n", "\n", " def adapt_few_shot(self, support_imgs, support_targets):\n", " # Determine prototype initialization\n", " support_feats = self.model(support_imgs)\n", " prototypes, classes = ProtoNet.calculate_prototypes(support_feats, support_targets)\n", " support_labels = (classes[None, :] == support_targets[:, None]).long().argmax(dim=-1)\n", " # Create inner-loop model and optimizer\n", " local_model = deepcopy(self.model)\n", " local_model.train()\n", " local_optim = optim.SGD(local_model.parameters(), lr=self.hparams.lr_inner)\n", " local_optim.zero_grad()\n", " # Create output layer weights with prototype-based initialization\n", " init_weight = 2 * prototypes\n", " init_bias = -torch.norm(prototypes, dim=1) ** 2\n", " output_weight = init_weight.detach().requires_grad_()\n", " 
output_bias = init_bias.detach().requires_grad_()\n", "\n", " # Optimize inner loop model on support set\n", " for _ in range(self.hparams.num_inner_steps):\n", " # Determine loss on the support set\n", " loss, _, _ = self.run_model(local_model, output_weight, output_bias, support_imgs, support_labels)\n", " # Calculate gradients and perform inner loop update\n", " loss.backward()\n", " local_optim.step()\n", " # Update output layer via SGD\n", " output_weight.data -= self.hparams.lr_output * output_weight.grad\n", " output_bias.data -= self.hparams.lr_output * output_bias.grad\n", " # Reset gradients\n", " local_optim.zero_grad()\n", " output_weight.grad.fill_(0)\n", " output_bias.grad.fill_(0)\n", "\n", " # Re-attach computation graph of prototypes\n", " output_weight = (output_weight - init_weight).detach() + init_weight\n", " output_bias = (output_bias - init_bias).detach() + init_bias\n", "\n", " return local_model, output_weight, output_bias, classes\n", "\n", " def outer_loop(self, batch, mode=\"train\"):\n", " accuracies = []\n", " losses = []\n", " self.model.zero_grad()\n", "\n", " # Determine gradients for batch of tasks\n", " for task_batch in batch:\n", " imgs, targets = task_batch\n", " support_imgs, query_imgs, support_targets, query_targets = split_batch(imgs, targets)\n", " # Perform inner loop adaptation\n", " local_model, output_weight, output_bias, classes = self.adapt_few_shot(support_imgs, support_targets)\n", " # Determine loss of query set\n", " query_labels = (classes[None, :] == query_targets[:, None]).long().argmax(dim=-1)\n", " loss, preds, acc = self.run_model(local_model, output_weight, output_bias, query_imgs, query_labels)\n", " # Calculate gradients for query set loss\n", " if mode == \"train\":\n", " loss.backward()\n", "\n", " for p_global, p_local in zip(self.model.parameters(), local_model.parameters()):\n", " p_global.grad += p_local.grad # First-order approx. 
-> add gradients of finetuned and base model\n", "\n", " accuracies.append(acc.mean().detach())\n", " losses.append(loss.detach())\n", "\n", " # Perform update of base model\n", " if mode == \"train\":\n", " opt = self.optimizers()\n", " opt.step()\n", " opt.zero_grad()\n", "\n", " self.log(\"%s_loss\" % mode, sum(losses) / len(losses))\n", " self.log(\"%s_acc\" % mode, sum(accuracies) / len(accuracies))\n", "\n", " def training_step(self, batch, batch_idx):\n", " self.outer_loop(batch, mode=\"train\")\n", " return None # Returning None means we skip the default training optimizer steps by PyTorch Lightning\n", "\n", " def validation_step(self, batch, batch_idx):\n", " # Validation requires to finetune a model, hence we need to enable gradients\n", " torch.set_grad_enabled(True)\n", " self.outer_loop(batch, mode=\"val\")\n", " torch.set_grad_enabled(False)"]}, {"cell_type": "markdown", "id": "175f6c04", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.049445, "end_time": "2021-10-10T16:37:26.879819", "exception": false, "start_time": "2021-10-10T16:37:26.830374", "status": "completed"}, "tags": []}, "source": ["### Training\n", "\n", "To train ProtoMAML, we need to change our sampling slightly.\n", "Instead of a single support-query set batch, we need to sample multiple.\n", "To implement this, we use yet another Sampler which combines multiple batches from a `FewShotBatchSampler`, and returns it afterwards.\n", "Additionally, we define a `collate_fn` for our data loader which takes the stack of support-query set images, and returns the tasks as a list.\n", "This makes it easier to process in our PyTorch Lightning module defined before.\n", "The implementation of the sampler can be found below."]}, {"cell_type": "code", "execution_count": 26, "id": "a64ff4e8", "metadata": {"execution": {"iopub.execute_input": "2021-10-10T16:37:26.989336Z", "iopub.status.busy": "2021-10-10T16:37:26.988844Z", "iopub.status.idle": "2021-10-10T16:37:26.990910Z", 
"shell.execute_reply": "2021-10-10T16:37:26.990506Z"}, "papermill": {"duration": 0.059649, "end_time": "2021-10-10T16:37:26.991013", "exception": false, "start_time": "2021-10-10T16:37:26.931364", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class TaskBatchSampler:\n", " def __init__(self, dataset_targets, batch_size, N_way, K_shot, include_query=False, shuffle=True):\n", " \"\"\"\n", " Inputs:\n", " dataset_targets - PyTorch tensor of the labels of the data elements.\n", " batch_size - Number of tasks to aggregate in a batch\n", " N_way - Number of classes to sample per batch.\n", " K_shot - Number of examples to sample per class in the batch.\n", " include_query - If True, returns batch of size N_way*K_shot*2, which\n", " can be split into support and query set. Simplifies\n", " the implementation of sampling the same classes but\n", " distinct examples for support and query set.\n", " shuffle - If True, examples and classes are newly shuffled in each\n", " iteration (for training)\n", " \"\"\"\n", " super().__init__()\n", " self.batch_sampler = FewShotBatchSampler(dataset_targets, N_way, K_shot, include_query, shuffle)\n", " self.task_batch_size = batch_size\n", " self.local_batch_size = self.batch_sampler.batch_size\n", "\n", " def __iter__(self):\n", " # Aggregate multiple batches before returning the indices\n", " batch_list = []\n", " for batch_idx, batch in enumerate(self.batch_sampler):\n", " batch_list.extend(batch)\n", " if (batch_idx + 1) % self.task_batch_size == 0:\n", " yield batch_list\n", " batch_list = []\n", "\n", " def __len__(self):\n", " return len(self.batch_sampler) // self.task_batch_size\n", "\n", " def get_collate_fn(self):\n", " # Returns a collate function that converts one big tensor into a list of task-specific tensors\n", " def collate_fn(item_list):\n", " imgs = torch.stack([img for img, target in item_list], dim=0)\n", " targets = torch.stack([target for img, target in item_list], dim=0)\n", " imgs = 
imgs.chunk(self.task_batch_size, dim=0)\n", " targets = targets.chunk(self.task_batch_size, dim=0)\n", " return list(zip(imgs, targets))\n", "\n", " return collate_fn"]}, {"cell_type": "markdown", "id": "a8e833ad", "metadata": {"papermill": {"duration": 0.050761, "end_time": "2021-10-10T16:37:27.091732", "exception": false, "start_time": "2021-10-10T16:37:27.040971", "status": "completed"}, "tags": []}, "source": ["With this sampler, the creation of the data loaders is straightforward.\n", "Note that since many images need to be loaded for a training batch, it is recommended to use fewer workers than usual."]}, {"cell_type": "code", "execution_count": 27, "id": "579696ce", "metadata": {"execution": {"iopub.execute_input": "2021-10-10T16:37:27.195877Z", "iopub.status.busy": "2021-10-10T16:37:27.195402Z", "iopub.status.idle": "2021-10-10T16:37:27.234232Z", "shell.execute_reply": "2021-10-10T16:37:27.233821Z"}, "papermill": {"duration": 0.092572, "end_time": "2021-10-10T16:37:27.234347", "exception": false, "start_time": "2021-10-10T16:37:27.141775", "status": "completed"}, "tags": []}, "outputs": [], "source": ["# Training constant (same as for ProtoNet)\n", "N_WAY = 5\n", "K_SHOT = 4\n", "\n", "# Training set\n", "train_protomaml_sampler = TaskBatchSampler(\n", " train_set.targets, include_query=True, N_way=N_WAY, K_shot=K_SHOT, batch_size=16\n", ")\n", "train_protomaml_loader = data.DataLoader(\n", " train_set, batch_sampler=train_protomaml_sampler, collate_fn=train_protomaml_sampler.get_collate_fn(), num_workers=2\n", ")\n", "\n", "# Validation set\n", "val_protomaml_sampler = TaskBatchSampler(\n", " val_set.targets,\n", " include_query=True,\n", " N_way=N_WAY,\n", " K_shot=K_SHOT,\n", " batch_size=1, # We do not update the parameters, hence the batch size is irrelevant here\n", " shuffle=False,\n", ")\n", "val_protomaml_loader = data.DataLoader(\n", " val_set, batch_sampler=val_protomaml_sampler, collate_fn=val_protomaml_sampler.get_collate_fn(), num_workers=2\n", 
")"]}, {"cell_type": "markdown", "id": "483d09a8", "metadata": {"papermill": {"duration": 0.04969, "end_time": "2021-10-10T16:37:27.335586", "exception": false, "start_time": "2021-10-10T16:37:27.285896", "status": "completed"}, "tags": []}, "source": ["Now, we are ready to train our ProtoMAML.\n", "We use the same feature space size as for ProtoNet, but can use a higher learning rate since the outer loop gradients are accumulated over 16 batches.\n", "The inner loop learning rate is set to 0.1, which is much higher than the outer loop lr because we use SGD in the inner loop instead of Adam.\n", "Commonly, the learning rate for the output layer is higher than the base model is the base model is very deep or pre-trained.\n", "However, for our setup, we observed no noticable impact of using a different learning rate than the base model.\n", "The number of inner loop updates is another crucial hyperparmaeter, and depends on the similarity of our training tasks.\n", "Since all tasks are on images from the same dataset, we notice that a single inner loop update achieves similar performance as 3 or 5 while training considerably faster.\n", "However, especially in RL and NLP, larger number of inner loop steps are often needed."]}, {"cell_type": "code", "execution_count": 28, "id": "f65be6c5", "metadata": {"execution": {"iopub.execute_input": "2021-10-10T16:37:27.441153Z", "iopub.status.busy": "2021-10-10T16:37:27.440678Z", "iopub.status.idle": "2021-10-10T16:37:27.503563Z", "shell.execute_reply": "2021-10-10T16:37:27.503082Z"}, "papermill": {"duration": 0.118168, "end_time": "2021-10-10T16:37:27.503674", "exception": false, "start_time": "2021-10-10T16:37:27.385506", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["GPU available: True, used: True\n"]}, {"name": "stderr", "output_type": "stream", "text": ["TPU available: False, using: 0 TPU cores\n"]}, {"name": "stderr", "output_type": "stream", "text": ["IPU available: 
False, using: 0 IPUs\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Found pretrained model at saved_models/MetaLearning/ProtoMAML.ckpt, loading...\n"]}], "source": ["protomaml_model = train_model(\n", " ProtoMAML,\n", " proto_dim=64,\n", " lr=1e-3,\n", " lr_inner=0.1,\n", " lr_output=0.1,\n", " num_inner_steps=1, # Often values between 1 and 10\n", " train_loader=train_protomaml_loader,\n", " val_loader=val_protomaml_loader,\n", ")"]}, {"cell_type": "markdown", "id": "8cc7c232", "metadata": {"papermill": {"duration": 0.049852, "end_time": "2021-10-10T16:37:27.604342", "exception": false, "start_time": "2021-10-10T16:37:27.554490", "status": "completed"}, "tags": []}, "source": ["Let's have a look at the training TensorBoard."]}, {"cell_type": "code", "execution_count": 29, "id": "8bdec8ea", "metadata": {"execution": {"iopub.execute_input": "2021-10-10T16:37:27.711240Z", "iopub.status.busy": "2021-10-10T16:37:27.710762Z", "iopub.status.idle": "2021-10-10T16:37:27.712848Z", "shell.execute_reply": "2021-10-10T16:37:27.712444Z"}, "papermill": {"duration": 0.05552, "end_time": "2021-10-10T16:37:27.712949", "exception": false, "start_time": "2021-10-10T16:37:27.657429", "status": "completed"}, "tags": []}, "outputs": [], "source": ["# Opens tensorboard in notebook. Adjust the path to your CHECKPOINT_PATH if needed\n", "# # %tensorboard --logdir ../saved_models/tutorial16/tensorboards/ProtoMAML/"]}, {"cell_type": "markdown", "id": "ffa8d4ab", "metadata": {"papermill": {"duration": 0.050609, "end_time": "2021-10-10T16:37:27.813989", "exception": false, "start_time": "2021-10-10T16:37:27.763380", "status": "completed"}, "tags": []}, "source": ["
\n", "\n", "One obvious difference to ProtoNet is that the loss curves look much less noisy.\n", "This is because we average the outer loop gradients over multiple tasks, and thus have a smoother training curve.\n", "Additionally, we only have 15k training iterations after 200 epochs.\n", "This is again because of the task batches, which cause 16 times less iterations.\n", "However, each iteration has seen 16 times more data in this experiment.\n", "Thus, we still have a fair comparison between ProtoMAML and ProtoNet.\n", "At first sight on the validation accuracy, one would assume that\n", "ProtoNet performs superior to ProtoMAML, but we have to verify that with\n", "proper testing below."]}, {"cell_type": "markdown", "id": "1ef9ae57", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.051235, "end_time": "2021-10-10T16:37:27.917147", "exception": false, "start_time": "2021-10-10T16:37:27.865912", "status": "completed"}, "tags": []}, "source": ["### Testing\n", "\n", "We test ProtoMAML in the same manner as ProtoNet, namely by picking random examples in the test set as support sets and use the rest of the dataset as query set.\n", "Instead of just calculating the prototypes for all examples, we need to finetune a separate model for each support set.\n", "This is why this process is more expensive than ProtoNet, and in our case, testing $k=\\{2,4,8,16,32\\}$ can take almost an hour.\n", "Hence, we provide evaluation files besides the pretrained models."]}, {"cell_type": "code", "execution_count": 30, "id": "24b90577", "metadata": {"execution": {"iopub.execute_input": "2021-10-10T16:37:28.039732Z", "iopub.status.busy": "2021-10-10T16:37:28.039190Z", "iopub.status.idle": "2021-10-10T16:37:28.041339Z", "shell.execute_reply": "2021-10-10T16:37:28.040864Z"}, "papermill": {"duration": 0.070613, "end_time": "2021-10-10T16:37:28.041443", "exception": false, "start_time": "2021-10-10T16:37:27.970830", "status": "completed"}, "tags": []}, "outputs": [], 
"source": ["def test_protomaml(model, dataset, k_shot=4):\n", " pl.seed_everything(42)\n", " model = model.to(device)\n", " num_classes = dataset.targets.unique().shape[0]\n", "\n", " # Data loader for full test set as query set\n", " full_dataloader = data.DataLoader(dataset, batch_size=128, num_workers=4, shuffle=False, drop_last=False)\n", " # Data loader for sampling support sets\n", " sampler = FewShotBatchSampler(\n", " dataset.targets, include_query=False, N_way=num_classes, K_shot=k_shot, shuffle=False, shuffle_once=False\n", " )\n", " sample_dataloader = data.DataLoader(dataset, batch_sampler=sampler, num_workers=2)\n", "\n", " # We iterate through the full dataset in two manners. First, to select the k-shot batch.\n", " # Second, the evaluate the model on all other examples\n", " accuracies = []\n", " for (support_imgs, support_targets), support_indices in tqdm(\n", " zip(sample_dataloader, sampler), \"Performing few-shot finetuning\"\n", " ):\n", " support_imgs = support_imgs.to(device)\n", " support_targets = support_targets.to(device)\n", " # Finetune new model on support set\n", " local_model, output_weight, output_bias, classes = model.adapt_few_shot(support_imgs, support_targets)\n", " with torch.no_grad(): # No gradients for query set needed\n", " local_model.eval()\n", " batch_acc = torch.zeros((0,), dtype=torch.float32, device=device)\n", " # Evaluate all examples in test dataset\n", " for query_imgs, query_targets in full_dataloader:\n", " query_imgs = query_imgs.to(device)\n", " query_targets = query_targets.to(device)\n", " query_labels = (classes[None, :] == query_targets[:, None]).long().argmax(dim=-1)\n", " _, _, acc = model.run_model(local_model, output_weight, output_bias, query_imgs, query_labels)\n", " batch_acc = torch.cat([batch_acc, acc.detach()], dim=0)\n", " # Exclude support set elements\n", " for s_idx in support_indices:\n", " batch_acc[s_idx] = 0\n", " batch_acc = batch_acc.sum().item() / (batch_acc.shape[0] - 
len(support_indices))\n", " accuracies.append(batch_acc)\n", " return mean(accuracies), stdev(accuracies)"]}, {"cell_type": "markdown", "id": "d580df69", "metadata": {"papermill": {"duration": 0.051584, "end_time": "2021-10-10T16:37:28.144161", "exception": false, "start_time": "2021-10-10T16:37:28.092577", "status": "completed"}, "tags": []}, "source": ["In contrast to training, it is recommended to use many more inner loop updates during testing.\n", "During training, we are not interested in getting the best model from the inner loop, but the model which can provide the best gradients.\n", "Hence, one update might be already sufficient in training, but for testing, it was often observed that a larger number of updates can give a considerable performance boost.\n", "Thus, we change the number of inner loop updates to 200 before testing."]}, {"cell_type": "code", "execution_count": 31, "id": "a3a77c03", "metadata": {"execution": {"iopub.execute_input": "2021-10-10T16:37:28.249335Z", "iopub.status.busy": "2021-10-10T16:37:28.248861Z", "iopub.status.idle": "2021-10-10T16:37:28.251118Z", "shell.execute_reply": "2021-10-10T16:37:28.250650Z"}, "papermill": {"duration": 0.056293, "end_time": "2021-10-10T16:37:28.251218", "exception": false, "start_time": "2021-10-10T16:37:28.194925", "status": "completed"}, "tags": []}, "outputs": [], "source": ["protomaml_model.hparams.num_inner_steps = 200"]}, {"cell_type": "markdown", "id": "5c8e75e8", "metadata": {"papermill": {"duration": 0.050389, "end_time": "2021-10-10T16:37:28.352727", "exception": false, "start_time": "2021-10-10T16:37:28.302338", "status": "completed"}, "tags": []}, "source": ["Now, we can test our model.\n", "For the pre-trained models, we provide a JSON file with the results to reduce evaluation time."]}, {"cell_type": "code", "execution_count": 32, "id": "a2ec75b4", "metadata": {"execution": {"iopub.execute_input": "2021-10-10T16:37:28.464792Z", "iopub.status.busy": "2021-10-10T16:37:28.464316Z", "iopub.status.idle": 
"2021-10-10T16:37:28.467735Z", "shell.execute_reply": "2021-10-10T16:37:28.467269Z"}, "papermill": {"duration": 0.059702, "end_time": "2021-10-10T16:37:28.467837", "exception": false, "start_time": "2021-10-10T16:37:28.408135", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Accuracy for k=2: 42.89% (+-3.82%)\n", "Accuracy for k=4: 52.27% (+-2.72%)\n", "Accuracy for k=8: 59.23% (+-1.50%)\n", "Accuracy for k=16: 63.94% (+-1.24%)\n", "Accuracy for k=32: 67.57% (+-0.90%)\n"]}], "source": ["protomaml_result_file = os.path.join(CHECKPOINT_PATH, \"protomaml_fewshot.json\")\n", "\n", "if os.path.isfile(protomaml_result_file):\n", " # Load pre-computed results\n", " with open(protomaml_result_file) as f:\n", " protomaml_accuracies = json.load(f)\n", " protomaml_accuracies = {int(k): v for k, v in protomaml_accuracies.items()}\n", "else:\n", " # Perform same experiments as for ProtoNet\n", " protomaml_accuracies = dict()\n", " for k in [2, 4, 8, 16, 32]:\n", " protomaml_accuracies[k] = test_protomaml(protomaml_model, test_set, k_shot=k)\n", " # Export results\n", " with open(protomaml_result_file, \"w\") as f:\n", " json.dump(protomaml_accuracies, f, indent=4)\n", "\n", "for k in protomaml_accuracies:\n", " print(\n", " \"Accuracy for k=%i: %4.2f%% (+-%4.2f%%)\"\n", " % (k, 100.0 * protomaml_accuracies[k][0], 100.0 * protomaml_accuracies[k][1])\n", " )"]}, {"cell_type": "markdown", "id": "a3b76b70", "metadata": {"papermill": {"duration": 0.051095, "end_time": "2021-10-10T16:37:28.569910", "exception": false, "start_time": "2021-10-10T16:37:28.518815", "status": "completed"}, "tags": []}, "source": ["Again, let's plot the results in our plot from before."]}, {"cell_type": "code", "execution_count": 33, "id": "c19a1cd0", "metadata": {"execution": {"iopub.execute_input": "2021-10-10T16:37:28.700295Z", "iopub.status.busy": "2021-10-10T16:37:28.688544Z", "iopub.status.idle": "2021-10-10T16:37:28.982037Z", 
"shell.execute_reply": "2021-10-10T16:37:28.981554Z"}, "papermill": {"duration": 0.36056, "end_time": "2021-10-10T16:37:28.982151", "exception": false, "start_time": "2021-10-10T16:37:28.621591", "status": "completed"}, "tags": []}, "outputs": [{"data": {"application/pdf": "\n", "image/svg+xml": ["\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-10-10T18:37:28.787735\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}], "source": ["ax = plot_few_shot(protonet_accuracies, name=\"ProtoNet\", color=\"C1\")\n", "plot_few_shot(protomaml_accuracies, name=\"ProtoMAML\", color=\"C2\", ax=ax)\n", "plt.show()\n", "plt.close()"]}, {"cell_type": "markdown", "id": "b631ffc3", "metadata": {"papermill": {"duration": 0.053734, "end_time": "2021-10-10T16:37:29.090435", "exception": false, "start_time": "2021-10-10T16:37:29.036701", "status": "completed"}, "tags": []}, "source": ["We can observe that ProtoMAML is indeed able to outperform ProtoNet for $k>4$.\n", "This is because with more samples, it becomes more relevant to also adapt the base model's parameters.\n", "Meanwhile, for $k=2$, ProtoMAML achieves lower performance than ProtoNet.\n", "This is likely also related to choosing 200 inner loop updates since with more updates, there exists the risk of overfitting.\n", "Nonetheless, the high standard deviation for $k=2$ makes it hard to take any statistically valid conclusion.\n", "\n", "Overall, we can conclude that ProtoMAML slightly outperforms ProtoNet for larger shot counts.\n", "However, one disadvantage of ProtoMAML is its much longer training and testing time.\n", "ProtoNet provides a simple, efficient, yet strong baseline for\n", "ProtoMAML, and might be the better solution in situations where limited\n", "resources are available."]}, {"cell_type": "markdown", "id": "6d158afa", "metadata": {"papermill": {"duration": 0.055343, "end_time": "2021-10-10T16:37:29.202908", "exception": false, "start_time": "2021-10-10T16:37:29.147565", "status": "completed"}, "tags": []}, "source": ["## Domain adaptation\n", "\n", "So far, we have evaluated our meta-learning algorithms on the same dataset on which we have trained them.\n", "However, meta-learning algorithms are especially interesting when we want to move from one to another dataset.\n", "So, what happens if we apply them on a quite different dataset than CIFAR?\n", "This is what we try 
out below, and evaluate ProtoNet and ProtoMAML on the SVHN dataset."]}, {"cell_type": "markdown", "id": "71c4f38f", "metadata": {"papermill": {"duration": 0.054154, "end_time": "2021-10-10T16:37:29.316416", "exception": false, "start_time": "2021-10-10T16:37:29.262262", "status": "completed"}, "tags": []}, "source": ["### SVHN dataset\n", "\n", "The Street View House Numbers (SVHN) dataset is a real-world image dataset for house number detection.\n", "It is similar to MNIST by having the classes 0 to 9, but is more difficult due to its real-world setting and possible distracting numbers left and right.\n", "Let's first load the dataset, and visualize some images to get an impression of the dataset."]}, {"cell_type": "code", "execution_count": 34, "id": "74228693", "metadata": {"execution": {"iopub.execute_input": "2021-10-10T16:37:29.435411Z", "iopub.status.busy": "2021-10-10T16:37:29.434935Z", "iopub.status.idle": "2021-10-10T16:37:34.722837Z", "shell.execute_reply": "2021-10-10T16:37:34.722322Z"}, "papermill": {"duration": 5.346857, "end_time": "2021-10-10T16:37:34.722956", "exception": false, "start_time": "2021-10-10T16:37:29.376099", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Downloading http://ufldl.stanford.edu/housenumbers/test_32x32.mat to /__w/1/s/.datasets/test_32x32.mat\n"]}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "04c241d2abd34caa8d271a853e8f6a74", "version_major": 2, "version_minor": 0}, "text/plain": [" 0%| | 0/64275384 [00:00\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-10-10T18:37:34.921312\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}], "source": ["# Visualize some examples\n", "NUM_IMAGES = 12\n", "SVHN_images = [SVHN_test_dataset[np.random.randint(len(SVHN_test_dataset))][0] for idx in range(NUM_IMAGES)]\n", "SVHN_images = torch.stack(SVHN_images, dim=0)\n", "img_grid = torchvision.utils.make_grid(SVHN_images, nrow=6, normalize=True, pad_value=0.9)\n", "img_grid = img_grid.permute(1, 2, 0)\n", "\n", "plt.figure(figsize=(8, 8))\n", "plt.title(\"Image examples of the SVHN dataset\")\n", "plt.imshow(img_grid)\n", "plt.axis(\"off\")\n", "plt.show()\n", "plt.close()"]}, {"cell_type": "markdown", "id": "65604d6b", "metadata": {"papermill": {"duration": 0.057271, "end_time": "2021-10-10T16:37:35.195031", "exception": false, "start_time": "2021-10-10T16:37:35.137760", "status": "completed"}, "tags": []}, "source": ["Each image is labeled with one class between 0 and 9 representing the main digit in the image.\n", "Can our ProtoNet and ProtoMAML learn to classify the digits from only a few examples?\n", "This is what we will test out below.\n", "The images have the same size as CIFAR, so that we can use the images without changes.\n", "We first prepare the dataset, for which we take the first 500 images per class.\n", "For this dataset, we use our test functions as before to get an estimated performance for different number of shots."]}, {"cell_type": "code", "execution_count": 36, "id": "0de00f6d", "metadata": {"execution": {"iopub.execute_input": "2021-10-10T16:37:35.315332Z", "iopub.status.busy": "2021-10-10T16:37:35.314823Z", "iopub.status.idle": "2021-10-10T16:37:35.326321Z", "shell.execute_reply": "2021-10-10T16:37:35.326709Z"}, "papermill": {"duration": 0.07457, "end_time": "2021-10-10T16:37:35.326849", "exception": false, "start_time": "2021-10-10T16:37:35.252279", "status": "completed"}, "tags": []}, "outputs": [{"data": {"text/plain": ["(5000, 32, 32, 3)"]}, "execution_count": 36, "metadata": {}, "output_type": "execute_result"}], "source": 
["imgs = np.transpose(SVHN_test_dataset.data, (0, 2, 3, 1))\n", "targets = SVHN_test_dataset.labels\n", "# Limit number of examples to 500 to reduce test time\n", "min_label_count = min(500, np.bincount(SVHN_test_dataset.labels).min())\n", "\n", "idxs = np.concatenate([np.where(targets == c)[0][:min_label_count] for c in range(1 + targets.max())], axis=0)\n", "imgs = imgs[idxs]\n", "targets = torch.from_numpy(targets[idxs]).long()\n", "\n", "svhn_fewshot_dataset = ImageDataset(imgs, targets, img_transform=test_transform)\n", "svhn_fewshot_dataset.imgs.shape"]}, {"cell_type": "markdown", "id": "761db618", "metadata": {"papermill": {"duration": 0.059836, "end_time": "2021-10-10T16:37:35.446022", "exception": false, "start_time": "2021-10-10T16:37:35.386186", "status": "completed"}, "tags": []}, "source": ["### Experiments\n", "\n", "First, we can apply ProtoNet to the SVHN dataset:"]}, {"cell_type": "code", "execution_count": 37, "id": "443d295e", "metadata": {"execution": {"iopub.execute_input": "2021-10-10T16:37:35.566197Z", "iopub.status.busy": "2021-10-10T16:37:35.565609Z", "iopub.status.idle": "2021-10-10T16:37:49.932486Z", "shell.execute_reply": "2021-10-10T16:37:49.932000Z"}, "papermill": {"duration": 14.429039, "end_time": "2021-10-10T16:37:49.932629", "exception": false, "start_time": "2021-10-10T16:37:35.503590", "status": "completed"}, "tags": []}, "outputs": [{"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "6ae81549f8a343a2985e8fbdd3e6cfce", "version_major": 2, "version_minor": 0}, "text/plain": ["Extracting image features: 0%| | 0/40 [00:00\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-10-10T18:37:50.563371\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}], "source": ["ax = plot_few_shot(protonet_svhn_accuracies, name=\"ProtoNet\", color=\"C1\")\n", "plot_few_shot(protomaml_svhn_accuracies, name=\"ProtoMAML\", color=\"C2\", ax=ax)\n", "plt.show()\n", "plt.close()"]}, {"cell_type": "markdown", "id": "81b31ea2", "metadata": {"papermill": {"duration": 0.064936, "end_time": "2021-10-10T16:38:10.896748", "exception": false, "start_time": "2021-10-10T16:38:10.831812", "status": "completed"}, "tags": []}, "source": ["## Conclusion\n", "\n", "In this notebook, we have discussed meta-learning algorithms that learn to adapt to new classes and/or tasks with just a few samples.\n", "We have discussed three popular algorithms, namely ProtoNet, MAML and ProtoMAML.\n", "On the few-shot image classification task of CIFAR100, ProtoNet and ProtoMAML showed to perform similarly well, with slight benefits of ProtoMAML for larger shot sizes.\n", "However, for out-of-distribution data (SVHN), the ability to optimize the base model showed to be crucial and gave ProtoMAML considerable performance gains over ProtoNet.\n", "Nonetheless, ProtoNet offers other advantages compared to ProtoMAML, namely a very cheap training and test cost as well as a simpler implementation.\n", "Hence, it is recommended to consider whether the additionally complexity\n", "of ProtoMAML is worth the extra training computation cost, or whether\n", "ProtoNet is already sufficient for the task at hand."]}, {"cell_type": "markdown", "id": "e546b5d0", "metadata": {"papermill": {"duration": 0.064218, "end_time": "2021-10-10T16:38:11.027954", "exception": false, "start_time": "2021-10-10T16:38:10.963736", "status": "completed"}, "tags": []}, "source": ["### References\n", "\n", "[1] Snell, Jake, Kevin Swersky, and Richard S. 
Zemel.\n", "\"Prototypical networks for few-shot learning.\"\n", "NeurIPS 2017.\n", "([link](https://arxiv.org/pdf/1703.05175.pdf))\n", "\n", "[2] Chelsea Finn, Pieter Abbeel, Sergey Levine.\n", "\"Model-Agnostic Meta-Learning for Fast Adaptation of Deep Networks.\"\n", "ICML 2017.\n", "([link](http://proceedings.mlr.press/v70/finn17a.html))\n", "\n", "[3] Triantafillou, Eleni, Tyler Zhu, Vincent Dumoulin, Pascal Lamblin, Utku Evci, Kelvin Xu, Ross Goroshin et al.\n", "\"Meta-dataset: A dataset of datasets for learning to learn from few examples.\"\n", "ICLR 2020.\n", "([link](https://openreview.net/pdf?id=rkgAGAVKPr))"]}, {"cell_type": "markdown", "id": "468b2212", "metadata": {"papermill": {"duration": 0.062817, "end_time": "2021-10-10T16:38:11.155742", "exception": false, "start_time": "2021-10-10T16:38:11.092925", "status": "completed"}, "tags": []}, "source": ["## Congratulations - Time to Join the Community!\n", "\n", "Congratulations on completing this notebook tutorial! If you enjoyed this and would like to join the Lightning\n", "movement, you can do so in the following ways!\n", "\n", "### Star [Lightning](https://github.com/PyTorchLightning/pytorch-lightning) on GitHub\n", "The easiest way to help our community is just by starring the GitHub repos! This helps raise awareness of the cool\n", "tools we're building.\n", "\n", "### Join our [Slack](https://join.slack.com/t/pytorch-lightning/shared_invite/zt-pw5v393p-qRaDgEk24~EjiZNBpSQFgQ)!\n", "The best way to keep up to date on the latest advancements is to join our community! Make sure to introduce yourself\n", "and share your interests in the `#general` channel\n", "\n", "\n", "### Contributions !\n", "The best way to contribute to our community is to become a code contributor! 
At any time you can go to\n", "[Lightning](https://github.com/PyTorchLightning/pytorch-lightning) or [Bolt](https://github.com/PyTorchLightning/lightning-bolts)\n", "GitHub Issues page and filter for \"good first issue\".\n", "\n", "* [Lightning good first issue](https://github.com/PyTorchLightning/pytorch-lightning/issues?q=is%3Aopen+is%3Aissue+label%3A%22good+first+issue%22)\n", "* [Bolt good first issue](https://github.com/PyTorchLightning/lightning-bolts/issues?q=is%3Aopen+is%3Aissue+label%3A%22good+first+issue%22)\n", "* You can also contribute your own notebooks with useful examples !\n", "\n", "### Great thanks from the entire Pytorch Lightning Team for your interest !\n", "\n", "![Pytorch Lightning](){height=\"60px\" width=\"240px\"}"]}, {"cell_type": "raw", "metadata": {"raw_mimetype": "text/restructuredtext"}, "source": [".. customcarditem::\n", " :header: Tutorial 12: Meta-Learning - Learning to Learn\n", " :card_description: In this tutorial, we will discuss algorithms that learn models which can quickly adapt to new classes and/or tasks with few samples. 
This area of machine learning is called...\n", " :tags: Few-shot-learning,MAML,ProtoNet,GPU/TPU,UvA-DL-Course\n", " :image: _static/images/course_UvA-DL/12-meta-learning.jpg"]}], "metadata": {"jupytext": {"cell_metadata_filter": "id,colab,colab_type,-all", "formats": "ipynb,py:percent", "main_language": "python"}, "language_info": {"codemirror_mode": {"name": "ipython", "version": 3}, "file_extension": ".py", "mimetype": "text/x-python", "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.9.7"}, "papermill": {"default_parameters": {}, "duration": 106.820185, "end_time": "2021-10-10T16:38:11.928740", "environment_variables": {}, "exception": null, "input_path": "course_UvA-DL/12-meta-learning/Meta_Learning.ipynb", "output_path": ".notebooks/course_UvA-DL/12-meta-learning.ipynb", "parameters": {}, "start_time": "2021-10-10T16:36:25.108555", "version": "2.3.3"}, "widgets": {"application/vnd.jupyter.widget-state+json": {"state": {"02efcb1a6aa4448eb2be5597b7229117": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "04c241d2abd34caa8d271a853e8f6a74": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_94a0798591274c8b8b0011603eb7638f", "IPY_MODEL_b0685ba39080452fa095a152855ce3f5", 
"IPY_MODEL_df741ff3bf654a9b8b7a024c14f54f61"], "layout": "IPY_MODEL_5643ce9402954952881a5eb9119ff556"}}, "05eeda38820a4700b6808a22c087f854": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "06dabf4f2d724f2e855a18452a421901": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": 
null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "0748cb2c03654ebebcdbf1bec54ef2a6": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_72ff32b019be4252b3a9736e42d05257", "placeholder": "\u200b", "style": "IPY_MODEL_693e0990c811418d8be6f20a3c613f3e", "value": " 42/47 [00:00<00:00, 83.87it/s]"}}, "074a0b76522b4e2ab81b2abed09f23a3": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_bffa3c9c26424621a044f35fc72dc03f", "IPY_MODEL_65f3907fd55c4b4dbd91642a08fd39d9", "IPY_MODEL_4ea0e80530d34d4f8d8485c83df9da16"], "layout": "IPY_MODEL_cb0c7957cd344fd5b8e229b443f1640d"}}, "08d9ec62524244f1872cdb20191f3be7": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", 
"_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "0a0c945ddb6546be814dab292cf61c4e": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "0a2fabd9ce614e4ab1700634bc17e28e": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "1357795e20b8457abe5ee3078efe3ca7": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", 
"_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "136db4bc997541c5b3123895b1746e5e": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "16b537a4cb21479fa2564472a850f609": 
{"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "18aca4955a7a4c64a8eb12925d3704d7": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_b380f61e129140fcb2daf6c273570e16", "IPY_MODEL_b7d2cb428c5c4272a094846477794af9", "IPY_MODEL_509d1c763a634f83b7fba1ad9494dc02"], "layout": "IPY_MODEL_74c3e37ba7ac43019562374aae3f8c4e"}}, "1984df6019f34935a0d89f8f0cc9c549": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": 
"ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "19f3640a3b6f411984df19dd9b9f2536": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "1b10c53ce772446d99285a37607ef5e3": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_f6e7ccff3f3f4b87983f1603bf0b3547", "placeholder": "\u200b", "style": "IPY_MODEL_241f1955c2624d60b29151d36487ef5e", "value": " 298/300 [00:13<00:00, 22.45it/s]"}}, "219937af24194529826e86cbeaa92dc1": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_45c4fd2d576f4ecaa4df4aca60ed4377", "IPY_MODEL_5fa0132632af4e80b186723f1a5c9667", "IPY_MODEL_43bf706a87a74c8c903431b130a3b7cd"], "layout": "IPY_MODEL_314d69183852488f8d2526db24356295"}}, "241f1955c2624d60b29151d36487ef5e": {"model_module": "@jupyter-widgets/controls", "model_module_version": 
"1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "25be42641c3c4d3abe06f325f7e5707c": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "26bde6db982d430988ad5224841c46b6": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "29ac64c53e904692b4e1bcacd235cb15": {"model_module": "@jupyter-widgets/base", 
"model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "2cc8415ac50d463e9eb6eba8bd7441dd": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, 
"object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "2e1ac83c3a2b4bda89b392a3b2795d7d": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_842078486c2c449786473d055756c9f3", "placeholder": "\u200b", "style": "IPY_MODEL_fca8ada280ae405ab7fc84a435653757", "value": " 124/125 [00:02<00:00, 44.61it/s]"}}, "314d69183852488f8d2526db24356295": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, 
"33082c5ed1d04d52bc8bf407f24b6cd2": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "3545a43fc2ba428b8b8c312ecdb91469": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_36c6f2b6dcba4d0386076ed767d9c503", "max": 300.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_441a767165c641359c9955258a379f90", "value": 300.0}}, "36c6f2b6dcba4d0386076ed767d9c503": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": 
"@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "3ae54407f35e4135929978d9d2889764": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_e08469460c584a789dd3516b7d78ae77", "placeholder": "\u200b", "style": "IPY_MODEL_e46fb7aeb83b4002bdd245d9c6f731e3", "value": "Evaluating prototype classification: 99%"}}, "3c728764f18c47bc8b94ff75bfdde4f4": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", 
"align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "3d2ebb08ff2f4bdbacdb096b84f1ec09": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "3e6e0061bdc745beaac7f83f84327df4": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, 
"justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "3e99426778d245cbbafb04d6f52c153e": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "3ec9165e19ed46f8b78dfdfd0adc8ccf": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "4281b262e4a544969139ae166f292c37": {"model_module": "@jupyter-widgets/controls", 
"model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_cb1d437a4c354907bc26e5c54ca76168", "max": 47.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_ea8059402deb40659f77d6c63d7f8d09", "value": 47.0}}, "43bbd6d914404eb7be1ccc7417e0c882": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "43bf706a87a74c8c903431b130a3b7cd": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": 
"HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_1357795e20b8457abe5ee3078efe3ca7", "placeholder": "\u200b", "style": "IPY_MODEL_4b795244ba454b47bca4061ab2fc69a7", "value": " 34/38 [00:00<00:00, 52.34it/s]"}}, "441a767165c641359c9955258a379f90": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "447d64a260fa4e579069160a3d9460de": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "45c4fd2d576f4ecaa4df4aca60ed4377": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_cc4167da1b794828ab4eb0679922efe1", "placeholder": "\u200b", "style": "IPY_MODEL_48a737ec864a4e288e6cf338e313bf74", "value": "Evaluating prototype classification: 89%"}}, "461f881689924b8e82af3e96a920be27": {"model_module": "@jupyter-widgets/controls", "model_module_version": 
"1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_3c728764f18c47bc8b94ff75bfdde4f4", "placeholder": "\u200b", "style": "IPY_MODEL_d939ed1df36b4c5db18f4b0496ee48de", "value": " 72/75 [00:22<00:00, 17.74it/s]"}}, "467e71f262cf432fba62ed8d75effd3a": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "48a737ec864a4e288e6cf338e313bf74": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "495f557ce24948f0968a8e77cc121b55": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_d2c2b819979a476a8482e9d67ebab1a7", "placeholder": "\u200b", "style": "IPY_MODEL_557662d2d3e3487cbedd294325df6f31", "value": ""}}, 
"4b795244ba454b47bca4061ab2fc69a7": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "4c13f424d1bb4cf0a44284e678229cf7": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "4d5211d9d6e24a2cb1baa906ffa8dac2": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "4ea0e80530d34d4f8d8485c83df9da16": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_29ac64c53e904692b4e1bcacd235cb15", "placeholder": "\u200b", "style": "IPY_MODEL_a37e0600abe64891ba7bad38e42cae86", "value": " 12/16 [00:00<00:00, 117.22it/s]"}}, "4fd996b6dd534694b6413f376e6be22c": 
{"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "509d1c763a634f83b7fba1ad9494dc02": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_b19b954922464bc3ae7a287ae8e7ba36", "placeholder": "\u200b", "style": "IPY_MODEL_f4334aa28f094684884cba73f70d9539", "value": " 148/150 [00:04<00:00, 37.03it/s]"}}, "557662d2d3e3487cbedd294325df6f31": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": 
"DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "5643ce9402954952881a5eb9119ff556": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "59b3b0d90a7548ae8ec79d1fb1aa783e": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_fc0cd3a5fceb46438c8831f7ace96e8e", "IPY_MODEL_4281b262e4a544969139ae166f292c37", "IPY_MODEL_0748cb2c03654ebebcdbf1bec54ef2a6"], "layout": "IPY_MODEL_5c60626bcc1c4a56a49881ed8afd804c"}}, "5b9c06753fca42ca89e480bfe3de1b06": {"model_module": 
"@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_eae30ee4b8e54cfbafa7a73ac8c3720d", "max": 250.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_02efcb1a6aa4448eb2be5597b7229117", "value": 250.0}}, "5c60626bcc1c4a56a49881ed8afd804c": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "5fa0132632af4e80b186723f1a5c9667": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", 
"_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_2cc8415ac50d463e9eb6eba8bd7441dd", "max": 38.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_b4923b5857b447e2aca7a73524cbb3bb", "value": 38.0}}, "6051618a7e8943ce91d14f6a31a0f679": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "65f3907fd55c4b4dbd91642a08fd39d9": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": 
"ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_c39a5cb98e1644529c1364704681c37d", "max": 16.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_7b48347de2bd47e88549b165c7af8d90", "value": 16.0}}, "66330b6ebefe44c7906d3e6e5fd221c6": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "693e0990c811418d8be6f20a3c613f3e": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "69f9bf1e8e3c43d0a2225f3c3d6cf91d": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": 
"@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "6ae81549f8a343a2985e8fbdd3e6cfce": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_9643addbcabd45b48bba6f84b24900f2", "IPY_MODEL_d022e70ba7ff4133a278315f4cabdec8", "IPY_MODEL_f69a45ea7e884b48bc7e22af83113f6d"], "layout": "IPY_MODEL_3ec9165e19ed46f8b78dfdfd0adc8ccf"}}, "6b6ae741f4c442b5bcccfbb60ea48963": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": 
null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "6e439485ca4e47de8597c3af51ac4d8a": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_dee61b262f264abe9c8f19123bb21078", "max": 32.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_90ce08a097804618b4b4aa29e00c2221", "value": 32.0}}, "72ff32b019be4252b3a9736e42d05257": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, 
"grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "738ae6a5004b4fcd8e1acf8973c7fcf6": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "7427ffde194a471bb68404b98bba5521": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": 
null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_6b6ae741f4c442b5bcccfbb60ea48963", "placeholder": "\u200b", "style": "IPY_MODEL_4c13f424d1bb4cf0a44284e678229cf7", "value": " 169001984/? [00:01<00:00, 116158853.76it/s]"}}, "74c3e37ba7ac43019562374aae3f8c4e": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "77ca484b49b447dc9c081a459a84ab3b": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, 
"flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "783a9fed2b1a4153869348f1b4cd9bdf": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "7b48347de2bd47e88549b165c7af8d90": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "7f28b92e80274d7f9b778bfb634ac8db": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": 
null, "layout": "IPY_MODEL_3e6e0061bdc745beaac7f83f84327df4", "max": 75.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_3e99426778d245cbbafb04d6f52c153e", "value": 75.0}}, "8058b34966e64a54a236152f5de30268": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "820542f219d34da6af0d83ed20f6756d": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_a38734b949f0443fae617d76a196b40f", "IPY_MODEL_6e439485ca4e47de8597c3af51ac4d8a", "IPY_MODEL_84f66ce16b0a435eb9746909f90b69b5"], "layout": "IPY_MODEL_cac735df1f3544b0a8a2c89d88e27d1c"}}, "8352a72f638049be98819a832027cb10": 
{"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "842078486c2c449786473d055756c9f3": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, 
"min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "84a6abc3c3d54dd7a08fbc7b8dfd07f3": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_97e410e1d6a245009d4f410fbf407f2a", "IPY_MODEL_f5f64e7b652046608b09e1865fc8929c", "IPY_MODEL_ae07625fe7bd4a2cbbbf1d0890d6df36"], "layout": "IPY_MODEL_cc5e5ce694504583a2d4dcaf311d80c2"}}, "84f66ce16b0a435eb9746909f90b69b5": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_738ae6a5004b4fcd8e1acf8973c7fcf6", "placeholder": "\u200b", "style": "IPY_MODEL_0a0c945ddb6546be814dab292cf61c4e", "value": " 31/32 [00:00<00:00, 97.75it/s]"}}, "8a82349f3b624433926ed46218343ef9": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, 
"flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "90ce08a097804618b4b4aa29e00c2221": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "93c64b6a35e441bf9a79602a829a41d7": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_b35a4714ac784c49970726e49084c08b", "IPY_MODEL_5b9c06753fca42ca89e480bfe3de1b06", "IPY_MODEL_b81a79f5481446ad9a9ef8597cc47731"], "layout": "IPY_MODEL_b6c8207aebc64e519f57ea458016b8d8"}}, "94a0798591274c8b8b0011603eb7638f": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": 
"HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_b8d61566453f40a8a10086d9159efd3f", "placeholder": "\u200b", "style": "IPY_MODEL_467e71f262cf432fba62ed8d75effd3a", "value": ""}}, "9643addbcabd45b48bba6f84b24900f2": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_efed4fdf79514ceabb9b9762cc24d4a2", "placeholder": "\u200b", "style": "IPY_MODEL_c0993cf20a304d07b41e2a11fa17f1ef", "value": "Extracting image features: 78%"}}, "97e410e1d6a245009d4f410fbf407f2a": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_136db4bc997541c5b3123895b1746e5e", "placeholder": "\u200b", "style": "IPY_MODEL_783a9fed2b1a4153869348f1b4cd9bdf", "value": "Evaluating prototype classification: 97%"}}, "9a243670d2374f4ca046908284044ab5": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", 
"align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "9dc8c432361347f482dc1fbac96f1ec5": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "a09bea6c4bec4d14b6ac5fc81cf9461a": {"model_module": "@jupyter-widgets/controls", "model_module_version": 
"1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "a0ee70498fb94ecc9c39238ad029ae29": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_26bde6db982d430988ad5224841c46b6", "max": 125.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_4d5211d9d6e24a2cb1baa906ffa8dac2", "value": 125.0}}, "a28f68eaf131448ebb0bc0fb801bfd0b": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_ef2a48d284cd4a8b99863c678d1eff1f", "placeholder": "\u200b", "style": "IPY_MODEL_e67ab28b10924b64a5d18ea090aa87e8", "value": "Evaluating prototype classification: 53%"}}, "a37e0600abe64891ba7bad38e42cae86": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": 
"@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "a38734b949f0443fae617d76a196b40f": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_69f9bf1e8e3c43d0a2225f3c3d6cf91d", "placeholder": "\u200b", "style": "IPY_MODEL_3d2ebb08ff2f4bdbacdb096b84f1ec09", "value": "Evaluating prototype classification: 97%"}}, "a4f9318e26d847d394ca5e252d5bbaf4": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_8058b34966e64a54a236152f5de30268", "max": 19.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_08d9ec62524244f1872cdb20191f3be7", "value": 19.0}}, "a878ed48e3e745238604dc0491a31f1e": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": 
null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "acb6f2dd23f94af091e7ed4aa1b7a3de": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_8a82349f3b624433926ed46218343ef9", "placeholder": "\u200b", "style": "IPY_MODEL_fb4936f8301947a686a8c8fe1df1eb27", "value": "Evaluating prototype classification: 99%"}}, "ae07625fe7bd4a2cbbbf1d0890d6df36": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_eda1ed0aecca4420a13f2ac4cc2475a3", "placeholder": "\u200b", "style": "IPY_MODEL_d36132a1ac6044e08ce39355ab0e24c0", "value": " 61/63 [00:00<00:00, 64.84it/s]"}}, "b0685ba39080452fa095a152855ce3f5": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": 
"FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_d388d078f57a4be6a40dfb1d09fcdb68", "max": 64275384.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_a09bea6c4bec4d14b6ac5fc81cf9461a", "value": 64275384.0}}, "b19b954922464bc3ae7a287ae8e7ba36": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "b35a4714ac784c49970726e49084c08b": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": 
null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_9a243670d2374f4ca046908284044ab5", "placeholder": "\u200b", "style": "IPY_MODEL_e79716d59af843ae8291b7d25d7afa97", "value": "Evaluating prototype classification: 100%"}}, "b380f61e129140fcb2daf6c273570e16": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_a878ed48e3e745238604dc0491a31f1e", "placeholder": "\u200b", "style": "IPY_MODEL_f449bfa0562f46dd9d166a6667df8ce2", "value": "Evaluating prototype classification: 99%"}}, "b46d974e72914b52bd20ced66ed6fcd3": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "b4923b5857b447e2aca7a73524cbb3bb": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "b6767d1462de4f8b8eb018e9f51ef402": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", 
"model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_e8f08f9a11444d0fbdfeaeebcdc3ac7a", "IPY_MODEL_7f28b92e80274d7f9b778bfb634ac8db", "IPY_MODEL_461f881689924b8e82af3e96a920be27"], "layout": "IPY_MODEL_c0922c095d624b36adfc21be13d915e9"}}, "b6c8207aebc64e519f57ea458016b8d8": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "b7d2cb428c5c4272a094846477794af9": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": 
"@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_16b537a4cb21479fa2564472a850f609", "max": 150.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_1984df6019f34935a0d89f8f0cc9c549", "value": 150.0}}, "b81a79f5481446ad9a9ef8597cc47731": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_be1415cbc6e14d888ea2e0f649648c2a", "placeholder": "\u200b", "style": "IPY_MODEL_447d64a260fa4e579069160a3d9460de", "value": " 249/250 [00:09<00:00, 26.83it/s]"}}, "b8d61566453f40a8a10086d9159efd3f": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, 
"overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "bcd5770b13c540db929b606eb7518b21": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "be1415cbc6e14d888ea2e0f649648c2a": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "bffa3c9c26424621a044f35fc72dc03f": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, 
"_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_66330b6ebefe44c7906d3e6e5fd221c6", "placeholder": "\u200b", "style": "IPY_MODEL_c3f25997fc9b49649de9d4690d00ba4d", "value": "Evaluating prototype classification: 75%"}}, "c0922c095d624b36adfc21be13d915e9": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "c0993cf20a304d07b41e2a11fa17f1ef": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "c2ce51ed3ad643b2b521e696f82af495": {"model_module": "@jupyter-widgets/controls", 
"model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_3ae54407f35e4135929978d9d2889764", "IPY_MODEL_3545a43fc2ba428b8b8c312ecdb91469", "IPY_MODEL_1b10c53ce772446d99285a37607ef5e3"], "layout": "IPY_MODEL_8352a72f638049be98819a832027cb10"}}, "c39a5cb98e1644529c1364704681c37d": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "c3f25997fc9b49649de9d4690d00ba4d": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, 
"_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "c40fd99740dc4dd5980ca6537e42c5d0": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "cac735df1f3544b0a8a2c89d88e27d1c": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "cb0c7957cd344fd5b8e229b443f1640d": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": 
"@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "cb1d437a4c354907bc26e5c54ca76168": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, 
"cc4167da1b794828ab4eb0679922efe1": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "cc5e5ce694504583a2d4dcaf311d80c2": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, 
"max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "cd0b594802d34dd58532e00bad4a7397": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "ceabb6b1df1d4a1284de89bb635533c0": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_4fd996b6dd534694b6413f376e6be22c", "max": 169001437.0, "min": 
0.0, "orientation": "horizontal", "style": "IPY_MODEL_e7e09bfea2384e90951c090fc2a680e7", "value": 169001437.0}}, "d022e70ba7ff4133a278315f4cabdec8": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_05eeda38820a4700b6808a22c087f854", "max": 40.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_dfd6e04d1360446d9ef1db11256ebe69", "value": 40.0}}, "d2c2b819979a476a8482e9d67ebab1a7": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "d36132a1ac6044e08ce39355ab0e24c0": {"model_module": 
"@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "d388d078f57a4be6a40dfb1d09fcdb68": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "d939ed1df36b4c5db18f4b0496ee48de": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "db308fcc8f994e4aabcd079e27a47da6": 
{"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "de8827ff3a9b4e519927fb64aa069b4d": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "dee61b262f264abe9c8f19123bb21078": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, 
"bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "df741ff3bf654a9b8b7a024c14f54f61": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_77ca484b49b447dc9c081a459a84ab3b", "placeholder": "\u200b", "style": "IPY_MODEL_b46d974e72914b52bd20ced66ed6fcd3", "value": " 64275456/? 
[00:04<00:00, 21648157.34it/s]"}}, "dfd6e04d1360446d9ef1db11256ebe69": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "e08469460c584a789dd3516b7d78ae77": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "e46fb7aeb83b4002bdd245d9c6f731e3": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", 
"_view_name": "StyleView", "description_width": ""}}, "e67ab28b10924b64a5d18ea090aa87e8": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "e79716d59af843ae8291b7d25d7afa97": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "e7e09bfea2384e90951c090fc2a680e7": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "e8f08f9a11444d0fbdfeaeebcdc3ac7a": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_9dc8c432361347f482dc1fbac96f1ec5", "placeholder": "\u200b", "style": "IPY_MODEL_bcd5770b13c540db929b606eb7518b21", "value": "Evaluating prototype 
classification: 96%"}}, "e9c2476de61b41c78b739b3465029786": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_acb6f2dd23f94af091e7ed4aa1b7a3de", "IPY_MODEL_a0ee70498fb94ecc9c39238ad029ae29", "IPY_MODEL_2e1ac83c3a2b4bda89b392a3b2795d7d"], "layout": "IPY_MODEL_6051618a7e8943ce91d14f6a31a0f679"}}, "ea8059402deb40659f77d6c63d7f8d09": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "eae30ee4b8e54cfbafa7a73ac8c3720d": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, 
"min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "ed46b8de7055431dafc7c8dbf5aede81": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_43bbd6d914404eb7be1ccc7417e0c882", "placeholder": "\u200b", "style": "IPY_MODEL_19f3640a3b6f411984df19dd9b9f2536", "value": " 10/19 [00:00<00:00, 97.06it/s]"}}, "eda1ed0aecca4420a13f2ac4cc2475a3": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, 
"width": null}}, "ef2a48d284cd4a8b99863c678d1eff1f": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "efed4fdf79514ceabb9b9762cc24d4a2": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, 
"margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "f4334aa28f094684884cba73f70d9539": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "f449bfa0562f46dd9d166a6667df8ce2": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "f523d40c013f4da7bc639dc9291509e8": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_495f557ce24948f0968a8e77cc121b55", "IPY_MODEL_ceabb6b1df1d4a1284de89bb635533c0", "IPY_MODEL_7427ffde194a471bb68404b98bba5521"], "layout": "IPY_MODEL_33082c5ed1d04d52bc8bf407f24b6cd2"}}, "f5f64e7b652046608b09e1865fc8929c": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": 
"@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_cd0b594802d34dd58532e00bad4a7397", "max": 63.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_25be42641c3c4d3abe06f325f7e5707c", "value": 63.0}}, "f69a45ea7e884b48bc7e22af83113f6d": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_0a2fabd9ce614e4ab1700634bc17e28e", "placeholder": "\u200b", "style": "IPY_MODEL_c40fd99740dc4dd5980ca6537e42c5d0", "value": " 31/40 [00:00<00:00, 74.38it/s]"}}, "f6e7ccff3f3f4b87983f1603bf0b3547": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, 
"max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "fb4936f8301947a686a8c8fe1df1eb27": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "fc0cd3a5fceb46438c8831f7ace96e8e": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_db308fcc8f994e4aabcd079e27a47da6", "placeholder": "\u200b", "style": "IPY_MODEL_de8827ff3a9b4e519927fb64aa069b4d", "value": "Extracting image features: 89%"}}, "fca8ada280ae405ab7fc84a435653757": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "ffaf8189884a44548efd49c252a85a7a": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", 
"_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_a28f68eaf131448ebb0bc0fb801bfd0b", "IPY_MODEL_a4f9318e26d847d394ca5e252d5bbaf4", "IPY_MODEL_ed46b8de7055431dafc7c8dbf5aede81"], "layout": "IPY_MODEL_06dabf4f2d724f2e855a18452a421901"}}}, "version_major": 2, "version_minor": 0}}}, "nbformat": 4, "nbformat_minor": 5} \ No newline at end of file diff --git a/source/notebooks/course_UvA-DL/13-contrastive-learning.ipynb b/source/notebooks/course_UvA-DL/13-contrastive-learning.ipynb deleted file mode 100644 index 44f1eef..0000000 --- a/source/notebooks/course_UvA-DL/13-contrastive-learning.ipynb +++ /dev/null @@ -1 +0,0 @@ -{"cells": [{"cell_type": "markdown", "id": "6000551a", "metadata": {"papermill": {"duration": 0.030399, "end_time": "2021-10-10T16:38:20.779892", "exception": false, "start_time": "2021-10-10T16:38:20.749493", "status": "completed"}, "tags": []}, "source": ["\n", "# Tutorial 13: Self-Supervised Contrastive Learning with SimCLR\n", "\n", "* **Author:** Phillip Lippe\n", "* **License:** CC BY-SA\n", "* **Generated:** 2021-10-10T18:35:52.598167\n", "\n", "In this tutorial, we will take a closer look at self-supervised contrastive learning.\n", "Self-supervised learning, or also sometimes called unsupervised learning, describes the scenario where we have given input data, but no accompanying labels to train in a classical supervised way.\n", "However, this data still contains a lot of information from which we can learn: how are the images different from each other?\n", "What patterns are descriptive for certain images?\n", "Can we cluster the images?\n", "To get an insight into these questions, we will implement a popular, simple contrastive learning method, SimCLR, and apply it to the STL10 dataset.\n", "This notebook is part of a lecture series on Deep Learning at the University 
of Amsterdam.\n", "The full list of tutorials can be found at https://uvadlc-notebooks.rtfd.io.\n", "\n", "\n", "---\n", "Open in [![Open In Colab](){height=\"20px\" width=\"117px\"}](https://colab.research.google.com/github/PytorchLightning/lightning-tutorials/blob/publication/.notebooks/course_UvA-DL/13-contrastive-learning.ipynb)\n", "\n", "Give us a \u2b50 [on Github](https://www.github.com/PytorchLightning/pytorch-lightning/)\n", "| Check out [the documentation](https://pytorch-lightning.readthedocs.io/en/latest/)\n", "| Join us [on Slack](https://join.slack.com/t/pytorch-lightning/shared_invite/zt-pw5v393p-qRaDgEk24~EjiZNBpSQFgQ)"]}, {"cell_type": "markdown", "id": "c075e657", "metadata": {"papermill": {"duration": 0.028259, "end_time": "2021-10-10T16:38:20.837183", "exception": false, "start_time": "2021-10-10T16:38:20.808924", "status": "completed"}, "tags": []}, "source": ["## Setup\n", "This notebook requires some packages besides pytorch-lightning."]}, {"cell_type": "code", "execution_count": 1, "id": "132c3c36", "metadata": {"colab": {}, "colab_type": "code", "execution": {"iopub.execute_input": "2021-10-10T16:38:20.897899Z", "iopub.status.busy": "2021-10-10T16:38:20.897428Z", "iopub.status.idle": "2021-10-10T16:38:20.900024Z", "shell.execute_reply": "2021-10-10T16:38:20.899479Z"}, "id": "LfrJLKPFyhsK", "lines_to_next_cell": 0, "papermill": {"duration": 0.034648, "end_time": "2021-10-10T16:38:20.900141", "exception": false, "start_time": "2021-10-10T16:38:20.865493", "status": "completed"}, "tags": []}, "outputs": [], "source": ["# ! pip install --quiet \"torch>=1.6, <1.9\" \"matplotlib\" \"pytorch-lightning>=1.3\" \"seaborn\" \"torchvision\" \"torchmetrics>=0.3\""]}, {"cell_type": "markdown", "id": "15410d3c", "metadata": {"papermill": {"duration": 0.02886, "end_time": "2021-10-10T16:38:20.957863", "exception": false, "start_time": "2021-10-10T16:38:20.929003", "status": "completed"}, "tags": []}, "source": ["
\n", "Methods for self-supervised learning try to learn as much as possible from the data alone, so it can quickly be finetuned for a specific classification task.\n", "The benefit of self-supervised learning is that a large dataset can often easily be obtained.\n", "For instance, if we want to train a vision model on semantic segmentation for autonomous driving, we can collect large amounts of data by simply installing a camera in a car, and driving through a city for an hour.\n", "In contrast, if we would want to do supervised learning, we would have to manually label all those images before training a model.\n", "This is extremely expensive, and would likely take a couple of months to manually label the same amount of data.\n", "Further, self-supervised learning can provide an alternative to transfer learning from models pretrained on ImageNet since we could pretrain a model on a specific dataset/situation, e.g. traffic scenarios for autonomous driving.\n", "\n", "Within the last two years, a lot of new approaches have been proposed for self-supervised learning, in particular for images, that have resulted in great improvements over supervised models when few labels are available.\n", "The subfield that we will focus on in this tutorial is contrastive learning.\n", "Contrastive learning is motivated by the question mentioned above: how are images different from each other?\n", "Specifically, contrastive learning methods train a model to cluster an image and its slightly augmented version in latent space, while the distance to other images should be maximized.\n", "A very recent and simple method for this is [SimCLR](https://arxiv.org/abs/2006.10029), which is visualized below (figure credit - [Ting Chen et al. ](https://simclr.github.io/)).\n", "\n", "
![simclr contrastive learning](){width=\"500px\"}
\n", "\n", "The general setup is that we are given a dataset of images without any labels, and want to train a model on this data such that it can quickly adapt to any image recognition task afterward.\n", "During each training iteration, we sample a batch of images as usual.\n", "For each image, we create two versions by applying data augmentation techniques like cropping, Gaussian noise, blurring, etc.\n", "An example of such is shown on the left with the image of the dog.\n", "We will go into the details and effects of the chosen augmentation techniques later.\n", "On those images, we apply a CNN like ResNet and obtain as output a 1D feature vector on which we apply a small MLP.\n", "The output features of the two augmented images are then trained to be close to each other, while all other images in that batch should be as different as possible.\n", "This way, the model has to learn to recognize the content of the image that remains unchanged under the data augmentations, such as objects which we usually care about in supervised tasks.\n", "\n", "We will now implement this framework ourselves and discuss further details along the way.\n", "Let's first start with importing our standard libraries below:"]}, {"cell_type": "code", "execution_count": 2, "id": "e2627246", "metadata": {"execution": {"iopub.execute_input": "2021-10-10T16:38:21.024058Z", "iopub.status.busy": "2021-10-10T16:38:21.022126Z", "iopub.status.idle": "2021-10-10T16:38:22.765560Z", "shell.execute_reply": "2021-10-10T16:38:22.765143Z"}, "papermill": {"duration": 1.779594, "end_time": "2021-10-10T16:38:22.765675", "exception": false, "start_time": "2021-10-10T16:38:20.986081", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["/tmp/ipykernel_1189/3845858059.py:24: DeprecationWarning: `set_matplotlib_formats` is deprecated since IPython 7.23, directly use `matplotlib_inline.backend_inline.set_matplotlib_formats()`\n", " 
set_matplotlib_formats(\"svg\", \"pdf\") # For export\n", "Global seed set to 42\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Device: cuda:0\n", "Number of workers: 12\n"]}, {"data": {"text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}], "source": ["import os\n", "import urllib.request\n", "from copy import deepcopy\n", "from urllib.error import HTTPError\n", "\n", "import matplotlib\n", "import matplotlib.pyplot as plt\n", "import pytorch_lightning as pl\n", "import seaborn as sns\n", "import torch\n", "import torch.nn as nn\n", "import torch.nn.functional as F\n", "import torch.optim as optim\n", "import torch.utils.data as data\n", "import torchvision\n", "from IPython.display import set_matplotlib_formats\n", "from pytorch_lightning.callbacks import LearningRateMonitor, ModelCheckpoint\n", "from torchvision import transforms\n", "from torchvision.datasets import STL10\n", "from tqdm.notebook import tqdm\n", "\n", "plt.set_cmap(\"cividis\")\n", "# %matplotlib inline\n", "set_matplotlib_formats(\"svg\", \"pdf\") # For export\n", "matplotlib.rcParams[\"lines.linewidth\"] = 2.0\n", "sns.set()\n", "\n", "# Import tensorboard\n", "# %load_ext tensorboard\n", "\n", "# Path to the folder where the datasets are/should be downloaded (e.g. CIFAR10)\n", "DATASET_PATH = os.environ.get(\"PATH_DATASETS\", \"data/\")\n", "# Path to the folder where the pretrained models are saved\n", "CHECKPOINT_PATH = os.environ.get(\"PATH_CHECKPOINT\", \"saved_models/ContrastiveLearning/\")\n", "# In this notebook, we use data loaders with heavier computational processing. 
It is recommended to use as many\n", "# workers as possible in a data loader, which corresponds to the number of CPU cores\n", "NUM_WORKERS = os.cpu_count()\n", "\n", "# Setting the seed\n", "pl.seed_everything(42)\n", "\n", "# Ensure that all operations are deterministic on GPU (if used) for reproducibility\n", "torch.backends.cudnn.determinstic = True\n", "torch.backends.cudnn.benchmark = False\n", "\n", "device = torch.device(\"cuda:0\") if torch.cuda.is_available() else torch.device(\"cpu\")\n", "print(\"Device:\", device)\n", "print(\"Number of workers:\", NUM_WORKERS)"]}, {"cell_type": "markdown", "id": "ae59fd9f", "metadata": {"papermill": {"duration": 0.029754, "end_time": "2021-10-10T16:38:22.826902", "exception": false, "start_time": "2021-10-10T16:38:22.797148", "status": "completed"}, "tags": []}, "source": ["As in many tutorials before, we provide pre-trained models.\n", "Note that those models are slightly larger than normal (~100MB overall) since we use the default ResNet-18 architecture.\n", "If you are running this notebook locally, make sure to have sufficient disk space available."]}, {"cell_type": "code", "execution_count": 3, "id": "482bf0ff", "metadata": {"execution": {"iopub.execute_input": "2021-10-10T16:38:22.890766Z", "iopub.status.busy": "2021-10-10T16:38:22.887393Z", "iopub.status.idle": "2021-10-10T16:38:25.058940Z", "shell.execute_reply": "2021-10-10T16:38:25.058450Z"}, "papermill": {"duration": 2.20285, "end_time": "2021-10-10T16:38:25.059060", "exception": false, "start_time": "2021-10-10T16:38:22.856210", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Downloading https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial17/SimCLR.ckpt...\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Downloading https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial17/ResNet.ckpt...\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Downloading 
https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial17/tensorboards/SimCLR/events.out.tfevents.SimCLR...\n", "Downloading https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial17/tensorboards/classification/ResNet/events.out.tfevents.ResNet...\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Downloading https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial17/LogisticRegression_10.ckpt...\n", "Downloading https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial17/LogisticRegression_20.ckpt...\n", "Downloading https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial17/LogisticRegression_50.ckpt...\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Downloading https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial17/LogisticRegression_100.ckpt...\n", "Downloading https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial17/LogisticRegression_200.ckpt...\n", "Downloading https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial17/LogisticRegression_500.ckpt...\n"]}], "source": ["# Github URL where saved models are stored for this tutorial\n", "base_url = \"https://raw.githubusercontent.com/phlippe/saved_models/main/tutorial17/\"\n", "# Files to download\n", "pretrained_files = [\n", " \"SimCLR.ckpt\",\n", " \"ResNet.ckpt\",\n", " \"tensorboards/SimCLR/events.out.tfevents.SimCLR\",\n", " \"tensorboards/classification/ResNet/events.out.tfevents.ResNet\",\n", "]\n", "pretrained_files += [f\"LogisticRegression_{size}.ckpt\" for size in [10, 20, 50, 100, 200, 500]]\n", "# Create checkpoint path if it doesn't exist yet\n", "os.makedirs(CHECKPOINT_PATH, exist_ok=True)\n", "\n", "# For each file, check whether it already exists. 
If not, try downloading it.\n", "for file_name in pretrained_files:\n", " file_path = os.path.join(CHECKPOINT_PATH, file_name)\n", " if \"/\" in file_name:\n", " os.makedirs(file_path.rsplit(\"/\", 1)[0], exist_ok=True)\n", " if not os.path.isfile(file_path):\n", " file_url = base_url + file_name\n", " print(f\"Downloading {file_url}...\")\n", " try:\n", " urllib.request.urlretrieve(file_url, file_path)\n", " except HTTPError as e:\n", " print(\n", " \"Something went wrong. Please try to download the file from the GDrive folder, or contact the author with the full output including the following error:\\n\",\n", " e,\n", " )"]}, {"cell_type": "markdown", "id": "f7e66a12", "metadata": {"papermill": {"duration": 0.030275, "end_time": "2021-10-10T16:38:25.125477", "exception": false, "start_time": "2021-10-10T16:38:25.095202", "status": "completed"}, "tags": []}, "source": ["## SimCLR\n", "\n", "We will start our exploration of contrastive learning by discussing the effect of different data augmentation techniques, and how we can implement an efficient data loader for such.\n", "Next, we implement SimCLR with PyTorch Lightning, and finally train it on a large, unlabeled dataset."]}, {"cell_type": "markdown", "id": "f78a4c91", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.030063, "end_time": "2021-10-10T16:38:25.185749", "exception": false, "start_time": "2021-10-10T16:38:25.155686", "status": "completed"}, "tags": []}, "source": ["### Data Augmentation for Contrastive Learning\n", "\n", "To allow efficient training, we need to prepare the data loading such that we sample two different, random augmentations for each image in the batch.\n", "The easiest way to do this is by creating a transformation that, when being called, applies a set of data augmentations to an image twice.\n", "This is implemented in the class `ContrastiveTransformations` below:"]}, {"cell_type": "code", "execution_count": 4, "id": "c7868578", "metadata": {"execution": 
{"iopub.execute_input": "2021-10-10T16:38:25.253314Z", "iopub.status.busy": "2021-10-10T16:38:25.252845Z", "iopub.status.idle": "2021-10-10T16:38:25.254844Z", "shell.execute_reply": "2021-10-10T16:38:25.254446Z"}, "papermill": {"duration": 0.036682, "end_time": "2021-10-10T16:38:25.254947", "exception": false, "start_time": "2021-10-10T16:38:25.218265", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class ContrastiveTransformations:\n", " def __init__(self, base_transforms, n_views=2):\n", " self.base_transforms = base_transforms\n", " self.n_views = n_views\n", "\n", " def __call__(self, x):\n", " return [self.base_transforms(x) for i in range(self.n_views)]"]}, {"cell_type": "markdown", "id": "ebf730fc", "metadata": {"papermill": {"duration": 0.030955, "end_time": "2021-10-10T16:38:25.316735", "exception": false, "start_time": "2021-10-10T16:38:25.285780", "status": "completed"}, "tags": []}, "source": ["The contrastive learning framework can easily be extended to have more _positive_ examples by sampling more than two augmentations of the same image.\n", "However, the most efficient training is usually obtained by using only two.\n", "\n", "Next, we can look at the specific augmentations we want to apply.\n", "The choice of the data augmentation to use is the most crucial hyperparameter in SimCLR since it directly affects how the latent space is structured, and what patterns might be learned from the data.\n", "Let's first take a look at some of the most popular data augmentations (figure credit - [Ting Chen and Geoffrey Hinton](https://ai.googleblog.com/2020/04/advancing-self-supervised-and-semi.html)):\n", "\n", "
\n", "\n", "All of them can be used, but it turns out that two augmentations stand out in their importance: crop-and-resize, and color distortion.\n", "Interestingly, however, they only lead to strong performance if they have been used together as discussed by [Ting Chen et al.](https://arxiv.org/abs/2002.05709) in their SimCLR paper.\n", "When performing random cropping and resizing, we can distinguish between two situations: (a) cropped image A provides a local view of cropped image B, or (b) cropped images C and D show neighboring views of the same image (figure credit - [Ting Chen and Geoffrey Hinton](https://ai.googleblog.com/2020/04/advancing-self-supervised-and-semi.html)).\n", "\n", "
\n", "\n", "While situation (a) requires the model to learn some sort of scale invariance to make crops A and B similar in latent space, situation (b) is more challenging since the model needs to recognize an object beyond its limited view.\n", "However, without color distortion, there is a loophole that the model can exploit, namely that different crops of the same image usually look very similar in color space.\n", "Consider the picture of the dog above.\n", "Simply from the color of the fur and the green color tone of the background, you can reason that two patches belong to the same image without actually recognizing the dog in the picture.\n", "In this case, the model might end up focusing only on the color histograms of the images, and ignore other more generalizable features.\n", "If, however, we distort the colors in the two patches randomly and independently of each other, the model cannot rely on this simple feature anymore.\n", "Hence, by combining random cropping and color distortions, the model can only match two patches by learning generalizable representations.\n", "\n", "Overall, for our experiments, we apply a set of 5 transformations following the original SimCLR setup: random horizontal flip, crop-and-resize, color distortion, random grayscale, and gaussian blur.\n", "In comparison to the [original implementation](https://github.com/google-research/simclr), we reduce the effect of the color jitter slightly (0.5 instead of 0.8 for brightness, contrast, and saturation, and 0.1 instead of 0.2 for hue).\n", "In our experiments, this setting obtained better performance and was faster and more stable to train.\n", "If, for instance, the brightness scale highly varies in a dataset, the\n", "original settings can be more beneficial since the model can't rely on\n", "this information anymore to distinguish between images."]}, {"cell_type": "code", "execution_count": 5, "id": "cfb65837", "metadata": {"execution": {"iopub.execute_input": 
"2021-10-10T16:38:25.382410Z", "iopub.status.busy": "2021-10-10T16:38:25.381935Z", "iopub.status.idle": "2021-10-10T16:38:25.383969Z", "shell.execute_reply": "2021-10-10T16:38:25.383557Z"}, "papermill": {"duration": 0.036481, "end_time": "2021-10-10T16:38:25.384069", "exception": false, "start_time": "2021-10-10T16:38:25.347588", "status": "completed"}, "tags": []}, "outputs": [], "source": ["contrast_transforms = transforms.Compose(\n", " [\n", " transforms.RandomHorizontalFlip(),\n", " transforms.RandomResizedCrop(size=96),\n", " transforms.RandomApply([transforms.ColorJitter(brightness=0.5, contrast=0.5, saturation=0.5, hue=0.1)], p=0.8),\n", " transforms.RandomGrayscale(p=0.2),\n", " transforms.GaussianBlur(kernel_size=9),\n", " transforms.ToTensor(),\n", " transforms.Normalize((0.5,), (0.5,)),\n", " ]\n", ")"]}, {"cell_type": "markdown", "id": "64514ea2", "metadata": {"papermill": {"duration": 0.030802, "end_time": "2021-10-10T16:38:25.444902", "exception": false, "start_time": "2021-10-10T16:38:25.414100", "status": "completed"}, "tags": []}, "source": ["After discussing the data augmentation techniques, we can now focus on the dataset.\n", "In this tutorial, we will use the [STL10 dataset](https://cs.stanford.edu/~acoates/stl10/), which, similarly to CIFAR10, contains images of 10 classes: airplane, bird, car, cat, deer, dog, horse, monkey, ship, truck.\n", "However, the images have a higher resolution, namely $96\\times 96$ pixels, and we are only provided with 500 labeled images per class.\n", "Additionally, we have a much larger set of $100,000$ unlabeled images which are similar to the training images but are sampled from a wider range of animals and vehicles.\n", "This makes the dataset ideal to showcase the benefits that self-supervised learning offers.\n", "\n", "Luckily, the STL10 dataset is provided through torchvision.\n", "Keep in mind, however, that since this dataset is relatively large and has a considerably higher resolution than CIFAR10, it 
requires more disk space (~3GB) and takes a bit of time to download.\n", "For our initial discussion of self-supervised learning and SimCLR, we\n", "will create two data loaders with our contrastive transformations above:\n", "the `unlabeled_data` will be used to train our model via contrastive\n", "learning, and `train_data_contrast` will be used as a validation set in\n", "contrastive learning."]}, {"cell_type": "code", "execution_count": 6, "id": "5893d109", "metadata": {"execution": {"iopub.execute_input": "2021-10-10T16:38:25.510013Z", "iopub.status.busy": "2021-10-10T16:38:25.509537Z", "iopub.status.idle": "2021-10-10T16:41:52.516922Z", "shell.execute_reply": "2021-10-10T16:41:52.517324Z"}, "papermill": {"duration": 207.042247, "end_time": "2021-10-10T16:41:52.517484", "exception": false, "start_time": "2021-10-10T16:38:25.475237", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Downloading http://ai.stanford.edu/~acoates/stl10/stl10_binary.tar.gz to /__w/1/s/.datasets/stl10_binary.tar.gz\n"]}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "c111f74da90d4a8f831df4733df12b94", "version_major": 2, "version_minor": 0}, "text/plain": [" 0%| | 0/2640397119 [00:00\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-10-10T18:41:53.106628\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}], "source": ["# Visualize some examples\n", "pl.seed_everything(42)\n", "NUM_IMAGES = 6\n", "imgs = torch.stack([img for idx in range(NUM_IMAGES) for img in unlabeled_data[idx][0]], dim=0)\n", "img_grid = torchvision.utils.make_grid(imgs, nrow=6, normalize=True, pad_value=0.9)\n", "img_grid = img_grid.permute(1, 2, 0)\n", "\n", "plt.figure(figsize=(10, 5))\n", "plt.title(\"Augmented image examples of the STL10 dataset\")\n", "plt.imshow(img_grid)\n", "plt.axis(\"off\")\n", "plt.show()\n", "plt.close()"]}, {"cell_type": "markdown", "id": "d9b44c08", "metadata": {"papermill": {"duration": 0.079471, "end_time": "2021-10-10T16:41:53.515584", "exception": false, "start_time": "2021-10-10T16:41:53.436113", "status": "completed"}, "tags": []}, "source": ["We see the wide variety of our data augmentation, including random cropping, grayscaling, gaussian blur, and color distortion.\n", "Thus, it remains a challenging task for the model to match two independently augmented patches of the same image."]}, {"cell_type": "markdown", "id": "525c3967", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.047654, "end_time": "2021-10-10T16:41:53.615813", "exception": false, "start_time": "2021-10-10T16:41:53.568159", "status": "completed"}, "tags": []}, "source": ["### SimCLR implementation\n", "\n", "Using the data loader pipeline above, we can now implement SimCLR.\n", "At each iteration, we get for every image $x$ two differently augmented versions, which we refer to as $\\tilde{x}_i$ and $\\tilde{x}_j$.\n", "Both of these images are encoded into a one-dimensional feature vector, and we want to maximize the similarity between the two while minimizing it to all other images in the batch.\n", "The encoder network is split into two parts: a base encoder network $f(\\cdot)$, and a projection head $g(\\cdot)$.\n", "The base network is usually a deep CNN as we have seen in e.g. 
[Tutorial 5](https://uvadlc-notebooks.readthedocs.io/en/latest/tutorial_notebooks/tutorial5/Inception_ResNet_DenseNet.html) before, and is responsible for extracting a representation vector from the augmented data examples.\n", "In our experiments, we will use the common ResNet-18 architecture as $f(\\cdot)$, and refer to the output as $f(\\tilde{x}_i)=h_i$.\n", "The projection head $g(\\cdot)$ maps the representation $h$ into a space where we apply the contrastive loss, i.e., compare similarities between vectors.\n", "It is often chosen to be a small MLP with non-linearities, and for simplicity, we follow the original SimCLR paper setup by defining it as a two-layer MLP with ReLU activation in the hidden layer.\n", "Note that in the follow-up paper, [SimCLRv2](https://arxiv.org/abs/2006.10029), the authors mention that larger/wider MLPs can boost the performance considerably.\n", "This is why we apply an MLP with four times larger hidden dimensions, but deeper MLPs were found to overfit on the given dataset.\n", "The general setup is visualized below (figure credit - [Ting Chen et al. ](https://arxiv.org/abs/2006.10029)):\n", "\n", "
\n", "\n", "After finishing the training with contrastive learning, we will remove the projection head $g(\\cdot)$, and use $f(\\cdot)$ as a pretrained feature extractor.\n", "The representations $z$ that come out of the projection head $g(\\cdot)$ have been shown to perform worse than those of the base network $f(\\cdot)$ when finetuning the network for a new task.\n", "This is likely because the representations $z$ are trained to become invariant to many features like the color that can be important for downstream tasks.\n", "Thus, $g(\\cdot)$ is only needed for the contrastive learning stage.\n", "\n", "Now that the architecture is described, let's take a closer look at how we train the model.\n", "As mentioned before, we want to maximize the similarity between the representations of the two augmented versions of the same image, i.e., $z_i$ and $z_j$ in the figure above, while minimizing it to all other examples in the batch.\n", "SimCLR thereby applies the InfoNCE loss, originally proposed by [Aaron van den Oord et al. 
](https://arxiv.org/abs/1807.03748) for contrastive learning.\n", "In short, the InfoNCE loss compares the similarity of $z_i$ and $z_j$ to the similarity of $z_i$ to any other representation in the batch by performing a softmax over the similarity values.\n", "The loss can be formally written as:\n", "$$\n", "\\ell_{i,j}=-\\log \\frac{\\exp(\\text{sim}(z_i,z_j)/\\tau)}{\\sum_{k=1}^{2N}\\mathbb{1}_{[k\\neq i]}\\exp(\\text{sim}(z_i,z_k)/\\tau)}=-\\text{sim}(z_i,z_j)/\\tau+\\log\\left[\\sum_{k=1}^{2N}\\mathbb{1}_{[k\\neq i]}\\exp(\\text{sim}(z_i,z_k)/\\tau)\\right]\n", "$$\n", "The function $\\text{sim}$ is a similarity metric, and the hyperparameter $\\tau$ is called temperature determining how peaked the distribution is.\n", "Since many similarity metrics are bounded, the temperature parameter allows us to balance the influence of many dissimilar image patches versus one similar patch.\n", "The similarity metric that is used in SimCLR is cosine similarity, as defined below:\n", "$$\n", "\\text{sim}(z_i,z_j) = \\frac{z_i^\\top \\cdot z_j}{||z_i||\\cdot||z_j||}\n", "$$\n", "The maximum cosine similarity possible is $1$, while the minimum is $-1$.\n", "In general, we will see that the features of two different images will converge to a cosine similarity around zero since the minimum, $-1$, would require $z_i$ and $z_j$ to be in the exact opposite direction in all feature dimensions, which does not allow for great flexibility.\n", "\n", "Finally, now that we have discussed all details, let's implement SimCLR below as a PyTorch Lightning module:"]}, {"cell_type": "code", "execution_count": 8, "id": "a94c063a", "metadata": {"execution": {"iopub.execute_input": "2021-10-10T16:41:53.767396Z", "iopub.status.busy": "2021-10-10T16:41:53.764007Z", "iopub.status.idle": "2021-10-10T16:41:53.769425Z", "shell.execute_reply": "2021-10-10T16:41:53.769027Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 0.09737, "end_time": "2021-10-10T16:41:53.769531", "exception": false, 
"start_time": "2021-10-10T16:41:53.672161", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class SimCLR(pl.LightningModule):\n", " def __init__(self, hidden_dim, lr, temperature, weight_decay, max_epochs=500):\n", " super().__init__()\n", " self.save_hyperparameters()\n", " assert self.hparams.temperature > 0.0, \"The temperature must be a positive float!\"\n", " # Base model f(.)\n", " self.convnet = torchvision.models.resnet18(\n", " pretrained=False, num_classes=4 * hidden_dim\n", " ) # num_classes is the output size of the last linear layer\n", " # The MLP for g(.) consists of Linear->ReLU->Linear\n", " self.convnet.fc = nn.Sequential(\n", " self.convnet.fc, # Linear(ResNet output, 4*hidden_dim)\n", " nn.ReLU(inplace=True),\n", " nn.Linear(4 * hidden_dim, hidden_dim),\n", " )\n", "\n", " def configure_optimizers(self):\n", " optimizer = optim.AdamW(self.parameters(), lr=self.hparams.lr, weight_decay=self.hparams.weight_decay)\n", " lr_scheduler = optim.lr_scheduler.CosineAnnealingLR(\n", " optimizer, T_max=self.hparams.max_epochs, eta_min=self.hparams.lr / 50\n", " )\n", " return [optimizer], [lr_scheduler]\n", "\n", " def info_nce_loss(self, batch, mode=\"train\"):\n", " imgs, _ = batch\n", " imgs = torch.cat(imgs, dim=0)\n", "\n", " # Encode all images\n", " feats = self.convnet(imgs)\n", " # Calculate cosine similarity\n", " cos_sim = F.cosine_similarity(feats[:, None, :], feats[None, :, :], dim=-1)\n", " # Mask out cosine similarity to itself\n", " self_mask = torch.eye(cos_sim.shape[0], dtype=torch.bool, device=cos_sim.device)\n", " cos_sim.masked_fill_(self_mask, -9e15)\n", " # Find positive example -> batch_size//2 away from the original example\n", " pos_mask = self_mask.roll(shifts=cos_sim.shape[0] // 2, dims=0)\n", " # InfoNCE loss\n", " cos_sim = cos_sim / self.hparams.temperature\n", " nll = -cos_sim[pos_mask] + torch.logsumexp(cos_sim, dim=-1)\n", " nll = nll.mean()\n", "\n", " # Logging loss\n", " self.log(mode + \"_loss\", 
nll)\n", " # Get ranking position of positive example\n", " comb_sim = torch.cat(\n", " [cos_sim[pos_mask][:, None], cos_sim.masked_fill(pos_mask, -9e15)], # First position positive example\n", " dim=-1,\n", " )\n", " sim_argsort = comb_sim.argsort(dim=-1, descending=True).argmin(dim=-1)\n", " # Logging ranking metrics\n", " self.log(mode + \"_acc_top1\", (sim_argsort == 0).float().mean())\n", " self.log(mode + \"_acc_top5\", (sim_argsort < 5).float().mean())\n", " self.log(mode + \"_acc_mean_pos\", 1 + sim_argsort.float().mean())\n", "\n", " return nll\n", "\n", " def training_step(self, batch, batch_idx):\n", " return self.info_nce_loss(batch, mode=\"train\")\n", "\n", " def validation_step(self, batch, batch_idx):\n", " self.info_nce_loss(batch, mode=\"val\")"]}, {"cell_type": "markdown", "id": "5930dd21", "metadata": {"papermill": {"duration": 0.339364, "end_time": "2021-10-10T16:41:54.219681", "exception": false, "start_time": "2021-10-10T16:41:53.880317", "status": "completed"}, "tags": []}, "source": ["Alternatively to performing the validation on the contrastive learning loss as well, we could also take a simple, small downstream task, and track the performance of the base network $f(\\cdot)$ on that.\n", "However, in this tutorial, we will restrict ourselves to the STL10\n", "dataset where we use the task of image classification on STL10 as our\n", "test task."]}, {"cell_type": "markdown", "id": "371aa9b6", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.041653, "end_time": "2021-10-10T16:41:54.360538", "exception": false, "start_time": "2021-10-10T16:41:54.318885", "status": "completed"}, "tags": []}, "source": ["### Training\n", "\n", "Now that we have implemented SimCLR and the data loading pipeline, we are ready to train the model.\n", "We will use the same training function setup as usual.\n", "For saving the best model checkpoint, we track the metric `val_acc_top5`, which describes how often the correct image patch is within the 
top-5 most similar examples in the batch.\n", "This is usually less noisy than the top-1 metric, making it a better metric to choose the best model from."]}, {"cell_type": "code", "execution_count": 9, "id": "7ae8797a", "metadata": {"execution": {"iopub.execute_input": "2021-10-10T16:41:54.466376Z", "iopub.status.busy": "2021-10-10T16:41:54.465889Z", "iopub.status.idle": "2021-10-10T16:41:54.467539Z", "shell.execute_reply": "2021-10-10T16:41:54.467915Z"}, "papermill": {"duration": 0.056039, "end_time": "2021-10-10T16:41:54.468066", "exception": false, "start_time": "2021-10-10T16:41:54.412027", "status": "completed"}, "tags": []}, "outputs": [], "source": ["def train_simclr(batch_size, max_epochs=500, **kwargs):\n", " trainer = pl.Trainer(\n", " default_root_dir=os.path.join(CHECKPOINT_PATH, \"SimCLR\"),\n", " gpus=1 if str(device) == \"cuda:0\" else 0,\n", " max_epochs=max_epochs,\n", " callbacks=[\n", " ModelCheckpoint(save_weights_only=True, mode=\"max\", monitor=\"val_acc_top5\"),\n", " LearningRateMonitor(\"epoch\"),\n", " ],\n", " progress_bar_refresh_rate=1,\n", " )\n", " trainer.logger._default_hp_metric = None # Optional logging argument that we don't need\n", "\n", " # Check whether pretrained model exists. 
If yes, load it and skip training\n", " pretrained_filename = os.path.join(CHECKPOINT_PATH, \"SimCLR.ckpt\")\n", " if os.path.isfile(pretrained_filename):\n", " print(f\"Found pretrained model at {pretrained_filename}, loading...\")\n", " # Automatically loads the model with the saved hyperparameters\n", " model = SimCLR.load_from_checkpoint(pretrained_filename)\n", " else:\n", " train_loader = data.DataLoader(\n", " unlabeled_data,\n", " batch_size=batch_size,\n", " shuffle=True,\n", " drop_last=True,\n", " pin_memory=True,\n", " num_workers=NUM_WORKERS,\n", " )\n", " val_loader = data.DataLoader(\n", " train_data_contrast,\n", " batch_size=batch_size,\n", " shuffle=False,\n", " drop_last=False,\n", " pin_memory=True,\n", " num_workers=NUM_WORKERS,\n", " )\n", " pl.seed_everything(42) # To be reproducable\n", " model = SimCLR(max_epochs=max_epochs, **kwargs)\n", " trainer.fit(model, train_loader, val_loader)\n", " # Load best checkpoint after training\n", " model = SimCLR.load_from_checkpoint(trainer.checkpoint_callback.best_model_path)\n", "\n", " return model"]}, {"cell_type": "markdown", "id": "30619702", "metadata": {"papermill": {"duration": 0.043291, "end_time": "2021-10-10T16:41:54.559443", "exception": false, "start_time": "2021-10-10T16:41:54.516152", "status": "completed"}, "tags": []}, "source": ["A common observation in contrastive learning is that the larger the batch size, the better the models perform.\n", "A larger batch size allows us to compare each image to more negative examples, leading to overall smoother loss gradients.\n", "However, in our case, we experienced that a batch size of 256 was sufficient to get good results."]}, {"cell_type": "code", "execution_count": 10, "id": "204e88a8", "metadata": {"execution": {"iopub.execute_input": "2021-10-10T16:41:54.726388Z", "iopub.status.busy": "2021-10-10T16:41:54.725918Z", "iopub.status.idle": "2021-10-10T16:41:54.977674Z", "shell.execute_reply": "2021-10-10T16:41:54.977166Z"}, "papermill": 
{"duration": 0.357848, "end_time": "2021-10-10T16:41:54.977825", "exception": false, "start_time": "2021-10-10T16:41:54.619977", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["GPU available: True, used: True\n"]}, {"name": "stderr", "output_type": "stream", "text": ["TPU available: False, using: 0 TPU cores\n"]}, {"name": "stderr", "output_type": "stream", "text": ["IPU available: False, using: 0 IPUs\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Found pretrained model at saved_models/ContrastiveLearning/SimCLR.ckpt, loading...\n"]}], "source": ["simclr_model = train_simclr(\n", " batch_size=256, hidden_dim=128, lr=5e-4, temperature=0.07, weight_decay=1e-4, max_epochs=500\n", ")"]}, {"cell_type": "markdown", "id": "6e791b30", "metadata": {"papermill": {"duration": 0.041235, "end_time": "2021-10-10T16:41:55.168558", "exception": false, "start_time": "2021-10-10T16:41:55.127323", "status": "completed"}, "tags": []}, "source": ["To get an intuition of how training with contrastive learning behaves, we can take a look at the TensorBoard below:"]}, {"cell_type": "code", "execution_count": 11, "id": "4faca6fd", "metadata": {"execution": {"iopub.execute_input": "2021-10-10T16:41:55.269774Z", "iopub.status.busy": "2021-10-10T16:41:55.269307Z", "iopub.status.idle": "2021-10-10T16:41:55.271319Z", "shell.execute_reply": "2021-10-10T16:41:55.270919Z"}, "papermill": {"duration": 0.045346, "end_time": "2021-10-10T16:41:55.271426", "exception": false, "start_time": "2021-10-10T16:41:55.226080", "status": "completed"}, "tags": []}, "outputs": [], "source": ["# %tensorboard --logdir ../saved_models/tutorial17/tensorboards/SimCLR/"]}, {"cell_type": "markdown", "id": "6defaecc", "metadata": {"papermill": {"duration": 0.040274, "end_time": "2021-10-10T16:41:55.366743", "exception": false, "start_time": "2021-10-10T16:41:55.326469", "status": "completed"}, "tags": []}, "source": ["
![tensorboard simclr](){width=\"1200px\"}
\n", "\n", "One thing to note is that contrastive learning benefits a lot from long training.\n", "The plot shown above is from a training run that took approx.\n", "1 day on an NVIDIA TitanRTX.\n", "Training the model for even longer might reduce its loss further, but we did not observe any gains from it for the downstream task on image classification.\n", "In general, contrastive learning can also benefit from using larger models, if sufficient unlabeled data is available."]}, {"cell_type": "markdown", "id": "aaab8b66", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.110092, "end_time": "2021-10-10T16:41:55.567176", "exception": false, "start_time": "2021-10-10T16:41:55.457084", "status": "completed"}, "tags": []}, "source": ["## Logistic Regression\n", "\n", "
\n", "After we have trained our model via contrastive learning, we can deploy it on downstream tasks and see how well it performs with little data.\n", "A common setup, which also verifies whether the model has learned generalized representations, is to perform Logistic Regression on the features.\n", "In other words, we learn a single, linear layer that maps the representations to a class prediction.\n", "Since the base network $f(\\cdot)$ is not changed during the training process, the model can only perform well if the representations of $h$ describe all features that might be necessary for the task.\n", "Further, we do not have to worry too much about overfitting since we have very few parameters that are trained.\n", "Hence, we might expect that the model can perform well even with very little data.\n", "\n", "First, let's implement a simple Logistic Regression setup for which we assume that the images already have been encoded in their feature vectors.\n", "If very little data is available, it might be beneficial to dynamically encode the images during training so that we can also apply data augmentations.\n", "However, the way we implement it here is much more efficient and can be trained within a few seconds.\n", "Further, using data augmentations did not show any significant gain in this simple setup."]}, {"cell_type": "code", "execution_count": 12, "id": "6745071e", "metadata": {"execution": {"iopub.execute_input": "2021-10-10T16:41:55.788482Z", "iopub.status.busy": "2021-10-10T16:41:55.788000Z", "iopub.status.idle": "2021-10-10T16:41:55.789951Z", "shell.execute_reply": "2021-10-10T16:41:55.789550Z"}, "papermill": {"duration": 0.117728, "end_time": "2021-10-10T16:41:55.790056", "exception": false, "start_time": "2021-10-10T16:41:55.672328", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class LogisticRegression(pl.LightningModule):\n", " def __init__(self, feature_dim, num_classes, lr, weight_decay, max_epochs=100):\n", " 
super().__init__()\n", " self.save_hyperparameters()\n", " # Mapping from representation h to classes\n", " self.model = nn.Linear(feature_dim, num_classes)\n", "\n", " def configure_optimizers(self):\n", " optimizer = optim.AdamW(self.parameters(), lr=self.hparams.lr, weight_decay=self.hparams.weight_decay)\n", " lr_scheduler = optim.lr_scheduler.MultiStepLR(\n", " optimizer, milestones=[int(self.hparams.max_epochs * 0.6), int(self.hparams.max_epochs * 0.8)], gamma=0.1\n", " )\n", " return [optimizer], [lr_scheduler]\n", "\n", " def _calculate_loss(self, batch, mode=\"train\"):\n", " feats, labels = batch\n", " preds = self.model(feats)\n", " loss = F.cross_entropy(preds, labels)\n", " acc = (preds.argmax(dim=-1) == labels).float().mean()\n", "\n", " self.log(mode + \"_loss\", loss)\n", " self.log(mode + \"_acc\", acc)\n", " return loss\n", "\n", " def training_step(self, batch, batch_idx):\n", " return self._calculate_loss(batch, mode=\"train\")\n", "\n", " def validation_step(self, batch, batch_idx):\n", " self._calculate_loss(batch, mode=\"val\")\n", "\n", " def test_step(self, batch, batch_idx):\n", " self._calculate_loss(batch, mode=\"test\")"]}, {"cell_type": "markdown", "id": "55495b0b", "metadata": {"papermill": {"duration": 0.040786, "end_time": "2021-10-10T16:41:56.009838", "exception": false, "start_time": "2021-10-10T16:41:55.969052", "status": "completed"}, "tags": []}, "source": ["The data we use is the training and test set of STL10.\n", "The training contains 500 images per class, while the test set has 800 images per class."]}, {"cell_type": "code", "execution_count": 13, "id": "eeca05e6", "metadata": {"execution": {"iopub.execute_input": "2021-10-10T16:41:56.197171Z", "iopub.status.busy": "2021-10-10T16:41:56.196690Z", "iopub.status.idle": "2021-10-10T16:42:07.538122Z", "shell.execute_reply": "2021-10-10T16:42:07.537640Z"}, "papermill": {"duration": 11.449982, "end_time": "2021-10-10T16:42:07.538239", "exception": false, "start_time": 
"2021-10-10T16:41:56.088257", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Files already downloaded and verified\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Files already downloaded and verified\n", "Number of training examples: 5000\n", "Number of test examples: 8000\n"]}], "source": ["img_transforms = transforms.Compose([transforms.ToTensor(), transforms.Normalize((0.5,), (0.5,))])\n", "\n", "train_img_data = STL10(root=DATASET_PATH, split=\"train\", download=True, transform=img_transforms)\n", "test_img_data = STL10(root=DATASET_PATH, split=\"test\", download=True, transform=img_transforms)\n", "\n", "print(\"Number of training examples:\", len(train_img_data))\n", "print(\"Number of test examples:\", len(test_img_data))"]}, {"cell_type": "markdown", "id": "88ebb27b", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.066846, "end_time": "2021-10-10T16:42:07.663036", "exception": false, "start_time": "2021-10-10T16:42:07.596190", "status": "completed"}, "tags": []}, "source": ["Next, we implement a small function to encode all images in our datasets.\n", "The output representations are then used as inputs to the Logistic Regression model."]}, {"cell_type": "code", "execution_count": 14, "id": "08b87e56", "metadata": {"execution": {"iopub.execute_input": "2021-10-10T16:42:07.810979Z", "iopub.status.busy": "2021-10-10T16:42:07.810493Z", "iopub.status.idle": "2021-10-10T16:42:07.812587Z", "shell.execute_reply": "2021-10-10T16:42:07.812116Z"}, "papermill": {"duration": 0.049258, "end_time": "2021-10-10T16:42:07.812757", "exception": false, "start_time": "2021-10-10T16:42:07.763499", "status": "completed"}, "tags": []}, "outputs": [], "source": ["@torch.no_grad()\n", "def prepare_data_features(model, dataset):\n", " # Prepare model\n", " network = deepcopy(model.convnet)\n", " network.fc = nn.Identity() # Removing projection head g(.)\n", " network.eval()\n", " 
network.to(device)\n", "\n", " # Encode all images\n", " data_loader = data.DataLoader(dataset, batch_size=64, num_workers=NUM_WORKERS, shuffle=False, drop_last=False)\n", " feats, labels = [], []\n", " for batch_imgs, batch_labels in tqdm(data_loader):\n", " batch_imgs = batch_imgs.to(device)\n", " batch_feats = network(batch_imgs)\n", " feats.append(batch_feats.detach().cpu())\n", " labels.append(batch_labels)\n", "\n", " feats = torch.cat(feats, dim=0)\n", " labels = torch.cat(labels, dim=0)\n", "\n", " # Sort images by labels\n", " labels, idxs = labels.sort()\n", " feats = feats[idxs]\n", "\n", " return data.TensorDataset(feats, labels)"]}, {"cell_type": "markdown", "id": "f1e62cc6", "metadata": {"papermill": {"duration": 0.10389, "end_time": "2021-10-10T16:42:08.012147", "exception": false, "start_time": "2021-10-10T16:42:07.908257", "status": "completed"}, "tags": []}, "source": ["Let's apply the function to both training and test set below."]}, {"cell_type": "code", "execution_count": 15, "id": "274643eb", "metadata": {"execution": {"iopub.execute_input": "2021-10-10T16:42:08.330518Z", "iopub.status.busy": "2021-10-10T16:42:08.330044Z", "iopub.status.idle": "2021-10-10T16:42:14.259714Z", "shell.execute_reply": "2021-10-10T16:42:14.260561Z"}, "papermill": {"duration": 5.994866, "end_time": "2021-10-10T16:42:14.260713", "exception": false, "start_time": "2021-10-10T16:42:08.265847", "status": "completed"}, "tags": []}, "outputs": [{"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "32cad3ea3e3644baaa844883a715a613", "version_major": 2, "version_minor": 0}, "text/plain": [" 0%| | 0/79 [00:00\n", "\n", "\n", " \n", " \n", " \n", " \n", " 2021-10-10T18:42:16.456325\n", " image/svg+xml\n", " \n", " \n", " Matplotlib v3.4.3, https://matplotlib.org/\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "\n"], "text/plain": ["
"]}, "metadata": {}, "output_type": "display_data"}, {"name": "stdout", "output_type": "stream", "text": ["Test accuracy for 10 images per label: 62.79%\n", "Test accuracy for 20 images per label: 68.60%\n", "Test accuracy for 50 images per label: 74.44%\n", "Test accuracy for 100 images per label: 77.20%\n", "Test accuracy for 200 images per label: 79.06%\n", "Test accuracy for 500 images per label: 81.33%\n"]}], "source": ["dataset_sizes = sorted(k for k in results)\n", "test_scores = [results[k][\"test\"] for k in dataset_sizes]\n", "\n", "fig = plt.figure(figsize=(6, 4))\n", "plt.plot(\n", " dataset_sizes,\n", " test_scores,\n", " \"--\",\n", " color=\"#000\",\n", " marker=\"*\",\n", " markeredgecolor=\"#000\",\n", " markerfacecolor=\"y\",\n", " markersize=16,\n", ")\n", "plt.xscale(\"log\")\n", "plt.xticks(dataset_sizes, labels=dataset_sizes)\n", "plt.title(\"STL10 classification over dataset size\", fontsize=14)\n", "plt.xlabel(\"Number of images per class\")\n", "plt.ylabel(\"Test accuracy\")\n", "plt.minorticks_off()\n", "plt.show()\n", "\n", "for k, score in zip(dataset_sizes, test_scores):\n", " print(f\"Test accuracy for {k:3d} images per label: {100*score:4.2f}%\")"]}, {"cell_type": "markdown", "id": "e6cb0f66", "metadata": {"papermill": {"duration": 0.049197, "end_time": "2021-10-10T16:42:16.746998", "exception": false, "start_time": "2021-10-10T16:42:16.697801", "status": "completed"}, "tags": []}, "source": ["As one would expect, the classification performance improves the more data we have.\n", "However, with only 10 images per class, we can already classify more than 60% of the images correctly.\n", "This is quite impressive, considering that the images are also higher dimensional than e.g. 
CIFAR10.\n", "With the full dataset, we achieve an accuracy of 81%.\n", "The increase between 50 to 500 images per class might suggest a linear increase in performance with an exponentially larger dataset.\n", "However, with even more data, we could also finetune $f(\\cdot)$ in the training process, allowing for the representations to adapt more to the specific classification task given.\n", "\n", "To set the results above into perspective, we will train the base\n", "network, a ResNet-18, on the classification task from scratch."]}, {"cell_type": "markdown", "id": "237fe863", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.048695, "end_time": "2021-10-10T16:42:16.844984", "exception": false, "start_time": "2021-10-10T16:42:16.796289", "status": "completed"}, "tags": []}, "source": ["## Baseline\n", "\n", "As a baseline to our results above, we will train a standard ResNet-18 with random initialization on the labeled training set of STL10.\n", "The results will give us an indication of the advantages that contrastive learning on unlabeled data has compared to using only supervised training.\n", "The implementation of the model is straightforward since the ResNet\n", "architecture is provided in the torchvision library."]}, {"cell_type": "code", "execution_count": 20, "id": "201725a2", "metadata": {"execution": {"iopub.execute_input": "2021-10-10T16:42:16.952607Z", "iopub.status.busy": "2021-10-10T16:42:16.952127Z", "iopub.status.idle": "2021-10-10T16:42:16.954345Z", "shell.execute_reply": "2021-10-10T16:42:16.953881Z"}, "papermill": {"duration": 0.059107, "end_time": "2021-10-10T16:42:16.954448", "exception": false, "start_time": "2021-10-10T16:42:16.895341", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class ResNet(pl.LightningModule):\n", " def __init__(self, num_classes, lr, weight_decay, max_epochs=100):\n", " super().__init__()\n", " self.save_hyperparameters()\n", " self.model = 
torchvision.models.resnet18(pretrained=False, num_classes=num_classes)\n", "\n", " def configure_optimizers(self):\n", " optimizer = optim.AdamW(self.parameters(), lr=self.hparams.lr, weight_decay=self.hparams.weight_decay)\n", " lr_scheduler = optim.lr_scheduler.MultiStepLR(\n", " optimizer, milestones=[int(self.hparams.max_epochs * 0.7), int(self.hparams.max_epochs * 0.9)], gamma=0.1\n", " )\n", " return [optimizer], [lr_scheduler]\n", "\n", " def _calculate_loss(self, batch, mode=\"train\"):\n", " imgs, labels = batch\n", " preds = self.model(imgs)\n", " loss = F.cross_entropy(preds, labels)\n", " acc = (preds.argmax(dim=-1) == labels).float().mean()\n", "\n", " self.log(mode + \"_loss\", loss)\n", " self.log(mode + \"_acc\", acc)\n", " return loss\n", "\n", " def training_step(self, batch, batch_idx):\n", " return self._calculate_loss(batch, mode=\"train\")\n", "\n", " def validation_step(self, batch, batch_idx):\n", " self._calculate_loss(batch, mode=\"val\")\n", "\n", " def test_step(self, batch, batch_idx):\n", " self._calculate_loss(batch, mode=\"test\")"]}, {"cell_type": "markdown", "id": "e6fe14f2", "metadata": {"papermill": {"duration": 0.049585, "end_time": "2021-10-10T16:42:17.052720", "exception": false, "start_time": "2021-10-10T16:42:17.003135", "status": "completed"}, "tags": []}, "source": ["It is clear that the ResNet easily overfits on the training data since its parameter count is more than 1000 times larger than the dataset size.\n", "To make the comparison to the contrastive learning models fair, we apply data augmentations similar to the ones we used before: horizontal flip, crop-and-resize, grayscale, and gaussian blur.\n", "Color distortions as before are not used because the color distribution of an image showed to be an important feature for the classification.\n", "Hence, we observed no noticeable performance gains when adding color distortions to the set of augmentations.\n", "Similarly, we restrict the resizing operation before 
cropping to at most\n", "125% of its original resolution, instead of 1250% as done in SimCLR.\n", "This is because, for classification, the model needs to recognize the full object, while in contrastive learning, we only want to check whether two patches belong to the same image/object.\n", "Hence, the chosen augmentations below are overall weaker than in the contrastive learning case."]}, {"cell_type": "code", "execution_count": 21, "id": "3c7c2020", "metadata": {"execution": {"iopub.execute_input": "2021-10-10T16:42:17.163394Z", "iopub.status.busy": "2021-10-10T16:42:17.162926Z", "iopub.status.idle": "2021-10-10T16:42:22.652111Z", "shell.execute_reply": "2021-10-10T16:42:22.652505Z"}, "papermill": {"duration": 5.551414, "end_time": "2021-10-10T16:42:22.652657", "exception": false, "start_time": "2021-10-10T16:42:17.101243", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Files already downloaded and verified\n"]}], "source": ["train_transforms = transforms.Compose(\n", " [\n", " transforms.RandomHorizontalFlip(),\n", " transforms.RandomResizedCrop(size=96, scale=(0.8, 1.0)),\n", " transforms.RandomGrayscale(p=0.2),\n", " transforms.GaussianBlur(kernel_size=9, sigma=(0.1, 0.5)),\n", " transforms.ToTensor(),\n", " transforms.Normalize((0.5,), (0.5,)),\n", " ]\n", ")\n", "\n", "train_img_aug_data = STL10(root=DATASET_PATH, split=\"train\", download=True, transform=train_transforms)"]}, {"cell_type": "markdown", "id": "318c1f64", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.053189, "end_time": "2021-10-10T16:42:22.755918", "exception": false, "start_time": "2021-10-10T16:42:22.702729", "status": "completed"}, "tags": []}, "source": ["The training function for the ResNet is almost identical to the Logistic Regression setup.\n", "Note that we allow the ResNet to perform validation every 2 epochs to\n", "also check whether the model overfits strongly in the first iterations\n", "or not."]}, 
{"cell_type": "code", "execution_count": 22, "id": "9f4db9de", "metadata": {"execution": {"iopub.execute_input": "2021-10-10T16:42:22.863515Z", "iopub.status.busy": "2021-10-10T16:42:22.862996Z", "iopub.status.idle": "2021-10-10T16:42:22.865112Z", "shell.execute_reply": "2021-10-10T16:42:22.864714Z"}, "papermill": {"duration": 0.059991, "end_time": "2021-10-10T16:42:22.865213", "exception": false, "start_time": "2021-10-10T16:42:22.805222", "status": "completed"}, "tags": []}, "outputs": [], "source": ["def train_resnet(batch_size, max_epochs=100, **kwargs):\n", " trainer = pl.Trainer(\n", " default_root_dir=os.path.join(CHECKPOINT_PATH, \"ResNet\"),\n", " gpus=1 if str(device) == \"cuda:0\" else 0,\n", " max_epochs=max_epochs,\n", " callbacks=[\n", " ModelCheckpoint(save_weights_only=True, mode=\"max\", monitor=\"val_acc\"),\n", " LearningRateMonitor(\"epoch\"),\n", " ],\n", " progress_bar_refresh_rate=1,\n", " check_val_every_n_epoch=2,\n", " )\n", " trainer.logger._default_hp_metric = None\n", "\n", " # Data loaders\n", " train_loader = data.DataLoader(\n", " train_img_aug_data,\n", " batch_size=batch_size,\n", " shuffle=True,\n", " drop_last=True,\n", " pin_memory=True,\n", " num_workers=NUM_WORKERS,\n", " )\n", " test_loader = data.DataLoader(\n", " test_img_data, batch_size=batch_size, shuffle=False, drop_last=False, pin_memory=True, num_workers=NUM_WORKERS\n", " )\n", "\n", " # Check whether pretrained model exists. 
If yes, load it and skip training\n", " pretrained_filename = os.path.join(CHECKPOINT_PATH, \"ResNet.ckpt\")\n", " if os.path.isfile(pretrained_filename):\n", " print(\"Found pretrained model at %s, loading...\" % pretrained_filename)\n", " model = ResNet.load_from_checkpoint(pretrained_filename)\n", " else:\n", " pl.seed_everything(42) # To be reproducable\n", " model = ResNet(**kwargs)\n", " trainer.fit(model, train_loader, test_loader)\n", " model = ResNet.load_from_checkpoint(trainer.checkpoint_callback.best_model_path)\n", "\n", " # Test best model on validation set\n", " train_result = trainer.test(model, test_dataloaders=train_loader, verbose=False)\n", " val_result = trainer.test(model, test_dataloaders=test_loader, verbose=False)\n", " result = {\"train\": train_result[0][\"test_acc\"], \"test\": val_result[0][\"test_acc\"]}\n", "\n", " return model, result"]}, {"cell_type": "markdown", "id": "f3781014", "metadata": {"papermill": {"duration": 0.049896, "end_time": "2021-10-10T16:42:22.965127", "exception": false, "start_time": "2021-10-10T16:42:22.915231", "status": "completed"}, "tags": []}, "source": ["Finally, let's train the model and check its results:"]}, {"cell_type": "code", "execution_count": 23, "id": "4f4caab0", "metadata": {"execution": {"iopub.execute_input": "2021-10-10T16:42:23.068310Z", "iopub.status.busy": "2021-10-10T16:42:23.066889Z", "iopub.status.idle": "2021-10-10T16:42:27.618125Z", "shell.execute_reply": "2021-10-10T16:42:27.618532Z"}, "papermill": {"duration": 4.604524, "end_time": "2021-10-10T16:42:27.618678", "exception": false, "start_time": "2021-10-10T16:42:23.014154", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["GPU available: True, used: True\n"]}, {"name": "stderr", "output_type": "stream", "text": ["TPU available: False, using: 0 TPU cores\n"]}, {"name": "stderr", "output_type": "stream", "text": ["IPU available: False, using: 0 IPUs\n"]}, {"name": "stdout", 
"output_type": "stream", "text": ["Found pretrained model at saved_models/ContrastiveLearning/ResNet.ckpt, loading...\n"]}, {"name": "stderr", "output_type": "stream", "text": ["/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/pytorch_lightning/trainer/trainer.py:678: LightningDeprecationWarning: `trainer.test(test_dataloaders)` is deprecated in v1.4 and will be removed in v1.6. Use `trainer.test(dataloaders)` instead.\n", " rank_zero_deprecation(\n", "LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n"]}, {"name": "stderr", "output_type": "stream", "text": ["Missing logger folder: saved_models/ContrastiveLearning/ResNet/lightning_logs\n"]}, {"name": "stderr", "output_type": "stream", "text": ["/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/pytorch_lightning/trainer/data_loading.py:376: UserWarning: Your test_dataloader has `shuffle=True`, it is best practice to turn this off for val/test/predict dataloaders.\n", " rank_zero_warn(\n"]}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "0f6b628c8d4d45f9876bc31bc99904ed", "version_major": 2, "version_minor": 0}, "text/plain": ["Testing: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"name": "stderr", "output_type": "stream", "text": ["LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n"]}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "d901ede9b3054a479a22fda21e763fea", "version_major": 2, "version_minor": 0}, "text/plain": ["Testing: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"name": "stdout", "output_type": "stream", "text": ["Accuracy on training set: 99.76%\n", "Accuracy on test set: 73.31%\n"]}], "source": ["resnet_model, resnet_result = train_resnet(batch_size=64, num_classes=10, lr=1e-3, weight_decay=2e-4, max_epochs=100)\n", "print(f\"Accuracy on training set: {100*resnet_result['train']:4.2f}%\")\n", "print(f\"Accuracy on test set: {100*resnet_result['test']:4.2f}%\")"]}, {"cell_type": "markdown", 
"id": "a98707ed", "metadata": {"papermill": {"duration": 0.05204, "end_time": "2021-10-10T16:42:27.724471", "exception": false, "start_time": "2021-10-10T16:42:27.672431", "status": "completed"}, "tags": []}, "source": ["The ResNet trained from scratch achieves 73.31% on the test set.\n", "This is almost 8% less than the contrastive learning model, and even slightly less than SimCLR achieves with 1/10 of the data.\n", "This shows that self-supervised, contrastive learning provides\n", "considerable performance gains by leveraging large amounts of unlabeled\n", "data when little labeled data is available."]}, {"cell_type": "markdown", "id": "333d9e8c", "metadata": {"papermill": {"duration": 0.051935, "end_time": "2021-10-10T16:42:27.828975", "exception": false, "start_time": "2021-10-10T16:42:27.777040", "status": "completed"}, "tags": []}, "source": ["## Conclusion\n", "\n", "In this tutorial, we have discussed self-supervised contrastive learning and implemented SimCLR as an example method.\n", "We have applied it to the STL10 dataset and showed that it can learn generalizable representations that we can use to train simple classification models.\n", "With 500 images per label, it achieved an 8% higher accuracy than a similar model solely trained from supervision and performs on par with it when only using a tenth of the labeled data.\n", "Our experimental results are limited to a single dataset, but recent works such as [Ting Chen et al. 
](https://arxiv.org/abs/2006.10029) showed similar trends for larger datasets like ImageNet.\n", "Besides the discussed hyperparameters, the size of the model seems to be important in contrastive learning as well.\n", "If a lot of unlabeled data is available, larger models can achieve much stronger results and come close to their supervised baselines.\n", "Further, there are also approaches for combining contrastive and supervised learning, leading to performance gains beyond supervision (see [Khosla et al.](https://arxiv.org/abs/2004.11362)).\n", "Moreover, contrastive learning is not the only approach to self-supervised learning that has come up in the last two years and showed great results.\n", "Other methods include distillation-based methods like [BYOL](https://arxiv.org/abs/2006.07733) and redundancy reduction techniques like [Barlow Twins](https://arxiv.org/abs/2103.03230).\n", "There is a lot more to explore in the self-supervised domain, and more impressive steps ahead are to be expected.\n", "\n", "### References\n", "\n", "[1] Chen, T., Kornblith, S., Norouzi, M., and Hinton, G. (2020).\n", "A simple framework for contrastive learning of visual representations.\n", "In International conference on machine learning (pp. 1597-1607).\n", "PMLR.\n", "([link](https://arxiv.org/abs/2002.05709))\n", "\n", "[2] Chen, T., Kornblith, S., Swersky, K., Norouzi, M., and Hinton, G. (2020).\n", "Big self-supervised models are strong semi-supervised learners.\n", "NeurIPS 2020 ([link](https://arxiv.org/abs/2006.10029)).\n", "\n", "[3] Oord, A. V. 
D., Li, Y., and Vinyals, O.\n", "(2018).\n", "Representation learning with contrastive predictive coding.\n", "arXiv preprint arXiv:1807.03748.\n", "([link](https://arxiv.org/abs/1807.03748))\n", "\n", "[4] Grill, J.B., Strub, F., Altch\u00e9, F., Tallec, C., Richemond, P.H., Buchatskaya, E., Doersch, C., Pires, B.A., Guo, Z.D., Azar, M.G.\n", "and Piot, B.\n", "(2020).\n", "Bootstrap your own latent: A new approach to self-supervised learning.\n", "arXiv preprint arXiv:2006.07733.\n", "([link](https://arxiv.org/abs/2006.07733))\n", "\n", "[5] Khosla, P., Teterwak, P., Wang, C., Sarna, A., Tian, Y., Isola, P., Maschinot, A., Liu, C. and Krishnan, D. (2020).\n", "Supervised contrastive learning.\n", "arXiv preprint arXiv:2004.11362.\n", "([link](https://arxiv.org/abs/2004.11362))\n", "\n", "[6] Zbontar, J., Jing, L., Misra, I., LeCun, Y. and Deny, S. (2021).\n", "Barlow twins: Self-supervised learning via redundancy reduction.\n", "arXiv preprint arXiv:2103.03230.\n", "([link](https://arxiv.org/abs/2103.03230))"]}, {"cell_type": "markdown", "id": "ce384bac", "metadata": {"papermill": {"duration": 0.052469, "end_time": "2021-10-10T16:42:27.933096", "exception": false, "start_time": "2021-10-10T16:42:27.880627", "status": "completed"}, "tags": []}, "source": ["## Congratulations - Time to Join the Community!\n", "\n", "Congratulations on completing this notebook tutorial! If you enjoyed this and would like to join the Lightning\n", "movement, you can do so in the following ways!\n", "\n", "### Star [Lightning](https://github.com/PyTorchLightning/pytorch-lightning) on GitHub\n", "The easiest way to help our community is just by starring the GitHub repos! This helps raise awareness of the cool\n", "tools we're building.\n", "\n", "### Join our [Slack](https://join.slack.com/t/pytorch-lightning/shared_invite/zt-pw5v393p-qRaDgEk24~EjiZNBpSQFgQ)!\n", "The best way to keep up to date on the latest advancements is to join our community! 
Make sure to introduce yourself\n", "and share your interests in the `#general` channel.\n", "\n", "\n", "### Contributions!\n", "The best way to contribute to our community is to become a code contributor! At any time you can go to\n", "[Lightning](https://github.com/PyTorchLightning/pytorch-lightning) or [Bolt](https://github.com/PyTorchLightning/lightning-bolts)\n", "GitHub Issues pages and filter for \"good first issue\".\n", "\n", "* [Lightning good first issue](https://github.com/PyTorchLightning/pytorch-lightning/issues?q=is%3Aopen+is%3Aissue+label%3A%22good+first+issue%22)\n", "* [Bolt good first issue](https://github.com/PyTorchLightning/lightning-bolts/issues?q=is%3Aopen+is%3Aissue+label%3A%22good+first+issue%22)\n", "* You can also contribute your own notebooks with useful examples!\n", "\n", "### Great thanks from the entire PyTorch Lightning team for your interest!\n", "\n", "![PyTorch Lightning](){height=\"60px\" width=\"240px\"}"]}, {"cell_type": "raw", "metadata": {"raw_mimetype": "text/restructuredtext"}, "source": [".. customcarditem::\n", " :header: Tutorial 13: Self-Supervised Contrastive Learning with SimCLR\n", " :card_description: In this tutorial, we will take a closer look at self-supervised contrastive learning. 
Self-supervised learning, or also sometimes called unsupervised learning, describes the...\n", " :tags: Image,Self-Supervised,Contrastive-Learning,GPU/TPU,UvA-DL-Course\n", " :image: _static/images/course_UvA-DL/13-contrastive-learning.jpg"]}], "metadata": {"jupytext": {"cell_metadata_filter": "id,colab_type,colab,-all", "formats": "ipynb,py:percent", "main_language": "python"}, "language_info": {"codemirror_mode": {"name": "ipython", "version": 3}, "file_extension": ".py", "mimetype": "text/x-python", "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.9.7"}, "papermill": {"default_parameters": {}, "duration": 249.204813, "end_time": "2021-10-10T16:42:28.695919", "environment_variables": {}, "exception": null, "input_path": "course_UvA-DL/13-contrastive-learning/SimCLR.ipynb", "output_path": ".notebooks/course_UvA-DL/13-contrastive-learning.ipynb", "parameters": {}, "start_time": "2021-10-10T16:38:19.491106", "version": "2.3.3"}, "widgets": {"application/vnd.jupyter.widget-state+json": {"state": {"014eb2b9e9f84518838020b1995c1b8d": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_b2fc0cc8b5aa4c0c8b7c6ed61e30e1a1", "max": 1.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_06e3324339554e7d8653dd5ca34502c3", "value": 1.0}}, "06e3324339554e7d8653dd5ca34502c3": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": 
"ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "0f6b628c8d4d45f9876bc31bc99904ed": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_574e12bb3361469f9592f0b1e3ea131c", "IPY_MODEL_17ae240504aa41a69aac2f89637a872f", "IPY_MODEL_3c71b91bf99a44088d998afcceba0c5a"], "layout": "IPY_MODEL_c9f6fa6ff0a4421bbbebceb0868d6f72"}}, "17ae240504aa41a69aac2f89637a872f": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_9815469b386b421aa09d7a7c435486d6", "max": 1.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_48df5e7e12f14d529ee8253b7e81c15d", "value": 1.0}}, "1ba6707c32324d89a25d94b8826ad3fb": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, 
"flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "261190710d154e79846a4b2be71408ed": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "262c7a46de2548a1bb2c1bd654bae044": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", 
"_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_5dc49442ae4b4da1b8883f9729335464", "placeholder": "\u200b", "style": "IPY_MODEL_6fa3b6f47f774f06911972e497cbaa80", "value": " 79/79 [00:01<00:00, 80.29it/s]"}}, "29f4053f18004b2aa3ad1439d2b93651": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "2e223ff880144417a99a792b90424c4e": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, 
"32cad3ea3e3644baaa844883a715a613": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_8ac65a9e9dbc4e9b84ae76dbf7ba131e", "IPY_MODEL_ac28c76d49c141fb834867a4cee9bb41", "IPY_MODEL_262c7a46de2548a1bb2c1bd654bae044"], "layout": "IPY_MODEL_4d296fe6da9a4f4fbc71862dd3aef6a8"}}, "3329a069de5d4624a9412647f0d80198": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_492d73828f01466f9f1aad76d13d0217", "IPY_MODEL_b7093bf46de847f79cd6d83a8bca17be", "IPY_MODEL_dad5ea58db1c4416bebfd763d88c5c70"], "layout": "IPY_MODEL_261190710d154e79846a4b2be71408ed"}}, "3c71b91bf99a44088d998afcceba0c5a": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_b769c6c21b5b4aeba81b70f8ac423d79", "placeholder": "\u200b", "style": "IPY_MODEL_5a9c689a271f4e35b11302006704a498", "value": " 78/78 [00:02<00:00, 35.66it/s]"}}, "3de31fdecbe4407286cc95695466de5d": {"model_module": "@jupyter-widgets/controls", 
"model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_d87935149db141678e50b111ed61ec82", "placeholder": "\u200b", "style": "IPY_MODEL_98e77a3d53234245ab2a62d09bd5ddef", "value": " 2640397312/? [02:43<00:00, 17274904.03it/s]"}}, "48df5e7e12f14d529ee8253b7e81c15d": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "492d73828f01466f9f1aad76d13d0217": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_d56f70bb6f13477e9412473f278615c1", "placeholder": "\u200b", "style": "IPY_MODEL_f8d33dc2ecbe4476bd02a6b12d40d79b", "value": "100%"}}, "4b5ff77984894ccbb8ae6abd263a4b7c": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", 
"align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "4d296fe6da9a4f4fbc71862dd3aef6a8": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "57424a7cd3c7417dae1073397b010b1c": {"model_module": "@jupyter-widgets/controls", "model_module_version": 
"1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "574e12bb3361469f9592f0b1e3ea131c": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_1ba6707c32324d89a25d94b8826ad3fb", "placeholder": "\u200b", "style": "IPY_MODEL_57424a7cd3c7417dae1073397b010b1c", "value": "Testing: 100%"}}, "5a9c689a271f4e35b11302006704a498": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "5c036d43b260499385714d1317f05efe": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, 
"grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "5d2b7d0577694436ade46306715f91de": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "5dc49442ae4b4da1b8883f9729335464": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, 
"overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "6fa3b6f47f774f06911972e497cbaa80": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "721cee3a7bed406c8050c8433a106386": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "762e3668c79e48839269b8d565098578": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "84c4574fe0744cdf837bcc9c3032acfc": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "8ac65a9e9dbc4e9b84ae76dbf7ba131e": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": 
{"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_2e223ff880144417a99a792b90424c4e", "placeholder": "\u200b", "style": "IPY_MODEL_721cee3a7bed406c8050c8433a106386", "value": "100%"}}, "8c91c107ddbc4f84a5a8b5e583c69773": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "979d4939c8c04651bfd4a96e20d4d508": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, 
"align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "97fdda0f484c4954804bd2c4ff8d013a": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_be6a5b00c73049329a585c53e6eb481a", "placeholder": "\u200b", "style": "IPY_MODEL_762e3668c79e48839269b8d565098578", "value": " 125/125 [00:01<00:00, 106.26it/s]"}}, "9815469b386b421aa09d7a7c435486d6": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, 
"grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "98e77a3d53234245ab2a62d09bd5ddef": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "ac28c76d49c141fb834867a4cee9bb41": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_8c91c107ddbc4f84a5a8b5e583c69773", "max": 79.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_5d2b7d0577694436ade46306715f91de", "value": 79.0}}, "b2a75df791794c5cbf5d75ccfd368544": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", 
"_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_d174cfe6f91a431fbedf6fe767738f26", "placeholder": "\u200b", "style": "IPY_MODEL_84c4574fe0744cdf837bcc9c3032acfc", "value": ""}}, "b2fc0cc8b5aa4c0c8b7c6ed61e30e1a1": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "b7093bf46de847f79cd6d83a8bca17be": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_979d4939c8c04651bfd4a96e20d4d508", "max": 125.0, "min": 0.0, "orientation": 
"horizontal", "style": "IPY_MODEL_c967a959d2e54813af244ce923b9bf70", "value": 125.0}}, "b769c6c21b5b4aeba81b70f8ac423d79": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "be6a5b00c73049329a585c53e6eb481a": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": 
null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "c111f74da90d4a8f831df4733df12b94": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_b2a75df791794c5cbf5d75ccfd368544", "IPY_MODEL_dd15111b76d447d783d02a4ea9a5dbb2", "IPY_MODEL_3de31fdecbe4407286cc95695466de5d"], "layout": "IPY_MODEL_ef6374a810a14d32a08759170c9d66d1"}}, "c6548cbf34cb4f5f88108f9f7ac77fb4": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "c967a959d2e54813af244ce923b9bf70": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "c9f6fa6ff0a4421bbbebceb0868d6f72": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": 
"LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "d174cfe6f91a431fbedf6fe767738f26": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, 
"object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "d56f70bb6f13477e9412473f278615c1": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "d87935149db141678e50b111ed61ec82": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, 
"grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "d901ede9b3054a479a22fda21e763fea": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_f56016fba5604d9db49374c9af2829e1", "IPY_MODEL_014eb2b9e9f84518838020b1995c1b8d", "IPY_MODEL_97fdda0f484c4954804bd2c4ff8d013a"], "layout": "IPY_MODEL_e8120e786bbe4d56aed3a534970c020d"}}, "dad5ea58db1c4416bebfd763d88c5c70": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_4b5ff77984894ccbb8ae6abd263a4b7c", "placeholder": "\u200b", "style": "IPY_MODEL_ef38b8535cdf4ddfba9ced74f238ab28", "value": " 125/125 [00:01<00:00, 77.70it/s]"}}, "dd15111b76d447d783d02a4ea9a5dbb2": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", 
"_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_e2187c1fd5554b5c89ebf37667b20858", "max": 2640397119.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_29f4053f18004b2aa3ad1439d2b93651", "value": 2640397119.0}}, "e2187c1fd5554b5c89ebf37667b20858": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "e8120e786bbe4d56aed3a534970c020d": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, 
"align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "ef38b8535cdf4ddfba9ced74f238ab28": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "ef6374a810a14d32a08759170c9d66d1": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": 
null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "f56016fba5604d9db49374c9af2829e1": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_5c036d43b260499385714d1317f05efe", "placeholder": "\u200b", "style": "IPY_MODEL_c6548cbf34cb4f5f88108f9f7ac77fb4", "value": "Testing: 100%"}}, "f8d33dc2ecbe4476bd02a6b12d40d79b": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}}, "version_major": 2, "version_minor": 0}}}, "nbformat": 4, "nbformat_minor": 5} \ No newline at end of file diff --git a/source/notebooks/lightning_examples/augmentation_kornia.ipynb b/source/notebooks/lightning_examples/augmentation_kornia.ipynb deleted file mode 100644 index e9c2340..0000000 --- a/source/notebooks/lightning_examples/augmentation_kornia.ipynb +++ /dev/null @@ -1 +0,0 @@ -{"cells": [{"cell_type": "markdown", "id": "38906077", "metadata": {"papermill": {"duration": 0.034946, "end_time": "2021-12-04T16:20:10.519350", "exception": false, "start_time": "2021-12-04T16:20:10.484404", "status": "completed"}, "tags": []}, "source": 
["\n", "# GPU and batched data augmentation with Kornia and PyTorch-Lightning\n", "\n", "* **Author:** PL/Kornia team\n", "* **License:** CC BY-SA\n", "* **Generated:** 2021-12-04T16:52:56.657983\n", "\n", "In this tutorial we will show how to combine both Kornia.org and PyTorch Lightning\n", "to perform efficient data augmentation to train a simple model using the GPU in batch\n", "mode without additional effort.\n", "\n", "\n", "---\n", "Open in [![Open In Colab](){height=\"20px\" width=\"117px\"}](https://colab.research.google.com/github/PytorchLightning/lightning-tutorials/blob/publication/.notebooks/lightning_examples/augmentation_kornia.ipynb)\n", "\n", "Give us a \u2b50 [on Github](https://www.github.com/PytorchLightning/pytorch-lightning/)\n", "| Check out [the documentation](https://pytorch-lightning.readthedocs.io/en/latest/)\n", "| Join us [on Slack](https://join.slack.com/t/pytorch-lightning/shared_invite/zt-pw5v393p-qRaDgEk24~EjiZNBpSQFgQ)"]}, {"cell_type": "markdown", "id": "8ab0f89d", "metadata": {"papermill": {"duration": 0.031285, "end_time": "2021-12-04T16:20:10.583397", "exception": false, "start_time": "2021-12-04T16:20:10.552112", "status": "completed"}, "tags": []}, "source": ["## Setup\n", "This notebook requires some packages besides pytorch-lightning."]}, {"cell_type": "code", "execution_count": 1, "id": "1dde05cd", "metadata": {"colab": {}, "colab_type": "code", "execution": {"iopub.execute_input": "2021-12-04T16:20:10.652401Z", "iopub.status.busy": "2021-12-04T16:20:10.651932Z", "iopub.status.idle": "2021-12-04T16:20:13.540277Z", "shell.execute_reply": "2021-12-04T16:20:13.539730Z"}, "id": "LfrJLKPFyhsK", "lines_to_next_cell": 0, "papermill": {"duration": 2.926089, "end_time": "2021-12-04T16:20:13.540428", "exception": false, "start_time": "2021-12-04T16:20:10.614339", "status": "completed"}, "tags": []}, "outputs": [], "source": ["! 
pip install --quiet \"pytorch-lightning\" \"pandas\" \"pytorch-lightning>=1.3\" \"torchvision\" \"matplotlib\" \"torchmetrics\" \"kornia\" \"torchmetrics>=0.3\" \"torch>=1.6, <1.9\""]}, {"cell_type": "code", "execution_count": 2, "id": "bb66b32f", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:20:13.609472Z", "iopub.status.busy": "2021-12-04T16:20:13.609002Z", "iopub.status.idle": "2021-12-04T16:20:15.512338Z", "shell.execute_reply": "2021-12-04T16:20:15.511878Z"}, "papermill": {"duration": 1.939508, "end_time": "2021-12-04T16:20:15.512472", "exception": false, "start_time": "2021-12-04T16:20:13.572964", "status": "completed"}, "tags": []}, "outputs": [], "source": ["import os\n", "\n", "import matplotlib.pyplot as plt\n", "import numpy as np\n", "import pandas as pd\n", "import torch\n", "import torch.nn as nn\n", "import torchmetrics\n", "import torchvision\n", "from kornia import image_to_tensor, tensor_to_image\n", "from kornia.augmentation import ColorJitter, RandomChannelShuffle, RandomHorizontalFlip, RandomThinPlateSpline\n", "from pytorch_lightning import LightningModule, Trainer\n", "from pytorch_lightning.loggers import CSVLogger\n", "from torch import Tensor\n", "from torch.nn import functional as F\n", "from torch.utils.data import DataLoader\n", "from torchvision.datasets import CIFAR10\n", "\n", "AVAIL_GPUS = min(1, torch.cuda.device_count())"]}, {"cell_type": "markdown", "id": "4984c138", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.033859, "end_time": "2021-12-04T16:20:15.578656", "exception": false, "start_time": "2021-12-04T16:20:15.544797", "status": "completed"}, "tags": []}, "source": ["## Define Data Augmentations module\n", "\n", "[Kornia.org](https://www.kornia.org) is low level Computer Vision library that provides a dedicated module\n", "[`kornia.augmentation`](https://kornia.readthedocs.io/en/latest/augmentation.html) module implementing\n", "en extensive set of data augmentation techniques for image 
and video.\n", "\n", "Similar to Lightning, in Kornia it's promoted to encapsulate functionalities inside classes for readability\n", "and efficiency purposes. In this case, we define a data augmentation pipeline subclassing a `nn.Module`\n", "where the augmentation_kornia (also subclassing `nn.Module`) are combined with other PyTorch components\n", "such as `nn.Sequential`.\n", "\n", "Checkout the different augmentation operators in Kornia docs and experiment yourself !"]}, {"cell_type": "code", "execution_count": 3, "id": "62adfd08", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:20:15.647672Z", "iopub.status.busy": "2021-12-04T16:20:15.647178Z", "iopub.status.idle": "2021-12-04T16:20:15.649220Z", "shell.execute_reply": "2021-12-04T16:20:15.648758Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 0.039378, "end_time": "2021-12-04T16:20:15.649322", "exception": false, "start_time": "2021-12-04T16:20:15.609944", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class DataAugmentation(nn.Module):\n", " \"\"\"Module to perform data augmentation using Kornia on torch tensors.\"\"\"\n", "\n", " def __init__(self, apply_color_jitter: bool = False) -> None:\n", " super().__init__()\n", " self._apply_color_jitter = apply_color_jitter\n", "\n", " self.transforms = nn.Sequential(\n", " RandomHorizontalFlip(p=0.75),\n", " RandomChannelShuffle(p=0.75),\n", " RandomThinPlateSpline(p=0.75),\n", " )\n", "\n", " self.jitter = ColorJitter(0.5, 0.5, 0.5, 0.5)\n", "\n", " @torch.no_grad() # disable gradients for effiency\n", " def forward(self, x: Tensor) -> Tensor:\n", " x_out = self.transforms(x) # BxCxHxW\n", " if self._apply_color_jitter:\n", " x_out = self.jitter(x_out)\n", " return x_out"]}, {"cell_type": "markdown", "id": "c57c4fbe", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.030806, "end_time": "2021-12-04T16:20:15.711761", "exception": false, "start_time": "2021-12-04T16:20:15.680955", "status": "completed"}, 
"tags": []}, "source": ["## Define a Pre-processing module\n", "\n", "In addition to the `DataAugmentation` module that will sample random parameters during the training stage,\n", "we define a `Preprocess` class to handle the conversion of the image type to properly work with `Tensor`.\n", "\n", "For this example we use `torchvision` CIFAR10 which returns samples of `PIL.Image`, however,\n", "to take all the advantages of PyTorch and Kornia we need to cast the images into tensors.\n", "\n", "To do that we will use `kornia.image_to_tensor` which casts and permutes the images in the right format."]}, {"cell_type": "code", "execution_count": 4, "id": "55e81122", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:20:15.778048Z", "iopub.status.busy": "2021-12-04T16:20:15.777585Z", "iopub.status.idle": "2021-12-04T16:20:15.779274Z", "shell.execute_reply": "2021-12-04T16:20:15.779646Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 0.036947, "end_time": "2021-12-04T16:20:15.779757", "exception": false, "start_time": "2021-12-04T16:20:15.742810", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class Preprocess(nn.Module):\n", " \"\"\"Module to perform pre-process using Kornia on torch tensors.\"\"\"\n", "\n", " @torch.no_grad() # disable gradients for effiency\n", " def forward(self, x) -> Tensor:\n", " x_tmp: np.ndarray = np.array(x) # HxWxC\n", " x_out: Tensor = image_to_tensor(x_tmp, keepdim=True) # CxHxW\n", " return x_out.float() / 255.0"]}, {"cell_type": "markdown", "id": "d16cb9f3", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.03102, "end_time": "2021-12-04T16:20:15.841921", "exception": false, "start_time": "2021-12-04T16:20:15.810901", "status": "completed"}, "tags": []}, "source": ["## Define PyTorch Lightning model\n", "\n", "The next step is to define our `LightningModule` to have a proper organisation of our training pipeline.\n", "This is a simple example just to show how to structure your baseline to 
be used as a reference,\n", "do not expect a high performance.\n", "\n", "Notice that the `Preprocess` class is injected into the dataset and will be applied per sample.\n", "\n", "The interesting part in the proposed approach happens inside the `training_step` where with just a single\n", "line of code we apply the data augmentation in batch and no need to worry about the device.\n", "This means that our `DataAugmentation` pipeline will automatically be executed on the GPU."]}, {"cell_type": "code", "execution_count": 5, "id": "fb8ce79c", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:20:15.915783Z", "iopub.status.busy": "2021-12-04T16:20:15.915307Z", "iopub.status.idle": "2021-12-04T16:20:15.917345Z", "shell.execute_reply": "2021-12-04T16:20:15.916889Z"}, "papermill": {"duration": 0.044237, "end_time": "2021-12-04T16:20:15.917441", "exception": false, "start_time": "2021-12-04T16:20:15.873204", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class CoolSystem(LightningModule):\n", " def __init__(self):\n", " super().__init__()\n", " # not the best model: expereiment yourself\n", " self.model = torchvision.models.resnet18(pretrained=True)\n", "\n", " self.preprocess = Preprocess() # per sample transforms\n", "\n", " self.transform = DataAugmentation() # per batch augmentation_kornia\n", "\n", " self.accuracy = torchmetrics.Accuracy()\n", "\n", " def forward(self, x):\n", " return F.softmax(self.model(x))\n", "\n", " def compute_loss(self, y_hat, y):\n", " return F.cross_entropy(y_hat, y)\n", "\n", " def show_batch(self, win_size=(10, 10)):\n", " def _to_vis(data):\n", " return tensor_to_image(torchvision.utils.make_grid(data, nrow=8))\n", "\n", " # get a batch from the training set: try with `val_datlaoader` :)\n", " imgs, labels = next(iter(self.train_dataloader()))\n", " imgs_aug = self.transform(imgs) # apply transforms\n", " # use matplotlib to visualize\n", " plt.figure(figsize=win_size)\n", " plt.imshow(_to_vis(imgs))\n", " 
plt.figure(figsize=win_size)\n", " plt.imshow(_to_vis(imgs_aug))\n", "\n", " def training_step(self, batch, batch_idx):\n", " x, y = batch\n", " x_aug = self.transform(x) # => we perform GPU/Batched data augmentation\n", " y_hat = self(x_aug)\n", " loss = self.compute_loss(y_hat, y)\n", " self.log(\"train_loss\", loss, prog_bar=False)\n", " self.log(\"train_acc\", self.accuracy(y_hat, y), prog_bar=False)\n", " return loss\n", "\n", " def validation_step(self, batch, batch_idx):\n", " x, y = batch\n", " y_hat = self(x)\n", " loss = self.compute_loss(y_hat, y)\n", " self.log(\"valid_loss\", loss, prog_bar=False)\n", " self.log(\"valid_acc\", self.accuracy(y_hat, y), prog_bar=True)\n", "\n", " def configure_optimizers(self):\n", " optimizer = torch.optim.AdamW(self.model.parameters(), lr=1e-4)\n", " scheduler = torch.optim.lr_scheduler.CosineAnnealingLR(optimizer, self.trainer.max_epochs, 0)\n", " return [optimizer], [scheduler]\n", "\n", " def prepare_data(self):\n", " CIFAR10(os.getcwd(), train=True, download=True, transform=self.preprocess)\n", " CIFAR10(os.getcwd(), train=False, download=True, transform=self.preprocess)\n", "\n", " def train_dataloader(self):\n", " dataset = CIFAR10(os.getcwd(), train=True, download=True, transform=self.preprocess)\n", " loader = DataLoader(dataset, batch_size=32)\n", " return loader\n", "\n", " def val_dataloader(self):\n", " dataset = CIFAR10(os.getcwd(), train=True, download=True, transform=self.preprocess)\n", " loader = DataLoader(dataset, batch_size=32)\n", " return loader"]}, {"cell_type": "markdown", "id": "e62c886f", "metadata": {"papermill": {"duration": 0.031204, "end_time": "2021-12-04T16:20:15.980101", "exception": false, "start_time": "2021-12-04T16:20:15.948897", "status": "completed"}, "tags": []}, "source": ["## Visualize images"]}, {"cell_type": "code", "execution_count": 6, "id": "ee50f76c", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:20:16.046489Z", "iopub.status.busy": 
"2021-12-04T16:20:16.046020Z", "iopub.status.idle": "2021-12-04T16:20:17.118504Z", "shell.execute_reply": "2021-12-04T16:20:17.117951Z"}, "papermill": {"duration": 1.107265, "end_time": "2021-12-04T16:20:17.118657", "exception": false, "start_time": "2021-12-04T16:20:16.011392", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["Downloading: \"https://download.pytorch.org/models/resnet18-5c106cde.pth\" to /home/AzDevOps_azpcontainer/.cache/torch/hub/checkpoints/resnet18-5c106cde.pth\n"]}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "bb46bed597e04aa68d65fa7583f0b2fb", "version_major": 2, "version_minor": 0}, "text/plain": [" 0%| | 0.00/44.7M [00:00"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}, {"data": {"image/png": "\n", "text/plain": ["
"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}], "source": ["model.show_batch(win_size=(14, 14))"]}, {"cell_type": "markdown", "id": "2a274076", "metadata": {"papermill": {"duration": 0.056571, "end_time": "2021-12-04T16:20:22.338599", "exception": false, "start_time": "2021-12-04T16:20:22.282028", "status": "completed"}, "tags": []}, "source": ["## Run training"]}, {"cell_type": "code", "execution_count": 8, "id": "8ce9aa4c", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:20:22.459678Z", "iopub.status.busy": "2021-12-04T16:20:22.459198Z", "iopub.status.idle": "2021-12-04T16:30:59.810226Z", "shell.execute_reply": "2021-12-04T16:30:59.809783Z"}, "papermill": {"duration": 637.415988, "end_time": "2021-12-04T16:30:59.810364", "exception": false, "start_time": "2021-12-04T16:20:22.394376", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/pytorch_lightning/trainer/connectors/callback_connector.py:90: LightningDeprecationWarning: Setting `Trainer(progress_bar_refresh_rate=20)` is deprecated in v1.5 and will be removed in v1.7. Please pass `pytorch_lightning.callbacks.progress.TQDMProgressBar` with `refresh_rate` directly to the Trainer's `callbacks` argument instead. 
Or, to disable the progress bar pass `enable_progress_bar = False` to the Trainer.\n", " rank_zero_deprecation(\n", "GPU available: True, used: True\n"]}, {"name": "stderr", "output_type": "stream", "text": ["TPU available: False, using: 0 TPU cores\n"]}, {"name": "stderr", "output_type": "stream", "text": ["IPU available: False, using: 0 IPUs\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Files already downloaded and verified\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Files already downloaded and verified\n"]}, {"name": "stderr", "output_type": "stream", "text": ["LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n"]}, {"name": "stderr", "output_type": "stream", "text": ["\n", " | Name | Type | Params\n", "------------------------------------------------\n", "0 | model | ResNet | 11.7 M\n", "1 | preprocess | Preprocess | 0 \n", "2 | transform | DataAugmentation | 0 \n", "3 | accuracy | Accuracy | 0 \n", "------------------------------------------------\n", "11.7 M Trainable params\n", "0 Non-trainable params\n", "11.7 M Total params\n", "46.758 Total estimated model params size (MB)\n"]}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "bc56a439a8c747419a9cfce366960df9", "version_major": 2, "version_minor": 0}, "text/plain": ["Validation sanity check: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"name": "stdout", "output_type": "stream", "text": ["Files already downloaded and verified\n"]}, {"name": "stderr", "output_type": "stream", "text": ["/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/pytorch_lightning/trainer/data_loading.py:111: UserWarning: The dataloader, val_dataloader 0, does not have many workers which may be a bottleneck. 
Consider increasing the value of the `num_workers` argument` (try 12 which is the number of cpus on this machine) in the `DataLoader` init to improve performance.\n", " rank_zero_warn(\n", "/tmp/ipykernel_2475/711885801.py:14: UserWarning: Implicit dimension choice for softmax has been deprecated. Change the call to include dim=X as an argument.\n", " return F.softmax(self.model(x))\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Files already downloaded and verified\n"]}, {"name": "stderr", "output_type": "stream", "text": ["/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/pytorch_lightning/trainer/data_loading.py:111: UserWarning: The dataloader, train_dataloader, does not have many workers which may be a bottleneck. Consider increasing the value of the `num_workers` argument` (try 12 which is the number of cpus on this machine) in the `DataLoader` init to improve performance.\n", " rank_zero_warn(\n"]}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "d77d420abcbf47c0923ae5c54c44fa93", "version_major": 2, "version_minor": 0}, "text/plain": ["Training: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "b969d392aae3406f98244c05ffc71752", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "aef85224023d4c17bd6beef036b3bc95", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "0eed8fb3fe1a47308f90660740da3708", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": 
"5ab4ced2d2af4d8b99579329b6d08851", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "b76ee81572514e77b560271a3c505645", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "efee6a19f778444e987cf2f8b9c9e709", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "eb4d88a3e74c4b8286414f889c809850", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "26a0a012ab2a4accac6df52663a5c3b3", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "3e467637b02b4cfd85562b3f1c5b58e8", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "558464e277d24562a26ef9696c7bad0d", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}], "source": ["# Initialize a trainer\n", "trainer = Trainer(\n", " progress_bar_refresh_rate=20,\n", " gpus=AVAIL_GPUS,\n", " max_epochs=10,\n", " logger=CSVLogger(save_dir=\"logs/\", name=\"cifar10-resnet18\"),\n", ")\n", "\n", "# Train the model \u26a1\n", "trainer.fit(model)"]}, {"cell_type": "markdown", "id": "842de94d", "metadata": {"papermill": {"duration": 
0.074854, "end_time": "2021-12-04T16:30:59.963213", "exception": false, "start_time": "2021-12-04T16:30:59.888359", "status": "completed"}, "tags": []}, "source": ["### Visualize the training results"]}, {"cell_type": "code", "execution_count": 9, "id": "6e8ce374", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:31:00.120257Z", "iopub.status.busy": "2021-12-04T16:31:00.119802Z", "iopub.status.idle": "2021-12-04T16:31:00.391029Z", "shell.execute_reply": "2021-12-04T16:31:00.390630Z"}, "papermill": {"duration": 0.352406, "end_time": "2021-12-04T16:31:00.391154", "exception": false, "start_time": "2021-12-04T16:31:00.038748", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": [" train_loss train_acc epoch step valid_loss valid_acc\n", "0 6.785918 0.12500 0 49 NaN NaN\n", "1 6.782912 0.12500 0 99 NaN NaN\n", "2 6.770435 0.15625 0 149 NaN NaN\n", "3 6.690282 0.21875 0 199 NaN NaN\n", "4 6.782069 0.15625 0 249 NaN NaN\n"]}, {"data": {"text/plain": [""]}, "execution_count": 9, "metadata": {}, "output_type": "execute_result"}, {"data": {"image/png": "\n", "text/plain": ["
"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}, {"data": {"image/png": "\n", "text/plain": ["
"]}, "metadata": {"needs_background": "light"}, "output_type": "display_data"}], "source": ["metrics = pd.read_csv(f\"{trainer.logger.log_dir}/metrics.csv\")\n", "print(metrics.head())\n", "\n", "aggreg_metrics = []\n", "agg_col = \"epoch\"\n", "for i, dfg in metrics.groupby(agg_col):\n", " agg = dict(dfg.mean())\n", " agg[agg_col] = i\n", " aggreg_metrics.append(agg)\n", "\n", "df_metrics = pd.DataFrame(aggreg_metrics)\n", "df_metrics[[\"train_loss\", \"valid_loss\"]].plot(grid=True, legend=True)\n", "df_metrics[[\"valid_acc\", \"train_acc\"]].plot(grid=True, legend=True)"]}, {"cell_type": "markdown", "id": "d8c0ecdf", "metadata": {"papermill": {"duration": 0.082158, "end_time": "2021-12-04T16:31:00.555481", "exception": false, "start_time": "2021-12-04T16:31:00.473323", "status": "completed"}, "tags": []}, "source": ["## Tensorboard"]}, {"cell_type": "code", "execution_count": 10, "id": "8a67c1e5", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:31:00.720165Z", "iopub.status.busy": "2021-12-04T16:31:00.719717Z", "iopub.status.idle": "2021-12-04T16:31:00.721655Z", "shell.execute_reply": "2021-12-04T16:31:00.721209Z"}, "papermill": {"duration": 0.086419, "end_time": "2021-12-04T16:31:00.721760", "exception": false, "start_time": "2021-12-04T16:31:00.635341", "status": "completed"}, "tags": []}, "outputs": [], "source": ["# Start tensorboard.\n", "# %load_ext tensorboard\n", "# %tensorboard --logdir lightning_logs/"]}, {"cell_type": "markdown", "id": "d0cdd5cf", "metadata": {"papermill": {"duration": 0.079729, "end_time": "2021-12-04T16:31:00.881954", "exception": false, "start_time": "2021-12-04T16:31:00.802225", "status": "completed"}, "tags": []}, "source": ["## Congratulations - Time to Join the Community!\n", "\n", "Congratulations on completing this notebook tutorial! 
If you enjoyed this and would like to join the Lightning\n", "movement, you can do so in the following ways!\n", "\n", "### Star [Lightning](https://github.com/PyTorchLightning/pytorch-lightning) on GitHub\n", "The easiest way to help our community is just by starring the GitHub repos! This helps raise awareness of the cool\n", "tools we're building.\n", "\n", "### Join our [Slack](https://join.slack.com/t/pytorch-lightning/shared_invite/zt-pw5v393p-qRaDgEk24~EjiZNBpSQFgQ)!\n", "The best way to keep up to date on the latest advancements is to join our community! Make sure to introduce yourself\n", "and share your interests in `#general` channel\n", "\n", "\n", "### Contributions !\n", "The best way to contribute to our community is to become a code contributor! At any time you can go to\n", "[Lightning](https://github.com/PyTorchLightning/pytorch-lightning) or [Bolt](https://github.com/PyTorchLightning/lightning-bolts)\n", "GitHub Issues page and filter for \"good first issue\".\n", "\n", "* [Lightning good first issue](https://github.com/PyTorchLightning/pytorch-lightning/issues?q=is%3Aopen+is%3Aissue+label%3A%22good+first+issue%22)\n", "* [Bolt good first issue](https://github.com/PyTorchLightning/lightning-bolts/issues?q=is%3Aopen+is%3Aissue+label%3A%22good+first+issue%22)\n", "* You can also contribute your own notebooks with useful examples !\n", "\n", "### Great thanks from the entire Pytorch Lightning Team for your interest !\n", "\n", "[![Pytorch Lightning](){height=\"60px\" width=\"240px\"}](https://pytorchlightning.ai)"]}, {"cell_type": "raw", "metadata": {"raw_mimetype": "text/restructuredtext"}, "source": [".. 
customcarditem::\n", " :header: GPU and batched data augmentation with Kornia and PyTorch-Lightning\n", " :card_description: In this tutorial we will show how to combine both Kornia.org and PyTorch Lightning to perform efficient data augmentation to train a simple model using the GPU in batch mode...\n", " :tags: Image,GPU/TPU,Lightning-Examples\n", " :image: _static/images/lightning_examples/augmentation_kornia.svg"]}], "metadata": {"jupytext": {"cell_metadata_filter": "id,colab,colab_type,-all", "formats": "ipynb,py:percent", "main_language": "python"}, "language_info": {"codemirror_mode": {"name": "ipython", "version": 3}, "file_extension": ".py", "mimetype": "text/x-python", "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.9.7"}, "papermill": {"default_parameters": {}, "duration": 652.68493, "end_time": "2021-12-04T16:31:01.876440", "environment_variables": {}, "exception": null, "input_path": "lightning_examples/augmentation_kornia/augmentation.ipynb", "output_path": ".notebooks/lightning_examples/augmentation_kornia.ipynb", "parameters": {}, "start_time": "2021-12-04T16:20:09.191510", "version": "2.3.3"}, "widgets": {"application/vnd.jupyter.widget-state+json": {"state": {"00648a26dbda4fd5a46e11eb2de65394": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_046d7b6ec7ae4b7b835b38406ef12b7b", "max": 3126.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_f91e7c90408b4d189703088295affe7e", "value": 3126.0}}, "00ae340e2c934a289981b0fa1320a63c": {"model_module": 
"@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "00c0ff7fb0d14a24a91f72f2261fe411": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "046d7b6ec7ae4b7b835b38406ef12b7b": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, 
"display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "0963635c7a054aa6b3d78746adca575e": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_dcaea45e34e741b6a90232516d5e5cc9", "placeholder": "\u200b", "style": "IPY_MODEL_f9b913913c4b4491ac3bcf7fa35384ef", "value": "Validating: 100%"}}, "0d3841271e604be7b572f89d155537fa": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_00c0ff7fb0d14a24a91f72f2261fe411", "placeholder": "\u200b", "style": "IPY_MODEL_3219d2bbd48b4a268d7a9e1c28768e37", "value": " 1560/1563 [00:17<00:00, 89.54it/s]"}}, "0ed93a7a201f484eaa6f8d7246a5038f": {"model_module": 
"@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_6af962b59cad4dba940f908fe07b961b", "max": 1563.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_54adbc53f7f14af5974fa706733bad2e", "value": 1563.0}}, "0eed8fb3fe1a47308f90660740da3708": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_70799825c1db415f98624df354200512", "IPY_MODEL_bb97a6ac530a452899a0323aa84cb8ea", "IPY_MODEL_0d3841271e604be7b572f89d155537fa"], "layout": "IPY_MODEL_9f16f1a321e54049ad9e4341550e5642"}}, "10a200370e054b249ecf1ea16ecf383f": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, 
"grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "15d06f0222f441e58bb27b82be5b188f": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "162bc591eff249078b9cc67ef718da0a": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", 
"bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_d621bcb9284e47e28c190e6a7781924d", "max": 1563.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_6de03aba110e4897aad75f6052017fd1", "value": 1563.0}}, "195c56daec194f64a8a6c318adef0af0": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "19e4d1afe39c4b3ca0f37b8851cc8707": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "1a3a9cc456654328b7a7bf78905af9b3": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": 
{"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_a113958c0fe445a0b3227b4c41bb54cf", "max": 46827520.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_d12a329b34864edea9fb3c511ca062fe", "value": 46827520.0}}, "1c89b25cd44d42d8b6eb2c8937ac96fe": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_52d64155154f40509e85bb87d133e2c2", "placeholder": "\u200b", "style": "IPY_MODEL_b1f5934bc26f4f04a3eb235a87ec8d9c", "value": "Validating: 100%"}}, "1cc3e5803d3a4657bcdd8fc1d061c12b": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, 
"margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "1e560bd4592943dabe0b4f5535a76933": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "danger", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_579307f4c11b4a02a9ad16d735305b01", "max": 2.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_aca0852b47ca4a55a2e2104bf21e8e87", "value": 0.0}}, "231f4c199a8f458e8ca9cb5987a5bedb": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "243cac8083774d7993f668e7e17cdb10": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, 
"grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "24987c3a0e9945e3aa4184de42cd8133": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "24e727294dec4d55b83d7d9bd834590f": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": 
"@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "24ead37777974d36bede94e54e270620": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "26a0a012ab2a4accac6df52663a5c3b3": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_59aad08c7f434fd3aa35c2bee4f73a95", "IPY_MODEL_2b9cdd139e6d45a4a185da07900faf2f", "IPY_MODEL_ff1843ce802446d587aa5d666f2fffb2"], "layout": "IPY_MODEL_10a200370e054b249ecf1ea16ecf383f"}}, "2b32eddc9ca547ceace73440308036a7": {"model_module": "@jupyter-widgets/controls", 
"model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_e4407841504c456da355ea8b54e4a43b", "max": 1563.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_f68bc350228c4e7397629524e9325f0d", "value": 1563.0}}, "2b9cdd139e6d45a4a185da07900faf2f": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_33d08c68fa77428d9fddcdc29625e1ee", "max": 1563.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_231f4c199a8f458e8ca9cb5987a5bedb", "value": 1563.0}}, "2c337a8fa7874b6aaa9502467932c0fe": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_9b8e8dd3fd5a46d786745a1851c72bbf", "max": 1563.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_6a66e81e0cc845e696ce7ff3c0d01b7b", "value": 1563.0}}, "3219d2bbd48b4a268d7a9e1c28768e37": 
{"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "33d08c68fa77428d9fddcdc29625e1ee": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "3436c7b40e684abbb6d5d925c1e3562c": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, 
"36ed0a721f424d74b38eb5a912ab693b": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_c39a8ce99b7f4f0dbc2c34aa53c972d2", "placeholder": "\u200b", "style": "IPY_MODEL_86a453d61d574ac1baa007882b7a6b0f", "value": " 1560/1563 [00:17<00:00, 89.36it/s]"}}, "371384fdf3a8410191184cc20007148d": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "3809e6fe848843dfaaf6b9e7f5a08dc8": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_6210e1a1628048b39561d7e5f684ab73", "placeholder": "\u200b", "style": "IPY_MODEL_ad50fbd1f4be41f6935d8efbafe4da05", "value": " 1560/1563 [00:17<00:00, 89.13it/s]"}}, "384a2ed4bd214b6299151e6e870fb7fc": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, 
"_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "3e467637b02b4cfd85562b3f1c5b58e8": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_fb06c3f845574aeb8dc22e44961cd33f", "IPY_MODEL_2c337a8fa7874b6aaa9502467932c0fe", "IPY_MODEL_36ed0a721f424d74b38eb5a912ab693b"], "layout": "IPY_MODEL_87c36192b69043779c3db1bf5fee3872"}}, "408e2b530a9641e18ea5df659d08e4ae": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "42ea17def7cc48e59c0e0f95348555c4": {"model_module": 
"@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_711ca9fe21654973ae92db9419db1252", "max": 1563.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_699fae0a08bb42fb944ad9d33aab171d", "value": 1563.0}}, "44d5b7627b544985bc926220a5bc9a20": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_c4516ed461704a70afb4dc46435a3f56", "IPY_MODEL_925fcc0b20d747fd9f0d5ec004b07ff0", "IPY_MODEL_e1ffcef9fbd94b638001b8f6b09eaa24"], "layout": "IPY_MODEL_d31f5864c95a4fc5a83552e28a52d0c7"}}, "479a86133e0e40dcad3f097243ad760c": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "47d19a4a9d7d40a98ec8311b15742d30": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", 
"_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "47eca2c448fd42cdbb4171118143b086": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "47f1a317780d4bd080de45c16617045a": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "4d0bbc3b172f458dbc05e627ab55422b": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": 
"DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "4eaacd5d1c9c4c2c91330d16285a3fdb": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_bfd5a2987c7e48f0ba3c06565fc43e16", "placeholder": "\u200b", "style": "IPY_MODEL_7e6dd612c3094b56861bfbf839635c56", "value": " 44.7M/44.7M [00:00<00:00, 77.3MB/s]"}}, "4eb11692485a4c7aa6e6b08cf42af441": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "4eecb5352ef14d36a58a439ceba50d09": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_70d3ca125efb40aabb4e2f09f0d8673a", "placeholder": "\u200b", "style": "IPY_MODEL_e01d3ee23be94b33bc2eb290319c680a", "value": "Validating: 100%"}}, "4f478fcfc9dd4785823b60704e03e896": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": 
"LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "4fa52e476b6a463d9fbd3fe51fba722f": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "52d64155154f40509e85bb87d133e2c2": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, 
"grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "54adbc53f7f14af5974fa706733bad2e": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "555f5797cc10466da974bab15226644e": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "558464e277d24562a26ef9696c7bad0d": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_4eecb5352ef14d36a58a439ceba50d09", 
"IPY_MODEL_162bc591eff249078b9cc67ef718da0a", "IPY_MODEL_af817170ed6943f18f5d497fbfb4fbf6"], "layout": "IPY_MODEL_4f478fcfc9dd4785823b60704e03e896"}}, "579307f4c11b4a02a9ad16d735305b01": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "58a0aef8e87247a9a7251faa45b5a0e4": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_e82e94047cdf40649ad6d937c19b8a9c", "placeholder": "\u200b", "style": "IPY_MODEL_371384fdf3a8410191184cc20007148d", "value": "Validating: 100%"}}, "59aad08c7f434fd3aa35c2bee4f73a95": {"model_module": "@jupyter-widgets/controls", 
"model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_243cac8083774d7993f668e7e17cdb10", "placeholder": "\u200b", "style": "IPY_MODEL_bf7dfb92583341f4942256a769bb3c87", "value": "Validating: 100%"}}, "5a9c032cecf54bcc82e7e513f2df06fc": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "5ab4ced2d2af4d8b99579329b6d08851": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, 
"_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_1c89b25cd44d42d8b6eb2c8937ac96fe", "IPY_MODEL_42ea17def7cc48e59c0e0f95348555c4", "IPY_MODEL_671449dc36d847a2ad8de05053960192"], "layout": "IPY_MODEL_68a74fe8935b4009bf74be5b575d0c27"}}, "5bc08e9c52764c8eb90024a7553652f1": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "5edc7ec8b841473b920060032307385a": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "61398a1cc2df40cb993dcbadf134d6eb": {"model_module": "@jupyter-widgets/controls", 
"model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "6210e1a1628048b39561d7e5f684ab73": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "62258ba192b44f1782b24c2b3c6704da": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": 
null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "671449dc36d847a2ad8de05053960192": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_a88798c471b24f27b68b964b603bc4fa", "placeholder": "\u200b", "style": "IPY_MODEL_b4c14d3ba7174694bf9c2967ea5fa369", "value": " 1560/1563 [00:17<00:00, 88.36it/s]"}}, "68a74fe8935b4009bf74be5b575d0c27": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": 
null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "699fae0a08bb42fb944ad9d33aab171d": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "6a66e81e0cc845e696ce7ff3c0d01b7b": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "6af962b59cad4dba940f908fe07b961b": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": 
null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "6de03aba110e4897aad75f6052017fd1": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "6dfddf144e2d43428755da99ae5ade36": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, 
"top": null, "visibility": null, "width": null}}, "70799825c1db415f98624df354200512": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_da0599f60e9a462bad72a7a78c3832b8", "placeholder": "\u200b", "style": "IPY_MODEL_d0eb14e4e0594f82890b77087740a299", "value": "Validating: 100%"}}, "70d3ca125efb40aabb4e2f09f0d8673a": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "711ca9fe21654973ae92db9419db1252": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", 
"_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "715baf310fe648feb142396eecf38d0a": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_1cc3e5803d3a4657bcdd8fc1d061c12b", "placeholder": "\u200b", "style": "IPY_MODEL_4d0bbc3b172f458dbc05e627ab55422b", "value": " 1560/1563 [00:17<00:00, 87.18it/s]"}}, "772ed0b8cf8442c989145ce9f497f307": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", 
"description": "", "description_tooltip": null, "layout": "IPY_MODEL_9676b47b51cd408a93294f1744d9cea0", "placeholder": "\u200b", "style": "IPY_MODEL_f2f9d0ed7c854e2b846bf55b27d11b8a", "value": " 1560/1563 [00:17<00:00, 89.64it/s]"}}, "79c867abef4f483a806ae5fca70d480b": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_f2414c6fd3224202a1c15254d26a326e", "placeholder": "\u200b", "style": "IPY_MODEL_47eca2c448fd42cdbb4171118143b086", "value": "Validating: 100%"}}, "7a64b6cedb514aaba2da59fc403764de": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_c2138e3e88574b7dbec8aa95d9df0cd6", "placeholder": "\u200b", "style": "IPY_MODEL_c69aef2f63754111a0c7c556e6f06240", "value": " 3126/3126 [01:02<00:00, 49.85it/s, loss=6.37, v_num=0, valid_acc=0.627]"}}, "7c061e609d934ff898a6ecf8adca080c": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": 
null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "7cfd590006c94519a366a6d9d84f5175": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_c51d4d146a6d4181a06f30c9b357c634", "placeholder": "\u200b", "style": "IPY_MODEL_f1042eb12a7844d6a76a5313b589379d", "value": "Validating: 100%"}}, "7e6dd612c3094b56861bfbf839635c56": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "86a453d61d574ac1baa007882b7a6b0f": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": 
"DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "86cc8c84003d40b58f5a92580a3dbe16": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "874502aaeb7b4cd8b7f09e3dd432b9c2": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, 
"grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "87c36192b69043779c3db1bf5fee3872": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "8f5b3bb013e54b789487936589afaaaa": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": 
"StyleView", "bar_color": null, "description_width": ""}}, "925fcc0b20d747fd9f0d5ec004b07ff0": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_24987c3a0e9945e3aa4184de42cd8133", "max": 170498071.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_3436c7b40e684abbb6d5d925c1e3562c", "value": 170498071.0}}, "9676b47b51cd408a93294f1744d9cea0": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "98b44dcfc1de4e7ea715d9cae75c34c5": {"model_module": "@jupyter-widgets/base", "model_module_version": 
"1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "9a80a16ecded4902b414de0c6534eeec": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, 
"object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "9b8e8dd3fd5a46d786745a1851c72bbf": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "9f16f1a321e54049ad9e4341550e5642": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": 
null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "a0bcd7aa305e4919b63fee7e9a4c41cd": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "a113958c0fe445a0b3227b4c41bb54cf": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, 
"visibility": null, "width": null}}, "a43601c3ae434a4e9e7c6c7bf5043e40": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "a5de7871bbd1480e949558688be41c31": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_9a80a16ecded4902b414de0c6534eeec", "max": 1563.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_c86eb064ecde400d9d1a5e0ec6919112", "value": 1563.0}}, "a714651a443a41bea533c841965a0122": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": 
"FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_24e727294dec4d55b83d7d9bd834590f", "max": 1563.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_4fa52e476b6a463d9fbd3fe51fba722f", "value": 1563.0}}, "a88798c471b24f27b68b964b603bc4fa": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "ab99f6a13607433c846e0c8491ba5bfb": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, 
"_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "aba2a18665444538aa89282c2ac8df50": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_5edc7ec8b841473b920060032307385a", "placeholder": "\u200b", "style": "IPY_MODEL_408e2b530a9641e18ea5df659d08e4ae", "value": "Epoch 9: 100%"}}, "ac1fbe8bcd9241359f10d2eb1865bd94": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_384a2ed4bd214b6299151e6e870fb7fc", "max": 1563.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_479a86133e0e40dcad3f097243ad760c", "value": 1563.0}}, "aca0852b47ca4a55a2e2104bf21e8e87": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "acbddb30cb4346699a58b846a50d5c72": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": 
"LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "ad50fbd1f4be41f6935d8efbafe4da05": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "aef85224023d4c17bd6beef036b3bc95": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_0963635c7a054aa6b3d78746adca575e", "IPY_MODEL_a5de7871bbd1480e949558688be41c31", 
"IPY_MODEL_715baf310fe648feb142396eecf38d0a"], "layout": "IPY_MODEL_62258ba192b44f1782b24c2b3c6704da"}}, "af817170ed6943f18f5d497fbfb4fbf6": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_cea2bd49df4f4445aceafe78bd628574", "placeholder": "\u200b", "style": "IPY_MODEL_ab99f6a13607433c846e0c8491ba5bfb", "value": " 1560/1563 [00:17<00:00, 92.42it/s]"}}, "afb56e9b281d41eaa676543b2a9dc32c": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_dbf6e3b998a1419bbaabec661484e424", "placeholder": "\u200b", "style": "IPY_MODEL_a0bcd7aa305e4919b63fee7e9a4c41cd", "value": "Validating: 100%"}}, "b1f5934bc26f4f04a3eb235a87ec8d9c": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "b3cf8f790356444e811a7505b8d9418e": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", 
"_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "b4c14d3ba7174694bf9c2967ea5fa369": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "b6d3b98afbca43dda7d416208a651068": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, 
"grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "b76ee81572514e77b560271a3c505645": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_79c867abef4f483a806ae5fca70d480b", "IPY_MODEL_a714651a443a41bea533c841965a0122", "IPY_MODEL_772ed0b8cf8442c989145ce9f497f307"], "layout": "IPY_MODEL_b3cf8f790356444e811a7505b8d9418e"}}, "b8210703bcc4451e877bf84bb63d0520": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": 
null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "b969d392aae3406f98244c05ffc71752": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_afb56e9b281d41eaa676543b2a9dc32c", "IPY_MODEL_0ed93a7a201f484eaa6f8d7246a5038f", "IPY_MODEL_bf1aff0040a04b83ac127f15c82ea8bb"], "layout": "IPY_MODEL_e0eceb45524d4044a25b165087aa1167"}}, "bb46bed597e04aa68d65fa7583f0b2fb": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_ebef98d79fd84c7a8f9589c23a507c7f", "IPY_MODEL_1a3a9cc456654328b7a7bf78905af9b3", "IPY_MODEL_4eaacd5d1c9c4c2c91330d16285a3fdb"], "layout": "IPY_MODEL_98b44dcfc1de4e7ea715d9cae75c34c5"}}, "bb97a6ac530a452899a0323aa84cb8ea": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": 
"ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_be1548fdd13a40c1a50d943bdc0c6503", "max": 1563.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_8f5b3bb013e54b789487936589afaaaa", "value": 1563.0}}, "bc56a439a8c747419a9cfce366960df9": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_bd92bb6a660a4fccbb217a891fdfda3e", "IPY_MODEL_1e560bd4592943dabe0b4f5535a76933", "IPY_MODEL_be0a49f27744499e89140291c9a6f48f"], "layout": "IPY_MODEL_195c56daec194f64a8a6c318adef0af0"}}, "bd92bb6a660a4fccbb217a891fdfda3e": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_874502aaeb7b4cd8b7f09e3dd432b9c2", "placeholder": "\u200b", "style": "IPY_MODEL_24ead37777974d36bede94e54e270620", "value": "Validation sanity check: 0%"}}, "be0a49f27744499e89140291c9a6f48f": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": 
"IPY_MODEL_6dfddf144e2d43428755da99ae5ade36", "placeholder": "\u200b", "style": "IPY_MODEL_00ae340e2c934a289981b0fa1320a63c", "value": " 0/2 [00:00<?, ?it/s]"}}, "be1548fdd13a40c1a50d943bdc0c6503": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "bf1aff0040a04b83ac127f15c82ea8bb": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_47f1a317780d4bd080de45c16617045a", "placeholder": "\u200b", "style": "IPY_MODEL_61398a1cc2df40cb993dcbadf134d6eb", "value": " 1560/1563 [00:17<00:00, 88.37it/s]"}}, "bf7dfb92583341f4942256a769bb3c87": {"model_module": 
"@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "bfd5a2987c7e48f0ba3c06565fc43e16": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "c2138e3e88574b7dbec8aa95d9df0cd6": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, 
"display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "c39a8ce99b7f4f0dbc2c34aa53c972d2": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "c4516ed461704a70afb4dc46435a3f56": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": 
"@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_7c061e609d934ff898a6ecf8adca080c", "placeholder": "\u200b", "style": "IPY_MODEL_19e4d1afe39c4b3ca0f37b8851cc8707", "value": ""}}, "c51d4d146a6d4181a06f30c9b357c634": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "c69aef2f63754111a0c7c556e6f06240": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, 
"c86eb064ecde400d9d1a5e0ec6919112": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "cea2bd49df4f4445aceafe78bd628574": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "d0eb14e4e0594f82890b77087740a299": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", 
"description_width": ""}}, "d12a329b34864edea9fb3c511ca062fe": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "d31f5864c95a4fc5a83552e28a52d0c7": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "d621bcb9284e47e28c190e6a7781924d": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", 
"align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "d6dfa8b20f7c47ba8367a50953618cef": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_15d06f0222f441e58bb27b82be5b188f", "placeholder": "\u200b", "style": "IPY_MODEL_5bc08e9c52764c8eb90024a7553652f1", "value": " 1560/1563 [00:17<00:00, 89.27it/s]"}}, "d77d420abcbf47c0923ae5c54c44fa93": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_aba2a18665444538aa89282c2ac8df50", "IPY_MODEL_00648a26dbda4fd5a46e11eb2de65394", "IPY_MODEL_7a64b6cedb514aaba2da59fc403764de"], "layout": 
"IPY_MODEL_5a9c032cecf54bcc82e7e513f2df06fc"}}, "da0599f60e9a462bad72a7a78c3832b8": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "da2c2bcab50d42a4b69305ce45610d95": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": 
null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "db87d19eb9a14d00926944a0945a7e55": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "dbf6e3b998a1419bbaabec661484e424": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "dcaea45e34e741b6a90232516d5e5cc9": {"model_module": "@jupyter-widgets/base", 
"model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "e01d3ee23be94b33bc2eb290319c680a": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "e0eceb45524d4044a25b165087aa1167": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": 
null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "e1ffcef9fbd94b638001b8f6b09eaa24": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_86cc8c84003d40b58f5a92580a3dbe16", "placeholder": "\u200b", "style": "IPY_MODEL_555f5797cc10466da974bab15226644e", "value": " 170499072/? 
[00:01<00:00, 113379438.72it/s]"}}, "e4407841504c456da355ea8b54e4a43b": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "e82e94047cdf40649ad6d937c19b8a9c": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, 
"left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "eb4d88a3e74c4b8286414f889c809850": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_7cfd590006c94519a366a6d9d84f5175", "IPY_MODEL_ac1fbe8bcd9241359f10d2eb1865bd94", "IPY_MODEL_d6dfa8b20f7c47ba8367a50953618cef"], "layout": "IPY_MODEL_a43601c3ae434a4e9e7c6c7bf5043e40"}}, "ebef98d79fd84c7a8f9589c23a507c7f": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_b6d3b98afbca43dda7d416208a651068", "placeholder": "\u200b", "style": "IPY_MODEL_47d19a4a9d7d40a98ec8311b15742d30", "value": "100%"}}, "efee6a19f778444e987cf2f8b9c9e709": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": 
["IPY_MODEL_58a0aef8e87247a9a7251faa45b5a0e4", "IPY_MODEL_2b32eddc9ca547ceace73440308036a7", "IPY_MODEL_3809e6fe848843dfaaf6b9e7f5a08dc8"], "layout": "IPY_MODEL_da2c2bcab50d42a4b69305ce45610d95"}}, "f1042eb12a7844d6a76a5313b589379d": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "f2414c6fd3224202a1c15254d26a326e": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "f2f9d0ed7c854e2b846bf55b27d11b8a": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", 
"_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "f68bc350228c4e7397629524e9325f0d": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "f91e7c90408b4d189703088295affe7e": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "f9b913913c4b4491ac3bcf7fa35384ef": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "fb06c3f845574aeb8dc22e44961cd33f": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": 
null, "layout": "IPY_MODEL_acbddb30cb4346699a58b846a50d5c72", "placeholder": "\u200b", "style": "IPY_MODEL_4eb11692485a4c7aa6e6b08cf42af441", "value": "Validating: 100%"}}, "ff1843ce802446d587aa5d666f2fffb2": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_b8210703bcc4451e877bf84bb63d0520", "placeholder": "\u200b", "style": "IPY_MODEL_db87d19eb9a14d00926944a0945a7e55", "value": " 1560/1563 [00:17<00:00, 89.28it/s]"}}}, "version_major": 2, "version_minor": 0}}}, "nbformat": 4, "nbformat_minor": 5} \ No newline at end of file diff --git a/source/notebooks/lightning_examples/barlow-twins.ipynb b/source/notebooks/lightning_examples/barlow-twins.ipynb deleted file mode 100644 index cc46f85..0000000 --- a/source/notebooks/lightning_examples/barlow-twins.ipynb +++ /dev/null @@ -1 +0,0 @@ -{"cells": [{"cell_type": "markdown", "id": "9b0d3dbf", "metadata": {"papermill": {"duration": 0.012709, "end_time": "2021-10-25T20:00:43.480755", "exception": false, "start_time": "2021-10-25T20:00:43.468046", "status": "completed"}, "tags": []}, "source": ["\n", "# Barlow Twins Tutorial\n", "\n", "* **Author:** Ananya Harsh Jha (ananya@pytorchlightning.ai)\n", "* **License:** CC BY-SA\n", "* **Generated:** 2021-10-25T22:00:34.269471\n", "\n", "This notebook describes the self-supervised learning method Barlow Twins.\n", "Barlow Twins differs from other recently proposed algorithms as it doesn't\n", "fall under the category of either contrastive learning, or methods like knowledge\n", "distillation or clustering. 
The simplicity of the loss function and its effectiveness\n", "in comparison to the current state of the art makes Barlow Twins an interesting\n", "case study.\n", "\n", "\n", "---\n", "Open in [![Open In Colab](){height=\"20px\" width=\"117px\"}](https://colab.research.google.com/github/PytorchLightning/lightning-tutorials/blob/publication/.notebooks/lightning_examples/barlow-twins.ipynb)\n", "\n", "Give us a \u2b50 [on Github](https://www.github.com/PytorchLightning/pytorch-lightning/)\n", "| Check out [the documentation](https://pytorch-lightning.readthedocs.io/en/latest/)\n", "| Join us [on Slack](https://join.slack.com/t/pytorch-lightning/shared_invite/zt-pw5v393p-qRaDgEk24~EjiZNBpSQFgQ)"]}, {"cell_type": "markdown", "id": "a0f8a9cf", "metadata": {"papermill": {"duration": 0.011144, "end_time": "2021-10-25T20:00:43.503475", "exception": false, "start_time": "2021-10-25T20:00:43.492331", "status": "completed"}, "tags": []}, "source": ["## Setup\n", "This notebook requires some packages besides pytorch-lightning."]}, {"cell_type": "code", "execution_count": 1, "id": "9ba1fb3e", "metadata": {"colab": {}, "colab_type": "code", "execution": {"iopub.execute_input": "2021-10-25T20:00:43.529599Z", "iopub.status.busy": "2021-10-25T20:00:43.529097Z", "iopub.status.idle": "2021-10-25T20:00:43.531815Z", "shell.execute_reply": "2021-10-25T20:00:43.531280Z"}, "id": "LfrJLKPFyhsK", "lines_to_next_cell": 0, "papermill": {"duration": 0.017035, "end_time": "2021-10-25T20:00:43.531927", "exception": false, "start_time": "2021-10-25T20:00:43.514892", "status": "completed"}, "tags": []}, "outputs": [], "source": ["# ! 
pip install --quiet \"torch>=1.6, <1.9\" \"torchmetrics>=0.3\" \"torchvision\" \"matplotlib\" \"pytorch-lightning>=1.3\""]}, {"cell_type": "markdown", "id": "23d70cf8", "metadata": {"papermill": {"duration": 0.011167, "end_time": "2021-10-25T20:00:43.554606", "exception": false, "start_time": "2021-10-25T20:00:43.543439", "status": "completed"}, "tags": []}, "source": ["## Barlow Twins\n", "\n", "Barlow Twins finds itself in a unique place amongst the current state-of-the-art self-supervised learning methods. It does not fall under the existing categories of contrastive learning, knowledge distillation or clustering based methods. Instead, it creates its own category of redundancy reduction and achieves competitive performance with a simple yet effective loss function. In this tutorial, we look at coding up a small version of Barlow Twins algorithm using PyTorch Lightning."]}, {"cell_type": "code", "execution_count": 2, "id": "29341bf4", "metadata": {"execution": {"iopub.execute_input": "2021-10-25T20:00:43.584461Z", "iopub.status.busy": "2021-10-25T20:00:43.583974Z", "iopub.status.idle": "2021-10-25T20:00:44.983203Z", "shell.execute_reply": "2021-10-25T20:00:44.982750Z"}, "papermill": {"duration": 1.417567, "end_time": "2021-10-25T20:00:44.983322", "exception": false, "start_time": "2021-10-25T20:00:43.565755", "status": "completed"}, "tags": []}, "outputs": [], "source": ["from functools import partial\n", "from typing import Sequence, Tuple, Union\n", "\n", "import matplotlib.pyplot as plt\n", "import numpy as np\n", "import pytorch_lightning as pl\n", "import torch\n", "import torch.nn as nn\n", "import torch.nn.functional as F\n", "import torchvision.transforms as transforms\n", "import torchvision.transforms.functional as VisionF\n", "from pytorch_lightning import Callback, LightningModule, Trainer\n", "from pytorch_lightning.callbacks import ModelCheckpoint\n", "from pytorch_lightning.metrics.functional import accuracy\n", "from torch.utils.data import 
DataLoader\n", "from torchvision.datasets import CIFAR10\n", "from torchvision.models.resnet import resnet18\n", "from torchvision.utils import make_grid\n", "\n", "batch_size = 32\n", "num_workers = 0 # to run notebook on CPU\n", "max_epochs = 200\n", "z_dim = 128"]}, {"cell_type": "markdown", "id": "721a96db", "metadata": {"papermill": {"duration": 0.011192, "end_time": "2021-10-25T20:00:45.006236", "exception": false, "start_time": "2021-10-25T20:00:44.995044", "status": "completed"}, "tags": []}, "source": ["### Transforms\n", "\n", "We first define the data augmentation pipeline used in Barlow Twins. Here, we use the pipeline proposed in SimCLR, which generates two copies/views of an input image by applying the following transformations in a sequence.\n", "\n", "First it takes a random crop of the image and resizes it to a fixed pre-specified size. Then, it applies a left-to-right random flip with a probability of 0.5. This step is followed by a composition of color jitter, conversion to grayscale with a probability of 0.2 and the application of a Gaussian blur filter. Finally, we normalize the image and convert it to a tensor.\n", "\n", "Within this transform, we add a third view for our online finetuner, which we explain later on. 
But, to explain things quickly here, we add another transform to test our encoder on a downstream classification task."]}, {"cell_type": "code", "execution_count": 3, "id": "6cb8b894", "metadata": {"execution": {"iopub.execute_input": "2021-10-25T20:00:45.037011Z", "iopub.status.busy": "2021-10-25T20:00:45.030646Z", "iopub.status.idle": "2021-10-25T20:00:45.038691Z", "shell.execute_reply": "2021-10-25T20:00:45.039079Z"}, "papermill": {"duration": 0.021697, "end_time": "2021-10-25T20:00:45.039192", "exception": false, "start_time": "2021-10-25T20:00:45.017495", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class BarlowTwinsTransform:\n", " def __init__(self, train=True, input_height=224, gaussian_blur=True, jitter_strength=1.0, normalize=None):\n", "\n", " self.input_height = input_height\n", " self.gaussian_blur = gaussian_blur\n", " self.jitter_strength = jitter_strength\n", " self.normalize = normalize\n", " self.train = train\n", "\n", " color_jitter = transforms.ColorJitter(\n", " 0.8 * self.jitter_strength,\n", " 0.8 * self.jitter_strength,\n", " 0.8 * self.jitter_strength,\n", " 0.2 * self.jitter_strength,\n", " )\n", "\n", " color_transform = [transforms.RandomApply([color_jitter], p=0.8), transforms.RandomGrayscale(p=0.2)]\n", "\n", " if self.gaussian_blur:\n", " kernel_size = int(0.1 * self.input_height)\n", " if kernel_size % 2 == 0:\n", " kernel_size += 1\n", "\n", " color_transform.append(transforms.RandomApply([transforms.GaussianBlur(kernel_size=kernel_size)], p=0.5))\n", "\n", " self.color_transform = transforms.Compose(color_transform)\n", "\n", " if normalize is None:\n", " self.final_transform = transforms.ToTensor()\n", " else:\n", " self.final_transform = transforms.Compose([transforms.ToTensor(), normalize])\n", "\n", " self.transform = transforms.Compose(\n", " [\n", " transforms.RandomResizedCrop(self.input_height),\n", " transforms.RandomHorizontalFlip(p=0.5),\n", " self.color_transform,\n", " 
self.final_transform,\n", " ]\n", " )\n", "\n", " self.finetune_transform = None\n", " if self.train:\n", " self.finetune_transform = transforms.Compose(\n", " [\n", " transforms.RandomCrop(32, padding=4, padding_mode=\"reflect\"),\n", " transforms.RandomHorizontalFlip(),\n", " transforms.ToTensor(),\n", " ]\n", " )\n", " else:\n", " self.finetune_transform = transforms.ToTensor()\n", "\n", " def __call__(self, sample):\n", " return self.transform(sample), self.transform(sample), self.finetune_transform(sample)"]}, {"cell_type": "markdown", "id": "69b57f48", "metadata": {"papermill": {"duration": 0.011342, "end_time": "2021-10-25T20:00:45.061887", "exception": false, "start_time": "2021-10-25T20:00:45.050545", "status": "completed"}, "tags": []}, "source": ["### Dataset\n", "\n", "We select CIFAR10 as the dataset to demonstrate the pre-training process for Barlow Twins. CIFAR10 images are 32x32 in size and we do not apply a Gaussian blur transformation on them. In this step, we create the training and validation dataloaders for CIFAR10."]}, {"cell_type": "code", "execution_count": 4, "id": "273da819", "metadata": {"execution": {"iopub.execute_input": "2021-10-25T20:00:45.091605Z", "iopub.status.busy": "2021-10-25T20:00:45.086769Z", "iopub.status.idle": "2021-10-25T20:00:49.752232Z", "shell.execute_reply": "2021-10-25T20:00:49.751801Z"}, "papermill": {"duration": 4.679129, "end_time": "2021-10-25T20:00:49.752355", "exception": false, "start_time": "2021-10-25T20:00:45.073226", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to ./cifar-10-python.tar.gz\n"]}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "b13dfae7160c4c8586c5780f597cd8e4", "version_major": 2, "version_minor": 0}, "text/plain": [" 0%| | 0/170498071 [00:00"]}, "metadata": {}, "output_type": "display_data"}], "source": ["for batch in val_loader:\n", " (img1, 
img2, _), label = batch\n", " break\n", "\n", "img_grid = make_grid(img1, normalize=True)\n", "\n", "\n", "def show(imgs):\n", " if not isinstance(imgs, list):\n", " imgs = [imgs]\n", " fix, axs = plt.subplots(ncols=len(imgs), squeeze=False)\n", " for i, img in enumerate(imgs):\n", " img = img.detach()\n", " img = VisionF.to_pil_image(img)\n", " axs[0, i].imshow(np.asarray(img))\n", " axs[0, i].set(xticklabels=[], yticklabels=[], xticks=[], yticks=[])\n", "\n", "\n", "show(img_grid)"]}, {"cell_type": "markdown", "id": "a0233366", "metadata": {"papermill": {"duration": 0.018776, "end_time": "2021-10-25T20:00:50.033993", "exception": false, "start_time": "2021-10-25T20:00:50.015217", "status": "completed"}, "tags": []}, "source": ["### Barlow Twins Loss\n", "\n", "Here we define the loss function for Barlow Twins. It first normalizes the D-dimensional vectors from the projection head and then computes the DxD cross-correlation matrix between the normalized vectors of the 2 views of each image.\n", "\n", "Then it splits this cross-correlation matrix into two parts. The first part, the diagonal of this matrix is brought closer to 1, which pushes up the cosine similarity between the latent vectors of two views of each image, thus making the backbone invariant to the transformations applied to the views. The second part of the loss pushes the non-diagonal elements of the cross-correlation matrix closer to 0. 
This reduces the redundancy between the different dimensions of the latent vector."]}, {"cell_type": "code", "execution_count": 6, "id": "7f3f6369", "metadata": {"execution": {"iopub.execute_input": "2021-10-25T20:00:50.069422Z", "iopub.status.busy": "2021-10-25T20:00:50.068917Z", "iopub.status.idle": "2021-10-25T20:00:50.071108Z", "shell.execute_reply": "2021-10-25T20:00:50.070701Z"}, "papermill": {"duration": 0.02278, "end_time": "2021-10-25T20:00:50.071208", "exception": false, "start_time": "2021-10-25T20:00:50.048428", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class BarlowTwinsLoss(nn.Module):\n", " def __init__(self, batch_size, lambda_coeff=5e-3, z_dim=128):\n", " super().__init__()\n", "\n", " self.z_dim = z_dim\n", " self.batch_size = batch_size\n", " self.lambda_coeff = lambda_coeff\n", "\n", " def off_diagonal_ele(self, x):\n", " # taken from: https://github.com/facebookresearch/barlowtwins/blob/main/main.py\n", " # return a flattened view of the off-diagonal elements of a square matrix\n", " n, m = x.shape\n", " assert n == m\n", " return x.flatten()[:-1].view(n - 1, n + 1)[:, 1:].flatten()\n", "\n", " def forward(self, z1, z2):\n", " # N x D, where N is the batch size and D is output dim of projection head\n", " z1_norm = (z1 - torch.mean(z1, dim=0)) / torch.std(z1, dim=0)\n", " z2_norm = (z2 - torch.mean(z2, dim=0)) / torch.std(z2, dim=0)\n", "\n", " cross_corr = torch.matmul(z1_norm.T, z2_norm) / self.batch_size\n", "\n", " on_diag = torch.diagonal(cross_corr).add_(-1).pow_(2).sum()\n", " off_diag = self.off_diagonal_ele(cross_corr).pow_(2).sum()\n", "\n", " return on_diag + self.lambda_coeff * off_diag"]}, {"cell_type": "markdown", "id": "050c8b3c", "metadata": {"papermill": {"duration": 0.014594, "end_time": "2021-10-25T20:00:50.101352", "exception": false, "start_time": "2021-10-25T20:00:50.086758", "status": "completed"}, "tags": []}, "source": ["### Backbone\n", "\n", "This is a standard Resnet backbone that we pre-train 
using the Barlow Twins method. To accommodate the 32x32 CIFAR10 images, we replace the first 7x7 convolution of the Resnet backbone by a 3x3 filter. We also remove the first Maxpool layer from the network for CIFAR10 images."]}, {"cell_type": "code", "execution_count": 7, "id": "a1df9ad9", "metadata": {"execution": {"iopub.execute_input": "2021-10-25T20:00:50.134356Z", "iopub.status.busy": "2021-10-25T20:00:50.133886Z", "iopub.status.idle": "2021-10-25T20:00:50.315984Z", "shell.execute_reply": "2021-10-25T20:00:50.315481Z"}, "papermill": {"duration": 0.200049, "end_time": "2021-10-25T20:00:50.316105", "exception": false, "start_time": "2021-10-25T20:00:50.116056", "status": "completed"}, "tags": []}, "outputs": [], "source": ["encoder = resnet18()\n", "\n", "# for CIFAR10, replace the first 7x7 conv with smaller 3x3 conv and remove the first maxpool\n", "encoder.conv1 = nn.Conv2d(3, 64, kernel_size=3, stride=1, padding=1, bias=False)\n", "encoder.maxpool = nn.MaxPool2d(kernel_size=1, stride=1)\n", "\n", "# replace classification fc layer of Resnet to obtain representations from the backbone\n", "encoder.fc = nn.Identity()"]}, {"cell_type": "markdown", "id": "c85b1d8a", "metadata": {"papermill": {"duration": 0.014604, "end_time": "2021-10-25T20:00:50.345738", "exception": false, "start_time": "2021-10-25T20:00:50.331134", "status": "completed"}, "tags": []}, "source": ["### Projection head\n", "\n", "Unlike SimCLR and BYOL, the downstream performance of Barlow Twins greatly benefits from having a larger projection head after the backbone network. The paper utilizes a 3-layer MLP with 8192 hidden dimensions and 8192 as the output dimension of the projection head. For the purposes of the tutorial, we use a smaller projection head. 
But, it is imperative to mention here that in practice, Barlow Twins needs to be trained using a bigger projection head as it is highly sensitive to its architecture and output dimensionality."]}, {"cell_type": "code", "execution_count": 8, "id": "62392e1c", "metadata": {"execution": {"iopub.execute_input": "2021-10-25T20:00:50.379426Z", "iopub.status.busy": "2021-10-25T20:00:50.378950Z", "iopub.status.idle": "2021-10-25T20:00:50.380731Z", "shell.execute_reply": "2021-10-25T20:00:50.381114Z"}, "papermill": {"duration": 0.020782, "end_time": "2021-10-25T20:00:50.381232", "exception": false, "start_time": "2021-10-25T20:00:50.360450", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class ProjectionHead(nn.Module):\n", " def __init__(self, input_dim=2048, hidden_dim=2048, output_dim=128):\n", " super().__init__()\n", "\n", " self.projection_head = nn.Sequential(\n", " nn.Linear(input_dim, hidden_dim, bias=True),\n", " nn.BatchNorm1d(hidden_dim),\n", " nn.ReLU(),\n", " nn.Linear(hidden_dim, output_dim, bias=False),\n", " )\n", "\n", " def forward(self, x):\n", " return self.projection_head(x)"]}, {"cell_type": "markdown", "id": "3b69afcd", "metadata": {"papermill": {"duration": 0.014461, "end_time": "2021-10-25T20:00:50.410233", "exception": false, "start_time": "2021-10-25T20:00:50.395772", "status": "completed"}, "tags": []}, "source": ["### Learning rate warmup\n", "\n", "For the purposes of this tutorial, we keep things simple and use a linear warmup schedule with Adam optimizer. 
In our previous experiments we have found that the linear warmup part is much more important for the final performance of a model than the cosine decay component of the schedule."]}, {"cell_type": "code", "execution_count": 9, "id": "1df8bf31", "metadata": {"execution": {"iopub.execute_input": "2021-10-25T20:00:50.442982Z", "iopub.status.busy": "2021-10-25T20:00:50.442512Z", "iopub.status.idle": "2021-10-25T20:00:50.444620Z", "shell.execute_reply": "2021-10-25T20:00:50.444217Z"}, "papermill": {"duration": 0.019933, "end_time": "2021-10-25T20:00:50.444716", "exception": false, "start_time": "2021-10-25T20:00:50.424783", "status": "completed"}, "tags": []}, "outputs": [], "source": ["def fn(warmup_steps, step):\n", " if step < warmup_steps:\n", " return float(step) / float(max(1, warmup_steps))\n", " else:\n", " return 1.0\n", "\n", "\n", "def linear_warmup_decay(warmup_steps):\n", " return partial(fn, warmup_steps)"]}, {"cell_type": "markdown", "id": "0f165fdf", "metadata": {"papermill": {"duration": 0.014653, "end_time": "2021-10-25T20:00:50.473995", "exception": false, "start_time": "2021-10-25T20:00:50.459342", "status": "completed"}, "tags": []}, "source": ["### Barlow Twins Lightning Module\n", "\n", "We keep the LightningModule for Barlow Twins neat and simple. It takes in a backbone encoder and initializes the projection head and the loss function. 
We configure the optimizer and the learning rate scheduler in the ``configure_optimizers`` method."]}, {"cell_type": "code", "execution_count": 10, "id": "ad94b021", "metadata": {"execution": {"iopub.execute_input": "2021-10-25T20:00:50.511807Z", "iopub.status.busy": "2021-10-25T20:00:50.511324Z", "iopub.status.idle": "2021-10-25T20:00:50.513468Z", "shell.execute_reply": "2021-10-25T20:00:50.512978Z"}, "papermill": {"duration": 0.024798, "end_time": "2021-10-25T20:00:50.513565", "exception": false, "start_time": "2021-10-25T20:00:50.488767", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class BarlowTwins(LightningModule):\n", " def __init__(\n", " self,\n", " encoder,\n", " encoder_out_dim,\n", " num_training_samples,\n", " batch_size,\n", " lambda_coeff=5e-3,\n", " z_dim=128,\n", " learning_rate=1e-4,\n", " warmup_epochs=10,\n", " max_epochs=200,\n", " ):\n", " super().__init__()\n", "\n", " self.encoder = encoder\n", " self.projection_head = ProjectionHead(input_dim=encoder_out_dim, hidden_dim=encoder_out_dim, output_dim=z_dim)\n", " self.loss_fn = BarlowTwinsLoss(batch_size=batch_size, lambda_coeff=lambda_coeff, z_dim=z_dim)\n", "\n", " self.learning_rate = learning_rate\n", " self.warmup_epochs = warmup_epochs\n", " self.max_epochs = max_epochs\n", "\n", " self.train_iters_per_epoch = num_training_samples // batch_size\n", "\n", " def forward(self, x):\n", " return self.encoder(x)\n", "\n", " def shared_step(self, batch):\n", " (x1, x2, _), _ = batch\n", "\n", " z1 = self.projection_head(self.encoder(x1))\n", " z2 = self.projection_head(self.encoder(x2))\n", "\n", " return self.loss_fn(z1, z2)\n", "\n", " def training_step(self, batch, batch_idx):\n", " loss = self.shared_step(batch)\n", "\n", " self.log(\"train_loss\", loss.item(), on_step=True, on_epoch=False)\n", " return loss\n", "\n", " def validation_step(self, batch, batch_idx):\n", " loss = self.shared_step(batch)\n", "\n", " self.log(\"val_loss\", loss, on_step=False, 
on_epoch=True)\n", " return loss\n", "\n", " def configure_optimizers(self):\n", " optimizer = torch.optim.Adam(self.parameters(), lr=self.learning_rate)\n", "\n", " warmup_steps = self.train_iters_per_epoch * self.warmup_epochs\n", "\n", " scheduler = {\n", " \"scheduler\": torch.optim.lr_scheduler.LambdaLR(\n", " optimizer,\n", " linear_warmup_decay(warmup_steps),\n", " ),\n", " \"interval\": \"step\",\n", " \"frequency\": 1,\n", " }\n", "\n", " return [optimizer], [scheduler]"]}, {"cell_type": "markdown", "id": "5ec4d0aa", "metadata": {"papermill": {"duration": 0.014734, "end_time": "2021-10-25T20:00:50.543024", "exception": false, "start_time": "2021-10-25T20:00:50.528290", "status": "completed"}, "tags": []}, "source": ["### Evaluation\n", "\n", "We define a callback which appends a linear layer on top of the encoder and trains the classification evaluation head in an online manner. We make sure not to backpropagate the gradients back to the encoder while tuning the linear layer. This technique was used in SimCLR as well and they showed that the final downstream classification performance is pretty much similar to the results on online finetuning as the training progresses."]}, {"cell_type": "code", "execution_count": 11, "id": "f271c5a3", "metadata": {"execution": {"iopub.execute_input": "2021-10-25T20:00:50.582976Z", "iopub.status.busy": "2021-10-25T20:00:50.574339Z", "iopub.status.idle": "2021-10-25T20:00:50.585053Z", "shell.execute_reply": "2021-10-25T20:00:50.584582Z"}, "papermill": {"duration": 0.027403, "end_time": "2021-10-25T20:00:50.585148", "exception": false, "start_time": "2021-10-25T20:00:50.557745", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class OnlineFineTuner(Callback):\n", " def __init__(\n", " self,\n", " encoder_output_dim: int,\n", " num_classes: int,\n", " ) -> None:\n", " super().__init__()\n", "\n", " self.optimizer: torch.optim.Optimizer\n", "\n", " self.encoder_output_dim = encoder_output_dim\n", " 
self.num_classes = num_classes\n", "\n", " def on_pretrain_routine_start(self, trainer: pl.Trainer, pl_module: pl.LightningModule) -> None:\n", "\n", " # add linear_eval layer and optimizer\n", " pl_module.online_finetuner = nn.Linear(self.encoder_output_dim, self.num_classes).to(pl_module.device)\n", " self.optimizer = torch.optim.Adam(pl_module.online_finetuner.parameters(), lr=1e-4)\n", "\n", " def extract_online_finetuning_view(\n", " self, batch: Sequence, device: Union[str, torch.device]\n", " ) -> Tuple[torch.Tensor, torch.Tensor]:\n", " (_, _, finetune_view), y = batch\n", " finetune_view = finetune_view.to(device)\n", " y = y.to(device)\n", "\n", " return finetune_view, y\n", "\n", " def on_train_batch_end(\n", " self,\n", " trainer: pl.Trainer,\n", " pl_module: pl.LightningModule,\n", " outputs: Sequence,\n", " batch: Sequence,\n", " batch_idx: int,\n", " dataloader_idx: int,\n", " ) -> None:\n", " x, y = self.extract_online_finetuning_view(batch, pl_module.device)\n", "\n", " with torch.no_grad():\n", " feats = pl_module(x)\n", "\n", " feats = feats.detach()\n", " preds = pl_module.online_finetuner(feats)\n", " loss = F.cross_entropy(preds, y)\n", "\n", " loss.backward()\n", " self.optimizer.step()\n", " self.optimizer.zero_grad()\n", "\n", " acc = accuracy(F.softmax(preds, dim=1), y)\n", " pl_module.log(\"online_train_acc\", acc, on_step=True, on_epoch=False)\n", " pl_module.log(\"online_train_loss\", loss, on_step=True, on_epoch=False)\n", "\n", " def on_validation_batch_end(\n", " self,\n", " trainer: pl.Trainer,\n", " pl_module: pl.LightningModule,\n", " outputs: Sequence,\n", " batch: Sequence,\n", " batch_idx: int,\n", " dataloader_idx: int,\n", " ) -> None:\n", " x, y = self.extract_online_finetuning_view(batch, pl_module.device)\n", "\n", " with torch.no_grad():\n", " feats = pl_module(x)\n", "\n", " feats = feats.detach()\n", " preds = pl_module.online_finetuner(feats)\n", " loss = F.cross_entropy(preds, y)\n", "\n", " acc = 
accuracy(F.softmax(preds, dim=1), y)\n", " pl_module.log(\"online_val_acc\", acc, on_step=False, on_epoch=True, sync_dist=True)\n", " pl_module.log(\"online_val_loss\", loss, on_step=False, on_epoch=True, sync_dist=True)"]}, {"cell_type": "markdown", "id": "c7f6bb76", "metadata": {"papermill": {"duration": 0.014775, "end_time": "2021-10-25T20:00:50.614884", "exception": false, "start_time": "2021-10-25T20:00:50.600109", "status": "completed"}, "tags": []}, "source": ["Finally, we define the trainer for training the model. We pass in the ``train_loader`` and ``val_loader`` we had initialized earlier to the ``fit`` function."]}, {"cell_type": "code", "execution_count": 12, "id": "21965f37", "metadata": {"execution": {"iopub.execute_input": "2021-10-25T20:00:50.649228Z", "iopub.status.busy": "2021-10-25T20:00:50.648753Z", "iopub.status.idle": "2021-10-25T20:00:50.731321Z", "shell.execute_reply": "2021-10-25T20:00:50.730897Z"}, "papermill": {"duration": 0.101688, "end_time": "2021-10-25T20:00:50.731435", "exception": false, "start_time": "2021-10-25T20:00:50.629747", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/pytorch_lightning/callbacks/model_checkpoint.py:240: LightningDeprecationWarning: `ModelCheckpoint(every_n_val_epochs)` is deprecated in v1.4 and will be removed in v1.6. Please use `every_n_epochs` instead.\n", " rank_zero_deprecation(\n", "/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/pytorch_lightning/callbacks/model_checkpoint.py:432: UserWarning: ModelCheckpoint(save_last=True, save_top_k=None, monitor=None) is a redundant configuration. 
You can save the last checkpoint with ModelCheckpoint(save_top_k=None, monitor=None).\n", " rank_zero_warn(\n", "ModelCheckpoint(save_last=True, save_top_k=-1, monitor=None) will duplicate the last checkpoint saved.\n"]}, {"name": "stderr", "output_type": "stream", "text": ["/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/pytorch_lightning/trainer/connectors/accelerator_connector.py:746: UserWarning: You requested multiple GPUs but did not specify a backend, e.g. `Trainer(accelerator=\"dp\"|\"ddp\"|\"ddp2\")`. Setting `accelerator=\"ddp_spawn\"` for you.\n", " rank_zero_warn(\n", "Using native 16bit precision.\n"]}, {"name": "stderr", "output_type": "stream", "text": ["GPU available: True, used: True\n"]}, {"name": "stderr", "output_type": "stream", "text": ["TPU available: False, using: 0 TPU cores\n"]}, {"name": "stderr", "output_type": "stream", "text": ["IPU available: False, using: 0 IPUs\n"]}], "source": ["encoder_out_dim = 512\n", "\n", "model = BarlowTwins(\n", " encoder=encoder,\n", " encoder_out_dim=encoder_out_dim,\n", " num_training_samples=len(train_dataset),\n", " batch_size=batch_size,\n", " z_dim=z_dim,\n", ")\n", "\n", "online_finetuner = OnlineFineTuner(encoder_output_dim=encoder_out_dim, num_classes=10)\n", "checkpoint_callback = ModelCheckpoint(every_n_val_epochs=100, save_top_k=-1, save_last=True)\n", "\n", "trainer = Trainer(\n", " max_epochs=max_epochs,\n", " gpus=torch.cuda.device_count(),\n", " precision=16 if torch.cuda.device_count() > 0 else 32,\n", " callbacks=[online_finetuner, checkpoint_callback],\n", ")\n", "\n", "# uncomment this to train the model\n", "# this is done for the tutorial so that the notebook compiles\n", "# trainer.fit(model, train_loader, val_loader)"]}, {"cell_type": "markdown", "id": "9cb9b57c", "metadata": {"papermill": {"duration": 0.016005, "end_time": "2021-10-25T20:00:50.763854", "exception": false, "start_time": "2021-10-25T20:00:50.747849", "status": "completed"}, "tags": []}, "source": ["### 
Using the trained encoder for downstream tasks\n", "\n", "Once the encoder is pretrained on CIFAR10, we can use it to get image embeddings and use them further downstream on tasks like classification, detection, segmentation, etc.\n", "\n", "In this tutorial, we did not completely train our encoder for 100s of epochs using the Barlow Twins pretraining method. So, we will load the pretrained encoder weights from a checkpoint and show the image embeddings obtained from that.\n", "\n", "To create this checkpoint, the encoder was pretrained for 200 epochs, and obtained an online finetune accuracy of x% on CIFAR-10."]}, {"cell_type": "code", "execution_count": 13, "id": "bc2dfce3", "metadata": {"execution": {"iopub.execute_input": "2021-10-25T20:00:50.800041Z", "iopub.status.busy": "2021-10-25T20:00:50.799564Z", "iopub.status.idle": "2021-10-25T20:00:51.171031Z", "shell.execute_reply": "2021-10-25T20:00:51.170535Z"}, "papermill": {"duration": 0.391254, "end_time": "2021-10-25T20:00:51.171147", "exception": false, "start_time": "2021-10-25T20:00:50.779893", "status": "completed"}, "tags": []}, "outputs": [{"name": "stdout", "output_type": "stream", "text": ["torch.Size([4, 512])\n"]}], "source": ["# ckpt_model = torch.load('') # upload checkpoint to aws\n", "# encoder = ckpt_model.encoder\n", "encoder = model.encoder\n", "\n", "downstream_dataset = CIFAR10(root=\".\", train=False, transform=transforms.ToTensor())\n", "dataloader = DataLoader(downstream_dataset, batch_size=4, shuffle=False)\n", "\n", "for batch in dataloader:\n", " img, label = batch\n", " print(encoder(img).shape)\n", " break"]}, {"cell_type": "markdown", "id": "68078df0", "metadata": {"papermill": {"duration": 0.01633, "end_time": "2021-10-25T20:00:51.204343", "exception": false, "start_time": "2021-10-25T20:00:51.188013", "status": "completed"}, "tags": []}, "source": ["## Congratulations - Time to Join the Community!\n", "\n", "Congratulations on completing this notebook tutorial! 
If you enjoyed this and would like to join the Lightning\n", "movement, you can do so in the following ways!\n", "\n", "### Star [Lightning](https://github.com/PyTorchLightning/pytorch-lightning) on GitHub\n", "The easiest way to help our community is just by starring the GitHub repos! This helps raise awareness of the cool\n", "tools we're building.\n", "\n", "### Join our [Slack](https://join.slack.com/t/pytorch-lightning/shared_invite/zt-pw5v393p-qRaDgEk24~EjiZNBpSQFgQ)!\n", "The best way to keep up to date on the latest advancements is to join our community! Make sure to introduce yourself\n", "and share your interests in `#general` channel\n", "\n", "\n", "### Contributions !\n", "The best way to contribute to our community is to become a code contributor! At any time you can go to\n", "[Lightning](https://github.com/PyTorchLightning/pytorch-lightning) or [Bolt](https://github.com/PyTorchLightning/lightning-bolts)\n", "GitHub Issues page and filter for \"good first issue\".\n", "\n", "* [Lightning good first issue](https://github.com/PyTorchLightning/pytorch-lightning/issues?q=is%3Aopen+is%3Aissue+label%3A%22good+first+issue%22)\n", "* [Bolt good first issue](https://github.com/PyTorchLightning/lightning-bolts/issues?q=is%3Aopen+is%3Aissue+label%3A%22good+first+issue%22)\n", "* You can also contribute your own notebooks with useful examples !\n", "\n", "### Great thanks from the entire Pytorch Lightning Team for your interest !\n", "\n", "![Pytorch Lightning](){height=\"60px\" width=\"240px\"}"]}, {"cell_type": "raw", "metadata": {"raw_mimetype": "text/restructuredtext"}, "source": [".. customcarditem::\n", " :header: Barlow Twins Tutorial\n", " :card_description: This notebook describes the self-supervised learning method Barlow Twins. 
Barlow Twins differs from other recently proposed algorithms as it doesn't fall under the category of...\n", " :tags: Image,Self-Supervised,GPU/TPU,Lightning-Examples"]}], "metadata": {"jupytext": {"cell_metadata_filter": "colab_type,id,colab,-all", "formats": "ipynb,py:percent", "main_language": "python"}, "language_info": {"codemirror_mode": {"name": "ipython", "version": 3}, "file_extension": ".py", "mimetype": "text/x-python", "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.9.7"}, "papermill": {"default_parameters": {}, "duration": 9.405997, "end_time": "2021-10-25T20:00:51.627704", "environment_variables": {}, "exception": null, "input_path": "lightning_examples/barlow-twins/barlow_twins.ipynb", "output_path": ".notebooks/lightning_examples/barlow-twins.ipynb", "parameters": {}, "start_time": "2021-10-25T20:00:42.221707", "version": "2.3.3"}, "widgets": {"application/vnd.jupyter.widget-state+json": {"state": {"3365e6cc23b14f7480580fbdbd5bc019": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, 
"overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "3882c1fab7874567af01f5ca5b6b5529": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "431aeabf10b2446bb97010d31753e44e": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, 
"grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "4bb27c7671944b6e97113a02c0341e2c": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "7ddd35cbfb3845b1a206ac0fcbdbfc85": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_3365e6cc23b14f7480580fbdbd5bc019", "placeholder": "\u200b", "style": "IPY_MODEL_4bb27c7671944b6e97113a02c0341e2c", "value": ""}}, "7f3c22706f004367af15c8839b531c8a": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "a75cd1c0f8504f44a015affaa4e54a48": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", 
"model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_431aeabf10b2446bb97010d31753e44e", "placeholder": "\u200b", "style": "IPY_MODEL_d8f730207f83419cb86c5c93f4f7584e", "value": " 170499072/? [00:01<00:00, 116151155.58it/s]"}}, "b13dfae7160c4c8586c5780f597cd8e4": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_7ddd35cbfb3845b1a206ac0fcbdbfc85", "IPY_MODEL_eca693d1c480402d8c204656916344ad", "IPY_MODEL_a75cd1c0f8504f44a015affaa4e54a48"], "layout": "IPY_MODEL_3882c1fab7874567af01f5ca5b6b5529"}}, "bd170e01fdeb46d4aff4afb77af815fd": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, 
"left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "d8f730207f83419cb86c5c93f4f7584e": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "eca693d1c480402d8c204656916344ad": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_bd170e01fdeb46d4aff4afb77af815fd", "max": 170498071.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_7f3c22706f004367af15c8839b531c8a", "value": 170498071.0}}}, "version_major": 2, "version_minor": 0}}}, "nbformat": 4, "nbformat_minor": 5} \ No newline at end of file diff --git a/source/notebooks/lightning_examples/basic-gan.ipynb b/source/notebooks/lightning_examples/basic-gan.ipynb deleted file mode 100644 index 6562784..0000000 --- a/source/notebooks/lightning_examples/basic-gan.ipynb +++ /dev/null @@ -1 +0,0 @@ -{"cells": [{"cell_type": "markdown", "id": "e931dfa6", "metadata": {"papermill": {"duration": 0.026978, "end_time": "2021-12-04T16:31:12.165165", "exception": false, "start_time": 
"2021-12-04T16:31:12.138187", "status": "completed"}, "tags": []}, "source": ["\n", "# PyTorch Lightning Basic GAN Tutorial\n", "\n", "* **Author:** PL team\n", "* **License:** CC BY-SA\n", "* **Generated:** 2021-12-04T16:52:58.309356\n", "\n", "How to train a GAN!\n", "\n", "Main takeaways:\n", "1. Generator and discriminator are arbitrary PyTorch modules.\n", "2. training_step does both the generator and discriminator training.\n", "\n", "\n", "---\n", "Open in [![Open In Colab](){height=\"20px\" width=\"117px\"}](https://colab.research.google.com/github/PytorchLightning/lightning-tutorials/blob/publication/.notebooks/lightning_examples/basic-gan.ipynb)\n", "\n", "Give us a \u2b50 [on Github](https://www.github.com/PytorchLightning/pytorch-lightning/)\n", "| Check out [the documentation](https://pytorch-lightning.readthedocs.io/en/latest/)\n", "| Join us [on Slack](https://join.slack.com/t/pytorch-lightning/shared_invite/zt-pw5v393p-qRaDgEk24~EjiZNBpSQFgQ)"]}, {"cell_type": "markdown", "id": "bb4e55df", "metadata": {"papermill": {"duration": 0.024834, "end_time": "2021-12-04T16:31:12.216179", "exception": false, "start_time": "2021-12-04T16:31:12.191345", "status": "completed"}, "tags": []}, "source": ["## Setup\n", "This notebook requires some packages besides pytorch-lightning."]}, {"cell_type": "code", "execution_count": 1, "id": "194d85bf", "metadata": {"colab": {}, "colab_type": "code", "execution": {"iopub.execute_input": "2021-12-04T16:31:12.271333Z", "iopub.status.busy": "2021-12-04T16:31:12.270849Z", "iopub.status.idle": "2021-12-04T16:31:15.189840Z", "shell.execute_reply": "2021-12-04T16:31:15.190229Z"}, "id": "LfrJLKPFyhsK", "lines_to_next_cell": 0, "papermill": {"duration": 2.950578, "end_time": "2021-12-04T16:31:15.190518", "exception": false, "start_time": "2021-12-04T16:31:12.239940", "status": "completed"}, "tags": []}, "outputs": [], "source": ["! 
pip install --quiet \"pytorch-lightning>=1.3\" \"torchmetrics>=0.3\" \"torchvision\" \"torch>=1.6, <1.9\""]}, {"cell_type": "code", "execution_count": 2, "id": "15a6b707", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:31:15.245721Z", "iopub.status.busy": "2021-12-04T16:31:15.245214Z", "iopub.status.idle": "2021-12-04T16:31:16.576617Z", "shell.execute_reply": "2021-12-04T16:31:16.576153Z"}, "papermill": {"duration": 1.360833, "end_time": "2021-12-04T16:31:16.576756", "exception": false, "start_time": "2021-12-04T16:31:15.215923", "status": "completed"}, "tags": []}, "outputs": [], "source": ["import os\n", "from collections import OrderedDict\n", "\n", "import numpy as np\n", "import torch\n", "import torch.nn as nn\n", "import torch.nn.functional as F\n", "import torchvision\n", "import torchvision.transforms as transforms\n", "from pytorch_lightning import LightningDataModule, LightningModule, Trainer\n", "from torch.utils.data import DataLoader, random_split\n", "from torchvision.datasets import MNIST\n", "\n", "PATH_DATASETS = os.environ.get(\"PATH_DATASETS\", \".\")\n", "AVAIL_GPUS = min(1, torch.cuda.device_count())\n", "BATCH_SIZE = 256 if AVAIL_GPUS else 64\n", "NUM_WORKERS = int(os.cpu_count() / 2)"]}, {"cell_type": "markdown", "id": "f96cbcf4", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.023734, "end_time": "2021-12-04T16:31:16.625285", "exception": false, "start_time": "2021-12-04T16:31:16.601551", "status": "completed"}, "tags": []}, "source": ["### MNIST DataModule\n", "\n", "Below, we define a DataModule for the MNIST Dataset. 
To learn more about DataModules, check out our tutorial\n", "on them or see the [latest docs](https://pytorch-lightning.readthedocs.io/en/latest/extensions/datamodules.html)."]}, {"cell_type": "code", "execution_count": 3, "id": "a42b438c", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:31:16.681426Z", "iopub.status.busy": "2021-12-04T16:31:16.680944Z", "iopub.status.idle": "2021-12-04T16:31:16.682821Z", "shell.execute_reply": "2021-12-04T16:31:16.682406Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 0.034042, "end_time": "2021-12-04T16:31:16.682921", "exception": false, "start_time": "2021-12-04T16:31:16.648879", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class MNISTDataModule(LightningDataModule):\n", " def __init__(\n", " self,\n", " data_dir: str = PATH_DATASETS,\n", " batch_size: int = BATCH_SIZE,\n", " num_workers: int = NUM_WORKERS,\n", " ):\n", " super().__init__()\n", " self.data_dir = data_dir\n", " self.batch_size = batch_size\n", " self.num_workers = num_workers\n", "\n", " self.transform = transforms.Compose(\n", " [\n", " transforms.ToTensor(),\n", " transforms.Normalize((0.1307,), (0.3081,)),\n", " ]\n", " )\n", "\n", " # self.dims is returned when you call dm.size()\n", " # Setting default dims here because we know them.\n", " # Could optionally be assigned dynamically in dm.setup()\n", " self.dims = (1, 28, 28)\n", " self.num_classes = 10\n", "\n", " def prepare_data(self):\n", " # download\n", " MNIST(self.data_dir, train=True, download=True)\n", " MNIST(self.data_dir, train=False, download=True)\n", "\n", " def setup(self, stage=None):\n", " # Assign train/val datasets for use in dataloaders\n", " if stage == \"fit\" or stage is None:\n", " mnist_full = MNIST(self.data_dir, train=True, transform=self.transform)\n", " self.mnist_train, self.mnist_val = random_split(mnist_full, [55000, 5000])\n", "\n", " # Assign test dataset for use in dataloader(s)\n", " if stage == \"test\" or stage is None:\n", " 
self.mnist_test = MNIST(self.data_dir, train=False, transform=self.transform)\n", "\n", " def train_dataloader(self):\n", " return DataLoader(\n", " self.mnist_train,\n", " batch_size=self.batch_size,\n", " num_workers=self.num_workers,\n", " )\n", "\n", " def val_dataloader(self):\n", " return DataLoader(self.mnist_val, batch_size=self.batch_size, num_workers=self.num_workers)\n", "\n", " def test_dataloader(self):\n", " return DataLoader(self.mnist_test, batch_size=self.batch_size, num_workers=self.num_workers)"]}, {"cell_type": "markdown", "id": "46774b1a", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.023599, "end_time": "2021-12-04T16:31:16.730307", "exception": false, "start_time": "2021-12-04T16:31:16.706708", "status": "completed"}, "tags": []}, "source": ["### A. Generator"]}, {"cell_type": "code", "execution_count": 4, "id": "fbe0fd0f", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:31:16.783691Z", "iopub.status.busy": "2021-12-04T16:31:16.783213Z", "iopub.status.idle": "2021-12-04T16:31:16.784820Z", "shell.execute_reply": "2021-12-04T16:31:16.785196Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 0.031187, "end_time": "2021-12-04T16:31:16.785309", "exception": false, "start_time": "2021-12-04T16:31:16.754122", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class Generator(nn.Module):\n", " def __init__(self, latent_dim, img_shape):\n", " super().__init__()\n", " self.img_shape = img_shape\n", "\n", " def block(in_feat, out_feat, normalize=True):\n", " layers = [nn.Linear(in_feat, out_feat)]\n", " if normalize:\n", " layers.append(nn.BatchNorm1d(out_feat, 0.8))\n", " layers.append(nn.LeakyReLU(0.2, inplace=True))\n", " return layers\n", "\n", " self.model = nn.Sequential(\n", " *block(latent_dim, 128, normalize=False),\n", " *block(128, 256),\n", " *block(256, 512),\n", " *block(512, 1024),\n", " nn.Linear(1024, int(np.prod(img_shape))),\n", " nn.Tanh(),\n", " )\n", "\n", " def forward(self, 
z):\n", " img = self.model(z)\n", " img = img.view(img.size(0), *self.img_shape)\n", " return img"]}, {"cell_type": "markdown", "id": "858d80f0", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.024118, "end_time": "2021-12-04T16:31:16.833616", "exception": false, "start_time": "2021-12-04T16:31:16.809498", "status": "completed"}, "tags": []}, "source": ["### B. Discriminator"]}, {"cell_type": "code", "execution_count": 5, "id": "08a9d3be", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:31:16.887890Z", "iopub.status.busy": "2021-12-04T16:31:16.887416Z", "iopub.status.idle": "2021-12-04T16:31:16.889412Z", "shell.execute_reply": "2021-12-04T16:31:16.889038Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 0.030604, "end_time": "2021-12-04T16:31:16.889510", "exception": false, "start_time": "2021-12-04T16:31:16.858906", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class Discriminator(nn.Module):\n", " def __init__(self, img_shape):\n", " super().__init__()\n", "\n", " self.model = nn.Sequential(\n", " nn.Linear(int(np.prod(img_shape)), 512),\n", " nn.LeakyReLU(0.2, inplace=True),\n", " nn.Linear(512, 256),\n", " nn.LeakyReLU(0.2, inplace=True),\n", " nn.Linear(256, 1),\n", " nn.Sigmoid(),\n", " )\n", "\n", " def forward(self, img):\n", " img_flat = img.view(img.size(0), -1)\n", " validity = self.model(img_flat)\n", "\n", " return validity"]}, {"cell_type": "markdown", "id": "087e93db", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.023955, "end_time": "2021-12-04T16:31:16.937896", "exception": false, "start_time": "2021-12-04T16:31:16.913941", "status": "completed"}, "tags": []}, "source": ["### C. GAN\n", "\n", "#### A couple of cool features to check out in this example...\n", "\n", " - We use `some_tensor.type_as(another_tensor)` to make sure we initialize new tensors on the right device (i.e. 
GPU, CPU).\n", " - Lightning will put your dataloader data on the right device automatically\n", " - In this example, we pull from latent dim on the fly, so we need to dynamically add tensors to the right device.\n", " - `type_as` is the way we recommend to do this.\n", " - This example shows how to use multiple dataloaders in your `LightningModule`."]}, {"cell_type": "code", "execution_count": 6, "id": "dc2ed597", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:31:16.999160Z", "iopub.status.busy": "2021-12-04T16:31:16.988365Z", "iopub.status.idle": "2021-12-04T16:31:17.001905Z", "shell.execute_reply": "2021-12-04T16:31:17.001522Z"}, "papermill": {"duration": 0.040067, "end_time": "2021-12-04T16:31:17.002009", "exception": false, "start_time": "2021-12-04T16:31:16.961942", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class GAN(LightningModule):\n", " def __init__(\n", " self,\n", " channels,\n", " width,\n", " height,\n", " latent_dim: int = 100,\n", " lr: float = 0.0002,\n", " b1: float = 0.5,\n", " b2: float = 0.999,\n", " batch_size: int = BATCH_SIZE,\n", " **kwargs\n", " ):\n", " super().__init__()\n", " self.save_hyperparameters()\n", "\n", " # networks\n", " data_shape = (channels, width, height)\n", " self.generator = Generator(latent_dim=self.hparams.latent_dim, img_shape=data_shape)\n", " self.discriminator = Discriminator(img_shape=data_shape)\n", "\n", " self.validation_z = torch.randn(8, self.hparams.latent_dim)\n", "\n", " self.example_input_array = torch.zeros(2, self.hparams.latent_dim)\n", "\n", " def forward(self, z):\n", " return self.generator(z)\n", "\n", " def adversarial_loss(self, y_hat, y):\n", " return F.binary_cross_entropy(y_hat, y)\n", "\n", " def training_step(self, batch, batch_idx, optimizer_idx):\n", " imgs, _ = batch\n", "\n", " # sample noise\n", " z = torch.randn(imgs.shape[0], self.hparams.latent_dim)\n", " z = z.type_as(imgs)\n", "\n", " # train generator\n", " if optimizer_idx == 0:\n", "\n", 
" # generate images\n", " self.generated_imgs = self(z)\n", "\n", " # log sampled images\n", " sample_imgs = self.generated_imgs[:6]\n", " grid = torchvision.utils.make_grid(sample_imgs)\n", " self.logger.experiment.add_image(\"generated_images\", grid, 0)\n", "\n", " # ground truth result (ie: all fake)\n", " # put on GPU because we created this tensor inside training_loop\n", " valid = torch.ones(imgs.size(0), 1)\n", " valid = valid.type_as(imgs)\n", "\n", " # adversarial loss is binary cross-entropy\n", " g_loss = self.adversarial_loss(self.discriminator(self(z)), valid)\n", " tqdm_dict = {\"g_loss\": g_loss}\n", " output = OrderedDict({\"loss\": g_loss, \"progress_bar\": tqdm_dict, \"log\": tqdm_dict})\n", " return output\n", "\n", " # train discriminator\n", " if optimizer_idx == 1:\n", " # Measure discriminator's ability to classify real from generated samples\n", "\n", " # how well can it label as real?\n", " valid = torch.ones(imgs.size(0), 1)\n", " valid = valid.type_as(imgs)\n", "\n", " real_loss = self.adversarial_loss(self.discriminator(imgs), valid)\n", "\n", " # how well can it label as fake?\n", " fake = torch.zeros(imgs.size(0), 1)\n", " fake = fake.type_as(imgs)\n", "\n", " fake_loss = self.adversarial_loss(self.discriminator(self(z).detach()), fake)\n", "\n", " # discriminator loss is the average of these\n", " d_loss = (real_loss + fake_loss) / 2\n", " tqdm_dict = {\"d_loss\": d_loss}\n", " output = OrderedDict({\"loss\": d_loss, \"progress_bar\": tqdm_dict, \"log\": tqdm_dict})\n", " return output\n", "\n", " def configure_optimizers(self):\n", " lr = self.hparams.lr\n", " b1 = self.hparams.b1\n", " b2 = self.hparams.b2\n", "\n", " opt_g = torch.optim.Adam(self.generator.parameters(), lr=lr, betas=(b1, b2))\n", " opt_d = torch.optim.Adam(self.discriminator.parameters(), lr=lr, betas=(b1, b2))\n", " return [opt_g, opt_d], []\n", "\n", " def on_epoch_end(self):\n", " z = self.validation_z.type_as(self.generator.model[0].weight)\n", "\n", " # log 
sampled images\n", " sample_imgs = self(z)\n", " grid = torchvision.utils.make_grid(sample_imgs)\n", " self.logger.experiment.add_image(\"generated_images\", grid, self.current_epoch)"]}, {"cell_type": "code", "execution_count": 7, "id": "139fbdbb", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:31:17.053387Z", "iopub.status.busy": "2021-12-04T16:31:17.052920Z", "iopub.status.idle": "2021-12-04T16:31:40.163711Z", "shell.execute_reply": "2021-12-04T16:31:40.164113Z"}, "papermill": {"duration": 23.13819, "end_time": "2021-12-04T16:31:40.164285", "exception": false, "start_time": "2021-12-04T16:31:17.026095", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/pytorch_lightning/core/datamodule.py:175: LightningDeprecationWarning: DataModule property `dims` was deprecated in v1.5 and will be removed in v1.7.\n", " rank_zero_deprecation(\"DataModule property `dims` was deprecated in v1.5 and will be removed in v1.7.\")\n", "/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/pytorch_lightning/core/datamodule.py:184: LightningDeprecationWarning: DataModule property `size` was deprecated in v1.5 and will be removed in v1.7.\n", " rank_zero_deprecation(\"DataModule property `size` was deprecated in v1.5 and will be removed in v1.7.\")\n", "/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/pytorch_lightning/core/datamodule.py:170: LightningDeprecationWarning: DataModule property `dims` was deprecated in v1.5 and will be removed in v1.7.\n", " rank_zero_deprecation(\"DataModule property `dims` was deprecated in v1.5 and will be removed in v1.7.\")\n", "/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/pytorch_lightning/trainer/connectors/callback_connector.py:90: LightningDeprecationWarning: Setting `Trainer(progress_bar_refresh_rate=20)` is deprecated in v1.5 and will be removed in v1.7. 
Please pass `pytorch_lightning.callbacks.progress.TQDMProgressBar` with `refresh_rate` directly to the Trainer's `callbacks` argument instead. Or, to disable the progress bar pass `enable_progress_bar = False` to the Trainer.\n", " rank_zero_deprecation(\n", "GPU available: True, used: True\n"]}, {"name": "stderr", "output_type": "stream", "text": ["TPU available: False, using: 0 TPU cores\n"]}, {"name": "stderr", "output_type": "stream", "text": ["IPU available: False, using: 0 IPUs\n"]}, {"name": "stderr", "output_type": "stream", "text": ["/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/pytorch_lightning/trainer/configuration_validator.py:116: UserWarning: You passed in a `val_dataloader` but have no `validation_step`. Skipping val loop.\n", " rank_zero_warn(\"You passed in a `val_dataloader` but have no `validation_step`. Skipping val loop.\")\n", "LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n"]}, {"name": "stderr", "output_type": "stream", "text": ["\n", " | Name | Type | Params | In sizes | Out sizes \n", "----------------------------------------------------------------------------\n", "0 | generator | Generator | 1.5 M | [2, 100] | [2, 1, 28, 28]\n", "1 | discriminator | Discriminator | 533 K | ? | ? \n", "----------------------------------------------------------------------------\n", "2.0 M Trainable params\n", "0 Non-trainable params\n", "2.0 M Total params\n", "8.174 Total estimated model params size (MB)\n"]}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "76879ff1edbb4c10a39a477697fe2c18", "version_major": 2, "version_minor": 0}, "text/plain": ["Training: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"name": "stderr", "output_type": "stream", "text": ["/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/pytorch_lightning/loops/optimization/closure.py:35: LightningDeprecationWarning: One of the returned values {'progress_bar', 'log'} has a `grad_fn`. 
We will detach it automatically but this behaviour will change in v1.6. Please detach it manually: `return {'loss': ..., 'something': something.detach()}`\n", " rank_zero_deprecation(\n"]}], "source": ["dm = MNISTDataModule()\n", "model = GAN(*dm.size())\n", "trainer = Trainer(gpus=AVAIL_GPUS, max_epochs=5, progress_bar_refresh_rate=20)\n", "trainer.fit(model, dm)"]}, {"cell_type": "code", "execution_count": 8, "id": "a1c00604", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:31:40.230047Z", "iopub.status.busy": "2021-12-04T16:31:40.229583Z", "iopub.status.idle": "2021-12-04T16:31:41.785539Z", "shell.execute_reply": "2021-12-04T16:31:41.785929Z"}, "papermill": {"duration": 1.590294, "end_time": "2021-12-04T16:31:41.786093", "exception": false, "start_time": "2021-12-04T16:31:40.195799", "status": "completed"}, "tags": []}, "outputs": [{"data": {"text/html": ["\n", " \n", " \n", " "], "text/plain": [""]}, "metadata": {}, "output_type": "display_data"}], "source": ["# Start tensorboard.\n", "%load_ext tensorboard\n", "%tensorboard --logdir lightning_logs/"]}, {"cell_type": "markdown", "id": "880bb312", "metadata": {"papermill": {"duration": 0.031498, "end_time": "2021-12-04T16:31:41.850435", "exception": false, "start_time": "2021-12-04T16:31:41.818937", "status": "completed"}, "tags": []}, "source": ["## Congratulations - Time to Join the Community!\n", "\n", "Congratulations on completing this notebook tutorial! If you enjoyed this and would like to join the Lightning\n", "movement, you can do so in the following ways!\n", "\n", "### Star [Lightning](https://github.com/PyTorchLightning/pytorch-lightning) on GitHub\n", "The easiest way to help our community is just by starring the GitHub repos! 
This helps raise awareness of the cool\n", "tools we're building.\n", "\n", "### Join our [Slack](https://join.slack.com/t/pytorch-lightning/shared_invite/zt-pw5v393p-qRaDgEk24~EjiZNBpSQFgQ)!\n", "The best way to keep up to date on the latest advancements is to join our community! Make sure to introduce yourself\n", "and share your interests in `#general` channel\n", "\n", "\n", "### Contributions !\n", "The best way to contribute to our community is to become a code contributor! At any time you can go to\n", "[Lightning](https://github.com/PyTorchLightning/pytorch-lightning) or [Bolt](https://github.com/PyTorchLightning/lightning-bolts)\n", "GitHub Issues page and filter for \"good first issue\".\n", "\n", "* [Lightning good first issue](https://github.com/PyTorchLightning/pytorch-lightning/issues?q=is%3Aopen+is%3Aissue+label%3A%22good+first+issue%22)\n", "* [Bolt good first issue](https://github.com/PyTorchLightning/lightning-bolts/issues?q=is%3Aopen+is%3Aissue+label%3A%22good+first+issue%22)\n", "* You can also contribute your own notebooks with useful examples !\n", "\n", "### Great thanks from the entire Pytorch Lightning Team for your interest !\n", "\n", "[![Pytorch Lightning](){height=\"60px\" width=\"240px\"}](https://pytorchlightning.ai)"]}, {"cell_type": "raw", "metadata": {"raw_mimetype": "text/restructuredtext"}, "source": [".. customcarditem::\n", " :header: PyTorch Lightning Basic GAN Tutorial\n", " :card_description: How to train a GAN! Main takeaways: 1. Generator and discriminator are arbitrary PyTorch modules. 2. 
training_step does both the generator and discriminator training.\n", " :tags: Image,GPU/TPU,Lightning-Examples"]}], "metadata": {"jupytext": {"cell_metadata_filter": "colab_type,colab,id,-all", "formats": "ipynb,py:percent", "main_language": "python"}, "language_info": {"codemirror_mode": {"name": "ipython", "version": 3}, "file_extension": ".py", "mimetype": "text/x-python", "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.9.7"}, "papermill": {"default_parameters": {}, "duration": 31.853342, "end_time": "2021-12-04T16:31:42.690537", "environment_variables": {}, "exception": null, "input_path": "lightning_examples/basic-gan/gan.ipynb", "output_path": ".notebooks/lightning_examples/basic-gan.ipynb", "parameters": {}, "start_time": "2021-12-04T16:31:10.837195", "version": "2.3.3"}, "widgets": {"application/vnd.jupyter.widget-state+json": {"state": {"0701a66e70844b08b6faf0ec350d0f73": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_3280c47883334a8d92de4bc0f3dec466", "placeholder": "\u200b", "style": "IPY_MODEL_28b4d248eea6416ebb4ca9ad55fc5158", "value": " 215/215 [00:03<00:00, 56.07it/s, loss=2.9, v_num=2]"}}, "18355a5b23f843278a2ccfabdd979d9b": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, 
"description_width": ""}}, "28b4d248eea6416ebb4ca9ad55fc5158": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "3280c47883334a8d92de4bc0f3dec466": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "4fa9eee054704cddb87d67a50d621ba0": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": 
"StyleView", "description_width": ""}}, "5829933d957a462b86e52dc55b26e993": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_e556860a92d8442997b62b57ce44fd2c", "max": 215.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_18355a5b23f843278a2ccfabdd979d9b", "value": 215.0}}, "610766e1db924f5ab0933c1bec342ff8": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "62e2171df1994799b6987ec549a7ac47": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": 
"HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_610766e1db924f5ab0933c1bec342ff8", "placeholder": "\u200b", "style": "IPY_MODEL_4fa9eee054704cddb87d67a50d621ba0", "value": "Epoch 4: 100%"}}, "67121f7a826b4be2bd6356f337f40b0f": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "76879ff1edbb4c10a39a477697fe2c18": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", 
"_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_62e2171df1994799b6987ec549a7ac47", "IPY_MODEL_5829933d957a462b86e52dc55b26e993", "IPY_MODEL_0701a66e70844b08b6faf0ec350d0f73"], "layout": "IPY_MODEL_67121f7a826b4be2bd6356f337f40b0f"}}, "e556860a92d8442997b62b57ce44fd2c": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}}, "version_major": 2, "version_minor": 0}}}, "nbformat": 4, "nbformat_minor": 5} \ No newline at end of file diff --git a/source/notebooks/lightning_examples/cifar10-baseline.ipynb b/source/notebooks/lightning_examples/cifar10-baseline.ipynb deleted file mode 100644 index e87ea66..0000000 --- a/source/notebooks/lightning_examples/cifar10-baseline.ipynb +++ /dev/null @@ -1 +0,0 @@ -{"cells": [{"cell_type": "markdown", "id": "150fd244", "metadata": {"papermill": {"duration": 0.031551, "end_time": "2021-12-04T16:31:53.611675", "exception": false, "start_time": 
"2021-12-04T16:31:53.580124", "status": "completed"}, "tags": []}, "source": ["\n", "# PyTorch Lightning CIFAR10 ~94% Baseline Tutorial\n", "\n", "* **Author:** PL team\n", "* **License:** CC BY-SA\n", "* **Generated:** 2021-12-04T16:52:59.958801\n", "\n", "Train a Resnet to 94% accuracy on Cifar10!\n", "\n", "\n", "---\n", "Open in [![Open In Colab](){height=\"20px\" width=\"117px\"}](https://colab.research.google.com/github/PytorchLightning/lightning-tutorials/blob/publication/.notebooks/lightning_examples/cifar10-baseline.ipynb)\n", "\n", "Give us a \u2b50 [on Github](https://www.github.com/PytorchLightning/pytorch-lightning/)\n", "| Check out [the documentation](https://pytorch-lightning.readthedocs.io/en/latest/)\n", "| Join us [on Slack](https://join.slack.com/t/pytorch-lightning/shared_invite/zt-pw5v393p-qRaDgEk24~EjiZNBpSQFgQ)"]}, {"cell_type": "markdown", "id": "50dc70a0", "metadata": {"papermill": {"duration": 0.02736, "end_time": "2021-12-04T16:31:53.668809", "exception": false, "start_time": "2021-12-04T16:31:53.641449", "status": "completed"}, "tags": []}, "source": ["## Setup\n", "This notebook requires some packages besides pytorch-lightning."]}, {"cell_type": "code", "execution_count": 1, "id": "e797c5cf", "metadata": {"colab": {}, "colab_type": "code", "execution": {"iopub.execute_input": "2021-12-04T16:31:53.738761Z", "iopub.status.busy": "2021-12-04T16:31:53.738222Z", "iopub.status.idle": "2021-12-04T16:31:56.632390Z", "shell.execute_reply": "2021-12-04T16:31:56.631747Z"}, "id": "LfrJLKPFyhsK", "lines_to_next_cell": 0, "papermill": {"duration": 2.935806, "end_time": "2021-12-04T16:31:56.632538", "exception": false, "start_time": "2021-12-04T16:31:53.696732", "status": "completed"}, "tags": []}, "outputs": [], "source": ["! 
pip install --quiet \"torch>=1.6, <1.9\" \"torchmetrics>=0.3\" \"lightning-bolts\" \"pytorch-lightning>=1.3\" \"torchvision\""]}, {"cell_type": "code", "execution_count": 2, "id": "fae10f21", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:31:56.692496Z", "iopub.status.busy": "2021-12-04T16:31:56.691990Z", "iopub.status.idle": "2021-12-04T16:31:56.693339Z", "shell.execute_reply": "2021-12-04T16:31:56.693734Z"}, "papermill": {"duration": 0.033333, "end_time": "2021-12-04T16:31:56.693854", "exception": false, "start_time": "2021-12-04T16:31:56.660521", "status": "completed"}, "tags": []}, "outputs": [], "source": ["# Run this if you intend to use TPUs\n", "# !pip install cloud-tpu-client==0.10 https://storage.googleapis.com/tpu-pytorch/wheels/torch_xla-1.8-cp37-cp37m-linux_x86_64.whl"]}, {"cell_type": "code", "execution_count": 3, "id": "086fcceb", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:31:56.754809Z", "iopub.status.busy": "2021-12-04T16:31:56.754316Z", "iopub.status.idle": "2021-12-04T16:31:58.695537Z", "shell.execute_reply": "2021-12-04T16:31:58.695074Z"}, "papermill": {"duration": 1.974192, "end_time": "2021-12-04T16:31:58.695673", "exception": false, "start_time": "2021-12-04T16:31:56.721481", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["Global seed set to 7\n"]}], "source": ["import os\n", "\n", "import torch\n", "import torch.nn as nn\n", "import torch.nn.functional as F\n", "import torchvision\n", "from pl_bolts.datamodules import CIFAR10DataModule\n", "from pl_bolts.transforms.dataset_normalizations import cifar10_normalization\n", "from pytorch_lightning import LightningModule, Trainer, seed_everything\n", "from pytorch_lightning.callbacks import LearningRateMonitor\n", "from pytorch_lightning.loggers import TensorBoardLogger\n", "from torch.optim.lr_scheduler import OneCycleLR\n", "from torch.optim.swa_utils import AveragedModel, update_bn\n", "from 
torchmetrics.functional import accuracy\n", "\n", "seed_everything(7)\n", "\n", "PATH_DATASETS = os.environ.get(\"PATH_DATASETS\", \".\")\n", "AVAIL_GPUS = min(1, torch.cuda.device_count())\n", "BATCH_SIZE = 256 if AVAIL_GPUS else 64\n", "NUM_WORKERS = int(os.cpu_count() / 2)"]}, {"cell_type": "markdown", "id": "0755d159", "metadata": {"papermill": {"duration": 0.028087, "end_time": "2021-12-04T16:31:58.755971", "exception": false, "start_time": "2021-12-04T16:31:58.727884", "status": "completed"}, "tags": []}, "source": ["### CIFAR10 Data Module\n", "\n", "Import the existing data module from `bolts` and modify the train and test transforms."]}, {"cell_type": "code", "execution_count": 4, "id": "cf38e878", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:31:58.820631Z", "iopub.status.busy": "2021-12-04T16:31:58.820074Z", "iopub.status.idle": "2021-12-04T16:31:58.823137Z", "shell.execute_reply": "2021-12-04T16:31:58.822662Z"}, "papermill": {"duration": 0.038494, "end_time": "2021-12-04T16:31:58.823238", "exception": false, "start_time": "2021-12-04T16:31:58.784744", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/pytorch_lightning/core/datamodule.py:73: LightningDeprecationWarning: DataModule property `train_transforms` was deprecated in v1.5 and will be removed in v1.7.\n", " rank_zero_deprecation(\n", "/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/pytorch_lightning/core/datamodule.py:77: LightningDeprecationWarning: DataModule property `val_transforms` was deprecated in v1.5 and will be removed in v1.7.\n", " rank_zero_deprecation(\n", "/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/pytorch_lightning/core/datamodule.py:81: LightningDeprecationWarning: DataModule property `test_transforms` was deprecated in v1.5 and will be removed in v1.7.\n", " rank_zero_deprecation(\n"]}], "source": ["\n", 
"train_transforms = torchvision.transforms.Compose(\n", " [\n", " torchvision.transforms.RandomCrop(32, padding=4),\n", " torchvision.transforms.RandomHorizontalFlip(),\n", " torchvision.transforms.ToTensor(),\n", " cifar10_normalization(),\n", " ]\n", ")\n", "\n", "test_transforms = torchvision.transforms.Compose(\n", " [\n", " torchvision.transforms.ToTensor(),\n", " cifar10_normalization(),\n", " ]\n", ")\n", "\n", "cifar10_dm = CIFAR10DataModule(\n", " data_dir=PATH_DATASETS,\n", " batch_size=BATCH_SIZE,\n", " num_workers=NUM_WORKERS,\n", " train_transforms=train_transforms,\n", " test_transforms=test_transforms,\n", " val_transforms=test_transforms,\n", ")"]}, {"cell_type": "markdown", "id": "eed0041b", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.028881, "end_time": "2021-12-04T16:31:58.881421", "exception": false, "start_time": "2021-12-04T16:31:58.852540", "status": "completed"}, "tags": []}, "source": ["### Resnet\n", "Modify the pre-existing Resnet architecture from TorchVision. The pre-existing architecture is based on ImageNet\n", "images (224x224) as input. 
So we need to modify it for CIFAR10 images (32x32)."]}, {"cell_type": "code", "execution_count": 5, "id": "3f51300e", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:31:58.943228Z", "iopub.status.busy": "2021-12-04T16:31:58.942763Z", "iopub.status.idle": "2021-12-04T16:31:58.944731Z", "shell.execute_reply": "2021-12-04T16:31:58.944361Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 0.034218, "end_time": "2021-12-04T16:31:58.944829", "exception": false, "start_time": "2021-12-04T16:31:58.910611", "status": "completed"}, "tags": []}, "outputs": [], "source": ["def create_model():\n", " model = torchvision.models.resnet18(pretrained=False, num_classes=10)\n", " model.conv1 = nn.Conv2d(3, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n", " model.maxpool = nn.Identity()\n", " return model"]}, {"cell_type": "markdown", "id": "e60c4b8b", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.029284, "end_time": "2021-12-04T16:31:59.003290", "exception": false, "start_time": "2021-12-04T16:31:58.974006", "status": "completed"}, "tags": []}, "source": ["### Lightning Module\n", "Check out the [`configure_optimizers`](https://pytorch-lightning.readthedocs.io/en/stable/common/lightning_module.html#configure-optimizers)\n", "method to use custom Learning Rate schedulers. The OneCycleLR with SGD will get you to around 92-93% accuracy\n", "in 20-30 epochs and 93-94% accuracy in 40-50 epochs. 
Feel free to experiment with different\n", "LR schedules from https://pytorch.org/docs/stable/optim.html#how-to-adjust-learning-rate"]}, {"cell_type": "code", "execution_count": 6, "id": "0c7981e3", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:31:59.069865Z", "iopub.status.busy": "2021-12-04T16:31:59.069383Z", "iopub.status.idle": "2021-12-04T16:31:59.073065Z", "shell.execute_reply": "2021-12-04T16:31:59.073425Z"}, "papermill": {"duration": 0.041188, "end_time": "2021-12-04T16:31:59.073548", "exception": false, "start_time": "2021-12-04T16:31:59.032360", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class LitResnet(LightningModule):\n", " def __init__(self, lr=0.05):\n", " super().__init__()\n", "\n", " self.save_hyperparameters()\n", " self.model = create_model()\n", "\n", " def forward(self, x):\n", " out = self.model(x)\n", " return F.log_softmax(out, dim=1)\n", "\n", " def training_step(self, batch, batch_idx):\n", " x, y = batch\n", " logits = self(x)\n", " loss = F.nll_loss(logits, y)\n", " self.log(\"train_loss\", loss)\n", " return loss\n", "\n", " def evaluate(self, batch, stage=None):\n", " x, y = batch\n", " logits = self(x)\n", " loss = F.nll_loss(logits, y)\n", " preds = torch.argmax(logits, dim=1)\n", " acc = accuracy(preds, y)\n", "\n", " if stage:\n", " self.log(f\"{stage}_loss\", loss, prog_bar=True)\n", " self.log(f\"{stage}_acc\", acc, prog_bar=True)\n", "\n", " def validation_step(self, batch, batch_idx):\n", " self.evaluate(batch, \"val\")\n", "\n", " def test_step(self, batch, batch_idx):\n", " self.evaluate(batch, \"test\")\n", "\n", " def configure_optimizers(self):\n", " optimizer = torch.optim.SGD(\n", " self.parameters(),\n", " lr=self.hparams.lr,\n", " momentum=0.9,\n", " weight_decay=5e-4,\n", " )\n", " steps_per_epoch = 45000 // BATCH_SIZE\n", " scheduler_dict = {\n", " \"scheduler\": OneCycleLR(\n", " optimizer,\n", " 0.1,\n", " epochs=self.trainer.max_epochs,\n", " 
steps_per_epoch=steps_per_epoch,\n", " ),\n", " \"interval\": \"step\",\n", " }\n", " return {\"optimizer\": optimizer, \"lr_scheduler\": scheduler_dict}"]}, {"cell_type": "code", "execution_count": 7, "id": "0658d2df", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:31:59.139932Z", "iopub.status.busy": "2021-12-04T16:31:59.139466Z", "iopub.status.idle": "2021-12-04T16:38:59.899188Z", "shell.execute_reply": "2021-12-04T16:38:59.898678Z"}, "papermill": {"duration": 420.794323, "end_time": "2021-12-04T16:38:59.899315", "exception": false, "start_time": "2021-12-04T16:31:59.104992", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/pytorch_lightning/trainer/connectors/callback_connector.py:90: LightningDeprecationWarning: Setting `Trainer(progress_bar_refresh_rate=10)` is deprecated in v1.5 and will be removed in v1.7. Please pass `pytorch_lightning.callbacks.progress.TQDMProgressBar` with `refresh_rate` directly to the Trainer's `callbacks` argument instead. 
Or, to disable the progress bar pass `enable_progress_bar = False` to the Trainer.\n", " rank_zero_deprecation(\n", "GPU available: True, used: True\n"]}, {"name": "stderr", "output_type": "stream", "text": ["TPU available: False, using: 0 TPU cores\n"]}, {"name": "stderr", "output_type": "stream", "text": ["IPU available: False, using: 0 IPUs\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Files already downloaded and verified\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Files already downloaded and verified\n"]}, {"name": "stderr", "output_type": "stream", "text": ["/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/pytorch_lightning/core/datamodule.py:114: LightningDeprecationWarning: DataModule property `train_transforms` was deprecated in v1.5 and will be removed in v1.7.\n", " rank_zero_deprecation(\n", "/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/pytorch_lightning/core/datamodule.py:133: LightningDeprecationWarning: DataModule property `val_transforms` was deprecated in v1.5 and will be removed in v1.7.\n", " rank_zero_deprecation(\n"]}, {"name": "stderr", "output_type": "stream", "text": ["LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n"]}, {"name": "stderr", "output_type": "stream", "text": ["\n", " | Name | Type | Params\n", "---------------------------------\n", "0 | model | ResNet | 11.2 M\n", "---------------------------------\n", "11.2 M Trainable params\n", "0 Non-trainable params\n", "11.2 M Total params\n", "44.696 Total estimated model params size (MB)\n"]}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "c4382d4da66d4ef58c7336a37a81ff5f", "version_major": 2, "version_minor": 0}, "text/plain": ["Validation sanity check: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"name": "stderr", "output_type": "stream", "text": ["Global seed set to 7\n"]}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "962e49594a8b455f8f3f5c9501deb987", 
"version_major": 2, "version_minor": 0}, "text/plain": ["Training: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "c590712538fa4ef7bd045c44f9aec516", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "4f4648b512ae49ef94785386a4b95c48", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "9893b65283724b288b89fd1114dc79f5", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "9438d4a6012b47c8807ebda5adce1712", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "605f32169bcd4c8ea8c309e9d7638595", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "f71b6be05b7d43f4b438780bf1f6fab1", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "b9de98eebdb34b8e9c55081ebd753057", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "56b17c0aa8a64f40968f6cadbe1149ab", "version_major": 2, "version_minor": 0}, "text/plain": 
["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "15b6d624010642f39e0ab1a2c3a49295", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "d2f8ed4e980348e5a4e806296f45ab09", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "07d0c290c34847eb9df55d1b71e1b7ec", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "29ef56d7400d4ea9a4a53c5a591d7f6e", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "729ae8a5142b414d879d0c49ca9d9742", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "638f18d72e704478b58126fee0504686", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "ef2f42b7a9cd4ad59cf933bf03cdcbc4", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "6c6a4a78c5244926b5ab585c71b22b31", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, 
"output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "9204f19c687749b4b9d8c58c9c5936d2", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "ea96711d4212428ba4dcc07e4ecba6bc", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "a71887abf4ff44b99939cdb9fdd47db7", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "5ed5caa95d6249e1bf43b2610b56b266", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "7a959e215a164e54aec9c5c1729fb4cd", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "78dcf8ab81484972bef98ee4808976a3", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "e2538d2d42254355a24cb5bffdd4f083", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "a7293a6474ce4e9499a1d0159c9d2034", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": 
{"application/vnd.jupyter.widget-view+json": {"model_id": "ced8e9bb515746e5930f529d1c4c3f2c", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "ca42033167d84b95828523a32f20fbc7", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "3933670d051445c2a966996be4aead2d", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "b8b046652eb14f2fbb40712fbe04995b", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "8aa60a1e120540efb36aefb2ea7c6158", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "c57fece658f444f18bd89f142c343bb0", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"name": "stderr", "output_type": "stream", "text": ["/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/pytorch_lightning/core/datamodule.py:152: LightningDeprecationWarning: DataModule property `test_transforms` was deprecated in v1.5 and will be removed in v1.7.\n", " rank_zero_deprecation(\n"]}, {"name": "stderr", "output_type": "stream", "text": ["LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n"]}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "52ca8ac78894431683ff393c47922053", "version_major": 2, 
"version_minor": 0}, "text/plain": ["Testing: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"name": "stdout", "output_type": "stream", "text": ["--------------------------------------------------------------------------------\n", "DATALOADER:0 TEST RESULTS\n", "{'test_acc': 0.9203000068664551, 'test_loss': 0.27301323413848877}\n", "--------------------------------------------------------------------------------\n"]}, {"data": {"text/plain": ["[{'test_loss': 0.27301323413848877, 'test_acc': 0.9203000068664551}]"]}, "execution_count": 7, "metadata": {}, "output_type": "execute_result"}], "source": ["model = LitResnet(lr=0.05)\n", "model.datamodule = cifar10_dm\n", "\n", "trainer = Trainer(\n", " progress_bar_refresh_rate=10,\n", " max_epochs=30,\n", " gpus=AVAIL_GPUS,\n", " logger=TensorBoardLogger(\"lightning_logs/\", name=\"resnet\"),\n", " callbacks=[LearningRateMonitor(logging_interval=\"step\")],\n", ")\n", "\n", "trainer.fit(model, cifar10_dm)\n", "trainer.test(model, datamodule=cifar10_dm)"]}, {"cell_type": "markdown", "id": "47b074c0", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.080733, "end_time": "2021-12-04T16:39:00.060155", "exception": false, "start_time": "2021-12-04T16:38:59.979422", "status": "completed"}, "tags": []}, "source": ["### Bonus: Use [Stochastic Weight Averaging](https://arxiv.org/abs/1803.05407) to get a boost on performance\n", "\n", "Use SWA from torch.optim to get a quick performance boost. 
This section also shows a couple of cool features from Lightning:\n", "- Use `training_epoch_end` to run code after the end of every epoch\n", "- Use a pretrained model directly with this wrapper for SWA"]}, {"cell_type": "code", "execution_count": 8, "id": "325d806a", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:39:00.229553Z", "iopub.status.busy": "2021-12-04T16:39:00.229086Z", "iopub.status.idle": "2021-12-04T16:39:00.230724Z", "shell.execute_reply": "2021-12-04T16:39:00.231129Z"}, "papermill": {"duration": 0.090027, "end_time": "2021-12-04T16:39:00.231260", "exception": false, "start_time": "2021-12-04T16:39:00.141233", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class SWAResnet(LitResnet):\n", " def __init__(self, trained_model, lr=0.01):\n", " super().__init__()\n", "\n", " self.save_hyperparameters(\"lr\")\n", " self.model = trained_model\n", " self.swa_model = AveragedModel(self.model)\n", "\n", " def forward(self, x):\n", " out = self.swa_model(x)\n", " return F.log_softmax(out, dim=1)\n", "\n", " def training_epoch_end(self, training_step_outputs):\n", " self.swa_model.update_parameters(self.model)\n", "\n", " def validation_step(self, batch, batch_idx, stage=None):\n", " x, y = batch\n", " logits = F.log_softmax(self.model(x), dim=1)\n", " loss = F.nll_loss(logits, y)\n", " preds = torch.argmax(logits, dim=1)\n", " acc = accuracy(preds, y)\n", "\n", " self.log(\"val_loss\", loss, prog_bar=True)\n", " self.log(\"val_acc\", acc, prog_bar=True)\n", "\n", " def configure_optimizers(self):\n", " optimizer = torch.optim.SGD(self.model.parameters(), lr=self.hparams.lr, momentum=0.9, weight_decay=5e-4)\n", " return optimizer\n", "\n", " def on_train_end(self):\n", " update_bn(self.datamodule.train_dataloader(), self.swa_model, device=self.device)"]}, {"cell_type": "code", "execution_count": 9, "id": "ecdf4282", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:39:00.393861Z", "iopub.status.busy": 
"2021-12-04T16:39:00.391739Z", "iopub.status.idle": "2021-12-04T16:45:38.129033Z", "shell.execute_reply": "2021-12-04T16:45:38.128630Z"}, "papermill": {"duration": 397.818564, "end_time": "2021-12-04T16:45:38.129158", "exception": false, "start_time": "2021-12-04T16:39:00.310594", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/pytorch_lightning/trainer/connectors/callback_connector.py:90: LightningDeprecationWarning: Setting `Trainer(progress_bar_refresh_rate=20)` is deprecated in v1.5 and will be removed in v1.7. Please pass `pytorch_lightning.callbacks.progress.TQDMProgressBar` with `refresh_rate` directly to the Trainer's `callbacks` argument instead. Or, to disable the progress bar pass `enable_progress_bar = False` to the Trainer.\n", " rank_zero_deprecation(\n", "GPU available: True, used: True\n"]}, {"name": "stderr", "output_type": "stream", "text": ["TPU available: False, using: 0 TPU cores\n"]}, {"name": "stderr", "output_type": "stream", "text": ["IPU available: False, using: 0 IPUs\n"]}, {"name": "stderr", "output_type": "stream", "text": ["/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/pytorch_lightning/core/datamodule.py:469: LightningDeprecationWarning: DataModule.setup has already been called, so it will not be called again. 
In v1.6 this behavior will change to always call DataModule.setup.\n", " rank_zero_deprecation(\n", "LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n"]}, {"name": "stderr", "output_type": "stream", "text": ["\n", " | Name | Type | Params\n", "--------------------------------------------\n", "0 | model | ResNet | 11.2 M\n", "1 | swa_model | AveragedModel | 11.2 M\n", "--------------------------------------------\n", "22.3 M Trainable params\n", "0 Non-trainable params\n", "22.3 M Total params\n", "89.392 Total estimated model params size (MB)\n"]}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "9ea460da748d4d009fdb4416fc5ba362", "version_major": 2, "version_minor": 0}, "text/plain": ["Validation sanity check: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"name": "stderr", "output_type": "stream", "text": ["Global seed set to 7\n"]}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "d581aedbcb7f48fb8c8dbeaa079ad651", "version_major": 2, "version_minor": 0}, "text/plain": ["Training: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "ff4bf4ad13c04a8791e8283c83765a05", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "f078f962d66c497b8e95231564665108", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "9ef0cc8972ec476babb87467b9ff6a00", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "664cb138f57949dfbc68e0fdcbb7144e", "version_major": 2, "version_minor": 
0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "7df7c6698b064aaa92cbabaa7e6167dc", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "cc47c9cd42a140a590dddb6dc560a4d6", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "73a78a6b3957447da7f88492c1c0de36", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "a73cdacebbd14b3b9c697a62b8a758ee", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "5e17f6802c6749b0b906adc69c6ba1e9", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "2b8c7d8035ce46cc83e460afa5e96079", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "6584051a70a7443f811094bb8bb1b7ba", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "d498421af6c6458ea4fe33bf22796e86", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, 
"metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "4b242be8d44b4627881cdf9527e1a9b9", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "9adfc41d30154a99938b0d97fa767e21", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "efb67b6f296c44fdb4309f206eb09f4a", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "e24b7c22fbee405c8d202b376aafa909", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "3d2424c1751a42d3b71a7ee8c59e8491", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "c5a56a5d6926452cb6046dcad5b94e20", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "257e57819b96473aaf512f61d62a57d9", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "c213c26b0b8547b0bba620a692676198", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, 
{"name": "stderr", "output_type": "stream", "text": ["/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/pytorch_lightning/core/datamodule.py:469: LightningDeprecationWarning: DataModule.teardown has already been called, so it will not be called again. In v1.6 this behavior will change to always call DataModule.teardown.\n", " rank_zero_deprecation(\n", "LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n"]}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "6d08e235cef542568fd7741e38ae73bb", "version_major": 2, "version_minor": 0}, "text/plain": ["Testing: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"name": "stdout", "output_type": "stream", "text": ["--------------------------------------------------------------------------------\n", "DATALOADER:0 TEST RESULTS\n", "{'test_acc': 0.920199990272522, 'test_loss': 0.2513697147369385}\n", "--------------------------------------------------------------------------------\n"]}, {"data": {"text/plain": ["[{'test_loss': 0.2513697147369385, 'test_acc': 0.920199990272522}]"]}, "execution_count": 9, "metadata": {}, "output_type": "execute_result"}], "source": ["swa_model = SWAResnet(model.model, lr=0.01)\n", "swa_model.datamodule = cifar10_dm\n", "\n", "swa_trainer = Trainer(\n", " progress_bar_refresh_rate=20,\n", " max_epochs=20,\n", " gpus=AVAIL_GPUS,\n", " logger=TensorBoardLogger(\"lightning_logs/\", name=\"swa_resnet\"),\n", ")\n", "\n", "swa_trainer.fit(swa_model, cifar10_dm)\n", "swa_trainer.test(swa_model, datamodule=cifar10_dm)"]}, {"cell_type": "code", "execution_count": 10, "id": "ad6589a9", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:45:38.358787Z", "iopub.status.busy": "2021-12-04T16:45:38.358313Z", "iopub.status.idle": "2021-12-04T16:45:39.919126Z", "shell.execute_reply": "2021-12-04T16:45:39.919485Z"}, "papermill": {"duration": 1.677786, "end_time": "2021-12-04T16:45:39.919651", "exception": false, "start_time": 
"2021-12-04T16:45:38.241865", "status": "completed"}, "tags": []}, "outputs": [{"data": {"text/html": ["\n", " \n", " \n", " "], "text/plain": [""]}, "metadata": {}, "output_type": "display_data"}], "source": ["# Start tensorboard.\n", "%reload_ext tensorboard\n", "%tensorboard --logdir lightning_logs/"]}, {"cell_type": "markdown", "id": "25ec73cb", "metadata": {"papermill": {"duration": 0.113883, "end_time": "2021-12-04T16:45:40.148272", "exception": false, "start_time": "2021-12-04T16:45:40.034389", "status": "completed"}, "tags": []}, "source": ["## Congratulations - Time to Join the Community!\n", "\n", "Congratulations on completing this notebook tutorial! If you enjoyed this and would like to join the Lightning\n", "movement, you can do so in the following ways!\n", "\n", "### Star [Lightning](https://github.com/PyTorchLightning/pytorch-lightning) on GitHub\n", "The easiest way to help our community is just by starring the GitHub repos! This helps raise awareness of the cool\n", "tools we're building.\n", "\n", "### Join our [Slack](https://join.slack.com/t/pytorch-lightning/shared_invite/zt-pw5v393p-qRaDgEk24~EjiZNBpSQFgQ)!\n", "The best way to keep up to date on the latest advancements is to join our community! Make sure to introduce yourself\n", "and share your interests in `#general` channel\n", "\n", "\n", "### Contributions !\n", "The best way to contribute to our community is to become a code contributor! 
At any time you can go to the\n", "[Lightning](https://github.com/PyTorchLightning/pytorch-lightning) or [Bolt](https://github.com/PyTorchLightning/lightning-bolts)\n", "GitHub Issues page and filter for \"good first issue\".\n", "\n", "* [Lightning good first issue](https://github.com/PyTorchLightning/pytorch-lightning/issues?q=is%3Aopen+is%3Aissue+label%3A%22good+first+issue%22)\n", "* [Bolt good first issue](https://github.com/PyTorchLightning/lightning-bolts/issues?q=is%3Aopen+is%3Aissue+label%3A%22good+first+issue%22)\n", "* You can also contribute your own notebooks with useful examples!\n", "\n", "### Great thanks from the entire PyTorch Lightning Team for your interest!\n", "\n", "[![PyTorch Lightning](){height=\"60px\" width=\"240px\"}](https://pytorchlightning.ai)"]}, {"cell_type": "raw", "metadata": {"raw_mimetype": "text/restructuredtext"}, "source": [".. customcarditem::\n", " :header: PyTorch Lightning CIFAR10 ~94% Baseline Tutorial\n", " :card_description: Train a ResNet to 94% accuracy on CIFAR10!\n", " :tags: Image,GPU/TPU,Lightning-Examples"]}], "metadata": {"jupytext": {"cell_metadata_filter": "id,colab,colab_type,-all", "formats": "ipynb,py:percent", "main_language": "python"}, "language_info": {"codemirror_mode": {"name": "ipython", "version": 3}, "file_extension": ".py", "mimetype": "text/x-python", "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.9.7"}, "papermill": {"default_parameters": {}, "duration": 829.702297, "end_time": "2021-12-04T16:45:41.984443", "environment_variables": {}, "exception": null, "input_path": "lightning_examples/cifar10-baseline/baseline.ipynb", "output_path": ".notebooks/lightning_examples/cifar10-baseline.ipynb", "parameters": {}, "start_time": "2021-12-04T16:31:52.282146", "version": "2.3.3"}, "widgets": {"application/vnd.jupyter.widget-state+json": {"state": {"000e17cab12b4a16a5bb24fd4c8e6c3d": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", 
"model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "0014f8f4f49841aaa7c1a64c57b2d49b": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "0027c59a46544bef8bf57f2d9eedb383": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, 
"flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "0046c6e7fea345d28a76745b89586893": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_1caa64c8e4ed4f8bb0121571896488f3", "max": 40.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_3a67eda0941549d88440223701afe60a", "value": 40.0}}, "00546a0bf8f647af912556b130e3909c": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_5fea728b72f343eeba2ea5e3750d8aed", "max": 40.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_da4e670e9d594e7394b38d518354f613", "value": 40.0}}, 
"00734065a4b748bf86e1fbb33f7a0561": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "008fa6e0a9314811a075d8ca8805709c": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "014b058f5dad4a9b90029ee5c0d1941a": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": 
null, "description_width": ""}}, "01a67df105214806b42a4974f14e5792": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "023b923393b045618df10b498f0cbc13": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, 
"left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "024680be6f384e20a19910a8db277616": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "029ded4281f84e23a64442a8c51ad87d": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "03d4fb52bb2c460b8164142c6a8b3e8a": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", 
"model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "0425ec3a0d7849b38e947a2f4cf56349": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "0440b10cf4f441fe843002eec4c8613e": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_4d37c25af0834d6e8c7a53d704713ce1", "placeholder": "\u200b", "style": "IPY_MODEL_e248b9247393444b95f4e426e49403e1", "value": " 40/40 [00:01<00:00, 41.48it/s]"}}, "0447aa40a49344e79e2e683d6819d5ec": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "04c97639949842bfb3979dd8712abe8b": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", 
"state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "05414796bb8b4c4095db6029e7c298ba": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "05a2d51877d9418b8417e35cea00aed8": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, 
"grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "05ed6750b13e4928846c6a3626a2a2bd": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "061ab79450ee4a1eadc75fc6a34c673a": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", 
"_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "06a89e7eb1cf4eb9b31b1792b6022475": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, 
"visibility": null, "width": "100%"}}, "07728fa1b1644efdafa0f0d2934a04b1": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "07c8f9ed1f6d48bbb2ccf3bc58ee548b": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_731875ee32dc4c7b925239b1c3d08b9b", "max": 40.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_556562fbd5ed4226897e6cf42af6f527", "value": 40.0}}, "07d0c290c34847eb9df55d1b71e1b7ec": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": 
{"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_eceec782c1ce454dbfcadced855e791e", "IPY_MODEL_34b47bf1c5df4fa09fcc2fdc002e5722", "IPY_MODEL_77fe203b76bd43c2a5dcd03f0fa19fe9"], "layout": "IPY_MODEL_8a088cec1f3e490ca376df311ac639c3"}}, "08a677083e9a4a54a0ae80297ffbac0b": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_ad8f945d28464a879d7686f7d7595509", "max": 40.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_7223547950ec4f0abb4178506b4b5f93", "value": 40.0}}, "099f27f210e24769853bc51f75969ed5": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, 
"margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "0a6e971473a845dbaf7dd70544a4fb4e": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_0d45a84159db4c7ab0b5475e70ddb95a", "max": 1.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_241a851d435a4a9c90e8c0220fd341dc", "value": 1.0}}, "0adf97988f5d47ffb50136dfb49519e8": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_3f97b2d29d544bb788df0f53c6a3dba5", "max": 40.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_b52a63138c094b7893e021bc49c0c89e", "value": 40.0}}, "0b34e1a046f14629b409b16c1f1bd8e1": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", 
"_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "0bb72c82108147e1a13350b851a960e5": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "0bed5eb371c54b7eb3fd9a73697732dc": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "0ceec98503a649368d6868abd90c5ab2": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": 
"@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "0d45a84159db4c7ab0b5475e70ddb95a": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "0e2a984e8cc043f5b58c6508689078ad": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_a0ed6130ec664309837dff68eb1609a3", "max": 40.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_c5fc4d52ddb84b7082395834d134e2c4", "value": 40.0}}, "0e7532eb90c044f0b8dc0d480a9a8f98": {"model_module": 
"@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_2dc4d71da4ae4ea1b0e5df1a7ab34dc9", "placeholder": "\u200b", "style": "IPY_MODEL_1eeb893719c04ca1ba087c7868806512", "value": " 40/40 [00:01<00:00, 41.31it/s]"}}, "0efe49958483403d970448b78c035fce": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_779ed45ace6b4434a574e897384a0f52", "placeholder": "\u200b", "style": "IPY_MODEL_de344810abe548119b3f8ddf3a1cc97a", "value": "Validating: 100%"}}, "0eff93661e2e4c6fbf791ba89304603f": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, 
"justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "0fad7f239d664ad29b3c069a3e5cf4c2": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_1d916e501963438fabfc53c5499facdb", "max": 40.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_281b4f3ac301430589f8068f75febc90", "value": 40.0}}, "0fb7a9bdc2ee4a88a7d79afdb165e0fa": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "109ca19434f2492cb50ddb48624fbef5": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, 
"grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "10e2de30c7fa4812a7c096bfec3334ad": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "10ebfd89ac8743988d3afde159a8daa1": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", 
"_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_b131dac2a55c4445bc5f49457e59cefb", "placeholder": "\u200b", "style": "IPY_MODEL_97ca9563964441899f571f985aa19800", "value": "Validating: 100%"}}, "118e280fa5af441b80565177c090e25d": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "11a171b0797a461bba2b27144b84fb35": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "11af77bd1a3c4ed48b8f79dc3bc09ee1": {"model_module": 
"@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "122fd41a86a14cdd8d291908b9901f6b": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, 
"min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "1243b677bc9d45e5b6e28a1e33612d18": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "1259349431444f968af6416e4c991b47": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_18b9cee410e34cc98996c1c827864df3", "placeholder": "\u200b", "style": "IPY_MODEL_ffde3dbed47844968f5b0057538b78ae", "value": 
"Validating: 100%"}}, "125f9fd7e9d0489c86a06c1f7175f1a8": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_8a0481c1451549c0bc682a58facfdc39", "placeholder": "\u200b", "style": "IPY_MODEL_2d1fa20403064769858bb4cce177ff4a", "value": "Validating: 100%"}}, "12a96d79a23f49e593233c11258cc1ba": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_6f9a37425e114b73801eeb7e97580200", "placeholder": "\u200b", "style": "IPY_MODEL_bfe210ee12f24249b6194fdbd5990052", "value": " 40/40 [00:01<00:00, 38.09it/s]"}}, "1346ed84515b4784be24ab3b6739983d": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, 
"grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "13b6d5004cc64d67a46dac2c2452eb23": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_edd32f0ef84348a4b07891fb8ed6f0ab", "placeholder": "\u200b", "style": "IPY_MODEL_a85a055c9d844ad2b9bacb9583402386", "value": " 40/40 [00:01<00:00, 37.36it/s]"}}, "14086e65c6e24ccebd05a4282991f8a5": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": 
null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "1489d138c9cd4c9bb49c6ebfed2a1317": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "14ac48af733144429e4d011377b08b9c": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "1593171a93284546a79ca15574055476": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", 
"_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "15b6d624010642f39e0ab1a2c3a49295": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_241907e611804e898fd8836588f68600", "IPY_MODEL_a25c3623d687465cae93c39b76c3ce65", "IPY_MODEL_cc0069da0700482b8bd07d5e61eccf14"], "layout": "IPY_MODEL_f669afd47abf4c0a9b3b79df62009f7e"}}, "1690182c73a74d4bb791931fe9f31bdf": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "16ec8ca835ce4edbbf71ee881cd05bbf": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "174cce3b873b4c2a8e173f5805d837c8": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": 
"DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "174fb53b8ed247ebb714ec07b7abf26e": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "1791c0d96d094df2ace36a97551cfff6": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_5566375d2f014d478f2453b1738a4831", "max": 40.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_558d75fe32a542b39dd8d4bdbc96518a", "value": 40.0}}, "17d2cf8733d24e43988554c1aac65490": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, 
"grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "18b9cee410e34cc98996c1c827864df3": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "19895a4d415d4b9fb4f7c3e3ffa56ede": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", 
"description_tooltip": null, "layout": "IPY_MODEL_991c9442e91f483792474ebe4f09d152", "placeholder": "\u200b", "style": "IPY_MODEL_d2c31fdab421480389949e8f0af20cd0", "value": "Validating: 100%"}}, "19ef5cd49b4e4f16aa5d557bede8de6e": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_40d36134e0eb4dd0bc557a6c9c47d7bd", "max": 40.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_a14120d2181444b3a233980b6ca6bbe4", "value": 40.0}}, "1ad088f478ef4874bd0ba0e322387932": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": 
null}}, "1b1dac267473433fa46bd05bc37db269": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_44c208c346064816aa37fbc549b50ed4", "placeholder": "\u200b", "style": "IPY_MODEL_1690182c73a74d4bb791931fe9f31bdf", "value": "Validating: 100%"}}, "1b610b37a5224b12a2bcee275a388a61": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "1ba5e824ccca492191ed59018571aa0d": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", 
"_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "1c794c38f0124a2a8100f0179717f3fb": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_74553b52649d485681cc6171b8367bdb", "placeholder": "\u200b", "style": "IPY_MODEL_008fa6e0a9314811a075d8ca8805709c", "value": " 40/40 [00:01<00:00, 38.03it/s]"}}, "1caa64c8e4ed4f8bb0121571896488f3": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, 
"1cf638c8ce874c81aad1d6991f6d4403": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_71e68f3d7467406ba056edd127a4b8ec", "max": 40.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_6faea2c255e14670a7afbcb3f1f68fc3", "value": 40.0}}, "1d0bc1bfcb6941c0b97cab36f7ab810f": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "1d32fa9c13af4fb69f2e7cea9a5ffab9": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": 
"@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "1d3b103a11964a219559f9f13ba9ac28": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_bd347db500c445b5914ab4c7ed5d0bd1", "placeholder": "\u200b", "style": "IPY_MODEL_57c2ff8ae9a24531bf52ee049c113cad", "value": " 40/40 [00:01<00:00, 39.80it/s]"}}, "1d916e501963438fabfc53c5499facdb": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": 
null, "width": null}}, "1db1255602ad4b929cd199e01fd9fa71": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_42e3454797f547f98d8e58789be26c59", "placeholder": "\u200b", "style": "IPY_MODEL_ec2f85ae2a11482b9d8967c431217991", "value": "Validating: 100%"}}, "1dcd0d34b8304b14a795e394769c5e73": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "1e4437d1f3004a869ff875f935e6096e": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": 
"1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "1e5347ebd820410e88806a71d0bb8681": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_f9abae85aee34c04a321d4e3410e2352", "placeholder": "\u200b", "style": "IPY_MODEL_e55684dd18f240efb5795f3d5ffdb25a", "value": " 40/40 [00:01<00:00, 40.60it/s]"}}, "1e664c703d4b4f20a8d8115990ec7248": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": 
null, "layout": "IPY_MODEL_556c99df63284336986c9bda4f87842b", "placeholder": "\u200b", "style": "IPY_MODEL_fb9d723beb3d4e36aaab60a344476126", "value": "Validating: 100%"}}, "1eeb893719c04ca1ba087c7868806512": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "1f2fa122be4545b6af4db56d669469e9": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "1fabd40d482541188144c73793fb7cac": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": 
"ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "1fc2fe3fcf5f492c91ad6fcefe9bbbd5": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_4aab3345397a4b7b93504ade55c2d1ec", "placeholder": "\u200b", "style": "IPY_MODEL_f90f1336e56a4cacb8b5f8666b6c9b16", "value": "Validating: 100%"}}, "1ff9401002354c4396c387857469b5e9": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_122fd41a86a14cdd8d291908b9901f6b", "placeholder": "\u200b", "style": "IPY_MODEL_77265d2f46524f789f5803628aaa8bb8", "value": "Epoch 19: 100%"}}, "2000b053e3ab49058a89a8910fee9653": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "205d0539546b41d5a349af917189d235": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": 
"LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "21bab32483d844888f86f71067e0f69e": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "21e0696ab83b479bb28bdf8ad31a6a01": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "2295acb193b2465fb3b749a6f3f9195c": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", 
"model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "22bba232b95049b2b2d1ac3bf1ee1d09": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": 
null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "22f0e92c33f040b987eea86cc152ae75": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "237abb092dc24a03977a37e02a700282": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "2394fc85d30d457d9edfc5ed0c0718e2": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", 
"_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "23c2dfc91e574966becac4457d0b19d0": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_704e66960a204403a5f4f89a9a15ead1", "placeholder": "\u200b", "style": "IPY_MODEL_959f41fc01f14eb896043296b3b9fa2e", "value": "Validating: 100%"}}, "23ddf0adf4f64bdea807fc3c6d586e40": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "241907e611804e898fd8836588f68600": {"model_module": 
"@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_205d0539546b41d5a349af917189d235", "placeholder": "\u200b", "style": "IPY_MODEL_11a171b0797a461bba2b27144b84fb35", "value": "Validating: 100%"}}, "241a851d435a4a9c90e8c0220fd341dc": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "2541fdc2e94247aab508ae79c3def6d7": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, 
"object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "257e57819b96473aaf512f61d62a57d9": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_aa9b2cbc1307478e805f735d938a3546", "IPY_MODEL_e4cb7f9a7537486cbddfb13c57ae7c09", "IPY_MODEL_13b6d5004cc64d67a46dac2c2452eb23"], "layout": "IPY_MODEL_76d6082fd84947949437d5809e934151"}}, "258cee43a0be4850ac25f425c4b1cc3f": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_d73b688acdba44a2ad89c92ce6153a0c", "max": 40.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_e3779b041324461eb68a37851e899963", "value": 40.0}}, "25f8a6e3d77844d2804a78cedcf79e5f": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": 
null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "26181fafa82f430dab9d294152e60ecf": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "2762fd8f9f0c4c4e87ebc2ca9ea843e2": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", 
"_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "27899444bd854cbbb68957cc37bdc15d": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "281b4f3ac301430589f8068f75febc90": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "289dba33db8a44b58178c628b4c1f3da": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", 
"state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "2954656e47e948d7b2b877e60b2f5bf3": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "29d8dae79a094be8853e030d80e3d9d2": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "29ef56d7400d4ea9a4a53c5a591d7f6e": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_5a9423f111894a3b9907fb1f9eca1826", "IPY_MODEL_e0207d263a5f435289f3c4fd79f2f0c3", "IPY_MODEL_501bc07531894026a5e831aae8e32c18"], "layout": "IPY_MODEL_9693ff87ee62414e997ed8166a030243"}}, "2ace45c17feb45ddb2ece2fe0ba1f38e": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": 
"@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_cfd16f7563604087a407b97d5e1af29f", "max": 40.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_1fabd40d482541188144c73793fb7cac", "value": 40.0}}, "2b19db000c0d4da2b4aa67aebc698ce3": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_80e99363f6634d5589ad8a66fe027ed1", "placeholder": "\u200b", "style": "IPY_MODEL_b1b504c2adc34ee99d363ceaefa43e70", "value": "Validation sanity check: 0%"}}, "2b7f8addc532411ba1d455956c9ef33d": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, 
"max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "2b8c7d8035ce46cc83e460afa5e96079": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_7bab0316f29c454e8d78451bcfce3fdf", "IPY_MODEL_6e03ab437e8043268a6de9dbe99085c7", "IPY_MODEL_12a96d79a23f49e593233c11258cc1ba"], "layout": "IPY_MODEL_4ec9c16f1ec64e17bdb2740b1ab35e30"}}, "2c3052af38294165bda5283aa0fd444f": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_573417c3f24e472296b7f26592a24155", "placeholder": "\u200b", "style": "IPY_MODEL_8bc8667b056f432c9256e42bb212bab5", "value": " 40/40 [00:01<00:00, 41.31it/s]"}}, "2c53cdd37f474e1e8845c3e070be0b51": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": 
"IPY_MODEL_34d66aad9af0429d928328ee7d7e3f0e", "placeholder": "\u200b", "style": "IPY_MODEL_670deef521d54465a95b84ec4fd2a173", "value": "Validating: 100%"}}, "2ca4d5329b084df0b17a5737993cfb43": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "2ce48d7137ef47e79912f9a78bf1ca06": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, 
"grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "2d1fa20403064769858bb4cce177ff4a": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "2d41f0971937454bbc65139c6f595f63": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_82df0c7e18334bb29176ed5ebdc8a6da", "max": 40.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_32552c3d3e0248a2a2685f1286c26895", "value": 40.0}}, "2dc4d71da4ae4ea1b0e5df1a7ab34dc9": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, 
"align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "2ecfef770cbf42c39241cba7dd6319b9": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "2f8037b7d6f943b594942290d79b6130": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": 
"LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "2ffa108ad10645a1b18413bd56b7d32a": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, 
"object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "312a5c8115a6439e86a581a0b892399a": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "31a45a8c81864c48be13eecf563fa8e6": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "31a6932351aa4dfb84a2d26f4f71bf82": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", 
"_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "32552c3d3e0248a2a2685f1286c26895": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "32afa96f636c4f8eafd51af14244276d": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_c62ef3187ae842bdaee3c4292b792d6f", "max": 40.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_34534e54a8e44eeab86a19770decd37b", "value": 40.0}}, "3321bd2d04a74315b5b937f121591995": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "33817b1ad96043c8b531eced9f189b33": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", 
"_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_d49067dafd874b49a1c3d0288b0edf88", "max": 40.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_58fd0973990d4e32ae15e8d3d2fac25e", "value": 40.0}}, "33f836df599e44f88641129b441a51fc": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "340172c2cd084bbbb189896ccf76779f": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": 
null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "34534e54a8e44eeab86a19770decd37b": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "34569022c125403fa42f989cd7a6677a": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "34b47bf1c5df4fa09fcc2fdc002e5722": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", 
"_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_3b5e104926314a50b388fae77aec2cb1", "max": 40.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_8e8a89ab50044f39b0bd15a946a0d30e", "value": 40.0}}, "34d66aad9af0429d928328ee7d7e3f0e": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "35ac61ebf2d94417a183c5e85963e76f": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, 
"grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "36208c417aec4e8b8cc4b4d36db804bd": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_2295acb193b2465fb3b749a6f3f9195c", "placeholder": "\u200b", "style": "IPY_MODEL_2954656e47e948d7b2b877e60b2f5bf3", "value": "Validating: 100%"}}, "3630871e0dbb473f929745f5c5d44b5d": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "363da95944f24deaa5693756bf690a76": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": 
"@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "365291d5f1a94dc5a9d8da5f0d414f3e": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "36c8c922093b41fcab2400f631bdc06b": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "382dc007ef7b4baaaf107dcd94fc67ef": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": 
"@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_6344a1f5d33544c4b23b797e271be18c", "placeholder": "\u200b", "style": "IPY_MODEL_462c1e01930c4ae791cdbb2e481b3638", "value": " 40/40 [00:01<00:00, 38.17it/s]"}}, "3897c2a7c1e1445fbc604c1a741c98e1": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_c1c99766fd58427bb5d1aa4bb932b494", "max": 40.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_0425ec3a0d7849b38e947a2f4cf56349", "value": 40.0}}, "38e6f6251cc247f2a70007beb7f40c80": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": 
null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "392d211b8a6947759a184062f2519e0c": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_0eff93661e2e4c6fbf791ba89304603f", "placeholder": "\u200b", "style": "IPY_MODEL_c362daa772754d47b0063b6671836a81", "value": " 197/197 [00:13<00:00, 14.27it/s, loss=0.041, v_num=0, val_loss=0.254, val_acc=0.927]"}}, "3933670d051445c2a966996be4aead2d": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_3cc22b487e6a4a709ac8bf74e290eda4", "IPY_MODEL_fe7af92e4442430d96daba437d4a374a", "IPY_MODEL_6b5ce997abf143f8b24d43f30d9999a9"], "layout": "IPY_MODEL_f0607cd375bf48418a683bc48438d6a0"}}, "3962343bfb0b44769ef42b5c98983b9c": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "39772d3d7ef847248356d5afe732000c": {"model_module": "@jupyter-widgets/base", 
"model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "3a67eda0941549d88440223701afe60a": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "3a9384ba911144e998da472f66de9476": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": 
"inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "3b5e104926314a50b388fae77aec2cb1": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "3ba524598e40487fa22cc827d0fd284b": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": 
"@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_e7942984bfe2435b8d1a6ca6dbdbc27e", "placeholder": "\u200b", "style": "IPY_MODEL_45af9cda0f0742a0a80dabe353f66563", "value": "Validating: 100%"}}, "3c2777e8a64f4057a3384b45af8ad60e": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "3ca4a11a4bf24aa1a58ce41c7d3d2498": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", 
"description_tooltip": null, "layout": "IPY_MODEL_14086e65c6e24ccebd05a4282991f8a5", "placeholder": "\u200b", "style": "IPY_MODEL_29d8dae79a094be8853e030d80e3d9d2", "value": "Validating: 100%"}}, "3cc22b487e6a4a709ac8bf74e290eda4": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_d1c9ce3bf4fc44fbb4daa41d31c1ed72", "placeholder": "\u200b", "style": "IPY_MODEL_63929ac1f75e4195a41d57a8181aa23c", "value": "Validating: 100%"}}, "3d2424c1751a42d3b71a7ee8c59e8491": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_55fc4e4d0dba4756a4d99466b1fcd21a", "IPY_MODEL_1cf638c8ce874c81aad1d6991f6d4403", "IPY_MODEL_c1dd76b2378445f48f47c199006c16e9"], "layout": "IPY_MODEL_436b257a82fd48a2b685791087532d47"}}, "3d2af261942848d3a2b6c9282837ebeb": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_c5fad9a2cc4f42f887817c472070b776", 
"max": 40.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_fba15de3823947c997157fd19ee23ba4", "value": 40.0}}, "3d48472bd8584bd999a934e99e4534a2": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_8d180bcc608e40349d00ad4f02174832", "max": 40.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_61c8e196a838467389cee416fa5c3733", "value": 40.0}}, "3d6312bdfa8e4d7baacc6e87d7b8eebc": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_c3deaaeda2cb4bd3a122130339ba7bbb", "placeholder": "\u200b", "style": "IPY_MODEL_ac7a1aa262334ec094a633c7aed94a72", "value": "Validating: 100%"}}, "3de93c5568264b628ce08d92a9e2bdde": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, 
"grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "3f1b09ad47b74af8bb89b4950d8ef999": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "3f223cafee19421782131b9f9bfcb873": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_22bba232b95049b2b2d1ac3bf1ee1d09", "max": 40.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_c27d2bf0ec8e4402a35653dd8da4b84d", "value": 40.0}}, "3f97b2d29d544bb788df0f53c6a3dba5": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": 
"@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "3fabbc3365a24ae98e4ddcd52b206868": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_ef90020e0959424193c5298f4ab9a190", "max": 197.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_a5ac4f0fd6fe4ff0a93e849b930717a6", "value": 197.0}}, "3fcf6bf3438a429ea8d182a0f143763e": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, 
"display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "405fe7ec85844f918ad93c8cd2daa06b": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "4078308e69eb4f789e37f28c5d267f85": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": 
null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "40d36134e0eb4dd0bc557a6c9c47d7bd": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "40ff73c7b3dc4556be5ecc1d35a6613f": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, 
"grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "410b71b0a20941c089e536e4e128d13b": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "41e40cffb2094d97afd7a8e037cf0d5b": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": 
"@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "4202db89a7a746bab07560c550105366": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "42a7109f566a424199400b71f736ec10": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_494313e50a4f4f7da351e74b310e0319", "placeholder": "\u200b", "style": "IPY_MODEL_0ceec98503a649368d6868abd90c5ab2", "value": " 40/40 [00:01<00:00, 40.97it/s]"}}, "42d5b26f1cb04b7495bb753b844e9fd6": {"model_module": "@jupyter-widgets/controls", 
"model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_d3f774b1b0404f198af51238375c574e", "max": 40.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_65ddb1327fa64c2e903b003551fc22e8", "value": 40.0}}, "42e3454797f547f98d8e58789be26c59": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "436b257a82fd48a2b685791087532d47": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": 
null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "44c208c346064816aa37fbc549b50ed4": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": 
null, "width": null}}, "45af9cda0f0742a0a80dabe353f66563": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "462c1e01930c4ae791cdbb2e481b3638": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "4664867aff844335bcaedda48bfe3310": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_109ca19434f2492cb50ddb48624fbef5", "placeholder": "\u200b", "style": "IPY_MODEL_7cf1b98468f946d29dce76701c9dc87a", "value": " 40/40 [00:01<00:00, 41.09it/s]"}}, "46b9c07e7b1545dc96651a56d933e2a4": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "471d838b49da478fa34ccc96b6ec926a": 
{"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "47208c4b604b47c382c1a3f773500da7": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "48bea9eace8c48a9a5aa452d5dfed96e": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": 
"IPY_MODEL_e9eff4cf4c714f2680f7e77dbb5a372c", "placeholder": "\u200b", "style": "IPY_MODEL_9d95159b37974aff8914b24c0d943a37", "value": "Validating: 100%"}}, "494313e50a4f4f7da351e74b310e0319": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "496688b3d51445aebf14a8ccbd529eed": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, 
"grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "4a36ee3223aa4003bf6c9c68b41ebca9": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "4a86d8dd5c4d43faa9b83359c8b579fa": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, 
"align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "4aab3345397a4b7b93504ade55c2d1ec": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "4ac072f3e25e4c02b3b3e0e18e406a9c": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": 
{"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "4b242be8d44b4627881cdf9527e1a9b9": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_d593afd8891e4b05ba9a03051d458764", "IPY_MODEL_e0fbc495e5d04f798a6cbfc91af1d0ed", "IPY_MODEL_b1954a59bdbf45ce91afe0766729fc53"], "layout": "IPY_MODEL_d2c757a2385045d3ab0adcf707dddba1"}}, "4b809c67a3f2448c9cfd7c34b8aa453f": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", 
"align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "4c36b11423d549cfaacf00c911dd0aa9": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_1d0bc1bfcb6941c0b97cab36f7ab810f", "placeholder": "\u200b", "style": "IPY_MODEL_0bed5eb371c54b7eb3fd9a73697732dc", "value": " 40/40 [00:01<00:00, 41.63it/s]"}}, "4c6b4042a5cf4501808c4c3cbd2a1ca1": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, 
"grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "4d118818f8cf4907816960bccee43c96": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "4d37c25af0834d6e8c7a53d704713ce1": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": 
"@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "4dac2f6ceaad4780b4452daf42ff31c7": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, 
"4ec9c16f1ec64e17bdb2740b1ab35e30": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "4f4648b512ae49ef94785386a4b95c48": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_afcf640856fe47e29b40125065435826", "IPY_MODEL_7be887614c9a4b02bafb06c04247b854", "IPY_MODEL_4c36b11423d549cfaacf00c911dd0aa9"], "layout": "IPY_MODEL_cacae5ca1e9d4283b9afe8e1916e8618"}}, "501bc07531894026a5e831aae8e32c18": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": 
"@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_79efd9bc5e2f4515acb71a95a0f1228a", "placeholder": "\u200b", "style": "IPY_MODEL_a5c6db3bbffd4e0fa2ae551c18a03b1a", "value": " 40/40 [00:01<00:00, 41.40it/s]"}}, "5107381a8622411cb492283123901aa0": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "5107961954384c8aaaeba31c1b5bc4c8": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", 
"description": "", "description_tooltip": null, "layout": "IPY_MODEL_312a5c8115a6439e86a581a0b892399a", "placeholder": "\u200b", "style": "IPY_MODEL_996b6c65885c4495b49d1f4e857026a2", "value": " 40/40 [00:01<00:00, 37.95it/s]"}}, "51c67493b2aa4e04af474b9d59af6a6c": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "52ca8ac78894431683ff393c47922053": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_d22a5b5a07714a7b9584aad405faee89", "IPY_MODEL_573e74a43a93462ab0e0e31aa9350a52", "IPY_MODEL_afac60f3d22346c3a68852bd55ea790a"], "layout": 
"IPY_MODEL_11af77bd1a3c4ed48b8f79dc3bc09ee1"}}, "52eae5f9929f4a0b962a3ff4447cea26": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "530f74cfa1894309b640a8910bafcccc": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "535725f3fc3d47d1834dd8c5512c4be3": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": 
"1.2.0", "_view_name": "StyleView", "description_width": ""}}, "552fc188b09645f4b397b21d960daf93": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "556562fbd5ed4226897e6cf42af6f527": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "5566375d2f014d478f2453b1738a4831": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, 
"padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "556c99df63284336986c9bda4f87842b": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "558d75fe32a542b39dd8d4bdbc96518a": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "55b36c54b9f14e74aec831f953af07ea": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": 
"@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_61b7018ed05440359e4154848b1539d4", "placeholder": "\u200b", "style": "IPY_MODEL_46b9c07e7b1545dc96651a56d933e2a4", "value": " 40/40 [00:01<00:00, 37.80it/s]"}}, "55fc4e4d0dba4756a4d99466b1fcd21a": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_de693622da2f4bb7b735600f02a60478", "placeholder": "\u200b", "style": "IPY_MODEL_47208c4b604b47c382c1a3f773500da7", "value": "Validating: 100%"}}, "56b17c0aa8a64f40968f6cadbe1149ab": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_19895a4d415d4b9fb4f7c3e3ffa56ede", "IPY_MODEL_df4ebdf10987433cb65c78dbf7e34b99", "IPY_MODEL_72a44be9f81f4117bf7754b66560ad0a"], "layout": "IPY_MODEL_ccd261d7a5764d43bcacce36b0f5db99"}}, "573417c3f24e472296b7f26592a24155": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, 
"align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "573e74a43a93462ab0e0e31aa9350a52": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_07728fa1b1644efdafa0f0d2934a04b1", "max": 1.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_eca7de566a424f17ae0b4b0d2f99f855", "value": 1.0}}, "57c2ff8ae9a24531bf52ee049c113cad": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "582fd37b71c74c259b2556b59425adee": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": 
"@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "58fd0973990d4e32ae15e8d3d2fac25e": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "5a00a23b5f2348198bec2c1e8110482b": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_cd17e0a2a3524fc5a548b86c61953b77", "placeholder": "\u200b", "style": 
"IPY_MODEL_f6f68d546ecb45ffb73be50d80994d1f", "value": " 40/40 [00:01<00:00, 37.04it/s]"}}, "5a9423f111894a3b9907fb1f9eca1826": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_887380ee431440efa0fa779b58a9070f", "placeholder": "\u200b", "style": "IPY_MODEL_d8ff45a13d3c4930b4eac298d783b7cf", "value": "Validating: 100%"}}, "5b065d928b3a4d6eab7911a18dccc14c": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "5b7e893c983d44c6914b42a32154b513": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "5b9dddecff0f432da833b80160ad7568": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": 
"", "description_tooltip": null, "layout": "IPY_MODEL_061ab79450ee4a1eadc75fc6a34c673a", "placeholder": "\u200b", "style": "IPY_MODEL_1d32fa9c13af4fb69f2e7cea9a5ffab9", "value": " 0/2 [00:00<?, ?it/s]"}}, "5c03b886ad694e53861e7dceebdf0268": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_f5438eeef53847ba95d157f56e438488", "placeholder": "\u200b", "style": "IPY_MODEL_6ab8985820164656ad60b9fbbe1e9db6", "value": "Validating: 100%"}}, "5cffc262cf264cbb9aa5e34a41176974": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, 
"5d3e25d0f248411da504f0a0df9c0e2d": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_582fd37b71c74c259b2556b59425adee", "placeholder": "\u200b", "style": "IPY_MODEL_d407101ddcc74699a620bbd6a9628bff", "value": " 40/40 [00:01<00:00, 40.97it/s]"}}, "5d937ee650f642d1aff4dcac62eb60b4": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_17d2cf8733d24e43988554c1aac65490", "placeholder": "\u200b", "style": "IPY_MODEL_f4fb223218124ea6a02efef412bac44a", "value": "Validating: 100%"}}, "5e17f6802c6749b0b906adc69c6ba1e9": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_10ebfd89ac8743988d3afde159a8daa1", "IPY_MODEL_bdd9067ae2bd48aa9eff55c12ba2a8de", "IPY_MODEL_c1609608c09b4580861adb27dd251f36"], "layout": "IPY_MODEL_5cffc262cf264cbb9aa5e34a41176974"}}, "5ed5caa95d6249e1bf43b2610b56b266": {"model_module": "@jupyter-widgets/controls", "model_module_version": 
"1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_5d937ee650f642d1aff4dcac62eb60b4", "IPY_MODEL_0e2a984e8cc043f5b58c6508689078ad", "IPY_MODEL_4664867aff844335bcaedda48bfe3310"], "layout": "IPY_MODEL_4d118818f8cf4907816960bccee43c96"}}, "5fea728b72f343eeba2ea5e3750d8aed": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "605f32169bcd4c8ea8c309e9d7638595": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": 
"@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_913954479b9e42789254d32050020788", "IPY_MODEL_0fad7f239d664ad29b3c069a3e5cf4c2", "IPY_MODEL_2c3052af38294165bda5283aa0fd444f"], "layout": "IPY_MODEL_1b610b37a5224b12a2bcee275a388a61"}}, "608e803ac821482db32298d68e280acd": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "60cce88461724ab582baf5e4e7653386": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "61b7018ed05440359e4154848b1539d4": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, 
"justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "61c8e196a838467389cee416fa5c3733": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "62c0abdd86f543a6860fb5b514b6028f": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "62defc9448f14799a799664a6e93e99d": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_4c6b4042a5cf4501808c4c3cbd2a1ca1", "max": 40.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_75b74524c9ce4147a12ee83304575022", "value": 40.0}}, "6344a1f5d33544c4b23b797e271be18c": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", 
"model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "638225841dcb42bdbc24ab03315c976a": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_72b9b7bf3f244f3c82de65666a8a0581", "placeholder": "\u200b", "style": "IPY_MODEL_d7f9bf3cbe3f4160a09f5376dae9e096", "value": " 40/40 [00:01<00:00, 38.06it/s]"}}, "638f18d72e704478b58126fee0504686": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": 
"@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_78f79019e20f42fd986deb90cfeff8ab", "IPY_MODEL_08a677083e9a4a54a0ae80297ffbac0b", "IPY_MODEL_c51670dd5d7e4d54be75ebd22696d49b"], "layout": "IPY_MODEL_4078308e69eb4f789e37f28c5d267f85"}}, "63929ac1f75e4195a41d57a8181aa23c": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "648c1d314aff4a5989917ea9cfb40ee4": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "6584051a70a7443f811094bb8bb1b7ba": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_908454428cd14d04999314d984b9422e", "IPY_MODEL_e62c3cbcb0564497b0215b03c619f0a2", "IPY_MODEL_a7062d3276dc4584bd580ce31d23250a"], "layout": "IPY_MODEL_78d77f6a76f8468b9e2f7f42f4222213"}}, "65ddb1327fa64c2e903b003551fc22e8": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": 
"@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "664cb138f57949dfbc68e0fdcbb7144e": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_1fc2fe3fcf5f492c91ad6fcefe9bbbd5", "IPY_MODEL_abcd702d4ccc492d93335618be15bf9d", "IPY_MODEL_df39f2726d03413ea1f46df9f7f4e16e"], "layout": "IPY_MODEL_6a1523a59cc84dab9155b7de57fc51be"}}, "667623f52df34426af41915a0c6857c7": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_1ad088f478ef4874bd0ba0e322387932", "max": 40.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_7015d1201f164432a3251437cca5be46", "value": 40.0}}, "668d9e48134f477fb12df091d0b7b2c3": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", 
"description_tooltip": null, "layout": "IPY_MODEL_22f0e92c33f040b987eea86cc152ae75", "placeholder": "\u200b", "style": "IPY_MODEL_81d5b0aebde6419d9a21a71fa43b146d", "value": " 40/40 [00:01<00:00, 38.46it/s]"}}, "670deef521d54465a95b84ec4fd2a173": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "67e47d323fa6415896f68e98ed39242e": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "6a1523a59cc84dab9155b7de57fc51be": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": 
null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "6ab8985820164656ad60b9fbbe1e9db6": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "6b3fd758e2414d97a24b249abf45b2d1": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_05ed6750b13e4928846c6a3626a2a2bd", "placeholder": "\u200b", "style": "IPY_MODEL_03d4fb52bb2c460b8164142c6a8b3e8a", "value": " 40/40 [00:01<00:00, 40.41it/s]"}}, "6b5ce997abf143f8b24d43f30d9999a9": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_cac8b41d9a92451db93dccda6b5ccf2e", "placeholder": "\u200b", "style": "IPY_MODEL_2394fc85d30d457d9edfc5ed0c0718e2", "value": " 40/40 [00:01<00:00, 39.96it/s]"}}, "6b6968df7bb34058b2548fc8d67f10b7": 
{"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "6bafb7e9a54a4abdb2b72bb7fdef79a6": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "6c12cb82a52f4703a3afcbee54c82e3f": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": 
null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "6c19c1928aad4db281729dceb27947b2": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "6c2d3949d97443bbadb861144c5a9403": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": 
{"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_1489d138c9cd4c9bb49c6ebfed2a1317", "placeholder": "\u200b", "style": "IPY_MODEL_34569022c125403fa42f989cd7a6677a", "value": "Validating: 100%"}}, "6c6a4a78c5244926b5ab585c71b22b31": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_c6c19d03f7334159909e66b6419d5085", "IPY_MODEL_32afa96f636c4f8eafd51af14244276d", "IPY_MODEL_9d369d8ae62d4315b36fad5753458e06"], "layout": "IPY_MODEL_27899444bd854cbbb68957cc37bdc15d"}}, "6d08e235cef542568fd7741e38ae73bb": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_9f7e30219ae345bbae61342a7d3415de", "IPY_MODEL_0a6e971473a845dbaf7dd70544a4fb4e", "IPY_MODEL_e3f10177a72948828fa102c2424cdbb1"], "layout": "IPY_MODEL_2ecfef770cbf42c39241cba7dd6319b9"}}, "6d3d89cfaac34c87bb9d4abecf5ca39c": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", 
"_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "6dcdd5a2689e4a859bacf94fa50b7b65": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_1e4437d1f3004a869ff875f935e6096e", "max": 40.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_530f74cfa1894309b640a8910bafcccc", "value": 40.0}}, "6dda5e78cb8e4728a315e1c052bd7bc9": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", 
"description": "", "description_tooltip": null, "layout": "IPY_MODEL_6ebcce28d37747fabd71debd16e24ec5", "max": 40.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_237abb092dc24a03977a37e02a700282", "value": 40.0}}, "6e03ab437e8043268a6de9dbe99085c7": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_dceda10c727d4cce9a9976d60896b888", "max": 40.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_3f1b09ad47b74af8bb89b4950d8ef999", "value": 40.0}}, "6eac74d845bb40709e203b62c6b0453f": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_779896bca5d940b280a04b700f733cfb", "placeholder": "\u200b", "style": "IPY_MODEL_21e0696ab83b479bb28bdf8ad31a6a01", "value": " 40/40 [00:01<00:00, 40.75it/s]"}}, "6ebcce28d37747fabd71debd16e24ec5": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, 
"bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "6ebf16d170884218836f567c6624cf1c": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "6f6727a7c5ce49a68d254766bd2c56f3": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, 
"max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "6f926ce2f6504e2caa5992aad503e942": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "6f9a37425e114b73801eeb7e97580200": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "6faea2c255e14670a7afbcb3f1f68fc3": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": 
{"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "7015d1201f164432a3251437cca5be46": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "704e66960a204403a5f4f89a9a15ead1": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "71223c1c01744836a04d36ae0daeda23": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": 
"DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "71e268e4a03840a480f268ce072f5be8": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_f792ef8d3d3642e68f7b5f226a1dcd5e", "placeholder": "\u200b", "style": "IPY_MODEL_289dba33db8a44b58178c628b4c1f3da", "value": "Validating: 100%"}}, "71e68f3d7467406ba056edd127a4b8ec": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, 
"right": null, "top": null, "visibility": null, "width": null}}, "721f24953e8f4d09bdcb431bb7b0d3cd": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "7223547950ec4f0abb4178506b4b5f93": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "727948d722bc4f8a8a8a73e8c3db95b2": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_95e89ee09e5447c9b984d38c6f6715e6", "max": 40.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_e4c405cc7a194ecb9d121ff54b15d90e", "value": 40.0}}, "729ae8a5142b414d879d0c49ca9d9742": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", 
"_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_3d6312bdfa8e4d7baacc6e87d7b8eebc", "IPY_MODEL_00546a0bf8f647af912556b130e3909c", "IPY_MODEL_0440b10cf4f441fe843002eec4c8613e"], "layout": "IPY_MODEL_4dac2f6ceaad4780b4452daf42ff31c7"}}, "72a44be9f81f4117bf7754b66560ad0a": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_99113cd146b44349a75e67efec13ccb8", "placeholder": "\u200b", "style": "IPY_MODEL_5b065d928b3a4d6eab7911a18dccc14c", "value": " 40/40 [00:01<00:00, 41.30it/s]"}}, "72b9b7bf3f244f3c82de65666a8a0581": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, 
"visibility": null, "width": null}}, "731875ee32dc4c7b925239b1c3d08b9b": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "7337db267f3d419ab12ca1ecde8bec6d": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_b4c522f9247b4ffdb77962a600ab9135", "placeholder": "\u200b", "style": "IPY_MODEL_9920ec0a3fe946dcbf869b1e03f31e6d", "value": " 40/40 [00:01<00:00, 38.03it/s]"}}, "739bd3b55771434897638447109dadbc": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], 
"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_ba40c658c1c645df85b0edd784e70f67", "max": 40.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_d04a087ecb834c029b6dbc65f40d903f", "value": 40.0}}, "73a78a6b3957447da7f88492c1c0de36": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_75e902dbc9734435b9903de6cc344530", "IPY_MODEL_19ef5cd49b4e4f16aa5d557bede8de6e", "IPY_MODEL_9199845a8a8b450595630238279489de"], "layout": "IPY_MODEL_a4901b611fe04be69811d4abec2f979a"}}, "74553b52649d485681cc6171b8367bdb": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": 
null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "7512d436c11543f7ae1e7b77269779bc": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "7525800113e049808ea8b820e07125f8": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_4ac072f3e25e4c02b3b3e0e18e406a9c", "placeholder": "\u200b", "style": "IPY_MODEL_552fc188b09645f4b397b21d960daf93", "value": 
"Validating: 100%"}}, "75b74524c9ce4147a12ee83304575022": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "75e902dbc9734435b9903de6cc344530": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_5107381a8622411cb492283123901aa0", "placeholder": "\u200b", "style": "IPY_MODEL_9dd7290bc6c9434da78d89ac36b662fd", "value": "Validating: 100%"}}, "7681fbb8aa304c03a9732a9c95f63ef9": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": 
null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "76c56c21d24541e49d001359174d8a06": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "76d6082fd84947949437d5809e934151": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "76f4c9460c2544fabd27af4240792134": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": 
"@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "77265d2f46524f789f5803628aaa8bb8": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "779896bca5d940b280a04b700f733cfb": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, 
"grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "779ed45ace6b4434a574e897384a0f52": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "77fe203b76bd43c2a5dcd03f0fa19fe9": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": 
null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_1dcd0d34b8304b14a795e394769c5e73", "placeholder": "\u200b", "style": "IPY_MODEL_31a45a8c81864c48be13eecf563fa8e6", "value": " 40/40 [00:01<00:00, 40.76it/s]"}}, "78097292f6484ec1ade092c7bce9f457": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "781c2d73c32241af8536cea64f470739": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "danger", "description": "", "description_tooltip": null, "layout": 
"IPY_MODEL_a5c3635b42814a7982cca677d130aabf", "max": 2.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_87e730ffae1c4c54b9e8fe45d15ac50d", "value": 0.0}}, "78d77f6a76f8468b9e2f7f42f4222213": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "78dcf8ab81484972bef98ee4808976a3": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_e87d5f0d76364422b001e9ba2009efd6", "IPY_MODEL_42d5b26f1cb04b7495bb753b844e9fd6", "IPY_MODEL_e14d135655704cee9e05ebdae198a92d"], "layout": "IPY_MODEL_dd99a71bd47844b69476dbc31a63e3c5"}}, "78f79019e20f42fd986deb90cfeff8ab": 
{"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_dae97dcd99ab412794e592f9eef4fcdd", "placeholder": "\u200b", "style": "IPY_MODEL_9b768c3f38414e3f88ae0c3add6475e4", "value": "Validating: 100%"}}, "79efd9bc5e2f4515acb71a95a0f1228a": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "7a959e215a164e54aec9c5c1729fb4cd": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", 
"_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_3ca4a11a4bf24aa1a58ce41c7d3d2498", "IPY_MODEL_98b2037a54ef42188de9446df543151b", "IPY_MODEL_1d3b103a11964a219559f9f13ba9ac28"], "layout": "IPY_MODEL_000e17cab12b4a16a5bb24fd4c8e6c3d"}}, "7bab0316f29c454e8d78451bcfce3fdf": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_4b809c67a3f2448c9cfd7c34b8aa453f", "placeholder": "\u200b", "style": "IPY_MODEL_e3bdf937acbc4aec97813939d969d48c", "value": "Validating: 100%"}}, "7be887614c9a4b02bafb06c04247b854": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_be6125a2050e4c97ad54c5e536c7afdf", "max": 40.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_beaa1e52816c41c0967f26b2e1c78546", "value": 40.0}}, "7cbdcb186be240daa066b9a04ed3dca3": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", 
"_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "7cf1b98468f946d29dce76701c9dc87a": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "7d42a6086e82421a9e595b43ad729c72": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_2ca4d5329b084df0b17a5737993cfb43", "max": 40.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_174fb53b8ed247ebb714ec07b7abf26e", "value": 40.0}}, "7df7c6698b064aaa92cbabaa7e6167dc": {"model_module": "@jupyter-widgets/controls", "model_module_version": 
"1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_8ad6c9c3073c49c1bfd83c6240832ab5", "IPY_MODEL_a0c98a98b6c84325a3ad30bcc5040c03", "IPY_MODEL_fab8109d1b334fe781851edfb02cfb44"], "layout": "IPY_MODEL_9c8adb261d2042fca1791aec070ea340"}}, "7e8eee7d4e4b4d208dc8aaee31968781": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_8b2c33d6154d4557b30ef5e12200e8ee", "max": 40.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_9c532ce1146d4e1dbbcd2b3f782ff80c", "value": 40.0}}, "7eabd69400ff400daf651d434b6dc643": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "7eed8b7bd0bd41738ad7f3cef6dabfbc": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", 
"_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_ee0b4a9189cd4eb1ad630d7d45f10283", "placeholder": "\u200b", "style": "IPY_MODEL_e442a229b0e14efbbe6bbe05d188c8d7", "value": " 40/40 [00:01<00:00, 41.20it/s]"}}, "7fca13154b964dcd891a26420f4ecc4e": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "80e99363f6634d5589ad8a66fe027ed1": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "810fdf5d48554b6198f4f470baffc034": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", 
"state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_8efc1a19d4f14cd8b996a4982ffab9d6", "placeholder": "\u200b", "style": "IPY_MODEL_ab84751327534b3990319ea653ae2a62", "value": " 40/40 [00:01<00:00, 38.22it/s]"}}, "81d5b0aebde6419d9a21a71fa43b146d": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "8249bc65e7c14b708596bd66de402e61": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "82af5d90d4084ce9875b6e7ed0a8be8d": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "82df0c7e18334bb29176ed5ebdc8a6da": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", 
"_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "83efcf75a4b14eb48238dfe52978f137": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, 
"padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "85b4d00008d84934acb2a3a0300977da": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "86557445ad984f038bc35ea22977b002": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_3c2777e8a64f4057a3384b45af8ad60e", "placeholder": "\u200b", "style": "IPY_MODEL_8af8badd7aff46e1ae830a787428f307", "value": "Validating: 100%"}}, "86dbf891d6594a20a46e44de2dde8500": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": 
{"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "87e730ffae1c4c54b9e8fe45d15ac50d": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "8822777752c042978be232ecf99811bb": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "88359b1570cf4d278afcc12b52ca5cf3": {"model_module": "@jupyter-widgets/controls", 
"model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_36c8c922093b41fcab2400f631bdc06b", "placeholder": "\u200b", "style": "IPY_MODEL_97c8405dea494331a4b840d715774e9e", "value": " 40/40 [00:01<00:00, 41.18it/s]"}}, "887380ee431440efa0fa779b58a9070f": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "88a8d15063f74146bb9740c199a0263c": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, 
"_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "895f50a960ef4de58e09ffaab83498a7": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "8a0481c1451549c0bc682a58facfdc39": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "8a088cec1f3e490ca376df311ac639c3": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, 
"_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "8a11d75adfed4ef2a84d4b92fb8a51e3": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "8a81ec850d2a4f89bfc568ec39f84e1d": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_d061820e73bb4ae7b1fc4384aaa911ef", "placeholder": "\u200b", "style": "IPY_MODEL_e0938103b55e4109bba1bd6a4c9c4a39", "value": " 40/40 [00:01<00:00, 41.20it/s]"}}, "8aa60a1e120540efb36aefb2ea7c6158": 
{"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_6c2d3949d97443bbadb861144c5a9403", "IPY_MODEL_2ace45c17feb45ddb2ece2fe0ba1f38e", "IPY_MODEL_6eac74d845bb40709e203b62c6b0453f"], "layout": "IPY_MODEL_f352e4d278dc4cda94f82a3846236f56"}}, "8ad6c9c3073c49c1bfd83c6240832ab5": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_b97c2ea5358243679d1d4e31a8b05cbc", "placeholder": "\u200b", "style": "IPY_MODEL_721f24953e8f4d09bdcb431bb7b0d3cd", "value": "Validating: 100%"}}, "8af8badd7aff46e1ae830a787428f307": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "8b1a113312574d8a96b116058e4c9251": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", 
"_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "8b2c33d6154d4557b30ef5e12200e8ee": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "8bc8667b056f432c9256e42bb212bab5": {"model_module": 
"@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "8c9494e571964db491151ef9b8b845e2": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "8cb60ad796bf4128af276b330260edca": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "8d180bcc608e40349d00ad4f02174832": 
{"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "8e8a89ab50044f39b0bd15a946a0d30e": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "8ee337c0a7fd40dd87d9999965079d66": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", 
"description": "", "description_tooltip": null, "layout": "IPY_MODEL_024680be6f384e20a19910a8db277616", "max": 40.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_8a11d75adfed4ef2a84d4b92fb8a51e3", "value": 40.0}}, "8ef7076c24ac4e3da9bc42adb84288d7": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "8efc1a19d4f14cd8b996a4982ffab9d6": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": 
null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "8f2bc8575c9d477aae95569141884d3b": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "908454428cd14d04999314d984b9422e": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_a50b3137d9c9433e9f6c9bfcc120cafc", "placeholder": "\u200b", "style": "IPY_MODEL_cce80a39b9d840f4a7dd7b3817da1de9", "value": "Validating: 100%"}}, "913954479b9e42789254d32050020788": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", 
"description_tooltip": null, "layout": "IPY_MODEL_ebd6e86e6d364bfda696270bcd1285bc", "placeholder": "\u200b", "style": "IPY_MODEL_405fe7ec85844f918ad93c8cd2daa06b", "value": "Validating: 100%"}}, "9156902c48df4de4871d0325cf148752": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "9199845a8a8b450595630238279489de": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_1f2fa122be4545b6af4db56d669469e9", "placeholder": "\u200b", "style": "IPY_MODEL_6f926ce2f6504e2caa5992aad503e942", "value": " 40/40 [00:01<00:00, 37.06it/s]"}}, "9204f19c687749b4b9d8c58c9c5936d2": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_ec1a8cd04f67429fa8fa11d2dabea42a", "IPY_MODEL_d0efda7e12494752b39085bbffd4a6d1", "IPY_MODEL_9253725ef50148e48e5d8a1a1c30847b"], "layout": "IPY_MODEL_e9d179241fa845b98f5d31c870a271d8"}}, "9253725ef50148e48e5d8a1a1c30847b": {"model_module": "@jupyter-widgets/controls", 
"model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_c62e8526bfe34ecda82253d53329b7da", "placeholder": "\u200b", "style": "IPY_MODEL_3962343bfb0b44769ef42b5c98983b9c", "value": " 40/40 [00:01<00:00, 41.08it/s]"}}, "92978f1abdd34477bb7ec0325a838cc7": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "93b06cad51a14b71911ec76dcaa59e83": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, 
"overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "9438d4a6012b47c8807ebda5adce1712": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_36208c417aec4e8b8cc4b4d36db804bd", "IPY_MODEL_1791c0d96d094df2ace36a97551cfff6", "IPY_MODEL_0e7532eb90c044f0b8dc0d480a9a8f98"], "layout": "IPY_MODEL_1243b677bc9d45e5b6e28a1e33612d18"}}, "953da11bc35d4b51ab1dea85dad0a8bb": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_6c12cb82a52f4703a3afcbee54c82e3f", "placeholder": "\u200b", "style": "IPY_MODEL_41e40cffb2094d97afd7a8e037cf0d5b", "value": "Validating: 100%"}}, "959f41fc01f14eb896043296b3b9fa2e": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "95dd373c362b4f4f989389cca1bf9bba": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": 
{"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "danger", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_93b06cad51a14b71911ec76dcaa59e83", "max": 2.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_2762fd8f9f0c4c4e87ebc2ca9ea843e2", "value": 0.0}}, "95e821bc924e42b38ef068733a15a96e": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "95e89ee09e5447c9b984d38c6f6715e6": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", 
"_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "962e49594a8b455f8f3f5c9501deb987": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_e773d5290c3c481e80ec46e4337703ac", "IPY_MODEL_beb2d424cca549e3994971502cc2bc15", "IPY_MODEL_392d211b8a6947759a184062f2519e0c"], "layout": "IPY_MODEL_2ce48d7137ef47e79912f9a78bf1ca06"}}, "9693ff87ee62414e997ed8166a030243": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", 
"grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "97c8405dea494331a4b840d715774e9e": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "97ca9563964441899f571f985aa19800": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "9893b65283724b288b89fd1114dc79f5": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_b8c893a656f44893912011b8ced212aa", 
"IPY_MODEL_3d2af261942848d3a2b6c9282837ebeb", "IPY_MODEL_bdca9160cad440f58fe24de81345b6fb"], "layout": "IPY_MODEL_06a89e7eb1cf4eb9b31b1792b6022475"}}, "98b2037a54ef42188de9446df543151b": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_c658abd81ef747f3aacf84adeabaa613", "max": 40.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_6b6968df7bb34058b2548fc8d67f10b7", "value": 40.0}}, "98c2bb8dfd9f42e7ba3a70833d3a9cf2": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, 
"99113cd146b44349a75e67efec13ccb8": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "991c9442e91f483792474ebe4f09d152": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, 
"max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "9920ec0a3fe946dcbf869b1e03f31e6d": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "996b6c65885c4495b49d1f4e857026a2": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "99ce588597484149b5d5dfe5cbd055a1": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": 
null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "9a0dc5ee46ef43ab9610085cd998f750": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_10e2de30c7fa4812a7c096bfec3334ad", "placeholder": "\u200b", "style": "IPY_MODEL_82af5d90d4084ce9875b6e7ed0a8be8d", "value": " 0/2 [00:00<?, ?it/s]"}}, "9adfc41d30154a99938b0d97fa767e21": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_5c03b886ad694e53861e7dceebdf0268", "IPY_MODEL_33817b1ad96043c8b531eced9f189b33", "IPY_MODEL_55b36c54b9f14e74aec831f953af07ea"], "layout": "IPY_MODEL_8b1a113312574d8a96b116058e4c9251"}}, "9b768c3f38414e3f88ae0c3add6475e4": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, 
"9c0e4986ee594a8abd5a65453b5d896a": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "9c532ce1146d4e1dbbcd2b3f782ff80c": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "9c8adb261d2042fca1791aec070ea340": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": 
null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "9d369d8ae62d4315b36fad5753458e06": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_8cb60ad796bf4128af276b330260edca", "placeholder": "\u200b", "style": "IPY_MODEL_535725f3fc3d47d1834dd8c5512c4be3", "value": " 40/40 [00:01<00:00, 41.09it/s]"}}, "9d95159b37974aff8914b24c0d943a37": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "9dd7290bc6c9434da78d89ac36b662fd": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": 
"@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "9ea460da748d4d009fdb4416fc5ba362": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_b00d3649a1ed4aee83941ec3499cb5b1", "IPY_MODEL_95dd373c362b4f4f989389cca1bf9bba", "IPY_MODEL_5b9dddecff0f432da833b80160ad7568"], "layout": "IPY_MODEL_98c2bb8dfd9f42e7ba3a70833d3a9cf2"}}, "9ef0cc8972ec476babb87467b9ff6a00": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_abca9201b3a7431898b41f1296e9e47b", "IPY_MODEL_a1a3aa50e30d46fbb95b70d42d8134de", "IPY_MODEL_668d9e48134f477fb12df091d0b7b2c3"], "layout": "IPY_MODEL_05414796bb8b4c4095db6029e7c298ba"}}, "9f7e30219ae345bbae61342a7d3415de": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": 
"IPY_MODEL_fb6196786a4c449da5bfc3b74974f5b7", "placeholder": "\u200b", "style": "IPY_MODEL_88a8d15063f74146bb9740c199a0263c", "value": "Testing: 100%"}}, "a0c98a98b6c84325a3ad30bcc5040c03": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_d19b21b31c1b4251989052b2a9405736", "max": 40.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_0014f8f4f49841aaa7c1a64c57b2d49b", "value": 40.0}}, "a0e32c7a94a744f8af40b68c9d2f8113": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "a0ed6130ec664309837dff68eb1609a3": 
{"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "a10691f4cc5f4264821e505be23d5c0d": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "a14120d2181444b3a233980b6ca6bbe4": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, 
"a164e2d5015a442da8aaca5abe9b64ea": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_118e280fa5af441b80565177c090e25d", "placeholder": "\u200b", "style": "IPY_MODEL_cc76969b57f54e5a99a1c2ca9a23d657", "value": " 40/40 [00:01<00:00, 40.74it/s]"}}, "a1a3aa50e30d46fbb95b70d42d8134de": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_1346ed84515b4784be24ab3b6739983d", "max": 40.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_b4d729133c2b48c0a791338890f0e427", "value": 40.0}}, "a25c3623d687465cae93c39b76c3ce65": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_7cbdcb186be240daa066b9a04ed3dca3", "max": 40.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_31a6932351aa4dfb84a2d26f4f71bf82", "value": 40.0}}, 
"a34763ee634d44768c767c2355e57e7a": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "a47d56c8623841ffba64e31bb3294bfa": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, 
"max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "a4901b611fe04be69811d4abec2f979a": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "a50b3137d9c9433e9f6c9bfcc120cafc": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": 
null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "a56807f9e014434fb9f5ec740db1cdf4": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "a5ac4f0fd6fe4ff0a93e849b930717a6": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "a5c3635b42814a7982cca677d130aabf": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": 
null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "a5c6db3bbffd4e0fa2ae551c18a03b1a": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "a7062d3276dc4584bd580ce31d23250a": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_bd88a232244c411dbb7fd992c1027448", "placeholder": "\u200b", "style": "IPY_MODEL_d728bc80d8df41ea88685e94f199eff8", "value": " 40/40 [00:01<00:00, 38.13it/s]"}}, "a71887abf4ff44b99939cdb9fdd47db7": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": 
"@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_3ba524598e40487fa22cc827d0fd284b", "IPY_MODEL_abdb8fc6f4ea4ee2b3e679e591afc37e", "IPY_MODEL_f187affa322744d7822bac58e3d366ee"], "layout": "IPY_MODEL_2541fdc2e94247aab508ae79c3def6d7"}}, "a7293a6474ce4e9499a1d0159c9d2034": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_2c53cdd37f474e1e8845c3e070be0b51", "IPY_MODEL_739bd3b55771434897638447109dadbc", "IPY_MODEL_a164e2d5015a442da8aaca5abe9b64ea"], "layout": "IPY_MODEL_2b7f8addc532411ba1d455956c9ef33d"}}, "a73cdacebbd14b3b9c697a62b8a758ee": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_48bea9eace8c48a9a5aa452d5dfed96e", "IPY_MODEL_0046c6e7fea345d28a76745b89586893", "IPY_MODEL_382dc007ef7b4baaaf107dcd94fc67ef"], "layout": "IPY_MODEL_51c67493b2aa4e04af474b9d59af6a6c"}}, "a85a055c9d844ad2b9bacb9583402386": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", 
"description_width": ""}}, "a94008efe3024367adc524556ecb73e9": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_ffb2fbfef1064080b54b648785376dc5", "placeholder": "\u200b", "style": "IPY_MODEL_d1e0d12030ef4e4a8b237e92e1889f0e", "value": " 40/40 [00:01<00:00, 41.11it/s]"}}, "aa81d9f10a1343688ab35aed5fa9a733": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "aa9b2cbc1307478e805f735d938a3546": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": 
"@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_0bb72c82108147e1a13350b851a960e5", "placeholder": "\u200b", "style": "IPY_MODEL_62c0abdd86f543a6860fb5b514b6028f", "value": "Validating: 100%"}}, "ab1556a4dab6495da3a22de9eb920871": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "ab84751327534b3990319ea653ae2a62": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, 
"abca9201b3a7431898b41f1296e9e47b": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_b661d6f3970340209af6cdc59f9bc324", "placeholder": "\u200b", "style": "IPY_MODEL_174cce3b873b4c2a8e173f5805d837c8", "value": "Validating: 100%"}}, "abcd702d4ccc492d93335618be15bf9d": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_d2e50bfa91c0493d8c1e5e956f46b514", "max": 40.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_3630871e0dbb473f929745f5c5d44b5d", "value": 40.0}}, "abdb8fc6f4ea4ee2b3e679e591afc37e": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_78097292f6484ec1ade092c7bce9f457", "max": 40.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_8822777752c042978be232ecf99811bb", "value": 40.0}}, 
"abeba1de74a4420d9a46da3ee64dab2d": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "ac7a1aa262334ec094a633c7aed94a72": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "ad8f945d28464a879d7686f7d7595509": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, 
"align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "ae8bb373e5d7456d9627b43c3d1fa8ed": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "afac60f3d22346c3a68852bd55ea790a": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": 
"HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_0027c59a46544bef8bf57f2d9eedb383", "placeholder": "\u200b", "style": "IPY_MODEL_8f2bc8575c9d477aae95569141884d3b", "value": " 40/40 [00:01<00:00, 39.90it/s]"}}, "afcf640856fe47e29b40125065435826": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_c3e1b0656e78474886a5dd89b80d99cf", "placeholder": "\u200b", "style": "IPY_MODEL_029ded4281f84e23a64442a8c51ad87d", "value": "Validating: 100%"}}, "b00d3649a1ed4aee83941ec3499cb5b1": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_2f8037b7d6f943b594942290d79b6130", "placeholder": "\u200b", "style": "IPY_MODEL_e5b1df60b8d64f8bbca251ea1aa45fc9", "value": "Validation sanity check: 0%"}}, "b09d28854ea24312b741c7e4bef86735": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": 
"1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "b131dac2a55c4445bc5f49457e59cefb": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "b1954a59bdbf45ce91afe0766729fc53": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_f5b91ccd114d43dd83abfe60d5666295", "placeholder": "\u200b", "style": "IPY_MODEL_b09d28854ea24312b741c7e4bef86735", "value": " 40/40 [00:01<00:00, 37.71it/s]"}}, 
"b1b504c2adc34ee99d363ceaefa43e70": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "b4c522f9247b4ffdb77962a600ab9135": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "b4d729133c2b48c0a791338890f0e427": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, 
"description_width": ""}}, "b52a63138c094b7893e021bc49c0c89e": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "b5b4aa182c534419be2c9f72ca2f62d6": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "b5f729672dbe4f1784a511c5841f4e7b": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", 
"_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_496688b3d51445aebf14a8ccbd529eed", "placeholder": "\u200b", "style": "IPY_MODEL_0b34e1a046f14629b409b16c1f1bd8e1", "value": " 40/40 [00:01<00:00, 40.96it/s]"}}, "b661d6f3970340209af6cdc59f9bc324": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "b742a674c72f440aa5399890549262c4": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "b77a76f27de54c2183bea1ad9864dc95": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": 
{"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "b825fe85788a46119b9da2f3f0168a69": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_a34763ee634d44768c767c2355e57e7a", "placeholder": "\u200b", "style": "IPY_MODEL_c3b5ddb8b461432d9979ea0473d89c60", "value": "Validating: 100%"}}, "b8b046652eb14f2fbb40712fbe04995b": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_7525800113e049808ea8b820e07125f8", "IPY_MODEL_3f223cafee19421782131b9f9bfcb873", "IPY_MODEL_b5f729672dbe4f1784a511c5841f4e7b"], "layout": "IPY_MODEL_95e821bc924e42b38ef068733a15a96e"}}, "b8c893a656f44893912011b8ced212aa": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": 
"IPY_MODEL_99ce588597484149b5d5dfe5cbd055a1", "placeholder": "\u200b", "style": "IPY_MODEL_c3d08c9ab755494196759d9dccafc132", "value": "Validating: 100%"}}, "b9415f0976ae48e1a5371a5e9f8d84bd": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "b97c2ea5358243679d1d4e31a8b05cbc": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, 
"grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "b9de98eebdb34b8e9c55081ebd753057": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_1259349431444f968af6416e4c991b47", "IPY_MODEL_6dda5e78cb8e4728a315e1c052bd7bc9", "IPY_MODEL_e7a99e4d130f498abb222496b5671ef4"], "layout": "IPY_MODEL_25f8a6e3d77844d2804a78cedcf79e5f"}}, "ba40c658c1c645df85b0edd784e70f67": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, 
"object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "baeb194ab5ed4089b8cfea9c622c7485": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_c72cde952f804bb3a70852ecef68bcaf", "placeholder": "\u200b", "style": "IPY_MODEL_8249bc65e7c14b708596bd66de402e61", "value": "Validating: 100%"}}, "bd347db500c445b5914ab4c7ed5d0bd1": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "bd7102a0c9bc45d8a32134a863be9966": 
{"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_410b71b0a20941c089e536e4e128d13b", "placeholder": "\u200b", "style": "IPY_MODEL_f5699ec6e6c847ab807ce5bf3cb03664", "value": "Validating: 100%"}}, "bd88a232244c411dbb7fd992c1027448": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "bdca9160cad440f58fe24de81345b6fb": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", 
"_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_c4d7717ac5a0497785625a98c346a91c", "placeholder": "\u200b", "style": "IPY_MODEL_d54e1ea3816541bca39a1e59a9817019", "value": " 40/40 [00:01<00:00, 41.62it/s]"}}, "bdd9067ae2bd48aa9eff55c12ba2a8de": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_4a36ee3223aa4003bf6c9c68b41ebca9", "max": 40.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_6ebf16d170884218836f567c6624cf1c", "value": 40.0}}, "be6125a2050e4c97ad54c5e536c7afdf": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, 
"object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "beaa1e52816c41c0967f26b2e1c78546": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "beb2d424cca549e3994971502cc2bc15": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_099f27f210e24769853bc51f75969ed5", "max": 197.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_67e47d323fa6415896f68e98ed39242e", "value": 197.0}}, "bfab16490d4d401ca39e5fcbfad30dea": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, 
"grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "bfe210ee12f24249b6194fdbd5990052": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "c1609608c09b4580861adb27dd251f36": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_4a86d8dd5c4d43faa9b83359c8b579fa", "placeholder": "\u200b", "style": "IPY_MODEL_14ac48af733144429e4d011377b08b9c", "value": " 40/40 [00:01<00:00, 37.99it/s]"}}, "c1c99766fd58427bb5d1aa4bb932b494": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": 
null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "c1dd76b2378445f48f47c199006c16e9": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_83efcf75a4b14eb48238dfe52978f137", "placeholder": "\u200b", "style": "IPY_MODEL_363da95944f24deaa5693756bf690a76", "value": " 40/40 [00:01<00:00, 38.12it/s]"}}, "c213c26b0b8547b0bba620a692676198": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_1b1dac267473433fa46bd05bc37db269", "IPY_MODEL_6dcdd5a2689e4a859bacf94fa50b7b65", "IPY_MODEL_5107961954384c8aaaeba31c1b5bc4c8"], "layout": "IPY_MODEL_33f836df599e44f88641129b441a51fc"}}, "c27d2bf0ec8e4402a35653dd8da4b84d": {"model_module": 
"@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "c362daa772754d47b0063b6671836a81": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "c3b5ddb8b461432d9979ea0473d89c60": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "c3d08c9ab755494196759d9dccafc132": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "c3deaaeda2cb4bd3a122130339ba7bbb": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": 
"@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "c3e1b0656e78474886a5dd89b80d99cf": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, 
"c4382d4da66d4ef58c7336a37a81ff5f": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_2b19db000c0d4da2b4aa67aebc698ce3", "IPY_MODEL_781c2d73c32241af8536cea64f470739", "IPY_MODEL_9a0dc5ee46ef43ab9610085cd998f750"], "layout": "IPY_MODEL_e17fb5bf5733405e8c98c36e58ffcf7e"}}, "c4d7717ac5a0497785625a98c346a91c": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "c51670dd5d7e4d54be75ebd22696d49b": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", 
"_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_6d3d89cfaac34c87bb9d4abecf5ca39c", "placeholder": "\u200b", "style": "IPY_MODEL_7fca13154b964dcd891a26420f4ecc4e", "value": " 40/40 [00:01<00:00, 41.35it/s]"}}, "c57fece658f444f18bd89f142c343bb0": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_baeb194ab5ed4089b8cfea9c622c7485", "IPY_MODEL_8ee337c0a7fd40dd87d9999965079d66", "IPY_MODEL_5d3e25d0f248411da504f0a0df9c0e2d"], "layout": "IPY_MODEL_d2e4ed49cb994cfe85d5c254f252ef98"}}, "c590712538fa4ef7bd045c44f9aec516": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_1e664c703d4b4f20a8d8115990ec7248", "IPY_MODEL_7d42a6086e82421a9e595b43ad729c72", "IPY_MODEL_db277be0c1004f0599dd4d4275351024"], "layout": "IPY_MODEL_86dbf891d6594a20a46e44de2dde8500"}}, "c5a56a5d6926452cb6046dcad5b94e20": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": 
"@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_de5ca57613b141ecab054a6a3bcdd20a", "IPY_MODEL_667623f52df34426af41915a0c6857c7", "IPY_MODEL_7337db267f3d419ab12ca1ecde8bec6d"], "layout": "IPY_MODEL_6bafb7e9a54a4abdb2b72bb7fdef79a6"}}, "c5fad9a2cc4f42f887817c472070b776": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "c5fc4d52ddb84b7082395834d134e2c4": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "c62e8526bfe34ecda82253d53329b7da": {"model_module": "@jupyter-widgets/base", "model_module_version": 
"1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "c62ef3187ae842bdaee3c4292b792d6f": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, 
"object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "c658abd81ef747f3aacf84adeabaa613": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "c6c19d03f7334159909e66b6419d5085": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_a47d56c8623841ffba64e31bb3294bfa", "placeholder": "\u200b", "style": "IPY_MODEL_5b7e893c983d44c6914b42a32154b513", "value": "Validating: 100%"}}, "c72cde952f804bb3a70852ecef68bcaf": {"model_module": 
"@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "ca42033167d84b95828523a32f20fbc7": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_d898ceb905a74a9f9549aef4295429e2", "IPY_MODEL_f59bb6ed94cf497f9ddbf63eb196ab62", "IPY_MODEL_42a7109f566a424199400b71f736ec10"], "layout": "IPY_MODEL_4202db89a7a746bab07560c550105366"}}, "cac8b41d9a92451db93dccda6b5ccf2e": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, 
"_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "cacae5ca1e9d4283b9afe8e1916e8618": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, 
"width": "100%"}}, "cc0069da0700482b8bd07d5e61eccf14": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_ccd0f6fa912f42549bb9d30d02738ef5", "placeholder": "\u200b", "style": "IPY_MODEL_7eabd69400ff400daf651d434b6dc643", "value": " 40/40 [00:01<00:00, 40.90it/s]"}}, "cc47c9cd42a140a590dddb6dc560a4d6": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_1db1255602ad4b929cd199e01fd9fa71", "IPY_MODEL_e031999ce4f140bcb9f659d91587a079", "IPY_MODEL_5a00a23b5f2348198bec2c1e8110482b"], "layout": "IPY_MODEL_3a9384ba911144e998da472f66de9476"}}, "cc76969b57f54e5a99a1c2ca9a23d657": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "ccd0f6fa912f42549bb9d30d02738ef5": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, 
"_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "ccd261d7a5764d43bcacce36b0f5db99": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, 
"width": "100%"}}, "cce80a39b9d840f4a7dd7b3817da1de9": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "cd17e0a2a3524fc5a548b86c61953b77": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "ced07f39454f482a834aa01b5f977282": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, 
"align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "ced8e9bb515746e5930f529d1c4c3f2c": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_23c2dfc91e574966becac4457d0b19d0", "IPY_MODEL_3d48472bd8584bd999a934e99e4534a2", "IPY_MODEL_1e5347ebd820410e88806a71d0bb8681"], "layout": "IPY_MODEL_340172c2cd084bbbb189896ccf76779f"}}, "cfd16f7563604087a407b97d5e1af29f": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": 
null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "d04a087ecb834c029b6dbc65f40d903f": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "d061820e73bb4ae7b1fc4384aaa911ef": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": 
null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "d0efda7e12494752b39085bbffd4a6d1": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_8ef7076c24ac4e3da9bc42adb84288d7", "max": 40.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_3321bd2d04a74315b5b937f121591995", "value": 40.0}}, "d19b21b31c1b4251989052b2a9405736": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "d1a0e1f95d0b400ba9deedf188ccef73": {"model_module": "@jupyter-widgets/base", "model_module_version": 
"1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "d1c9ce3bf4fc44fbb4daa41d31c1ed72": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, 
"object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "d1e0d12030ef4e4a8b237e92e1889f0e": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "d22a5b5a07714a7b9584aad405faee89": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_52eae5f9929f4a0b962a3ff4447cea26", "placeholder": "\u200b", "style": "IPY_MODEL_2000b053e3ab49058a89a8910fee9653", "value": "Testing: 100%"}}, "d27e62cbd5554ebc9dd552a9264f037d": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, 
"grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "d2c31fdab421480389949e8f0af20cd0": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "d2c757a2385045d3ab0adcf707dddba1": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, 
"d2e4ed49cb994cfe85d5c254f252ef98": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "d2e50bfa91c0493d8c1e5e956f46b514": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, 
"margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "d2f8ed4e980348e5a4e806296f45ab09": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_bd7102a0c9bc45d8a32134a863be9966", "IPY_MODEL_2d41f0971937454bbc65139c6f595f63", "IPY_MODEL_6b3fd758e2414d97a24b249abf45b2d1"], "layout": "IPY_MODEL_bfab16490d4d401ca39e5fcbfad30dea"}}, "d369517f48604be39f83df2af26cdd15": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "d3f774b1b0404f198af51238375c574e": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, 
"grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "d407101ddcc74699a620bbd6a9628bff": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "d49067dafd874b49a1c3d0288b0edf88": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, 
"right": null, "top": null, "visibility": null, "width": null}}, "d498421af6c6458ea4fe33bf22796e86": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_b825fe85788a46119b9da2f3f0168a69", "IPY_MODEL_0adf97988f5d47ffb50136dfb49519e8", "IPY_MODEL_1c794c38f0124a2a8100f0179717f3fb"], "layout": "IPY_MODEL_d8a0309b11494a5cae5994c0c04a818f"}}, "d4c1bc09dddd49d28af187e6be4c1caf": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "d54e1ea3816541bca39a1e59a9817019": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "d57038b8b2184a5eaaaaf182893cc796": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", 
"bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_fd6f831c86034ff3ab7821932b3086db", "max": 40.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_9156902c48df4de4871d0325cf148752", "value": 40.0}}, "d581aedbcb7f48fb8c8dbeaa079ad651": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_1ff9401002354c4396c387857469b5e9", "IPY_MODEL_3fabbc3365a24ae98e4ddcd52b206868", "IPY_MODEL_f2bfe826a71142faaf708abf3fcbfce6"], "layout": "IPY_MODEL_d1a0e1f95d0b400ba9deedf188ccef73"}}, "d593afd8891e4b05ba9a03051d458764": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_e6cbac4b8c974514a58a947448fc412d", "placeholder": "\u200b", "style": "IPY_MODEL_04c97639949842bfb3979dd8712abe8b", "value": "Validating: 100%"}}, "d728bc80d8df41ea88685e94f199eff8": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "d73b688acdba44a2ad89c92ce6153a0c": {"model_module": 
"@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "d7b5e58eb4d3438d8a5b648692171036": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_d27e62cbd5554ebc9dd552a9264f037d", "placeholder": "\u200b", "style": "IPY_MODEL_21bab32483d844888f86f71067e0f69e", "value": " 40/40 [00:01<00:00, 37.88it/s]"}}, "d7f60bf8643a49eca3a16d56091b4154": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, 
"_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "d7f9bf3cbe3f4160a09f5376dae9e096": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "d898ceb905a74a9f9549aef4295429e2": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_7512d436c11543f7ae1e7b77269779bc", "placeholder": "\u200b", "style": "IPY_MODEL_0fb7a9bdc2ee4a88a7d79afdb165e0fa", "value": "Validating: 100%"}}, "d8a0309b11494a5cae5994c0c04a818f": {"model_module": 
"@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "d8ff45a13d3c4930b4eac298d783b7cf": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "d9bb8edb324b4f09977eac68ceb45e63": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, 
"da4e670e9d594e7394b38d518354f613": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "dae97dcd99ab412794e592f9eef4fcdd": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "db277be0c1004f0599dd4d4275351024": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", 
"description": "", "description_tooltip": null, "layout": "IPY_MODEL_f57d9339abc84a62a49d3bacd275d7c9", "placeholder": "\u200b", "style": "IPY_MODEL_16ec8ca835ce4edbbf71ee881cd05bbf", "value": " 40/40 [00:01<00:00, 41.19it/s]"}}, "dceda10c727d4cce9a9976d60896b888": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "dd99a71bd47844b69476dbc31a63e3c5": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, 
"grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "ddde61829a984873a4bbf6613184e2ee": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_fb537059a7b449fa8effe868845859bb", "placeholder": "\u200b", "style": "IPY_MODEL_365291d5f1a94dc5a9d8da5f0d414f3e", "value": "Validating: 100%"}}, "de344810abe548119b3f8ddf3a1cc97a": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "de5ca57613b141ecab054a6a3bcdd20a": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", 
"description_tooltip": null, "layout": "IPY_MODEL_e1e5b90601d94304b7ef56ced388330a", "placeholder": "\u200b", "style": "IPY_MODEL_faeb509fbf3f4e5f93992b33634adab1", "value": "Validating: 100%"}}, "de693622da2f4bb7b735600f02a60478": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "df39f2726d03413ea1f46df9f7f4e16e": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_ced07f39454f482a834aa01b5f977282", "placeholder": "\u200b", "style": "IPY_MODEL_648c1d314aff4a5989917ea9cfb40ee4", "value": " 40/40 [00:01<00:00, 38.21it/s]"}}, 
"df4ebdf10987433cb65c78dbf7e34b99": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_23ddf0adf4f64bdea807fc3c6d586e40", "max": 40.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_76c56c21d24541e49d001359174d8a06", "value": 40.0}}, "dff17ba1b5ae45e3851d3ab860b9f529": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_6f6727a7c5ce49a68d254766bd2c56f3", "placeholder": "\u200b", "style": "IPY_MODEL_1ba5e824ccca492191ed59018571aa0d", "value": "Validating: 100%"}}, "e0207d263a5f435289f3c4fd79f2f0c3": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_ab1556a4dab6495da3a22de9eb920871", "max": 40.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_a56807f9e014434fb9f5ec740db1cdf4", "value": 40.0}}, 
"e031999ce4f140bcb9f659d91587a079": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_85b4d00008d84934acb2a3a0300977da", "max": 40.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_014b058f5dad4a9b90029ee5c0d1941a", "value": 40.0}}, "e0938103b55e4109bba1bd6a4c9c4a39": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "e0fbc495e5d04f798a6cbfc91af1d0ed": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_7681fbb8aa304c03a9732a9c95f63ef9", "max": 40.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_608e803ac821482db32298d68e280acd", "value": 40.0}}, "e14d135655704cee9e05ebdae198a92d": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", 
"_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_023b923393b045618df10b498f0cbc13", "placeholder": "\u200b", "style": "IPY_MODEL_1593171a93284546a79ca15574055476", "value": " 40/40 [00:01<00:00, 41.08it/s]"}}, "e17fb5bf5733405e8c98c36e58ffcf7e": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "e1e5b90601d94304b7ef56ced388330a": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, 
"align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "e248b9247393444b95f4e426e49403e1": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "e24b7c22fbee405c8d202b376aafa909": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_953da11bc35d4b51ab1dea85dad0a8bb", "IPY_MODEL_f7ca4e232d884ae6bd404288c78de3fe", "IPY_MODEL_638225841dcb42bdbc24ab03315c976a"], "layout": "IPY_MODEL_40ff73c7b3dc4556be5ecc1d35a6613f"}}, "e2538d2d42254355a24cb5bffdd4f083": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", 
"_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_86557445ad984f038bc35ea22977b002", "IPY_MODEL_7e8eee7d4e4b4d208dc8aaee31968781", "IPY_MODEL_88359b1570cf4d278afcc12b52ca5cf3"], "layout": "IPY_MODEL_00734065a4b748bf86e1fbb33f7a0561"}}, "e28368a911464b9db767854a5f048ca3": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_e367433e553a477ca6a56d8a25c5f16a", "placeholder": "\u200b", "style": "IPY_MODEL_d369517f48604be39f83df2af26cdd15", "value": " 40/40 [00:01<00:00, 38.04it/s]"}}, "e367433e553a477ca6a56d8a25c5f16a": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": 
null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "e3779b041324461eb68a37851e899963": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "e3bdf937acbc4aec97813939d969d48c": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "e3d7871fd58d46e28fefff6d6f2d55ef": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": 
null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "e3f10177a72948828fa102c2424cdbb1": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_e3d7871fd58d46e28fefff6d6f2d55ef", "placeholder": "\u200b", "style": "IPY_MODEL_71223c1c01744836a04d36ae0daeda23", "value": " 40/40 [00:01<00:00, 37.17it/s]"}}, "e442a229b0e14efbbe6bbe05d188c8d7": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "e46414f0bbc2470a9a75e3c9a77582d4": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "e4c405cc7a194ecb9d121ff54b15d90e": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": 
null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "e4cb7f9a7537486cbddfb13c57ae7c09": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_39772d3d7ef847248356d5afe732000c", "max": 40.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_92978f1abdd34477bb7ec0325a838cc7", "value": 40.0}}, "e55684dd18f240efb5795f3d5ffdb25a": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "e5b1df60b8d64f8bbca251ea1aa45fc9": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "e62c3cbcb0564497b0215b03c619f0a2": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", 
"_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_b5b4aa182c534419be2c9f72ca2f62d6", "max": 40.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_a10691f4cc5f4264821e505be23d5c0d", "value": 40.0}}, "e6cbac4b8c974514a58a947448fc412d": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "e773d5290c3c481e80ec46e4337703ac": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": 
"IPY_MODEL_3de93c5568264b628ce08d92a9e2bdde", "placeholder": "\u200b", "style": "IPY_MODEL_d4c1bc09dddd49d28af187e6be4c1caf", "value": "Epoch 29: 100%"}}, "e7942984bfe2435b8d1a6ca6dbdbc27e": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "e7a99e4d130f498abb222496b5671ef4": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_26181fafa82f430dab9d294152e60ecf", "placeholder": "\u200b", "style": "IPY_MODEL_b742a674c72f440aa5399890549262c4", "value": " 40/40 [00:01<00:00, 41.28it/s]"}}, "e87d5f0d76364422b001e9ba2009efd6": {"model_module": 
"@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_9c0e4986ee594a8abd5a65453b5d896a", "placeholder": "\u200b", "style": "IPY_MODEL_8c9494e571964db491151ef9b8b845e2", "value": "Validating: 100%"}}, "e9d179241fa845b98f5d31c870a271d8": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "e9eff4cf4c714f2680f7e77dbb5a372c": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, 
"_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "ea96711d4212428ba4dcc07e4ecba6bc": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_125f9fd7e9d0489c86a06c1f7175f1a8", "IPY_MODEL_62defc9448f14799a799664a6e93e99d", "IPY_MODEL_7eed8b7bd0bd41738ad7f3cef6dabfbc"], "layout": "IPY_MODEL_38e6f6251cc247f2a70007beb7f40c80"}}, "ebd6e86e6d364bfda696270bcd1285bc": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, 
"flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "ec1a8cd04f67429fa8fa11d2dabea42a": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_3fcf6bf3438a429ea8d182a0f143763e", "placeholder": "\u200b", "style": "IPY_MODEL_60cce88461724ab582baf5e4e7653386", "value": "Validating: 100%"}}, "ec2f85ae2a11482b9d8967c431217991": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "eca7de566a424f17ae0b4b0d2f99f855": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": 
"@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "ecb828657a224596ac79b7ca2953edc0": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "eceec782c1ce454dbfcadced855e791e": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_aa81d9f10a1343688ab35aed5fa9a733", "placeholder": "\u200b", "style": "IPY_MODEL_b77a76f27de54c2183bea1ad9864dc95", "value": "Validating: 100%"}}, "edd32f0ef84348a4b07891fb8ed6f0ab": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, 
"justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "ee0b4a9189cd4eb1ad630d7d45f10283": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "ef2f42b7a9cd4ad59cf933bf03cdcbc4": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_f62d0978442b4f01b2c26d23d2451d4d", "IPY_MODEL_3897c2a7c1e1445fbc604c1a741c98e1", 
"IPY_MODEL_a94008efe3024367adc524556ecb73e9"], "layout": "IPY_MODEL_05a2d51877d9418b8417e35cea00aed8"}}, "ef90020e0959424193c5298f4ab9a190": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "efb67b6f296c44fdb4309f206eb09f4a": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_dff17ba1b5ae45e3851d3ab860b9f529", "IPY_MODEL_727948d722bc4f8a8a8a73e8c3db95b2", "IPY_MODEL_e28368a911464b9db767854a5f048ca3"], "layout": "IPY_MODEL_76f4c9460c2544fabd27af4240792134"}}, "f0607cd375bf48418a683bc48438d6a0": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": 
"LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "f078f962d66c497b8e95231564665108": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_0efe49958483403d970448b78c035fce", "IPY_MODEL_258cee43a0be4850ac25f425c4b1cc3f", "IPY_MODEL_810fdf5d48554b6198f4f470baffc034"], "layout": "IPY_MODEL_d7f60bf8643a49eca3a16d56091b4154"}}, "f187affa322744d7822bac58e3d366ee": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": 
"@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_35ac61ebf2d94417a183c5e85963e76f", "placeholder": "\u200b", "style": "IPY_MODEL_f96af388a83c42afb6866a6f2b22b295", "value": " 40/40 [00:01<00:00, 39.67it/s]"}}, "f2bfe826a71142faaf708abf3fcbfce6": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_471d838b49da478fa34ccc96b6ec926a", "placeholder": "\u200b", "style": "IPY_MODEL_ecb828657a224596ac79b7ca2953edc0", "value": " 197/197 [00:13<00:00, 14.21it/s, loss=0.0285, v_num=0, val_loss=4.160, val_acc=0.104]"}}, "f352e4d278dc4cda94f82a3846236f56": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": 
null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "f4fb223218124ea6a02efef412bac44a": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "f5438eeef53847ba95d157f56e438488": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "f5699ec6e6c847ab807ce5bf3cb03664": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": 
"DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "f57d9339abc84a62a49d3bacd275d7c9": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "f59bb6ed94cf497f9ddbf63eb196ab62": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_a0e32c7a94a744f8af40b68c9d2f8113", "max": 40.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_0447aa40a49344e79e2e683d6819d5ec", "value": 40.0}}, 
"f5b91ccd114d43dd83abfe60d5666295": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "f62d0978442b4f01b2c26d23d2451d4d": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_01a67df105214806b42a4974f14e5792", "placeholder": "\u200b", "style": "IPY_MODEL_e46414f0bbc2470a9a75e3c9a77582d4", "value": "Validating: 100%"}}, "f669afd47abf4c0a9b3b79df62009f7e": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": 
"LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "f6f68d546ecb45ffb73be50d80994d1f": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "f71b6be05b7d43f4b438780bf1f6fab1": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_ddde61829a984873a4bbf6613184e2ee", "IPY_MODEL_d57038b8b2184a5eaaaaf182893cc796", "IPY_MODEL_8a81ec850d2a4f89bfc568ec39f84e1d"], "layout": "IPY_MODEL_ae8bb373e5d7456d9627b43c3d1fa8ed"}}, 
"f792ef8d3d3642e68f7b5f226a1dcd5e": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "f7ca4e232d884ae6bd404288c78de3fe": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_abeba1de74a4420d9a46da3ee64dab2d", "max": 40.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_895f50a960ef4de58e09ffaab83498a7", "value": 40.0}}, "f90f1336e56a4cacb8b5f8666b6c9b16": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": 
"@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "f96af388a83c42afb6866a6f2b22b295": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "f9abae85aee34c04a321d4e3410e2352": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "fab8109d1b334fe781851edfb02cfb44": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], 
"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_6c19c1928aad4db281729dceb27947b2", "placeholder": "\u200b", "style": "IPY_MODEL_fe5d668723a244498cb33494e5bee2f2", "value": " 40/40 [00:01<00:00, 30.04it/s]"}}, "faeb509fbf3f4e5f93992b33634adab1": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "fb537059a7b449fa8effe868845859bb": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, 
"visibility": null, "width": null}}, "fb6196786a4c449da5bfc3b74974f5b7": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "fb9d723beb3d4e36aaab60a344476126": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "fba15de3823947c997157fd19ee23ba4": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": 
"StyleView", "bar_color": null, "description_width": ""}}, "fd6f831c86034ff3ab7821932b3086db": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "fe5d668723a244498cb33494e5bee2f2": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "fe7af92e4442430d96daba437d4a374a": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", 
"_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_b9415f0976ae48e1a5371a5e9f8d84bd", "max": 40.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_d9bb8edb324b4f09977eac68ceb45e63", "value": 40.0}}, "ff4bf4ad13c04a8791e8283c83765a05": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_71e268e4a03840a480f268ce072f5be8", "IPY_MODEL_07c8f9ed1f6d48bbb2ccf3bc58ee548b", "IPY_MODEL_d7b5e58eb4d3438d8a5b648692171036"], "layout": "IPY_MODEL_2ffa108ad10645a1b18413bd56b7d32a"}}, "ffb2fbfef1064080b54b648785376dc5": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, 
"padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "ffde3dbed47844968f5b0057538b78ae": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}}, "version_major": 2, "version_minor": 0}}}, "nbformat": 4, "nbformat_minor": 5} \ No newline at end of file diff --git a/source/notebooks/lightning_examples/datamodules.ipynb b/source/notebooks/lightning_examples/datamodules.ipynb deleted file mode 100644 index 6c3f0ff..0000000 --- a/source/notebooks/lightning_examples/datamodules.ipynb +++ /dev/null @@ -1 +0,0 @@ -{"cells": [{"cell_type": "markdown", "id": "61739b4a", "metadata": {"papermill": {"duration": 0.035332, "end_time": "2021-12-04T16:45:52.526798", "exception": false, "start_time": "2021-12-04T16:45:52.491466", "status": "completed"}, "tags": []}, "source": ["\n", "# PyTorch Lightning DataModules\n", "\n", "* **Author:** PL team\n", "* **License:** CC BY-SA\n", "* **Generated:** 2021-12-04T16:53:01.674205\n", "\n", "This notebook will walk you through how to start using Datamodules. With the release of `pytorch-lightning` version 0.9.0, we have included a new class called `LightningDataModule` to help you decouple data related hooks from your `LightningModule`. 
The most up to date documentation on datamodules can be found [here](https://pytorch-lightning.readthedocs.io/en/latest/extensions/datamodules.html).\n", "\n", "---\n", "Open in [![Open In Colab](){height=\"20px\" width=\"117px\"}](https://colab.research.google.com/github/PytorchLightning/lightning-tutorials/blob/publication/.notebooks/lightning_examples/datamodules.ipynb)\n", "\n", "Give us a \u2b50 [on Github](https://www.github.com/PytorchLightning/pytorch-lightning/)\n", "| Check out [the documentation](https://pytorch-lightning.readthedocs.io/en/latest/)\n", "| Join us [on Slack](https://join.slack.com/t/pytorch-lightning/shared_invite/zt-pw5v393p-qRaDgEk24~EjiZNBpSQFgQ)"]}, {"cell_type": "markdown", "id": "a3ad2cac", "metadata": {"papermill": {"duration": 0.031562, "end_time": "2021-12-04T16:45:52.591478", "exception": false, "start_time": "2021-12-04T16:45:52.559916", "status": "completed"}, "tags": []}, "source": ["## Setup\n", "This notebook requires some packages besides pytorch-lightning."]}, {"cell_type": "code", "execution_count": 1, "id": "97feb35c", "metadata": {"colab": {}, "colab_type": "code", "execution": {"iopub.execute_input": "2021-12-04T16:45:52.663442Z", "iopub.status.busy": "2021-12-04T16:45:52.662968Z", "iopub.status.idle": "2021-12-04T16:45:55.544955Z", "shell.execute_reply": "2021-12-04T16:45:55.545348Z"}, "id": "LfrJLKPFyhsK", "lines_to_next_cell": 0, "papermill": {"duration": 2.922242, "end_time": "2021-12-04T16:45:55.545634", "exception": false, "start_time": "2021-12-04T16:45:52.623392", "status": "completed"}, "tags": []}, "outputs": [], "source": ["! 
pip install --quiet \"torchvision\" \"pytorch-lightning>=1.3\" \"torchmetrics>=0.3\" \"torch>=1.6, <1.9\""]}, {"cell_type": "markdown", "id": "384d6a1b", "metadata": {"papermill": {"duration": 0.03178, "end_time": "2021-12-04T16:45:55.610463", "exception": false, "start_time": "2021-12-04T16:45:55.578683", "status": "completed"}, "tags": []}, "source": ["## Introduction\n", "\n", "First, we'll go over a regular `LightningModule` implementation without the use of a `LightningDataModule`"]}, {"cell_type": "code", "execution_count": 2, "id": "a39b56eb", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:45:55.682565Z", "iopub.status.busy": "2021-12-04T16:45:55.680296Z", "iopub.status.idle": "2021-12-04T16:45:59.522992Z", "shell.execute_reply": "2021-12-04T16:45:59.523374Z"}, "papermill": {"duration": 3.881462, "end_time": "2021-12-04T16:45:59.523593", "exception": false, "start_time": "2021-12-04T16:45:55.642131", "status": "completed"}, "tags": []}, "outputs": [], "source": ["import os\n", "\n", "import torch\n", "import torch.nn.functional as F\n", "from pytorch_lightning import LightningDataModule, LightningModule, Trainer\n", "from torch import nn\n", "from torch.utils.data import DataLoader, random_split\n", "from torchmetrics.functional import accuracy\n", "from torchvision import transforms\n", "\n", "# Note - you must have torchvision installed for this example\n", "from torchvision.datasets import CIFAR10, MNIST\n", "\n", "PATH_DATASETS = os.environ.get(\"PATH_DATASETS\", \".\")\n", "AVAIL_GPUS = min(1, torch.cuda.device_count())\n", "BATCH_SIZE = 256 if AVAIL_GPUS else 64"]}, {"cell_type": "markdown", "id": "0f3c51dc", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.031785, "end_time": "2021-12-04T16:45:59.588240", "exception": false, "start_time": "2021-12-04T16:45:59.556455", "status": "completed"}, "tags": []}, "source": ["### Defining the LitMNISTModel\n", "\n", "Below, we reuse a `LightningModule` from our hello world 
tutorial that classifies MNIST Handwritten Digits.\n", "\n", "Unfortunately, we have hardcoded dataset-specific items within the model,\n", "forever limiting it to working with MNIST Data. \ud83d\ude22\n", "\n", "This is fine if you don't plan on training/evaluating your model on different datasets.\n", "However, in many cases, this can become bothersome when you want to try out your architecture with different datasets."]}, {"cell_type": "code", "execution_count": 3, "id": "82a2f0d0", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:45:59.665520Z", "iopub.status.busy": "2021-12-04T16:45:59.665038Z", "iopub.status.idle": "2021-12-04T16:45:59.667349Z", "shell.execute_reply": "2021-12-04T16:45:59.666889Z"}, "papermill": {"duration": 0.04678, "end_time": "2021-12-04T16:45:59.667449", "exception": false, "start_time": "2021-12-04T16:45:59.620669", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class LitMNIST(LightningModule):\n", " def __init__(self, data_dir=PATH_DATASETS, hidden_size=64, learning_rate=2e-4):\n", "\n", " super().__init__()\n", "\n", " # We hardcode dataset specific stuff here.\n", " self.data_dir = data_dir\n", " self.num_classes = 10\n", " self.dims = (1, 28, 28)\n", " channels, width, height = self.dims\n", " self.transform = transforms.Compose(\n", " [\n", " transforms.ToTensor(),\n", " transforms.Normalize((0.1307,), (0.3081,)),\n", " ]\n", " )\n", "\n", " self.hidden_size = hidden_size\n", " self.learning_rate = learning_rate\n", "\n", " # Build model\n", " self.model = nn.Sequential(\n", " nn.Flatten(),\n", " nn.Linear(channels * width * height, hidden_size),\n", " nn.ReLU(),\n", " nn.Dropout(0.1),\n", " nn.Linear(hidden_size, hidden_size),\n", " nn.ReLU(),\n", " nn.Dropout(0.1),\n", " nn.Linear(hidden_size, self.num_classes),\n", " )\n", "\n", " def forward(self, x):\n", " x = self.model(x)\n", " return F.log_softmax(x, dim=1)\n", "\n", " def training_step(self, batch, batch_idx):\n", " x, y = batch\n", " logits 
= self(x)\n", " loss = F.nll_loss(logits, y)\n", " return loss\n", "\n", " def validation_step(self, batch, batch_idx):\n", " x, y = batch\n", " logits = self(x)\n", " loss = F.nll_loss(logits, y)\n", " preds = torch.argmax(logits, dim=1)\n", " acc = accuracy(preds, y)\n", " self.log(\"val_loss\", loss, prog_bar=True)\n", " self.log(\"val_acc\", acc, prog_bar=True)\n", " return loss\n", "\n", " def configure_optimizers(self):\n", " optimizer = torch.optim.Adam(self.parameters(), lr=self.learning_rate)\n", " return optimizer\n", "\n", " ####################\n", " # DATA RELATED HOOKS\n", " ####################\n", "\n", " def prepare_data(self):\n", " # download\n", " MNIST(self.data_dir, train=True, download=True)\n", " MNIST(self.data_dir, train=False, download=True)\n", "\n", " def setup(self, stage=None):\n", "\n", " # Assign train/val datasets for use in dataloaders\n", " if stage == \"fit\" or stage is None:\n", " mnist_full = MNIST(self.data_dir, train=True, transform=self.transform)\n", " self.mnist_train, self.mnist_val = random_split(mnist_full, [55000, 5000])\n", "\n", " # Assign test dataset for use in dataloader(s)\n", " if stage == \"test\" or stage is None:\n", " self.mnist_test = MNIST(self.data_dir, train=False, transform=self.transform)\n", "\n", " def train_dataloader(self):\n", " return DataLoader(self.mnist_train, batch_size=128)\n", "\n", " def val_dataloader(self):\n", " return DataLoader(self.mnist_val, batch_size=128)\n", "\n", " def test_dataloader(self):\n", " return DataLoader(self.mnist_test, batch_size=128)"]}, {"cell_type": "markdown", "id": "fde0b3ad", "metadata": {"papermill": {"duration": 0.03277, "end_time": "2021-12-04T16:45:59.734857", "exception": false, "start_time": "2021-12-04T16:45:59.702087", "status": "completed"}, "tags": []}, "source": ["### Training the LitMNIST Model"]}, {"cell_type": "code", "execution_count": 4, "id": "75ebf631", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:45:59.804804Z", 
"iopub.status.busy": "2021-12-04T16:45:59.804311Z", "iopub.status.idle": "2021-12-04T16:46:25.412130Z", "shell.execute_reply": "2021-12-04T16:46:25.411686Z"}, "papermill": {"duration": 25.644008, "end_time": "2021-12-04T16:46:25.412258", "exception": false, "start_time": "2021-12-04T16:45:59.768250", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/pytorch_lightning/trainer/connectors/callback_connector.py:90: LightningDeprecationWarning: Setting `Trainer(progress_bar_refresh_rate=20)` is deprecated in v1.5 and will be removed in v1.7. Please pass `pytorch_lightning.callbacks.progress.TQDMProgressBar` with `refresh_rate` directly to the Trainer's `callbacks` argument instead. Or, to disable the progress bar pass `enable_progress_bar = False` to the Trainer.\n", " rank_zero_deprecation(\n", "GPU available: True, used: True\n"]}, {"name": "stderr", "output_type": "stream", "text": ["TPU available: False, using: 0 TPU cores\n"]}, {"name": "stderr", "output_type": "stream", "text": ["IPU available: False, using: 0 IPUs\n"]}, {"name": "stderr", "output_type": "stream", "text": ["LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n"]}, {"name": "stderr", "output_type": "stream", "text": ["\n", " | Name | Type | Params\n", "-------------------------------------\n", "0 | model | Sequential | 55.1 K\n", "-------------------------------------\n", "55.1 K Trainable params\n", "0 Non-trainable params\n", "55.1 K Total params\n", "0.220 Total estimated model params size (MB)\n"]}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "768f5e115e3f4d86b97c71b44f458240", "version_major": 2, "version_minor": 0}, "text/plain": ["Validation sanity check: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"name": "stderr", "output_type": "stream", "text": 
["/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/pytorch_lightning/trainer/data_loading.py:111: UserWarning: The dataloader, val_dataloader 0, does not have many workers which may be a bottleneck. Consider increasing the value of the `num_workers` argument` (try 12 which is the number of cpus on this machine) in the `DataLoader` init to improve performance.\n", " rank_zero_warn(\n", "/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/pytorch_lightning/trainer/data_loading.py:111: UserWarning: The dataloader, train_dataloader, does not have many workers which may be a bottleneck. Consider increasing the value of the `num_workers` argument` (try 12 which is the number of cpus on this machine) in the `DataLoader` init to improve performance.\n", " rank_zero_warn(\n"]}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "eb61fdca27424a06a232c826ca5d695f", "version_major": 2, "version_minor": 0}, "text/plain": ["Training: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "2488acd527e24363aa31b980006ae745", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "7f7924338266405fadf862414d1f02a1", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}], "source": ["model = LitMNIST()\n", "trainer = Trainer(\n", " max_epochs=2,\n", " gpus=AVAIL_GPUS,\n", " progress_bar_refresh_rate=20,\n", ")\n", "trainer.fit(model)"]}, {"cell_type": "markdown", "id": "81192dcb", "metadata": {"papermill": {"duration": 0.040842, "end_time": "2021-12-04T16:46:25.498462", "exception": false, "start_time": "2021-12-04T16:46:25.457620", "status": "completed"}, "tags": []}, "source": ["## Using DataModules\n", "\n", "DataModules are a 
way of decoupling data-related hooks from the `LightningModule`\n", "so you can develop dataset agnostic models."]}, {"cell_type": "markdown", "id": "d7703409", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.04198, "end_time": "2021-12-04T16:46:25.580985", "exception": false, "start_time": "2021-12-04T16:46:25.539005", "status": "completed"}, "tags": []}, "source": ["### Defining The MNISTDataModule\n", "\n", "Let's go over each function in the class below and talk about what they're doing:\n", "\n", "1. ```__init__```\n", " - Takes in a `data_dir` arg that points to where you have downloaded/wish to download the MNIST dataset.\n", " - Defines a transform that will be applied across train, val, and test dataset splits.\n", " - Defines default `self.dims`, which is a tuple returned from `datamodule.size()` that can help you initialize models.\n", "\n", "\n", "2. ```prepare_data```\n", " - This is where we can download the dataset. We point to our desired dataset and ask torchvision's `MNIST` dataset class to download if the dataset isn't found there.\n", " - **Note we do not make any state assignments in this function** (i.e. `self.something = ...`)\n", "\n", "3. ```setup```\n", " - Loads in data from file and prepares PyTorch tensor datasets for each split (train, val, test).\n", " - Setup expects a 'stage' arg which is used to separate logic for 'fit' and 'test'.\n", " - If you don't mind loading all your datasets at once, you can set up a condition to allow for both 'fit' related setup and 'test' related setup to run whenever `None` is passed to `stage`.\n", " - **Note this runs across all GPUs and it *is* safe to make state assignments here**\n", "\n", "\n", "4. 
```x_dataloader```\n", " - `train_dataloader()`, `val_dataloader()`, and `test_dataloader()` all return PyTorch `DataLoader` instances that are created by wrapping their respective datasets that we prepared in `setup()`"]}, {"cell_type": "code", "execution_count": 5, "id": "3d9cf13e", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:46:25.670687Z", "iopub.status.busy": "2021-12-04T16:46:25.670187Z", "iopub.status.idle": "2021-12-04T16:46:25.672182Z", "shell.execute_reply": "2021-12-04T16:46:25.671779Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 0.050689, "end_time": "2021-12-04T16:46:25.672288", "exception": false, "start_time": "2021-12-04T16:46:25.621599", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class MNISTDataModule(LightningDataModule):\n", " def __init__(self, data_dir: str = PATH_DATASETS):\n", " super().__init__()\n", " self.data_dir = data_dir\n", " self.transform = transforms.Compose(\n", " [\n", " transforms.ToTensor(),\n", " transforms.Normalize((0.1307,), (0.3081,)),\n", " ]\n", " )\n", "\n", " # self.dims is returned when you call dm.size()\n", " # Setting default dims here because we know them.\n", " # Could optionally be assigned dynamically in dm.setup()\n", " self.dims = (1, 28, 28)\n", " self.num_classes = 10\n", "\n", " def prepare_data(self):\n", " # download\n", " MNIST(self.data_dir, train=True, download=True)\n", " MNIST(self.data_dir, train=False, download=True)\n", "\n", " def setup(self, stage=None):\n", "\n", " # Assign train/val datasets for use in dataloaders\n", " if stage == \"fit\" or stage is None:\n", " mnist_full = MNIST(self.data_dir, train=True, transform=self.transform)\n", " self.mnist_train, self.mnist_val = random_split(mnist_full, [55000, 5000])\n", "\n", " # Assign test dataset for use in dataloader(s)\n", " if stage == \"test\" or stage is None:\n", " self.mnist_test = MNIST(self.data_dir, train=False, transform=self.transform)\n", "\n", " def train_dataloader(self):\n", " 
return DataLoader(self.mnist_train, batch_size=BATCH_SIZE)\n", "\n", " def val_dataloader(self):\n", " return DataLoader(self.mnist_val, batch_size=BATCH_SIZE)\n", "\n", " def test_dataloader(self):\n", " return DataLoader(self.mnist_test, batch_size=BATCH_SIZE)"]}, {"cell_type": "markdown", "id": "c916523e", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.044584, "end_time": "2021-12-04T16:46:25.757859", "exception": false, "start_time": "2021-12-04T16:46:25.713275", "status": "completed"}, "tags": []}, "source": ["### Defining the dataset agnostic `LitModel`\n", "\n", "Below, we define the same model as the `LitMNIST` model we made earlier.\n", "\n", "However, this time our model has the freedom to use any input data that we'd like \ud83d\udd25."]}, {"cell_type": "code", "execution_count": 6, "id": "2d745995", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:46:25.848843Z", "iopub.status.busy": "2021-12-04T16:46:25.848373Z", "iopub.status.idle": "2021-12-04T16:46:25.850404Z", "shell.execute_reply": "2021-12-04T16:46:25.849943Z"}, "papermill": {"duration": 0.051727, "end_time": "2021-12-04T16:46:25.850508", "exception": false, "start_time": "2021-12-04T16:46:25.798781", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class LitModel(LightningModule):\n", " def __init__(self, channels, width, height, num_classes, hidden_size=64, learning_rate=2e-4):\n", "\n", " super().__init__()\n", "\n", " # We take in input dimensions as parameters and use those to dynamically build model.\n", " self.channels = channels\n", " self.width = width\n", " self.height = height\n", " self.num_classes = num_classes\n", " self.hidden_size = hidden_size\n", " self.learning_rate = learning_rate\n", "\n", " self.model = nn.Sequential(\n", " nn.Flatten(),\n", " nn.Linear(channels * width * height, hidden_size),\n", " nn.ReLU(),\n", " nn.Dropout(0.1),\n", " nn.Linear(hidden_size, hidden_size),\n", " nn.ReLU(),\n", " nn.Dropout(0.1),\n", " 
nn.Linear(hidden_size, num_classes),\n", " )\n", "\n", " def forward(self, x):\n", " x = self.model(x)\n", " return F.log_softmax(x, dim=1)\n", "\n", " def training_step(self, batch, batch_idx):\n", " x, y = batch\n", " logits = self(x)\n", " loss = F.nll_loss(logits, y)\n", " return loss\n", "\n", " def validation_step(self, batch, batch_idx):\n", "\n", " x, y = batch\n", " logits = self(x)\n", " loss = F.nll_loss(logits, y)\n", " preds = torch.argmax(logits, dim=1)\n", " acc = accuracy(preds, y)\n", " self.log(\"val_loss\", loss, prog_bar=True)\n", " self.log(\"val_acc\", acc, prog_bar=True)\n", " return loss\n", "\n", " def configure_optimizers(self):\n", " optimizer = torch.optim.Adam(self.parameters(), lr=self.learning_rate)\n", " return optimizer"]}, {"cell_type": "markdown", "id": "a835525d", "metadata": {"papermill": {"duration": 0.04143, "end_time": "2021-12-04T16:46:25.933881", "exception": false, "start_time": "2021-12-04T16:46:25.892451", "status": "completed"}, "tags": []}, "source": ["### Training the `LitModel` using the `MNISTDataModule`\n", "\n", "Now, we initialize and train the `LitModel` using the `MNISTDataModule`'s configuration settings and dataloaders."]}, {"cell_type": "code", "execution_count": 7, "id": "08a4316a", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:46:26.019913Z", "iopub.status.busy": "2021-12-04T16:46:26.019449Z", "iopub.status.idle": "2021-12-04T16:46:56.702166Z", "shell.execute_reply": "2021-12-04T16:46:56.698729Z"}, "papermill": {"duration": 30.727168, "end_time": "2021-12-04T16:46:56.702286", "exception": false, "start_time": "2021-12-04T16:46:25.975118", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/pytorch_lightning/core/datamodule.py:175: LightningDeprecationWarning: DataModule property `dims` was deprecated in v1.5 and will be removed in v1.7.\n", " 
rank_zero_deprecation(\"DataModule property `dims` was deprecated in v1.5 and will be removed in v1.7.\")\n", "/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/pytorch_lightning/core/datamodule.py:184: LightningDeprecationWarning: DataModule property `size` was deprecated in v1.5 and will be removed in v1.7.\n", " rank_zero_deprecation(\"DataModule property `size` was deprecated in v1.5 and will be removed in v1.7.\")\n", "/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/pytorch_lightning/core/datamodule.py:170: LightningDeprecationWarning: DataModule property `dims` was deprecated in v1.5 and will be removed in v1.7.\n", " rank_zero_deprecation(\"DataModule property `dims` was deprecated in v1.5 and will be removed in v1.7.\")\n", "GPU available: True, used: True\n"]}, {"name": "stderr", "output_type": "stream", "text": ["TPU available: False, using: 0 TPU cores\n"]}, {"name": "stderr", "output_type": "stream", "text": ["IPU available: False, using: 0 IPUs\n"]}, {"name": "stderr", "output_type": "stream", "text": ["LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n"]}, {"name": "stderr", "output_type": "stream", "text": ["\n", " | Name | Type | Params\n", "-------------------------------------\n", "0 | model | Sequential | 55.1 K\n", "-------------------------------------\n", "55.1 K Trainable params\n", "0 Non-trainable params\n", "55.1 K Total params\n", "0.220 Total estimated model params size (MB)\n"]}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "1a75cc9880ab40a8ba9ce7b57f0a0765", "version_major": 2, "version_minor": 0}, "text/plain": ["Validation sanity check: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "adae3a9829a54b508f38288825a67235", "version_major": 2, "version_minor": 0}, "text/plain": ["Training: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": 
{"application/vnd.jupyter.widget-view+json": {"model_id": "bf86e207916b4e409d89947baee6b2a3", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "8e77575340994f2fbd6538d157de467e", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "8e95fecb92834da89d6246cbd02d3f06", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}], "source": ["# Init DataModule\n", "dm = MNISTDataModule()\n", "# Init model from datamodule's attributes\n", "model = LitModel(*dm.size(), dm.num_classes)\n", "# Init trainer\n", "trainer = Trainer(\n", " max_epochs=3,\n", " progress_bar_refresh_rate=20,\n", " gpus=AVAIL_GPUS,\n", ")\n", "# Pass the datamodule as arg to trainer.fit to override model hooks :)\n", "trainer.fit(model, dm)"]}, {"cell_type": "markdown", "id": "34f903fa", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.051415, "end_time": "2021-12-04T16:46:56.811131", "exception": false, "start_time": "2021-12-04T16:46:56.759716", "status": "completed"}, "tags": []}, "source": ["### Defining the CIFAR10 DataModule\n", "\n", "Lets prove the `LitModel` we made earlier is dataset agnostic by defining a new datamodule for the CIFAR10 dataset."]}, {"cell_type": "code", "execution_count": 8, "id": "1b86ab59", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:46:56.920233Z", "iopub.status.busy": "2021-12-04T16:46:56.919755Z", "iopub.status.idle": "2021-12-04T16:46:56.921851Z", "shell.execute_reply": "2021-12-04T16:46:56.921254Z"}, "papermill": {"duration": 0.060616, "end_time": "2021-12-04T16:46:56.921972", "exception": false, "start_time": "2021-12-04T16:46:56.861356", 
"status": "completed"}, "tags": []}, "outputs": [], "source": ["class CIFAR10DataModule(LightningDataModule):\n", " def __init__(self, data_dir: str = \"./\"):\n", " super().__init__()\n", " self.data_dir = data_dir\n", " self.transform = transforms.Compose(\n", " [\n", " transforms.ToTensor(),\n", " transforms.Normalize((0.5, 0.5, 0.5), (0.5, 0.5, 0.5)),\n", " ]\n", " )\n", "\n", " self.dims = (3, 32, 32)\n", " self.num_classes = 10\n", "\n", " def prepare_data(self):\n", " # download\n", " CIFAR10(self.data_dir, train=True, download=True)\n", " CIFAR10(self.data_dir, train=False, download=True)\n", "\n", " def setup(self, stage=None):\n", "\n", " # Assign train/val datasets for use in dataloaders\n", " if stage == \"fit\" or stage is None:\n", " cifar_full = CIFAR10(self.data_dir, train=True, transform=self.transform)\n", " self.cifar_train, self.cifar_val = random_split(cifar_full, [45000, 5000])\n", "\n", " # Assign test dataset for use in dataloader(s)\n", " if stage == \"test\" or stage is None:\n", " self.cifar_test = CIFAR10(self.data_dir, train=False, transform=self.transform)\n", "\n", " def train_dataloader(self):\n", " return DataLoader(self.cifar_train, batch_size=BATCH_SIZE)\n", "\n", " def val_dataloader(self):\n", " return DataLoader(self.cifar_val, batch_size=BATCH_SIZE)\n", "\n", " def test_dataloader(self):\n", " return DataLoader(self.cifar_test, batch_size=BATCH_SIZE)"]}, {"cell_type": "markdown", "id": "ac30ef93", "metadata": {"papermill": {"duration": 0.050833, "end_time": "2021-12-04T16:46:57.023402", "exception": false, "start_time": "2021-12-04T16:46:56.972569", "status": "completed"}, "tags": []}, "source": ["### Training the `LitModel` using the `CIFAR10DataModule`\n", "\n", "Our model isn't very good, so it will perform pretty badly on the CIFAR10 dataset.\n", "\n", "The point here is that we can see that our `LitModel` has no problem using a different datamodule as its input data."]}, {"cell_type": "code", "execution_count": 9, "id": 
"11d3054c", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:46:57.128360Z", "iopub.status.busy": "2021-12-04T16:46:57.127907Z", "iopub.status.idle": "2021-12-04T16:47:50.619126Z", "shell.execute_reply": "2021-12-04T16:47:50.618692Z"}, "papermill": {"duration": 53.545438, "end_time": "2021-12-04T16:47:50.619260", "exception": false, "start_time": "2021-12-04T16:46:57.073822", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["GPU available: True, used: True\n"]}, {"name": "stderr", "output_type": "stream", "text": ["TPU available: False, using: 0 TPU cores\n"]}, {"name": "stderr", "output_type": "stream", "text": ["IPU available: False, using: 0 IPUs\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Files already downloaded and verified\n"]}, {"name": "stdout", "output_type": "stream", "text": ["Files already downloaded and verified\n"]}, {"name": "stderr", "output_type": "stream", "text": ["LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n"]}, {"name": "stderr", "output_type": "stream", "text": ["\n", " | Name | Type | Params\n", "-------------------------------------\n", "0 | model | Sequential | 855 K \n", "-------------------------------------\n", "855 K Trainable params\n", "0 Non-trainable params\n", "855 K Total params\n", "3.420 Total estimated model params size (MB)\n"]}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "07d7ba996450429b80d5a056099cf110", "version_major": 2, "version_minor": 0}, "text/plain": ["Validation sanity check: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "db19a78a15954e2b8a4f99eb2de9270a", "version_major": 2, "version_minor": 0}, "text/plain": ["Training: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "7f2aa9df928e4925a1193b7427380ff4", "version_major": 2, 
"version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "37a0aca2beb042d78d3680070561bfdc", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "3e91c57c5e1a446384fa939d0b3d6525", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "aa675ba935754589a5a9550795c04bee", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "1b28004c7448443a97074788b559d535", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}], "source": ["dm = CIFAR10DataModule()\n", "model = LitModel(*dm.size(), dm.num_classes, hidden_size=256)\n", "trainer = Trainer(\n", " max_epochs=5,\n", " progress_bar_refresh_rate=20,\n", " gpus=AVAIL_GPUS,\n", ")\n", "trainer.fit(model, dm)"]}, {"cell_type": "markdown", "id": "d7227386", "metadata": {"papermill": {"duration": 0.063624, "end_time": "2021-12-04T16:47:50.747460", "exception": false, "start_time": "2021-12-04T16:47:50.683836", "status": "completed"}, "tags": []}, "source": ["## Congratulations - Time to Join the Community!\n", "\n", "Congratulations on completing this notebook tutorial! If you enjoyed this and would like to join the Lightning\n", "movement, you can do so in the following ways!\n", "\n", "### Star [Lightning](https://github.com/PyTorchLightning/pytorch-lightning) on GitHub\n", "The easiest way to help our community is just by starring the GitHub repos! 
This helps raise awareness of the cool\n", "tools we're building.\n", "\n", "### Join our [Slack](https://join.slack.com/t/pytorch-lightning/shared_invite/zt-pw5v393p-qRaDgEk24~EjiZNBpSQFgQ)!\n", "The best way to keep up to date on the latest advancements is to join our community! Make sure to introduce yourself\n", "and share your interests in the `#general` channel.\n", "\n", "\n", "### Contributions!\n", "The best way to contribute to our community is to become a code contributor! At any time you can go to\n", "[Lightning](https://github.com/PyTorchLightning/pytorch-lightning) or [Bolt](https://github.com/PyTorchLightning/lightning-bolts)\n", "GitHub Issues page and filter for \"good first issue\".\n", "\n", "* [Lightning good first issue](https://github.com/PyTorchLightning/pytorch-lightning/issues?q=is%3Aopen+is%3Aissue+label%3A%22good+first+issue%22)\n", "* [Bolt good first issue](https://github.com/PyTorchLightning/lightning-bolts/issues?q=is%3Aopen+is%3Aissue+label%3A%22good+first+issue%22)\n", "* You can also contribute your own notebooks with useful examples!\n", "\n", "### Great thanks from the entire Pytorch Lightning Team for your interest!\n", "\n", "[![Pytorch Lightning](){height=\"60px\" width=\"240px\"}](https://pytorchlightning.ai)"]}, {"cell_type": "raw", "metadata": {"raw_mimetype": "text/restructuredtext"}, "source": [".. customcarditem::\n", " :header: PyTorch Lightning DataModules\n", " :card_description: This notebook will walk you through how to start using Datamodules. 
With the release of `pytorch-lightning` version 0.9.0, we have included a new class called...\n", " :tags: GPU/TPU,Lightning-Examples"]}], "metadata": {"jupytext": {"cell_metadata_filter": "colab_type,id,colab,-all", "formats": "ipynb,py:percent", "main_language": "python"}, "language_info": {"codemirror_mode": {"name": "ipython", "version": 3}, "file_extension": ".py", "mimetype": "text/x-python", "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.9.7"}, "papermill": {"default_parameters": {}, "duration": 121.040769, "end_time": "2021-12-04T16:47:52.223467", "environment_variables": {}, "exception": null, "input_path": "lightning_examples/datamodules/datamodules.ipynb", "output_path": ".notebooks/lightning_examples/datamodules.ipynb", "parameters": {}, "start_time": "2021-12-04T16:45:51.182698", "version": "2.3.3"}, "widgets": {"application/vnd.jupyter.widget-state+json": {"state": {"041f10d5c9fe42f6b6101bf3ce7f53fb": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_bbe528fe44644854a9bb9189dbba1160", "placeholder": "\u200b", "style": "IPY_MODEL_c18acb5a037d4945a4501d96c8fae24e", "value": " 20/20 [00:00<00:00, 20.23it/s]"}}, "046540f066864bcb84c4d37a584da370": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, 
"align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "05008355dc2d450ca42051e370346f18": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "055ce06d091b4f4eba52bf64158e9675": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": 
{"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_fd49beba21cd45ccb858e36c10762a7f", "placeholder": "\u200b", "style": "IPY_MODEL_e56f1ea9380d47d0aa130d82d6e8d685", "value": "Validation sanity check: 0%"}}, "071176e5c655438588281056b551d627": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "07d7ba996450429b80d5a056099cf110": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_81027aed2f2546b99962209d53f522d9", "IPY_MODEL_65ef56c9c8eb42a598a68cacc8da5177", "IPY_MODEL_6e580744cc7e4a40a82df1730f663865"], "layout": "IPY_MODEL_549689ee50894c42a5bfcfe90b7f4565"}}, "0bb08f9ebb7d4bf89852a14acc0aa9d2": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, 
"0dc0803d41cd4c28a7a6f76b8e1ae0ec": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "0e797437e8cd4d4dbaf695d6bb3082a7": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, 
"max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "0fc92bf19ad54f50b87e243797da525b": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "12948f6cb81e42c2a28c87635182f380": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_fd0efe1ba0794d07801286e8c8c82151", "max": 20.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_e10e4a67b6bf467aa5d3d8e7fa91f1ce", "value": 20.0}}, "12f1519dc785487eb49a85ca47b5149d": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": 
null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "1337cb79348240b58c48427043f51f85": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "1418aae647f04591870a4931b9c70781": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_1969d64dc7634207ae872d28b6e425e0", "placeholder": "\u200b", "style": "IPY_MODEL_ff2fae1a3eff4dbbab900312f78a04fc", "value": " 235/235 [00:10<00:00, 23.16it/s, loss=0.331, v_num=4, val_loss=0.278, val_acc=0.918]"}}, "1476ef3e1ecd4018957f0130dfcdb383": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": 
"1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "15d8aa5839444bac8dbb125f268d3727": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_0dc0803d41cd4c28a7a6f76b8e1ae0ec", "placeholder": "\u200b", "style": "IPY_MODEL_6df35592e449430d9f7a9ea085855234", "value": "Epoch 1: 100%"}}, "18ffda5c5a4d48ed9652bc713190efa0": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, 
"grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "1969d64dc7634207ae872d28b6e425e0": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "1a75cc9880ab40a8ba9ce7b57f0a0765": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": 
null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_055ce06d091b4f4eba52bf64158e9675", "IPY_MODEL_fe6f724fbcd549d18f69f46f73cec77e", "IPY_MODEL_3608aa33ad044ec8ad3bbfbe65572fdf"], "layout": "IPY_MODEL_db6cb2d3f32b4b7b96f746b70541cdbd"}}, "1b28004c7448443a97074788b559d535": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_c09fe936a9dd4feaac58207b660e91b8", "IPY_MODEL_b50255939b1448908a80c51319aeb709", "IPY_MODEL_27d3d469dd744b83a084677b4f022b5d"], "layout": "IPY_MODEL_fb9bc72381a24c0ab759f875fe5d1d3b"}}, "1ce8afc6ca874703a5c9a25e499207f3": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": 
null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "1e3ae51213e24a278b69f7e367bf851c": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "1e823fd4e7d0434982e274023a5274bc": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "1efd9542e7ca4ad3a0db3d631cbee72f": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, 
"_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_9d73f752544d4bcc9f1b5b4769c7317d", "max": 20.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_999aa998227047dda17516eeb71aa6db", "value": 20.0}}, "1fa7d7f81f7b4420ae91e983bfb9b4ae": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "20ce657f01dd4c5d8a947124d44078ba": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "23662fea34734dd48718c50b28585645": {"model_module": 
"@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "23efe0a29c96456d97de2fefdd7b6806": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_2aed645a39a44501b2259a5a10f806d1", "placeholder": "\u200b", "style": "IPY_MODEL_20ce657f01dd4c5d8a947124d44078ba", "value": " 470/470 [00:11<00:00, 42.59it/s, loss=0.301, v_num=3, val_loss=0.255, val_acc=0.925]"}}, "2488acd527e24363aa31b980006ae745": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": 
"@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_b2f89c7143ae4567ae699cbee23fe747", "IPY_MODEL_2fb4cb9abeee4b53a47645473806aac2", "IPY_MODEL_3b1643d2b31745f99c51189861531ad0"], "layout": "IPY_MODEL_81c7d575b0f6457f84a3c37bbb09da67"}}, "248e123d9a48408097a33ee63175d655": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_397d40dda3864639b0263f97e6168457", "max": 20.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_9315c66ada0346da8c053c80b636402d", "value": 20.0}}, "27d3d469dd744b83a084677b4f022b5d": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_0e797437e8cd4d4dbaf695d6bb3082a7", "placeholder": "\u200b", "style": "IPY_MODEL_4e001ded9e2142b1ab49555a49c3441c", "value": " 20/20 [00:00<00:00, 20.34it/s]"}}, "2aed645a39a44501b2259a5a10f806d1": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": 
"LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "2bacc7082a704e2d8047b2d17e27e83d": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, 
"visibility": null, "width": null}}, "2fb4cb9abeee4b53a47645473806aac2": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_c6171b1b06a84e75aa7dc2fa35c36f57", "max": 40.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_488ea46105c04a458dc95deb2b53e609", "value": 40.0}}, "30707f52823346dab1b3a6db2b4dfa27": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "31695284f0d944f0b7a423300f908390": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": 
"HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_1476ef3e1ecd4018957f0130dfcdb383", "placeholder": "\u200b", "style": "IPY_MODEL_3a654946c7384b10b9ec0de1c2a9683b", "value": " 0/2 [00:00<?, ?it/s]"}}, "3490c0eeca5c4fa1b2fb1540df1e0119": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "3608aa33ad044ec8ad3bbfbe65572fdf": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", 
"_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_12f1519dc785487eb49a85ca47b5149d", "placeholder": "\u200b", "style": "IPY_MODEL_b34601cdb9f34fedb83d2b3b92095d84", "value": " 0/2 [00:00<?, ?it/s]"}}, "36505e9126384458b7a2f19343d6e37b": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_1fa7d7f81f7b4420ae91e983bfb9b4ae", "placeholder": "\u200b", "style": "IPY_MODEL_0fc92bf19ad54f50b87e243797da525b", "value": "Validating: 100%"}}, "369f33250b7e46e6b54a31680946081c": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, 
"visibility": null, "width": null}}, "37a0aca2beb042d78d3680070561bfdc": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_e1e722b4ba6347d0b864de5c29e7d324", "IPY_MODEL_1efd9542e7ca4ad3a0db3d631cbee72f", "IPY_MODEL_6534be4f1769429b88eebad316c7c2ed"], "layout": "IPY_MODEL_6026cb507a9c4740b0d93a33b710c66f"}}, "397d40dda3864639b0263f97e6168457": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "3a654946c7384b10b9ec0de1c2a9683b": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": 
"@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "3b1643d2b31745f99c51189861531ad0": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_3490c0eeca5c4fa1b2fb1540df1e0119", "placeholder": "\u200b", "style": "IPY_MODEL_a62f633a147d475caa8490ecbb8427cf", "value": " 40/40 [00:00<00:00, 45.54it/s]"}}, "3be62b6211c54a36a9c749eebc7ba65e": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_046540f066864bcb84c4d37a584da370", "max": 196.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_5828ec1d42a947628434634af513fda9", "value": 196.0}}, "3e91c57c5e1a446384fa939d0b3d6525": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", 
"children": ["IPY_MODEL_b5dfecd17bef4d9e8683f470462fa197", "IPY_MODEL_c6c1c3ec1a0341da92b182780b7a6fd0", "IPY_MODEL_cf2a40a0c5174457aea4aec7b8f7864a"], "layout": "IPY_MODEL_bdc92ba2821945acb2db16c1814d4ad1"}}, "40a0d394ad834802a994ae894ce61923": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "4352932c9dc94329b785a1ae04cae96a": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, 
"grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "488ea46105c04a458dc95deb2b53e609": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "4a042e1f9f8c47488002f5e5ef01163e": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, 
"overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "4daeedb9efbd4bdcaee5e9e209ff85f1": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "4e001ded9e2142b1ab49555a49c3441c": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "50701a5262a04c9eade1571e1c112870": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "50bac340b87c4a8aa003a7cc128809ba": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, 
"grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "526b549d670640ebb4c66046ca783375": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "53a860195fe74155b2e3084d57f934b2": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_91359b90570043e684bd0d5c807305eb", "placeholder": "\u200b", "style": "IPY_MODEL_7d14ca2343e84708889dcd5651bdadd5", "value": "Validating: 100%"}}, "53ad10603a244414a17fa3d70960844e": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", 
"description": "", "description_tooltip": null, "layout": "IPY_MODEL_1e3ae51213e24a278b69f7e367bf851c", "placeholder": "\u200b", "style": "IPY_MODEL_eea47fbfb6764d2d8072c08ad33bf2bd", "value": "Validating: 100%"}}, "549689ee50894c42a5bfcfe90b7f4565": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "549a503432ca4c309730849495d09e90": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, 
"grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "56342bc4e2bc4fe4af37821040ac0ecd": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "56d6913766104181a3d312e70a384b5d": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_50bac340b87c4a8aa003a7cc128809ba", "placeholder": "\u200b", "style": "IPY_MODEL_72a9f02a5dfe46a5ad8a4f73f1feb091", "value": "Validating: 100%"}}, "5828ec1d42a947628434634af513fda9": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": 
null, "description_width": ""}}, "58658a5812d741c693aa21f0ea95f63b": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_a7f8bc154c9c40d2840fd03f50e2fb93", "max": 20.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_f2ba50047c764c5c9f8e384672d49050", "value": 20.0}}, "59f0e262344d4ea8b2800057ee40f45e": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "5ae4444dbb994b9eb661bae0061a0545": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": 
{"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "5c66fc27f7bc4809b4a91c1eb28c7be3": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, 
"overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "6026cb507a9c4740b0d93a33b710c66f": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "6218602ae56242fc8427ca200c5caa90": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, 
"grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "64004563a6074b9c876c648bbce6cde5": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "64c91d37fcb8443e966da1b29266351f": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_a9877ca759754a0fa4beaaf9627608ac", "placeholder": "\u200b", "style": "IPY_MODEL_b1f67ebe8dc64b7b8cfc6649dd4217c5", "value": " 20/20 [00:00<00:00, 24.24it/s]"}}, "6534be4f1769429b88eebad316c7c2ed": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": 
"IPY_MODEL_369f33250b7e46e6b54a31680946081c", "placeholder": "\u200b", "style": "IPY_MODEL_a94711718593447395d16addb1a12cda", "value": " 20/20 [00:00<00:00, 20.07it/s]"}}, "6537a3c66b00455c9581c8a9d2d7075f": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "65ef56c9c8eb42a598a68cacc8da5177": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "danger", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_6218602ae56242fc8427ca200c5caa90", "max": 2.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_071176e5c655438588281056b551d627", "value": 
0.0}}, "6df35592e449430d9f7a9ea085855234": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "6e580744cc7e4a40a82df1730f663865": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_fbe640bbc7d541fa9e337874f7ebb100", "placeholder": "\u200b", "style": "IPY_MODEL_85bad507a7d54408897de1439438c898", "value": " 0/2 [00:00<?, ?it/s]"}}, "72a9f02a5dfe46a5ad8a4f73f1feb091": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "768f5e115e3f4d86b97c71b44f458240": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_c5011f431d28417395dd982e6424d342", 
"IPY_MODEL_81b1d48c4ac047828f825d21ab953234", "IPY_MODEL_31695284f0d944f0b7a423300f908390"], "layout": "IPY_MODEL_6537a3c66b00455c9581c8a9d2d7075f"}}, "7a5ccbb2499b43e9ae6b1501456d2d86": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "7d14ca2343e84708889dcd5651bdadd5": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "7dad3ba253814912a31e2c6e420fc7c8": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", 
"_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "7e228107476b4c7dadf3c70d6dab8d44": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_97cec026f48a4eeb8c5af10f22a3cfa4", "max": 235.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_9eca64b3bb7241ff8758aad3c16cf743", "value": 235.0}}, "7f2aa9df928e4925a1193b7427380ff4": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_e45d95dc1d834de9a0c760552507a3e2", "IPY_MODEL_58658a5812d741c693aa21f0ea95f63b", "IPY_MODEL_041f10d5c9fe42f6b6101bf3ce7f53fb"], "layout": "IPY_MODEL_30707f52823346dab1b3a6db2b4dfa27"}}, "7f7924338266405fadf862414d1f02a1": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_ca22e6df84e94eb1b72081b7566bfadf", 
"IPY_MODEL_b613e0efb250468f85488aad1904e785", "IPY_MODEL_d1371d179edb4b7690fb18a3751f3065"], "layout": "IPY_MODEL_4352932c9dc94329b785a1ae04cae96a"}}, "805eb023d3974ad2adeb2370206bd70d": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_90625c2b1c1c4c2d82efb5ad6b7ace57", "max": 20.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_d08c85acb5d2474dbc5e83ced26a5be0", "value": 20.0}}, "80b13852475d438f864f8a7a1a8e6094": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "81027aed2f2546b99962209d53f522d9": 
{"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_ec02b811e3c9471caa5176c09991e4e3", "placeholder": "\u200b", "style": "IPY_MODEL_d49a6c09dd1c423294792b28058ad3e0", "value": "Validation sanity check: 0%"}}, "81108d80cde546739a034f085412f763": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_1ce8afc6ca874703a5c9a25e499207f3", "placeholder": "\u200b", "style": "IPY_MODEL_cd49716ced8a47cd86767a8d334572f8", "value": " 20/20 [00:00<00:00, 24.59it/s]"}}, "81b1d48c4ac047828f825d21ab953234": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "danger", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_fa01c038682a40668590b94a00a4a241", "max": 2.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_56342bc4e2bc4fe4af37821040ac0ecd", "value": 0.0}}, "81c7d575b0f6457f84a3c37bbb09da67": {"model_module": "@jupyter-widgets/base", 
"model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "841ac1bf4d1f405d9af8db196992c21e": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, 
"min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "85bad507a7d54408897de1439438c898": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "889fbb4df4784c92bd9d17bc662ddca0": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_d1245a33a19644fb8a69adfa1a213b2e", "placeholder": "\u200b", "style": "IPY_MODEL_4daeedb9efbd4bdcaee5e9e209ff85f1", "value": " 20/20 [00:01<00:00, 19.99it/s]"}}, "8ad9135da95e41b980ccec4cbdad6e6e": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "8b001407ab8447beb6aac24fe26f6e07": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, 
"_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "8e413e2031854c979e00e11e9c931a1a": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "8e77575340994f2fbd6538d157de467e": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_53a860195fe74155b2e3084d57f934b2", "IPY_MODEL_248e123d9a48408097a33ee63175d655", "IPY_MODEL_81108d80cde546739a034f085412f763"], "layout": "IPY_MODEL_d0a8e767be6a443e9a705ae58e413564"}}, "8e95fecb92834da89d6246cbd02d3f06": {"model_module": 
"@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_56d6913766104181a3d312e70a384b5d", "IPY_MODEL_805eb023d3974ad2adeb2370206bd70d", "IPY_MODEL_9c91bccae6324afbbfd226218c1a6ec3"], "layout": "IPY_MODEL_5ae4444dbb994b9eb661bae0061a0545"}}, "90625c2b1c1c4c2d82efb5ad6b7ace57": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "91359b90570043e684bd0d5c807305eb": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, 
"_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "9315c66ada0346da8c053c80b636402d": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "961ec875a4bc468db541f4d17cb0c959": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_59f0e262344d4ea8b2800057ee40f45e", "max": 470.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_1337cb79348240b58c48427043f51f85", "value": 470.0}}, 
"97cec026f48a4eeb8c5af10f22a3cfa4": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "98056abfaec44f74b95511d322efcffb": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, 
"max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "999aa998227047dda17516eeb71aa6db": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "9c91bccae6324afbbfd226218c1a6ec3": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_ce596973849e485784e0f322bd2fee72", "placeholder": "\u200b", "style": "IPY_MODEL_f0e8755a989b493791b9efcb6b675aa5", "value": " 20/20 [00:00<00:00, 24.50it/s]"}}, "9ce8d78f6d7644588c5cd03364c044cd": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_be8d323ac655443da2433c4688cc3b58", "max": 20.0, "min": 0.0, "orientation": "horizontal", "style": 
"IPY_MODEL_64004563a6074b9c876c648bbce6cde5", "value": 20.0}}, "9d73f752544d4bcc9f1b5b4769c7317d": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "9eca64b3bb7241ff8758aad3c16cf743": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "a066a53b41e249e2831e5980bd4003bf": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", 
"_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "a1984adb3ecb4dd1a030cf6360f62604": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "a62f633a147d475caa8490ecbb8427cf": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "a7f8bc154c9c40d2840fd03f50e2fb93": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": 
"1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "a94711718593447395d16addb1a12cda": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "a9877ca759754a0fa4beaaf9627608ac": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": 
null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "aa675ba935754589a5a9550795c04bee": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_53ad10603a244414a17fa3d70960844e", "IPY_MODEL_12948f6cb81e42c2a28c87635182f380", "IPY_MODEL_889fbb4df4784c92bd9d17bc662ddca0"], "layout": "IPY_MODEL_e1cbc478e48c4cc2b308deca86016e48"}}, "adae3a9829a54b508f38288825a67235": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_d9cb7bfe4691411bbb36fc53a2a61d59", "IPY_MODEL_7e228107476b4c7dadf3c70d6dab8d44", "IPY_MODEL_1418aae647f04591870a4931b9c70781"], "layout": "IPY_MODEL_18ffda5c5a4d48ed9652bc713190efa0"}}, "ae0ef34d0d254bc2a5bf9ab0cb7ebcce": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", 
"_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "af18873d5e6c462bb6b97c59b6dda6d8": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "b1f67ebe8dc64b7b8cfc6649dd4217c5": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "b2f89c7143ae4567ae699cbee23fe747": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", 
"_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_5c66fc27f7bc4809b4a91c1eb28c7be3", "placeholder": "\u200b", "style": "IPY_MODEL_c7615b777eb1436984e41ded24171cab", "value": "Validating: 100%"}}, "b34601cdb9f34fedb83d2b3b92095d84": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "b50255939b1448908a80c51319aeb709": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_a1984adb3ecb4dd1a030cf6360f62604", "max": 20.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_ae0ef34d0d254bc2a5bf9ab0cb7ebcce", "value": 20.0}}, "b5249f51e9854f6398e334263a18f1b7": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "b5dfecd17bef4d9e8683f470462fa197": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], 
"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_fb18af4aa2d64f3da0e019ed601d7d7b", "placeholder": "\u200b", "style": "IPY_MODEL_f5d0c5dae3fc41848ba45e99fccc57f6", "value": "Validating: 100%"}}, "b613e0efb250468f85488aad1904e785": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_549a503432ca4c309730849495d09e90", "max": 40.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_b5249f51e9854f6398e334263a18f1b7", "value": 40.0}}, "b836287ffdbd45f484e253bf70957e90": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "bb867f5c3ba04190998f65812f6f76a2": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", 
"description_tooltip": null, "layout": "IPY_MODEL_841ac1bf4d1f405d9af8db196992c21e", "placeholder": "\u200b", "style": "IPY_MODEL_a066a53b41e249e2831e5980bd4003bf", "value": " 196/196 [00:10<00:00, 19.16it/s, loss=1.35, v_num=5, val_loss=1.440, val_acc=0.495]"}}, "bbe528fe44644854a9bb9189dbba1160": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "bdc92ba2821945acb2db16c1814d4ad1": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, 
"grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "be8d323ac655443da2433c4688cc3b58": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "bf86e207916b4e409d89947baee6b2a3": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": 
null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_36505e9126384458b7a2f19343d6e37b", "IPY_MODEL_9ce8d78f6d7644588c5cd03364c044cd", "IPY_MODEL_64c91d37fcb8443e966da1b29266351f"], "layout": "IPY_MODEL_23662fea34734dd48718c50b28585645"}}, "c09fe936a9dd4feaac58207b660e91b8": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_cb762151a751470eb7c69722f2bd2168", "placeholder": "\u200b", "style": "IPY_MODEL_cc22e526515a48918562f074ab776ac3", "value": "Validating: 100%"}}, "c18acb5a037d4945a4501d96c8fae24e": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "c5011f431d28417395dd982e6424d342": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_e7ad9f0b4e9742a69c0b436f5269eb0a", "placeholder": "\u200b", "style": "IPY_MODEL_1e823fd4e7d0434982e274023a5274bc", "value": "Validation 
sanity check: 0%"}}, "c6171b1b06a84e75aa7dc2fa35c36f57": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "c6c1c3ec1a0341da92b182780b7a6fd0": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_40a0d394ad834802a994ae894ce61923", "max": 20.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_7dad3ba253814912a31e2c6e420fc7c8", "value": 20.0}}, "c7615b777eb1436984e41ded24171cab": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": 
{"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "ca22e6df84e94eb1b72081b7566bfadf": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_80b13852475d438f864f8a7a1a8e6094", "placeholder": "\u200b", "style": "IPY_MODEL_8e413e2031854c979e00e11e9c931a1a", "value": "Validating: 100%"}}, "cb762151a751470eb7c69722f2bd2168": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, 
"visibility": null, "width": null}}, "cc22e526515a48918562f074ab776ac3": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "cd49716ced8a47cd86767a8d334572f8": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "cdd719fc342a4a57aa0c39d938d34bd9": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "ce596973849e485784e0f322bd2fee72": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, 
"grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "cf2a40a0c5174457aea4aec7b8f7864a": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_8b001407ab8447beb6aac24fe26f6e07", "placeholder": "\u200b", "style": "IPY_MODEL_50701a5262a04c9eade1571e1c112870", "value": " 20/20 [00:00<00:00, 20.07it/s]"}}, "d08c85acb5d2474dbc5e83ced26a5be0": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "d0a8e767be6a443e9a705ae58e413564": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": 
null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "d1245a33a19644fb8a69adfa1a213b2e": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "d1371d179edb4b7690fb18a3751f3065": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", 
"state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_2bacc7082a704e2d8047b2d17e27e83d", "placeholder": "\u200b", "style": "IPY_MODEL_0bb08f9ebb7d4bf89852a14acc0aa9d2", "value": " 40/40 [00:00<00:00, 44.58it/s]"}}, "d49a6c09dd1c423294792b28058ad3e0": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "d9cb7bfe4691411bbb36fc53a2a61d59": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_05008355dc2d450ca42051e370346f18", "placeholder": "\u200b", "style": "IPY_MODEL_cdd719fc342a4a57aa0c39d938d34bd9", "value": "Epoch 2: 100%"}}, "da7c1771e1794b5da89c02462ab3b3a9": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, 
"layout": "IPY_MODEL_ee6e60f6f20b44bda4de9976ee4553e5", "placeholder": "\u200b", "style": "IPY_MODEL_b836287ffdbd45f484e253bf70957e90", "value": "Epoch 4: 100%"}}, "db19a78a15954e2b8a4f99eb2de9270a": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_da7c1771e1794b5da89c02462ab3b3a9", "IPY_MODEL_3be62b6211c54a36a9c749eebc7ba65e", "IPY_MODEL_bb867f5c3ba04190998f65812f6f76a2"], "layout": "IPY_MODEL_de2baa14900e4345adbd48d2ba942b9f"}}, "db6cb2d3f32b4b7b96f746b70541cdbd": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "de2baa14900e4345adbd48d2ba942b9f": 
{"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "e10e4a67b6bf467aa5d3d8e7fa91f1ce": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "e1cbc478e48c4cc2b308deca86016e48": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": 
null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "e1e722b4ba6347d0b864de5c29e7d324": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_7a5ccbb2499b43e9ae6b1501456d2d86", "placeholder": "\u200b", "style": "IPY_MODEL_526b549d670640ebb4c66046ca783375", "value": "Validating: 100%"}}, "e45d95dc1d834de9a0c760552507a3e2": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_98056abfaec44f74b95511d322efcffb", "placeholder": "\u200b", "style": "IPY_MODEL_8ad9135da95e41b980ccec4cbdad6e6e", "value": "Validating: 100%"}}, "e56f1ea9380d47d0aa130d82d6e8d685": 
{"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "e7ad9f0b4e9742a69c0b436f5269eb0a": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "eb61fdca27424a06a232c826ca5d695f": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": 
["IPY_MODEL_15d8aa5839444bac8dbb125f268d3727", "IPY_MODEL_961ec875a4bc468db541f4d17cb0c959", "IPY_MODEL_23efe0a29c96456d97de2fefdd7b6806"], "layout": "IPY_MODEL_4a042e1f9f8c47488002f5e5ef01163e"}}, "ec02b811e3c9471caa5176c09991e4e3": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "ee6e60f6f20b44bda4de9976ee4553e5": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, 
"grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "ee78442ff4344ba1927dbd6e3fdb3893": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "eea47fbfb6764d2d8072c08ad33bf2bd": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "f0e8755a989b493791b9efcb6b675aa5": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "f2ba50047c764c5c9f8e384672d49050": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", 
"_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "f5d0c5dae3fc41848ba45e99fccc57f6": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "fa01c038682a40668590b94a00a4a241": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "fb18af4aa2d64f3da0e019ed601d7d7b": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", 
"_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "fb9bc72381a24c0ab759f875fe5d1d3b": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, 
"overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "fbe640bbc7d541fa9e337874f7ebb100": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "fd0efe1ba0794d07801286e8c8c82151": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": 
null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "fd49beba21cd45ccb858e36c10762a7f": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "fe6f724fbcd549d18f69f46f73cec77e": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "danger", "description": "", 
"description_tooltip": null, "layout": "IPY_MODEL_af18873d5e6c462bb6b97c59b6dda6d8", "max": 2.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_ee78442ff4344ba1927dbd6e3fdb3893", "value": 0.0}}, "ff2fae1a3eff4dbbab900312f78a04fc": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}}, "version_major": 2, "version_minor": 0}}}, "nbformat": 4, "nbformat_minor": 5} \ No newline at end of file diff --git a/source/notebooks/lightning_examples/mnist-hello-world.ipynb b/source/notebooks/lightning_examples/mnist-hello-world.ipynb deleted file mode 100644 index ea6d433..0000000 --- a/source/notebooks/lightning_examples/mnist-hello-world.ipynb +++ /dev/null @@ -1 +0,0 @@ -{"cells": [{"cell_type": "markdown", "id": "afc54843", "metadata": {"papermill": {"duration": 0.031932, "end_time": "2021-12-04T16:48:02.533062", "exception": false, "start_time": "2021-12-04T16:48:02.501130", "status": "completed"}, "tags": []}, "source": ["\n", "# Introduction to Pytorch Lightning\n", "\n", "* **Author:** PL team\n", "* **License:** CC BY-SA\n", "* **Generated:** 2021-12-04T16:53:03.416116\n", "\n", "In this notebook, we'll go over the basics of lightning by preparing models to train on the [MNIST Handwritten Digits dataset](https://en.wikipedia.org/wiki/MNIST_database).\n", "\n", "---\n", "Open in [![Open In Colab](){height=\"20px\" width=\"117px\"}](https://colab.research.google.com/github/PytorchLightning/lightning-tutorials/blob/publication/.notebooks/lightning_examples/mnist-hello-world.ipynb)\n", "\n", "Give us a \u2b50 [on Github](https://www.github.com/PytorchLightning/pytorch-lightning/)\n", "| Check out [the 
documentation](https://pytorch-lightning.readthedocs.io/en/latest/)\n", "| Join us [on Slack](https://join.slack.com/t/pytorch-lightning/shared_invite/zt-pw5v393p-qRaDgEk24~EjiZNBpSQFgQ)"]}, {"cell_type": "markdown", "id": "27a845da", "metadata": {"papermill": {"duration": 0.027971, "end_time": "2021-12-04T16:48:02.591409", "exception": false, "start_time": "2021-12-04T16:48:02.563438", "status": "completed"}, "tags": []}, "source": ["## Setup\n", "This notebook requires some packages besides pytorch-lightning."]}, {"cell_type": "code", "execution_count": 1, "id": "012ca993", "metadata": {"colab": {}, "colab_type": "code", "execution": {"iopub.execute_input": "2021-12-04T16:48:02.653518Z", "iopub.status.busy": "2021-12-04T16:48:02.653036Z", "iopub.status.idle": "2021-12-04T16:48:05.576378Z", "shell.execute_reply": "2021-12-04T16:48:05.576765Z"}, "id": "LfrJLKPFyhsK", "lines_to_next_cell": 0, "papermill": {"duration": 2.958093, "end_time": "2021-12-04T16:48:05.577047", "exception": false, "start_time": "2021-12-04T16:48:02.618954", "status": "completed"}, "tags": []}, "outputs": [], "source": ["! 
pip install --quiet \"torchvision\" \"torch>=1.6, <1.9\" \"pytorch-lightning>=1.3\" \"torchmetrics>=0.3\""]}, {"cell_type": "code", "execution_count": 2, "id": "bd97d928", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:48:05.639252Z", "iopub.status.busy": "2021-12-04T16:48:05.638766Z", "iopub.status.idle": "2021-12-04T16:48:09.447461Z", "shell.execute_reply": "2021-12-04T16:48:09.446985Z"}, "papermill": {"duration": 3.841766, "end_time": "2021-12-04T16:48:09.447591", "exception": false, "start_time": "2021-12-04T16:48:05.605825", "status": "completed"}, "tags": []}, "outputs": [], "source": ["import os\n", "\n", "import torch\n", "from pytorch_lightning import LightningModule, Trainer\n", "from torch import nn\n", "from torch.nn import functional as F\n", "from torch.utils.data import DataLoader, random_split\n", "from torchmetrics import Accuracy\n", "from torchvision import transforms\n", "from torchvision.datasets import MNIST\n", "\n", "PATH_DATASETS = os.environ.get(\"PATH_DATASETS\", \".\")\n", "AVAIL_GPUS = min(1, torch.cuda.device_count())\n", "BATCH_SIZE = 256 if AVAIL_GPUS else 64"]}, {"cell_type": "markdown", "id": "5239bd0b", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.027737, "end_time": "2021-12-04T16:48:09.504088", "exception": false, "start_time": "2021-12-04T16:48:09.476351", "status": "completed"}, "tags": []}, "source": ["## Simplest example\n", "\n", "Here's the simplest most minimal example with just a training loop (no validation, no testing).\n", "\n", "**Keep in Mind** - A `LightningModule` *is* a PyTorch `nn.Module` - it just has a few more helpful features."]}, {"cell_type": "code", "execution_count": 3, "id": "6bd8a190", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:48:09.567111Z", "iopub.status.busy": "2021-12-04T16:48:09.566628Z", "iopub.status.idle": "2021-12-04T16:48:09.568711Z", "shell.execute_reply": "2021-12-04T16:48:09.568201Z"}, "papermill": {"duration": 0.035325, 
"end_time": "2021-12-04T16:48:09.568811", "exception": false, "start_time": "2021-12-04T16:48:09.533486", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class MNISTModel(LightningModule):\n", " def __init__(self):\n", " super().__init__()\n", " self.l1 = torch.nn.Linear(28 * 28, 10)\n", "\n", " def forward(self, x):\n", " return torch.relu(self.l1(x.view(x.size(0), -1)))\n", "\n", " def training_step(self, batch, batch_nb):\n", " x, y = batch\n", " loss = F.cross_entropy(self(x), y)\n", " return loss\n", "\n", " def configure_optimizers(self):\n", " return torch.optim.Adam(self.parameters(), lr=0.02)"]}, {"cell_type": "markdown", "id": "341c1376", "metadata": {"papermill": {"duration": 0.028061, "end_time": "2021-12-04T16:48:09.624815", "exception": false, "start_time": "2021-12-04T16:48:09.596754", "status": "completed"}, "tags": []}, "source": ["By using the `Trainer` you automatically get:\n", "1. Tensorboard logging\n", "2. Model checkpointing\n", "3. Training and validation loop\n", "4. early-stopping"]}, {"cell_type": "code", "execution_count": 4, "id": "b86e988a", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:48:09.685915Z", "iopub.status.busy": "2021-12-04T16:48:09.685422Z", "iopub.status.idle": "2021-12-04T16:48:28.879121Z", "shell.execute_reply": "2021-12-04T16:48:28.879523Z"}, "papermill": {"duration": 19.226607, "end_time": "2021-12-04T16:48:28.879683", "exception": false, "start_time": "2021-12-04T16:48:09.653076", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/pytorch_lightning/trainer/connectors/callback_connector.py:90: LightningDeprecationWarning: Setting `Trainer(progress_bar_refresh_rate=20)` is deprecated in v1.5 and will be removed in v1.7. Please pass `pytorch_lightning.callbacks.progress.TQDMProgressBar` with `refresh_rate` directly to the Trainer's `callbacks` argument instead. 
Or, to disable the progress bar pass `enable_progress_bar = False` to the Trainer.\n", " rank_zero_deprecation(\n", "GPU available: True, used: True\n"]}, {"name": "stderr", "output_type": "stream", "text": ["TPU available: False, using: 0 TPU cores\n"]}, {"name": "stderr", "output_type": "stream", "text": ["IPU available: False, using: 0 IPUs\n"]}, {"name": "stderr", "output_type": "stream", "text": ["LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n"]}, {"name": "stderr", "output_type": "stream", "text": ["\n", " | Name | Type | Params\n", "--------------------------------\n", "0 | l1 | Linear | 7.9 K \n", "--------------------------------\n", "7.9 K Trainable params\n", "0 Non-trainable params\n", "7.9 K Total params\n", "0.031 Total estimated model params size (MB)\n"]}, {"name": "stderr", "output_type": "stream", "text": ["/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/pytorch_lightning/trainer/data_loading.py:111: UserWarning: The dataloader, train_dataloader, does not have many workers which may be a bottleneck. 
Consider increasing the value of the `num_workers` argument` (try 12 which is the number of cpus on this machine) in the `DataLoader` init to improve performance.\n", " rank_zero_warn(\n"]}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "5f5b35087a20496caa3f259693946413", "version_major": 2, "version_minor": 0}, "text/plain": ["Training: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}], "source": ["# Init our model\n", "mnist_model = MNISTModel()\n", "\n", "# Init DataLoader from MNIST Dataset\n", "train_ds = MNIST(PATH_DATASETS, train=True, download=True, transform=transforms.ToTensor())\n", "train_loader = DataLoader(train_ds, batch_size=BATCH_SIZE)\n", "\n", "# Initialize a trainer\n", "trainer = Trainer(\n", " gpus=AVAIL_GPUS,\n", " max_epochs=3,\n", " progress_bar_refresh_rate=20,\n", ")\n", "\n", "# Train the model \u26a1\n", "trainer.fit(mnist_model, train_loader)"]}, {"cell_type": "markdown", "id": "d3248fa1", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.033634, "end_time": "2021-12-04T16:48:28.948915", "exception": false, "start_time": "2021-12-04T16:48:28.915281", "status": "completed"}, "tags": []}, "source": ["## A more complete MNIST Lightning Module Example\n", "\n", "That wasn't so hard was it?\n", "\n", "Now that we've got our feet wet, let's dive in a bit deeper and write a more complete `LightningModule` for MNIST...\n", "\n", "This time, we'll bake in all the dataset specific pieces directly in the `LightningModule`.\n", "This way, we can avoid writing extra code at the beginning of our script every time we want to run it.\n", "\n", "---\n", "\n", "### Note what the following built-in functions are doing:\n", "\n", "1. [prepare_data()](https://pytorch-lightning.readthedocs.io/en/stable/common/lightning_module.html#prepare-data) \ud83d\udcbe\n", " - This is where we can download the dataset. 
We point to our desired dataset and ask torchvision's `MNIST` dataset class to download if the dataset isn't found there.\n", " - **Note we do not make any state assignments in this function** (i.e. `self.something = ...`)\n", "\n", "2. [setup(stage)](https://pytorch-lightning.readthedocs.io/en/stable/common/lightning_module.html#setup) \u2699\ufe0f\n", " - Loads in data from file and prepares PyTorch tensor datasets for each split (train, val, test).\n", " - Setup expects a 'stage' arg which is used to separate logic for 'fit' and 'test'.\n", " - If you don't mind loading all your datasets at once, you can set up a condition to allow for both 'fit' related setup and 'test' related setup to run whenever `None` is passed to `stage` (or ignore it altogether and exclude any conditionals).\n", " - **Note this runs across all GPUs and it *is* safe to make state assignments here**\n", "\n", "3. [x_dataloader()](https://pytorch-lightning.readthedocs.io/en/stable/api/pytorch_lightning.core.hooks.html) \u267b\ufe0f\n", " - `train_dataloader()`, `val_dataloader()`, and `test_dataloader()` all return PyTorch `DataLoader` instances that are created by wrapping their respective datasets that we prepared in `setup()`"]}, {"cell_type": "code", "execution_count": 5, "id": "6a0ca038", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:48:29.028294Z", "iopub.status.busy": "2021-12-04T16:48:29.018412Z", "iopub.status.idle": "2021-12-04T16:48:29.030251Z", "shell.execute_reply": "2021-12-04T16:48:29.029861Z"}, "papermill": {"duration": 0.04784, "end_time": "2021-12-04T16:48:29.030353", "exception": false, "start_time": "2021-12-04T16:48:28.982513", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class LitMNIST(LightningModule):\n", " def __init__(self, data_dir=PATH_DATASETS, hidden_size=64, learning_rate=2e-4):\n", "\n", " super().__init__()\n", "\n", " # Set our init args as class attributes\n", " self.data_dir = data_dir\n", " self.hidden_size = 
hidden_size\n", " self.learning_rate = learning_rate\n", "\n", " # Hardcode some dataset specific attributes\n", " self.num_classes = 10\n", " self.dims = (1, 28, 28)\n", " channels, width, height = self.dims\n", " self.transform = transforms.Compose(\n", " [\n", " transforms.ToTensor(),\n", " transforms.Normalize((0.1307,), (0.3081,)),\n", " ]\n", " )\n", "\n", " # Define PyTorch model\n", " self.model = nn.Sequential(\n", " nn.Flatten(),\n", " nn.Linear(channels * width * height, hidden_size),\n", " nn.ReLU(),\n", " nn.Dropout(0.1),\n", " nn.Linear(hidden_size, hidden_size),\n", " nn.ReLU(),\n", " nn.Dropout(0.1),\n", " nn.Linear(hidden_size, self.num_classes),\n", " )\n", "\n", " self.accuracy = Accuracy()\n", "\n", " def forward(self, x):\n", " x = self.model(x)\n", " return F.log_softmax(x, dim=1)\n", "\n", " def training_step(self, batch, batch_idx):\n", " x, y = batch\n", " logits = self(x)\n", " loss = F.nll_loss(logits, y)\n", " return loss\n", "\n", " def validation_step(self, batch, batch_idx):\n", " x, y = batch\n", " logits = self(x)\n", " loss = F.nll_loss(logits, y)\n", " preds = torch.argmax(logits, dim=1)\n", " self.accuracy(preds, y)\n", "\n", " # Calling self.log will surface up scalars for you in TensorBoard\n", " self.log(\"val_loss\", loss, prog_bar=True)\n", " self.log(\"val_acc\", self.accuracy, prog_bar=True)\n", " return loss\n", "\n", " def test_step(self, batch, batch_idx):\n", " # Here we just reuse the validation_step for testing\n", " return self.validation_step(batch, batch_idx)\n", "\n", " def configure_optimizers(self):\n", " optimizer = torch.optim.Adam(self.parameters(), lr=self.learning_rate)\n", " return optimizer\n", "\n", " ####################\n", " # DATA RELATED HOOKS\n", " ####################\n", "\n", " def prepare_data(self):\n", " # download\n", " MNIST(self.data_dir, train=True, download=True)\n", " MNIST(self.data_dir, train=False, download=True)\n", "\n", " def setup(self, stage=None):\n", "\n", " # Assign 
train/val datasets for use in dataloaders\n", " if stage == \"fit\" or stage is None:\n", " mnist_full = MNIST(self.data_dir, train=True, transform=self.transform)\n", " self.mnist_train, self.mnist_val = random_split(mnist_full, [55000, 5000])\n", "\n", " # Assign test dataset for use in dataloader(s)\n", " if stage == \"test\" or stage is None:\n", " self.mnist_test = MNIST(self.data_dir, train=False, transform=self.transform)\n", "\n", " def train_dataloader(self):\n", " return DataLoader(self.mnist_train, batch_size=BATCH_SIZE)\n", "\n", " def val_dataloader(self):\n", " return DataLoader(self.mnist_val, batch_size=BATCH_SIZE)\n", "\n", " def test_dataloader(self):\n", " return DataLoader(self.mnist_test, batch_size=BATCH_SIZE)"]}, {"cell_type": "code", "execution_count": 6, "id": "8b595285", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:48:29.104668Z", "iopub.status.busy": "2021-12-04T16:48:29.104193Z", "iopub.status.idle": "2021-12-04T16:49:00.348987Z", "shell.execute_reply": "2021-12-04T16:49:00.348528Z"}, "papermill": {"duration": 31.284667, "end_time": "2021-12-04T16:49:00.349114", "exception": false, "start_time": "2021-12-04T16:48:29.064447", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["GPU available: True, used: True\n"]}, {"name": "stderr", "output_type": "stream", "text": ["TPU available: False, using: 0 TPU cores\n"]}, {"name": "stderr", "output_type": "stream", "text": ["IPU available: False, using: 0 IPUs\n"]}, {"name": "stderr", "output_type": "stream", "text": ["LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n"]}, {"name": "stderr", "output_type": "stream", "text": ["\n", " | Name | Type | Params\n", "----------------------------------------\n", "0 | model | Sequential | 55.1 K\n", "1 | accuracy | Accuracy | 0 \n", "----------------------------------------\n", "55.1 K Trainable params\n", "0 Non-trainable params\n", "55.1 K Total params\n", "0.220 Total estimated model 
params size (MB)\n"]}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "601373ace9d24621bdc3be090c0e9b8b", "version_major": 2, "version_minor": 0}, "text/plain": ["Validation sanity check: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"name": "stderr", "output_type": "stream", "text": ["/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/pytorch_lightning/trainer/data_loading.py:111: UserWarning: The dataloader, val_dataloader 0, does not have many workers which may be a bottleneck. Consider increasing the value of the `num_workers` argument` (try 12 which is the number of cpus on this machine) in the `DataLoader` init to improve performance.\n", " rank_zero_warn(\n"]}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "11ce7ae5de484643b6cc8ad0b77411fe", "version_major": 2, "version_minor": 0}, "text/plain": ["Training: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "f7c86a8dd9c04460b3a3cf2b3056dad0", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "292a3bb25f83487db56ebc2b6e7d117b", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "6fefda9cb8654253bbd58b94764626e3", "version_major": 2, "version_minor": 0}, "text/plain": ["Validating: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}], "source": ["model = LitMNIST()\n", "trainer = Trainer(\n", " gpus=AVAIL_GPUS,\n", " max_epochs=3,\n", " progress_bar_refresh_rate=20,\n", ")\n", "trainer.fit(model)"]}, {"cell_type": "markdown", "id": "436f04a4", "metadata": {"papermill": {"duration": 0.043938, "end_time": 
"2021-12-04T16:49:00.437413", "exception": false, "start_time": "2021-12-04T16:49:00.393475", "status": "completed"}, "tags": []}, "source": ["### Testing\n", "\n", "To test a model, call `trainer.test(model)`.\n", "\n", "Or, if you've just trained a model, you can just call `trainer.test()` and Lightning will automatically\n", "test using the best saved checkpoint (conditioned on val_loss)."]}, {"cell_type": "code", "execution_count": 7, "id": "caee2e97", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:49:00.530200Z", "iopub.status.busy": "2021-12-04T16:49:00.529111Z", "iopub.status.idle": "2021-12-04T16:49:02.326996Z", "shell.execute_reply": "2021-12-04T16:49:02.326564Z"}, "papermill": {"duration": 1.845813, "end_time": "2021-12-04T16:49:02.327125", "exception": false, "start_time": "2021-12-04T16:49:00.481312", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/pytorch_lightning/trainer/trainer.py:1393: UserWarning: `.test(ckpt_path=None)` was called without a model. The best model of the previous `fit` call will be used. 
You can pass `test(ckpt_path='best')` to use and best model checkpoint and avoid this warning or `ckpt_path=trainer.model_checkpoint.last_model_path` to use the last model.\n", " rank_zero_warn(\n", "Restoring states from the checkpoint path at /__w/1/s/lightning_logs/version_7/checkpoints/epoch=2-step=644.ckpt\n"]}, {"name": "stderr", "output_type": "stream", "text": ["LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n"]}, {"name": "stderr", "output_type": "stream", "text": ["Loaded model weights from checkpoint at /__w/1/s/lightning_logs/version_7/checkpoints/epoch=2-step=644.ckpt\n"]}, {"name": "stderr", "output_type": "stream", "text": ["/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/pytorch_lightning/trainer/data_loading.py:111: UserWarning: The dataloader, test_dataloader 0, does not have many workers which may be a bottleneck. Consider increasing the value of the `num_workers` argument` (try 12 which is the number of cpus on this machine) in the `DataLoader` init to improve performance.\n", " rank_zero_warn(\n"]}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "b2042d298d80448885957a83ec7d3c2b", "version_major": 2, "version_minor": 0}, "text/plain": ["Testing: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"name": "stdout", "output_type": "stream", "text": ["--------------------------------------------------------------------------------\n", "DATALOADER:0 TEST RESULTS\n", "{'val_acc': 0.9211000204086304, 'val_loss': 0.25840938091278076}\n", "--------------------------------------------------------------------------------\n"]}, {"data": {"text/plain": ["[{'val_loss': 0.25840938091278076, 'val_acc': 0.9211000204086304}]"]}, "execution_count": 7, "metadata": {}, "output_type": "execute_result"}], "source": ["trainer.test()"]}, {"cell_type": "markdown", "id": "5a843462", "metadata": {"papermill": {"duration": 0.049757, "end_time": "2021-12-04T16:49:02.427433", "exception": false, "start_time": 
"2021-12-04T16:49:02.377676", "status": "completed"}, "tags": []}, "source": ["### Bonus Tip\n", "\n", "You can keep calling `trainer.fit(model)` as many times as you'd like to continue training"]}, {"cell_type": "code", "execution_count": 8, "id": "249d097e", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:49:02.532137Z", "iopub.status.busy": "2021-12-04T16:49:02.531667Z", "iopub.status.idle": "2021-12-04T16:49:02.760734Z", "shell.execute_reply": "2021-12-04T16:49:02.760300Z"}, "papermill": {"duration": 0.283193, "end_time": "2021-12-04T16:49:02.760859", "exception": false, "start_time": "2021-12-04T16:49:02.477666", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n"]}, {"name": "stderr", "output_type": "stream", "text": ["\n", " | Name | Type | Params\n", "----------------------------------------\n", "0 | model | Sequential | 55.1 K\n", "1 | accuracy | Accuracy | 0 \n", "----------------------------------------\n", "55.1 K Trainable params\n", "0 Non-trainable params\n", "55.1 K Total params\n", "0.220 Total estimated model params size (MB)\n"]}, {"name": "stderr", "output_type": "stream", "text": ["/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/pytorch_lightning/callbacks/model_checkpoint.py:623: UserWarning: Checkpoint directory /__w/1/s/lightning_logs/version_7/checkpoints exists and is not empty.\n", " rank_zero_warn(f\"Checkpoint directory {dirpath} exists and is not empty.\")\n"]}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "a123bf1c0353409dbe32f4a4a590ab6e", "version_major": 2, "version_minor": 0}, "text/plain": ["Validation sanity check: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}], "source": ["trainer.fit(model)"]}, {"cell_type": "markdown", "id": "c1c65385", "metadata": {"papermill": {"duration": 0.053219, "end_time": "2021-12-04T16:49:02.867679", "exception": false, 
"start_time": "2021-12-04T16:49:02.814460", "status": "completed"}, "tags": []}, "source": ["In Colab, you can use the TensorBoard magic function to view the logs that Lightning has created for you!"]}, {"cell_type": "code", "execution_count": 9, "id": "fdd68fee", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:49:02.978094Z", "iopub.status.busy": "2021-12-04T16:49:02.977622Z", "iopub.status.idle": "2021-12-04T16:49:04.563924Z", "shell.execute_reply": "2021-12-04T16:49:04.564319Z"}, "papermill": {"duration": 1.643849, "end_time": "2021-12-04T16:49:04.564484", "exception": false, "start_time": "2021-12-04T16:49:02.920635", "status": "completed"}, "tags": []}, "outputs": [{"data": {"text/html": ["\n", " \n", " \n", " "], "text/plain": [""]}, "metadata": {}, "output_type": "display_data"}], "source": ["# Start tensorboard.\n", "%load_ext tensorboard\n", "%tensorboard --logdir lightning_logs/"]}, {"cell_type": "markdown", "id": "fb7c0504", "metadata": {"papermill": {"duration": 0.054861, "end_time": "2021-12-04T16:49:04.675577", "exception": false, "start_time": "2021-12-04T16:49:04.620716", "status": "completed"}, "tags": []}, "source": ["## Congratulations - Time to Join the Community!\n", "\n", "Congratulations on completing this notebook tutorial! If you enjoyed this and would like to join the Lightning\n", "movement, you can do so in the following ways!\n", "\n", "### Star [Lightning](https://github.com/PyTorchLightning/pytorch-lightning) on GitHub\n", "The easiest way to help our community is just by starring the GitHub repos! This helps raise awareness of the cool\n", "tools we're building.\n", "\n", "### Join our [Slack](https://join.slack.com/t/pytorch-lightning/shared_invite/zt-pw5v393p-qRaDgEk24~EjiZNBpSQFgQ)!\n", "The best way to keep up to date on the latest advancements is to join our community! 
Make sure to introduce yourself\n", "and share your interests in `#general` channel\n", "\n", "\n", "### Contributions !\n", "The best way to contribute to our community is to become a code contributor! At any time you can go to\n", "[Lightning](https://github.com/PyTorchLightning/pytorch-lightning) or [Bolt](https://github.com/PyTorchLightning/lightning-bolts)\n", "GitHub Issues page and filter for \"good first issue\".\n", "\n", "* [Lightning good first issue](https://github.com/PyTorchLightning/pytorch-lightning/issues?q=is%3Aopen+is%3Aissue+label%3A%22good+first+issue%22)\n", "* [Bolt good first issue](https://github.com/PyTorchLightning/lightning-bolts/issues?q=is%3Aopen+is%3Aissue+label%3A%22good+first+issue%22)\n", "* You can also contribute your own notebooks with useful examples !\n", "\n", "### Great thanks from the entire Pytorch Lightning Team for your interest !\n", "\n", "[![Pytorch Lightning](){height=\"60px\" width=\"240px\"}](https://pytorchlightning.ai)"]}, {"cell_type": "raw", "metadata": {"raw_mimetype": "text/restructuredtext"}, "source": [".. 
customcarditem::\n", " :header: Introduction to Pytorch Lightning\n", " :card_description: In this notebook, we'll go over the basics of lightning by preparing models to train on the [MNIST Handwritten Digits dataset](https://en.wikipedia.org/wiki/MNIST_database).\n", " :tags: Image,GPU/TPU,Lightning-Examples"]}], "metadata": {"jupytext": {"cell_metadata_filter": "id,colab,colab_type,-all", "formats": "ipynb,py:percent", "main_language": "python"}, "language_info": {"codemirror_mode": {"name": "ipython", "version": 3}, "file_extension": ".py", "mimetype": "text/x-python", "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.9.7"}, "papermill": {"default_parameters": {}, "duration": 64.932502, "end_time": "2021-12-04T16:49:06.142038", "environment_variables": {}, "exception": null, "input_path": "lightning_examples/mnist-hello-world/hello-world.ipynb", "output_path": ".notebooks/lightning_examples/mnist-hello-world.ipynb", "parameters": {}, "start_time": "2021-12-04T16:48:01.209536", "version": "2.3.3"}, "widgets": {"application/vnd.jupyter.widget-state+json": {"state": {"09b7fc22ad90482a84100bbd3d5b1c53": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": 
null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "09ba6f68123f47288cacec730782831d": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "11ce7ae5de484643b6cc8ad0b77411fe": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_c4b7018fa4ef4a62ad60e470cfee1c9f", "IPY_MODEL_7566c4e4b4234020b638cf6c489feb47", "IPY_MODEL_b3ab34ed6d4042ae91e80bdd838ad63d"], "layout": "IPY_MODEL_7fafd99b34754f9fb3ff703cb1c762a1"}}, "14b9bf5c15264c889319160095808d4b": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_1c3f0a5537464548ba3655d0151b913b", "max": 20.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_4501abf9f43b45fdadccf542b6dc11bc", "value": 
20.0}}, "19d6db216fc94fd7a8b903efbcaf8d7e": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "1c3f0a5537464548ba3655d0151b913b": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "1e4f591b0f5c4310a2e2c3df78d41654": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, 
"align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "2432b8e2d34a4213a0ac1bdc1e25ff98": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "273c67245899415eadf04785d18c24fe": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", 
"model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "27b765a1b4d54bc1b9cb84c86b4d53fa": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "28e0a4fd04d944bba0bdd698f9f39fbb": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "danger", "description": "", "description_tooltip": null, "layout": 
"IPY_MODEL_29c0045e415c420cbdd41c7d5b2fe42a", "max": 2.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_478fad99664b4688be1597372d2a8cd3", "value": 0.0}}, "292a3bb25f83487db56ebc2b6e7d117b": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_bee7eb1c5f004aa09e8c8d480450ddff", "IPY_MODEL_14b9bf5c15264c889319160095808d4b", "IPY_MODEL_95d4c0d79a4440bdb504b719acbf0778"], "layout": "IPY_MODEL_273c67245899415eadf04785d18c24fe"}}, "29c0045e415c420cbdd41c7d5b2fe42a": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "33522fca1b8a4402b486f5bd2ec52f16": {"model_module": 
"@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "36c52a31cbd84d1da6e45c5a1123c8e0": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_56a2270791254a2b8f2d90010ef093de", "placeholder": "\u200b", "style": "IPY_MODEL_fee96cc5fbdc402aa2943e79a4f2adad", "value": " 0/2 [00:00<?, ?it/s]"}}, "36f68744cfbd40919535814cfe014de3": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", 
"_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "danger", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_8a457394c16d4c5da14f73ede0aa58dc", "max": 2.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_c48ac9d9272f48f0a4930157bbbc4544", "value": 0.0}}, "3945a41419174768bdd37f6346ac4800": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "3d9ac0fe691d49799e8bfd681c7a0da6": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, 
"41a1e336782045fa8b4c51d48bec6076": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_c717831da0c7486782afa3bd59a5867a", "placeholder": "\u200b", "style": "IPY_MODEL_d70e90c6cb0646769c81d4754c39c29b", "value": " 0/2 [00:00<?, ?it/s]"}}, "440b8511219849d8a2035bacc3faae8b": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "4501abf9f43b45fdadccf542b6dc11bc": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": 
"1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "46ed279af4134635be629e5f424c178b": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "478fad99664b4688be1597372d2a8cd3": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "56a2270791254a2b8f2d90010ef093de": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, 
"min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "57326adc0f7447209791335361c9b25e": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "5785b759472d4738b820d3404fb97ea2": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "5b5fd440314f4e08b05560ea5411d6a7": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", 
"_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "5e503ce2e5d547369325b3b3c57c91d4": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_440b8511219849d8a2035bacc3faae8b", "max": 20.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_3d9ac0fe691d49799e8bfd681c7a0da6", "value": 20.0}}, "5f5b35087a20496caa3f259693946413": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", 
"_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_61750b7330d8424dba8b0236b1ea916f", "IPY_MODEL_dd0e944c91f0494e9de3e89daa1d4c3d", "IPY_MODEL_6968aa8766cd43f58e25354153ec2c89"], "layout": "IPY_MODEL_fbc62c1a049e480799d3bdb649afc778"}}, "601373ace9d24621bdc3be090c0e9b8b": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_7bb333f35c324e62b30a6cf6c18ff8c4", "IPY_MODEL_28e0a4fd04d944bba0bdd698f9f39fbb", "IPY_MODEL_36c52a31cbd84d1da6e45c5a1123c8e0"], "layout": "IPY_MODEL_f1ca115efd3241449f819b4377f98007"}}, "61750b7330d8424dba8b0236b1ea916f": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_aa7559605123408da3bb35c2363314a2", "placeholder": "\u200b", "style": "IPY_MODEL_962f2ab6be8e40118d4609258536dde1", "value": "Epoch 2: 100%"}}, "6968aa8766cd43f58e25354153ec2c89": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": 
"IPY_MODEL_b6d778d7d9b54c099015a006d3385bcb", "placeholder": "\u200b", "style": "IPY_MODEL_46ed279af4134635be629e5f424c178b", "value": " 235/235 [00:05<00:00, 45.01it/s, loss=0.213, v_num=6]"}}, "6fefda9cb8654253bbd58b94764626e3": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_db908903174440b59181bb496ad0bd7d", "IPY_MODEL_5e503ce2e5d547369325b3b3c57c91d4", "IPY_MODEL_75c54f7791c849ae8fbe03af570c54a1"], "layout": "IPY_MODEL_33522fca1b8a4402b486f5bd2ec52f16"}}, "7566c4e4b4234020b638cf6c489feb47": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_3945a41419174768bdd37f6346ac4800", "max": 235.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_f68fa8b22e4e4c0a8ba07448efaac3d5", "value": 235.0}}, "75c54f7791c849ae8fbe03af570c54a1": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": 
"IPY_MODEL_e38e27d7dd8a435792803c03f6af9982", "placeholder": "\u200b", "style": "IPY_MODEL_57326adc0f7447209791335361c9b25e", "value": " 20/20 [00:00<00:00, 23.11it/s]"}}, "775676e5b53e4a3fa26c8ea381b4e483": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "79eb4cc1040e4a9a8b971876af6fd9bf": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "7bb333f35c324e62b30a6cf6c18ff8c4": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_c41d39eee0404e809f007049084d30cb", "placeholder": "\u200b", "style": "IPY_MODEL_09ba6f68123f47288cacec730782831d", "value": "Validation sanity check: 0%"}}, "7fafd99b34754f9fb3ff703cb1c762a1": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", 
"_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "80ef770fb6a34f94a5b0cb6d4629f1c9": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_1e4f591b0f5c4310a2e2c3df78d41654", "max": 1.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_a6926eb7fd14423e8f9b284b6b88564c", "value": 1.0}}, "8289d840a8174725a33705d0439b9f10": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": 
"IPY_MODEL_5785b759472d4738b820d3404fb97ea2", "placeholder": "\u200b", "style": "IPY_MODEL_a18c5a748a154261b6e333e87968d4a8", "value": "Validation sanity check: 0%"}}, "8406484c64fe477c9d3486292a77d2da": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "89f6945a57fa4bed9a22d6d3f329c59b": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "8a457394c16d4c5da14f73ede0aa58dc": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", 
"_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "8bcd7a8fc13e46a5945906814a70721d": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, 
"width": null}}, "8ceaaab585ca48ac83ad55bb94e639d2": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_d7ea8fa06e4549c58feb8fbf60d54f12", "placeholder": "\u200b", "style": "IPY_MODEL_8ef594a7ac2a49b4b4bb65a932f800a4", "value": "Validating: 100%"}}, "8ef594a7ac2a49b4b4bb65a932f800a4": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "9071e7327b5744a1b17e70e9608e9662": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_90c9f1abf4e6487f9db8021657ad8057", "placeholder": "\u200b", "style": "IPY_MODEL_775676e5b53e4a3fa26c8ea381b4e483", "value": " 20/20 [00:00<00:00, 23.27it/s]"}}, "90c9f1abf4e6487f9db8021657ad8057": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": 
"@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "94477649bcc24394b6766ae40ee7a37b": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, 
"95d4c0d79a4440bdb504b719acbf0778": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_8bcd7a8fc13e46a5945906814a70721d", "placeholder": "\u200b", "style": "IPY_MODEL_27b765a1b4d54bc1b9cb84c86b4d53fa", "value": " 20/20 [00:00<00:00, 23.17it/s]"}}, "962f2ab6be8e40118d4609258536dde1": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "a123bf1c0353409dbe32f4a4a590ab6e": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_8289d840a8174725a33705d0439b9f10", "IPY_MODEL_36f68744cfbd40919535814cfe014de3", "IPY_MODEL_41a1e336782045fa8b4c51d48bec6076"], "layout": "IPY_MODEL_ff65026a9670453ebcecb7e57edd3cec"}}, "a18c5a748a154261b6e333e87968d4a8": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": 
null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "a6926eb7fd14423e8f9b284b6b88564c": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "aa7559605123408da3bb35c2363314a2": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "b2042d298d80448885957a83ec7d3c2b": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", 
"_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_df7beb8dbb0446d9a206713382500de7", "IPY_MODEL_80ef770fb6a34f94a5b0cb6d4629f1c9", "IPY_MODEL_f42bc9c824594b859e33d07c4246c0b5"], "layout": "IPY_MODEL_b3c049feedaf4965a787b5c4d545f32e"}}, "b294ce2c629b4c8ca6e53502f288a603": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "b3ab34ed6d4042ae91e80bdd838ad63d": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_8406484c64fe477c9d3486292a77d2da", 
"placeholder": "\u200b", "style": "IPY_MODEL_c420cef9f94f454b8698511085cf538e", "value": " 235/235 [00:10<00:00, 22.72it/s, loss=0.31, v_num=7, val_loss=0.275, val_acc=0.921]"}}, "b3c049feedaf4965a787b5c4d545f32e": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "b6d778d7d9b54c099015a006d3385bcb": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, 
"grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "bee7eb1c5f004aa09e8c8d480450ddff": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_94477649bcc24394b6766ae40ee7a37b", "placeholder": "\u200b", "style": "IPY_MODEL_e6903d15de3d45f091f541aa054db6db", "value": "Validating: 100%"}}, "c41d39eee0404e809f007049084d30cb": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, 
"min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "c420cef9f94f454b8698511085cf538e": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "c48ac9d9272f48f0a4930157bbbc4544": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "c4b7018fa4ef4a62ad60e470cfee1c9f": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_09b7fc22ad90482a84100bbd3d5b1c53", "placeholder": "\u200b", "style": "IPY_MODEL_e4c04bc4371d4ca4b06392616ee7ccd7", "value": "Epoch 2: 100%"}}, "c717831da0c7486782afa3bd59a5867a": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", 
"_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "d55566f7956945348c51ae8cec3095d2": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "d70e90c6cb0646769c81d4754c39c29b": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "d7ea8fa06e4549c58feb8fbf60d54f12": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": 
"LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "db908903174440b59181bb496ad0bd7d": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_f79e96bcb58a4eb4bcbacb7174bc2ba2", "placeholder": "\u200b", "style": "IPY_MODEL_e91201e5eeb14339b07597e7a1d71aad", "value": "Validating: 100%"}}, "dd0e944c91f0494e9de3e89daa1d4c3d": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", 
"description_tooltip": null, "layout": "IPY_MODEL_f4700930b6674d4fba7ef5015f0bd1fc", "max": 235.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_d55566f7956945348c51ae8cec3095d2", "value": 235.0}}, "de4a8179670a4f57b219144d967a13c5": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "df7beb8dbb0446d9a206713382500de7": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_de4a8179670a4f57b219144d967a13c5", "placeholder": "\u200b", "style": "IPY_MODEL_79eb4cc1040e4a9a8b971876af6fd9bf", "value": "Testing: 100%"}}, 
"e38e27d7dd8a435792803c03f6af9982": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "e4c04bc4371d4ca4b06392616ee7ccd7": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "e6903d15de3d45f091f541aa054db6db": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": 
""}}, "e91201e5eeb14339b07597e7a1d71aad": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "f1ca115efd3241449f819b4377f98007": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "f42bc9c824594b859e33d07c4246c0b5": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", 
"description": "", "description_tooltip": null, "layout": "IPY_MODEL_5b5fd440314f4e08b05560ea5411d6a7", "placeholder": "\u200b", "style": "IPY_MODEL_89f6945a57fa4bed9a22d6d3f329c59b", "value": " 40/40 [00:01<00:00, 23.36it/s]"}}, "f4700930b6674d4fba7ef5015f0bd1fc": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "f68fa8b22e4e4c0a8ba07448efaac3d5": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}, "f79e96bcb58a4eb4bcbacb7174bc2ba2": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": 
"@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "f7c86a8dd9c04460b3a3cf2b3056dad0": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_8ceaaab585ca48ac83ad55bb94e639d2", "IPY_MODEL_fc20401683aa4661a2ab78db340ccbd4", "IPY_MODEL_9071e7327b5744a1b17e70e9608e9662"], "layout": "IPY_MODEL_2432b8e2d34a4213a0ac1bdc1e25ff98"}}, "fbc62c1a049e480799d3bdb649afc778": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": 
null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "fc20401683aa4661a2ab78db340ccbd4": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_b294ce2c629b4c8ca6e53502f288a603", "max": 20.0, "min": 0.0, "orientation": "horizontal", "style": "IPY_MODEL_19d6db216fc94fd7a8b903efbcaf8d7e", "value": 20.0}}, "fee96cc5fbdc402aa2943e79a4f2adad": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "ff65026a9670453ebcecb7e57edd3cec": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": 
"LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}}, "version_major": 2, "version_minor": 0}}}, "nbformat": 4, "nbformat_minor": 5} \ No newline at end of file diff --git a/source/notebooks/lightning_examples/mnist-tpu-training.ipynb b/source/notebooks/lightning_examples/mnist-tpu-training.ipynb deleted file mode 100644 index d718144..0000000 --- a/source/notebooks/lightning_examples/mnist-tpu-training.ipynb +++ /dev/null @@ -1 +0,0 @@ -{"cells": [{"cell_type": "markdown", "id": "e49ff764", "metadata": {}, "source": ["\n", "# TPU training with PyTorch Lightning\n", "\n", "* **Author:** PL team\n", "* **License:** CC BY-SA\n", "* **Generated:** 2021-12-04T16:53:07.915320\n", "\n", "In this notebook, we'll train a model on TPUs. Updating one Trainer flag is all you need for that. 
The most up to documentation related to TPU training can be found [here](https://pytorch-lightning.readthedocs.io/en/latest/advanced/tpu.html).\n", "\n", "---\n", "Open in [![Open In Colab](){height=\"20px\" width=\"117px\"}](https://colab.research.google.com/github/PytorchLightning/lightning-tutorials/blob/publication/.notebooks/lightning_examples/mnist-tpu-training.ipynb)\n", "\n", "Give us a \u2b50 [on Github](https://www.github.com/PytorchLightning/pytorch-lightning/)\n", "| Check out [the documentation](https://pytorch-lightning.readthedocs.io/en/latest/)\n", "| Join us [on Slack](https://join.slack.com/t/pytorch-lightning/shared_invite/zt-pw5v393p-qRaDgEk24~EjiZNBpSQFgQ)"]}, {"cell_type": "markdown", "id": "f024b9fe", "metadata": {}, "source": ["## Setup\n", "This notebook requires some packages besides pytorch-lightning."]}, {"cell_type": "code", "execution_count": null, "id": "26f8e4d5", "metadata": {"colab": {}, "colab_type": "code", "id": "LfrJLKPFyhsK", "lines_to_next_cell": 0}, "outputs": [], "source": ["! pip install --quiet \"torch>=1.6, <1.9\" \"pytorch-lightning>=1.3\" \"torchvision\" \"torchmetrics>=0.3\""]}, {"cell_type": "markdown", "id": "a1a49780", "metadata": {}, "source": ["### Install Colab TPU compatible PyTorch/TPU wheels and dependencies"]}, {"cell_type": "code", "execution_count": null, "id": "4ed2602f", "metadata": {}, "outputs": [], "source": ["! 
pip install cloud-tpu-client==0.10 https://storage.googleapis.com/tpu-pytorch/wheels/torch_xla-1.8-cp37-cp37m-linux_x86_64.whl"]}, {"cell_type": "code", "execution_count": null, "id": "5d907ddd", "metadata": {}, "outputs": [], "source": ["import torch\n", "import torch.nn.functional as F\n", "from pytorch_lightning import LightningDataModule, LightningModule, Trainer\n", "from torch import nn\n", "from torch.utils.data import DataLoader, random_split\n", "from torchmetrics.functional import accuracy\n", "from torchvision import transforms\n", "\n", "# Note - you must have torchvision installed for this example\n", "from torchvision.datasets import MNIST\n", "\n", "BATCH_SIZE = 1024"]}, {"cell_type": "markdown", "id": "5f438e89", "metadata": {"lines_to_next_cell": 2}, "source": ["### Defining The `MNISTDataModule`\n", "\n", "Below we define `MNISTDataModule`. You can learn more about datamodules\n", "in [docs](https://pytorch-lightning.readthedocs.io/en/latest/extensions/datamodules.html)."]}, {"cell_type": "code", "execution_count": null, "id": "5e591ce5", "metadata": {"lines_to_next_cell": 2}, "outputs": [], "source": ["class MNISTDataModule(LightningDataModule):\n", " def __init__(self, data_dir: str = \"./\"):\n", " super().__init__()\n", " self.data_dir = data_dir\n", " self.transform = transforms.Compose([transforms.ToTensor(), transforms.Normalize((0.1307,), (0.3081,))])\n", "\n", " # self.dims is returned when you call dm.size()\n", " # Setting default dims here because we know them.\n", " # Could optionally be assigned dynamically in dm.setup()\n", " self.dims = (1, 28, 28)\n", " self.num_classes = 10\n", "\n", " def prepare_data(self):\n", " # download\n", " MNIST(self.data_dir, train=True, download=True)\n", " MNIST(self.data_dir, train=False, download=True)\n", "\n", " def setup(self, stage=None):\n", "\n", " # Assign train/val datasets for use in dataloaders\n", " if stage == \"fit\" or stage is None:\n", " mnist_full = MNIST(self.data_dir, train=True, 
transform=self.transform)\n", " self.mnist_train, self.mnist_val = random_split(mnist_full, [55000, 5000])\n", "\n", " # Assign test dataset for use in dataloader(s)\n", " if stage == \"test\" or stage is None:\n", " self.mnist_test = MNIST(self.data_dir, train=False, transform=self.transform)\n", "\n", " def train_dataloader(self):\n", " return DataLoader(self.mnist_train, batch_size=BATCH_SIZE)\n", "\n", " def val_dataloader(self):\n", " return DataLoader(self.mnist_val, batch_size=BATCH_SIZE)\n", "\n", " def test_dataloader(self):\n", " return DataLoader(self.mnist_test, batch_size=BATCH_SIZE)"]}, {"cell_type": "markdown", "id": "fa53ebb7", "metadata": {"lines_to_next_cell": 2}, "source": ["### Defining the `LitModel`\n", "\n", "Below, we define the model `LitMNIST`."]}, {"cell_type": "code", "execution_count": null, "id": "a5f891e3", "metadata": {}, "outputs": [], "source": ["class LitModel(LightningModule):\n", " def __init__(self, channels, width, height, num_classes, hidden_size=64, learning_rate=2e-4):\n", "\n", " super().__init__()\n", "\n", " self.save_hyperparameters()\n", "\n", " self.model = nn.Sequential(\n", " nn.Flatten(),\n", " nn.Linear(channels * width * height, hidden_size),\n", " nn.ReLU(),\n", " nn.Dropout(0.1),\n", " nn.Linear(hidden_size, hidden_size),\n", " nn.ReLU(),\n", " nn.Dropout(0.1),\n", " nn.Linear(hidden_size, num_classes),\n", " )\n", "\n", " def forward(self, x):\n", " x = self.model(x)\n", " return F.log_softmax(x, dim=1)\n", "\n", " def training_step(self, batch, batch_idx):\n", " x, y = batch\n", " logits = self(x)\n", " loss = F.nll_loss(logits, y)\n", " self.log(\"train_loss\", loss)\n", " return loss\n", "\n", " def validation_step(self, batch, batch_idx):\n", " x, y = batch\n", " logits = self(x)\n", " loss = F.nll_loss(logits, y)\n", " preds = torch.argmax(logits, dim=1)\n", " acc = accuracy(preds, y)\n", " self.log(\"val_loss\", loss, prog_bar=True)\n", " self.log(\"val_acc\", acc, prog_bar=True)\n", " return loss\n", 
"\n", " def configure_optimizers(self):\n", " optimizer = torch.optim.Adam(self.parameters(), lr=self.hparams.learning_rate)\n", " return optimizer"]}, {"cell_type": "markdown", "id": "1009ada4", "metadata": {}, "source": ["### TPU Training\n", "\n", "Lightning supports training on a single TPU core or 8 TPU cores.\n", "\n", "The Trainer parameters `tpu_cores` defines how many TPU cores to train on (1 or 8) / Single TPU core to train on [1].\n", "\n", "For Single TPU training, Just pass the TPU core ID [1-8] in a list.\n", "Setting `tpu_cores=[5]` will train on TPU core ID 5."]}, {"cell_type": "markdown", "id": "55c40381", "metadata": {}, "source": ["Train on TPU core ID 5 with `tpu_cores=[5]`."]}, {"cell_type": "code", "execution_count": null, "id": "0eb329b1", "metadata": {}, "outputs": [], "source": ["# Init DataModule\n", "dm = MNISTDataModule()\n", "# Init model from datamodule's attributes\n", "model = LitModel(*dm.size(), dm.num_classes)\n", "# Init trainer\n", "trainer = Trainer(max_epochs=3, progress_bar_refresh_rate=20, tpu_cores=[5])\n", "# Train\n", "trainer.fit(model, dm)"]}, {"cell_type": "markdown", "id": "e4b81515", "metadata": {}, "source": ["Train on single TPU core with `tpu_cores=1`."]}, {"cell_type": "code", "execution_count": null, "id": "83272dbd", "metadata": {}, "outputs": [], "source": ["# Init DataModule\n", "dm = MNISTDataModule()\n", "# Init model from datamodule's attributes\n", "model = LitModel(*dm.size(), dm.num_classes)\n", "# Init trainer\n", "trainer = Trainer(max_epochs=3, progress_bar_refresh_rate=20, tpu_cores=1)\n", "# Train\n", "trainer.fit(model, dm)"]}, {"cell_type": "markdown", "id": "3d2ce0a8", "metadata": {}, "source": ["Train on 8 TPU cores with `tpu_cores=8`.\n", "You might have to restart the notebook to run it on 8 TPU cores after training on single TPU core."]}, {"cell_type": "code", "execution_count": null, "id": "4d07c972", "metadata": {}, "outputs": [], "source": ["# Init DataModule\n", "dm = 
MNISTDataModule()\n", "# Init model from datamodule's attributes\n", "model = LitModel(*dm.size(), dm.num_classes)\n", "# Init trainer\n", "trainer = Trainer(max_epochs=3, progress_bar_refresh_rate=20, tpu_cores=8)\n", "# Train\n", "trainer.fit(model, dm)"]}, {"cell_type": "markdown", "id": "6ebe791c", "metadata": {}, "source": ["## Congratulations - Time to Join the Community!\n", "\n", "Congratulations on completing this notebook tutorial! If you enjoyed this and would like to join the Lightning\n", "movement, you can do so in the following ways!\n", "\n", "### Star [Lightning](https://github.com/PyTorchLightning/pytorch-lightning) on GitHub\n", "The easiest way to help our community is just by starring the GitHub repos! This helps raise awareness of the cool\n", "tools we're building.\n", "\n", "### Join our [Slack](https://join.slack.com/t/pytorch-lightning/shared_invite/zt-pw5v393p-qRaDgEk24~EjiZNBpSQFgQ)!\n", "The best way to keep up to date on the latest advancements is to join our community! Make sure to introduce yourself\n", "and share your interests in `#general` channel\n", "\n", "\n", "### Contributions !\n", "The best way to contribute to our community is to become a code contributor! 
At any time you can go to\n", "[Lightning](https://github.com/PyTorchLightning/pytorch-lightning) or [Bolt](https://github.com/PyTorchLightning/lightning-bolts)\n", "GitHub Issues page and filter for \"good first issue\".\n", "\n", "* [Lightning good first issue](https://github.com/PyTorchLightning/pytorch-lightning/issues?q=is%3Aopen+is%3Aissue+label%3A%22good+first+issue%22)\n", "* [Bolt good first issue](https://github.com/PyTorchLightning/lightning-bolts/issues?q=is%3Aopen+is%3Aissue+label%3A%22good+first+issue%22)\n", "* You can also contribute your own notebooks with useful examples !\n", "\n", "### Great thanks from the entire Pytorch Lightning Team for your interest !\n", "\n", "[![Pytorch Lightning](){height=\"60px\" width=\"240px\"}](https://pytorchlightning.ai)"]}, {"cell_type": "raw", "metadata": {"raw_mimetype": "text/restructuredtext"}, "source": [".. customcarditem::\n", " :header: TPU training with PyTorch Lightning\n", " :card_description: In this notebook, we'll train a model on TPUs. Updating one Trainer flag is all you need for that. 
The most up to documentation related to TPU training can be found...\n", " :tags: Image,GPU/TPU,Lightning-Examples"]}], "metadata": {"jupytext": {"cell_metadata_filter": "colab_type,colab,id,-all", "formats": "ipynb,py:percent", "main_language": "python"}}, "nbformat": 4, "nbformat_minor": 5} \ No newline at end of file diff --git a/source/notebooks/lightning_examples/reinforce-learning-DQN.ipynb b/source/notebooks/lightning_examples/reinforce-learning-DQN.ipynb deleted file mode 100644 index c69b474..0000000 --- a/source/notebooks/lightning_examples/reinforce-learning-DQN.ipynb +++ /dev/null @@ -1 +0,0 @@ -{"cells": [{"cell_type": "markdown", "id": "4efbbac7", "metadata": {"papermill": {"duration": 0.032188, "end_time": "2021-12-04T16:49:24.620327", "exception": false, "start_time": "2021-12-04T16:49:24.588139", "status": "completed"}, "tags": []}, "source": ["\n", "# How to train a Deep Q Network\n", "\n", "* **Author:** PL team\n", "* **License:** CC BY-SA\n", "* **Generated:** 2021-12-04T16:53:09.587502\n", "\n", "Main takeaways:\n", "\n", "1. RL has the same flow as previous models we have seen, with a few additions\n", "2. Handle unsupervised learning by using an IterableDataset where the dataset itself is constantly updated during training\n", "3. 
Each training step carries has the agent taking an action in the environment and storing the experience in the IterableDataset\n", "\n", "\n", "---\n", "Open in [![Open In Colab](){height=\"20px\" width=\"117px\"}](https://colab.research.google.com/github/PytorchLightning/lightning-tutorials/blob/publication/.notebooks/lightning_examples/reinforce-learning-DQN.ipynb)\n", "\n", "Give us a \u2b50 [on Github](https://www.github.com/PytorchLightning/pytorch-lightning/)\n", "| Check out [the documentation](https://pytorch-lightning.readthedocs.io/en/latest/)\n", "| Join us [on Slack](https://join.slack.com/t/pytorch-lightning/shared_invite/zt-pw5v393p-qRaDgEk24~EjiZNBpSQFgQ)"]}, {"cell_type": "markdown", "id": "efc6c370", "metadata": {"papermill": {"duration": 0.02782, "end_time": "2021-12-04T16:49:24.679755", "exception": false, "start_time": "2021-12-04T16:49:24.651935", "status": "completed"}, "tags": []}, "source": ["## Setup\n", "This notebook requires some packages besides pytorch-lightning."]}, {"cell_type": "code", "execution_count": 1, "id": "5894fd9f", "metadata": {"colab": {}, "colab_type": "code", "execution": {"iopub.execute_input": "2021-12-04T16:49:24.744158Z", "iopub.status.busy": "2021-12-04T16:49:24.743680Z", "iopub.status.idle": "2021-12-04T16:49:27.687873Z", "shell.execute_reply": "2021-12-04T16:49:27.687317Z"}, "id": "LfrJLKPFyhsK", "lines_to_next_cell": 0, "papermill": {"duration": 2.979438, "end_time": "2021-12-04T16:49:27.688021", "exception": false, "start_time": "2021-12-04T16:49:24.708583", "status": "completed"}, "tags": []}, "outputs": [], "source": ["! 
pip install --quiet \"torch>=1.6, <1.9\" \"pytorch-lightning>=1.3\" \"gym\" \"torchmetrics>=0.3\""]}, {"cell_type": "code", "execution_count": 2, "id": "ad4092f4", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:49:27.750875Z", "iopub.status.busy": "2021-12-04T16:49:27.750375Z", "iopub.status.idle": "2021-12-04T16:49:31.622878Z", "shell.execute_reply": "2021-12-04T16:49:31.623262Z"}, "papermill": {"duration": 3.906565, "end_time": "2021-12-04T16:49:31.623443", "exception": false, "start_time": "2021-12-04T16:49:27.716878", "status": "completed"}, "tags": []}, "outputs": [], "source": ["import os\n", "from collections import OrderedDict, deque, namedtuple\n", "from typing import List, Tuple\n", "\n", "import gym\n", "import numpy as np\n", "import torch\n", "from pytorch_lightning import LightningModule, Trainer\n", "from pytorch_lightning.utilities import DistributedType\n", "from torch import Tensor, nn\n", "from torch.optim import Adam, Optimizer\n", "from torch.utils.data import DataLoader\n", "from torch.utils.data.dataset import IterableDataset\n", "\n", "PATH_DATASETS = os.environ.get(\"PATH_DATASETS\", \".\")\n", "AVAIL_GPUS = min(1, torch.cuda.device_count())"]}, {"cell_type": "code", "execution_count": 3, "id": "4bd3cb4e", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:49:31.685019Z", "iopub.status.busy": "2021-12-04T16:49:31.684540Z", "iopub.status.idle": "2021-12-04T16:49:31.686662Z", "shell.execute_reply": "2021-12-04T16:49:31.686183Z"}, "papermill": {"duration": 0.035013, "end_time": "2021-12-04T16:49:31.686760", "exception": false, "start_time": "2021-12-04T16:49:31.651747", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class DQN(nn.Module):\n", " \"\"\"Simple MLP network.\"\"\"\n", "\n", " def __init__(self, obs_size: int, n_actions: int, hidden_size: int = 128):\n", " \"\"\"\n", " Args:\n", " obs_size: observation/state size of the environment\n", " n_actions: number of discrete actions available 
in the environment\n", " hidden_size: size of hidden layers\n", " \"\"\"\n", " super().__init__()\n", " self.net = nn.Sequential(\n", " nn.Linear(obs_size, hidden_size),\n", " nn.ReLU(),\n", " nn.Linear(hidden_size, n_actions),\n", " )\n", "\n", " def forward(self, x):\n", " return self.net(x.float())"]}, {"cell_type": "markdown", "id": "012cc8f7", "metadata": {"papermill": {"duration": 0.032792, "end_time": "2021-12-04T16:49:31.746872", "exception": false, "start_time": "2021-12-04T16:49:31.714080", "status": "completed"}, "tags": []}, "source": ["### Memory"]}, {"cell_type": "code", "execution_count": 4, "id": "77510037", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:49:31.806464Z", "iopub.status.busy": "2021-12-04T16:49:31.805941Z", "iopub.status.idle": "2021-12-04T16:49:31.808050Z", "shell.execute_reply": "2021-12-04T16:49:31.807649Z"}, "papermill": {"duration": 0.033474, "end_time": "2021-12-04T16:49:31.808151", "exception": false, "start_time": "2021-12-04T16:49:31.774677", "status": "completed"}, "tags": []}, "outputs": [], "source": ["\n", "# Named tuple for storing experience steps gathered in training\n", "Experience = namedtuple(\n", " \"Experience\",\n", " field_names=[\"state\", \"action\", \"reward\", \"done\", \"new_state\"],\n", ")"]}, {"cell_type": "code", "execution_count": 5, "id": "8ae0c219", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:49:31.869846Z", "iopub.status.busy": "2021-12-04T16:49:31.869370Z", "iopub.status.idle": "2021-12-04T16:49:31.871439Z", "shell.execute_reply": "2021-12-04T16:49:31.870977Z"}, "papermill": {"duration": 0.035508, "end_time": "2021-12-04T16:49:31.871534", "exception": false, "start_time": "2021-12-04T16:49:31.836026", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class ReplayBuffer:\n", " \"\"\"Replay Buffer for storing past experiences allowing the agent to learn from them.\n", "\n", " Args:\n", " capacity: size of the buffer\n", " \"\"\"\n", "\n", " def 
__init__(self, capacity: int) -> None:\n", " self.buffer = deque(maxlen=capacity)\n", "\n", " def __len__(self) -> None:\n", " return len(self.buffer)\n", "\n", " def append(self, experience: Experience) -> None:\n", " \"\"\"Add experience to the buffer.\n", "\n", " Args:\n", " experience: tuple (state, action, reward, done, new_state)\n", " \"\"\"\n", " self.buffer.append(experience)\n", "\n", " def sample(self, batch_size: int) -> Tuple:\n", " indices = np.random.choice(len(self.buffer), batch_size, replace=False)\n", " states, actions, rewards, dones, next_states = zip(*(self.buffer[idx] for idx in indices))\n", "\n", " return (\n", " np.array(states),\n", " np.array(actions),\n", " np.array(rewards, dtype=np.float32),\n", " np.array(dones, dtype=np.bool),\n", " np.array(next_states),\n", " )"]}, {"cell_type": "code", "execution_count": 6, "id": "d1052c84", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:49:31.931299Z", "iopub.status.busy": "2021-12-04T16:49:31.930829Z", "iopub.status.idle": "2021-12-04T16:49:31.932898Z", "shell.execute_reply": "2021-12-04T16:49:31.932435Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 0.033795, "end_time": "2021-12-04T16:49:31.932991", "exception": false, "start_time": "2021-12-04T16:49:31.899196", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class RLDataset(IterableDataset):\n", " \"\"\"Iterable Dataset containing the ExperienceBuffer which will be updated with new experiences during training.\n", "\n", " Args:\n", " buffer: replay buffer\n", " sample_size: number of experiences to sample at a time\n", " \"\"\"\n", "\n", " def __init__(self, buffer: ReplayBuffer, sample_size: int = 200) -> None:\n", " self.buffer = buffer\n", " self.sample_size = sample_size\n", "\n", " def __iter__(self) -> Tuple:\n", " states, actions, rewards, dones, new_states = self.buffer.sample(self.sample_size)\n", " for i in range(len(dones)):\n", " yield states[i], actions[i], rewards[i], dones[i], 
new_states[i]"]}, {"cell_type": "markdown", "id": "fbe4a973", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.027797, "end_time": "2021-12-04T16:49:31.988622", "exception": false, "start_time": "2021-12-04T16:49:31.960825", "status": "completed"}, "tags": []}, "source": ["### Agent"]}, {"cell_type": "code", "execution_count": 7, "id": "42dd9534", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:49:32.054816Z", "iopub.status.busy": "2021-12-04T16:49:32.054310Z", "iopub.status.idle": "2021-12-04T16:49:32.056372Z", "shell.execute_reply": "2021-12-04T16:49:32.055906Z"}, "lines_to_next_cell": 2, "papermill": {"duration": 0.039725, "end_time": "2021-12-04T16:49:32.056473", "exception": false, "start_time": "2021-12-04T16:49:32.016748", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class Agent:\n", " \"\"\"Base Agent class handeling the interaction with the environment.\"\"\"\n", "\n", " def __init__(self, env: gym.Env, replay_buffer: ReplayBuffer) -> None:\n", " \"\"\"\n", " Args:\n", " env: training environment\n", " replay_buffer: replay buffer storing experiences\n", " \"\"\"\n", " self.env = env\n", " self.replay_buffer = replay_buffer\n", " self.reset()\n", " self.state = self.env.reset()\n", "\n", " def reset(self) -> None:\n", " \"\"\"Resents the environment and updates the state.\"\"\"\n", " self.state = self.env.reset()\n", "\n", " def get_action(self, net: nn.Module, epsilon: float, device: str) -> int:\n", " \"\"\"Using the given network, decide what action to carry out using an epsilon-greedy policy.\n", "\n", " Args:\n", " net: DQN network\n", " epsilon: value to determine likelihood of taking a random action\n", " device: current device\n", "\n", " Returns:\n", " action\n", " \"\"\"\n", " if np.random.random() < epsilon:\n", " action = self.env.action_space.sample()\n", " else:\n", " state = torch.tensor([self.state])\n", "\n", " if device not in [\"cpu\"]:\n", " state = state.cuda(device)\n", "\n", " 
q_values = net(state)\n", " _, action = torch.max(q_values, dim=1)\n", " action = int(action.item())\n", "\n", " return action\n", "\n", " @torch.no_grad()\n", " def play_step(\n", " self,\n", " net: nn.Module,\n", " epsilon: float = 0.0,\n", " device: str = \"cpu\",\n", " ) -> Tuple[float, bool]:\n", " \"\"\"Carries out a single interaction step between the agent and the environment.\n", "\n", " Args:\n", " net: DQN network\n", " epsilon: value to determine likelihood of taking a random action\n", " device: current device\n", "\n", " Returns:\n", " reward, done\n", " \"\"\"\n", "\n", " action = self.get_action(net, epsilon, device)\n", "\n", " # do step in the environment\n", " new_state, reward, done, _ = self.env.step(action)\n", "\n", " exp = Experience(self.state, action, reward, done, new_state)\n", "\n", " self.replay_buffer.append(exp)\n", "\n", " self.state = new_state\n", " if done:\n", " self.reset()\n", " return reward, done"]}, {"cell_type": "markdown", "id": "17cb3c7e", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.03211, "end_time": "2021-12-04T16:49:32.116593", "exception": false, "start_time": "2021-12-04T16:49:32.084483", "status": "completed"}, "tags": []}, "source": ["### DQN Lightning Module"]}, {"cell_type": "code", "execution_count": 8, "id": "ed5b8877", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:49:32.185758Z", "iopub.status.busy": "2021-12-04T16:49:32.175032Z", "iopub.status.idle": "2021-12-04T16:49:32.190998Z", "shell.execute_reply": "2021-12-04T16:49:32.190598Z"}, "papermill": {"duration": 0.045916, "end_time": "2021-12-04T16:49:32.191102", "exception": false, "start_time": "2021-12-04T16:49:32.145186", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class DQNLightning(LightningModule):\n", " \"\"\"Basic DQN Model.\"\"\"\n", "\n", " def __init__(\n", " self,\n", " batch_size: int = 16,\n", " lr: float = 1e-2,\n", " env: str = \"CartPole-v0\",\n", " gamma: float = 0.99,\n", " 
sync_rate: int = 10,\n", " replay_size: int = 1000,\n", " warm_start_size: int = 1000,\n", " eps_last_frame: int = 1000,\n", " eps_start: float = 1.0,\n", " eps_end: float = 0.01,\n", " episode_length: int = 200,\n", " warm_start_steps: int = 1000,\n", " ) -> None:\n", " \"\"\"\n", " Args:\n", " batch_size: size of the batches\")\n", " lr: learning rate\n", " env: gym environment tag\n", " gamma: discount factor\n", " sync_rate: how many frames do we update the target network\n", " replay_size: capacity of the replay buffer\n", " warm_start_size: how many samples do we use to fill our buffer at the start of training\n", " eps_last_frame: what frame should epsilon stop decaying\n", " eps_start: starting value of epsilon\n", " eps_end: final value of epsilon\n", " episode_length: max length of an episode\n", " warm_start_steps: max episode reward in the environment\n", " \"\"\"\n", " super().__init__()\n", " self.save_hyperparameters()\n", "\n", " self.env = gym.make(self.hparams.env)\n", " obs_size = self.env.observation_space.shape[0]\n", " n_actions = self.env.action_space.n\n", "\n", " self.net = DQN(obs_size, n_actions)\n", " self.target_net = DQN(obs_size, n_actions)\n", "\n", " self.buffer = ReplayBuffer(self.hparams.replay_size)\n", " self.agent = Agent(self.env, self.buffer)\n", " self.total_reward = 0\n", " self.episode_reward = 0\n", " self.populate(self.hparams.warm_start_steps)\n", "\n", " def populate(self, steps: int = 1000) -> None:\n", " \"\"\"Carries out several random steps through the environment to initially fill up the replay buffer with\n", " experiences.\n", "\n", " Args:\n", " steps: number of random steps to populate the buffer with\n", " \"\"\"\n", " for i in range(steps):\n", " self.agent.play_step(self.net, epsilon=1.0)\n", "\n", " def forward(self, x: Tensor) -> Tensor:\n", " \"\"\"Passes in a state x through the network and gets the q_values of each action as an output.\n", "\n", " Args:\n", " x: environment state\n", "\n", " 
Returns:\n", " q values\n", " \"\"\"\n", " output = self.net(x)\n", " return output\n", "\n", " def dqn_mse_loss(self, batch: Tuple[Tensor, Tensor]) -> Tensor:\n", " \"\"\"Calculates the mse loss using a mini batch from the replay buffer.\n", "\n", " Args:\n", " batch: current mini batch of replay data\n", "\n", " Returns:\n", " loss\n", " \"\"\"\n", " states, actions, rewards, dones, next_states = batch\n", "\n", " state_action_values = self.net(states).gather(1, actions.unsqueeze(-1)).squeeze(-1)\n", "\n", " with torch.no_grad():\n", " next_state_values = self.target_net(next_states).max(1)[0]\n", " next_state_values[dones] = 0.0\n", " next_state_values = next_state_values.detach()\n", "\n", " expected_state_action_values = next_state_values * self.hparams.gamma + rewards\n", "\n", " return nn.MSELoss()(state_action_values, expected_state_action_values)\n", "\n", " def training_step(self, batch: Tuple[Tensor, Tensor], nb_batch) -> OrderedDict:\n", " \"\"\"Carries out a single step through the environment to update the replay buffer. 
Then calculates loss\n", " based on the minibatch recieved.\n", "\n", " Args:\n", " batch: current mini batch of replay data\n", " nb_batch: batch number\n", "\n", " Returns:\n", " Training loss and log metrics\n", " \"\"\"\n", " device = self.get_device(batch)\n", " epsilon = max(\n", " self.hparams.eps_end,\n", " self.hparams.eps_start - self.global_step + 1 / self.hparams.eps_last_frame,\n", " )\n", "\n", " # step through environment with agent\n", " reward, done = self.agent.play_step(self.net, epsilon, device)\n", " self.episode_reward += reward\n", "\n", " # calculates training loss\n", " loss = self.dqn_mse_loss(batch)\n", "\n", " if self.trainer._distrib_type in {DistributedType.DP, DistributedType.DDP2}:\n", " loss = loss.unsqueeze(0)\n", "\n", " if done:\n", " self.total_reward = self.episode_reward\n", " self.episode_reward = 0\n", "\n", " # Soft update of target network\n", " if self.global_step % self.hparams.sync_rate == 0:\n", " self.target_net.load_state_dict(self.net.state_dict())\n", "\n", " log = {\n", " \"total_reward\": torch.tensor(self.total_reward).to(device),\n", " \"reward\": torch.tensor(reward).to(device),\n", " \"train_loss\": loss,\n", " }\n", " status = {\n", " \"steps\": torch.tensor(self.global_step).to(device),\n", " \"total_reward\": torch.tensor(self.total_reward).to(device),\n", " }\n", "\n", " return OrderedDict({\"loss\": loss, \"log\": log, \"progress_bar\": status})\n", "\n", " def configure_optimizers(self) -> List[Optimizer]:\n", " \"\"\"Initialize Adam optimizer.\"\"\"\n", " optimizer = Adam(self.net.parameters(), lr=self.hparams.lr)\n", " return [optimizer]\n", "\n", " def __dataloader(self) -> DataLoader:\n", " \"\"\"Initialize the Replay Buffer dataset used for retrieving experiences.\"\"\"\n", " dataset = RLDataset(self.buffer, self.hparams.episode_length)\n", " dataloader = DataLoader(\n", " dataset=dataset,\n", " batch_size=self.hparams.batch_size,\n", " )\n", " return dataloader\n", "\n", " def 
train_dataloader(self) -> DataLoader:\n", " \"\"\"Get train loader.\"\"\"\n", " return self.__dataloader()\n", "\n", " def get_device(self, batch) -> str:\n", " \"\"\"Retrieve device currently being used by minibatch.\"\"\"\n", " return batch[0].device.index if self.on_gpu else \"cpu\""]}, {"cell_type": "markdown", "id": "6068b50b", "metadata": {"papermill": {"duration": 0.029024, "end_time": "2021-12-04T16:49:32.248526", "exception": false, "start_time": "2021-12-04T16:49:32.219502", "status": "completed"}, "tags": []}, "source": ["### Trainer"]}, {"cell_type": "code", "execution_count": 9, "id": "223c17c5", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:49:32.308551Z", "iopub.status.busy": "2021-12-04T16:49:32.308085Z", "iopub.status.idle": "2021-12-04T16:49:48.709258Z", "shell.execute_reply": "2021-12-04T16:49:48.709649Z"}, "papermill": {"duration": 16.433171, "end_time": "2021-12-04T16:49:48.709816", "exception": false, "start_time": "2021-12-04T16:49:32.276645", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["GPU available: True, used: True\n"]}, {"name": "stderr", "output_type": "stream", "text": ["TPU available: False, using: 0 TPU cores\n"]}, {"name": "stderr", "output_type": "stream", "text": ["IPU available: False, using: 0 IPUs\n"]}, {"name": "stderr", "output_type": "stream", "text": ["LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n"]}, {"name": "stderr", "output_type": "stream", "text": ["\n", " | Name | Type | Params\n", "------------------------------------\n", "0 | net | DQN | 898 \n", "1 | target_net | DQN | 898 \n", "------------------------------------\n", "1.8 K Trainable params\n", "0 Non-trainable params\n", "1.8 K Total params\n", "0.007 Total estimated model params size (MB)\n"]}, {"name": "stderr", "output_type": "stream", "text": ["/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/pytorch_lightning/trainer/data_loading.py:111: UserWarning: The dataloader, 
train_dataloader, does not have many workers which may be a bottleneck. Consider increasing the value of the `num_workers` argument` (try 12 which is the number of cpus on this machine) in the `DataLoader` init to improve performance.\n", " rank_zero_warn(\n"]}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "7809a9f0b92743a3bdfcc9d4e6096fec", "version_major": 2, "version_minor": 0}, "text/plain": ["Training: 0it [00:00, ?it/s]"]}, "metadata": {}, "output_type": "display_data"}, {"name": "stderr", "output_type": "stream", "text": ["/tmp/ipykernel_6545/3638216480.py:30: DeprecationWarning: `np.bool` is a deprecated alias for the builtin `bool`. To silence this warning, use `bool` by itself. Doing this will not modify any behavior and is safe. If you specifically wanted the numpy scalar type, use `np.bool_` here.\n", "Deprecated in NumPy 1.20; for more details and guidance: https://numpy.org/devdocs/release/1.20.0-notes.html#deprecations\n", " np.array(dones, dtype=np.bool),\n", "/home/AzDevOps_azpcontainer/.local/lib/python3.9/site-packages/pytorch_lightning/loops/optimization/closure.py:35: LightningDeprecationWarning: One of the returned values {'progress_bar', 'log'} has a `grad_fn`. We will detach it automatically but this behaviour will change in v1.6. 
Please detach it manually: `return {'loss': ..., 'something': something.detach()}`\n", " rank_zero_deprecation(\n"]}], "source": ["\n", "model = DQNLightning()\n", "\n", "trainer = Trainer(\n", " gpus=AVAIL_GPUS,\n", " max_epochs=200,\n", " val_check_interval=100,\n", ")\n", "\n", "trainer.fit(model)"]}, {"cell_type": "code", "execution_count": 10, "id": "b0dc7a72", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:49:48.784401Z", "iopub.status.busy": "2021-12-04T16:49:48.783938Z", "iopub.status.idle": "2021-12-04T16:49:50.361154Z", "shell.execute_reply": "2021-12-04T16:49:50.361542Z"}, "papermill": {"duration": 1.615711, "end_time": "2021-12-04T16:49:50.361705", "exception": false, "start_time": "2021-12-04T16:49:48.745994", "status": "completed"}, "tags": []}, "outputs": [{"data": {"text/html": ["\n", " \n", " \n", " "], "text/plain": [""]}, "metadata": {}, "output_type": "display_data"}], "source": ["# Start tensorboard.\n", "%load_ext tensorboard\n", "%tensorboard --logdir lightning_logs/"]}, {"cell_type": "markdown", "id": "46d9a7e6", "metadata": {"papermill": {"duration": 0.037856, "end_time": "2021-12-04T16:49:50.435994", "exception": false, "start_time": "2021-12-04T16:49:50.398138", "status": "completed"}, "tags": []}, "source": ["## Congratulations - Time to Join the Community!\n", "\n", "Congratulations on completing this notebook tutorial! If you enjoyed this and would like to join the Lightning\n", "movement, you can do so in the following ways!\n", "\n", "### Star [Lightning](https://github.com/PyTorchLightning/pytorch-lightning) on GitHub\n", "The easiest way to help our community is just by starring the GitHub repos! This helps raise awareness of the cool\n", "tools we're building.\n", "\n", "### Join our [Slack](https://join.slack.com/t/pytorch-lightning/shared_invite/zt-pw5v393p-qRaDgEk24~EjiZNBpSQFgQ)!\n", "The best way to keep up to date on the latest advancements is to join our community! 
Make sure to introduce yourself\n", "and share your interests in `#general` channel\n", "\n", "\n", "### Contributions !\n", "The best way to contribute to our community is to become a code contributor! At any time you can go to\n", "[Lightning](https://github.com/PyTorchLightning/pytorch-lightning) or [Bolt](https://github.com/PyTorchLightning/lightning-bolts)\n", "GitHub Issues page and filter for \"good first issue\".\n", "\n", "* [Lightning good first issue](https://github.com/PyTorchLightning/pytorch-lightning/issues?q=is%3Aopen+is%3Aissue+label%3A%22good+first+issue%22)\n", "* [Bolt good first issue](https://github.com/PyTorchLightning/lightning-bolts/issues?q=is%3Aopen+is%3Aissue+label%3A%22good+first+issue%22)\n", "* You can also contribute your own notebooks with useful examples !\n", "\n", "### Great thanks from the entire Pytorch Lightning Team for your interest !\n", "\n", "[![Pytorch Lightning](){height=\"60px\" width=\"240px\"}](https://pytorchlightning.ai)"]}, {"cell_type": "raw", "metadata": {"raw_mimetype": "text/restructuredtext"}, "source": [".. customcarditem::\n", " :header: How to train a Deep Q Network\n", " :card_description: Main takeaways: 1. RL has the same flow as previous models we have seen, with a few additions 2. 
Handle unsupervised learning by using an IterableDataset where the dataset...\n", " :tags: RL,GPU/TPU,Lightning-Examples"]}], "metadata": {"jupytext": {"cell_metadata_filter": "id,colab_type,colab,-all", "formats": "ipynb,py:percent", "main_language": "python"}, "language_info": {"codemirror_mode": {"name": "ipython", "version": 3}, "file_extension": ".py", "mimetype": "text/x-python", "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.9.7"}, "papermill": {"default_parameters": {}, "duration": 29.486464, "end_time": "2021-12-04T16:49:52.782807", "environment_variables": {}, "exception": null, "input_path": "lightning_examples/reinforce-learning-DQN/dqn.ipynb", "output_path": ".notebooks/lightning_examples/reinforce-learning-DQN.ipynb", "parameters": {}, "start_time": "2021-12-04T16:49:23.296343", "version": "2.3.3"}, "widgets": {"application/vnd.jupyter.widget-state+json": {"state": {"0885ff08e5e847eebdcfdc546cf79123": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "142276d4fabb4037a6c15952c792292b": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": "2", "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, 
"grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "1f8780cfa7d5451fbfa8deb76ebec06a": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_c47ec2cbd7bc4b288dae843a48dca3c7", "placeholder": "\u200b", "style": "IPY_MODEL_0885ff08e5e847eebdcfdc546cf79123", "value": "Epoch 199: "}}, "36eace64700644bb8e54ccc45212596c": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": ""}}, "5bdaf8d89f2f4abd9c821c3f7eac63d7": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, 
"align_self": null, "border": null, "bottom": null, "display": "inline-flex", "flex": null, "flex_flow": "row wrap", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "100%"}}, "7809a9f0b92743a3bdfcc9d4e6096fec": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": ["IPY_MODEL_1f8780cfa7d5451fbfa8deb76ebec06a", "IPY_MODEL_94af77267feb429a90ec99375045262e", "IPY_MODEL_d1478e69106c4687a0b853cbc557271e"], "layout": "IPY_MODEL_5bdaf8d89f2f4abd9c821c3f7eac63d7"}}, "94af77267feb429a90ec99375045262e": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_142276d4fabb4037a6c15952c792292b", "max": 1.0, "min": 0.0, "orientation": "horizontal", "style": 
"IPY_MODEL_e0376cde46734387ac89cb86a858bf70", "value": 1.0}}, "9c315c37e7f947e7ba7d32663c2399c2": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "c47ec2cbd7bc4b288dae843a48dca3c7": {"model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": {"_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": 
null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null}}, "d1478e69106c4687a0b853cbc557271e": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": {"_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_9c315c37e7f947e7ba7d32663c2399c2", "placeholder": "\u200b", "style": "IPY_MODEL_36eace64700644bb8e54ccc45212596c", "value": " 13/? [00:00<00:00, 205.93it/s, loss=45.6, v_num=8]"}}, "e0376cde46734387ac89cb86a858bf70": {"model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": {"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": ""}}}, "version_major": 2, "version_minor": 0}}}, "nbformat": 4, "nbformat_minor": 5} \ No newline at end of file diff --git a/source/notebooks/lightning_examples/text-transformers.ipynb b/source/notebooks/lightning_examples/text-transformers.ipynb deleted file mode 100644 index 6dc58ca..0000000 --- a/source/notebooks/lightning_examples/text-transformers.ipynb +++ /dev/null @@ -1 +0,0 @@ -{"cells": [{"cell_type": "markdown", "id": "3c99ec5d", "metadata": {"papermill": {"duration": 0.033967, "end_time": "2021-12-04T16:50:09.385288", "exception": false, 
"start_time": "2021-12-04T16:50:09.351321", "status": "completed"}, "tags": []}, "source": ["\n", "# Finetune Transformers Models with PyTorch Lightning\n", "\n", "* **Author:** PL team\n", "* **License:** CC BY-SA\n", "* **Generated:** 2021-12-04T16:53:11.286202\n", "\n", "This notebook will use HuggingFace's `datasets` library to get data, which will be wrapped in a `LightningDataModule`.\n", "Then, we write a class to perform text classification on any dataset from the [GLUE Benchmark](https://gluebenchmark.com/).\n", "(We just show CoLA and MRPC due to constraint on compute/disk)\n", "\n", "\n", "---\n", "Open in [![Open In Colab](){height=\"20px\" width=\"117px\"}](https://colab.research.google.com/github/PytorchLightning/lightning-tutorials/blob/publication/.notebooks/lightning_examples/text-transformers.ipynb)\n", "\n", "Give us a \u2b50 [on Github](https://www.github.com/PytorchLightning/pytorch-lightning/)\n", "| Check out [the documentation](https://pytorch-lightning.readthedocs.io/en/latest/)\n", "| Join us [on Slack](https://join.slack.com/t/pytorch-lightning/shared_invite/zt-pw5v393p-qRaDgEk24~EjiZNBpSQFgQ)"]}, {"cell_type": "markdown", "id": "0e4d7209", "metadata": {"papermill": {"duration": 0.028692, "end_time": "2021-12-04T16:50:09.445776", "exception": false, "start_time": "2021-12-04T16:50:09.417084", "status": "completed"}, "tags": []}, "source": ["## Setup\n", "This notebook requires some packages besides pytorch-lightning."]}, {"cell_type": "code", "execution_count": 1, "id": "49b84d9c", "metadata": {"colab": {}, "colab_type": "code", "execution": {"iopub.execute_input": "2021-12-04T16:50:09.510470Z", "iopub.status.busy": "2021-12-04T16:50:09.505774Z", "iopub.status.idle": "2021-12-04T16:50:12.925383Z", "shell.execute_reply": "2021-12-04T16:50:12.924802Z"}, "id": "LfrJLKPFyhsK", "lines_to_next_cell": 0, "papermill": {"duration": 3.45077, "end_time": "2021-12-04T16:50:12.925533", "exception": false, "start_time": "2021-12-04T16:50:09.474763", 
"status": "completed"}, "tags": []}, "outputs": [], "source": ["! pip install --quiet \"datasets\" \"pytorch-lightning>=1.3\" \"scipy\" \"transformers\" \"torchmetrics>=0.3\" \"scikit-learn\" \"torchtext>=0.9\" \"torch>=1.6, <1.9\""]}, {"cell_type": "code", "execution_count": 2, "id": "8c24af2f", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:50:12.990546Z", "iopub.status.busy": "2021-12-04T16:50:12.990070Z", "iopub.status.idle": "2021-12-04T16:50:17.320862Z", "shell.execute_reply": "2021-12-04T16:50:17.320412Z"}, "papermill": {"duration": 4.364813, "end_time": "2021-12-04T16:50:17.320999", "exception": false, "start_time": "2021-12-04T16:50:12.956186", "status": "completed"}, "tags": []}, "outputs": [], "source": ["from datetime import datetime\n", "from typing import Optional\n", "\n", "import datasets\n", "import torch\n", "from pytorch_lightning import LightningDataModule, LightningModule, Trainer, seed_everything\n", "from torch.utils.data import DataLoader\n", "from transformers import (\n", " AdamW,\n", " AutoConfig,\n", " AutoModelForSequenceClassification,\n", " AutoTokenizer,\n", " get_linear_schedule_with_warmup,\n", ")\n", "\n", "AVAIL_GPUS = min(1, torch.cuda.device_count())"]}, {"cell_type": "markdown", "id": "2134c12c", "metadata": {"papermill": {"duration": 0.029134, "end_time": "2021-12-04T16:50:17.381739", "exception": false, "start_time": "2021-12-04T16:50:17.352605", "status": "completed"}, "tags": []}, "source": ["## Training BERT with Lightning"]}, {"cell_type": "markdown", "id": "c827ca58", "metadata": {"lines_to_next_cell": 2, "papermill": {"duration": 0.029129, "end_time": "2021-12-04T16:50:17.441085", "exception": false, "start_time": "2021-12-04T16:50:17.411956", "status": "completed"}, "tags": []}, "source": ["### Lightning DataModule for GLUE"]}, {"cell_type": "code", "execution_count": 3, "id": "5a856234", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:50:17.515779Z", "iopub.status.busy": 
"2021-12-04T16:50:17.512843Z", "iopub.status.idle": "2021-12-04T16:50:17.517417Z", "shell.execute_reply": "2021-12-04T16:50:17.517796Z"}, "papermill": {"duration": 0.047785, "end_time": "2021-12-04T16:50:17.517928", "exception": false, "start_time": "2021-12-04T16:50:17.470143", "status": "completed"}, "tags": []}, "outputs": [], "source": ["class GLUEDataModule(LightningDataModule):\n", "\n", " task_text_field_map = {\n", " \"cola\": [\"sentence\"],\n", " \"sst2\": [\"sentence\"],\n", " \"mrpc\": [\"sentence1\", \"sentence2\"],\n", " \"qqp\": [\"question1\", \"question2\"],\n", " \"stsb\": [\"sentence1\", \"sentence2\"],\n", " \"mnli\": [\"premise\", \"hypothesis\"],\n", " \"qnli\": [\"question\", \"sentence\"],\n", " \"rte\": [\"sentence1\", \"sentence2\"],\n", " \"wnli\": [\"sentence1\", \"sentence2\"],\n", " \"ax\": [\"premise\", \"hypothesis\"],\n", " }\n", "\n", " glue_task_num_labels = {\n", " \"cola\": 2,\n", " \"sst2\": 2,\n", " \"mrpc\": 2,\n", " \"qqp\": 2,\n", " \"stsb\": 1,\n", " \"mnli\": 3,\n", " \"qnli\": 2,\n", " \"rte\": 2,\n", " \"wnli\": 2,\n", " \"ax\": 3,\n", " }\n", "\n", " loader_columns = [\n", " \"datasets_idx\",\n", " \"input_ids\",\n", " \"token_type_ids\",\n", " \"attention_mask\",\n", " \"start_positions\",\n", " \"end_positions\",\n", " \"labels\",\n", " ]\n", "\n", " def __init__(\n", " self,\n", " model_name_or_path: str,\n", " task_name: str = \"mrpc\",\n", " max_seq_length: int = 128,\n", " train_batch_size: int = 32,\n", " eval_batch_size: int = 32,\n", " **kwargs,\n", " ):\n", " super().__init__()\n", " self.model_name_or_path = model_name_or_path\n", " self.task_name = task_name\n", " self.max_seq_length = max_seq_length\n", " self.train_batch_size = train_batch_size\n", " self.eval_batch_size = eval_batch_size\n", "\n", " self.text_fields = self.task_text_field_map[task_name]\n", " self.num_labels = self.glue_task_num_labels[task_name]\n", " self.tokenizer = AutoTokenizer.from_pretrained(self.model_name_or_path, 
use_fast=True)\n", "\n", " def setup(self, stage: str):\n", " self.dataset = datasets.load_dataset(\"glue\", self.task_name)\n", "\n", " for split in self.dataset.keys():\n", " self.dataset[split] = self.dataset[split].map(\n", " self.convert_to_features,\n", " batched=True,\n", " remove_columns=[\"label\"],\n", " )\n", " self.columns = [c for c in self.dataset[split].column_names if c in self.loader_columns]\n", " self.dataset[split].set_format(type=\"torch\", columns=self.columns)\n", "\n", " self.eval_splits = [x for x in self.dataset.keys() if \"validation\" in x]\n", "\n", " def prepare_data(self):\n", " datasets.load_dataset(\"glue\", self.task_name)\n", " AutoTokenizer.from_pretrained(self.model_name_or_path, use_fast=True)\n", "\n", " def train_dataloader(self):\n", " return DataLoader(self.dataset[\"train\"], batch_size=self.train_batch_size)\n", "\n", " def val_dataloader(self):\n", " if len(self.eval_splits) == 1:\n", " return DataLoader(self.dataset[\"validation\"], batch_size=self.eval_batch_size)\n", " elif len(self.eval_splits) > 1:\n", " return [DataLoader(self.dataset[x], batch_size=self.eval_batch_size) for x in self.eval_splits]\n", "\n", " def test_dataloader(self):\n", " if len(self.eval_splits) == 1:\n", " return DataLoader(self.dataset[\"test\"], batch_size=self.eval_batch_size)\n", " elif len(self.eval_splits) > 1:\n", " return [DataLoader(self.dataset[x], batch_size=self.eval_batch_size) for x in self.eval_splits]\n", "\n", " def convert_to_features(self, example_batch, indices=None):\n", "\n", " # Either encode single sentence or sentence pairs\n", " if len(self.text_fields) > 1:\n", " texts_or_text_pairs = list(zip(example_batch[self.text_fields[0]], example_batch[self.text_fields[1]]))\n", " else:\n", " texts_or_text_pairs = example_batch[self.text_fields[0]]\n", "\n", " # Tokenize the text/text pairs\n", " features = self.tokenizer.batch_encode_plus(\n", " texts_or_text_pairs, max_length=self.max_seq_length, pad_to_max_length=True, 
truncation=True\n", " )\n", "\n", " # Rename label to labels to make it easier to pass to model forward\n", " features[\"labels\"] = example_batch[\"label\"]\n", "\n", " return features"]}, {"cell_type": "markdown", "id": "532d63d6", "metadata": {"papermill": {"duration": 0.029073, "end_time": "2021-12-04T16:50:17.576485", "exception": false, "start_time": "2021-12-04T16:50:17.547412", "status": "completed"}, "tags": []}, "source": ["**You could use this datamodule with standalone PyTorch if you wanted...**"]}, {"cell_type": "code", "execution_count": 4, "id": "f3f27b26", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:50:17.637888Z", "iopub.status.busy": "2021-12-04T16:50:17.637424Z", "iopub.status.idle": "2021-12-04T16:50:24.396830Z", "shell.execute_reply": "2021-12-04T16:50:24.396334Z"}, "papermill": {"duration": 6.791378, "end_time": "2021-12-04T16:50:24.396956", "exception": false, "start_time": "2021-12-04T16:50:17.605578", "status": "completed"}, "tags": []}, "outputs": [{"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "232400085c33454e97f802179183d1ed", "version_major": 2, "version_minor": 0}, "text/plain": ["Downloading: 0%| | 0.00/28.0 [00:00= 1:\n", " preds = torch.argmax(logits, axis=1)\n", " elif self.hparams.num_labels == 1:\n", " preds = logits.squeeze()\n", "\n", " labels = batch[\"labels\"]\n", "\n", " return {\"loss\": val_loss, \"preds\": preds, \"labels\": labels}\n", "\n", " def validation_epoch_end(self, outputs):\n", " if self.hparams.task_name == \"mnli\":\n", " for i, output in enumerate(outputs):\n", " # matched or mismatched\n", " split = self.hparams.eval_splits[i].split(\"_\")[-1]\n", " preds = torch.cat([x[\"preds\"] for x in output]).detach().cpu().numpy()\n", " labels = torch.cat([x[\"labels\"] for x in output]).detach().cpu().numpy()\n", " loss = torch.stack([x[\"loss\"] for x in output]).mean()\n", " self.log(f\"val_loss_{split}\", loss, prog_bar=True)\n", " split_metrics = {\n", " 
f\"{k}_{split}\": v for k, v in self.metric.compute(predictions=preds, references=labels).items()\n", " }\n", " self.log_dict(split_metrics, prog_bar=True)\n", " return loss\n", "\n", " preds = torch.cat([x[\"preds\"] for x in outputs]).detach().cpu().numpy()\n", " labels = torch.cat([x[\"labels\"] for x in outputs]).detach().cpu().numpy()\n", " loss = torch.stack([x[\"loss\"] for x in outputs]).mean()\n", " self.log(\"val_loss\", loss, prog_bar=True)\n", " self.log_dict(self.metric.compute(predictions=preds, references=labels), prog_bar=True)\n", " return loss\n", "\n", " def setup(self, stage=None) -> None:\n", " if stage != \"fit\":\n", " return\n", " # Get dataloader by calling it - train_dataloader() is called after setup() by default\n", " train_loader = self.trainer.datamodule.train_dataloader()\n", "\n", " # Calculate total steps\n", " tb_size = self.hparams.train_batch_size * max(1, self.trainer.gpus)\n", " ab_size = self.trainer.accumulate_grad_batches * float(self.trainer.max_epochs)\n", " self.total_steps = (len(train_loader.dataset) // tb_size) // ab_size\n", "\n", " def configure_optimizers(self):\n", " \"\"\"Prepare optimizer and schedule (linear warmup and decay)\"\"\"\n", " model = self.model\n", " no_decay = [\"bias\", \"LayerNorm.weight\"]\n", " optimizer_grouped_parameters = [\n", " {\n", " \"params\": [p for n, p in model.named_parameters() if not any(nd in n for nd in no_decay)],\n", " \"weight_decay\": self.hparams.weight_decay,\n", " },\n", " {\n", " \"params\": [p for n, p in model.named_parameters() if any(nd in n for nd in no_decay)],\n", " \"weight_decay\": 0.0,\n", " },\n", " ]\n", " optimizer = AdamW(optimizer_grouped_parameters, lr=self.hparams.learning_rate, eps=self.hparams.adam_epsilon)\n", "\n", " scheduler = get_linear_schedule_with_warmup(\n", " optimizer,\n", " num_warmup_steps=self.hparams.warmup_steps,\n", " num_training_steps=self.total_steps,\n", " )\n", " scheduler = {\"scheduler\": scheduler, \"interval\": \"step\", 
\"frequency\": 1}\n", " return [optimizer], [scheduler]"]}, {"cell_type": "markdown", "id": "be59b890", "metadata": {"papermill": {"duration": 0.055801, "end_time": "2021-12-04T16:50:24.863114", "exception": false, "start_time": "2021-12-04T16:50:24.807313", "status": "completed"}, "tags": []}, "source": ["## Training"]}, {"cell_type": "markdown", "id": "c1a5d61a", "metadata": {"papermill": {"duration": 0.054576, "end_time": "2021-12-04T16:50:24.972560", "exception": false, "start_time": "2021-12-04T16:50:24.917984", "status": "completed"}, "tags": []}, "source": ["### CoLA\n", "\n", "See an interactive view of the\n", "CoLA dataset in [NLP Viewer](https://huggingface.co/nlp/viewer/?dataset=glue&config=cola)"]}, {"cell_type": "code", "execution_count": 6, "id": "774115a0", "metadata": {"execution": {"iopub.execute_input": "2021-12-04T16:50:25.086490Z", "iopub.status.busy": "2021-12-04T16:50:25.086020Z", "iopub.status.idle": "2021-12-04T16:51:46.067948Z", "shell.execute_reply": "2021-12-04T16:51:46.068322Z"}, "papermill": {"duration": 81.04138, "end_time": "2021-12-04T16:51:46.068501", "exception": false, "start_time": "2021-12-04T16:50:25.027121", "status": "completed"}, "tags": []}, "outputs": [{"name": "stderr", "output_type": "stream", "text": ["Global seed set to 42\n"]}, {"data": {"application/vnd.jupyter.widget-view+json": {"model_id": "0071178f4db54b2a9c7a0c792adbfde9", "version_major": 2, "version_minor": 0}, "text/plain": ["Downloading: 0%| | 0.00/684 [00:00` _ 에서 PyTorch를 설치한 뒤, -아래 명령어로 `pip `_ 를 사용하여 설치할 수 있습니다: - -.. code-block:: bash - - pip install pytorch-lightning - --------------- - -*********************** -Conda를 사용하여 설치 -*********************** - -만약 conda를 아직 설치하지 않았다면, `Conda 설치 가이드 `_ 를 참고하세요. -Lightning은 아래 명령어로 `conda `_ 를 사용하여 설치할 수 있습니다: - -.. code-block:: bash - - conda install pytorch-lightning -c conda-forge - -`Conda 가상환경(Environments) `_ 을 사용할 수도 있습니다: - -.. 
code-block:: bash - - conda activate my_env - conda install pytorch-lightning -c conda-forge - --------------- - -************************ -소스 코드로 설치 -************************ - -소스 코드로 최신 버전(nightly)을 설치합니다. 아직 배포되지 않은 버그 수정(bug fix)과 새롭게 출시할 기능들이 -포함되어 있습니다. 미검증·불안정 최신 기능(bleeding edge)이므로, 신중하게 사용하세요. - -.. code-block:: bash - - pip install https://github.com/PyTorchLightning/pytorch-lightning/archive/master.zip - -향후 공개될 개선 버전(patch release)를 소스 코드로부터 설치합니다. 개선 버전은 가장 최근의 주요 버전(major release)에 대한 버그 수정만 -포함되어 있습니다. - -.. code-block:: bash - - pip install https://github.com/PyTorchLightning/pytorch-lightning/archive/refs/heads/release/1.5.x.zip - --------------- - -************************************ -Lightning 커버리지(Coverage) -************************************ - -파이토치 라이트닝(PyTorch Lightning)은 다양한 Python과 PyTorch 버전에서 유지 보수 및 테스트되고 있습니다. - -더 자세한 정보는 `CI Coverage `_ 를 참고하세요. - -다양한 GPU와 TPU, CPU, IPU에서 엄격하게 테스트되었습니다. GPU 테스트는 2개의 NVIDIA P100에서 실행됩니다. TPU 테스트는 Google GKE TPUv2/3에서 -실행됩니다. TPU py3.7은 Colab 및 Kaggle 환경을 지원함을 뜻합니다. IPU 테스트는 MK1 IPU 장비에서 실행됩니다. diff --git a/source/starter/introduction.rst b/source/starter/introduction.rst deleted file mode 100644 index a5e92d2..0000000 --- a/source/starter/introduction.rst +++ /dev/null @@ -1,406 +0,0 @@ -:orphan: - -############################### -Lightning 15분 만에 배워보기 -############################### - -**필요한 배경지식:** 없음 - -**목표:** 이 문서에서는 일반적인 Lightning 워크플로우의 주요한 7단계를 안내합니다. - -PyTorch Lightning(파이토치 라이트닝)은 대규모로 엄청 빠른 성능을 요구하면서 최대한의 유연성을 필요로 하는 -전문적인 AI 연구자들과 머신러닝 엔지니어들을 위한 "배터리가 포함된(batteries included)" 딥러닝 프레임워크입니다. - -.. join_slack:: - :align: left - :margin: 20 - -Lightning(라이트닝)은 반복적으로 사용하는 코드(boilerplate)를 제거하고 확장성(scalability)을 확보하도록 PyTorch 코드를 재구성합니다. - -.. raw:: html - - - -| - -PyTorch 코드를 재구성함으로써, Lightning에서는 이런 것들이 가능해집니다: - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: 완전한 유연성 - :description: 반복되는 코드 없이 PyTorch를 그대로 사용하여 아이디어를 구현합니다. - :col_css: col-md-3 - :image_center: https://pl-bolts-doc-images.s3.us-east-2.amazonaws.com/card_full_control.png - :height: 290 - -.. displayitem:: - :header: 재현성 + 가독성 - :description: 연구용 코드와 엔지니어링 코드를 분리하여 재현성을 갖추고 더 나은 가독성을 제공합니다. - :col_css: col-md-3 - :image_center: https://pl-bolts-doc-images.s3.us-east-2.amazonaws.com/card_no_boilerplate.png - :height: 290 - -.. displayitem:: - :header: 간단한 다중 GPU 학습 - :description: 코드 변경 없이 여러개의 GPU/TPU/HPU 등을 사용합니다. - :col_css: col-md-3 - :image_center: https://pl-bolts-doc-images.s3.us-east-2.amazonaws.com/card_hardware.png - :height: 290 - -.. displayitem:: - :header: 테스트 완료 - :description: 이미 모든 테스트를 완료하여 직접 테스트 할 필요없습니다. - :col_css: col-md-3 - :image_center: https://pl-bolts-doc-images.s3.us-east-2.amazonaws.com/card_testing.png - :height: 290 - -.. raw:: html - -
-
- -.. End of callout item section - ----- - -****************************** -1: PyTorch Lightning 설치하기 -****************************** -.. raw:: html - -
-
- -`pip `_ 사용자라면, - -.. code-block:: bash - - pip install pytorch-lightning - -.. raw:: html - -
-
- -`conda `_ 사용자라면, - -.. code-block:: bash - - conda install pytorch-lightning -c conda-forge - -.. raw:: html - -
-
- -또는 `advanced install guide `_ 를 참조하세요. - ----- - -.. _new_project: - -***************************** -2: LightningModule 정의하기 -***************************** - -LightningModule을 사용하여 PyTorch nn.Module이 training_step (뿐만 아니라 validation_step이나 test_step) 내에서 복잡한 방식으로 함께 동작할 수 있도록 합니다. - -.. testcode:: - - import os - from torch import optim, nn, utils, Tensor - from tests.helpers.datasets import MNIST - import pytorch_lightning as pl - - # 원하는만큼의 nn.Module (또는 기존 모델)을 정의합니다. - encoder = nn.Sequential(nn.Linear(28 * 28, 64), nn.ReLU(), nn.Linear(64, 3)) - decoder = nn.Sequential(nn.Linear(3, 64), nn.ReLU(), nn.Linear(64, 28 * 28)) - - # LightningModule을 정의합니다. - class LitAutoEncoder(pl.LightningModule): - def __init__(self, encoder, decoder): - super().__init__() - self.encoder = encoder - self.decoder = decoder - - def training_step(self, batch, batch_idx): - # training_step defines the train loop. - # it is independent of forward - x, y = batch - x = x.view(x.size(0), -1) - z = self.encoder(x) - x_hat = self.decoder(z) - loss = nn.functional.mse_loss(x_hat, x) - # Logging to TensorBoard by default - self.log("train_loss", loss) - return loss - - def configure_optimizers(self): - optimizer = optim.Adam(self.parameters(), lr=1e-3) - return optimizer - - - # 오토인코더(autoencoder)를 초기화합니다. - autoencoder = LitAutoEncoder(encoder, decoder) - ----- - -********************** -3: 데이터셋 정의하기 -********************** - -Lightning은 *어떠한* 순회 가능한 객체(iterable; :class:`~torch.utils.data.DataLoader`, numpy 등...)도 학습/검증/테스트/예측용으로 나누어 사용할 수 있습니다. - -.. code-block:: python - - # 데이터를 설정합니다. - dataset = MNIST(os.getcwd(), download=True) - train_loader = utils.data.DataLoader(dataset) - ----- - -****************** -4: 모델 학습하기 -****************** - -Lightning :doc:`Trainer <../common/trainer>` 는 모든 :doc:`LightningModule <../common/lightning_module>` 과 데이터셋을 "함께(mix)" 학습할 수 있으며, -확장에 필요한 모든 엔지니어링적 복잡성들을 추상화(abstract)합니다. - -.. 
code-block:: python - - # 모델을 학습합니다 (힌트: 빠른 아이디어 반복에 도움이 되는 Trainer의 인자들을 참고하세요) - trainer = pl.Trainer(limit_train_batches=100, max_epochs=1) - trainer.fit(model=autoencoder, train_dataloaders=train_loader) - -Lightning :doc:`Trainer <../common/trainer>` 는 아래 예시들을 포함하여 `40종류 이상의 기법들 <../common/trainer.html#trainer-flags>`_ 을 자동화합니다: - -* 에폭(epoch) 및 배치(batch) 반복 -* ``optimizer.step()``, ``loss.backward()``, ``optimizer.zero_grad()`` 호출 -* 평가(evaluation) 도중 경사도(grads) 활성화/비활성화를 위한 ``model.eval()`` 호출 -* :doc:`체크포인트(checkpoint) 저장하기 및 불러오기 <../common/checkpointing>` -* 텐서보드(tensorboard) (:doc:`loggers <../visualize/loggers>` 옵션 참조) -* :doc:`Multi-GPU <../accelerators/gpu>` 지원 -* :doc:`TPU <../accelerators/tpu>` -* :ref:`16비트 정밀도(precision) AMP ` 지원 - ----- - - -****************** -5: 모델 사용하기 -****************** - -모델을 학습한 뒤에는 ONNX, TorchScript로 내보내기(export)하여 상용 환경에 포함하거나 단순히 가중치를 불러오고 예측을 실행할 수 있습니다. - -.. code:: python - - # 체크포인트(checkpoint)를 불러옵니다. - checkpoint = "./lightning_logs/version_0/checkpoints/epoch=0-step=100.ckpt" - autoencoder = LitAutoEncoder.load_from_checkpoint(checkpoint, encoder=encoder, decoder=decoder) - - # 학습한 nn.Module을 선택합니다. - encoder = autoencoder.encoder - encoder.eval() - - # 4개의 가짜 이미지로 예측(embed)합니다! - fake_image_batch = Tensor(4, 28 * 28) - embeddings = encoder(fake_image_batch) - print("⚡" * 20, "\nPredictions (4 image embeddings):\n", embeddings, "\n", "⚡" * 20) - ----- - -********************* -6: 학습 시각화하기 -********************* - -Lightning에는 *많은* 배터리가 포함되어 있습니다. 실험을 시각화하는데 사용하는 텐서보드(Tensorboard)도 유용한 도구 중 하나입니다. - -명령줄(commandline)에서 아래를 실행하고 브라우저에서 **http://localhost:6006/** 을 열어보세요. - -.. code:: bash - - tensorboard --logdir . - ----- - -************************* -7: 엄청 빠르게 학습하기 -************************* - -Trainer에 인자(argument)를 사용하여 고급 학습 기능을 사용할 수 있습니다. 이는 다른 코드를 변경하지 않으면서 학습 단계(train loop)에 자동으로 통합할 수 있도록 하는 최신(state-of-the-art)의 기술입니다. - -.. 
code:: - - # 4개의 GPU에서 학습 - trainer = Trainer( - devices=4, - accelerator="gpu", - ) - - # Deepspeed/FSDP를 사용하여 1TB 이상의 매개변수를 갖는 모델 학습 - trainer = Trainer( - devices=4, - accelerator="gpu", - strategy="deepspeed_stage_2", - precision=16 - ) - - # 빠른 아이디어 반복을 위한 20개 이상의 유용한 플래그(flag) - trainer = Trainer( - max_epochs=10, - min_epochs=5, - overfit_batches=1 - ) - - # 최신 기술을 사용 - trainer = Trainer(callbacks=[StochasticWeightAveraging(...)]) - ----- - -******************** -유연성 극대화하기 -******************** - -Lightning의 핵심 원칙은 **PyTorch의 어떠한 부분도 숨기지 않으면서** 언제나 최대한의 유연성을 제공하는 것입니다. - -Lightning은 프로젝트의 복잡도에 따라 *추가적인* 5단계의 유연성을 제공합니다. - ----- - -학습 단계(loop) 사용자 정의하기 -================================== - -.. image:: https://pl-bolts-doc-images.s3.us-east-2.amazonaws.com/custom_loop.png - :width: 600 - :alt: Injecting custom code in a training loop - -LightningModule에서 사용할 수 있는 20개 이상의 메소드 (:ref:`lightning_hooks`) 중 일부를 사용하여 훈련 단계 어디에든 사용자 정의 코드를 삽입할 수 있습니다. - -.. testcode:: - - class LitAutoEncoder(pl.LightningModule): - def backward(self, loss, optimizer, optimizer_idx): - loss.backward() - ----- - -Trainer 확장하기 -================== - -.. raw:: html - - - -유사한 기능을 하는 여러줄의 코드가 있는 경우, 콜백(callback)을 사용하여 손쉽게 그룹으로 묶어서 해당하는 코드들을 동시에 켜거나 끌 수 있습니다. - -.. code:: - - trainer = Trainer(callbacks=[AWSCheckpoints()]) - ----- - -PyTorch 자체의 반복(loop) 사용하기 -=================================== - -최첨단 연구 시 특정 유형의 작업들을 위해, Lightning은 전문가들이 다양한 방식으로 학습 단계를 완전히 제어할 수 있는 기능을 제공합니다. - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: 직접 최적화(manual optimization) - :description: 자동화된 학습 단계에서 최적화 단계는 사용자가 직접 관여합니다. - :col_css: col-md-4 - :image_center: https://pl-bolts-doc-images.s3.us-east-2.amazonaws.com/manual_opt.png - :button_link: ../model/build_model_advanced.html#manual-optimization - :image_height: 220px - :height: 320 - -.. displayitem:: - :header: Lightning Lite(라이트닝 라이트) - :description: 복잡한 PyTorch 프로젝트를 이관하기 위한 반복 단계를 완벽히 제어합니다. - :col_css: col-md-4 - :image_center: https://pl-bolts-doc-images.s3.us-east-2.amazonaws.com/lite.png - :button_link: ../model/build_model_expert.html - :image_height: 220px - :height: 320 - -.. displayitem:: - :header: 반복(Loop) - :description: 메타학습(meta-learning), 강화학습(reinforcement learning), GAN을 완벽히 제어합니다. - :col_css: col-md-4 - :image_center: https://pl-bolts-doc-images.s3.us-east-2.amazonaws.com/loops.png - :button_link: ../extensions/loops.html - :image_height: 220px - :height: 320 - -.. raw:: html - -
-
- -.. End of callout item section - ----- - -********** -다음 단계 -********** - -사용 사례에 따라, 아래 내용들 중 하나를 다음 단계로 살펴보세요. - -.. raw:: html - -
-
- -.. Add callout items below this line - -.. displayitem:: - :header: Level 2: Add a validation and test set - :description: Add validation and test sets to avoid over/underfitting. - :button_link: ../levels/basic_level_2.html - :col_css: col-md-3 - :height: 180 - :tag: basic - -.. displayitem:: - :header: See more examples - :description: See examples across computer vision, NLP, RL, etc... - :col_css: col-md-3 - :button_link: ../tutorials.html - :height: 180 - :tag: basic - -.. displayitem:: - :header: I need my raw PyTorch Loop - :description: Expert-level control for researchers working on the bleeding-edge - :col_css: col-md-3 - :button_link: ../model/build_model_expert.html - :height: 180 - :tag: expert - -.. displayitem:: - :header: Deploy your model - :description: Learn how to predict or put your model into production - :col_css: col-md-3 - :button_link: ../deploy/production.html - :height: 180 - :tag: basic - -.. raw:: html - -
-
diff --git a/source/starter/lightning_lite.rst b/source/starter/lightning_lite.rst deleted file mode 100644 index 79081bb..0000000 --- a/source/starter/lightning_lite.rst +++ /dev/null @@ -1,718 +0,0 @@ -########################################### -LightningLite (Lightning을 위한 디딤돌) -########################################### - - -:class:`~pytorch_lightning.lite.LightningLite` 는 PyTorch 사용자들이 기존 반복(loop) / 최적화 로직을 -완벽하게 제어하면서 기존 코드를 모든 종류의 장치에서 사용 가능하도록 확장할 수 있도록 합니다. - -.. image:: https://pl-public-data.s3.amazonaws.com/docs/static/images/lite/lightning_lite.gif - :alt: PyTorch 코드를 LightningLite로 변환하는 방법을 보여주는 애니메이션. - :width: 500 - :align: center - -| - -아래 설명들 중 하나에 해당한다면 :class:`~pytorch_lightning.lite.LightningLite` 가 바로 적합한 도구입니다: - -- 기존 코드에 최소한의 변경만으로 여러 장치로 빠르게 확장하고 싶습니다. -- 기존 코드를 Lightning API로 변환하고 싶지만, Lightning으로의 완벽한 전환 과정(full path)이 다소 복잡할 것 같습니다. - 전환하는 동안 재현성(reproducibility)을 보장하기 위한 디딤돌(stepping stone)을 찾고 있습니다. - - -.. warning:: :class:`~pytorch_lightning.lite.LightningLite` 은 현재 beta 기능입니다. 사용자 피드백에 따라 API가 변경될 수 있습니다. - - ----------- - -**************** -예제로 배우기 -**************** - - -기존 PyTorch 코드 -======================== - -``run`` 함수는 ``MyModel`` 학습을 위해 ``MyDataset`` 을 ``num_epochs`` 에폭(epoch)만큼 반복하는 사용자 정의 학습 루프(loop)를 포함하고 있습니다. - -.. code-block:: python - - import torch - from torch import nn - from torch.utils.data import DataLoader, Dataset - - - class MyModel(nn.Module): - ... - - - class MyDataset(Dataset): - ... - - - def run(args): - device = "cuda" if torch.cuda.is_available() else "cpu" - - model = MyModel(...).to(device) - optimizer = torch.optim.SGD(model.parameters(), ...) - - dataloader = DataLoader(MyDataset(...), ...) 
- - model.train() - for epoch in range(args.num_epochs): - for batch in dataloader: - batch = batch.to(device) - optimizer.zero_grad() - loss = model(batch) - loss.backward() - optimizer.step() - - - run(args) - ----------- - - -LightningLite로 변환하기 -========================== - -:class:`~pytorch_lightning.lite.LightningLite` 로 변환하기 위해 필요한 다섯 단계는 다음과 같습니다. - -1. :class:`~pytorch_lightning.lite.LightningLite` 를 상속(subclass)받아 :meth:`~pytorch_lightning.lite.LightningLite.run` 메소드를 재정의합니다. -2. 기존 ``run`` 함수의 내용을 :class:`~pytorch_lightning.lite.LightningLite` 의 ``run`` 메소드로 이동합니다. -3. ``.to(...)``, ``.cuda()`` 등과 같은 모든 호출을 제거합니다. :class:`~pytorch_lightning.lite.LightningLite` 가 자동으로 이를 처리할 것입니다. -4. 각 모델과 옵티마이저(optimizer) 쌍에는 :meth:`~pytorch_lightning.lite.LightningLite.setup` 을, 모든 데이터로더(dataloader)에는 :meth:`~pytorch_lightning.lite.LightningLite.setup_dataloaders` 을 적용하고, ``loss.backward()`` 를 ``self.backward(loss)`` 로 변경합니다. -5. :class:`~pytorch_lightning.lite.LightningLite` 를 상속받은 서브클래스를 객체화(instantiate)한 뒤 :meth:`~pytorch_lightning.lite.LightningLite.run` 메소드를 호출합니다. - -| - -.. code-block:: python - - import torch - from torch import nn - from torch.utils.data import DataLoader, Dataset - from pytorch_lightning.lite import LightningLite - - - class MyModel(nn.Module): - ... - - - class MyDataset(Dataset): - ... - - - class Lite(LightningLite): - def run(self, args): - - model = MyModel(...) - optimizer = torch.optim.SGD(model.parameters(), ...) - model, optimizer = self.setup(model, optimizer) # 모델 / 옵티마이저(optimizer) 확장 - - dataloader = DataLoader(MyDataset(...), ...) - dataloader = self.setup_dataloaders(dataloader) # 데이터로더(dataloader) 확장 - - model.train() - for epoch in range(args.num_epochs): - for batch in dataloader: - optimizer.zero_grad() - loss = model(batch) - self.backward(loss) # loss.backward() 대체 - optimizer.step() - - - Lite(...).run(args) - - -이게 전부입니다. 이제 모든 종류의 장치에서 학습하고 확장할 수 있습니다. LightningLite를 사용한 전체 MNIST 학습 예제는 `여기 `_ 에서 확인할 수 있습니다. 
- -:class:`~pytorch_lightning.lite.LightningLite` 가 장치를 관리하므로, 사용자가 관리하지 않아도 됩니다. -코드 내에 특정 장치용 로직이 있다면 삭제해야 합니다. - -다음은 8개의 GPU에서 `torch.bfloat16 `_ 정밀도(precision)로 학습을 하는 방법을 보여줍니다: - -.. code-block:: python - - Lite(strategy="ddp", devices=8, accelerator="gpu", precision="bf16").run(10) - -`DeepSpeed Zero3 `_ 를 사용하여 8개의 GPU와 정밀도 16으로 학습하는 방법은 다음과 같습니다: - -.. code-block:: python - - Lite(strategy="deepspeed", devices=8, accelerator="gpu", precision=16).run(10) - -나아가 :class:`~pytorch_lightning.lite.LightningLite` 가 알아서 해주기도 합니다! - -.. code-block:: python - - Lite(devices="auto", accelerator="auto", precision=16).run(10) - -필요한 경우 분산-집합(distributed collectives)을 사용할 수도 있습니다. -다음은 (8개의 GPU x 32개 노드의) GPU 256개에서 실행하는 예제입니다. - -.. code-block:: python - - class Lite(LightningLite): - def run(self): - - # Transfer and concatenate tensors across processes - self.all_gather(...) - - # Transfer an object from one process to all the others - self.broadcast(..., src=...) - - # The total number of processes running across all devices and nodes. - self.world_size - - # The global index of the current process across all devices and nodes. - self.global_rank - - # The index of the current process among the processes running on the local node. - self.local_rank - - # The index of the current node. - self.node_rank - - # Whether this global rank is rank zero. - if self.is_global_zero: - # do something on rank 0 - ... - - # Wait for all processes to enter this call. - self.barrier() - - - Lite(strategy="ddp", devices=8, num_nodes=32, accelerator="gpu").run() - - -사용자 지정 데이터 또는 모델에 장치 할당이 필요한 경우, 데이터에는 ``self.setup_dataloaders(..., move_to_device=False)`` 를 하고 -모델에는 ``self.setup(..., move_to_device=False)`` 를 함으로써 :class:`~pytorch_lightning.lite.LightningLite` 의 자동 배치를 -비활성화할 수 있습니다. -뿐만 아니라, ``self.device`` 로 현재 장치에 접근하거나 :meth:`~pytorch_lightning.lite.LightningLite.to_device` 를 사용하여 -객체를 현재 장치로 이동할 수 있습니다. - - -.. 
note:: 큰 모델들은 out-of-memory(메모리 부족) 에러가 발생하므로 :meth:`~pytorch_lightning.lite.LightningLite.run` 에서 모델을 생성(instantiate)하는 것을 권장합니다. - -.. tip:: - - :meth:`~pytorch_lightning.lite.LightningLite.run` 함수 내에 수백에서 수천 라인의 코드가 있고 이에 대해 확신이 서지 않는다면, - 적절한 느낌입니다. 2019년에 :class:`~pytorch_lightning.core.lightning.LightningModule` 이 점점 커지면서 개발자들 또한 같은 느낌을 받았고, - 이에 따라 단순성(simplicity)과 상호운용성(interoperability), 표준화(standardization)를 위해 코드를 구성하기 시작했습니다. - 이러한 느낌은 코드 리팩토링(refactoring)과 함께 / 또는 :class:`~pytorch_lightning.core.lightning.LightningModule` 으로 완전히 전환하는 것을 - 고려해봐야 한다는 좋은 신호입니다. - - ----------- - - -분산 학습 시의 함정(pitfall) -============================= - -:class:`~pytorch_lightning.lite.LightningLite` 는 학습을 확장할 수 있는 도구들을 제공하지만, 직면해야 할 몇 가지 주요한 과제들도 있습니다: - - -.. list-table:: - :widths: 50 50 - :header-rows: 0 - - * - 프로세스 발산(Processes divergence) - - 이전 파일 또는 다른 이유에서 서로 다른 if/else 조건, 경쟁 조건(race condition)으로 프로세스가 코드의 다른 부분(section) 실행하여 멈출(hanging) 때 발생합니다. - * - 프로세스 간 리듀스(Cross processes reduction) - - 리듀스 과정(reduction)에서의 오류로 메트릭(metric) 또는 변화도(gradient)가 잘못 계산되었습니다. - * - 대규모의 샤딩된 모델(Large sharded models) - - 대규모 모델의 생성(instantiation)과 구현(materialization), 상태 관리(state management). - * - 순서가 0뿐인 작업(Rank 0 only actions) - - 로깅(logging), 프로파일링(profiling) 등. - * - 체크포인팅 / 조기 중단 / 콜백 / 로깅 (Checkpointing / Early stopping / Callbacks / Logging) - - 학습 과정을 쉽게 사용자 정의하고 상태를 관리할 수 있는 기능. - * - 결함-감내 학습(Fault-tolerant training) - - 오류 발생 시에 마치 오류가 없었던 것처럼 재개(resume)하는 기능. - - -위와 같은 과제들 중 하나를 맞이했다면, 이제 :class:`~pytorch_lightning.lite.LightningLite` 의 한계를 마주한 것입니다. -이러한 걱정을 할 필요가 없는 :doc:`Lightning <../starter/introduction>` 으로 변환하는 것을 추천합니다. - ----------- - -Lightning으로의 변환 -====================== - -:class:`~pytorch_lightning.lite.LightningLite` 은 수백가지 기능을 갖는 Lightning API로의 완전한 전환을 위한 디딤돌입니다. - -:class:`~pytorch_lightning.lite.LightningLite` 클래스 자체를 :class:`~pytorch_lightning.core.lightning.LightningModule` 의 개선된 버전(future)로 볼 수도 있으므로, -해당 API로 코드를 천천히 재구성(refactor)해보겠습니다. 
-아래에는 :meth:`~pytorch_lightning.core.lightning.LightningModule.training_step` 와 :meth:`~pytorch_lightning.core.lightning.LightningModule.forward`, -:meth:`~pytorch_lightning.core.lightning.LightningModule.configure_optimizers`, :meth:`~pytorch_lightning.core.lightning.LightningModule.train_dataloader` 메서드들이 -구현되어 있습니다. - - -.. code-block:: python - - class Lite(LightningLite): - - # 1. 이 부분은 LightningModule의 `__init__` 함수가 됩니다. - def run(self, args): - self.args = args - - self.model = MyModel(...) - - self.fit() # 이는 Lightning Trainer에 의해 자동화됩니다. - - # 2. Lightning이 자체적인 학습 루프(fitting loop)를 생성하고, - # 모델, 옵티마이저, 데이터로더 등을 설정하므로 이 코드는 완전히 제거해도 됩니다. - def fit(self): - # 필요한 것들을 설정 - optimizer = self.configure_optimizers() - self.model, optimizer = self.setup(self.model, optimizer) - dataloader = self.setup_dataloaders(self.train_dataloader()) - - # 학습(fitting) 시작 - self.model.train() - for epoch in range(num_epochs): - for batch in enumerate(dataloader): - optimizer.zero_grad() - loss = self.training_step(batch, batch_idx) - self.backward(loss) - optimizer.step() - - # 3. 이는 LightningModule에 속하므로 그대로 둡니다. - def forward(self, x): - return self.model(x) - - def training_step(self, batch, batch_idx): - return self.forward(batch) - - def configure_optimizers(self): - return torch.optim.SGD(self.model.parameters(), ...) - - # 4. [선택사항] 이는 그대로 두거나, LightningDataModule이 더 높은 결합성(composability)을 갖도록 따로 분리(extract)할 수도 있습니다. - def train_dataloader(self): - return DataLoader(MyDataset(...), ...) - - - Lite(...).run(args) - - -마지막으로, :meth:`~pytorch_lightning.lite.LightningLite.run` 을 :meth:`~pytorch_lightning.core.lightning.LightningModule.__init__` 으로 -바꾸고, 내부의 ``fit`` 호출 부분을 삭제합니다. - -.. code-block:: python - - from pytorch_lightning import LightningDataModule, LightningModule, Trainer - - - class LightningModel(LightningModule): - def __init__(self, args): - super().__init__() - self.model = MyModel(...) 
- - def forward(self, x): - return self.model(x) - - def training_step(self, batch, batch_idx): - loss = self(batch) - self.log("train_loss", loss) - return loss - - def configure_optimizers(self): - return torch.optim.SGD(self.model.parameters(), lr=0.001) - - - class BoringDataModule(LightningDataModule): - def train_dataloader(self): - return DataLoader(MyDataset(...), ...) - - - trainer = Trainer(max_epochs=10) - trainer.fit(LightningModel(), datamodule=BoringDataModule()) - - -이제 수백가지 기능들의 이점을 누릴 수 있는 PyTorch Lightning으로의 변환을 성공적으로 완료하였습니다! - ----------- - -******************************** -Lightning Lite 매개변수(flag) -******************************** - -Lite는 가속화된 분산 학습 및 추론(inference)에 특화되어 있습니다. 이는 장치 및 통신 전략을 손쉽게 구성하고, -다른 방식으로의 원활하게 전환할 수 있는 편리한 방법을 제공합니다. 용어(terminology) 및 사용법이 Lightning과 -동일하므로, 변환을 결심했을 때 변환에 드는 노력을 최소화할 수 있습니다. - - -accelerator (가속기 종류) -========================== - -``"cpu"``, ``"gpu"``, ``"tpu"``, ``"auto"`` 중 하나를 선택합니다 (IPU는 곧 제공 예정입니다). - -.. code-block:: python - - # CPU 가속기 - lite = Lite(accelerator="cpu") - - # 2개의 GPU 가속기에서 실행 - lite = Lite(devices=2, accelerator="gpu") - - # 8개의 TPU 가속기에서 실행 - lite = Lite(devices=8, accelerator="tpu") - - # DistributedDataParallel(ddp) 전략으로 GPU 가속기에서 실행 - lite = Lite(devices=4, accelerator="gpu", strategy="ddp") - -``"auto"`` 옵션은 사용 중인 기기를 인식하고 사용 가능한 가속기를 선택합니다. - -.. code-block:: python - - # 기기에 GPU가 있으면, GPU 가속기를 사용합니다. - lite = Lite(devices=2, accelerator="auto") - - -strategy (학습 전략) -====================== - -학습 전략을 선택합니다: ``"dp"``, ``"ddp"``, ``"ddp_spawn"``, ``"tpu_spawn"``, ``"deepspeed"``, ``"ddp_sharded"``, 또는 ``"ddp_sharded_spawn"`` - -.. code-block:: python - - # 4개의 GPU에서 DistributedDataParallel 전략 사용 - lite = Lite(strategy="ddp", accelerator="gpu", devices=4) - - # 4개의 CPU에서 DDP Spawn 전략 사용 - lite = Lite(strategy="ddp_spawn", accelerator="cpu", devices=4) - - -또한, 몇몇 매개변수를 추가로 설정해서 사용자 지정 전략을 사용할 수 있습니다. - -.. 
code-block:: python - - from pytorch_lightning.strategies import DeepSpeedStrategy - - lite = Lite(strategy=DeepSpeedStrategy(stage=2), accelerator="gpu", devices=2) - - -Horovod 및 Full Sharded 학습 전략은 곧 지원될 예정입니다. - - -devices (장치) -============== - -실행할 장치를 설정합니다. 아래와 같은 자료형일 수 있습니다: - -- int: 학습할 장치(예. GPU)의 개수 -- list of int: 학습할 장치의 인덱스(예. GPU ID, 0-indexed) -- str: 위 중 하나의 문자열 표현 - -.. code-block:: python - - # Lite에서 사용하는 기본 값, CPU에서 실행 - lite = Lite(devices=None) - - # 위와 동일 - lite = Lite(devices=0) - - # int: 2개의 GPU에서 실행 - lite = Lite(devices=2, accelerator="gpu") - - # list: GPU 1, 4에서 실행 (버스 순서에 따름) - lite = Lite(devices=[1, 4], accelerator="gpu") - lite = Lite(devices="1, 4", accelerator="gpu") # 위와 동일 - - # -1: 모든 GPU에서 실행 - lite = Lite(devices=-1, accelerator="gpu") - lite = Lite(devices="-1", accelerator="gpu") # 위와 동일 - - - -gpus (사용하지 않음) -======================= - -.. warning:: ``gpus=x`` 는 v1.7에서 더 이상 사용하지 않으며(deprecated), v2.0에서 제거될 예정입니다. - 대신에 ``accelerator='gpu'`` 및 ``devices=x`` 을 사용하십시오. - -``devices=X`` 및 ``accelerator="gpu"`` 의 약어(shorthand). - -.. code-block:: python - - # 2개의 GPU에서 실행 - lite = Lite(accelerator="gpu", devices=2) - - # 위와 동일 - lite = Lite(devices=2, accelerator="gpu") - - -tpu_cores (사용하지 않음) -============================ - -.. warning:: ``tpu_cores=x`` 는 v1.7에서 더 이상 사용하지 않으며(deprecated), v2.0에서 제거될 예정입니다. - 대신에 ``accelerator='tpu'`` 및 ``devices=x`` 을 사용하십시오. - -``devices=X`` 및 ``accelerator="tpu"`` 의 약어. - -.. code-block:: python - - # 8개의 TPU에서 실행 - lite = Lite(accelerator="tpu", devices=8) - - # 위와 동일 - lite = Lite(devices=8, accelerator="tpu") - - -num_nodes (노드의 수) -==================================== - -분산 작업 시의 클러스터 노드의 수. - -.. code-block:: python - - # Lite에서 사용하는 기본값 - lite = Lite(num_nodes=1) - - # 8개의 노드에서 실행 - lite = Lite(num_nodes=8) - - -클러스터에서의 분산 다중 노드 학습에 대해서는 :doc:`이 문서 <../clouds/cluster>` 에서 자세히 알아볼 수 있습니다.
- - -precision (정밀도) -===================== - -Lightning Lite는 배정밀도(double precision; 64), 단정밀도(full precision; 32), 또는 반정밀도(half precision; 16) 연산(`bfloat16 `_ 포함)을 지원합니다. -반정밀도 또는 혼합 정밀도(mixed precision)는 32비트 정밀도와 16비트 정밀도를 합쳐서 사용하여 모델 학습 시의 메모리 공간(footprint)을 줄입니다. -그 결과 최신 GPU에서 눈에 띄게 성능이 향상됩니다. - -.. code-block:: python - - # Lite에서 사용하는 기본값 - lite = Lite(precision=32, devices=1) - - # 16-비트 (혼합) 정밀도 - lite = Lite(precision=16, devices=1) - - # 16-비트 bfloat 정밀도 - lite = Lite(precision="bf16", devices=1) - - # 64-비트 (배(double)) 정밀도 - lite = Lite(precision=64, devices=1) - - -plugins (플러그인) -===================== - -:ref:`Plugins` 을 사용하여 임의의 백엔드(backend), 정밀도 라이브러리, 클러스터 등을 연결할 수 있습니다. -예: 임의의 동작을 정의하고 싶으면 관련 클래스를 상속받아 전달하면 됩니다. 다음은 직접 만든 -:class:`~pytorch_lightning.plugins.environments.ClusterEnvironment` 를 연결하는 예시입니다. - -.. code-block:: python - - from pytorch_lightning.plugins.environments import ClusterEnvironment - - - class MyCluster(ClusterEnvironment): - @property - def main_address(self): - return your_main_address - - @property - def main_port(self): - return your_main_port - - def world_size(self): - return the_world_size - - - lite = Lite(plugins=[MyCluster()], ...) - - ----------- - - -********************** -Lightning Lite 메소드 -********************** - - -run -==== - -run 메소드는 2가지 용도로 사용합니다: - -1. :class:`~pytorch_lightning.lite.lite.LightningLite` 클래스에서 이 메소드를 재정의(override)하고 - 학습(또는 추론) 코드를 내부에 넣습니다. -2. run 메소드를 호출하여 학습 절차를 시작합니다. Lite는 분산 백엔드 설정을 처리합니다. - -선택적으로 run 메소드에 인자(예를 들어 모델의 하이퍼파라미터나 백엔드)를 전달할 수 있습니다. - -.. code-block:: python - - from pytorch_lightning.lite import LightningLite - - - class Lite(LightningLite): - - # 입력 인자는 선택 사항입니다; 필요 시에 넣으세요. - def run(self, learning_rate, num_layers): - """여기에 학습 과정이 들어갑니다.""" - - - lite = Lite(accelerator="gpu", devices=2) - lite.run(learning_rate=0.01, num_layers=12) - - -setup -====== - -모델 및 해당하는 옵티마이저(들)을 설정합니다. 여러 모델을 설정해야 하는 경우, 각각에 대해서 ``setup()`` 을 호출하십시오.
-모델과 옵티마이저는 적절한 장치로 자동으로 이동합니다. - -.. code-block:: python - - model = nn.Linear(32, 64) - optimizer = torch.optim.SGD(model.parameters(), lr=0.001) - - # 가속화된 학습을 위해 모델 및 옵티마이저 설정 - model, optimizer = self.setup(model, optimizer) - - # Lite가 장치를 설정하는 것을 원치 않는 경우 - model, optimizer = self.setup(model, optimizer, move_to_device=False) - - -setup 메소드는 선택한 정밀도로 모델을 준비하여 ``forward()`` 중 연산들이 자동으로 변환(cast)되도록 합니다. - -setup_dataloaders -================= - -가속화된 연산을 위해 하나 이상의 데이터로더를 설정합니다. 분산 전략(예. DDP)을 사용하는 경우, Lite는 자동으로 샘플러(sampler)를 -대체합니다. 또한, 데이터로더는 반환된 데이터 텐서를 적절한 장치로 자동으로 이동하도록 설정됩니다. - -.. code-block:: python - - train_data = torch.utils.DataLoader(train_dataset, ...) - test_data = torch.utils.DataLoader(test_dataset, ...) - - train_data, test_data = self.setup_dataloaders(train_data, test_data) - - # Lite가 데이터를 자동으로 장치로 이동시키는 것을 원치 않는 경우 - train_data, test_data = self.setup_dataloaders(train_data, test_data, move_to_device=False) - - # Lite가 분산 학습 도중 샘플러를 대체하기를 원치 않는 경우 - train_data, test_data = self.setup_dataloaders(train_data, test_data, replace_sampler=False) - - -backward -=========== - -``loss.backward()`` 을 대체하여 정밀도와 가속기 코드를 신경쓰지 않도록(agnostic) 합니다. - -.. code-block:: python - - output = model(input) - loss = loss_fn(output, target) - - # loss.backward() - self.backward(loss) - - -to_device -========= - -:meth:`~pytorch_lightning.lite.lite.LightningLite.to_device` 를 사용하여 모델 또는 텐서, 텐서 컬렉션을 현재 장치로 이동합니다. -기본적으로 :meth:`~pytorch_lightning.lite.lite.LightningLite.setup` 및 :meth:`~pytorch_lightning.lite.lite.LightningLite.setup_dataloaders` 가 -모델과 데이터를 적절한 장치로 이동했으므로, 이 메소드는 수동 작업이 필요할 때만 사용합니다. - -.. code-block:: python - - data = torch.load("dataset.pt") - data = self.to_device(data) - - -seed_everything -=============== - -run의 시작 부분에 이 메소드를 호출하여 코드를 재현 가능하도록 합니다. - -.. code-block:: python - - # `torch.manual_seed(...)` 대신 다음을 호출: - self.seed_everything(1234) - - -이는 PyTorch 및 NumPy, Python 난수 생성기를 포괄합니다. 
또한, Lite는 데이터로더 워커(worker) 프로세스의 시드(seed)를 적절히 초기화합니다. -(``workers=False`` 를 전달하여 이 기능을 끌 수 있습니다.) - - -autocast -======== - -정밀도 백엔드가 autocast 컨텍스트 매니저 내부의 코드 블록을 자동으로 캐스팅하도록 합니다. 이는 선택사항이며, Lite가 -(모델이 :meth:`~pytorch_lightning.lite.lite.LightningLite.setup` 될 때) 이미 모델의 forward 메소드에 적용하였습니다. -모델 forward 메소드 외부의 추가 연산들에 대해 자동으로 캐스팅하려는 경우에만 사용합니다: - -.. code-block:: python - - model, optimizer = self.setup(model, optimizer) - - # Lite가 모델의 정밀도를 자동으로 처리합니다 - output = model(inputs) - - with self.autocast(): # 선택 사항 - loss = loss_function(output, target) - - self.backward(loss) - ... - - -print -===== - -내장 print 함수를 통해 콘솔에 출력하지만, 메인 프로세스(main process)에서만 가능합니다. -이는 여러 장치/노드에서 실행할 때 과도한 출력 및 로그를 방지합니다. - - -.. code-block:: python - - # 메인 프로세스에서만 출력 - self.print(f"{epoch}/{num_epochs}| Train Epoch Loss: {loss}") - - -save -==== - -체크포인트(checkpoint)에 내용을 저장합니다. 기존의 ``torch.save(...)`` 를 모두 대체합니다. Lite는 단일 장치나 다중 장치, -다중 노드 중 어디에서 실행하든지 잘 저장될 수 있도록 처리합니다. - -.. code-block:: python - - # `torch.save(...)` 대신 다음을 호출: - self.save(model.state_dict(), "path/to/checkpoint.ckpt") - - -load -==== - -파일로부터 체크포인트 내용을 불러옵니다. 기존의 ``torch.load(...)`` 를 모두 대체합니다. Lite는 단일 장치나 다중 장치, -다중 노드 중 어디에서 실행하든지 잘 불러올 수 있도록 처리합니다. - -.. code-block:: python - - # `torch.load(...)` 대신 다음을 호출: - self.load("path/to/checkpoint.ckpt") - - -barrier -======= - -모든 프로세스들이 대기하였다가 동기화되길 원할 때 사용합니다. 모든 프로세스가 barrier 호출에 진입하면, 그 때 계속 실행합니다. -예를 들어 한 프로세스가 데이터를 다운로드해서 디스크에 쓰는 동안 다른 모든 프로세스들이 대기하도록 할 때 유용합니다. - -.. code-block:: python - - # 한 프로세스에서만 데이터 다운로드 - if self.global_rank == 0: - download_data("http://...") - - # 모든 프로세스가 여기서 만날 때까지 대기 - self.barrier() - - # 이제 모든 프로세스가 데이터를 읽을 수 있음 diff --git a/source/starter/style_guide.rst b/source/starter/style_guide.rst deleted file mode 100644 index 7a00b58..0000000 --- a/source/starter/style_guide.rst +++ /dev/null @@ -1,232 +0,0 @@ -################ -스타일 가이드 -################ -PyTorch Lightning의 주요한 목표는 가독성(readability)과 재현성(reproducibility)을 향상시키는 것입니다.
GitHub 저장소나 리서치 프로젝트에서 -:class:`~pytorch_lightning.core.lightning.LightningModule` 을 발견하고, 필요한 부분이 어디에 있는지 찾아보기 위해 정확히 어디를 봐야 하는지 -알 수 있다고 생각해보세요. - -이 스타일 가이드의 목표는 Lightning의 코드가 유사하게 구성되도록 권장하기 위함입니다. - --------------- - -***************** -LightningModule -***************** - -:class:`~pytorch_lightning.core.lightning.LightningModule` 클래스를 구성하는 모범 사례를 살펴보겠습니다: - -시스템(System)과 모델(Model) -============================== - -.. figure:: https://pl-bolts-doc-images.s3.us-east-2.amazonaws.com/pl_docs/model_system.png - :width: 400 - -LightningModule의 주요한 원칙은 전체 시스템이 반드시 독립적(self-contained)이어야 한다는 것입니다. -Lightning에서는 시스템(system)과 모델(model)을 구분합니다. - -모델은 ResNet18, RNN 등과 같은 것입니다. - -시스템은 모델들(a collection of models)이 사용자가 정의한 학습/검증 로직을 사용하여 어떻게 상호작용하는지에 대해 정의합니다. -이에 대한 예시는 다음과 같습니다: - -* GAN -* Seq2Seq -* BERT -* 그 외 - -LightningModule은 시스템과 모델 모두를 정의할 수 있습니다: - -다음은 시스템을 정의하는 LightningModule입니다. 아래와 같은 구조로 코드를 작성하는 것을 권장합니다. 모델을 시스템으로부터 분리하면 -모듈성(modularity)이 향상되어, 더 나은 테스팅에 도움이 되고 시스템에 의존성이 줄어들어 리팩토링이 더 쉬워집니다. - -.. testcode:: - - class Encoder(nn.Module): - ... - - - class Decoder(nn.Module): - ... - - - class AutoEncoder(nn.Module): - def __init__(self): - super().__init__() - self.encoder = Encoder() - self.decoder = Decoder() - - def forward(self, x): - return self.encoder(x) - - - class AutoEncoderSystem(LightningModule): - def __init__(self): - super().__init__() - self.auto_encoder = AutoEncoder() - - -빠른 프로토타이핑을 위해서는 모든 연산을 LightningModule 내에 정의하는 것이 유용합니다. 재현성과 확장성을 -위해서는 관련된 백본(backbone)에 전달하는 것이 더 나을 수 있습니다. - -다음은 LightningModule로 모델을 정의하는 것이지만, 아래 예시처럼 모델을 정의하는 것은 권장하지 않습니다. - -.. testcode:: - - class LitModel(LightningModule): - def __init__(self): - super().__init__() - self.layer_1 = nn.Linear() - self.layer_2 = nn.Linear() - self.layer_3 = nn.Linear() - - -독립성(self-contained) -=========================== - -LightningModule은 반드시 독립적(self-contained)이어야 합니다. 
모델이 독립적인지를 확인해보는 좋은 방법 중에 하나는, -다음과 같이 스스로에게 물어보는 것입니다: - -"누군가 모델의 내부에 대해서 전혀 모르는 상태에서 이 파일을 Trainer에 사용(drop)할 수 있을까?" - -예를 들어, 주요한 모델들은 특정 옵티마이저(optimizer)와 학습률 스케쥴러(learning rate scheduler)에서 잘 동작하기 때문에 -옵티마이저는 모델과 결합(couple)합니다. - -초기화(init) -================= - -LightningModule이 독립성을 띄지 못하게 되는 첫번째 위치는 초기화(init) 부분입니다. 사용자가 추측할 필요가 없도록 초기화 부분에 -모든 관련된 적절한 기본값(sensible defaults)을 정의해주세요. - -다음은 이 LightningModule이 어떻게 초기화되었는지 알아보기 위해 사용자가 파일을 찾아봐야만 하는 예시입니다. - -.. testcode:: - - class LitModel(LightningModule): - def __init__(self, params): - self.lr = params.lr - self.coef_x = params.coef_x - -이렇게 정의된 모델은 많은 궁금증들, 예를 들면 ``coef_x`` 는 무엇인지? 문자열인지? 실수(float)인지? 범위는 어떻게 되는지? 를 -갖게 합니다. 이렇게 하는 대신, 명시적으로 초기화를 하는 것이 좋습니다. - -.. testcode:: - - class LitModel(LightningModule): - def __init__(self, encoder: nn.Module, coef_x: float = 0.2, lr: float = 1e-3): - ... - -이제 사용자는 추측할 필요가 없습니다. 값의 타입(type) 뿐만 아니라, 모델에는 사용자가 즉시 확인할 수 있는 적절한 기본값도 -존재합니다. - - -메소드 순서 -============ -LightningModule에서 필요로 하는 메소드들은 다음의 것들 뿐입니다: - -* init -* training_step -* configure_optimizers - -하지만, 다른 선택적인 메소드들을 구현하기로 마음먹었다면, 권장하는 순서는 다음과 같습니다: - -* 모델/시스템 정의 (초기화) -* 추론(inference)을 한다면, forward 정의 -* 학습용 훅(training hooks) -* 검증용 훅(validation hooks) -* 테스트용 훅(test hooks) -* 예측용 훅(predict hooks) -* 옵티마이저 설정(configure_optimizers) -* 다른 훅(hooks) - -실제 코드는 다음과 같습니다: - -.. 
code-block:: - - class LitModel(pl.LightningModule): - - def __init__(...): - - def forward(...): - - def training_step(...): - - def training_step_end(...): - - def training_epoch_end(...): - - def validation_step(...): - - def validation_step_end(...): - - def validation_epoch_end(...): - - def test_step(...): - - def test_step_end(...): - - def test_epoch_end(...): - - def configure_optimizers(...): - - def any_extra_hook(...): - - -forward와 training_step -======================== - -:meth:`~pytorch_lightning.core.lightning.LightningModule.forward` 는 추론/예측을 위해 사용하고, -:meth:`~pytorch_lightning.core.lightning.LightningModule.training_step` 를 독립적으로 유지하는 것을 추천합니다. - -.. code-block:: python - - def forward(self, x): - embeddings = self.encoder(x) - return embeddings - - - def training_step(self, batch, batch_idx): - x, _ = batch - z = self.encoder(x) - pred = self.decoder(z) - ... - - --------------- - -************ -데이터 -************ - -데이터를 다루는 모범 사례입니다. - -DataLoader -============== - -Lightning은 :class:`~torch.utils.data.DataLoader` 를 사용해서 시스템 전반의 모든 데이터 흐름을 다룹니다. DataLoader를 구성할 때는 -최대의 효율을 위해 워커(worker)의 수를 반드시 적절하게 조절해야 합니다. - -.. warning:: 코드가 병목을 일으킬 수 있으므로 DataLoader에서 ``Trainer(strategy="ddp_spawn")`` 를 ``num_workers>0`` 로 사용하지 않도록 주의하세요. - -DataModule -============== - -:class:`~pytorch_lightning.core.datamodule.LightningDataModule` 은 데이터와 관련된 훅들을 :class:`~pytorch_lightning.core.lightning.LightningModule` 로부터 -분리하도록 설계되어 데이터셋 종류에 구애받지 않는 모델을 만들 수 있습니다. 이렇게 하면 모델이 서로 다른 데이터셋을 사용하도록 언제든지 교체(hot swap)할 수 있어, -여러 분야(domain)에서 테스트와 벤치마킹을 할 수 있습니다. 또한 프로젝트들 간에 정확한 데이터 분할(split)과 변환(transform)을 공유하고 재사용 할 수 있게 합니다. - -Lightning에서의 데이터 관리 방법과 모범 사례는 :ref:`data` 문서를 참고하세요. - -* 어떠한 데이터 분할(split) 방법이 사용되었나요? -* 전체와 분할된 데이터셋 각각에는 몇 개의 샘플이 있나요? -* 어떠한 변환(transform) 방법이 사용되었나요? - -이러한 이유들 때문에 DataModule 사용하기를 권하고 있습니다. 이는 협업할 때 팀의 시간을 많이 절약할 수 있기에 특히 중요합니다. - -사용자들은 DataModule을 Trainer에 던져놓기만 하고, 데이터에 어떠한 작업이 수행되는지는 신경쓰지 않아도 됩니다. 
- -이는 데이터의 정제(cleaning)와 특정 목적의 작업(ad-hoc instruction) 때문에 아이디어를 반복하는 과정이 느려지는 학계(academic)나 기업(corporate) 모두에 -해당됩니다. - -- 직접 손으로 따라해볼 수 있는 예제들입니다: -- `Introduction to PyTorch Lightning `_ -- `Introduction to DataModules `_ diff --git a/source/visualize/supported_exp_managers.rst b/source/visualize/supported_exp_managers.rst deleted file mode 100644 index 1a15ee2..0000000 --- a/source/visualize/supported_exp_managers.rst +++ /dev/null @@ -1,198 +0,0 @@ -Comet.ml -======== -To use `Comet.ml `_ first install the comet package: - -.. code-block:: bash - - pip install comet-ml - -Configure the logger and pass it to the :class:`~pytorch_lightning.trainer.trainer.Trainer`: - -.. code-block:: python - - from pytorch_lightning.loggers import CometLogger - - comet_logger = CometLogger(api_key="YOUR_COMET_API_KEY") - trainer = Trainer(logger=comet_logger) - -Access the comet logger from any function (except the LightningModule *init*) to use its API for tracking advanced artifacts - -.. code-block:: python - - class LitModel(LightningModule): - def any_lightning_module_function_or_hook(self): - comet = self.logger.experiment - fake_images = torch.Tensor(32, 3, 28, 28) - comet.add_image("generated_images", fake_images, 0) - -Here's the full documentation for the :class:`~pytorch_lightning.loggers.CometLogger`. - ----- - -MLflow -====== -To use `MLflow `_ first install the MLflow package: - -.. code-block:: bash - - pip install mlflow - -Configure the logger and pass it to the :class:`~pytorch_lightning.trainer.trainer.Trainer`: - -.. code-block:: python - - from pytorch_lightning.loggers import MLFlowLogger - - mlf_logger = MLFlowLogger(experiment_name="lightning_logs", tracking_uri="file:./ml-runs") - trainer = Trainer(logger=mlf_logger) - -Access the MLflow logger from any function (except the LightningModule *init*) to use its API for tracking advanced artifacts - -..
code-block:: python - - class LitModel(LightningModule): - def any_lightning_module_function_or_hook(self): - mlf_logger = self.logger.experiment - fake_images = torch.Tensor(32, 3, 28, 28) - mlf_logger.add_image("generated_images", fake_images, 0) - -Here's the full documentation for the :class:`~pytorch_lightning.loggers.MLFlowLogger`. - ----- - -Neptune.ai -========== -To use `Neptune.ai `_ first install the neptune package: - -.. code-block:: bash - - pip install neptune-client - -or with conda: - -.. code-block:: bash - - conda install -c conda-forge neptune-client - -Configure the logger and pass it to the :class:`~pytorch_lightning.trainer.trainer.Trainer`: - -.. code-block:: python - - from pytorch_lightning.loggers import NeptuneLogger - - neptune_logger = NeptuneLogger( - api_key="ANONYMOUS", # replace with your own - project="common/pytorch-lightning-integration", # format "<WORKSPACE/PROJECT>" - ) - trainer = Trainer(logger=neptune_logger) - -Access the neptune logger from any function (except the LightningModule *init*) to use its API for tracking advanced artifacts - -.. code-block:: python - - class LitModel(LightningModule): - def any_lightning_module_function_or_hook(self): - neptune_logger = self.logger.experiment["your/metadata/structure"] - neptune_logger.log(metadata) - -Here's the full documentation for the :class:`~pytorch_lightning.loggers.NeptuneLogger`. - ----- - -Tensorboard -=========== -`TensorBoard `_ already comes installed with Lightning. If you have uninstalled it, install the following package: - -.. code-block:: bash - - pip install tensorboard - -Configure the logger and pass it to the :class:`~pytorch_lightning.trainer.trainer.Trainer`: - -.. code-block:: python - - from pytorch_lightning.loggers import TensorBoardLogger - - logger = TensorBoardLogger() - trainer = Trainer(logger=logger) - -Access the tensorboard logger from any function (except the LightningModule *init*) to use its API for tracking advanced artifacts - -..
code-block:: python - - class LitModel(LightningModule): - def any_lightning_module_function_or_hook(self): - tensorboard_logger = self.logger.experiment - fake_images = torch.Tensor(32, 3, 28, 28) - tensorboard_logger.add_image("generated_images", fake_images, 0) - -Here's the full documentation for the :class:`~pytorch_lightning.loggers.TensorBoardLogger`. - ----- - -Weights and Biases -================== -To use `Weights and Biases `_ (wandb) first install the wandb package: - -.. code-block:: bash - - pip install wandb - -Configure the logger and pass it to the :class:`~pytorch_lightning.trainer.trainer.Trainer`: - -.. code-block:: python - - from pytorch_lightning.loggers import WandbLogger - - wandb_logger = WandbLogger(project="MNIST", log_model="all") - trainer = Trainer(logger=wandb_logger) - - # log gradients and model topology - wandb_logger.watch(model) - -Access the wandb logger from any function (except the LightningModule *init*) to use its API for tracking advanced artifacts - -.. code-block:: python - - class MyModule(LightningModule): - def any_lightning_module_function_or_hook(self): - wandb_logger = self.logger.experiment - fake_images = torch.Tensor(32, 3, 28, 28) - - # Option 1 - wandb_logger.log({"generated_images": [wandb.Image(fake_images, caption="...")]}) - - # Option 2 for specifically logging images - wandb_logger.log_image(key="generated_images", images=[fake_images]) - -Here's the full documentation for the :class:`~pytorch_lightning.loggers.WandbLogger`. -`Demo in Google Colab `__ with hyperparameter search and model logging. - ----- - -Use multiple exp managers -========================= -To use multiple experiment managers at the same time, pass a list to the *logger* :class:`~pytorch_lightning.trainer.trainer.Trainer` argument. - -.. 
code-block:: python - - from pytorch_lightning.loggers import TensorBoardLogger, WandbLogger - - logger1 = TensorBoardLogger() - logger2 = WandbLogger() - trainer = Trainer(logger=[logger1, logger2]) - - -Access all loggers from any function (except the LightningModule *init*) to use their APIs for tracking advanced artifacts - -.. code-block:: python - - class MyModule(LightningModule): - def any_lightning_module_function_or_hook(self): - tensorboard_logger = self.logger.experiment[0] - wandb_logger = self.logger.experiment[1] - - fake_images = torch.Tensor(32, 3, 28, 28) - - tensorboard_logger.add_image("generated_images", fake_images, 0) - wandb_logger.add_image("generated_images", fake_images, 0)