Unverified commit 8459634f, authored by Min Xu, committed by GitHub

[test] cover python 3.7 to 3.9 on CPU (#303)

* [test] cover python 3.7 to 3.9 on CPU

- covering common python versions on CPU tests
- added doc build test

* add doc build test

* skipping failing tests on py39

* catching doc build warnings

* add doc build to py38 and py39

* minor fix

* fix doc build for adascale

* removed dead code

* fix the skipping

* skip unit test for py39

* add failing example

* no more py39 skipping the tests
parent 331aed2c
...@@ -10,11 +10,21 @@ version: 2
# -------------------------------------------------------------------------------------
# Environments to run the jobs in
# -------------------------------------------------------------------------------------
cpu_py37: &cpu_py37
  docker:
    - image: circleci/python:3.7
  resource_class: medium

cpu_py38: &cpu_py38
  docker:
    - image: circleci/python:3.8
  resource_class: medium

cpu_py39: &cpu_py39
  docker:
    - image: circleci/python:3.9
  resource_class: medium

gpu: &gpu
  environment:
    CUDA_VERSION: "10.1"
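The `&cpu_py37`-style anchors above are referenced later in the file with `<<: *cpu_py37` merge keys, so each job inherits its environment's settings. A minimal sketch of what that merge does, emulated with plain Python dicts (the values are copied from the config; the dict-merge is only an analogy for YAML's merge-key semantics):

```python
# Emulate `<<: *cpu_py38` with a dict merge: the job mapping inherits all
# keys from the anchored environment and adds (or overrides) its own.
cpu_py38 = {
    "docker": [{"image": "circleci/python:3.8"}],
    "resource_class": "medium",
}
cpu_tests_py38 = {**cpu_py38, "working_directory": "~/fairscale"}

print(cpu_tests_py38["resource_class"])      # inherited from the anchor
print(cpu_tests_py38["working_directory"])   # defined on the job itself
```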
...@@ -61,7 +71,6 @@ install_dep_160: &install_dep_160
      python -c 'import torch; assert torch.__version__.split(".")[:2] == ["1", "6"], "wrong torch version"'
      python -m torch.utils.collect_env

install_dep_171: &install_dep_171
  - run:
      name: Install Dependencies
...@@ -89,6 +98,32 @@ install_repo_gpu: &install_repo_gpu
      export CUDA_HOME=/usr/local/cuda-10.1
      pip install -e .
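The `install_dep_160` step above guards against an unexpected torch install by comparing the `(major, minor)` prefix of the version string. The same pattern standalone, with a literal string standing in for `torch.__version__` so no torch install is needed:

```python
# Version-guard pattern from the config: split the version string and
# compare only the (major, minor) prefix, ignoring the patch level.
version = "1.6.0"  # stand-in for torch.__version__
assert version.split(".")[:2] == ["1", "6"], "wrong torch version"
print("version check passed")
```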
run_isort: &run_isort
  - run:
      name: Run Linter (isort)
      command: |
        isort . --check

run_black: &run_black
  - run:
      name: Run Linter (black)
      command: |
        black --check .

run_mypy: &run_mypy
  - run:
      name: Run type-checking (mypy)
      command: |
        mypy --ignore-missing-imports --scripts-are-modules --pretty .

run_flake8: &run_flake8
  - run:
      name: Run Linter (flake8)
      command: |
        flake8 --show-source --statistics
run_coverage: &run_coverage
  - run:
      name: Run Unit Tests With Coverage
...@@ -109,11 +144,6 @@ run_mpi_unittests: &run_mpi_unittests
      command: |
        mpirun -n 4 python -m pytest -p torch_pg.pytest --only-mpi --junitxml=test-results/junit.xml --verbose tests/nn/moe

run_pipe_benchmark: &run_pipe_benchmark
  - run:
...@@ -135,20 +165,30 @@ run_oss_gloo: &run_oss_gloo
      python benchmarks/oss.py --gloo --optim_type oss_ddp --epochs 2
      python benchmarks/oss.py --gloo --optim_type oss_sharded_ddp --epochs 2

run_oss_amp: &run_oss_amp
  - run:
      name: Run OSS with Torch AMP
      command: |
        python benchmarks/oss.py --amp --epochs 3 --optim_type oss_sharded_ddp
run_doc_build: &run_doc_build
  - run:
      name: Testing doc build
      command: |
        cd docs
        pip install --progress-bar off -r requirements.txt
        make help
        make singlehtml | tee make.out
        ! tail make.out | grep -q warning
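The last line of `run_doc_build` is the commit's "catching doc build warnings" trick: `! tail make.out | grep -q warning` fails the CI step when the end of the captured build log mentions a warning. The same gate restated in Python, with simulated log lines standing in for real sphinx output:

```python
# Re-statement of `! tail make.out | grep -q warning`: inspect the tail of
# the build log and fail if any line mentions a warning. The log lines here
# are simulated, not actual sphinx output.
log_tail = ["building [singlehtml]: done", "build succeeded."]
has_warning = any("warning" in line for line in log_tail)
print("doc build clean" if not has_warning else "doc build has warnings")
```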
# -------------------------------------------------------------------------------------
# Jobs to run
# -------------------------------------------------------------------------------------
jobs:
  cpu_tests_py37:
    <<: *cpu_py37
    working_directory: ~/fairscale
...@@ -159,41 +199,101 @@ jobs:
      # Cache the venv directory that contains dependencies
      - restore_cache:
          keys:
            - cache-key-cpu-py37-171-{{ checksum "setup.py"}}-{{ checksum "requirements-test.txt"}}
      - <<: *install_dep_171
      - save_cache:
          paths:
            - ~/venv
          key: cache-key-cpu-py37-171-{{ checksum "setup.py"}}-{{ checksum "requirements-test.txt"}}
      - <<: *install_repo_cpu
      - <<: *run_isort
      - <<: *run_black
      - <<: *run_mypy
      - <<: *run_flake8
      - <<: *run_unittests
      - <<: *run_mpi_unittests
      - <<: *run_doc_build
      - store_test_results:
          path: test-results
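The `{{ checksum "setup.py"}}` template in the cache keys above ties the restored venv to the exact contents of the dependency files: editing either file produces a different key, so the stale cache is bypassed and dependencies are reinstalled. An illustrative sketch of that behavior (not CircleCI's implementation; the hash truncation and key format are assumptions):

```python
# Sketch of checksum-based cache keying: the key embeds a hash of the
# dependency file, so any edit to the file yields a different key.
import hashlib


def checksum(data: bytes) -> str:
    # Short hex digest standing in for CircleCI's `checksum` template.
    return hashlib.sha256(data).hexdigest()[:8]


setup_py = b"install_requires=['torch>=1.5.1']\n"
key_before = f"cache-key-cpu-py37-171-{checksum(setup_py)}"

setup_py += b"extras_require={'dev': ['pytest']}\n"  # dependency change
key_after = f"cache-key-cpu-py37-171-{checksum(setup_py)}"

print(key_before != key_after)  # a changed file invalidates the cache
```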
  cpu_tests_py38:
    <<: *cpu_py38
    working_directory: ~/fairscale
    steps:
      - checkout
      - <<: *setup_venv
      # Cache the venv directory that contains dependencies
      - restore_cache:
          keys:
            - cache-key-cpu-py38-171-{{ checksum "setup.py"}}-{{ checksum "requirements-test.txt"}}
      - <<: *install_dep_171
      - save_cache:
          paths:
            - ~/venv
          key: cache-key-cpu-py38-171-{{ checksum "setup.py"}}-{{ checksum "requirements-test.txt"}}
      - <<: *install_repo_cpu
      - <<: *run_isort
      - <<: *run_black
      - <<: *run_mypy
      - <<: *run_flake8
      - <<: *run_unittests
      - <<: *run_mpi_unittests
      - <<: *run_doc_build
      - store_test_results:
          path: test-results
  cpu_tests_py39:
    <<: *cpu_py39
    working_directory: ~/fairscale
    steps:
      - checkout
      - <<: *setup_venv
      # Cache the venv directory that contains dependencies
      - restore_cache:
          keys:
            - cache-key-cpu-py39-171-{{ checksum "setup.py"}}-{{ checksum "requirements-test.txt"}}
      - <<: *install_dep_171
      - save_cache:
          paths:
            - ~/venv
          key: cache-key-cpu-py39-171-{{ checksum "setup.py"}}-{{ checksum "requirements-test.txt"}}
      - <<: *install_repo_cpu
      - <<: *run_isort
      - <<: *run_black
      - <<: *run_mypy
      - <<: *run_flake8
      # FIXME: py39 is still not stable for us, example:
      # https://app.circleci.com/pipelines/github/facebookresearch/fairscale/1349/workflows/534aae41-e01d-404e-bfc1-fdc58566c39c/jobs/5952
      # - <<: *run_unittests
      # example:
      # https://app.circleci.com/pipelines/github/facebookresearch/fairscale/1350/workflows/26ebd69e-777e-491a-ae12-da3154ef80f9/jobs/5953
      # - <<: *run_mpi_unittests
      - <<: *run_doc_build
      - store_test_results:
          path: test-results
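The intermediate commits ("skipping failing tests on py39", later reverted) gated individual tests on the interpreter version rather than disabling the whole step. A hedged sketch of that pattern using the standard-library `unittest` (the test class and condition are illustrative, not fairscale's actual tests):

```python
# Version-gated test skipping: the decorator skips the test only when the
# running interpreter matches the flaky version.
import io
import sys
import unittest


class ExampleTests(unittest.TestCase):
    @unittest.skipIf(sys.version_info[:2] == (3, 9), "not stable on py39 yet")
    def test_basic(self):
        self.assertEqual(1 + 1, 2)


suite = unittest.TestLoader().loadTestsFromTestCase(ExampleTests)
result = unittest.TextTestRunner(stream=io.StringIO()).run(suite)
print("tests run:", result.testsRun)
```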
  gpu_tests_151:
    <<: *gpu
...@@ -342,7 +442,9 @@ workflows:
  version: 2
  build:
    jobs:
      - cpu_tests_py37
      - cpu_tests_py38
      - cpu_tests_py39
      - gpu_tests_151
      - gpu_tests_160
      - gpu_tests_171
...
...@@ -557,10 +557,11 @@ class AdaScale(Optimizer):
        `set_scale` needs to be called to update the scale as well.

        TODO (min): need a way to determine how much to increase the step size?

        TODO (min): having both `set_scale` and `set_num_gradients_to_accumulate`
        is hard to use and easy to get wrong. I think it is better
        to specify a `base_scale`. But more discussion is needed here.

        Args:
            num_gradients_to_accumulate (int):
...
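The coupling the TODO describes comes from how AdaScale's scale is typically derived: the number of data-parallel workers times the number of accumulated gradients, so changing the accumulation count implies a new scale. A hedged sketch of that relationship (the function name and `base_scale` default are illustrative, not fairscale's internals):

```python
# Each accumulated micro-batch contributes to the effective batch like an
# extra data-parallel worker, so both factors multiply into the scale.
def effective_scale(world_size: int,
                    num_gradients_to_accumulate: int,
                    base_scale: float = 1.0) -> float:
    return base_scale * world_size * num_gradients_to_accumulate


print(effective_scale(8, 4))  # 8 GPUs x 4 accumulation steps
```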
# Tools for static checking.
black == 19.10b0
flake8 == 3.7.9
isort == 5.6.4
mypy == 0.790
# Tools for testing & coverage.
pytest == 5.4.1
pytest-cov == 2.10.0
pytest-mpi == 0.4
pytest-timeout == 1.4.2
mpi4py == 3.0.3
# Library dependencies.
torchtext == 0.6.0
torch >= 1.5.1
torchvision >= 0.6.0
# NOTE(msb) not a dependency but needed by torch
numpy == 1.17.4
timm == 0.3.4