Dependency pruning (#528)

* remove cpufeature requirement
* remove psutil requirement

Dependency pruning (#528)
* remove cpufeature requirement
* remove psutil requirement
0dc84200 · Jeff Rasley · GitHub · d779bd53 · 0dc84200 · 0dc84200
Unverified Commit 0dc84200 authored Nov 13, 2020 by Jeff Rasley Committed by GitHub Nov 13, 2020
Showing 3 changed files with 28 additions and 30 deletions

deepspeed/utils/timer.py +11 -2

op_builder/cpu_adam.py +17 -26

requirements/requirements.txt +0 -2

No files found.
--- a/deepspeed/utils/timer.py
+++ b/deepspeed/utils/timer.py
@@ -3,11 +3,17 @@ Copyright 2019 The Microsoft DeepSpeed Team
 '''
 import time
-import psutil
 import torch
 from deepspeed.utils import logger
+try:
+    import psutil
+    PSUTILS_INSTALLED = True
+except ImportError:
+    PSUTILS_INSTALLED = False
+    pass
 def print_rank_0(message):
    if torch.distributed.is_initialized():
@@ -103,7 +109,7 @@ class ThroughputTimer():
                 num_workers,
                 start_step=2,
                 steps_per_output=50,
-                 monitor_memory=True,
+                 monitor_memory=False,
                 logging_fn=None):
        self.start_time = 0
        self.end_time = 0
@@ -124,6 +130,9 @@ class ThroughputTimer():
            self.logging = logger.info
        self.initialized = False
+        if self.monitor_memory and not PSUTILS_INSTALLED:
+            raise ImportError("Unable to import 'psutils', please install package")
    def update_epoch_count(self):
        self.epoch_count += 1
        self.local_step_count = 0

--- a/op_builder/cpu_adam.py
+++ b/op_builder/cpu_adam.py
 import os
 import torch
-import warnings
+import subprocess
 from .builder import CUDAOpBuilder
@@ -21,35 +21,26 @@ class CPUAdamBuilder(CUDAOpBuilder):
        CUDA_INCLUDE = os.path.join(torch.utils.cpp_extension.CUDA_HOME, "include")
        return ['csrc/includes', CUDA_INCLUDE]
-    def available_vector_instructions(self):
+    def simd_width(self):
-        try:
+        if not self.command_exists('lscpu'):
-            import cpufeature
+            self.warning(
-        except ImportError:
+                "CPUAdam attempted to query 'lscpu' to detect the existence "
-            warnings.warn(
+                "of AVX instructions. However, 'lscpu' does not appear to exist on "
-                f'import cpufeature failed - CPU vector optimizations are not available for CPUAdam'
+                "your system, will fall back to non-vectorized execution.")
-            )
+            return ''
-            return {}
-        cpu_vector_instructions = {}
+        result = subprocess.check_output('lscpu', shell=True)
-        try:
+        result = result.decode('utf-8').strip().lower()
-            cpu_vector_instructions = cpufeature.CPUFeature
+        if 'genuineintel' in result:
-        except _:
+            if 'avx512' in result:
-            warnings.warn(
+                return '-D__AVX512__'
-                f'cpufeature.CPUFeature failed - CPU vector optimizations are not available for CPUAdam'
+            elif 'avx2' in result:
-            )
+                return '-D__AVX256__'
-            return {}
+        return ''
-        return cpu_vector_instructions
    def cxx_args(self):
        CUDA_LIB64 = os.path.join(torch.utils.cpp_extension.CUDA_HOME, "lib64")
-        cpu_info = self.available_vector_instructions()
+        SIMD_WIDTH = self.simd_width()
-        SIMD_WIDTH = ''
-        if 'Intel' in cpu_info.get('VendorId', ''):
-            if cpu_info.get('AVX512f', False):
-                SIMD_WIDTH = '-D__AVX512__'
-            elif cpu_info.get('AVX2', False):
-                SIMD_WIDTH = '-D__AVX256__'
        return [
            '-O3',

--- a/requirements/requirements.txt
+++ b/requirements/requirements.txt
 torch>=1.2
 torchvision>=0.4.0
 tqdm
-psutil
 tensorboardX==1.8
 ninja
-cpufeature