microsoft · ultmaster · May 28, 2021 · May 11, 2021 · May 11, 2021 · May 12, 2021
diff --git a/docs/en_US/Compression/AutoCompression.rst b/docs/en_US/Compression/AutoCompression.rst
@@ -0,0 +1,101 @@
+Auto Compression with NNI Experiment
+====================================
+
+Auto compression combines NNI model compression with NNI experiments.
+It allows users to define a compressor search space, including compressor types, parameters, etc.
+The user experience is similar to launching an NNI experiment from Python.
+The main differences are as follows:
+
+* Use a generator to help build the search space object.
+* Implement the abstract class ``AbstractAutoCompressModule`` in a class named ``AutoCompressModule``.
+* There is no need to set ``trial_command``; instead, set ``auto_compress_module_file_name``.
+
+Generate search space
+---------------------
+
+Because the search space is heavily nested, we recommend using the generator to configure it.
+The following is an example: use ``add_pruner_config()`` and ``add_quantizer_config()`` to add sub-configs, then call ``dumps()`` to get the search space dict.
+
+.. code-block:: python
+
+    from nni.algorithms.compression.pytorch.auto_compress import AutoCompressSearchSpaceGenerator
+
+    generator = AutoCompressSearchSpaceGenerator()
+    generator.add_pruner_config('level', [
+        {
+            "sparsity": {
+                "_type": "uniform",
+                "_value": [0.01, 0.99]
+            },
+            'op_types': ['default']
+        }
+    ])
+    generator.add_quantizer_config('qat', [
+    {
+        'quant_types': ['weight', 'output'],
+        'quant_bits': {
+            'weight': 8,
+            'output': 8
+        },
+        'op_types': ['Conv2d', 'Linear']
+    }])
+
+    search_space = generator.dumps()
+
+The following pruners and quantizers are currently supported:
+
+.. code-block:: python
+
+    PRUNER_DICT = {
+        'level': LevelPruner,
+        'slim': SlimPruner,
+        'l1': L1FilterPruner,
+        'l2': L2FilterPruner,
+        'fpgm': FPGMPruner,
+        'taylorfo': TaylorFOWeightFilterPruner,
+        'apoz': ActivationAPoZRankFilterPruner,
+        'mean_activation': ActivationMeanRankFilterPruner
+    }
+
+    QUANTIZER_DICT = {
+        'naive': NaiveQuantizer,
+        'qat': QAT_Quantizer,
+        'dorefa': DoReFaQuantizer,
+        'bnn': BNNQuantizer
+    }
+
+Implement ``AbstractAutoCompressModule``
+----------------------------------------
+
+This class will be called by ``AutoCompressEngine`` on the training service.
+Users need to implement at least ``model()`` and ``evaluator()``, and name the class ``AutoCompressModule``.
+The path of the file that contains ``AutoCompressModule`` needs to be specified in the experiment config.
+For the full abstract interface, refer to :githublink:`interface.py <nni/algorithms/compression/pytorch/auto_compress/interface.py>`.
+For an example ``AutoCompressModule`` implementation, refer to :githublink:`auto_compress_module.py <examples/model_compress/auto_compress/torch/auto_compress_module.py>`.
+
+Launch NNI experiment
+---------------------
+
+Launching is similar to launching an experiment from Python; the difference is that there is no need to set ``trial_command``.
+By default, ``auto_compress_module_file_name`` is set to ``./auto_compress_module.py``.
+Remember that ``auto_compress_module_file_name`` is a file path relative to ``trial_code_directory``.
+
+.. code-block:: python
+
+    from pathlib import Path
+    from nni.algorithms.compression.pytorch.auto_compress import AutoCompressExperiment
+
+    experiment = AutoCompressExperiment('local')
+    experiment.config.experiment_name = 'auto compress torch example'
+    experiment.config.trial_concurrency = 1
+    experiment.config.max_trial_number = 10
+    experiment.config.search_space = search_space
+    experiment.config.trial_code_directory = Path(__file__).parent
+    experiment.config.tuner.name = 'TPE'
+    experiment.config.tuner.class_args['optimize_mode'] = 'maximize'
+    experiment.config.training_service.use_active_gpu = True
+
+    # the relative file path under trial_code_directory, which contains the class AutoCompressModule
+    experiment.config.auto_compress_module_file_name = './auto_compress_module.py'
+
+    experiment.run(8088)
diff --git a/docs/en_US/Compression/AutoPruningUsingTuners.rst b/docs/en_US/Compression/AutoPruningUsingTuners.rst
@@ -3,7 +3,7 @@ Automatic Model Pruning using NNI Tuners
 
 It's convenient to implement auto model pruning with NNI compression and NNI tuners
 
-First, model compression with NNI
+First, model pruning with NNI
 ---------------------------------
 
 You can easily compress a model with NNI compression. Take pruning for example, you can prune a pretrained model with L2FilterPruner like this

diff --git a/docs/en_US/Compression/advanced.rst b/docs/en_US/Compression/advanced.rst
@@ -6,4 +6,5 @@ Advanced Usage
 
     Framework <./Framework>
     Customize a new algorithm <./CustomizeCompressor>
-    Automatic Model Compression <./AutoPruningUsingTuners>
+    Automatic Model Pruning <./AutoPruningUsingTuners>
+    Automatic Model Compression (Beta) <./AutoCompression>
diff --git a/examples/model_compress/auto_compress/torch/auto_compress_module.py b/examples/model_compress/auto_compress/torch/auto_compress_module.py
@@ -0,0 +1,120 @@
+# Copyright (c) Microsoft Corporation.
+# Licensed under the MIT license.
+
+from typing import Callable, Optional
+
+import torch
+import torch.nn as nn
+import torch.optim as optim
+import torch.nn.functional as F
+from torch.optim.lr_scheduler import StepLR
+from torchvision import datasets, transforms
+
+from nni.algorithms.compression.pytorch.auto_compress import AbstractAutoCompressModule
+
+# Seed PyTorch's global random number generator so that runs of this example are repeatable.
+torch.manual_seed(1)
+
+class LeNet(nn.Module):
+    """Small convolutional classifier used as the model to be compressed.
+
+    Two 3x3 convolutions are followed by 2x2 max pooling and two linear
+    layers. ``fc1`` expects 9216 (= 64 * 12 * 12) features, which is what a
+    1-channel 28x28 image yields after the convolutions and the pooling.
+    ``forward`` returns log-probabilities over 10 classes.
+    """
+
+    def __init__(self):
+        super().__init__()
+        self.conv1 = nn.Conv2d(1, 32, 3, 1)
+        self.conv2 = nn.Conv2d(32, 64, 3, 1)
+        # Channel-wise dropout, applied to the 4-D feature map after pooling.
+        self.dropout1 = nn.Dropout2d(0.25)
+        # Element-wise dropout: this layer runs on the flattened 2-D activations,
+        # for which ``nn.Dropout2d`` is deprecated in recent PyTorch releases.
+        self.dropout2 = nn.Dropout(0.5)
+        self.fc1 = nn.Linear(9216, 128)
+        self.fc2 = nn.Linear(128, 10)
+
+    def forward(self, x):
+        """Return per-class log-probabilities for the image batch ``x``."""
+        x = self.conv1(x)
+        x = F.relu(x)
+        x = self.conv2(x)
+        x = F.relu(x)
+        x = F.max_pool2d(x, 2)
+        x = self.dropout1(x)
+        # Collapse everything except the batch dimension before the linear layers.
+        x = torch.flatten(x, 1)
+        x = self.fc1(x)
+        x = F.relu(x)
+        x = self.dropout2(x)
+        x = self.fc2(x)
+        output = F.log_softmax(x, dim=1)
+        return output
+
+# Use the GPU when one is available, otherwise fall back to the CPU.
+_use_cuda = torch.cuda.is_available()
+
+# Training batches are shuffled on every device; the evaluation loader keeps
+# the dataset order because ordering does not change the accuracy it reports.
+_train_kwargs = {'batch_size': 64, 'shuffle': True}
+_test_kwargs = {'batch_size': 1000}
+if _use_cuda:
+    # Extra loader options that are applied only when CUDA is available.
+    _cuda_kwargs = {'num_workers': 1,
+                    'pin_memory': True}
+    _train_kwargs.update(_cuda_kwargs)
+    _test_kwargs.update(_cuda_kwargs)
+
+# Convert images to tensors and normalize them
+# (presumably with the MNIST mean and standard deviation -- TODO confirm).
+_transform = transforms.Compose([
+    transforms.ToTensor(),
+    transforms.Normalize((0.1307,), (0.3081,))
+])
+
+# NOTE: importing this module downloads MNIST into ./data if it is not there yet.
+_dataset1 = datasets.MNIST('./data', train=True, download=True, transform=_transform)
+_dataset2 = datasets.MNIST('./data', train=False, transform=_transform)
+_train_loader = torch.utils.data.DataLoader(_dataset1, **_train_kwargs)
+_test_loader = torch.utils.data.DataLoader(_dataset2, **_test_kwargs)
+
+_device = torch.device("cuda" if _use_cuda else "cpu")
+# Number of epochs used both for pre-training and for each fine-tuning run.
+_epoch = 2
+
+def _train(model, optimizer):
+    """Train ``model`` for one pass over ``_train_loader``.
+
+    Every batch is moved to ``_device``, scored with the negative
+    log-likelihood loss and followed by one ``optimizer`` step.
+    """
+    model.train()
+    for inputs, labels in _train_loader:
+        inputs = inputs.to(_device)
+        labels = labels.to(_device)
+        optimizer.zero_grad()
+        batch_loss = F.nll_loss(model(inputs), labels)
+        batch_loss.backward()
+        optimizer.step()
+
+def _test(model):
+    """Evaluate ``model`` on ``_test_loader`` and return its accuracy.
+
+    The average loss and the accuracy are printed; the returned value is the
+    accuracy expressed as a percentage (0-100).
+    """
+    model.eval()
+    num_samples = len(_test_loader.dataset)
+    total_loss = 0
+    num_correct = 0
+    with torch.no_grad():
+        for inputs, labels in _test_loader:
+            inputs, labels = inputs.to(_device), labels.to(_device)
+            log_probs = model(inputs)
+            # Sum (rather than average) per batch so the final mean is per sample.
+            total_loss += F.nll_loss(log_probs, labels, reduction='sum').item()
+            predicted = log_probs.argmax(dim=1, keepdim=True)
+            num_correct += predicted.eq(labels.view_as(predicted)).sum().item()
+    mean_loss = total_loss / num_samples
+    acc = 100 * num_correct / num_samples
+    print('\nTest set: Average loss: {:.4f}, Accuracy: {}/{} ({:.0f}%)\n'.format(
+        mean_loss, num_correct, num_samples, acc))
+    return acc
+
+# Build the model on the selected device and pre-train it at import time, so
+# the module-level ``_model`` already holds trained weights when it is used below.
+_model = LeNet().to(_device)
+
+# Adadelta whose learning rate is multiplied by 0.7 after every epoch.
+_pre_train_optimizer = optim.Adadelta(_model.parameters(), lr=1)
+_scheduler = StepLR(_pre_train_optimizer, step_size=1, gamma=0.7)
+for _ in range(_epoch):
+    _train(_model, _pre_train_optimizer)
+    # Prints the test loss and accuracy reached after this epoch.
+    _test(_model)
+    _scheduler.step()
+
+class AutoCompressModule(AbstractAutoCompressModule):
+    """Example auto-compress module built around the pre-trained ``_model``.
+
+    All hooks are classmethods that hand out the module-level model, an
+    optimizer for it, the evaluation function and a fine-tuning routine.
+    """
+
+    @classmethod
+    def model(cls) -> nn.Module:
+        """Return the module-level model that was pre-trained at import time."""
+        return _model
+
+    @classmethod
+    def optimizer(cls) -> torch.optim.Optimizer:
+        """Return a new SGD optimizer (lr=0.01) over the shared model's parameters."""
+        params = _model.parameters()
+        return torch.optim.SGD(params, lr=0.01)
+
+    @classmethod
+    def evaluator(cls) -> Callable[[nn.Module], float]:
+        """Return the function that scores a model (test accuracy in percent)."""
+        return _test
+
+    @classmethod
+    def finetune_trainer(cls, compressor_type: str, algorithm_name: str) -> Optional[Callable[[nn.Module, optim.Optimizer], None]]:
+        """Return a callable that fine-tunes a model for ``_epoch`` epochs.
+
+        ``compressor_type`` and ``algorithm_name`` are ignored here: the same
+        routine is returned for every compressor.
+        """
+        def _trainer(model, optimizer):
+            for _pass in range(_epoch):
+                _train(model, optimizer)
+
+        return _trainer
diff --git a/examples/model_compress/auto_compress/torch/auto_compress_torch.py b/examples/model_compress/auto_compress/torch/auto_compress_torch.py
@@ -0,0 +1,51 @@
+# Copyright (c) Microsoft Corporation.
+# Licensed under the MIT license.
+
+from pathlib import Path
+
+from nni.algorithms.compression.pytorch.auto_compress import AutoCompressExperiment, AutoCompressSearchSpaceGenerator
+
+# Describe the search space: two pruner entries and one quantizer entry are
+# registered on the generator before it is dumped to a search space dict.
+generator = AutoCompressSearchSpaceGenerator()
+# 'level' pruner on the 'default' op types, sparsity sampled uniformly from [0.01, 0.99].
+generator.add_pruner_config('level', [
+    {
+        "sparsity": {
+            "_type": "uniform",
+            "_value": [0.01, 0.99]
+        },
+        'op_types': ['default']
+    }
+])
+# 'l1' pruner restricted to Conv2d ops, with the same sparsity range.
+generator.add_pruner_config('l1', [
+    {
+        "sparsity": {
+            "_type": "uniform",
+            "_value": [0.01, 0.99]
+        },
+        'op_types': ['Conv2d']
+    }
+])
+# 'qat' quantizer with 8-bit weights and outputs on Conv2d and Linear ops.
+generator.add_quantizer_config('qat', [
+    {
+        'quant_types': ['weight', 'output'],
+        'quant_bits': {
+            'weight': 8,
+            'output': 8
+        },
+        'op_types': ['Conv2d', 'Linear']
+    }])
+# Produce the search space that is handed to the experiment config below.
+search_space = generator.dumps()
+
+# Configure an experiment on the 'local' training service: one trial at a
+# time, at most 10 trials, with the trial code taken from this file's directory.
+experiment = AutoCompressExperiment('local')
+experiment.config.experiment_name = 'auto compress torch example'
+experiment.config.trial_concurrency = 1
+experiment.config.max_trial_number = 10
+experiment.config.search_space = search_space
+experiment.config.trial_code_directory = Path(__file__).parent
+# TPE tuner configured to maximize the metric.
+experiment.config.tuner.name = 'TPE'
+experiment.config.tuner.class_args['optimize_mode'] = 'maximize'
+experiment.config.training_service.use_active_gpu = True
+
+# the relative file path under trial_code_directory, which contains the class AutoCompressModule
+experiment.config.auto_compress_module_file_name = './auto_compress_module.py'
+
+# Start the experiment; 8088 is the port passed to run().
+experiment.run(8088)
diff --git a/nni/algorithms/compression/pytorch/auto_compress/__init__.py b/nni/algorithms/compression/pytorch/auto_compress/__init__.py
@@ -0,0 +1,6 @@
+# Copyright (c) Microsoft Corporation.
+# Licensed under the MIT license.
+
+from .experiment import AutoCompressExperimentConfig, AutoCompressExperiment
+from .interface import AbstractAutoCompressModule
+from .utils import AutoCompressSearchSpaceGenerator