From 9778ebe2b4fb913fd1d7eaeceff83de8b8716885 Mon Sep 17 00:00:00 2001
From: Chris Yeh <chrisyeh96@users.noreply.github.com>
Date: Tue, 28 Jul 2020 16:42:49 -0600
Subject: [PATCH 1/3] Cosmetic improvements to code

1) Use PyTorch's own nn.Identity() function.

2) Update minimum Python version to 3.6 because of the use of f-strings.

3) Remove excess whitespace
---
 efficientnet_pytorch/__init__.py |  1 -
 efficientnet_pytorch/model.py    | 28 ++++++++++++-------------
 efficientnet_pytorch/utils.py    | 36 +++++++++++---------------------
 3 files changed, 26 insertions(+), 39 deletions(-)

diff --git a/efficientnet_pytorch/__init__.py b/efficientnet_pytorch/__init__.py
index a101872..b66a907 100644
--- a/efficientnet_pytorch/__init__.py
+++ b/efficientnet_pytorch/__init__.py
@@ -7,4 +7,3 @@
     efficientnet,
     get_model_params,
 )
-
diff --git a/efficientnet_pytorch/model.py b/efficientnet_pytorch/model.py
index dfa095e..761fde3 100755
--- a/efficientnet_pytorch/model.py
+++ b/efficientnet_pytorch/model.py
@@ -76,7 +76,7 @@ def __init__(self, block_args, global_params, image_size=None):
 
         # Squeeze and Excitation layer, if desired
         if self.has_se:
-            Conv2d = get_same_padding_conv2d(image_size=(1,1))
+            Conv2d = get_same_padding_conv2d(image_size=(1, 1))
             num_squeezed_channels = max(1, int(self._block_args.input_filters * self._block_args.se_ratio))
             self._se_reduce = Conv2d(in_channels=oup, out_channels=num_squeezed_channels, kernel_size=1)
             self._se_expand = Conv2d(in_channels=num_squeezed_channels, out_channels=oup, kernel_size=1)
@@ -147,7 +147,7 @@ class EfficientNet(nn.Module):
     Args:
         blocks_args (list[namedtuple]): A list of BlockArgs to construct blocks.
         global_params (namedtuple): A set of GlobalParams shared between blocks.
-    
+
     References:
         [1] https://arxiv.org/abs/1905.11946 (EfficientNet)
 
@@ -277,7 +277,7 @@ def extract_features(self, inputs):
             inputs (tensor): Input tensor.
 
         Returns:
-            Output of the final convolution 
+            Output of the final convolution
             layer in the efficientnet model.
         """
         # Stem
@@ -289,7 +289,7 @@ def extract_features(self, inputs):
             if drop_connect_rate:
                 drop_connect_rate *= float(idx) / len(self._blocks) # scale drop connect_rate
             x = block(x, drop_connect_rate=drop_connect_rate)
-        
+
         # Head
         x = self._swish(self._bn1(self._conv_head(x)))
 
@@ -323,7 +323,7 @@ def from_name(cls, model_name, in_channels=3, **override_params):
         Args:
             model_name (str): Name for efficientnet.
             in_channels (int): Input data's channel number.
-            override_params (other key word params): 
+            override_params (other key word params):
                 Params to override model's global_params.
                 Optional key:
                     'width_coefficient', 'depth_coefficient',
@@ -342,35 +342,35 @@ def from_name(cls, model_name, in_channels=3, **override_params):
         return model
 
     @classmethod
-    def from_pretrained(cls, model_name, weights_path=None, advprop=False, 
+    def from_pretrained(cls, model_name, weights_path=None, advprop=False,
                         in_channels=3, num_classes=1000, **override_params):
         """create an efficientnet model according to name.
 
         Args:
             model_name (str): Name for efficientnet.
-            weights_path (None or str): 
+            weights_path (None or str):
                 str: path to pretrained weights file on the local disk.
                 None: use pretrained weights downloaded from the Internet.
-            advprop (bool): 
+            advprop (bool):
                 Whether to load pretrained weights
                 trained with advprop (valid when weights_path is None).
             in_channels (int): Input data's channel number.
-            num_classes (int): 
+            num_classes (int):
                 Number of categories for classification.
                 It controls the output size for final linear layer.
-            override_params (other key word params): 
+            override_params (other key word params):
                 Params to override model's global_params.
                 Optional key:
                     'width_coefficient', 'depth_coefficient',
                     'image_size', 'dropout_rate',
-                    'num_classes', 'batch_norm_momentum',
+                    'batch_norm_momentum',
                     'batch_norm_epsilon', 'drop_connect_rate',
                     'depth_divisor', 'min_depth'
 
         Returns:
             A pretrained efficientnet model.
         """
-        model = cls.from_name(model_name, num_classes = num_classes, **override_params)
+        model = cls.from_name(model_name, num_classes=num_classes, **override_params)
         load_pretrained_weights(model, model_name, weights_path=weights_path, load_fc=(num_classes == 1000), advprop=advprop)
         model._change_in_channels(in_channels)
         return model
@@ -391,7 +391,7 @@ def get_image_size(cls, model_name):
 
     @classmethod
     def _check_model_name_is_valid(cls, model_name):
-        """Validates model name. 
+        """Validates model name.
 
         Args:
             model_name (str): Name for efficientnet.
@@ -409,6 +409,6 @@ def _change_in_channels(self, in_channels):
             in_channels (int): Input data's channel number.
         """
         if in_channels != 3:
-            Conv2d = get_same_padding_conv2d(image_size = self._global_params.image_size)
+            Conv2d = get_same_padding_conv2d(image_size=self._global_params.image_size)
             out_channels = round_filters(32, self._global_params)
             self._conv_stem = Conv2d(in_channels, out_channels, kernel_size=3, stride=2, bias=False)
diff --git a/efficientnet_pytorch/utils.py b/efficientnet_pytorch/utils.py
index da92838..0725c6e 100755
--- a/efficientnet_pytorch/utils.py
+++ b/efficientnet_pytorch/utils.py
@@ -34,7 +34,6 @@
 #     MaxPool2dStaticSamePadding
 #     It's an additional function, not used in EfficientNet,
 #     but can be used in other model (such as EfficientDet).
-# Identity: An implementation of identical mapping
 
 # Parameters for the entire model (stem, all blocks, and head)
 GlobalParams = collections.namedtuple('GlobalParams', [
@@ -125,7 +124,7 @@ def round_repeats(repeats, global_params):
 
 def drop_connect(inputs, p, training):
     """Drop connect.
-       
+
     Args:
         input (tensor: BCWH): Input of this structure.
         p (float: 0.0~1.0): Probability of drop connection.
@@ -134,7 +133,7 @@ def drop_connect(inputs, p, training):
     Returns:
         output: Output after drop connection.
     """
-    assert p >= 0 and p <= 1, 'p must be in range of [0,1]'
+    assert 0 <= p <= 1, 'p must be in range of [0,1]'
 
     if not training:
         return inputs
@@ -188,7 +187,7 @@ def calculate_output_image_size(input_image_size, stride):
     return [image_height, image_width]
 
 
-# Note: 
+# Note:
 # The following 'SamePadding' functions make output size equal ceil(input size/stride).
 # Only when stride equals 1, can the output size be the same as input size.
 # Don't be confused by their function names ! ! !
@@ -264,7 +263,7 @@ def __init__(self, in_channels, out_channels, kernel_size, stride=1, image_size=
         if pad_h > 0 or pad_w > 0:
             self.static_padding = nn.ZeroPad2d((pad_w // 2, pad_w - pad_w // 2, pad_h // 2, pad_h - pad_h // 2))
         else:
-            self.static_padding = Identity()
+            self.static_padding = nn.Identity()
 
     def forward(self, x):
         x = self.static_padding(x)
@@ -333,7 +332,7 @@ def __init__(self, kernel_size, stride, image_size=None, **kwargs):
         if pad_h > 0 or pad_w > 0:
             self.static_padding = nn.ZeroPad2d((pad_w // 2, pad_w - pad_w // 2, pad_h // 2, pad_h - pad_h // 2))
         else:
-            self.static_padding = Identity()
+            self.static_padding = nn.Identity()
 
     def forward(self, x):
         x = self.static_padding(x)
@@ -341,17 +340,6 @@ def forward(self, x):
                          self.dilation, self.ceil_mode, self.return_indices)
         return x
 
-class Identity(nn.Module):
-    """Identity mapping.
-       Send input to output directly.
-    """
-
-    def __init__(self):
-        super(Identity, self).__init__()
-
-    def forward(self, input):
-        return input
-
 
 ################################################################################
 ### Helper functions for loading model params
@@ -549,7 +537,7 @@ def get_model_params(model_name, override_params):
         blocks_args, global_params = efficientnet(
             width_coefficient=w, depth_coefficient=d, dropout_rate=p, image_size=s)
     else:
-        raise NotImplementedError('model name is not pre-defined: %s' % model_name)
+        raise NotImplementedError('model name is not pre-defined: {}'.format(model_name))
     if override_params:
         # ValueError will be raised here if override_params has fields not included in global_params.
         global_params = global_params._replace(**override_params)
@@ -592,29 +580,29 @@ def load_pretrained_weights(model, model_name, weights_path=None, load_fc=True,
     Args:
         model (Module): The whole model of efficientnet.
         model_name (str): Model name of efficientnet.
-        weights_path (None or str): 
+        weights_path (None or str):
             str: path to pretrained weights file on the local disk.
             None: use pretrained weights downloaded from the Internet.
         load_fc (bool): Whether to load pretrained weights for fc layer at the end of the model.
         advprop (bool): Whether to load pretrained weights
                         trained with advprop (valid when weights_path is None).
     """
-    if isinstance(weights_path,str):
+    if isinstance(weights_path, str):
         state_dict = torch.load(weights_path)
     else:
         # AutoAugment or Advprop (different preprocessing)
         url_map_ = url_map_advprop if advprop else url_map
         state_dict = model_zoo.load_url(url_map_[model_name])
-    
+
     if load_fc:
         ret = model.load_state_dict(state_dict, strict=False)
-        assert not ret.missing_keys, f'Missing keys when loading pretrained weights: {ret.missing_keys}'
+        assert not ret.missing_keys, 'Missing keys when loading pretrained weights: {}'.format(ret.missing_keys)
     else:
         state_dict.pop('_fc.weight')
         state_dict.pop('_fc.bias')
         ret = model.load_state_dict(state_dict, strict=False)
         assert set(ret.missing_keys) == set(
-            ['_fc.weight', '_fc.bias']), f'Missing keys when loading pretrained weights: {ret.missing_keys}'
-    assert not ret.unexpected_keys, f'Missing keys when loading pretrained weights: {ret.unexpected_keys}'
+            ['_fc.weight', '_fc.bias']), 'Missing keys when loading pretrained weights: {}'.format(ret.missing_keys)
+    assert not ret.unexpected_keys, 'Missing keys when loading pretrained weights: {}'.format(ret.unexpected_keys)
 
     print('Loaded pretrained weights for {}'.format(model_name))

From f438ddbadf17fb8bbc143521a6dd0caa76a652ed Mon Sep 17 00:00:00 2001
From: Chris Yeh <chrisyeh96@users.noreply.github.com>
Date: Tue, 28 Jul 2020 16:50:02 -0600
Subject: [PATCH 2/3] Lint README.md

---
 README.md | 69 +++++++++++++++++++++++++++----------------------------
 1 file changed, 34 insertions(+), 35 deletions(-)

diff --git a/README.md b/README.md
index a361872..4207fd5 100644
--- a/README.md
+++ b/README.md
@@ -1,6 +1,6 @@
 # EfficientNet PyTorch
 
-### Quickstart 
+### Quickstart
 
 Install with `pip install efficientnet_pytorch` and load a pretrained EfficientNet with:
 ```python
@@ -12,24 +12,23 @@ model = EfficientNet.from_pretrained('efficientnet-b0')
 
 #### Update (May 14, 2020)
 
-This update adds comprehensive comments and documentation (thanks to @workingcoder). 
+This update adds comprehensive comments and documentation (thanks to @workingcoder).
 
 #### Update (January 23, 2020)
 
 This update adds a new category of pre-trained model based on adversarial training, called _advprop_. It is important to note that the preprocessing required for the advprop pretrained models is slightly different from normal ImageNet preprocessing. As a result, by default, advprop models are not used. To load a model with advprop, use:
-```
+```python
 model = EfficientNet.from_pretrained("efficientnet-b0", advprop=True)
 ```
 There is also a new, large `efficientnet-b8` pretrained model that is only available in advprop form. When using these models, replace ImageNet preprocessing code as follows:
-```
+```python
 if advprop:  # for models using advprop pretrained weights
     normalize = transforms.Lambda(lambda img: img * 2.0 - 1.0)
 else:
-    normalize = transforms.Normalize(mean=[0.485, 0.456, 0.406], 
+    normalize = transforms.Normalize(mean=[0.485, 0.456, 0.406],
                                      std=[0.229, 0.224, 0.225])
-
 ```
-This update also addresses multiple other issues ([#115](https://github.com/lukemelas/EfficientNet-PyTorch/issues/115), [#128](https://github.com/lukemelas/EfficientNet-PyTorch/issues/128)). 
+This update also addresses multiple other issues ([#115](https://github.com/lukemelas/EfficientNet-PyTorch/issues/115), [#128](https://github.com/lukemelas/EfficientNet-PyTorch/issues/128)).
 
 #### Update (October 15, 2019)
 
@@ -37,21 +36,21 @@ This update allows you to choose whether to use a memory-efficient Swish activat
 
 #### Update (October 12, 2019)
 
-This update makes the Swish activation function more memory-efficient. It also addresses pull requests [#72](https://github.com/lukemelas/EfficientNet-PyTorch/pull/72), [#73](https://github.com/lukemelas/EfficientNet-PyTorch/pull/73), [#85](https://github.com/lukemelas/EfficientNet-PyTorch/pull/85), and [#86](https://github.com/lukemelas/EfficientNet-PyTorch/pull/86). Thanks to the authors of all the pull requests! 
+This update makes the Swish activation function more memory-efficient. It also addresses pull requests [#72](https://github.com/lukemelas/EfficientNet-PyTorch/pull/72), [#73](https://github.com/lukemelas/EfficientNet-PyTorch/pull/73), [#85](https://github.com/lukemelas/EfficientNet-PyTorch/pull/85), and [#86](https://github.com/lukemelas/EfficientNet-PyTorch/pull/86). Thanks to the authors of all the pull requests!
 
 #### Update (July 31, 2019)
 
 _Upgrade the pip package with_ `pip install --upgrade efficientnet-pytorch`
 
-The B6 and B7 models are now available. Additionally, _all_ pretrained models have been updated to use AutoAugment preprocessing, which translates to better performance across the board. Usage is the same as before: 
+The B6 and B7 models are now available. Additionally, _all_ pretrained models have been updated to use AutoAugment preprocessing, which translates to better performance across the board. Usage is the same as before:
 ```python
 from efficientnet_pytorch import EfficientNet
-model = EfficientNet.from_pretrained('efficientnet-b7') 
+model = EfficientNet.from_pretrained('efficientnet-b7')
 ```
 
 #### Update (June 29, 2019)
 
-This update adds easy model exporting ([#20](https://github.com/lukemelas/EfficientNet-PyTorch/issues/20)) and feature extraction ([#38](https://github.com/lukemelas/EfficientNet-PyTorch/issues/38)). 
+This update adds easy model exporting ([#20](https://github.com/lukemelas/EfficientNet-PyTorch/issues/20)) and feature extraction ([#38](https://github.com/lukemelas/EfficientNet-PyTorch/issues/38)).
 
  * [Example: Export to ONNX](#example-export)
  * [Example: Extract features](#example-feature-extraction)
@@ -60,29 +59,29 @@ This update adds easy model exporting ([#20](https://github.com/lukemelas/Effici
 It is also now incredibly simple to load a pretrained model with a new number of classes for transfer learning:
 ```python
 model = EfficientNet.from_pretrained('efficientnet-b1', num_classes=23)
-``` 
+```
 
 
 #### Update (June 23, 2019)
 
-The B4 and B5 models are now available. Their usage is identical to the other models: 
+The B4 and B5 models are now available. Their usage is identical to the other models:
 ```python
 from efficientnet_pytorch import EfficientNet
-model = EfficientNet.from_pretrained('efficientnet-b4') 
+model = EfficientNet.from_pretrained('efficientnet-b4')
 ```
 
 ### Overview
-This repository contains an op-for-op PyTorch reimplementation of [EfficientNet](https://arxiv.org/abs/1905.11946), along with pre-trained models and examples. 
+This repository contains an op-for-op PyTorch reimplementation of [EfficientNet](https://arxiv.org/abs/1905.11946), along with pre-trained models and examples.
 
-The goal of this implementation is to be simple, highly extensible, and easy to integrate into your own projects. This implementation is a work in progress -- new features are currently being implemented. 
+The goal of this implementation is to be simple, highly extensible, and easy to integrate into your own projects. This implementation is a work in progress -- new features are currently being implemented.
 
-At the moment, you can easily:  
- * Load pretrained EfficientNet models 
- * Use EfficientNet models for classification or feature extraction 
+At the moment, you can easily:
+ * Load pretrained EfficientNet models
+ * Use EfficientNet models for classification or feature extraction
  * Evaluate EfficientNet models on ImageNet or your own images
 
 _Upcoming features_: In the next few days, you will be able to:
- * Train new models from scratch on ImageNet with a simple command 
+ * Train new models from scratch on ImageNet with a simple command
  * Quickly finetune an EfficientNet on your own dataset
  * Export EfficientNet models for production
 
@@ -95,11 +94,11 @@ _Upcoming features_: In the next few days, you will be able to:
     * [Example: Classify](#example-classification)
     * [Example: Extract features](#example-feature-extraction)
     * [Example: Export to ONNX](#example-export)
-6. [Contributing](#contributing) 
+6. [Contributing](#contributing)
 
 ### About EfficientNet
 
-If you're new to EfficientNets, here is an explanation straight from the official TensorFlow implementation: 
+If you're new to EfficientNets, here is an explanation straight from the official TensorFlow implementation:
 
 EfficientNets are a family of image classification models, which achieve state-of-the-art accuracy, yet being an order-of-magnitude smaller and faster than previous models. We develop EfficientNets based on AutoML and Compound Scaling. In particular, we first use [AutoML Mobile framework](https://ai.googleblog.com/2018/08/mnasnet-towards-automating-design-of.html) to develop a mobile-size baseline network, named as EfficientNet-B0; Then, we use the compound scaling method to scale up this baseline to obtain EfficientNet-B1 to B7.
 
@@ -141,25 +140,25 @@ Or install from source:
 git clone https://github.com/lukemelas/EfficientNet-PyTorch
 cd EfficientNet-Pytorch
 pip install -e .
-``` 
+```
 
 ### Usage
 
 #### Loading pretrained models
 
-Load an EfficientNet:  
+Load an EfficientNet:
 ```python
 from efficientnet_pytorch import EfficientNet
 model = EfficientNet.from_name('efficientnet-b0')
 ```
 
-Load a pretrained EfficientNet: 
+Load a pretrained EfficientNet:
 ```python
 from efficientnet_pytorch import EfficientNet
 model = EfficientNet.from_pretrained('efficientnet-b0')
 ```
 
-Details about the models are below: 
+Details about the models are below:
 
 |    *Name*         |*# Params*|*Top-1 Acc.*|*Pretrained?*|
 |:-----------------:|:--------:|:----------:|:-----------:|
@@ -177,7 +176,7 @@ Details about the models are below:
 
 Below is a simple, complete example. It may also be found as a jupyter notebook in `examples/simple` or as a [Colab Notebook](https://colab.research.google.com/drive/1Jw28xZ1NJq4Cja4jLe6tJ6_F5lCzElb4).
 
-We assume that in your current directory, there is a `img.jpg` file and a `labels_map.txt` file (ImageNet class names). These are both included in `examples/simple`. 
+We assume that in your current directory, there is a `img.jpg` file and a `labels_map.txt` file (ImageNet class names). These are both included in `examples/simple`.
 
 ```python
 import json
@@ -210,7 +209,7 @@ for idx in torch.topk(outputs, k=5).indices.squeeze(0).tolist():
     print('{label:<75} ({p:.2f}%)'.format(label=labels_map[idx], p=prob*100))
 ```
 
-#### Example: Feature Extraction 
+#### Example: Feature Extraction
 
 You can easily extract features with `model.extract_features`:
 ```python
@@ -224,20 +223,20 @@ features = model.extract_features(img)
 print(features.shape) # torch.Size([1, 1280, 7, 7])
 ```
 
-#### Example: Export to ONNX  
+#### Example: Export to ONNX
 
-Exporting to ONNX for deploying to production is now simple: 
+Exporting to ONNX for deploying to production is now simple:
 ```python
-import torch 
+import torch
 from efficientnet_pytorch import EfficientNet
 
 model = EfficientNet.from_pretrained('efficientnet-b1')
 dummy_input = torch.randn(10, 3, 240, 240)
 
 torch.onnx.export(model, dummy_input, "test-b1.onnx", verbose=True)
-``` 
+```
 
-[Here](https://colab.research.google.com/drive/1rOAEXeXHaA8uo3aG2YcFDHItlRJMV0VP) is a Colab example. 
+[Here](https://colab.research.google.com/drive/1rOAEXeXHaA8uo3aG2YcFDHItlRJMV0VP) is a Colab example.
 
 
 #### ImageNet
@@ -246,6 +245,6 @@ See `examples/imagenet` for details about evaluating on ImageNet.
 
 ### Contributing
 
-If you find a bug, create a GitHub issue, or even better, submit a pull request. Similarly, if you have questions, simply post them as GitHub issues.   
+If you find a bug, create a GitHub issue, or even better, submit a pull request. Similarly, if you have questions, simply post them as GitHub issues.
 
-I look forward to seeing what the community does with these models! 
+I look forward to seeing what the community does with these models!

From 85e0a35c6c1b8bed9428b4c06c8cb7d0e2cbcc4f Mon Sep 17 00:00:00 2001
From: Chris Yeh <chrisyeh96@users.noreply.github.com>
Date: Thu, 30 Jul 2020 00:12:01 -0600
Subject: [PATCH 3/3] remove f-strings

---
 efficientnet_pytorch/model.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/efficientnet_pytorch/model.py b/efficientnet_pytorch/model.py
index 761fde3..3efabfa 100755
--- a/efficientnet_pytorch/model.py
+++ b/efficientnet_pytorch/model.py
@@ -261,12 +261,12 @@ def extract_endpoints(self, inputs):
                 drop_connect_rate *= float(idx) / len(self._blocks) # scale drop connect_rate
             x = block(x, drop_connect_rate=drop_connect_rate)
             if prev_x.size(2) > x.size(2):
-                endpoints[f'reduction_{len(endpoints)+1}'] = prev_x
+                endpoints['reduction_{}'.format(len(endpoints)+1)] = prev_x
             prev_x = x
 
         # Head
         x = self._swish(self._bn1(self._conv_head(x)))
-        endpoints[f'reduction_{len(endpoints)+1}'] = x
+        endpoints['reduction_{}'.format(len(endpoints)+1)] = x
 
         return endpoints