@@ -50,7 +50,7 @@ class MBConvBlock(nn.Module):
     def __init__(self, block_args, global_params, image_size=None):
         super().__init__()
         self._block_args = block_args
-        self._bn_mom = 1 - global_params.batch_norm_momentum # pytorch's difference from tensorflow
+        self._bn_mom = 1 - global_params.batch_norm_momentum  # pytorch's difference from tensorflow
         self._bn_eps = global_params.batch_norm_epsilon
         self.has_se = (self._block_args.se_ratio is not None) and (0 < self._block_args.se_ratio <= 1)
         self.id_skip = block_args.id_skip  # whether to use skip connection and drop connect
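A note on the momentum flip in this hunk: TensorFlow's batch-norm `momentum` is the weight kept on the running statistics, while PyTorch's `momentum` is the weight given to the new batch statistics, so the two conventions are complements. A minimal sketch with the EfficientNet default of 0.99 (values assumed for illustration):

```python
import torch.nn as nn

tf_batch_norm_momentum = 0.99              # TF: weight kept on the running stats
pt_momentum = 1 - tf_batch_norm_momentum   # PyTorch: weight given to the new batch

# PyTorch update: running = (1 - momentum) * running + momentum * batch_stat
bn = nn.BatchNorm2d(num_features=32, momentum=pt_momentum, eps=1e-3)
```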
@@ -152,9 +152,7 @@ class EfficientNet(nn.Module):
         [1] https://arxiv.org/abs/1905.11946 (EfficientNet)
 
     Example:
-
-
-        import torch
+        >>> import torch
         >>> from efficientnet.model import EfficientNet
         >>> inputs = torch.rand(1, 3, 224, 224)
         >>> model = EfficientNet.from_pretrained('efficientnet-b0')
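The fixed doctest can also run as a plain script; a minimal smoke test, assuming the package imports as `efficientnet` the way the docstring shows:

```python
import torch
from efficientnet.model import EfficientNet

model = EfficientNet.from_pretrained('efficientnet-b0')
model.eval()  # inference mode: disables dropout, uses running BN statistics

with torch.no_grad():
    outputs = model(torch.rand(1, 3, 224, 224))
print(outputs.shape)  # torch.Size([1, 1000]) with the default classifier head
```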
@@ -198,7 +196,7 @@ def __init__(self, blocks_args=None, global_params=None):
             # The first block needs to take care of stride and filter size increase.
             self._blocks.append(MBConvBlock(block_args, self._global_params, image_size=image_size))
             image_size = calculate_output_image_size(image_size, block_args.stride)
-            if block_args.num_repeat > 1: # modify block_args to keep same output size
+            if block_args.num_repeat > 1:  # modify block_args to keep same output size
                 block_args = block_args._replace(input_filters=block_args.output_filters, stride=1)
             for _ in range(block_args.num_repeat - 1):
                 self._blocks.append(MBConvBlock(block_args, self._global_params, image_size=image_size))
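The `_replace` call works because `block_args` is a namedtuple: within a stage, only the first block downsamples and widens, so the remaining `num_repeat - 1` copies take the stage's output width as input and run at stride 1. A toy illustration with a hypothetical, reduced `BlockArgs`:

```python
from collections import namedtuple

# Hypothetical, reduced stand-in for the real BlockArgs namedtuple.
BlockArgs = namedtuple('BlockArgs', 'num_repeat input_filters output_filters stride')

block_args = BlockArgs(num_repeat=3, input_filters=16, output_filters=24, stride=2)
blocks = [block_args]  # first block: 16 -> 24 channels, downsamples by 2

if block_args.num_repeat > 1:
    # later repeats keep the stage's resolution and channel count
    block_args = block_args._replace(input_filters=block_args.output_filters, stride=1)
for _ in range(block_args.num_repeat - 1):
    blocks.append(block_args)

for b in blocks:
    print(b.input_filters, '->', b.output_filters, 'stride', b.stride)
# 16 -> 24 stride 2
# 24 -> 24 stride 1
# 24 -> 24 stride 1
```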
@@ -213,16 +211,18 @@ def __init__(self, blocks_args=None, global_params=None):
 
         # Final linear layer
         self._avg_pooling = nn.AdaptiveAvgPool2d(1)
-        self._dropout = nn.Dropout(self._global_params.dropout_rate)
-        self._fc = nn.Linear(out_channels, self._global_params.num_classes)
+        if self._global_params.include_top:
+            self._dropout = nn.Dropout(self._global_params.dropout_rate)
+            self._fc = nn.Linear(out_channels, self._global_params.num_classes)
+
+        # set activation to memory efficient swish by default
         self._swish = MemoryEfficientSwish()
 
     def set_swish(self, memory_efficient=True):
         """Sets swish function as memory efficient (for training) or standard (for export).
 
         Args:
             memory_efficient (bool): Whether to use memory-efficient version of swish.
-
         """
         self._swish = MemoryEfficientSwish() if memory_efficient else Swish()
         for block in self._blocks:
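The new `include_top` flag makes the classifier head optional, which matters when the network is used as a feature backbone: with the head skipped, no unused `Dropout`/`Linear` parameters are created, initialized, or exported. A minimal sketch, assuming `include_top` is accepted as an override parameter like the other `GlobalParams` fields:

```python
from efficientnet.model import EfficientNet

# Full model: pooling -> dropout -> fc producing num_classes logits.
clf = EfficientNet.from_name('efficientnet-b0')

# Backbone only: the dropout/fc layers above are never constructed.
backbone = EfficientNet.from_name('efficientnet-b0', include_top=False)

# As the set_swish docstring suggests, swap in the standard Swish before
# tracing or ONNX export; the memory-efficient autograd version is for training.
backbone.set_swish(memory_efficient=False)
```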
@@ -261,17 +261,17 @@ def extract_endpoints(self, inputs):
         for idx, block in enumerate(self._blocks):
             drop_connect_rate = self._global_params.drop_connect_rate
             if drop_connect_rate:
-                drop_connect_rate *= float(idx) / len(self._blocks) # scale drop connect_rate
+                drop_connect_rate *= float(idx) / len(self._blocks)  # scale drop connect_rate
             x = block(x, drop_connect_rate=drop_connect_rate)
             if prev_x.size(2) > x.size(2):
-                endpoints['reduction_{}'.format(len(endpoints)+1)] = prev_x
+                endpoints['reduction_{}'.format(len(endpoints) + 1)] = prev_x
             elif idx == len(self._blocks) - 1:
-                endpoints['reduction_{}'.format(len(endpoints)+1)] = x
+                endpoints['reduction_{}'.format(len(endpoints) + 1)] = x
             prev_x = x
 
         # Head
         x = self._swish(self._bn1(self._conv_head(x)))
-        endpoints['reduction_{}'.format(len(endpoints)+1)] = x
+        endpoints['reduction_{}'.format(len(endpoints) + 1)] = x
 
         return endpoints
 
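`extract_endpoints` records a feature map each time the spatial size shrinks, which is what FPN-style decoders consume. A usage sketch; the shapes in the comments are the standard EfficientNet-B0 reductions for a 224x224 input and may differ across versions:

```python
import torch
from efficientnet.model import EfficientNet

model = EfficientNet.from_name('efficientnet-b0')
endpoints = model.extract_endpoints(torch.rand(1, 3, 224, 224))

for name, feat in endpoints.items():
    print(name, tuple(feat.shape))
# reduction_1 (1, 16, 112, 112)
# reduction_2 (1, 24, 56, 56)
# reduction_3 (1, 40, 28, 28)
# reduction_4 (1, 112, 14, 14)
# reduction_5 (1, 320, 7, 7)
# reduction_6 (1, 1280, 7, 7)   <- recorded after the conv head
```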
@@ -292,7 +292,7 @@ def extract_features(self, inputs):
         for idx, block in enumerate(self._blocks):
             drop_connect_rate = self._global_params.drop_connect_rate
             if drop_connect_rate:
-                drop_connect_rate *= float(idx) / len(self._blocks) # scale drop connect_rate
+                drop_connect_rate *= float(idx) / len(self._blocks)  # scale drop connect_rate
             x = block(x, drop_connect_rate=drop_connect_rate)
 
         # Head
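Both extractors scale drop connect linearly with depth, following the stochastic-depth schedule: block 0 is never dropped, and the rate approaches the configured maximum at the last block. A worked example with the usual defaults (0.2 maximum; B0 has 16 MBConv blocks):

```python
drop_connect_rate = 0.2   # global maximum (EfficientNet default)
num_blocks = 16           # number of MBConv blocks in EfficientNet-B0

for idx in range(num_blocks):
    rate = drop_connect_rate * float(idx) / num_blocks
    print(idx, round(rate, 4))
# 0 -> 0.0, 8 -> 0.1, 15 -> 0.1875: deeper blocks are dropped more often
```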
@@ -322,7 +322,7 @@ def forward(self, inputs):
 
     @classmethod
     def from_name(cls, model_name, in_channels=3, **override_params):
-        """create an efficientnet model according to name.
+        """Create an efficientnet model according to name.
 
         Args:
             model_name (str): Name for efficientnet.
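`from_name` builds a randomly initialized architecture, with `override_params` forwarded into the global parameters. A short sketch (the override names below mirror `GlobalParams` fields and are assumptions on my part):

```python
from efficientnet.model import EfficientNet

# B1 adapted to grayscale input and a 10-way classifier, no weights downloaded.
model = EfficientNet.from_name(
    'efficientnet-b1',
    in_channels=1,    # rebuilds the stem conv for single-channel images
    num_classes=10,   # sizes the final fc layer
)
```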
@@ -348,7 +348,7 @@ def from_name(cls, model_name, in_channels=3, **override_params):
     @classmethod
     def from_pretrained(cls, model_name, weights_path=None, advprop=False,
                         in_channels=3, num_classes=1000, **override_params):
-        """create an efficientnet model according to name.
+        """Create an efficientnet model according to name.
 
         Args:
             model_name (str): Name for efficientnet.
@@ -375,7 +375,8 @@ def from_pretrained(cls, model_name, weights_path=None, advprop=False,
             A pretrained efficientnet model.
         """
         model = cls.from_name(model_name, num_classes=num_classes, **override_params)
-        load_pretrained_weights(model, model_name, weights_path=weights_path, load_fc=(num_classes == 1000), advprop=advprop)
+        load_pretrained_weights(model, model_name, weights_path=weights_path,
+                                load_fc=(num_classes == 1000), advprop=advprop)
         model._change_in_channels(in_channels)
         return model
 
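`load_fc=(num_classes == 1000)` is the transfer-learning switch: pretrained classifier weights are loaded only when the head still has the original 1000 ImageNet classes; with any other `num_classes`, the backbone loads and the fresh fc layer is left for fine-tuning. A minimal sketch:

```python
from efficientnet.model import EfficientNet

# Head matches ImageNet: fc weights are loaded along with the backbone.
imagenet_model = EfficientNet.from_pretrained('efficientnet-b0')

# Custom head: backbone weights load, the 10-way fc stays randomly
# initialized and should be fine-tuned on the new task.
finetune_model = EfficientNet.from_pretrained('efficientnet-b0', num_classes=10)
```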