|
17 | 17 |
|
18 | 18 |
|
19 | 19 | ################################################################################ |
20 | | -### Help functions for model architecture |
| 20 | +# Help functions for model architecture |
21 | 21 | ################################################################################ |
22 | 22 |
|
23 | 23 | # GlobalParams and BlockArgs: Two namedtuples |
|
50 | 50 | GlobalParams.__new__.__defaults__ = (None,) * len(GlobalParams._fields) |
51 | 51 | BlockArgs.__new__.__defaults__ = (None,) * len(BlockArgs._fields) |
52 | 52 |
|
53 | | - |
54 | | -# An ordinary implementation of Swish function |
55 | | -class Swish(nn.Module): |
56 | | - def forward(self, x): |
57 | | - return x * torch.sigmoid(x) |
# Swish activation: f(x) = x * sigmoid(x).
# Recent PyTorch releases ship this natively as nn.SiLU, which is the
# preferred (fused, memory-friendly) implementation; older releases get
# an equivalent hand-rolled module instead.
try:
    Swish = nn.SiLU
except AttributeError:
    # Fallback for PyTorch versions that predate nn.SiLU.
    class Swish(nn.Module):
        """Plain Swish module for compatibility with old PyTorch."""

        def forward(self, x):
            return torch.sigmoid(x) * x
58 | 61 |
|
59 | 62 |
|
60 | 63 | # A memory-efficient implementation of Swish function |
@@ -97,10 +100,10 @@ def round_filters(filters, global_params): |
97 | 100 | divisor = global_params.depth_divisor |
98 | 101 | min_depth = global_params.min_depth |
99 | 102 | filters *= multiplier |
100 | | - min_depth = min_depth or divisor # pay attention to this line when using min_depth |
| 103 | + min_depth = min_depth or divisor # pay attention to this line when using min_depth |
101 | 104 | # follow the formula transferred from official TensorFlow implementation |
102 | 105 | new_filters = max(min_depth, int(filters + divisor / 2) // divisor * divisor) |
103 | | - if new_filters < 0.9 * filters: # prevent rounding by more than 10% |
| 106 | + if new_filters < 0.9 * filters: # prevent rounding by more than 10% |
104 | 107 | new_filters += divisor |
105 | 108 | return int(new_filters) |
106 | 109 |
|
@@ -234,7 +237,7 @@ def forward(self, x): |
234 | 237 | ih, iw = x.size()[-2:] |
235 | 238 | kh, kw = self.weight.size()[-2:] |
236 | 239 | sh, sw = self.stride |
237 | | - oh, ow = math.ceil(ih / sh), math.ceil(iw / sw) # change the output size according to stride ! ! ! |
| 240 | + oh, ow = math.ceil(ih / sh), math.ceil(iw / sw) # change the output size according to stride ! ! ! |
238 | 241 | pad_h = max((oh - 1) * self.stride[0] + (kh - 1) * self.dilation[0] + 1 - ih, 0) |
239 | 242 | pad_w = max((ow - 1) * self.stride[1] + (kw - 1) * self.dilation[1] + 1 - iw, 0) |
240 | 243 | if pad_h > 0 or pad_w > 0: |
@@ -312,6 +315,7 @@ def forward(self, x): |
312 | 315 | return F.max_pool2d(x, self.kernel_size, self.stride, self.padding, |
313 | 316 | self.dilation, self.ceil_mode, self.return_indices) |
314 | 317 |
|
| 318 | + |
315 | 319 | class MaxPool2dStaticSamePadding(nn.MaxPool2d): |
316 | 320 | """2D MaxPooling like TensorFlow's 'SAME' mode, with the given input image size. |
317 | 321 | The padding mudule is calculated in construction function, then used in forward. |
@@ -344,7 +348,7 @@ def forward(self, x): |
344 | 348 |
|
345 | 349 |
|
346 | 350 | ################################################################################ |
347 | | -### Helper functions for loading model params |
| 351 | +# Helper functions for loading model params |
348 | 352 | ################################################################################ |
349 | 353 |
|
350 | 354 | # BlockDecoder: A Class for encoding and decoding BlockArgs |
@@ -577,7 +581,7 @@ def get_model_params(model_name, override_params): |
577 | 581 | # TODO: add the petrained weights url map of 'efficientnet-l2' |
578 | 582 |
|
579 | 583 |
|
580 | | -def load_pretrained_weights(model, model_name, weights_path=None, load_fc=True, advprop=False): |
| 584 | +def load_pretrained_weights(model, model_name, weights_path=None, load_fc=True, advprop=False, verbose=True): |
581 | 585 | """Loads pretrained weights from weights path or download using url. |
582 | 586 | |
583 | 587 | Args: |
@@ -608,4 +612,5 @@ def load_pretrained_weights(model, model_name, weights_path=None, load_fc=True, |
608 | 612 | ['_fc.weight', '_fc.bias']), 'Missing keys when loading pretrained weights: {}'.format(ret.missing_keys) |
609 | 613 | assert not ret.unexpected_keys, 'Missing keys when loading pretrained weights: {}'.format(ret.unexpected_keys) |
610 | 614 |
|
611 | | - print('Loaded pretrained weights for {}'.format(model_name)) |
| 615 | + if verbose: |
| 616 | + print('Loaded pretrained weights for {}'.format(model_name)) |
0 commit comments