Commit f0abda4

committed

Big ugly commit, may Linus forgive me.

1 parent f260e1a, commit f0abda4. Copy full SHA for f0abda4

File tree

29 files changed

+1401

-287

lines changed

hyperfind.py
inclearn
- convnet
  - my_resnet.py
- lib
  - __init__.py
  - data
  - distance.py
  - factory.py
  - herding.py
  - loops
    - loops.py
  - losses
    - distillation.py
    - regularizations.py
  - metrics.py
  - network
  - results_utils.py
  - utils.py
  - vizualization.py
- models
- parser.py
- train.py

29 files changed

+1401

-287

lines changed

`‎hyperfind.py‎`

Lines changed: 25 additions & 10 deletions

Original file line number	Diff line number	Diff line change
`@@ -1,6 +1,7 @@`
`1`	`1`	`import argparse`
`2`	`2`	`import copy`
`3`	`3`	`import os`
	`4`	`+import statistics`
`4`	`5`
`5`	`6`	`import ray`
`6`	`7`	`import yaml`
`@@ -22,6 +23,9 @@ def parse_args():`
`22`	`23`	`parser.add_argument("-per", "--gpu-percent", type=float, default=0.5)`
`23`	`24`	`parser.add_argument("-topn", "--topn", default=5, type=int)`
`24`	`25`	`parser.add_argument("-earlystop", default="ucir", type=str)`
	`26`	`+ parser.add_argument("-options", "--options", default=None, nargs="+")`
	`27`	`+ parser.add_argument("-threads", default=2, type=int)`
	`28`	`+ parser.add_argument("-resume", default=False, action="store_true")`
`25`	`29`
`26`	`30`	`return parser.parse_args()`
`27`	`31`
`@@ -31,15 +35,17 @@ def train_func(config, reporter):`
`31`	`35`	`train_args.update(config)`
`32`	`36`
`33`	`37`	`train_args["device"] = [0]`
`34`		`- train_args["threads"] = 2`
`35`		`- train_args["logging"] = "critical"`
	`38`	`+ train_args["logging"] = "warning"`
`36`	`39`	`train_args["no_progressbar"] = True`
`37`	`40`
`38`		`- for i, (avg_inc_acc, last_acc, _) in enumerate(inclearn.train.train(train_args)):`
`39`		`- last_acc = last_acc * 100`
	`41`	`+ all_acc = []`
	`42`	`+ for i, (avg_inc_acc, last_acc, _, is_last) in enumerate(inclearn.train.train(train_args)):`
	`43`	`+ if is_last:`
	`44`	`+ all_acc.append(avg_inc_acc)`
`40`	`45`
`41`		`- reporter(avg_inc_acc=avg_inc_acc)`
`42`		`- return avg_inc_acc`
	`46`	`+ total_avg_inc_acc = statistics.mean(all_acc)`
	`47`	`+ reporter(avg_inc_acc=total_avg_inc_acc)`
	`48`	`+ return total_avg_inc_acc`
`43`	`49`
`44`	`50`
`45`	`51`	`def _get_abs_path(path):`
`@@ -61,6 +67,7 @@ def analyse_ray_dump(ray_directory, topn):`
`61`	`67`	`elif col == "avg_inc_acc":`
`62`	`68`	`result_index = index`
`63`	`69`
	`70`	`+ print("Ray config: {}".format(ray_directory))`
`64`	`71`	`print("Best Config:")`
`65`	`72`	`print(`
`66`	`73`	`"avg_inc_acc: {} with {}.".format(`
`@@ -90,7 +97,6 @@ def _get_line_results(df, row_index, mapping):`
`90`	`97`	`for col, index in mapping.items():`
`91`	`98`	`if col.startswith("var:"):`
`92`	`99`	`col = col[4:]`
`93`		`-`
`94`	`100`	`results[col] = df.iloc[row_index][index]`
`95`	`101`	`return results`
`96`	`102`
`@@ -109,7 +115,7 @@ def set_seen_gpus(gpus):`
`109`	`115`	`os.environ["CUDA_VISIBLE_DEVICES"] = ",".join(gpus)`
`110`	`116`
`111`	`117`
`112`		`-def get_tune_config(tune_options):`
	`118`	`+def get_tune_config(tune_options, options_files):`
`113`	`119`	`with open(tune_options) as f:`
`114`	`120`	`options = yaml.load(f, Loader=yaml.FullLoader)`
`115`	`121`
`@@ -120,6 +126,10 @@ def get_tune_config(tune_options):`
`120`	`126`	`else:`
`121`	`127`	`config[k.replace("var:", "")] = tune.grid_search(v)`
`122`	`128`
	`129`	`+ if options_files is not None:`
	`130`	`+ print("Options files: {}".format(options_files))`
	`131`	`+ config["options"] = [os.path.realpath(op) for op in options_files]`
	`132`	`+`
`123`	`133`	`return config`
`124`	`134`
`125`	`135`
`@@ -129,7 +139,8 @@ def main():`
`129`	`139`	`set_seen_gpus(args.gpus)`
`130`	`140`
`131`	`141`	`if args.tune is not None:`
`132`		`- config = get_tune_config(args.tune)`
	`142`	`+ config = get_tune_config(args.tune, args.options)`
	`143`	`+ config["threads"] = args.threads`
`133`	`144`	`ray.init()`
`134`	`145`	`tune.run(`
`135`	`146`	`train_func,`
`@@ -140,11 +151,15 @@ def main():`
`140`	`151`	`"cpu": 2,`
`141`	`152`	`"gpu": args.gpu_percent`
`142`	`153`	`},`
`143`		`- local_dir=args.ray_directory`
	`154`	`+ local_dir=args.ray_directory,`
	`155`	`+ resume=args.resume`
`144`	`156`	`)`
`145`	`157`
`146`	`158`	`args.ray_directory = os.path.join(args.ray_directory, args.tune.rstrip("/").split("/")[-1])`
`147`	`159`
	`160`	`+ if args.tune is not None:`
	`161`	`+ print("\n\n", args.tune, "\n\n")`
	`162`	`+`
`148`	`163`	`if args.ray_directory is not None:`
`149`	`164`	`best_config = analyse_ray_dump(_get_abs_path(args.ray_directory), args.topn)`
`150`	`165`

`‎inclearn/convnet/my_resnet.py‎`

Lines changed: 7 additions & 9 deletions

Original file line number	Diff line number	Diff line change
`@@ -2,13 +2,17 @@`
`2`	`2`
`3`	`3`	`https://github.com/srebuffi/iCaRL/blob/master/iCaRL-TheanoLasagne/utils_cifar100.py`
`4`	`4`	`"""`
	`5`	`+import logging`
	`6`	`+`
`5`	`7`	`import torch`
`6`	`8`	`import torch.nn as nn`
`7`	`9`	`import torch.nn.functional as F`
`8`	`10`	`from torch.nn import init`
`9`	`11`
`10`	`12`	`from inclearn.lib import pooling`
`11`	`13`
	`14`	`+logger = logging.getLogger(__name__)`
	`15`	`+`
`12`	`16`
`13`	`17`	`class DownsampleStride(nn.Module):`
`14`	`18`
`@@ -189,7 +193,7 @@ def __init__(`
`189`	`193`	`raise ValueError("Unused kwargs: {}.".format(kwargs))`
`190`	`194`
`191`	`195`	`self.all_attentions = all_attentions`
`192`		`- print("Downsampling type", downsampling)`
	`196`	`+ logger.info("Downsampling type {}".format(downsampling))`
`193`	`197`	`self._downsampling_type = downsampling`
`194`	`198`	`self.last_relu = last_relu`
`195`	`199`
`@@ -255,9 +259,7 @@ def _make_layer(self, Block, planes, increase_dim=False, n=None):`
`255`	`259`	`planes = 2 * planes`
`256`	`260`
`257`	`261`	`for i in range(n):`
`258`		`- layers.append(`
`259`		`- Block(planes, last_relu=False, downsampling=self._downsampling_type)`
`260`		`- )`
	`262`	`+ layers.append(Block(planes, last_relu=False, downsampling=self._downsampling_type))`
`261`	`263`
`262`	`264`	`return Stage(layers, block_relu=self.last_relu)`
`263`	`265`
`@@ -282,11 +284,7 @@ def forward(self, x):`
`282`	`284`	`else:`
`283`	`285`	`attentions = [feats_s1[-1], feats_s2[-1], feats_s3[-1], x]`
`284`	`286`
`285`		`- return {`
`286`		`- "raw_features": raw_features,`
`287`		`- "features": features,`
`288`		`- "attention": attentions`
`289`		`- }`
	`287`	`+ return {"raw_features": raw_features, "features": features, "attention": attentions}`
`290`	`288`
`291`	`289`	`def end_features(self, x):`
`292`	`290`	`x = self.pool(x)`

`‎inclearn/lib/__init__.py‎`

Lines changed: 2 additions & 2 deletions

Original file line number	Diff line number	Diff line change
`@@ -1,5 +1,5 @@`
`1`	`1`	`# flake8: noqa`
`2`	`2`	`from . import (`
`3`		`- calibration, callbacks, data, factory, herding, loops, losses, metrics, network, pooling,`
`4`		`- results_utils, schedulers, utils, vizualization`
	`3`	`+ calibration, callbacks, data, distance, factory, herding, loops, losses, metrics, network,`
	`4`	`+ pooling, results_utils, schedulers, utils, vizualization`
`5`	`5`	`)`

`‎inclearn/lib/data/__init__.py‎`

Lines changed: 1 addition & 0 deletions

Original file line number	Diff line number	Diff line change
`@@ -1,5 +1,6 @@`
`1`	`1`	`# flake8: noqa`
`2`	`2`	`from .datasets import *`
	`3`	`+from .download import *`
`3`	`4`	`from .incdataset import *`
`4`	`5`	`from .samplers import *`
`5`	`6`	`from .weights import *`

`‎inclearn/lib/data/download.py‎`

Lines changed: 39 additions & 0 deletions

Original file line number	Diff line number	Diff line change
`@@ -0,0 +1,39 @@`
	`1`	`+import gzip`
	`2`	`+import io`
	`3`	`+import logging`
	`4`	`+import os`
	`5`	`+import urllib.request`
	`6`	`+`
	`7`	`+logger = logging.getLogger(__name__)`
	`8`	`+`
	`9`	`+URLS = {`
	`10`	`+ "googlenews":`
	`11`	`+ "https://github.com/eyaler/word2vec-slim/raw/master/GoogleNews-vectors-negative300-SLIM.bin.gz"`
	`12`	`+}`
	`13`	`+`
	`14`	`+`
	`15`	`+def fetch_word_embeddings(folder, name="googlenews"):`
	`16`	`+ if name == "googlenews":`
	`17`	`+ return _fetch_googlenews_word2vec(folder)`
	`18`	`+ raise ValueError("Unknown embedding type {}.".format(name))`
	`19`	`+`
	`20`	`+`
	`21`	`+def _fetch_googlenews_word2vec(folder):`
	`22`	`+ output_file = os.path.join(folder, "googlenews.bin")`
	`23`	`+`
	`24`	`+ if os.path.exists(output_file):`
	`25`	`+ logger.info("googlenews.bin already exist! Skipping.")`
	`26`	`+ return output_file`
	`27`	`+`
	`28`	`+ response = urllib.request.urlopen(URLS["googlenews"])`
	`29`	`+`
	`30`	`+ logger.info("Downloading googlenews...")`
	`31`	`+ compressed_file = io.BytesIO(response.read())`
	`32`	`+`
	`33`	`+ logger.info("Decompressing googlenews...")`
	`34`	`+ decompressed_file = gzip.GzipFile(fileobj=compressed_file, mode='rb')`
	`35`	`+`
	`36`	`+ with open(output_file, 'wb+') as f:`
	`37`	`+ f.write(decompressed_file.read())`
	`38`	`+`
	`39`	`+ return output_file`

`‎inclearn/lib/data/incdataset.py‎`

Lines changed: 17 additions & 8 deletions

Original file line number	Diff line number	Diff line change
`@@ -7,8 +7,9 @@`
`7`	`7`	`from torch.utils.data import DataLoader`
`8`	`8`	`from torchvision import transforms`
`9`	`9`
`10`		`-from .datasets import (ImageNet100, ImageNet100UCIR, ImageNet1000,`
`11`		`- TinyImageNet200, iCIFAR10, iCIFAR100)`
	`10`	`+from .datasets import (`
	`11`	`+ ImageNet100, ImageNet100UCIR, ImageNet1000, TinyImageNet200, iCIFAR10, iCIFAR100`
	`12`	`+)`
`12`	`13`
`13`	`14`	`logger = logging.getLogger(__name__)`
`14`	`15`
`@@ -49,7 +50,8 @@ def __init__(`
`49`	`50`	`sampler_config=None,`
`50`	`51`	`data_path="data",`
`51`	`52`	`class_order=None,`
`52`		`- dataset_transforms=None`
	`53`	`+ dataset_transforms=None,`
	`54`	`+ all_test_classes=False,`
`53`	`55`	`):`
`54`	`56`	`datasets = _get_datasets(dataset_name)`
`55`	`57`	`self._setup_data(`
`@@ -80,6 +82,7 @@ def __init__(`
`80`	`82`	`self._onehot = onehot`
`81`	`83`	`self._sampler = sampler`
`82`	`84`	`self._sampler_config = sampler_config`
	`85`	`+ self._all_test_classes = all_test_classes`
`83`	`86`
`84`	`87`	`@property`
`85`	`88`	`def n_tasks(self):`
`@@ -97,7 +100,13 @@ def new_task(self, memory=None, memory_val=None):`
`97`	`100`	`x_val, y_val = self._select(`
`98`	`101`	`self.data_val, self.targets_val, low_range=min_class, high_range=max_class`
`99`	`102`	`)`
`100`		`- x_test, y_test = self._select(self.data_test, self.targets_test, high_range=max_class)`
	`103`	`+ if self._all_test_classes:`
	`104`	`+ logger.info("Testing on all classes!")`
	`105`	`+ x_test, y_test = self._select(`
	`106`	`+ self.data_test, self.targets_test, high_range=sum(self.increments)`
	`107`	`+ )`
	`108`	`+ else:`
	`109`	`+ x_test, y_test = self._select(self.data_test, self.targets_test, high_range=max_class)`
`101`	`110`
`102`	`111`	`if self._onehot:`
`103`	`112`
`@@ -108,12 +117,12 @@ def to_onehot(x):`
`108`	`117`	`y_train = to_onehot(y_train)`
`109`	`118`
`110`	`119`	`if memory is not None:`
`111`		`- print("Set memory of size: {}.".format(memory[0].shape[0]))`
	`120`	`+ logger.info("Set memory of size: {}.".format(memory[0].shape[0]))`
`112`	`121`	`x_train, y_train, train_memory_flags = self._add_memory(x_train, y_train, *memory)`
`113`	`122`	`else:`
`114`	`123`	`train_memory_flags = np.zeros((x_train.shape[0],))`
`115`	`124`	`if memory_val is not None:`
`116`		`- print("Set validation memory of size: {}.".format(memory_val[0].shape[0]))`
	`125`	`+ logger.info("Set validation memory of size: {}.".format(memory_val[0].shape[0]))`
`117`	`126`	`x_val, y_val, val_memory_flags = self._add_memory(x_val, y_val, *memory_val)`
`118`	`127`	`else:`
`119`	`128`	`val_memory_flags = np.zeros((x_val.shape[0],))`
`@@ -191,7 +200,7 @@ def get_custom_loader(`
`191`	`200`	`data = np.concatenate(data)`
`192`	`201`	`targets = np.concatenate(targets)`
`193`	`202`
`194`		`- if memory is not None:`
	`203`	`+ if memory is not None or (isinstance(memory, tuple) and memory[0] is None):`
`195`	`204`	`if len(data) > 0:`
`196`	`205`	`data, targets, memory_flags = self._add_memory(data, targets, *memory)`
`197`	`206`	`else:`
`@@ -283,7 +292,7 @@ def _setup_data(`
`283`	`292`	`elif dataset.class_order is not None:`
`284`	`293`	`order = dataset.class_order`
`285`	`294`
`286`		`- print("Dataset {}: class ordering: {}.".format(dataset, order))`
	`295`	`+ logger.info("Dataset {}: class ordering: {}.".format(dataset, order))`
`287`	`296`
`288`	`297`	`self.class_order.append(order)`
`289`	`298`

`‎inclearn/lib/distance.py‎`

Lines changed: 41 additions & 0 deletions

Original file line number	Diff line number	Diff line change
`@@ -0,0 +1,41 @@`
	`1`	`+import torch`
	`2`	`+from torch.nn import functional as F`
	`3`	`+`
	`4`	`+`
	`5`	`+def squared_euclidian_distance(a, b):`
	`6`	`+ return torch.cdist(a, b)**2`
	`7`	`+`
	`8`	`+`
	`9`	`+def cosine_similarity(a, b):`
	`10`	`+ return torch.mm(F.normalize(a, p=2, dim=-1), F.normalize(b, p=2, dim=-1).T)`
	`11`	`+`
	`12`	`+`
	`13`	`+def stable_cosine_distance(a, b, squared=True):`
	`14`	`+ """Computes the pairwise distance matrix with numerical stability."""`
	`15`	`+ mat = torch.cat([a, b])`
	`16`	`+`
	`17`	`+ pairwise_distances_squared = torch.add(`
	`18`	`+ mat.pow(2).sum(dim=1, keepdim=True).expand(mat.size(0), -1),`
	`19`	`+ torch.t(mat).pow(2).sum(dim=0, keepdim=True).expand(mat.size(0), -1)`
	`20`	`+ ) - 2 * (torch.mm(mat, torch.t(mat)))`
	`21`	`+`
	`22`	`+ # Deal with numerical inaccuracies. Set small negatives to zero.`
	`23`	`+ pairwise_distances_squared = torch.clamp(pairwise_distances_squared, min=0.0)`
	`24`	`+`
	`25`	`+ # Get the mask where the zero distances are at.`
	`26`	`+ error_mask = torch.le(pairwise_distances_squared, 0.0)`
	`27`	`+`
	`28`	`+ # Optionally take the sqrt.`
	`29`	`+ if squared:`
	`30`	`+ pairwise_distances = pairwise_distances_squared`
	`31`	`+ else:`
	`32`	`+ pairwise_distances = torch.sqrt(pairwise_distances_squared + error_mask.float() * 1e-16)`
	`33`	`+`
	`34`	`+ # Undo conditionally adding 1e-16.`
	`35`	`+ pairwise_distances = torch.mul(pairwise_distances, (error_mask == False).float())`
	`36`	`+`
	`37`	`+ # Explicitly set diagonals to zero.`
	`38`	`+ mask_offdiagonals = 1 - torch.eye(*pairwise_distances.size(), device=pairwise_distances.device)`
	`39`	`+ pairwise_distances = torch.mul(pairwise_distances, mask_offdiagonals)`
	`40`	`+`
	`41`	`+ return pairwise_distances[:a.shape[0], a.shape[0]:]`

`‎inclearn/lib/factory.py‎`

Lines changed: 4 additions & 2 deletions

Original file line number	Diff line number	Diff line change
`@@ -56,7 +56,8 @@ def get_model(args):`
`56`	`56`	`"bic": models.BiC,`
`57`	`57`	`"ucir": models.UCIR,`
`58`	`58`	`"still": models.STILL,`
`59`		`- "lwm": models.LwM`
	`59`	`+ "lwm": models.LwM,`
	`60`	`+ "zil": models.ZIL`
`60`	`61`	`}`
`61`	`62`
`62`	`63`	`model = args["model"].lower()`
`@@ -85,7 +86,8 @@ def get_data(args, class_order=None):`
`85`	`86`	`data_path=args["data_path"],`
`86`	`87`	`class_order=class_order,`
`87`	`88`	`seed=args["seed"],`
`88`		`- dataset_transforms=args.get("dataset_transforms", {})`
	`89`	`+ dataset_transforms=args.get("dataset_transforms", {}),`
	`90`	`+ all_test_classes=args.get("all_test_classes", False)`
`89`	`91`	`)`
`90`	`92`
`91`	`93`

0 commit comments

Comments

(0)

Navigation Menu

Search code, repositories, users, issues, pull requests...

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

Uh oh!

Commit f0abda4

File tree

29 files changed

29 files changed

`‎hyperfind.py‎`

`‎inclearn/convnet/my_resnet.py‎`

`‎inclearn/lib/__init__.py‎`

`‎inclearn/lib/data/__init__.py‎`

`‎inclearn/lib/data/download.py‎`

`‎inclearn/lib/data/incdataset.py‎`

`‎inclearn/lib/distance.py‎`

`‎inclearn/lib/factory.py‎`

0 commit comments