CoCalc -- learner.py

GitHub Repository: jantic/deoldify
Path: blob/master/fastai/vision/learner.py
840 views
1
"`Learner` support for computer vision"
2
from ..torch_core import *
3
from ..basic_train import *
4
from ..basic_data import *
5
from .image import *
6
from . import models
7
from ..callback import *
8
from ..layers import *
9
from ..callbacks.hooks import *
10
from ..train import ClassificationInterpretation
11

12
__all__ = ['cnn_learner', 'create_cnn', 'create_cnn_model', 'create_body', 'create_head', 'unet_learner']
13
# By default split models between first and second layer
14
def _default_split(m:nn.Module): return (m[1],)
15
# Split a resnet style model
16
def _resnet_split(m:nn.Module): return (m[0][6],m[1])
17
# Split squeezenet model on maxpool layers
18
def _squeezenet_split(m:nn.Module): return (m[0][0][5], m[0][0][8], m[1])
19
def _densenet_split(m:nn.Module): return (m[0][0][7],m[1])
20
def _vgg_split(m:nn.Module): return (m[0][0][22],m[1])
21
def _alexnet_split(m:nn.Module): return (m[0][0][6],m[1])
22

23
_default_meta    = {'cut':None, 'split':_default_split}
24
_resnet_meta     = {'cut':-2, 'split':_resnet_split }
25
_squeezenet_meta = {'cut':-1, 'split': _squeezenet_split}
26
_densenet_meta   = {'cut':-1, 'split':_densenet_split}
27
_vgg_meta        = {'cut':-1, 'split':_vgg_split}
28
_alexnet_meta    = {'cut':-1, 'split':_alexnet_split}
29

30
model_meta = {
31
    models.resnet18 :{**_resnet_meta}, models.resnet34: {**_resnet_meta},
32
    models.resnet50 :{**_resnet_meta}, models.resnet101:{**_resnet_meta},
33
    models.resnet152:{**_resnet_meta},
34

35
    models.squeezenet1_0:{**_squeezenet_meta},
36
    models.squeezenet1_1:{**_squeezenet_meta},
37

38
    models.densenet121:{**_densenet_meta}, models.densenet169:{**_densenet_meta},
39
    models.densenet201:{**_densenet_meta}, models.densenet161:{**_densenet_meta},
40
    models.vgg16_bn:{**_vgg_meta}, models.vgg19_bn:{**_vgg_meta},
41
    models.alexnet:{**_alexnet_meta}}
42

43
def cnn_config(arch):
44
    "Get the metadata associated with `arch`."
45
    #torch.backends.cudnn.benchmark = True
46
    return model_meta.get(arch, _default_meta)
47

48
def has_pool_type(m):
49
    if is_pool_type(m): return True
50
    for l in m.children():
51
        if has_pool_type(l): return True
52
    return False
53

54
def create_body(arch:Callable, pretrained:bool=True, cut:Optional[Union[int, Callable]]=None):
55
    "Cut off the body of a typically pretrained `model` at `cut` (int) or cut the model as specified by `cut(model)` (function)."
56
    model = arch(pretrained=pretrained)
57
    cut = ifnone(cut, cnn_config(arch)['cut'])
58
    if cut is None:
59
        ll = list(enumerate(model.children()))
60
        cut = next(i for i,o in reversed(ll) if has_pool_type(o))
61
    if   isinstance(cut, int):      return nn.Sequential(*list(model.children())[:cut])
62
    elif isinstance(cut, Callable): return cut(model)
63
    else:                           raise NamedError("cut must be either integer or a function")
64

65

66
def create_head(nf:int, nc:int, lin_ftrs:Optional[Collection[int]]=None, ps:Floats=0.5,
67
                concat_pool:bool=True, bn_final:bool=False):
68
    "Model head that takes `nf` features, runs through `lin_ftrs`, and about `nc` classes."
69
    lin_ftrs = [nf, 512, nc] if lin_ftrs is None else [nf] + lin_ftrs + [nc]
70
    ps = listify(ps)
71
    if len(ps) == 1: ps = [ps[0]/2] * (len(lin_ftrs)-2) + ps
72
    actns = [nn.ReLU(inplace=True)] * (len(lin_ftrs)-2) + [None]
73
    pool = AdaptiveConcatPool2d() if concat_pool else nn.AdaptiveAvgPool2d(1)
74
    layers = [pool, Flatten()]
75
    for ni,no,p,actn in zip(lin_ftrs[:-1], lin_ftrs[1:], ps, actns):
76
        layers += bn_drop_lin(ni, no, True, p, actn)
77
    if bn_final: layers.append(nn.BatchNorm1d(lin_ftrs[-1], momentum=0.01))
78
    return nn.Sequential(*layers)
79

80
def create_cnn_model(base_arch:Callable, nc:int, cut:Union[int,Callable]=None, pretrained:bool=True,
81
                     lin_ftrs:Optional[Collection[int]]=None, ps:Floats=0.5, custom_head:Optional[nn.Module]=None,
82
                     bn_final:bool=False, concat_pool:bool=True):
83
    "Create custom convnet architecture"
84
    body = create_body(base_arch, pretrained, cut)
85
    if custom_head is None:
86
        nf = num_features_model(nn.Sequential(*body.children())) * (2 if concat_pool else 1)
87
        head = create_head(nf, nc, lin_ftrs, ps=ps, concat_pool=concat_pool, bn_final=bn_final)
88
    else: head = custom_head
89
    return nn.Sequential(body, head)
90

91
def cnn_learner(data:DataBunch, base_arch:Callable, cut:Union[int,Callable]=None, pretrained:bool=True,
92
                lin_ftrs:Optional[Collection[int]]=None, ps:Floats=0.5, custom_head:Optional[nn.Module]=None,
93
                split_on:Optional[SplitFuncOrIdxList]=None, bn_final:bool=False, init=nn.init.kaiming_normal_,
94
                concat_pool:bool=True, **kwargs:Any)->Learner:
95
    "Build convnet style learner."
96
    meta = cnn_config(base_arch)
97
    model = create_cnn_model(base_arch, data.c, cut, pretrained, lin_ftrs, ps=ps, custom_head=custom_head,
98
        bn_final=bn_final, concat_pool=concat_pool)
99
    learn = Learner(data, model, **kwargs)
100
    learn.split(split_on or meta['split'])
101
    if pretrained: learn.freeze()
102
    if init: apply_init(model[1], init)
103
    return learn
104

105
def create_cnn(data, base_arch, **kwargs):
106
    warn("`create_cnn` is deprecated and is now named `cnn_learner`.")
107
    return cnn_learner(data, base_arch, **kwargs)
108

109
def unet_learner(data:DataBunch, arch:Callable, pretrained:bool=True, blur_final:bool=True,
110
                 norm_type:Optional[NormType]=NormType, split_on:Optional[SplitFuncOrIdxList]=None, blur:bool=False,
111
                 self_attention:bool=False, y_range:Optional[Tuple[float,float]]=None, last_cross:bool=True,
112
                 bottle:bool=False, cut:Union[int,Callable]=None, **learn_kwargs:Any)->Learner:
113
    "Build Unet learner from `data` and `arch`."
114
    meta = cnn_config(arch)
115
    body = create_body(arch, pretrained, cut)
116
    try:    size = data.train_ds[0][0].size
117
    except: size = next(iter(data.train_dl))[0].shape[-2:]
118
    model = to_device(models.unet.DynamicUnet(body, n_classes=data.c, img_size=size, blur=blur, blur_final=blur_final,
119
          self_attention=self_attention, y_range=y_range, norm_type=norm_type, last_cross=last_cross,
120
          bottle=bottle), data.device)
121
    learn = Learner(data, model, **learn_kwargs)
122
    learn.split(ifnone(split_on, meta['split']))
123
    if pretrained: learn.freeze()
124
    apply_init(model[2], nn.init.kaiming_normal_)
125
    return learn
126

127
@classmethod
128
def _cl_int_from_learner(cls, learn:Learner, ds_type:DatasetType=DatasetType.Valid, activ:nn.Module=None, tta=False):
129
    "Create an instance of `ClassificationInterpretation`. `tta` indicates if we want to use Test Time Augmentation."
130
    preds = learn.TTA(ds_type=ds_type, with_loss=True) if tta else learn.get_preds(ds_type=ds_type, activ=activ, with_loss=True)
131

132
    return cls(learn, *preds, ds_type=ds_type)
133

134
def _test_cnn(m):
135
    if not isinstance(m, nn.Sequential) or not len(m) == 2: return False
136
    return isinstance(m[1][0], (AdaptiveConcatPool2d, nn.AdaptiveAvgPool2d))
137

138
def _cl_int_gradcam(self, idx, heatmap_thresh:int=16, image:bool=True):
139
    m = self.learn.model.eval()
140
    im,cl = self.learn.data.dl(DatasetType.Valid).dataset[idx]
141
    cl = int(cl)
142
    xb,_ = self.data.one_item(im, detach=False, denorm=False) #put into a minibatch of batch size = 1
143
    with hook_output(m[0]) as hook_a: 
144
        with hook_output(m[0], grad=True) as hook_g:
145
            preds = m(xb)
146
            preds[0,int(cl)].backward() 
147
    acts  = hook_a.stored[0].cpu() #activation maps
148
    if (acts.shape[-1]*acts.shape[-2]) >= heatmap_thresh:
149
        grad = hook_g.stored[0][0].cpu()
150
        grad_chan = grad.mean(1).mean(1)
151
        mult = F.relu(((acts*grad_chan[...,None,None])).sum(0))
152
        if image:
153
            xb_im = Image(xb[0])
154
            _,ax = plt.subplots()
155
            sz = list(xb_im.shape[-2:])
156
            xb_im.show(ax,title=f"pred. class: {self.pred_class[idx]}, actual class: {self.learn.data.classes[cl]}")
157
            ax.imshow(mult, alpha=0.4, extent=(0,*sz[::-1],0),
158
              interpolation='bilinear', cmap='magma')
159
        return mult
160

161
ClassificationInterpretation.GradCAM =_cl_int_gradcam
162

163
def _cl_int_plot_top_losses(self, k, largest=True, figsize=(12,12), heatmap:bool=False, heatmap_thresh:int=16,
164
                            return_fig:bool=None)->Optional[plt.Figure]:
165
    "Show images in `top_losses` along with their prediction, actual, loss, and probability of actual class."
166
    assert not heatmap or _test_cnn(self.learn.model), "`heatmap=True` requires a model like `cnn_learner` produces."
167
    if heatmap is None: heatmap = _test_cnn(self.learn.model)
168
    tl_val,tl_idx = self.top_losses(k, largest)
169
    classes = self.data.classes
170
    cols = math.ceil(math.sqrt(k))
171
    rows = math.ceil(k/cols)
172
    fig,axes = plt.subplots(rows, cols, figsize=figsize)
173
    fig.suptitle('prediction/actual/loss/probability', weight='bold', size=14)
174
    for i,idx in enumerate(tl_idx):
175
        im,cl = self.data.dl(self.ds_type).dataset[idx]
176
        cl = int(cl)
177
        im.show(ax=axes.flat[i], title=
178
            f'{classes[self.pred_class[idx]]}/{classes[cl]} / {self.losses[idx]:.2f} / {self.preds[idx][cl]:.2f}')
179
        if heatmap:
180
            mult = self.GradCAM(idx,heatmap_thresh,image=False)
181
            if mult is not None:
182
                sz = list(im.shape[-2:])
183
                axes.flat[i].imshow(mult, alpha=0.6, extent=(0,*sz[::-1],0), interpolation='bilinear', cmap='magma')                
184
    if ifnone(return_fig, defaults.return_fig): return fig
185

186
def _cl_int_plot_multi_top_losses(self, samples:int=3, figsize:Tuple[int,int]=(8,8), save_misclassified:bool=False):
187
    "Show images in `top_losses` along with their prediction, actual, loss, and probability of predicted class in a multilabeled dataset."
188
    if samples >20:
189
        print("Max 20 samples")
190
        return
191
    losses, idxs = self.top_losses(self.data.c)
192
    l_dim = len(losses.size())
193
    if l_dim == 1: losses, idxs = self.top_losses()
194
    infolist, ordlosses_idxs, mismatches_idxs, mismatches, losses_mismatches, mismatchescontainer = [],[],[],[],[],[]
195
    truthlabels = np.asarray(self.y_true, dtype=int)
196
    classes_ids = [k for k in enumerate(self.data.classes)]
197
    predclass = np.asarray(self.pred_class)
198
    for i,pred in enumerate(predclass):
199
        where_truth = np.nonzero((truthlabels[i]>0))[0]
200
        mismatch = np.all(pred!=where_truth)
201
        if mismatch:
202
            mismatches_idxs.append(i)
203
            if l_dim > 1 : losses_mismatches.append((losses[i][pred], i))
204
            else: losses_mismatches.append((losses[i], i))
205
        if l_dim > 1: infotup = (i, pred, where_truth, losses[i][pred], np.round(self.preds[i], decimals=3)[pred], mismatch)
206
        else: infotup = (i, pred, where_truth, losses[i], np.round(self.preds[i], decimals=3)[pred], mismatch)
207
        infolist.append(infotup)
208
    ds = self.data.dl(self.ds_type).dataset
209
    mismatches = ds[mismatches_idxs]
210
    ordlosses = sorted(losses_mismatches, key = lambda x: x[0], reverse=True)
211
    for w in ordlosses: ordlosses_idxs.append(w[1])
212
    mismatches_ordered_byloss = ds[ordlosses_idxs]
213
    print(f'{str(len(mismatches))} misclassified samples over {str(len(self.data.valid_ds))} samples in the validation set.')
214
    samples = min(samples, len(mismatches))
215
    for ima in range(len(mismatches_ordered_byloss)):
216
        mismatchescontainer.append(mismatches_ordered_byloss[ima][0])
217
    for sampleN in range(samples):
218
        actualclasses = ''
219
        for clas in infoList[ordlosses_idxs[sampleN]][2]:
220
            actualclasses = f'{actualclasses} -- {str(classes_ids[clas][1])}'
221
        imag = mismatches_ordered_byloss[sampleN][0]
222
        imag = show_image(imag, figsize=figsize)
223
        imag.set_title(f"""Predicted: {classes_ids[infoList[ordlosses_idxs[sampleN]][1]][1]} \nActual: {actualclasses}\nLoss: {infoList[ordlosses_idxs[sampleN]][3]}\nProbability: {infoList[ordlosses_idxs[sampleN]][4]}""",
224
                        loc='left')
225
        plt.show()
226
        if save_misclassified: return mismatchescontainer
227

228
ClassificationInterpretation.from_learner          = _cl_int_from_learner
229
ClassificationInterpretation.plot_top_losses       = _cl_int_plot_top_losses
230
ClassificationInterpretation.plot_multi_top_losses = _cl_int_plot_multi_top_losses
231
 
232

233
def _learner_interpret(learn:Learner, ds_type:DatasetType=DatasetType.Valid, tta=False):
234
    "Create a `ClassificationInterpretation` object from `learner` on `ds_type` with `tta`."
235
    return ClassificationInterpretation.from_learner(learn, ds_type=ds_type, tta=tta)
236
Learner.interpret = _learner_interpret
237

238
Product

Resources

Company