X-Git-Url: https://fleuret.org/cgi-bin/gitweb/gitweb.cgi?a=blobdiff_plain;f=mygpt.py;h=0b63ac800ccccc96f014c0b5c149476814698820;hb=280f38363e34e202d38e6f7c00288329ab067a81;hp=bd79676b2093a2d1c6159dcddf32dafe805deb82;hpb=91ed776af5968643864c4ccce2c8cc7f519a9d65;p=beaver.git diff --git a/mygpt.py b/mygpt.py index bd79676..0b63ac8 100755 --- a/mygpt.py +++ b/mygpt.py @@ -246,12 +246,22 @@ class MyGPT(nn.Module): m.bias.zero_() m.weight.fill_(1.0) - def forward(self, bs, with_readout=True): + def forward(self, bs, mode="standard"): bs.x = F.pad(bs.x, (1, -1)) bs = self.embedding(bs) - bs = self.trunk(bs) - if with_readout: + if mode == "standard": + bs = self.trunk(bs) bs = self.readout(bs) + elif mode == "head": + bs = self.trunk(bs) + elif mode == "deep": + r = [] + for l in self.trunk: + bs = l(bs) + r += [bs.slice()] + bs = BracketedSequence(torch.cat(r, -1)) + else: + raise ValueError return bs