X-Git-Url: https://fleuret.org/cgi-bin/gitweb/gitweb.cgi?a=blobdiff_plain;ds=sidebyside;f=tasks.py;h=bad4536c8cea90c1c555385d3f34083f54041097;hb=5d46a9bd7d032d90ef4c4b38ac3c9b5b66526527;hp=0a4dd6fa2f880e93aecbbd494621fae26b7dcdbb;hpb=a291e213a152364b74e833200191c08a36451a90;p=picoclvr.git diff --git a/tasks.py b/tasks.py index 0a4dd6f..bad4536 100755 --- a/tasks.py +++ b/tasks.py @@ -1,5 +1,10 @@ #!/usr/bin/env python +# Any copyright is dedicated to the Public Domain. +# https://creativecommons.org/publicdomain/zero/1.0/ + +# Written by Francois Fleuret + import math, os, tqdm import torch, torchvision @@ -108,9 +113,7 @@ class ProblemLevel1(Problem): source = torch.rand(nb, 10).sort(dim=1).indices[:, : self.len_source] marker2 = torch.full((nb, 1), 11) result = operators.bmm(source[:, :, None]).squeeze(-1) - print(f"{nb_operators.dtype=} {marker1.dtype=}") sequences = torch.cat((nb_operators, marker1, source, marker2, result), 1) - print(f"{sequences.size()=}") ar_mask = (sequences == 11).long() ar_mask = (ar_mask.cumsum(1) - ar_mask).clamp(max=1) return sequences, ar_mask @@ -1091,7 +1094,6 @@ class RPL(Task): symbols = list(filter(lambda x: type(x) is str, symbols)) symbols.sort() symbols += [str(n) for n in range(val_max + 1)] - print(f"{val_max=}") self.token2id = dict([(c, n) for n, c in enumerate(symbols)]) self.id2token = dict([(n, c) for c, n in self.token2id.items()]) @@ -1101,6 +1103,7 @@ class RPL(Task): self.test_input = self.tensorize(test_sequences) if logger is not None: + logger(f"value_max {val_max}") for x in self.train_input[:25]: end = (x != self.t_nul).nonzero().max().item() + 1 seq = [self.id2token[i.item()] for i in x[:end]]