# mask * K[n, src_head, src_time, dk]
# + (1 - mask) * self.rec_K[:, :, t0:t1]
# )
+
+######################################################################
+
+2024 Jan 10 08:10:39 (from mygpt.py)
+
+ # Applying dropout to G (the line below) was a bad idea
+ # G = F.dropout(G, self.attention_dropout, self.training)
+