X-Git-Url: https://fleuret.org/cgi-bin/gitweb/gitweb.cgi?a=blobdiff_plain;f=main.py;h=74e70b2a9780601053e51e0d359d082e7a869e1d;hb=cb737bdbd2f112826f739e4581fbe6546aeef638;hp=df4665246df74c443c3676e2930022884da6a7d5;hpb=4395f9a90218819997c706de9505cda1c86ad507;p=mygptrnn.git diff --git a/main.py b/main.py index df46652..74e70b2 100755 --- a/main.py +++ b/main.py @@ -346,6 +346,7 @@ default_model_args = { "nb_blocks": 6, }, "37M": { + "attention": "mha", "dim_model": 512, "dim_keys": 64, "dim_hidden": 2048,