attention_dropout=0.0,
len_max=1e5,
logger=print,
- args,
+ args=None,
):
super().__init__()
attention_dropout=0.0,
len_max=1e5,
logger=print,
- args,
+ args=None,
):
super().__init__()
attention_dropout=0.0,
len_max=1e5,
logger=print,
- args,
+ args=None,
):
super().__init__()
causal=False,
attention_dropout=0.0,
logger=print,
- args,
+ args=None,
):
super().__init__()
len_max=1e5,
attention_layer="kvrec",
logger=print,
- args,
+ args=None,
):
super().__init__()
causal=causal,
attention_dropout=dropout,
logger=logger,
- args,
+ args=args,
)
elif attention_layer == "dumbrec":
return DumbRec(
nb_lines=nb_lines,
attention_dropout=dropout,
logger=logger,
- args,
+ args=args,
)
elif attention_layer == "kvrec":
return KVRec(
nb_lines=nb_lines,
attention_dropout=dropout,
logger=logger,
- args,
+ args=args,
)
elif attention_layer == "caterpillar":
return Caterpillar(
caterpillar_height=self.caterpillar_height,
attention_dropout=dropout,
logger=logger,
- args,
+ args=args,
)
else:
raise ValueError(f"Unknown attention type {attention_layer}.")